1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
|
using System.Net.Http.Headers;
using System.Text;
using System.Text.Json;
using System.Text.Json.Nodes;
using Microsoft.Extensions.Options;
using Tango.Portal.Chat.Web.Models;
using System.Text.RegularExpressions;
namespace Tango.Portal.Chat.Web.Services
{
public sealed class LlmClient
{
private readonly HttpClient _http;
private readonly LlmOptions _opt;
/// <summary>
/// Outcome of an assistant run: the answer text together with the id of the thread it was produced on.
/// </summary>
public sealed class AssistantRunResult
{
    /// <summary>Answer text returned to the caller; an empty string until assigned.</summary>
    public string Answer { get; set; } = string.Empty;

    /// <summary>Id of the thread the run used; an empty string until assigned.</summary>
    public string ThreadId { get; set; } = string.Empty;
}
/// <summary>
/// Selects which configured assistant an <c>AnswerWithAssistantAsync</c> call runs against
/// and how the user message is composed.
/// </summary>
public enum AssistantType
{
/// <summary>
/// Runs the assistant identified by <c>AnswererAssistantId</c>; the user message carries the
/// question, the facts JSON and the KQL that was used.
/// </summary>
Data,
/// <summary>
/// Runs the assistant identified by <c>DocsAssistantId</c>; the user message carries only the
/// question. The thread-aware overload additionally strips citation markers from the answer.
/// </summary>
Docs
}
/// <summary>
/// Creates the client from an injected <see cref="HttpClient"/> and the bound LLM options.
/// </summary>
/// <param name="http">HTTP client used for every outbound request made by this class.</param>
/// <param name="opt">Options wrapper; its <c>Value</c> is captured once at construction.</param>
/// <exception cref="ArgumentNullException">
/// <paramref name="http"/> or <paramref name="opt"/> is <c>null</c>.
/// </exception>
public LlmClient(HttpClient http, IOptions<LlmOptions> opt)
{
    // Fail at construction time with the offending parameter name instead of a
    // NullReferenceException here (opt) or on the first request (http).
    _http = http ?? throw new ArgumentNullException(nameof(http));
    _opt = (opt ?? throw new ArgumentNullException(nameof(opt))).Value;
}
/// <summary>
/// Asks the configured chat endpoint to classify <paramref name="question"/> and to propose a KQL
/// query for it, using a built-in system prompt and the supplied schema.
/// </summary>
/// <param name="question">The user's question, sent as "Question: ..." in the user message.</param>
/// <param name="schemaJson">Schema text appended to the user message under a "SCHEMA:" heading.</param>
/// <param name="ct">Cancels the HTTP call and the response read.</param>
/// <returns>
/// The model's JSON answer deserialized into a <see cref="ProposeKqlResult"/>. When strict
/// deserialization fails, a leniently mapped result carrying only Kql, Parameters, Assumptions and Why.
/// </returns>
/// <exception cref="HttpRequestException">The endpoint returned a non-success status code.</exception>
/// <exception cref="InvalidOperationException">The response contains no <c>choices[0].message</c>.</exception>
/// <exception cref="JsonException">The response body or the model output is not valid JSON.</exception>
public async Task<ProposeKqlResult> ProposeKqlAsync(string question, string schemaJson, CancellationToken ct = default)
{
    var system = string.Join("\n", new[] {
        "You are a Kusto (KQL) assistant for Azure Data Explorer.",
        "Use ONLY the tables/columns provided in the SCHEMA JSON that follows.",
        "ALWAYS try to query for the least amount of data neccessary to answer the question.",
        "Return a JSON object with fields: assistant, kql, parameters, parameterTypes (optional), assumptions, why.",
        "When asked to query by months ago, convert number of months to days (e.g last to months = StartTime >= ago(60d))",
        "When joining tables, this example for correct syntax: EventsTable | join kind=inner (EventTypesTable) on $left.EventTypeGuid == $right.GUID.",
        "When querying MachinesTable you can fetch the machine's Organization and Site by joining the latest record from JobRunsTable by SerialNumber.",
        "Output raw JSON ONLY (no code fences).",
        @"Classify the user's question into exactly one of:
- ""data"": requires querying telemetry via KQL (numbers, trends, counts, rates, top-N, timelines).
- ""docs"": architectural/how-to/design/definitions/“what is/how do we” that do not require live data. place data or docs in the assistant field you return.
- ""none"": conversational content like Thank you/Hi/How are you. Or questions about why did you chose to execute the previouse KQL query the way you did and maybe ask for correction. In this case answer nicely and try to have a good conversation without going out of context.",
        "If the question is classified as 'docs', set kql to an empty string and parameters to an empty object.",
    });
    var schemaBlock = $"SCHEMA:\n{schemaJson}";
    var user = $"Question: {question}\n\n{schemaBlock}";

    var payload = new
    {
        model = _opt.Model,
        temperature = _opt.Temperature,
        response_format = new { type = "json_object" },
        messages = new object[] {
            new { role = "system", content = system },
            new { role = "user", content = user }
        }
    };

    using var req = new HttpRequestMessage(HttpMethod.Post, _opt.Endpoint);
    req.Content = new StringContent(JsonSerializer.Serialize(payload), Encoding.UTF8, "application/json");
    // Azure-hosted endpoints authenticate with an "api-key" header, others with a bearer token.
    if (_opt.IsAzure) req.Headers.Add("api-key", _opt.ApiKey);
    else req.Headers.Authorization = new AuthenticationHeaderValue("Bearer", _opt.ApiKey);

    using var resp = await _http.SendAsync(req, ct);
    resp.EnsureSuccessStatusCode();
    var body = await resp.Content.ReadAsStringAsync(ct);

    // Guard the response shape explicitly: a payload without choices used to surface as a
    // NullReferenceException / ArgumentOutOfRangeException with no hint about the cause.
    var root = JsonNode.Parse(body)!.AsObject();
    var message = (root["choices"] as JsonArray)?.FirstOrDefault()?["message"]
        ?? throw new InvalidOperationException("The LLM response did not contain choices[0].message.");
    // A null content is treated as an empty JSON object, which deserializes to a default result.
    var content = StripCodeFences(message["content"]?.ToString() ?? "{}");

    var opts = new JsonSerializerOptions { PropertyNameCaseInsensitive = true };
    opts.Converters.Add(new FlexibleStringListConverter());
    try
    {
        var result = JsonSerializer.Deserialize<ProposeKqlResult>(content, opts);
        if (result is not null) return result;
    }
    catch (JsonException)
    {
        // Strict binding failed; fall through to the lenient mapping below.
    }

    // Lenient mapping: read the fields individually and coerce every value to a string.
    // JsonNode.Parse still throws JsonException when the content is not JSON at all.
    // NOTE(review): only kql/parameters/assumptions/why are mapped here; the other fields the
    // prompt asks for (assistant, parameterTypes) are not carried over — confirm that is intended.
    var node = JsonNode.Parse(content) as JsonObject ?? new JsonObject();

    var parameters = new Dictionary<string, string>();
    if (node["parameters"] is JsonObject parameterObject)
    {
        foreach (var entry in parameterObject)
            parameters[entry.Key] = entry.Value?.ToString() ?? string.Empty;
    }

    // "assumptions" may arrive as an array or as a single value; both become a list of strings.
    List<string>? assumptions = null;
    if (node.TryGetPropertyValue("assumptions", out var assumptionsNode) && assumptionsNode is not null)
    {
        assumptions = assumptionsNode is JsonArray items
            ? items.Select(item => item?.ToString() ?? string.Empty).ToList()
            : new List<string> { assumptionsNode.ToString() };
    }

    return new ProposeKqlResult
    {
        Kql = node["kql"]?.ToString() ?? string.Empty,
        Parameters = parameters,
        Assumptions = assumptions,
        Why = node["why"]?.ToString()
    };
}
/// <summary>
/// Asks the configured chat endpoint to propose a KQL query for <paramref name="question"/>,
/// using a caller-supplied system prompt and the tail of the conversation history.
/// </summary>
/// <param name="plannerPrompt">Text sent as the system message.</param>
/// <param name="question">The user's question, sent as "Question: ..." in the final user message.</param>
/// <param name="schemaJson">Schema text appended to the final user message under a "SCHEMA:" heading.</param>
/// <param name="history">Earlier messages; only the last six are forwarded. May be <c>null</c>.</param>
/// <param name="ct">Cancels the HTTP call and the response read.</param>
/// <returns>
/// The model's JSON answer deserialized into a <see cref="ProposeKqlResult"/>, or a result with an
/// empty Kql and empty Parameters when the model output deserializes to <c>null</c>.
/// </returns>
/// <exception cref="HttpRequestException">The endpoint returned a non-success status code.</exception>
/// <exception cref="InvalidOperationException">The response contains no <c>choices[0].message</c>.</exception>
/// <exception cref="JsonException">The response body or the model output cannot be parsed or bound.</exception>
public async Task<ProposeKqlResult> ProposeKqlAsync(string plannerPrompt,
    string question, string schemaJson, IEnumerable<ChatMessage>? history, CancellationToken ct = default)
{
    var messages = new List<object> { new { role = "system", content = plannerPrompt } };
    if (history is not null)
    {
        // NOTE(review): "usedKql" is not a standard chat-message field; confirm the target
        // endpoint accepts extra properties on messages.
        foreach (var m in history.TakeLast(6))
            messages.Add(new { role = m.Role, content = m.Content, usedKql = m.UsedKql });
    }
    var schemaBlock = $"SCHEMA:\n{schemaJson}";
    messages.Add(new { role = "user", content = $"Question: {question}\n\n{schemaBlock}" });

    var payload = new
    {
        model = _opt.Model,
        temperature = _opt.Temperature,
        response_format = new { type = "json_object" },
        messages
    };

    using var req = new HttpRequestMessage(HttpMethod.Post, _opt.Endpoint);
    req.Content = new StringContent(JsonSerializer.Serialize(payload), Encoding.UTF8, "application/json");
    // Azure-hosted endpoints authenticate with an "api-key" header, others with a bearer token.
    if (_opt.IsAzure) req.Headers.Add("api-key", _opt.ApiKey);
    else req.Headers.Authorization = new AuthenticationHeaderValue("Bearer", _opt.ApiKey);

    using var resp = await _http.SendAsync(req, ct);
    resp.EnsureSuccessStatusCode();
    var body = await resp.Content.ReadAsStringAsync(ct);

    // Guard the response shape explicitly: a payload without choices used to surface as a
    // NullReferenceException / ArgumentOutOfRangeException with no hint about the cause.
    var root = JsonNode.Parse(body)!.AsObject();
    var message = (root["choices"] as JsonArray)?.FirstOrDefault()?["message"]
        ?? throw new InvalidOperationException("The LLM response did not contain choices[0].message.");
    // A null content is treated as an empty JSON object, which deserializes to a default result.
    var content = StripCodeFences(message["content"]?.ToString() ?? "{}");

    var opts = new JsonSerializerOptions { PropertyNameCaseInsensitive = true };
    opts.Converters.Add(new FlexibleStringListConverter());
    return JsonSerializer.Deserialize<ProposeKqlResult>(content, opts)
        ?? new ProposeKqlResult { Kql = "", Parameters = new() };
}
/// <summary>
/// Removes a surrounding Markdown code fence (<c>```</c> or <c>```lang</c>) from a model reply.
/// </summary>
/// <param name="s">Raw text; may be <c>null</c>, empty or whitespace.</param>
/// <returns>
/// <paramref name="s"/> unchanged when it is empty or whitespace (an empty string for <c>null</c>);
/// the trimmed text when it does not start with a fence; otherwise the trimmed text between the
/// opening fence and the last closing fence.
/// </returns>
private static string StripCodeFences(string s)
{
    if (string.IsNullOrWhiteSpace(s)) return s ?? string.Empty;

    const string Fence = "```";
    var trimmed = s.Trim();
    // Ordinal: the fence is a literal marker, not linguistic text.
    if (!trimmed.StartsWith(Fence, StringComparison.Ordinal)) return trimmed;

    // Multi-line fence: drop the whole first line (the fence plus an optional language tag).
    // Single-line fence such as ```{...}```: there is no first line to drop, so drop only the
    // opening marker — previously this case was returned with its fences still attached.
    var firstNewline = trimmed.IndexOf('\n');
    var inner = firstNewline >= 0
        ? trimmed.Substring(firstNewline + 1)
        : trimmed.Substring(Fence.Length);

    // Cut at the last closing fence, if there is one.
    var closing = inner.LastIndexOf(Fence, StringComparison.Ordinal);
    if (closing >= 0) inner = inner.Substring(0, closing);

    return inner.Trim();
}
/// <summary>
/// Asks the configured chat endpoint to answer <paramref name="question"/> using only the supplied facts.
/// </summary>
/// <param name="question">The user's question.</param>
/// <param name="factsJson">Query results, embedded in the user message under "Facts(JSON):".</param>
/// <param name="kqlForDisplay">The query text, embedded in the user message under "KQL used:".</param>
/// <param name="ct">Cancels the HTTP call and the response read.</param>
/// <returns>The text of <c>choices[0].message.content</c>.</returns>
/// <exception cref="HttpRequestException">The endpoint returned a non-success status code.</exception>
/// <exception cref="InvalidOperationException">The response carries no message content.</exception>
/// <exception cref="JsonException">The response body is not valid JSON.</exception>
public async Task<string> AnswerFromFactsAsync(string question, string factsJson, string kqlForDisplay, CancellationToken ct = default)
{
    var system = string.Join("\n", new[] {
        "You are a precise analyst.",
        "Answer ONLY from the provided ADX facts. If insufficient, say so.",
        "Be explicit about the time range and columns used.",
        "Ink quantities are stored as nanoliters. Make them humanly readable by converting them to milliliters or liters depending on what makes more sense."
    });
    var user = $"Question: {question}\n\nFacts(JSON):\n{factsJson}\n\nKQL used:\n{kqlForDisplay}";

    var payload = new
    {
        model = _opt.Model,
        // Fixed temperature for this call; the configured _opt.Temperature is not used here.
        temperature = 0.2,
        messages = new object[] {
            new { role = "system", content = system },
            new { role = "user", content = user }
        }
    };

    using var req = new HttpRequestMessage(HttpMethod.Post, _opt.Endpoint);
    req.Content = new StringContent(JsonSerializer.Serialize(payload), Encoding.UTF8, "application/json");
    // Azure-hosted endpoints authenticate with an "api-key" header, others with a bearer token.
    if (_opt.IsAzure) req.Headers.Add("api-key", _opt.ApiKey);
    else req.Headers.Authorization = new AuthenticationHeaderValue("Bearer", _opt.ApiKey);

    using var resp = await _http.SendAsync(req, ct);
    resp.EnsureSuccessStatusCode();
    var body = await resp.Content.ReadAsStringAsync(ct);

    // Guard the response shape explicitly: missing choices or a null content used to surface
    // as a NullReferenceException / ArgumentOutOfRangeException with no hint about the cause.
    var root = JsonNode.Parse(body)!.AsObject();
    var content = (root["choices"] as JsonArray)?.FirstOrDefault()?["message"]?["content"]
        ?? throw new InvalidOperationException("The LLM response did not contain choices[0].message.content.");
    return content.ToString();
}
/// <summary>
/// Stamps the headers used for the OpenAI Assistants calls onto <paramref name="req"/>:
/// a bearer <c>Authorization</c> header built from the configured API key and
/// <c>OpenAI-Beta: assistants=v2</c>.
/// </summary>
/// <param name="req">The outgoing request to decorate.</param>
private void AddOpenAIHeaders(HttpRequestMessage req)
{
    var headers = req.Headers;

    // Must be a standard OpenAI key (sk-...), not an Azure key.
    headers.Authorization = new AuthenticationHeaderValue("Bearer", _opt.ApiKey);

    // Required for Assistants v2.
    headers.Add("OpenAI-Beta", "assistants=v2");

    // Optional scoping headers, if the organisation enforces them:
    //   OpenAI-Organization: <org_xxx>
    //   OpenAI-Project: <proj_xxx>
}
/// <summary>
/// Reads the response body as a string, throws if the status code is not a success code,
/// and disposes the response.
/// </summary>
/// <param name="res">
/// The response to consume. Ownership passes to this method: the response is disposed before
/// returning or throwing, because callers hand over the result of <c>SendAsync</c> directly and
/// never dispose it themselves.
/// </param>
/// <param name="ct">Cancels the body read.</param>
/// <returns>The response body.</returns>
/// <exception cref="HttpRequestException">
/// The status code is not a success code. The message is "{code} {reason}: {body}" and
/// <see cref="HttpRequestException.StatusCode"/> carries the status code.
/// </exception>
private static async Task<string> ReadBodyOrThrowAsync(HttpResponseMessage res, CancellationToken ct)
{
    using (res)
    {
        var body = await res.Content.ReadAsStringAsync(ct);
        if (!res.IsSuccessStatusCode)
        {
            throw new HttpRequestException(
                $"{(int)res.StatusCode} {res.ReasonPhrase}: {body}",
                inner: null,
                statusCode: res.StatusCode);
        }
        return body;
    }
}
/// <summary>
/// Runs a single-turn OpenAI Assistants (v2) exchange on a newly created thread and returns the
/// assistant's reply text.
/// </summary>
/// <param name="assistant">
/// Selects the assistant id (<c>AnswererAssistantId</c> for Data, <c>DocsAssistantId</c> otherwise)
/// and whether facts and KQL are included in the user message.
/// </param>
/// <param name="question">The user's question.</param>
/// <param name="factsJson">Facts included in the message for <see cref="AssistantType.Data"/> only.</param>
/// <param name="kql">Query text included in the message for <see cref="AssistantType.Data"/> only.</param>
/// <param name="ct">Cancels the HTTP calls and the polling delay.</param>
/// <returns>
/// The first text part of the first assistant message in the thread listing, or
/// "(no assistant message found)" when there is none.
/// </returns>
/// <exception cref="HttpRequestException">An API call returned a non-success status code.</exception>
/// <exception cref="InvalidOperationException">
/// The run ended as failed, cancelled, expired or incomplete, or the API returned an object without an id.
/// </exception>
public async Task<string> AnswerWithAssistantAsync(
    AssistantType assistant,
    string question,
    string factsJson,
    string kql,
    CancellationToken ct = default)
{
    const string ApiBase = "https://api.openai.com/v1";

    // Sends one authenticated request and returns its body; request and response are both disposed.
    async Task<string> CallApiAsync(HttpMethod method, string url, HttpContent? content = null)
    {
        using var req = new HttpRequestMessage(method, url) { Content = content };
        AddOpenAIHeaders(req);
        using var res = await _http.SendAsync(req, ct);
        return await ReadBodyOrThrowAsync(res, ct);
    }

    // Reads the "id" property of a JSON object and releases the document's pooled buffers.
    static string ReadId(string json, string kind)
    {
        using var parsed = JsonDocument.Parse(json);
        return parsed.RootElement.GetProperty("id").GetString()
            ?? throw new InvalidOperationException($"OpenAI returned a {kind} without an id.");
    }

    // 1) Create a thread (an empty body is accepted).
    var threadJson = await CallApiAsync(
        HttpMethod.Post,
        $"{ApiBase}/threads",
        new StringContent("{}", Encoding.UTF8, "application/json"));
    var threadId = ReadId(threadJson, "thread");
    var threadUrl = $"{ApiBase}/threads/{threadId}";

    // 2) Add a single user message; only the Data assistant receives the facts and the KQL.
    var messageText = assistant == AssistantType.Data
        ? $"Question:\n{question}\n\nFacts(JSON):\n{factsJson}\n\nKQL used:\n{kql}"
        : $"Question:\n{question}";
    await CallApiAsync(
        HttpMethod.Post,
        $"{threadUrl}/messages",
        // v2 expects "content" to be an array of content parts.
        JsonContent.Create(new
        {
            role = "user",
            content = new object[] { new { type = "text", text = messageText } }
        }));

    // 3) Start a run against the selected assistant.
    var runJson = await CallApiAsync(
        HttpMethod.Post,
        $"{threadUrl}/runs",
        JsonContent.Create(new
        {
            assistant_id = assistant == AssistantType.Data ? _opt.AnswererAssistantId : _opt.DocsAssistantId
        }));
    var runId = ReadId(runJson, "run");

    // 4) Poll the run until it reaches a terminal state.
    while (true)
    {
        await Task.Delay(600, ct);
        var pollJson = await CallApiAsync(HttpMethod.Get, $"{threadUrl}/runs/{runId}");
        using var pollDoc = JsonDocument.Parse(pollJson);
        var run = pollDoc.RootElement;
        var status = run.GetProperty("status").GetString();
        if (status == "completed") break;

        // "incomplete" is terminal as well; without it the loop would poll until cancellation.
        if (status is "failed" or "cancelled" or "expired" or "incomplete")
        {
            var detailProperty = status == "incomplete" ? "incomplete_details" : "last_error";
            var detail = run.TryGetProperty(detailProperty, out var d) ? d.ToString() : "unknown";
            throw new InvalidOperationException($"Assistant run {status}: {detail}");
        }
    }

    // 5) Fetch the messages and return the first assistant text part.
    //    The original code relies on the listing being most-recent-first.
    var listJson = await CallApiAsync(HttpMethod.Get, $"{threadUrl}/messages");
    using var doc = JsonDocument.Parse(listJson);
    foreach (var msg in doc.RootElement.GetProperty("data").EnumerateArray())
    {
        if (msg.GetProperty("role").GetString() != "assistant") continue;

        foreach (var part in msg.GetProperty("content").EnumerateArray())
        {
            if (part.GetProperty("type").GetString() == "text")
                return part.GetProperty("text").GetProperty("value").GetString() ?? "";
        }
    }
    return "(no assistant message found)";
}
/// <summary>
/// Runs one turn of an OpenAI Assistants (v2) conversation, continuing <paramref name="threadId"/>
/// when supplied or creating a new thread otherwise.
/// </summary>
/// <param name="assistant">
/// Selects the assistant id (<c>AnswererAssistantId</c> for Data, <c>DocsAssistantId</c> otherwise)
/// and whether facts and KQL are included in the user message.
/// </param>
/// <param name="question">The user's question.</param>
/// <param name="factsJson">Facts included in the message for <see cref="AssistantType.Data"/> only.</param>
/// <param name="kql">Query text included in the message for <see cref="AssistantType.Data"/> only.</param>
/// <param name="threadId">Existing thread to continue; <c>null</c> or empty creates a new one.</param>
/// <param name="ct">Cancels the HTTP calls and the polling delay.</param>
/// <returns>
/// The thread id used, plus the first text part of the first assistant message in the thread
/// listing (citation markers removed for <see cref="AssistantType.Docs"/>), or
/// "(no assistant message found)" when there is none.
/// </returns>
/// <exception cref="HttpRequestException">An API call returned a non-success status code.</exception>
/// <exception cref="InvalidOperationException">
/// The run ended as failed, cancelled, expired or incomplete, or the API returned an object without an id.
/// </exception>
public async Task<AssistantRunResult> AnswerWithAssistantAsync(
    AssistantType assistant,
    string question,
    string factsJson,
    string kql,
    string? threadId,
    CancellationToken ct = default)
{
    const string ApiBase = "https://api.openai.com/v1";

    // Sends one authenticated request and returns its body; request and response are both disposed.
    async Task<string> CallApiAsync(HttpMethod method, string url, HttpContent? content = null)
    {
        using var req = new HttpRequestMessage(method, url) { Content = content };
        AddOpenAIHeaders(req);
        using var res = await _http.SendAsync(req, ct);
        return await ReadBodyOrThrowAsync(res, ct);
    }

    // Reads the "id" property of a JSON object and releases the document's pooled buffers.
    static string ReadId(string json, string kind)
    {
        using var parsed = JsonDocument.Parse(json);
        return parsed.RootElement.GetProperty("id").GetString()
            ?? throw new InvalidOperationException($"OpenAI returned a {kind} without an id.");
    }

    // 1) Use the existing thread or create a new one.
    if (string.IsNullOrEmpty(threadId))
    {
        var threadJson = await CallApiAsync(
            HttpMethod.Post,
            $"{ApiBase}/threads",
            new StringContent("{}", Encoding.UTF8, "application/json"));
        threadId = ReadId(threadJson, "thread");
    }

    // The thread id may come from the caller, so escape it before splicing it into the URL path.
    // Ids made only of letters, digits, '_' and '-' pass through unchanged.
    var threadUrl = $"{ApiBase}/threads/{Uri.EscapeDataString(threadId)}";

    // 2) Add the user message; only the Data assistant receives the facts and the KQL.
    var messageText = assistant == AssistantType.Data
        ? $"Question:\n{question}\n\nFacts(JSON):\n{factsJson}\n\nKQL used:\n{kql}"
        : $"Question:\n{question}";
    await CallApiAsync(
        HttpMethod.Post,
        $"{threadUrl}/messages",
        JsonContent.Create(new { role = "user", content = new object[] { new { type = "text", text = messageText } } }));

    // 3) Start a run against the selected assistant.
    var runJson = await CallApiAsync(
        HttpMethod.Post,
        $"{threadUrl}/runs",
        JsonContent.Create(new { assistant_id = assistant == AssistantType.Data ? _opt.AnswererAssistantId : _opt.DocsAssistantId }));
    var runId = ReadId(runJson, "run");

    // 4) Poll the run until it reaches a terminal state.
    while (true)
    {
        await Task.Delay(600, ct);
        var pollJson = await CallApiAsync(HttpMethod.Get, $"{threadUrl}/runs/{Uri.EscapeDataString(runId)}");
        using var pollDoc = JsonDocument.Parse(pollJson);
        var run = pollDoc.RootElement;
        var status = run.GetProperty("status").GetString();
        if (status == "completed") break;

        // "incomplete" is terminal as well; without it the loop would poll until cancellation.
        if (status is "failed" or "cancelled" or "expired" or "incomplete")
        {
            var detailProperty = status == "incomplete" ? "incomplete_details" : "last_error";
            var detail = run.TryGetProperty(detailProperty, out var d) ? d.ToString() : "unknown";
            throw new InvalidOperationException($"Assistant run {status}: {detail}");
        }
    }

    // 5) Fetch the messages and return the first assistant text part together with the thread id.
    var listJson = await CallApiAsync(HttpMethod.Get, $"{threadUrl}/messages");
    using var doc = JsonDocument.Parse(listJson);
    foreach (var msg in doc.RootElement.GetProperty("data").EnumerateArray())
    {
        if (msg.GetProperty("role").GetString() != "assistant") continue;

        foreach (var part in msg.GetProperty("content").EnumerateArray())
        {
            if (part.GetProperty("type").GetString() != "text") continue;

            var raw = part.GetProperty("text").GetProperty("value").GetString() ?? "";
            // Only Docs answers have their citation markers removed.
            var cleaned = assistant == AssistantType.Docs ? StripCitations(raw) : raw;
            return new AssistantRunResult { Answer = cleaned, ThreadId = threadId };
        }
    }
    return new AssistantRunResult { Answer = "(no assistant message found)", ThreadId = threadId };
}
/// <summary>
/// Removes inline citation markers — any run enclosed in 【 … 】, e.g. 【4:0†source】 — together
/// with the whitespace immediately preceding each marker.
/// </summary>
/// <param name="s">Text to clean; may be <c>null</c>, empty or whitespace.</param>
/// <returns>
/// <paramref name="s"/> unchanged when it is empty or whitespace (an empty string for <c>null</c>);
/// otherwise the text with every marker removed.
/// </returns>
private static string StripCitations(string s) =>
    string.IsNullOrWhiteSpace(s)
        ? s ?? string.Empty
        : Regex.Replace(s, @"\s*【[^】]*】", string.Empty);
}
}
|