add preliminary llm controller
All checks were successful
Build and Deploy API / build-and-deploy (push) Successful in 8s
All checks were successful
Build and Deploy API / build-and-deploy (push) Successful in 8s
This commit is contained in:
@@ -29,6 +29,8 @@ builder.Services.AddScoped<UserService>();
|
||||
builder.Services.AddScoped<ItemService>();
|
||||
builder.Services.AddScoped<JwtService>();
|
||||
// if this grows sufficiently large we can put elsewhere
|
||||
// misc services that I didn't make
|
||||
builder.Services.AddHttpClient();
|
||||
|
||||
// configuration for jwt authentication
|
||||
builder.Services.AddIdentity<User, IdentityRole>()
|
||||
@@ -110,7 +112,7 @@ if (app.Environment.IsEnvironment("Development")) {
|
||||
app.UseHttpsRedirection();
|
||||
}
|
||||
|
||||
app.MapControllers();
|
||||
app.MapControllers(); // automatically scours src/Controllers for controller classes
|
||||
|
||||
// attempt entity-framework migrations at startup. love you stack overflow
|
||||
using (var scope = app.Services.CreateScope()) {
|
||||
@@ -125,7 +127,6 @@ using (var scope = app.Services.CreateScope()) {
|
||||
Thread.Sleep(5000);
|
||||
}
|
||||
}
|
||||
|
||||
}
|
||||
|
||||
app.Run();
|
||||
|
||||
@@ -6,9 +6,11 @@ using agologumApi.Models;
|
||||
using agologumApi.Services;
|
||||
|
||||
[ApiController]
|
||||
[Route("api/[controller]")]
|
||||
[Route("api/[controller]")] // generally good practice to make this explicit
|
||||
public class ItemsController : ControllerBase {
|
||||
|
||||
// TODO: (global) controllers might eventually need more services, so it's a good idea to give them more meaningful names
|
||||
// i.e. just name it itemService_
|
||||
private readonly ItemService service_;
|
||||
|
||||
public ItemsController(ItemService service) {
|
||||
|
||||
89
api/src/Controllers/LlmController.cs
Normal file
89
api/src/Controllers/LlmController.cs
Normal file
@@ -0,0 +1,89 @@
|
||||
|
||||
// system usings
|
||||
using Microsoft.AspNetCore.Mvc;
|
||||
using Microsoft.AspNetCore.Authorization;
|
||||
using System.Net.Http;
|
||||
using System.Text;
|
||||
using System.Text.Json;
|
||||
// agologum usings
|
||||
using agologumApi.Models;
|
||||
//using agologumApi.Services;
|
||||
|
||||
[ApiController]
[Route("api/chat")]
public class LlmController : ControllerBase {

    // eventually this will be where most of the app sits
    // might create src/Services/Llm/... to better organize
    // private readonly LlmService llmService_;
    private readonly IHttpClientFactory httpClientFactory_;
    private readonly string LLAMA_URL = "http://localhost:8010/completion"; // TODO: can just put this in appsettings

    public LlmController(/* LlmService llmService, */ IHttpClientFactory httpClientFactory) {
        // llmService_ = llmService;
        httpClientFactory_ = httpClientFactory;
    }

    // POST api/chat/stream: forwards the prompt to the llama.cpp server and relays
    // its SSE token stream back to the caller as plain text, token by token.
    // [Authorize(Policy = Permission.SensitiveData_Read)] // will make secret after testing
    [HttpPost("stream")]
    public async Task streamPrompt([FromBody] PromptRequest prompt) {

        // per-request CreateClient is fine: the factory pools and reuses the
        // underlying HttpMessageHandler, so this is cheap (no socket exhaustion)
        var httpClient = httpClientFactory_.CreateClient();

        // json object for llama to parse
        var llamaRequest = new {
            prompt = prompt.Prompt, // alternative would be a messages array
            stream = true,          // real time token streaming
            n_predict = 256         // max amount of tokens
            // other options are temperature, top_p and top_k for vocabulary diversity, stop for stop tokens
            // https://github.com/ggml-org/llama.cpp/blob/master/tools/server/README.md
        };

        // http request to send to the llama server
        var httpRequest = new HttpRequestMessage(HttpMethod.Post, LLAMA_URL) {
            Content = new StringContent(JsonSerializer.Serialize(llamaRequest), Encoding.UTF8, "application/json")
        };

        // FIX: the response was previously never disposed — leaked the connection
        // on every request. ResponseHeadersRead lets us stream the body as it arrives.
        using var response = await httpClient.SendAsync(httpRequest, HttpCompletionOption.ResponseHeadersRead, HttpContext.RequestAborted);
        response.EnsureSuccessStatusCode();
        Response.StatusCode = 200;
        Response.ContentType = "text/plain"; // NOTE(review): upstream speaks SSE; consider "text/event-stream" if the client expects SSE framing

        // relay the upstream stream line-by-line; flow RequestAborted so we stop
        // promptly when the caller disconnects instead of draining the whole stream
        await using var responseStream = await response.Content.ReadAsStreamAsync(HttpContext.RequestAborted);
        using var streamReader = new StreamReader(responseStream);
        string? line;
        while ((line = await streamReader.ReadLineAsync()) != null) {
            if (string.IsNullOrWhiteSpace(line)) continue; // SSE events are separated by blank lines

            // llama.cpp streams events as lines of the form `data: {...json...}`; ignore anything else
            if (!line.StartsWith("data: ", StringComparison.Ordinal)) continue;
            var json = line.Substring(6); // clip the "data: " prefix

            try {
                // each event carries the next token chunk in "content"
                using var doc = JsonDocument.Parse(json);
                if (doc.RootElement.TryGetProperty("content", out var content)) {
                    var text = content.GetString();
                    if (!string.IsNullOrEmpty(text)) {
                        await Response.WriteAsync(text, HttpContext.RequestAborted);
                        await Response.Body.FlushAsync(HttpContext.RequestAborted); // relay outwards as quickly as it flows in
                    }
                }
            } catch (JsonException) {
                // FIX: was a bare `catch { }` that also swallowed cancellation.
                // Malformed event payload — skip this line, keep streaming (best-effort).
            }
        }
    }
}
|
||||
|
||||
/// <summary>
/// Request body for the chat endpoints: carries the raw user prompt.
/// </summary>
public class PromptRequest {
    /// <summary>Prompt text forwarded verbatim to the llama server; never null, defaults to empty.</summary>
    public string Prompt { get; set; } = "";
}
|
||||
Reference in New Issue
Block a user