Enhance LLM chat streaming and progress updates

- Implemented SignalR integration for real-time chat streaming in LlmController, replacing the Server-Sent Events endpoint so progress updates are pushed to clients over a hub connection.
- Refactored the AiChat component to consume streamed responses and display progress updates, including iteration status and tool-call results.
- Introduced a new ProgressIndicator component to visually represent the current state of chat processing.
- Updated AiChatService to manage the SignalR hub connection and expose streaming updates as an async generator, keeping the UI responsive during chat sessions.
- Improved error handling and messaging so failures during chat interactions surface as visible in-chat messages.
2026-01-06 18:57:17 +07:00
parent 86e056389d
commit 40a39849f5
5 changed files with 689 additions and 243 deletions
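
Taken together, the new flow is: the client opens a SignalR connection to /llmhub, POSTs the chat request (including its connectionId) to the ChatStream endpoint, receives an immediate 200, and then consumes ProgressUpdate messages pushed to that connection until a final_response or error update ends the stream. A minimal consumption sketch against the service added below (import paths and apiUrl are illustrative):

import { LlmClient } from './generated/ManagingApi'
import { AiChatService } from './services/aiChatService'

async function runChat(): Promise<void> {
  const apiUrl = 'https://localhost:5001' // illustrative
  const service = new AiChatService(new LlmClient({}, apiUrl), apiUrl)

  for await (const update of service.sendMessageStream([
    { role: 'user', content: 'Analyze my last backtest', name: undefined, toolCallId: undefined }
  ])) {
    if (update.type === 'final_response') {
      console.log('Answer:', update.response?.content)
    } else if (update.type === 'error') {
      console.error('Chat failed:', update.error ?? update.message)
    } else {
      // Intermediate updates: thinking / iteration_start / tool_call / tool_result
      console.log(`[${update.type}]`, update.message)
    }
  }
}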

View File

@@ -1,9 +1,11 @@
using System.Text.Json;
using System.Text.RegularExpressions;
using Managing.Application.Abstractions.Services;
using Managing.Application.Hubs;
using Managing.Domain.Users;
using Microsoft.AspNetCore.Authorization;
using Microsoft.AspNetCore.Mvc;
using Microsoft.AspNetCore.SignalR;
using Microsoft.Extensions.Caching.Memory;
namespace Managing.Api.Controllers;
@@ -22,51 +24,50 @@ public class LlmController : BaseController
private readonly IMcpService _mcpService;
private readonly ILogger<LlmController> _logger;
private readonly IMemoryCache _cache;
private readonly IHubContext<LlmHub> _hubContext;
public LlmController(
ILlmService llmService,
IMcpService mcpService,
IUserService userService,
ILogger<LlmController> logger,
IMemoryCache cache) : base(userService)
IMemoryCache cache,
IHubContext<LlmHub> hubContext) : base(userService)
{
_llmService = llmService;
_mcpService = mcpService;
_logger = logger;
_cache = cache;
_hubContext = hubContext;
}
/// <summary>
/// Sends a chat message to an LLM with streaming progress updates (Server-Sent Events).
/// Sends a chat message to an LLM with streaming progress updates via SignalR.
/// Provides real-time updates about iterations, tool calls, and progress similar to Cursor/Claude.
/// Progress updates are sent via SignalR to the specified connectionId.
/// </summary>
/// <param name="request">The chat request with messages and optional provider/API key</param>
/// <returns>Stream of progress updates ending with final response</returns>
/// <param name="request">The chat request with messages, optional provider/API key, and SignalR connectionId</param>
/// <returns>OK status - updates are sent via SignalR</returns>
[HttpPost]
[Route("ChatStream")]
[Produces("text/event-stream")]
public async IAsyncEnumerable<LlmProgressUpdate> ChatStream([FromBody] LlmChatRequest request)
[Consumes("application/json")]
[Produces("application/json")]
public async Task<ActionResult> ChatStream([FromBody] LlmChatStreamRequest request)
{
if (request == null)
if (request == null || string.IsNullOrWhiteSpace(request.ConnectionId))
{
yield return new LlmProgressUpdate
{
Type = "error",
Message = "Chat request is required",
Error = "Chat request is required"
};
yield break;
return BadRequest("Chat request and connectionId are required");
}
if (request.Messages == null || !request.Messages.Any())
{
yield return new LlmProgressUpdate
await _hubContext.Clients.Client(request.ConnectionId).SendAsync("ProgressUpdate", new LlmProgressUpdate
{
Type = "error",
Message = "At least one message is required",
Error = "At least one message is required"
};
yield break;
});
return BadRequest("At least one message is required");
}
User? user = null;
@@ -81,29 +82,56 @@ public class LlmController : BaseController
if (user == null)
{
yield return new LlmProgressUpdate
await _hubContext.Clients.Client(request.ConnectionId).SendAsync("ProgressUpdate", new LlmProgressUpdate
{
Type = "error",
Message = "Error authenticating user",
Error = "Unable to authenticate user"
});
return Unauthorized("Unable to authenticate user");
}
// Process in background to avoid blocking the HTTP response
_ = Task.Run(async () =>
{
try
{
await ChatStreamInternal(request, user, request.ConnectionId);
}
catch (Exception ex)
{
_logger.LogError(ex, "Error processing chat stream for connection {ConnectionId}", request.ConnectionId);
await _hubContext.Clients.Client(request.ConnectionId).SendAsync("ProgressUpdate", new LlmProgressUpdate
{
Type = "error",
Message = $"Error processing chat: {ex.Message}",
Error = ex.Message
});
}
});
return Ok(new { Message = "Chat stream started", ConnectionId = request.ConnectionId });
}
private async Task ChatStreamInternal(LlmChatStreamRequest request, User user, string connectionId)
{
// Convert to LlmChatRequest for service calls
var chatRequest = new LlmChatRequest
{
Messages = request.Messages,
Provider = request.Provider,
ApiKey = request.ApiKey,
Stream = request.Stream,
Temperature = request.Temperature,
MaxTokens = request.MaxTokens,
Tools = request.Tools
};
yield break;
}
await foreach (var update in ChatStreamInternal(request, user))
{
yield return update;
}
}
private async IAsyncEnumerable<LlmProgressUpdate> ChatStreamInternal(LlmChatRequest request, User user)
{
yield return new LlmProgressUpdate
await SendProgressUpdate(connectionId, new LlmProgressUpdate
{
Type = "thinking",
Message = "Initializing conversation and loading available tools..."
};
});
// Get available MCP tools (with caching for 5 minutes)
var availableTools = await _cache.GetOrCreateAsync("mcp_tools", async entry =>
@@ -111,19 +139,19 @@ public class LlmController : BaseController
entry.AbsoluteExpirationRelativeToNow = TimeSpan.FromMinutes(5);
return (await _mcpService.GetAvailableToolsAsync()).ToList();
});
request.Tools = availableTools;
chatRequest.Tools = availableTools;
yield return new LlmProgressUpdate
await SendProgressUpdate(connectionId, new LlmProgressUpdate
{
Type = "thinking",
Message = $"Loaded {availableTools.Count} available tools. Preparing system context..."
};
});
// Add or prepend system message to ensure LLM knows it can respond directly
var existingSystemMessages = request.Messages.Where(m => m.Role == "system").ToList();
var existingSystemMessages = chatRequest.Messages.Where(m => m.Role == "system").ToList();
foreach (var msg in existingSystemMessages)
{
request.Messages.Remove(msg);
chatRequest.Messages.Remove(msg);
}
// Add explicit system message with domain expertise and tool guidance
@@ -132,37 +160,37 @@ public class LlmController : BaseController
Role = "system",
Content = BuildSystemMessage()
};
request.Messages.Insert(0, systemMessage);
chatRequest.Messages.Insert(0, systemMessage);
// Proactively inject backtest details fetching if user is asking for analysis
await InjectBacktestDetailsFetchingIfNeeded(request, user);
await InjectBacktestDetailsFetchingIfNeeded(chatRequest, user);
// Add helpful context extraction message if backtest ID was found
AddBacktestContextGuidance(request);
AddBacktestContextGuidance(chatRequest);
// Iterative tool calling: keep looping until we get a final answer without tool calls
int maxIterations = DetermineMaxIterations(request);
int maxIterations = DetermineMaxIterations(chatRequest);
int iteration = 0;
LlmChatResponse? finalResponse = null;
const int DelayBetweenIterationsMs = 500;
yield return new LlmProgressUpdate
await SendProgressUpdate(connectionId, new LlmProgressUpdate
{
Type = "thinking",
Message = $"Starting analysis (up to {maxIterations} iterations may be needed)..."
};
});
while (iteration < maxIterations)
{
iteration++;
yield return new LlmProgressUpdate
await SendProgressUpdate(connectionId, new LlmProgressUpdate
{
Type = "iteration_start",
Message = $"Iteration {iteration}/{maxIterations}: Analyzing your request and determining next steps...",
Iteration = iteration,
MaxIterations = maxIterations
};
});
_logger.LogInformation("LLM chat iteration {Iteration}/{MaxIterations} for user {UserId}",
iteration, maxIterations, user.Id);
@@ -170,29 +198,29 @@ public class LlmController : BaseController
// Add delay between iterations to avoid rapid bursts and rate limiting
if (iteration > 1)
{
yield return new LlmProgressUpdate
await SendProgressUpdate(connectionId, new LlmProgressUpdate
{
Type = "thinking",
Message = "Waiting briefly to respect rate limits...",
Iteration = iteration,
MaxIterations = maxIterations
};
});
await Task.Delay(DelayBetweenIterationsMs);
}
// Trim context if conversation is getting too long
TrimConversationContext(request);
TrimConversationContext(chatRequest);
// Send chat request to LLM
yield return new LlmProgressUpdate
await SendProgressUpdate(connectionId, new LlmProgressUpdate
{
Type = "thinking",
Message = $"Iteration {iteration}: Sending request to LLM...",
Iteration = iteration,
MaxIterations = maxIterations
};
});
var response = await _llmService.ChatAsync(user, request);
var response = await _llmService.ChatAsync(user, chatRequest);
// If LLM doesn't want to call tools, we have our final answer
if (!response.RequiresToolExecution || response.ToolCalls == null || !response.ToolCalls.Any())
@@ -201,13 +229,13 @@ public class LlmController : BaseController
_logger.LogInformation("LLM provided final answer after {Iteration} iteration(s) for user {UserId}",
iteration, user.Id);
yield return new LlmProgressUpdate
await SendProgressUpdate(connectionId, new LlmProgressUpdate
{
Type = "thinking",
Message = "Received final response. Preparing answer...",
Iteration = iteration,
MaxIterations = maxIterations
};
});
break;
}
@@ -216,19 +244,19 @@ public class LlmController : BaseController
_logger.LogInformation("LLM requested {Count} tool calls in iteration {Iteration} for user {UserId}",
response.ToolCalls.Count, iteration, user.Id);
yield return new LlmProgressUpdate
await SendProgressUpdate(connectionId, new LlmProgressUpdate
{
Type = "thinking",
Message = $"Iteration {iteration}: LLM requested {response.ToolCalls.Count} tool call(s). Executing tools...",
Iteration = iteration,
MaxIterations = maxIterations
};
});
// Execute tool calls sequentially to allow progress updates
var toolResults = new List<LlmMessage>();
foreach (var toolCall in response.ToolCalls)
{
yield return new LlmProgressUpdate
await SendProgressUpdate(connectionId, new LlmProgressUpdate
{
Type = "tool_call",
Message = $"Calling tool: {toolCall.Name}",
@@ -236,7 +264,7 @@ public class LlmController : BaseController
MaxIterations = maxIterations,
ToolName = toolCall.Name,
ToolArguments = toolCall.Arguments
};
});
var (success, result, error) = await ExecuteToolSafely(user, toolCall.Name, toolCall.Arguments, toolCall.Id, iteration, maxIterations);
@@ -245,14 +273,14 @@ public class LlmController : BaseController
_logger.LogInformation("Successfully executed tool {ToolName} in iteration {Iteration} for user {UserId}",
toolCall.Name, iteration, user.Id);
yield return new LlmProgressUpdate
await SendProgressUpdate(connectionId, new LlmProgressUpdate
{
Type = "tool_result",
Message = $"Tool {toolCall.Name} completed successfully",
Iteration = iteration,
MaxIterations = maxIterations,
ToolName = toolCall.Name
};
});
toolResults.Add(new LlmMessage
{
@@ -266,7 +294,7 @@ public class LlmController : BaseController
_logger.LogError("Error executing tool {ToolName} in iteration {Iteration} for user {UserId}: {Error}",
toolCall.Name, iteration, user.Id, error);
yield return new LlmProgressUpdate
await SendProgressUpdate(connectionId, new LlmProgressUpdate
{
Type = "tool_result",
Message = $"Tool {toolCall.Name} encountered an error: {error}",
@@ -274,7 +302,7 @@ public class LlmController : BaseController
MaxIterations = maxIterations,
ToolName = toolCall.Name,
Error = error
};
});
toolResults.Add(new LlmMessage
{
@@ -285,16 +313,16 @@ public class LlmController : BaseController
}
}
yield return new LlmProgressUpdate
await SendProgressUpdate(connectionId, new LlmProgressUpdate
{
Type = "thinking",
Message = $"Iteration {iteration}: All tools completed. Analyzing results...",
Iteration = iteration,
MaxIterations = maxIterations
};
});
// Add assistant message with tool calls to conversation history
request.Messages.Add(new LlmMessage
chatRequest.Messages.Add(new LlmMessage
{
Role = "assistant",
Content = response.Content,
@@ -302,7 +330,7 @@ public class LlmController : BaseController
});
// Add tool results to conversation history
request.Messages.AddRange(toolResults);
chatRequest.Messages.AddRange(toolResults);
// Continue loop to get LLM's response to the tool results
}
@@ -313,26 +341,26 @@ public class LlmController : BaseController
_logger.LogWarning("Reached max iterations ({MaxIterations}) for user {UserId}. Returning last response.",
maxIterations, user.Id);
yield return new LlmProgressUpdate
await SendProgressUpdate(connectionId, new LlmProgressUpdate
{
Type = "thinking",
Message = "Reached maximum iterations. Getting final response...",
Iteration = maxIterations,
MaxIterations = maxIterations
};
});
finalResponse = await _llmService.ChatAsync(user, request);
finalResponse = await _llmService.ChatAsync(user, chatRequest);
}
// Send final response
yield return new LlmProgressUpdate
await SendProgressUpdate(connectionId, new LlmProgressUpdate
{
Type = "final_response",
Message = "Analysis complete!",
Response = finalResponse,
Iteration = iteration,
MaxIterations = maxIterations
};
});
}
/// <summary>
@@ -919,4 +947,30 @@ public class LlmController : BaseController
_logger.LogWarning("No backtest ID found in conversation messages");
return null;
}
/// <summary>
/// Helper method to send progress update via SignalR
/// </summary>
private async Task SendProgressUpdate(string connectionId, LlmProgressUpdate update)
{
try
{
await _hubContext.Clients.Client(connectionId).SendAsync("ProgressUpdate", update);
}
catch (Exception ex)
{
_logger.LogError(ex, "Error sending progress update to connection {ConnectionId}", connectionId);
}
}
}
/// <summary>
/// Request model for LLM chat streaming via SignalR
/// </summary>
public class LlmChatStreamRequest : LlmChatRequest
{
/// <summary>
/// SignalR connection ID to send progress updates to
/// </summary>
public string ConnectionId { get; set; } = string.Empty;
}
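
The controller streams LlmProgressUpdate objects, but the type itself is outside this diff. From the fields used above and in the client code below, its generated TypeScript shape is approximately (field optionality assumed):

import { LlmChatResponse } from './generated/ManagingApiTypes' // path illustrative

// Approximate shape of LlmProgressUpdate, inferred from usage in this commit.
interface LlmProgressUpdate {
  type: string                // 'thinking' | 'iteration_start' | 'tool_call' | 'tool_result' | 'final_response' | 'error'
  message?: string            // human-readable status line rendered in the chat UI
  error?: string              // set on 'error' and on failed 'tool_result' updates
  iteration?: number          // current pass of the tool-calling loop
  maxIterations?: number      // bound computed by DetermineMaxIterations
  toolName?: string           // set on 'tool_call' and 'tool_result'
  toolArguments?: Record<string, unknown> // set on 'tool_call'
  response?: LlmChatResponse  // set on the terminating 'final_response'
}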

View File

@@ -306,14 +306,26 @@ builder.Services
OnMessageReceived = context =>
{
// Skip token extraction for anonymous endpoints to avoid validation errors
var path = context.Request.Path.Value?.ToLower();
if (path != null && (path.EndsWith("/create-token") || path.EndsWith("/authenticate")))
var path = context.Request.Path.Value?.ToLower() ?? "";
if (!string.IsNullOrEmpty(path) && (path.EndsWith("/create-token") || path.EndsWith("/authenticate")))
{
// Clear any token to prevent validation on anonymous endpoints
context.Token = null;
return Task.CompletedTask;
}
// Extract token from query string for SignalR connections
// SignalR uses access_token query parameter for WebSocket connections
if (path.Contains("/bothub") || path.Contains("/backtesthub") || path.Contains("/llmhub"))
{
var accessToken = context.Request.Query["access_token"];
if (!string.IsNullOrEmpty(accessToken))
{
context.Token = accessToken;
return Task.CompletedTask;
}
}
// Handle tokens sent without "Bearer " prefix for authenticated endpoints
// The standard middleware expects "Bearer <token>" but some clients send just the token
if (string.IsNullOrEmpty(context.Token))
@@ -330,13 +342,6 @@ builder.Services
}
}
// If you want to get the token from a custom header or query string
// var accessToken = context.Request.Query["access_token"];
// if (!string.IsNullOrEmpty(accessToken) &&
// context.HttpContext.Request.Path.StartsWithSegments("/hub"))
// {
// context.Token = accessToken;
// }
return Task.CompletedTask;
},
OnAuthenticationFailed = context =>
@@ -438,7 +443,8 @@ builder.Services.AddCors(options =>
policy
.WithOrigins(allowedCorsOrigins)
.WithMethods("GET", "POST", "PUT", "DELETE", "OPTIONS", "PATCH")
.WithHeaders("Content-Type", "Authorization", "X-Requested-With", "X-Correlation-ID")
.WithHeaders("Content-Type", "Authorization", "X-Requested-With", "X-Correlation-ID",
"X-SignalR-User-Agent", "x-requested-with", "x-signalr-user-agent") // SignalR-specific headers
.WithExposedHeaders("Token-Expired", "X-Correlation-ID")
.AllowCredentials()
.SetPreflightMaxAge(TimeSpan.FromHours(24));
@@ -449,7 +455,8 @@ builder.Services.AddCors(options =>
policy
.AllowAnyMethod()
.AllowAnyHeader()
.SetIsOriginAllowed(_ => true);
.SetIsOriginAllowed(_ => true)
.AllowCredentials();
}
});
});
@@ -528,13 +535,16 @@ app.Use(async (context, next) =>
context.Response.Headers.Append("Referrer-Policy", "strict-origin-when-cross-origin");
context.Response.Headers.Append("Permissions-Policy", "geolocation=(), microphone=(), camera=()");
// Content Security Policy - only for non-Swagger endpoints
// Content Security Policy - exclude SignalR hubs and other special endpoints
if (!context.Request.Path.StartsWithSegments("/swagger") &&
!context.Request.Path.StartsWithSegments("/health") &&
!context.Request.Path.StartsWithSegments("/alive"))
!context.Request.Path.StartsWithSegments("/alive") &&
!context.Request.Path.StartsWithSegments("/bothub") &&
!context.Request.Path.StartsWithSegments("/backtesthub") &&
!context.Request.Path.StartsWithSegments("/llmhub"))
{
context.Response.Headers.Append("Content-Security-Policy",
"default-src 'self'; script-src 'self' 'unsafe-inline'; style-src 'self' 'unsafe-inline'; img-src 'self' data: https:; font-src 'self' data:;");
"default-src 'self'; script-src 'self' 'unsafe-inline'; style-src 'self' 'unsafe-inline'; img-src 'self' data: https:; font-src 'self' data:; connect-src 'self' ws: wss:;");
}
// Remove server header (optional - Kestrel can be configured separately)
@@ -577,6 +587,7 @@ app.UseEndpoints(endpoints =>
endpoints.MapControllers();
endpoints.MapHub<BotHub>("/bothub");
endpoints.MapHub<BacktestHub>("/backtesthub");
endpoints.MapHub<LlmHub>("/llmhub");
endpoints.MapHealthChecks("/health", new HealthCheckOptions
{
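
Two of the Program.cs changes work as a pair: browsers cannot attach an Authorization header to a WebSocket upgrade, so the SignalR client supplies the JWT through accessTokenFactory and the OnMessageReceived hook above lifts it out of the access_token query parameter for the three hub paths. A minimal sketch of the client half (hub URL illustrative; aiChatService.ts below is the full version):

import { HubConnection, HubConnectionBuilder } from '@microsoft/signalr'

// Sketch: the factory's token travels as an Authorization header on plain
// HTTP requests, but as ?access_token=<jwt> on the WebSocket upgrade, which
// is the request the OnMessageReceived hook above intercepts for /llmhub.
function buildHubConnection(hubUrl: string, getJwt: () => string): HubConnection {
  return new HubConnectionBuilder()
    .withUrl(hubUrl, { accessTokenFactory: getJwt })
    .build()
}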

View File

@@ -0,0 +1,20 @@
using Microsoft.AspNetCore.Authorization;
using Microsoft.AspNetCore.SignalR;
namespace Managing.Application.Hubs;
/// <summary>
/// SignalR hub for LLM chat streaming with real-time progress updates
/// </summary>
[Authorize]
public class LlmHub : Hub
{
public override async Task OnConnectedAsync()
{
await base.OnConnectedAsync();
await Clients.Caller.SendAsync("Connected", "Connected to LlmHub!");
}
public string GetConnectionId() => Context.ConnectionId;
}
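
The GetConnectionId hub method gives clients a server-authoritative way to discover their connection ID. The AiChatService below reads connection.connectionId locally instead, but the hub method could be invoked like this (a sketch):

import { HubConnection } from '@microsoft/signalr'

// Sketch: ask the server for this client's connection ID via the hub method,
// as an alternative to reading connection.connectionId on the client.
async function getServerConnectionId(connection: HubConnection): Promise<string> {
  return await connection.invoke<string>('GetConnectionId')
}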

View File

@@ -1,13 +1,17 @@
import { useState, useRef, useEffect } from 'react'
import { LlmClient } from '../../generated/ManagingApi'
import { LlmMessage, LlmChatResponse } from '../../generated/ManagingApiTypes'
import { LlmMessage, LlmChatResponse, LlmProgressUpdate } from '../../generated/ManagingApiTypes'
import { AiChatService } from '../../services/aiChatService'
import useApiUrlStore from '../../app/store/apiStore'
interface Message {
role: 'user' | 'assistant' | 'system'
role: 'user' | 'assistant' | 'system' | 'progress'
content: string
timestamp: Date
progressType?: string
iteration?: number
maxIterations?: number
toolName?: string
}
interface AiChatProps {
@@ -26,12 +30,13 @@ function AiChat({ onClose }: AiChatProps): JSX.Element {
const [isLoading, setIsLoading] = useState(false)
const [provider, setProvider] = useState<string>('auto')
const [availableProviders, setAvailableProviders] = useState<string[]>([])
const [currentProgress, setCurrentProgress] = useState<LlmProgressUpdate | null>(null)
const messagesEndRef = useRef<HTMLDivElement>(null)
const { apiUrl, userToken } = useApiUrlStore()
useEffect(() => {
scrollToBottom()
}, [messages])
}, [messages, currentProgress])
useEffect(() => {
loadProviders()
@@ -44,7 +49,7 @@ function AiChat({ onClose }: AiChatProps): JSX.Element {
const loadProviders = async () => {
try {
const llmClient = new LlmClient({}, apiUrl)
const service = new AiChatService(llmClient)
const service = new AiChatService(llmClient, apiUrl)
const providers = await service.getProviders()
setAvailableProviders(['auto', ...providers])
} catch (error) {
@@ -64,14 +69,15 @@ function AiChat({ onClose }: AiChatProps): JSX.Element {
setMessages(prev => [...prev, userMessage])
setInput('')
setIsLoading(true)
setCurrentProgress(null)
try {
const llmClient = new LlmClient({}, apiUrl)
const service = new AiChatService(llmClient)
const service = new AiChatService(llmClient, apiUrl)
// Convert messages to LlmMessage format
const llmMessages: LlmMessage[] = messages
.filter(m => m.role !== 'system' || messages.indexOf(m) === 0) // Include only first system message
.filter(m => m.role !== 'system' && m.role !== 'progress') // Exclude system and progress messages
.map(m => ({
role: m.role,
content: m.content,
@@ -87,18 +93,66 @@ function AiChat({ onClose }: AiChatProps): JSX.Element {
toolCallId: undefined
})
const response: LlmChatResponse = await service.sendMessage(
// Use streaming
let finalResponse: LlmChatResponse | null = null
let lastUpdate: LlmProgressUpdate | null = null
for await (const update of service.sendMessageStream(
llmMessages,
provider === 'auto' ? undefined : provider
)
)) {
lastUpdate = update
setCurrentProgress(update)
const assistantMessage: Message = {
// Handle different update types
if (update.type === 'error') {
const errorMessage: Message = {
role: 'assistant',
content: response.content || 'No response from AI',
content: `Error: ${update.error || update.message || 'Failed to get response from AI'}`,
timestamp: new Date()
}
setMessages(prev => [...prev, errorMessage])
break
}
if (update.type === 'final_response' && update.response) {
finalResponse = update.response
}
}
// Add final response if we got one
if (finalResponse) {
const assistantMessage: Message = {
role: 'assistant',
content: finalResponse.content || 'No response from AI',
timestamp: new Date()
}
setMessages(prev => [...prev, assistantMessage])
} else if (lastUpdate && lastUpdate.type === 'final_response' && lastUpdate.response) {
// Fallback: check lastUpdate in case finalResponse wasn't set
const assistantMessage: Message = {
role: 'assistant',
content: lastUpdate.response.content || 'No response from AI',
timestamp: new Date()
}
setMessages(prev => [...prev, assistantMessage])
} else if (lastUpdate && lastUpdate.type === 'error') {
// Show error message
const errorMessage: Message = {
role: 'assistant',
content: `Error: ${lastUpdate.error || lastUpdate.message || 'Failed to get response from AI'}`,
timestamp: new Date()
}
setMessages(prev => [...prev, errorMessage])
} else {
// If we didn't get a final response, show the last progress message
const assistantMessage: Message = {
role: 'assistant',
content: lastUpdate?.message || 'Response incomplete',
timestamp: new Date()
}
setMessages(prev => [...prev, assistantMessage])
}
} catch (error: any) {
console.error('Error sending message:', error)
const errorMessage: Message = {
@@ -109,6 +163,7 @@ function AiChat({ onClose }: AiChatProps): JSX.Element {
setMessages(prev => [...prev, errorMessage])
} finally {
setIsLoading(false)
setCurrentProgress(null)
}
}
@@ -179,7 +234,17 @@ function AiChat({ onClose }: AiChatProps): JSX.Element {
</div>
</div>
))}
{isLoading && (
{/* Progress Updates */}
{isLoading && currentProgress && (
<div className="flex justify-start">
<div className="bg-base-200 p-3 rounded-lg max-w-[80%]">
<ProgressIndicator progress={currentProgress} />
</div>
</div>
)}
{isLoading && !currentProgress && (
<div className="flex justify-start">
<div className="bg-base-200 p-3 rounded-lg">
<div className="flex gap-1">
@@ -221,4 +286,80 @@ function AiChat({ onClose }: AiChatProps): JSX.Element {
)
}
// Progress Indicator Component
function ProgressIndicator({ progress }: { progress: LlmProgressUpdate }): JSX.Element {
const getIcon = () => {
switch (progress.type) {
case 'iteration_start':
return '🔄'
case 'thinking':
return '💭'
case 'tool_call':
return '🔧'
case 'tool_result':
return progress.error ? '❌' : '✅'
case 'final_response':
return '✨'
case 'error':
return '⚠️'
default:
return '⏳'
}
}
const getColor = () => {
switch (progress.type) {
case 'error':
return 'text-error'
case 'tool_result':
return progress.error ? 'text-error' : 'text-success'
case 'final_response':
return 'text-success'
default:
return 'text-info'
}
}
return (
<div className="space-y-2">
<div className="flex items-center gap-2">
<span className="text-lg">{getIcon()}</span>
<span className={`text-sm font-medium ${getColor()}`}>
{progress.message}
</span>
</div>
{progress.iteration && progress.maxIterations && (
<div className="flex items-center gap-2 text-xs text-base-content/60">
<progress
className="progress progress-primary w-32 h-2"
value={progress.iteration}
max={progress.maxIterations}
/>
<span>Iteration {progress.iteration}/{progress.maxIterations}</span>
</div>
)}
{progress.toolName && (
<div className="text-xs text-base-content/60 mt-1">
<span className="font-mono bg-base-300 px-2 py-1 rounded">
{progress.toolName}
{progress.toolArguments && Object.keys(progress.toolArguments).length > 0 && (
<span className="ml-1 opacity-60">
({Object.keys(progress.toolArguments).length} args)
</span>
)}
</span>
</div>
)}
{progress.error && (
<div className="text-xs text-error mt-1">
{progress.error}
</div>
)}
</div>
)
}
export default AiChat
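
Note that the component constructs a new AiChatService per send and never tears the hub connection down on unmount, while the service caches its HubConnection. A sketch of an explicit cleanup, assuming the component held one stable service instance (e.g. in a useRef):

// Sketch: disconnect the cached hub connection when the chat UI unmounts.
useEffect(() => {
  return () => {
    service.disconnectFromHub().catch(() => {
      // Ignore teardown errors; the connection may already be closed.
    })
  }
}, [])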

View File

@@ -1,11 +1,115 @@
import { HubConnection, HubConnectionBuilder } from '@microsoft/signalr'
import { LlmClient } from '../generated/ManagingApi'
import { LlmChatRequest, LlmChatResponse, LlmMessage } from '../generated/ManagingApiTypes'
import { LlmChatRequest, LlmChatResponse, LlmMessage, LlmProgressUpdate } from '../generated/ManagingApiTypes'
import { Cookies } from 'react-cookie'
export class AiChatService {
private llmClient: LlmClient
private baseUrl: string
private hubConnection: HubConnection | null = null
constructor(llmClient: LlmClient) {
constructor(llmClient: LlmClient, baseUrl: string) {
this.llmClient = llmClient
this.baseUrl = baseUrl
}
/**
* Creates and connects to SignalR hub for LLM chat streaming
*/
async connectToHub(): Promise<HubConnection> {
if (this.hubConnection?.state === 'Connected') {
return this.hubConnection
}
// Clean up existing connection if any
if (this.hubConnection) {
try {
await this.hubConnection.stop()
} catch (e) {
// Ignore stop errors
}
this.hubConnection = null
}
const cookies = new Cookies()
const bearerToken = cookies.get('token')
if (!bearerToken) {
throw new Error('No authentication token found. Please log in first.')
}
// Ensure baseUrl doesn't have trailing slash
const baseUrl = this.baseUrl.endsWith('/') ? this.baseUrl.slice(0, -1) : this.baseUrl
const hubUrl = `${baseUrl}/llmhub`
console.log('Connecting to SignalR hub:', hubUrl)
const connection = new HubConnectionBuilder()
.withUrl(hubUrl, {
// Pass token via query string (standard for SignalR WebSocket connections)
// SignalR will add this as ?access_token=xxx to the negotiation request
accessTokenFactory: () => {
const token = cookies.get('token')
if (!token) {
console.error('Token not available in accessTokenFactory')
throw new Error('Token expired or not available')
}
console.log('Providing token for SignalR connection')
return token
}
})
.withAutomaticReconnect({
nextRetryDelayInMilliseconds: (retryContext) => {
// Backoff: 2s after the first drop, then 10s, then 30s between attempts
if (retryContext.previousRetryCount === 0) return 2000
if (retryContext.previousRetryCount === 1) return 10000
return 30000
}
})
.build()
// Add connection event handlers for debugging
connection.onclose((error) => {
console.log('SignalR connection closed', error)
this.hubConnection = null
})
connection.onreconnecting((error) => {
console.log('SignalR reconnecting', error)
})
connection.onreconnected((connectionId) => {
console.log('SignalR reconnected', connectionId)
})
try {
console.log('Starting SignalR connection...')
await connection.start()
console.log('SignalR connected successfully. Connection ID:', connection.connectionId)
this.hubConnection = connection
return connection
} catch (error: any) {
console.error('Failed to connect to SignalR hub:', error)
console.error('Error details:', {
message: error?.message,
stack: error?.stack,
hubUrl: hubUrl,
hasToken: !!bearerToken
})
// Clean up on failure
this.hubConnection = null
throw new Error(`Failed to connect to SignalR hub: ${error?.message || 'Unknown error'}. Check browser console for details.`)
}
}
/**
* Disconnects from SignalR hub
*/
async disconnectFromHub(): Promise<void> {
if (this.hubConnection) {
await this.hubConnection.stop()
this.hubConnection = null
}
}
/**
@@ -25,6 +129,122 @@ export class AiChatService {
return await this.llmClient.llm_Chat(request)
}
/**
* Send a chat message with streaming progress updates via SignalR
* Returns an async generator that yields progress updates in real-time
*/
async *sendMessageStream(
messages: LlmMessage[],
provider?: string,
apiKey?: string
): AsyncGenerator<LlmProgressUpdate, void, unknown> {
// Connect to SignalR hub
const connection = await this.connectToHub()
const connectionId = connection.connectionId
if (!connectionId) {
yield {
type: 'error',
message: 'Failed to get SignalR connection ID',
error: 'Connection ID not available'
}
return
}
const request = {
messages,
provider: provider || 'auto',
apiKey: apiKey,
stream: true,
temperature: 0.7,
maxTokens: 4096,
tools: undefined, // Will be populated by backend
connectionId: connectionId
}
// Queue for incoming updates
const updateQueue: LlmProgressUpdate[] = []
let isComplete = false
let resolver: ((update: LlmProgressUpdate) => void) | null = null
// Set up progress update handler
const handler = (update: LlmProgressUpdate) => {
if (resolver) {
resolver(update)
resolver = null
} else {
updateQueue.push(update)
}
if (update.type === 'final_response' || update.type === 'error') {
isComplete = true
}
}
connection.on('ProgressUpdate', handler)
try {
// Send chat request to backend
const cookies = new Cookies()
const bearerToken = cookies.get('token')
const response = await fetch(`${this.baseUrl}/Llm/ChatStream`, {
method: 'POST',
headers: {
'Content-Type': 'application/json',
...(bearerToken ? { Authorization: `Bearer ${bearerToken}` } : {})
},
body: JSON.stringify(request)
})
if (!response.ok) {
const errorText = await response.text()
yield {
type: 'error',
message: `HTTP ${response.status}: ${errorText}`,
error: errorText
}
return
}
// Yield updates as they arrive via SignalR
while (!isComplete) {
// Check if we have queued updates
if (updateQueue.length > 0) {
const update = updateQueue.shift()!
yield update
if (update.type === 'final_response' || update.type === 'error') {
break
}
} else {
// Wait for next update
const update = await new Promise<LlmProgressUpdate>((resolve) => {
resolver = resolve
})
yield update
if (update.type === 'final_response' || update.type === 'error') {
break
}
}
}
// Yield any remaining queued updates
while (updateQueue.length > 0) {
yield updateQueue.shift()!
}
} catch (e) {
const error = e instanceof Error ? e : new Error(String(e))
yield {
type: 'error',
message: `Error: ${error.message}`,
error: error.message
}
} finally {
// Clean up handler
connection.off('ProgressUpdate', handler)
}
}
/**
* Get available LLM providers
*/