Merge branch 'master' into ui

This commit is contained in:
Marco Minerva
2025-02-20 10:42:51 +01:00
4 changed files with 15 additions and 5 deletions
+1 -1
View File
@@ -6,7 +6,7 @@ The application is a Minimal API that exposes endpoints to load documents, gener
> [!NOTE] > [!NOTE]
> If you prefer to use straight SQL, check out the [sql branch](https://github.com/marcominerva/SqlDatabaseVectorSearch/tree/sql). > If you prefer to use straight SQL, check out the [sql branch](https://github.com/marcominerva/SqlDatabaseVectorSearch/tree/sql).
![SQL Database Vector Search](https://github.com/marcominerva/SqlDatabaseVectorSearch/blob/master/SqlDatabaseVectorSearch.png) ![SQL Database Vector Search](https://raw.githubusercontent.com/marcominerva/SqlDatabaseVectorSearch/refs/heads/master/SqlDatabaseVectorSearch.png)
## Setup ## Setup
@@ -156,7 +156,14 @@ public class ChatService(IChatCompletionService chatCompletionService, Tokenizer
} }
/// <summary>
/// Stores the chat history of a conversation in the cache, first trimming it so that it
/// holds no more than <c>appSettings.MessageLimit</c> messages.
/// </summary>
/// <param name="conversationId">Conversation identifier; its string form is used as the cache key.</param>
/// <param name="chat">History to store. It is modified in place when it exceeds the limit.</param>
/// <param name="cancellationToken">Token forwarded to the cache write.</param>
private async Task UpdateCacheAsync(Guid conversationId, ChatHistory chat, CancellationToken cancellationToken)
{
    // A negative limit would ask RemoveRange for more items than the history contains,
    // which throws; treat it as zero so a misconfigured value cannot break every cache update.
    var limit = appSettings.MessageLimit < 0 ? 0 : appSettings.MessageLimit;

    if (chat.Count > limit)
    {
        // Entries are dropped from the start of the history
        // (presumably the oldest messages — confirm against how callers append).
        chat.RemoveRange(0, chat.Count - limit);
    }

    await cache.SetAsync(conversationId.ToString(), chat, cancellationToken: cancellationToken);
}
private async Task<ChatHistory> GetChatHistoryAsync(Guid conversationId, CancellationToken cancellationToken) private async Task<ChatHistory> GetChatHistoryAsync(Guid conversationId, CancellationToken cancellationToken)
{ {
@@ -15,4 +15,6 @@ public class AppSettings
public int MaxOutputTokens { get; init; } = 800; public int MaxOutputTokens { get; init; } = 800;
public TimeSpan MessageExpiration { get; init; } public TimeSpan MessageExpiration { get; init; }
public int MessageLimit { get; set; } = 20;
} }
+3 -2
View File
@@ -24,9 +24,10 @@
"MaxTokensPerParagraph": 1000, "MaxTokensPerParagraph": 1000,
"OverlapTokens": 100, "OverlapTokens": 100,
"MaxRelevantChunks": 10, "MaxRelevantChunks": 10,
"MaxInputTokens": 16385, "MaxInputTokens": 16384,
"MaxOutputTokens": 800, "MaxOutputTokens": 800,
"MessageExpiration": "00:05:00" "MessageExpiration": "00:05:00",
"MessageLimit": 20
}, },
"Logging": { "Logging": {
"LogLevel": { "LogLevel": {