From 248237d868ead9d570ac2553b9d1637f3c0b75e3 Mon Sep 17 00:00:00 2001 From: balex Date: Sat, 21 Feb 2026 21:57:50 +0100 Subject: [PATCH] Set expansion advisor model from properties; drop /v1 from Groq base URL --- .../balex/rag/advisors/expansion/ExpansionQueryAdvisor.java | 1 + .../main/java/com/balex/rag/config/RagExpansionProperties.java | 3 ++- rag-service/src/main/resources/application.properties | 2 +- 3 files changed, 4 insertions(+), 2 deletions(-) diff --git a/rag-service/src/main/java/com/balex/rag/advisors/expansion/ExpansionQueryAdvisor.java b/rag-service/src/main/java/com/balex/rag/advisors/expansion/ExpansionQueryAdvisor.java index d51a4ff..ce4485f 100644 --- a/rag-service/src/main/java/com/balex/rag/advisors/expansion/ExpansionQueryAdvisor.java +++ b/rag-service/src/main/java/com/balex/rag/advisors/expansion/ExpansionQueryAdvisor.java @@ -49,6 +49,7 @@ public class ExpansionQueryAdvisor implements BaseAdvisor { public static ExpansionQueryAdvisorBuilder builder(ChatModel chatModel, RagExpansionProperties props) { return new ExpansionQueryAdvisorBuilder().chatClient(ChatClient.builder(chatModel) .defaultOptions(OpenAiChatOptions.builder() + .model(props.model()) .temperature(props.temperature()) .topP(props.topP()) .frequencyPenalty(props.repeatPenalty() - 1.0) // Ollama repeatPenalty 1.0 -> frequencyPenalty 0.0 diff --git a/rag-service/src/main/java/com/balex/rag/config/RagExpansionProperties.java b/rag-service/src/main/java/com/balex/rag/config/RagExpansionProperties.java index 21955cd..c7144dd 100644 --- a/rag-service/src/main/java/com/balex/rag/config/RagExpansionProperties.java +++ b/rag-service/src/main/java/com/balex/rag/config/RagExpansionProperties.java @@ -8,5 +8,6 @@ public record RagExpansionProperties( @DefaultValue("0.0") double temperature, @DefaultValue("1") int topK, @DefaultValue("0.1") double topP, - @DefaultValue("1.0") double repeatPenalty + @DefaultValue("1.0") double repeatPenalty, + @DefaultValue("llama-3.3-70b-versatile") String model ) {} diff --git 
a/rag-service/src/main/resources/application.properties b/rag-service/src/main/resources/application.properties index 84c1a5a..7eef244 100644 --- a/rag-service/src/main/resources/application.properties +++ b/rag-service/src/main/resources/application.properties @@ -1,7 +1,7 @@ spring.application.name=rag-service # --- LLM Provider: Groq (OpenAI-compatible API) --- -spring.ai.openai.base-url=${SPRING_AI_OPENAI_BASE_URL:https://api.groq.com/openai/v1} +spring.ai.openai.base-url=${SPRING_AI_OPENAI_BASE_URL:https://api.groq.com/openai} spring.ai.openai.api-key=${SPRING_AI_OPENAI_API_KEY:} spring.ai.openai.chat.model=${SPRING_AI_OPENAI_CHAT_MODEL:llama-3.3-70b-versatile} spring.jpa.hibernate.ddl-auto=update