GPU
This commit is contained in:
@@ -1,24 +1,29 @@
|
||||
spring.application.name=rag
|
||||
#spring.ai.ollama.base-url=http://localhost:11431
|
||||
spring.ai.ollama.base-url=http://localhost:11434
|
||||
#spring.ai.ollama.chat.model=gemma3:4b-it-q4_K_M
|
||||
spring.ai.ollama.chat.model=llama3.1:8b-instruct-q4_K_M
|
||||
jwt.secret=ywfI6dBznYmHbokihB/OBzZz6E0Fj+6PiqrM8dQ5c3t0HeYarblCbOGM8vQtOt472AtQ+MsCH7OVIKHOzjrPsQ==
|
||||
spring.application.name=rag-service
|
||||
|
||||
# --- LLM Provider: Groq (OpenAI-compatible API) ---
|
||||
spring.ai.openai.base-url=${SPRING_AI_OPENAI_BASE_URL:https://api.groq.com/openai/v1}
|
||||
spring.ai.openai.api-key=${SPRING_AI_OPENAI_API_KEY:}
|
||||
spring.ai.openai.chat.model=${SPRING_AI_OPENAI_CHAT_MODEL:llama-3.3-70b-versatile}
|
||||
|
||||
# --- Embeddings: produced by a lightweight local model, stored in pgvector ---
|
||||
# Groq does not provide an embedding endpoint, so we disable OpenAI embedding auto-config
|
||||
# and rely on the pgvector store's existing embedding setup
|
||||
spring.ai.openai.embedding.enabled=false
|
||||
|
||||
# JWT signing secret, taken from the JWT_SECRET environment variable when it is set.
# NOTE(review): the fallback after ':' is a key committed to source control; anyone with
# repository access can read it. Set JWT_SECRET in every deployed environment and
# consider dropping the default so a missing variable fails fast — confirm with owners.
jwt.secret=${JWT_SECRET:ywfI6dBznYmHbokihB/OBzZz6E0Fj+6PiqrM8dQ5c3t0HeYarblCbOGM8vQtOt472AtQ+MsCH7OVIKHOzjrPsQ==}
|
||||
# Token lifetime. NOTE(review): presumably milliseconds, which would make this about
# 28.8 hours; the value looks like it could be a typo for 3600000 (1 hour) — TODO confirm
# the unit and intended duration against the code that reads this property.
jwt.expiration=103600000
|
||||
spring.datasource.url=jdbc:postgresql://localhost:5432/ragdb
|
||||
spring.datasource.username=postgres
|
||||
spring.datasource.password=postgres
|
||||
spring.datasource.url=${SPRING_DATASOURCE_URL:jdbc:postgresql://localhost:5432/ragdb}
|
||||
spring.datasource.username=${SPRING_DATASOURCE_USERNAME:postgres}
|
||||
spring.datasource.password=${SPRING_DATASOURCE_PASSWORD:postgres}
|
||||
logging.level.org.springframework.ai.chat.client.advisor=DEBUG
|
||||
logging.level.org.springframework.web.servlet.mvc.method.annotation.RequestMappingHandlerMapping=DEBUG
|
||||
logging.level.org.springframework.web=DEBUG
|
||||
logging.level.org.flywaydb=DEBUG
|
||||
logging.level.com.balex.rag.controller=DEBUG
|
||||
app.document.chunk-size=200
|
||||
#spring.main.allow-circular-references=true
|
||||
server.compression.enabled=false
|
||||
server.tomcat.connection-timeout=60000
|
||||
spring.mvc.async.request-timeout=60000
|
||||
#spring.main.web-application-type=reactive
|
||||
end.points.users=/users
|
||||
end.points.id=/{id}
|
||||
end.points.all=/all
|
||||
@@ -31,7 +36,7 @@ end.points.register=/register
|
||||
end.points.chat=/chat
|
||||
end.points.entry=/entry
|
||||
end.points.document=/documents
|
||||
rag.rerank-fetch-multiplier = 2
|
||||
rag.rerank-fetch-multiplier=2
|
||||
# --- Swagger / springdoc ---
|
||||
swagger.servers.first=http://localhost:8080
|
||||
springdoc.swagger-ui.path=/swagger-ui.html
|
||||
|
||||
Reference in New Issue
Block a user