diff --git a/rag-service/pom.xml b/rag-service/pom.xml index fe29688..3280b2a 100644 --- a/rag-service/pom.xml +++ b/rag-service/pom.xml @@ -6,12 +6,11 @@ org.springframework.boot spring-boot-starter-parent 3.5.7 - + com.balex rag 0.0.1-SNAPSHOT - rag Backend for queries to RAG @@ -29,6 +28,7 @@ 25 1.0.3 + 2025.0.0 0.2.0 @@ -40,6 +40,16 @@ org.springframework.boot spring-boot-starter-validation + + + org.springframework.boot + spring-boot-starter-actuator + + + + org.springframework.cloud + spring-cloud-starter-consul-discovery + org.apache.commons commons-lang3 @@ -160,6 +170,13 @@ pom import + + org.springframework.cloud + spring-cloud-dependencies + ${spring-cloud.version} + pom + import + diff --git a/rag-service/src/main/resources/application.properties b/rag-service/src/main/resources/application.properties index 14e3da0..6a10acf 100644 --- a/rag-service/src/main/resources/application.properties +++ b/rag-service/src/main/resources/application.properties @@ -5,11 +5,21 @@ spring.ai.openai.base-url=${SPRING_AI_OPENAI_BASE_URL:https://api.groq.com/opena spring.ai.openai.api-key=${SPRING_AI_OPENAI_API_KEY:} spring.ai.openai.chat.model=${SPRING_AI_OPENAI_CHAT_MODEL:llama-3.3-70b-versatile} -# --- Embedding model: use local pgvector with a lightweight model --- -# Groq does not provide an embedding endpoint, so we disable OpenAI embedding auto-config -# and rely on the pgvector store's existing embedding setup +# --- Embedding model: local ONNX (Groq has no embedding API) --- spring.ai.openai.embedding.enabled=false +# --- Consul service discovery --- +spring.cloud.consul.host=${SPRING_CLOUD_CONSUL_HOST:localhost} +spring.cloud.consul.port=${SPRING_CLOUD_CONSUL_PORT:8500} +spring.cloud.consul.discovery.service-name=rag-service +spring.cloud.consul.discovery.instance-id=${spring.application.name}-${random.value} +spring.cloud.consul.discovery.prefer-ip-address=true +spring.cloud.consul.discovery.health-check-interval=10s + +# --- Actuator --- +management.endpoints.web.exposure.include=health,info +management.endpoint.health.show-details=always + jwt.secret=${JWT_SECRET:ywfI6dBznYmHbokihB/OBzZz6E0Fj+6PiqrM8dQ5c3t0HeYarblCbOGM8vQtOt472AtQ+MsCH7OVIKHOzjrPsQ==} jwt.expiration=103600000 spring.datasource.url=${SPRING_DATASOURCE_URL:jdbc:postgresql://localhost:5432/ragdb}