# Source: ai-lc4j-demos/demo-05/src/main/resources/application.yaml (YAML; 27 lines, 780 B as published)

# Quarkus LangChain4j settings: OpenAI-style chat model plus Easy RAG ingestion.
quarkus:
  langchain4j:
    openai:
      # Intentionally left empty: the text after the colon is a YAML comment,
      # so the value is null until a token is filled in.
      # Do not commit a real token to version control.
      api-key:  # PUT_YOUR_TOKEN_HERE
      # NOTE(review): presumably an OpenAI-compatible inference endpoint
      # (path ends in /v1/) - confirm with the provider.
      base-url: https://inference-llama33-70b-maas.apps.ai.kvant.cloud/v1/
      timeout: 60s
      chat-model:
        model-name: inference-llama33-70b
        # Alternative model, kept for reference:
        # model-name: gpt-4o-mini
        temperature: 1.0
        # max-tokens: 1000
        # frequency-penalty: 2
        frequency-penalty: 0
        # NOTE(review): nesting of the two log-* switches under chat-model is
        # reconstructed from key order - confirm against the original file.
        log-requests: true
        log-responses: true
    easy-rag:
      max-segment-size: 100
      max-overlap-size: 25
      max-results: 3
      # Relative path; it resolves against the process working directory.
      path: src/main/resources/rag
      reuse-embeddings:
        enabled: true
# Application-defined settings for a custom embedding model.
# NOTE(review): `l4j` is not a Quarkus-owned namespace; presumably read by
# application code elsewhere in the project - verify against the consumer.
l4j:
  custom-embedding-model:
    model-name: inference-multilingual-e5l
    base-url: https://inference-multilingual-e5l-maas.apps.ai.kvant.cloud/v1
    # Intentionally left empty: the text after the colon is a YAML comment,
    # so the value is null until a token is filled in.
    # Do not commit a real token to version control.
    api-key:  # PUT_YOUR_TOKEN_HERE