mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-10-06 04:34:57 +00:00
router table registration works
This commit is contained in:
parent
85d927adde
commit
951cc9d7b7
4 changed files with 91 additions and 27 deletions
|
@ -21,18 +21,22 @@ provider_routing_table:
|
|||
max_seq_len: 4096
|
||||
max_batch_size: 1
|
||||
- routing_key: Meta-Llama3.1-8B
|
||||
provider_id: remote::ollama
|
||||
config:
|
||||
url: http:ollama-url-1.com
|
||||
memory:
|
||||
- routing_key: keyvalue
|
||||
provider_id: remote::pgvector
|
||||
config:
|
||||
host: localhost
|
||||
port: 5432
|
||||
db: vectordb
|
||||
user: vectoruser
|
||||
password: xxxx
|
||||
- routing_key: vector
|
||||
provider_id: meta-reference
|
||||
config: {}
|
||||
config:
|
||||
model: Meta-Llama3.1-8B
|
||||
quantization: null
|
||||
torch_seed: null
|
||||
max_seq_len: 4096
|
||||
max_batch_size: 1
|
||||
# memory:
|
||||
# - routing_key: keyvalue
|
||||
# provider_id: remote::pgvector
|
||||
# config:
|
||||
# host: localhost
|
||||
# port: 5432
|
||||
# db: vectordb
|
||||
# user: vectoruser
|
||||
# password: xxxx
|
||||
# - routing_key: vector
|
||||
# provider_id: meta-reference
|
||||
# config: {}
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue