models endpoint testing

This commit is contained in:
Xi Yan 2024-09-22 00:01:35 -07:00
parent c0199029e5
commit 0348f26e00
10 changed files with 235 additions and 79 deletions

View file

@@ -7,6 +7,7 @@ apis_to_serve:
- safety
- agents
- memory
- models
provider_map:
inference:
provider_id: meta-reference
@@ -16,6 +17,10 @@ provider_map:
torch_seed: null
max_seq_len: 4096
max_batch_size: 1
# inference:
# provider_id: remote::ollama
# config:
# url: https://xxx
safety:
provider_id: meta-reference
config: