Fix issue with enforcing API

This commit is contained in:
Xi Yan 2024-10-23 15:15:52 -07:00
parent 21f2e9adf5
commit 07d45f2af3
3 changed files with 14 additions and 7 deletions

View file

@ -35,6 +35,7 @@ def builtin_automatically_routed_apis() -> List[AutoRoutedApiInfo]:
routing_table_api=Api.memory_banks,
router_api=Api.memory,
),
# TODO: re-enable once builtin routing is properly checked (see Issue #297)
AutoRoutedApiInfo(
routing_table_api=Api.datasets,
router_api=Api.datasetio,

View file

@ -288,6 +288,8 @@ def main(
apis_to_serve = set(impls.keys())
for inf in builtin_automatically_routed_apis():
if inf.router_api.value not in apis_to_serve:
continue
apis_to_serve.add(inf.routing_table_api.value)
apis_to_serve.add("inspect")

View file

@ -13,14 +13,18 @@ apis:
- safety
providers:
inference:
- provider_id: meta-reference
provider_type: meta-reference
- provider_id: tgi0
provider_type: remote::tgi
config:
model: Llama3.1-8B-Instruct
quantization: null
torch_seed: null
max_seq_len: 4096
max_batch_size: 1
url: http://127.0.0.1:5009
# - provider_id: meta-reference
# provider_type: meta-reference
# config:
# model: Llama3.1-8B-Instruct
# quantization: null
# torch_seed: null
# max_seq_len: 4096
# max_batch_size: 1
safety:
- provider_id: meta-reference
provider_type: meta-reference