This commit is contained in:
Xi Yan 2024-10-23 15:19:41 -07:00
parent 07d45f2af3
commit 47d9030542
3 changed files with 8 additions and 12 deletions

View file

@@ -35,7 +35,6 @@ def builtin_automatically_routed_apis() -> List[AutoRoutedApiInfo]:
routing_table_api=Api.memory_banks, routing_table_api=Api.memory_banks,
router_api=Api.memory, router_api=Api.memory,
), ),
# TODO: re-enable once we have proper checking on builtin routing: Issue #297
AutoRoutedApiInfo( AutoRoutedApiInfo(
routing_table_api=Api.datasets, routing_table_api=Api.datasets,
router_api=Api.datasetio, router_api=Api.datasetio,

View file

@@ -288,6 +288,7 @@ def main(
apis_to_serve = set(impls.keys()) apis_to_serve = set(impls.keys())
for inf in builtin_automatically_routed_apis(): for inf in builtin_automatically_routed_apis():
# if we do not serve the corresponding router API, we should not serve the routing table API
if inf.router_api.value not in apis_to_serve: if inf.router_api.value not in apis_to_serve:
continue continue
apis_to_serve.add(inf.routing_table_api.value) apis_to_serve.add(inf.routing_table_api.value)

View file

@@ -13,18 +13,14 @@ apis:
- safety - safety
providers: providers:
inference: inference:
- provider_id: tgi0 - provider_id: meta-reference
provider_type: remote::tgi provider_type: meta-reference
config: config:
url: http://127.0.0.1:5009 model: Llama3.1-8B-Instruct
# - provider_id: meta-reference quantization: null
# provider_type: meta-reference torch_seed: null
# config: max_seq_len: 4096
# model: Llama3.1-8B-Instruct max_batch_size: 1
# quantization: null
# torch_seed: null
# max_seq_len: 4096
# max_batch_size: 1
safety: safety:
- provider_id: meta-reference - provider_id: meta-reference
provider_type: meta-reference provider_type: meta-reference