Mirror of https://github.com/meta-llama/llama-stack.git (synced 2025-07-29 07:14:20 +00:00)
fix issue w/ enforcing api
parent 21f2e9adf5
commit 07d45f2af3
3 changed files with 14 additions and 7 deletions
@@ -35,6 +35,7 @@ def builtin_automatically_routed_apis() -> List[AutoRoutedApiInfo]:
             routing_table_api=Api.memory_banks,
             router_api=Api.memory,
         ),
+        # TODO: re-enable once we have proper checking on builtin routing: Issue #297
         AutoRoutedApiInfo(
             routing_table_api=Api.datasets,
             router_api=Api.datasetio,
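Each entry above pairs a "routing table" API (the registry, e.g. memory_banks) with the "router" API whose requests it dispatches (e.g. memory). A minimal sketch of the shape of this record, assuming a plain dataclass: the field names come from the diff, while the Api enum shown is an illustrative subset, not the real llama_stack enum.

from dataclasses import dataclass
from enum import Enum

class Api(Enum):
    # illustrative subset of the real llama_stack Api enum
    memory = "memory"
    memory_banks = "memory_banks"
    datasetio = "datasetio"
    datasets = "datasets"

@dataclass
class AutoRoutedApiInfo:
    routing_table_api: Api  # registry API that holds the routing table
    router_api: Api         # API whose calls are auto-routed via that table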
@@ -288,6 +288,8 @@ def main(
     apis_to_serve = set(impls.keys())
 
     for inf in builtin_automatically_routed_apis():
+        if inf.router_api.value not in apis_to_serve:
+            continue
         apis_to_serve.add(inf.routing_table_api.value)
 
     apis_to_serve.add("inspect")
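The added check is the enforcement fix: a builtin routing-table API is only pulled into apis_to_serve when its paired router API is actually configured, instead of unconditionally. A self-contained sketch of that behavior, where ApiInfo and routed_apis are simplified stand-ins for the real llama_stack types, not the actual implementation:

from dataclasses import dataclass

@dataclass
class ApiInfo:
    routing_table_api: str
    router_api: str

def routed_apis():
    return [ApiInfo("memory_banks", "memory"), ApiInfo("datasets", "datasetio")]

apis_to_serve = {"inference", "memory"}  # hypothetical run config: no datasetio

for inf in routed_apis():
    if inf.router_api not in apis_to_serve:
        continue  # datasetio is not served, so the datasets table is not forced in
    apis_to_serve.add(inf.routing_table_api)

apis_to_serve.add("inspect")
print(sorted(apis_to_serve))  # ['inference', 'inspect', 'memory', 'memory_banks']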
@@ -13,14 +13,18 @@ apis:
 - safety
 providers:
   inference:
-  - provider_id: meta-reference
-    provider_type: meta-reference
+  - provider_id: tgi0
+    provider_type: remote::tgi
     config:
-      model: Llama3.1-8B-Instruct
-      quantization: null
-      torch_seed: null
-      max_seq_len: 4096
-      max_batch_size: 1
+      url: http://127.0.0.1:5009
+  # - provider_id: meta-reference
+  #   provider_type: meta-reference
+  #   config:
+  #     model: Llama3.1-8B-Instruct
+  #     quantization: null
+  #     torch_seed: null
+  #     max_seq_len: 4096
+  #     max_batch_size: 1
   safety:
   - provider_id: meta-reference
     provider_type: remote::tgi
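This hunk swaps the run config's inference provider from the local meta-reference implementation to a remote TGI endpoint, leaving the old block commented out for reference. As a quick sanity check on a config like this, a hedged sketch using PyYAML; the file name run.yaml is an assumption, and llama_stack has its own config loader:

import yaml  # PyYAML: pip install pyyaml

with open("run.yaml") as f:  # hypothetical path to the config above
    cfg = yaml.safe_load(f)

# Print each configured provider per API, e.g. "inference: tgi0 (remote::tgi)".
# Commented-out entries in the YAML are ignored by the parser.
for api, providers in cfg["providers"].items():
    for p in providers:
        print(f"{api}: {p['provider_id']} ({p['provider_type']})")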