Mirror of https://github.com/meta-llama/llama-stack.git (synced 2025-07-29 15:23:51 +00:00)
undo a typo, add a passthrough distribution
This commit is contained in:
parent 67229f23a4
commit 38fd76f85c

2 changed files with 24 additions and 2 deletions
@@ -9,7 +9,7 @@ from typing import List, Optional

 from llama_toolchain.inference.adapters import available_inference_adapters

-from .datatypes import ApiSurface, Distribution
+from .datatypes import ApiSurface, Distribution, PassthroughApiAdapter

 # This is currently duplicated from `requirements.txt` with a few minor changes
 # dev-dependencies like "ufmt" etc. are nuked. A few specialized dependencies
@@ -57,6 +57,28 @@ def available_distributions() -> List[Distribution]:
                 ApiSurface.inference: inference_adapters_by_id["meta-reference"],
             },
         ),
+        Distribution(
+            name="full-passthrough",
+            description="Point to remote services for all llama stack APIs",
+            additional_pip_packages=[
+                "python-dotenv",
+                "blobfile",
+                "codeshield",
+                "fairscale",
+                "fastapi",
+                "fire",
+                "flake8",
+                "httpx",
+                "huggingface-hub",
+            ],
+            adapters={
+                ApiSurface.inference: PassthroughApiAdapter(
+                    api_surface=ApiSurface.inference,
+                    adapter_id="inference-passthrough",
+                    base_url="http://localhost:5001",
+                ),
+            },
+        ),
         Distribution(
             name="local-ollama",
             description="Like local-source, but use ollama for running LLM inference",
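The new full-passthrough distribution forwards inference calls to a remote service instead of running them locally. As a rough sketch of what the PassthroughApiAdapter datatype plausibly looks like, inferred only from the fields used in this diff (api_surface, adapter_id, base_url) and not taken from the actual datatypes module:

# Illustrative sketch only -- the real definition lives in llama_toolchain's
# datatypes module; field names here are inferred from the diff above.
from dataclasses import dataclass
from enum import Enum


class ApiSurface(Enum):
    inference = "inference"


@dataclass
class PassthroughApiAdapter:
    api_surface: ApiSurface  # which llama stack API this adapter fronts
    adapter_id: str          # e.g. "inference-passthrough"
    base_url: str            # remote endpoint to forward to, e.g. http://localhost:5001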
@@ -157,7 +157,7 @@ def create_dynamic_typed_route(func: Any):
             )

             return StreamingResponse(
-                sse_generator(func(request2)), media_type="text/event-stream"
+                sse_generator(func(request)), media_type="text/event-stream"
             )

         else:
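This second hunk is the "undo a typo" half of the commit: the streaming branch wrapped func(request2), a name not defined in that scope, rather than the validated request object. A minimal sketch of the streaming pattern in play, assuming FastAPI and using a stand-in sse_generator rather than the repo's actual helper:

# Illustrative sketch of the server-sent-events streaming pattern being fixed.
# sse_generator here is a stand-in, not the repo's real implementation.
import json
from typing import Any, AsyncGenerator

from fastapi.responses import StreamingResponse


async def sse_generator(event_gen: AsyncGenerator[Any, None]):
    # Wrap each event yielded by the handler as a server-sent event.
    async for event in event_gen:
        yield f"data: {json.dumps(event)}\n\n"


def make_streaming_response(func, request):
    # The typo passed an undefined `request2` here instead of `request`.
    return StreamingResponse(
        sse_generator(func(request)), media_type="text/event-stream"
    )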