Mirror of https://github.com/meta-llama/llama-stack.git (synced 2025-12-17 17:59:52 +00:00)
Allow setting environment variables from llama stack run and fix ollama
Commit b1d119466e (parent a061f3f8c1)
19 changed files with 129 additions and 55 deletions

Excerpt from the diff of the Ollama distribution template:
@@ -23,9 +23,7 @@ def get_distribution_template() -> DistributionTemplate:
     inference_provider = Provider(
         provider_id="ollama",
         provider_type="remote::ollama",
-        config=OllamaImplConfig.sample_run_config(
-            port_str="${env.OLLAMA_PORT}",
-        ),
+        config=OllamaImplConfig.sample_run_config(),
     )

     inference_model = ModelInput(
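The removed port_str argument implies the sample config no longer derives the Ollama address from a bare port; presumably the updated OllamaImplConfig.sample_run_config (defined elsewhere in this 19-file diff, not shown here) now defaults the full URL to a ${env.OLLAMA_URL} placeholder. A rough sketch under that assumption, with an illustrative field name:

from pydantic import BaseModel


class OllamaImplConfig(BaseModel):
    # Assumed shape: a single `url` field replaces the old host/port pair.
    url: str = "http://localhost:11434"

    @classmethod
    def sample_run_config(cls, url: str = "${env.OLLAMA_URL}", **kwargs) -> dict:
        # The ${env.OLLAMA_URL} placeholder is left in the generated run config
        # and resolved when the stack is actually launched.
        return {"url": url}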
@@ -41,7 +39,7 @@ def get_distribution_template() -> DistributionTemplate:
         name="ollama",
         distro_type="self_hosted",
         description="Use (an external) Ollama server for running LLM inference",
-        docker_image="llamastack/distribution-ollama:test-0.0.52rc3",
+        docker_image=None,
         template_path=Path(__file__).parent / "doc_template.md",
         providers=providers,
         default_models=[inference_model, safety_model],
@@ -74,9 +72,9 @@ def get_distribution_template() -> DistributionTemplate:
                 "meta-llama/Llama-3.2-3B-Instruct",
                 "Inference model loaded into the TGI server",
             ),
-            "OLLAMA_PORT": (
-                "14343",
-                "Port of the Ollama server",
+            "OLLAMA_URL": (
+                "http://host.docker.internal:11434",
+                "URL of the Ollama server",
             ),
             "SAFETY_MODEL": (
                 "meta-llama/Llama-Guard-3-1B",
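The template now advertises OLLAMA_URL (defaulting to http://host.docker.internal:11434 for Docker setups) instead of a bare port. Per the commit title, such ${env.VAR} placeholders can be overridden when invoking llama stack run; the helper below is only an illustrative sketch of that substitution step, not the actual llama-stack code:

import os
import re

_ENV_TOKEN = re.compile(r"\$\{env\.([A-Za-z_][A-Za-z0-9_]*)\}")


def resolve_env_placeholders(value: str, overrides: dict | None = None) -> str:
    """Replace ${env.VAR} tokens, preferring CLI overrides over the process env."""
    overrides = overrides or {}

    def _substitute(match: re.Match) -> str:
        name = match.group(1)
        # Fall back to leaving the token untouched if nothing is set.
        return overrides.get(name, os.environ.get(name, match.group(0)))

    return _ENV_TOKEN.sub(_substitute, value)


# Example:
# resolve_env_placeholders("${env.OLLAMA_URL}", {"OLLAMA_URL": "http://localhost:11434"})
# -> "http://localhost:11434"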