Ensure models are downloaded before serving in Ollama inference

2025-07-29 15:23:51 +00:00 · 2024-10-06 12:09:22 -04:00 · 2024-10-06 12:09:22 -04:00 · 969a11fb8a
commit 969a11fb8a
parent 0edf24b227
2 changed files with 8 additions and 9 deletions
--- a/llama_stack/providers/adapters/inference/ollama/__init__.py
+++ b/llama_stack/providers/adapters/inference/ollama/__init__.py
@@ -15,12 +15,6 @@ async def get_adapter_impl(config: RemoteProviderConfig, _deps):
    from .ollama import OllamaInferenceAdapter
    impl = OllamaInferenceAdapter(config.url)
-
+    impl._deps = _deps
-    routing_key = _deps.get("routing_key")
+    await impl.initialize()
-    if not routing_key:
-        raise ValueError(
-            "Routing key is required for the Ollama adapter but was not found."
-        )
-    await impl.initialize(routing_key)
    return impl
--- a/llama_stack/providers/adapters/inference/ollama/ollama.py
+++ b/llama_stack/providers/adapters/inference/ollama/ollama.py
@@ -45,10 +45,15 @@ class OllamaInferenceAdapter(Inference, RoutableProviderForModels):
    def client(self) -> AsyncClient:
        return AsyncClient(host=self.url)
-    async def initialize(self, routing_key: str) -> None:
+    async def initialize(self) -> None:
        print("Initializing Ollama, checking connectivity to server...")
        try:
            await self.client.ps()
+            routing_key = self._deps.get("routing_key")
+            if not routing_key:
+                raise ValueError(
+                    "Routing key is required for the Ollama adapter but was not found."
+                )
            ollama_model = self.map_to_provider_model(routing_key)
            print(f"Connected to Ollama server. Pre-downloading {ollama_model}...")
            await self.predownload_models(ollama_model)