diff --git a/llama_stack/providers/adapters/inference/ollama/__init__.py b/llama_stack/providers/adapters/inference/ollama/__init__.py index 7763af8d1..68c8077ff 100644 --- a/llama_stack/providers/adapters/inference/ollama/__init__.py +++ b/llama_stack/providers/adapters/inference/ollama/__init__.py @@ -4,16 +4,16 @@ # This source code is licensed under the terms described in the LICENSE file in # the root directory of this source tree. +from typing import List from llama_stack.distribution.datatypes import RemoteProviderConfig - class OllamaImplConfig(RemoteProviderConfig): port: int = 11434 + preload_models: List[str] = ["Llama3.1-8B-Instruct"] - -async def get_adapter_impl(config: RemoteProviderConfig, _deps): +async def get_adapter_impl(config: OllamaImplConfig, _deps): from .ollama import OllamaInferenceAdapter - impl = OllamaInferenceAdapter(config.url) + impl = OllamaInferenceAdapter(config.url, config.preload_models) await impl.initialize() return impl