more progress on auto-generation

2025-12-17 13:32:35 +00:00 · 2024-11-15 09:35:38 -08:00 · 2024-11-15 09:35:38 -08:00 · e4509cb568
commit e4509cb568
parent cfa913fdd5
10 changed files with 309 additions and 73 deletions
--- a/llama_stack/providers/remote/inference/ollama/__init__.py
+++ b/llama_stack/providers/remote/inference/ollama/__init__.py
@@ -4,11 +4,34 @@
 # This source code is licensed under the terms described in the LICENSE file in
 # the root directory of this source tree.

+from typing import Optional
+
 from llama_stack.distribution.datatypes import RemoteProviderConfig
+from llama_stack.providers.utils.docker.service_config import DockerComposeServiceConfig
+
+
+DEFAULT_OLLAMA_PORT = 11434


 class OllamaImplConfig(RemoteProviderConfig):
-    port: int = 11434
+    port: int = DEFAULT_OLLAMA_PORT
+
+    @classmethod
+    def sample_docker_compose_config(cls) -> Optional[DockerComposeServiceConfig]:
+        return DockerComposeServiceConfig(
+            image="ollama/ollama:latest",
+            volumes=["$HOME/.ollama:/root/.ollama"],
+            devices=["nvidia.com/gpu=all"],
+            deploy={
+                "resources": {
+                    "reservations": {
+                        "devices": [{"driver": "nvidia", "capabilities": ["gpu"]}]
+                    }
+                }
+            },
+            runtime="nvidia",
+            ports=[f"{DEFAULT_OLLAMA_PORT}:{DEFAULT_OLLAMA_PORT}"],
+        )


 async def get_adapter_impl(config: RemoteProviderConfig, _deps):