Start auto-generating { build, run, doc.md } for distributions

2025-12-17 09:32:36 +00:00 · 2024-11-14 17:44:45 -08:00 · 2024-11-14 17:44:45 -08:00 · cfa913fdd5
commit cfa913fdd5
parent 20bf2f50c2
11 changed files with 362 additions and 23 deletions
--- a/llama_stack/providers/remote/inference/vllm/config.py
+++ b/llama_stack/providers/remote/inference/vllm/config.py
@@ -24,3 +24,12 @@ class VLLMInferenceAdapterConfig(BaseModel):
        default="fake",
        description="The API token",
    )
+
+    @classmethod
+    def sample_dict(cls):
+        # TODO: add separate conda/docker modes; host.docker.internal below presumably resolves only under docker
+        return {
+            "url": "${env.VLLM_URL:http://host.docker.internal:5100/v1}",
+            "max_tokens": "${env.VLLM_MAX_TOKENS:4096}",
+            "api_token": "${env.VLLM_API_TOKEN:fake}",
+        }