address feedback

2025-12-21 03:02:25 +00:00 · 2024-11-08 16:11:53 -08:00 · 2024-11-08 16:11:53 -08:00 · d6a9a17828
commit d6a9a17828
parent 772e23e29e
4 changed files with 2 additions and 19 deletions
--- a/llama_stack/providers/inline/inference/vllm/vllm.py
+++ b/llama_stack/providers/inline/inference/vllm/vllm.py
@@ -88,14 +88,6 @@ class VLLMInferenceImpl(Inference, ModelsProtocolPrivate):
            "You cannot dynamically add a model to a running vllm instance"
        )

-    async def list_models(self) -> List[Model]:
-        return [
-            Model(
-                identifier=self.config.model,
-                llama_model=self.config.model,
-            )
-        ]
-
    def _sampling_params(self, sampling_params: SamplingParams) -> VLLMSamplingParams:
        if sampling_params is None:
            return VLLMSamplingParams(max_tokens=self.config.max_tokens)