Mirror of https://github.com/meta-llama/llama-stack.git, synced 2025-12-14 12:12:45 +00:00.
Improve VLLM model discovery error handling
• Add comprehensive error handling in the check_model_availability method
• Provide helpful error messages with actionable solutions for 404 errors
• Warn when an API token is set but model discovery is disabled
This commit is contained in:
Parent: e9214f9004
Commit: e28bc93635
15 changed files with 69 additions and 50 deletions
|
|
@ -31,7 +31,7 @@ providers:
|
|||
max_tokens: ${env.VLLM_MAX_TOKENS:=4096}
|
||||
api_token: ${env.VLLM_API_TOKEN:=fake}
|
||||
tls_verify: ${env.VLLM_TLS_VERIFY:=true}
|
||||
allow_listing_models: ${env.VLLM_ALLOW_LISTING_MODELS:=true}
|
||||
enable_model_discovery: ${env.VLLM_ENABLE_MODEL_DISCOVERY:=true}
|
||||
- provider_id: ${env.TGI_URL:+tgi}
|
||||
provider_type: remote::tgi
|
||||
config:
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue