diff --git a/llama_stack/providers/remote/inference/watsonx/config.py b/llama_stack/providers/remote/inference/watsonx/config.py
index 0bffae38f..973b9b4d1 100644
--- a/llama_stack/providers/remote/inference/watsonx/config.py
+++ b/llama_stack/providers/remote/inference/watsonx/config.py
@@ -32,7 +32,7 @@ class WatsonXConfig(BaseModel):
         default_factory=lambda: os.getenv("WATSONX_PROJECT_ID"),
         description="The Project ID key, only needed of using the hosted service",
     )
-    model_id: str | None = Field(
+    health_check_model_id: str | None = Field(
         default_factory=lambda: os.getenv("WATSONX_HEALTH_CHECK_MODEL_ID", "ibm/granite-3-8b-instruct"),
         description="The Model ID key, only needed of using the hosted service",
     )
diff --git a/llama_stack/providers/remote/inference/watsonx/watsonx.py b/llama_stack/providers/remote/inference/watsonx/watsonx.py
index 7567fb814..3ec5fce66 100644
--- a/llama_stack/providers/remote/inference/watsonx/watsonx.py
+++ b/llama_stack/providers/remote/inference/watsonx/watsonx.py
@@ -91,7 +91,7 @@ class WatsonXInferenceAdapter(Inference, ModelRegistryHelper):
             HealthResponse: A dictionary containing the health status.
         """
         try:
-            client_model = self._get_client(self._config.model_id)
+            client_model = self._get_client(self._config.health_check_model_id)
             client_model.get_details()
             return HealthResponse(status=HealthStatus.OK)
         except Exception as ex: