mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-07-01 03:58:40 +00:00
fix review comment against health check env var naming
This commit is contained in:
parent
f235e2eca1
commit
61cd8540de
2 changed files with 3 additions and 1 deletions
|
@ -33,7 +33,7 @@ class WatsonXConfig(BaseModel):
|
||||||
description="The Project ID key, only needed of using the hosted service",
|
description="The Project ID key, only needed of using the hosted service",
|
||||||
)
|
)
|
||||||
model_id: str | None = Field(
|
model_id: str | None = Field(
|
||||||
default_factory=lambda: os.getenv("WATSONX_MODEL_ID", "ibm/granite-3-8b-instruct"),
|
default_factory=lambda: os.getenv("WATSONX_HEALTH_CHECK_MODEL_ID", "ibm/granite-3-8b-instruct"),
|
||||||
description="The Model ID key, only needed of using the hosted service",
|
description="The Model ID key, only needed of using the hosted service",
|
||||||
)
|
)
|
||||||
timeout: int = Field(
|
timeout: int = Field(
|
||||||
|
|
|
@ -85,6 +85,8 @@ class WatsonXInferenceAdapter(Inference, ModelRegistryHelper):
|
||||||
Performs a health check by verifying connectivity to the Watsonx server.
|
Performs a health check by verifying connectivity to the Watsonx server.
|
||||||
This method is used by the Provider API to verify
|
This method is used by the Provider API to verify
|
||||||
that the service is running correctly.
|
that the service is running correctly.
|
||||||
|
Set the WATSONX_HEALTH_CHECK_MODEL_ID environment variable to specify the model ID
|
||||||
|
to use for the health check, which defaults to "ibm/granite-3-8b-instruct".
|
||||||
Returns:
|
Returns:
|
||||||
HealthResponse: A dictionary containing the health status.
|
HealthResponse: A dictionary containing the health status.
|
||||||
"""
|
"""
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue