mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-10-24 16:57:21 +00:00
# What does this PR do? A step on the path to maintainable implementations of inference providers: make all configs instances of RemoteInferenceProviderConfig. ## Test Plan: CI
34 lines
1 KiB
Python
34 lines
1 KiB
Python
# Copyright (c) Meta Platforms, Inc. and affiliates.
|
|
# All rights reserved.
|
|
#
|
|
# This source code is licensed under the terms described in the LICENSE file in
|
|
# the root directory of this source tree.
|
|
|
|
import os
|
|
from typing import Any
|
|
|
|
from pydantic import Field, SecretStr
|
|
|
|
from llama_stack.providers.utils.inference.model_registry import RemoteInferenceProviderConfig
|
|
from llama_stack.schema_utils import json_schema_type
|
|
|
|
# Cerebras API endpoint used as the fallback for `base_url` when the
# CEREBRAS_BASE_URL environment variable is unset, and as the value emitted
# by `CerebrasImplConfig.sample_run_config`.
DEFAULT_BASE_URL = "https://api.cerebras.ai"
|
|
|
|
|
|
# Connection settings for the remote Cerebras inference provider.
#
# NOTE: both field defaults read the process environment once, at the time
# this module is imported; later changes to the environment are not seen.
# These notes are `#` comments rather than a class docstring so that the
# model's generated schema description is left untouched.
@json_schema_type
class CerebrasImplConfig(RemoteInferenceProviderConfig):
    # Endpoint to talk to; CEREBRAS_BASE_URL overrides the built-in default.
    base_url: str = Field(
        default=os.environ.get("CEREBRAS_BASE_URL", DEFAULT_BASE_URL),
        description="Base URL for the Cerebras API",
    )
    # API key, wrapped so it is masked when the config is printed or logged.
    api_key: SecretStr = Field(
        # Fall back to "" when CEREBRAS_API_KEY is unset: SecretStr(None)
        # would make get_secret_value() return None despite the declared
        # `str` contract (and break len()). An empty secret stays falsy, so
        # "no key configured" checks keep working.
        default=SecretStr(os.environ.get("CEREBRAS_API_KEY", "")),
        description="Cerebras API Key",
    )

    @classmethod
    def sample_run_config(cls, api_key: str = "${env.CEREBRAS_API_KEY:=}", **kwargs) -> dict[str, Any]:
        """Return a sample run-configuration mapping for this provider.

        Args:
            api_key: Value placed under the ``"api_key"`` entry. The default
                is an environment placeholder string (presumably expanded by
                the stack's config loader -- confirm against the loader).
            **kwargs: Accepted for signature compatibility and ignored.

        Returns:
            A dict with ``"base_url"`` set to ``DEFAULT_BASE_URL`` and
            ``"api_key"`` set to the given ``api_key``.
        """
        return {
            "base_url": DEFAULT_BASE_URL,
            "api_key": api_key,
        }
|