mirror of
https://github.com/BerriAI/litellm.git
synced 2025-04-26 11:14:04 +00:00
* remove unused imports * fix AmazonConverseConfig * fix test * fix import * ruff check fixes * test fixes * fix testing * fix imports
132 lines
4.9 KiB
Python
132 lines
4.9 KiB
Python
from typing import Literal, Optional, Tuple, Union
|
|
|
|
from litellm.secret_managers.main import get_secret_str
|
|
|
|
from ...openai.chat.gpt_transformation import OpenAIGPTConfig
|
|
from ..embed.fireworks_ai_transformation import FireworksAIEmbeddingConfig
|
|
|
|
|
|
class FireworksAIConfig(OpenAIGPTConfig):
|
|
"""
|
|
Reference: https://docs.fireworks.ai/api-reference/post-chatcompletions
|
|
|
|
The class `FireworksAIConfig` provides configuration for the Fireworks's Chat Completions API interface. Below are the parameters:
|
|
"""
|
|
|
|
tools: Optional[list] = None
|
|
tool_choice: Optional[Union[str, dict]] = None
|
|
max_tokens: Optional[int] = None
|
|
temperature: Optional[int] = None
|
|
top_p: Optional[int] = None
|
|
top_k: Optional[int] = None
|
|
frequency_penalty: Optional[int] = None
|
|
presence_penalty: Optional[int] = None
|
|
n: Optional[int] = None
|
|
stop: Optional[Union[str, list]] = None
|
|
response_format: Optional[dict] = None
|
|
user: Optional[str] = None
|
|
logprobs: Optional[int] = None
|
|
|
|
# Non OpenAI parameters - Fireworks AI only params
|
|
prompt_truncate_length: Optional[int] = None
|
|
context_length_exceeded_behavior: Optional[Literal["error", "truncate"]] = None
|
|
|
|
def __init__(
|
|
self,
|
|
tools: Optional[list] = None,
|
|
tool_choice: Optional[Union[str, dict]] = None,
|
|
max_tokens: Optional[int] = None,
|
|
temperature: Optional[int] = None,
|
|
top_p: Optional[int] = None,
|
|
top_k: Optional[int] = None,
|
|
frequency_penalty: Optional[int] = None,
|
|
presence_penalty: Optional[int] = None,
|
|
n: Optional[int] = None,
|
|
stop: Optional[Union[str, list]] = None,
|
|
response_format: Optional[dict] = None,
|
|
user: Optional[str] = None,
|
|
logprobs: Optional[int] = None,
|
|
prompt_truncate_length: Optional[int] = None,
|
|
context_length_exceeded_behavior: Optional[Literal["error", "truncate"]] = None,
|
|
) -> None:
|
|
locals_ = locals().copy()
|
|
for key, value in locals_.items():
|
|
if key != "self" and value is not None:
|
|
setattr(self.__class__, key, value)
|
|
|
|
@classmethod
|
|
def get_config(cls):
|
|
return super().get_config()
|
|
|
|
def get_supported_openai_params(self, model: str):
|
|
return [
|
|
"stream",
|
|
"tools",
|
|
"tool_choice",
|
|
"max_completion_tokens",
|
|
"max_tokens",
|
|
"temperature",
|
|
"top_p",
|
|
"top_k",
|
|
"frequency_penalty",
|
|
"presence_penalty",
|
|
"n",
|
|
"stop",
|
|
"response_format",
|
|
"user",
|
|
"logprobs",
|
|
"prompt_truncate_length",
|
|
"context_length_exceeded_behavior",
|
|
]
|
|
|
|
def map_openai_params(
|
|
self,
|
|
non_default_params: dict,
|
|
optional_params: dict,
|
|
model: str,
|
|
drop_params: bool,
|
|
) -> dict:
|
|
|
|
supported_openai_params = self.get_supported_openai_params(model=model)
|
|
for param, value in non_default_params.items():
|
|
if param == "tool_choice":
|
|
if value == "required":
|
|
# relevant issue: https://github.com/BerriAI/litellm/issues/4416
|
|
optional_params["tool_choice"] = "any"
|
|
else:
|
|
# pass through the value of tool choice
|
|
optional_params["tool_choice"] = value
|
|
elif (
|
|
param == "response_format" and value.get("type", None) == "json_schema"
|
|
):
|
|
optional_params["response_format"] = {
|
|
"type": "json_object",
|
|
"schema": value["json_schema"]["schema"],
|
|
}
|
|
elif param == "max_completion_tokens":
|
|
optional_params["max_tokens"] = value
|
|
elif param in supported_openai_params:
|
|
if value is not None:
|
|
optional_params[param] = value
|
|
return optional_params
|
|
|
|
def _get_openai_compatible_provider_info(
|
|
self, model: str, api_base: Optional[str], api_key: Optional[str]
|
|
) -> Tuple[str, Optional[str], Optional[str]]:
|
|
if FireworksAIEmbeddingConfig().is_fireworks_embedding_model(model=model):
|
|
# fireworks embeddings models do not require accounts/fireworks prefix https://docs.fireworks.ai/api-reference/creates-an-embedding-vector-representing-the-input-text
|
|
pass
|
|
elif not model.startswith("accounts/"):
|
|
model = f"accounts/fireworks/models/{model}"
|
|
api_base = (
|
|
api_base
|
|
or get_secret_str("FIREWORKS_API_BASE")
|
|
or "https://api.fireworks.ai/inference/v1"
|
|
) # type: ignore
|
|
dynamic_api_key = api_key or (
|
|
get_secret_str("FIREWORKS_API_KEY")
|
|
or get_secret_str("FIREWORKS_AI_API_KEY")
|
|
or get_secret_str("FIREWORKSAI_API_KEY")
|
|
or get_secret_str("FIREWORKS_AI_TOKEN")
|
|
)
|
|
return model, api_base, dynamic_api_key
|