feat(ui/model_dashboard.tsx): add databricks models via admin ui

Krrish Dholakia 2024-05-23 20:28:54 -07:00
parent c14584722e
commit f04e4b921b
11 changed files with 263 additions and 9 deletions


@@ -730,6 +730,7 @@ from .utils import (
    ModelResponse,
    ImageResponse,
    ImageObject,
    get_provider_fields,
)
from .llms.huggingface_restapi import HuggingfaceConfig
from .llms.anthropic import AnthropicConfig


@@ -19,6 +19,7 @@ from litellm.llms.custom_httpx.http_handler import AsyncHTTPHandler, HTTPHandler
from .base import BaseLLM
import httpx  # type: ignore
from litellm.types.llms.databricks import GenericStreamingChunk
from litellm.types.utils import ProviderField

class DatabricksError(Exception):

@@ -76,6 +77,23 @@ class DatabricksConfig:
            and v is not None
        }

    def get_required_params(self) -> List[ProviderField]:
        """For a given provider, return its required fields with a description"""
        return [
            ProviderField(
                field_name="api_key",
                field_type="string",
                field_description="Your Databricks API Key.",
                field_value="dapi...",
            ),
            ProviderField(
                field_name="api_base",
                field_type="string",
                field_description="Your Databricks API Base.",
                field_value="https://adb-..",
            ),
        ]

    def get_supported_openai_params(self):
        return ["stream", "stop", "temperature", "top_p", "max_tokens", "n"]


@@ -3390,9 +3390,10 @@
        "output_cost_per_token": 0.00000015,
        "litellm_provider": "anyscale",
        "mode": "chat",
        "supports_function_calling": true,
        "source": "https://docs.anyscale.com/preview/endpoints/text-generation/supported-models/mistralai-Mistral-7B-Instruct-v0.1"
    },
    "anyscale/mistralai/Mixtral-8x7B-Instruct-v0.1": {
        "max_tokens": 16384,
        "max_input_tokens": 16384,
        "max_output_tokens": 16384,
@@ -3400,7 +3401,19 @@
        "output_cost_per_token": 0.00000015,
        "litellm_provider": "anyscale",
        "mode": "chat",
        "supports_function_calling": true,
        "source": "https://docs.anyscale.com/preview/endpoints/text-generation/supported-models/mistralai-Mixtral-8x7B-Instruct-v0.1"
    },
    "anyscale/mistralai/Mixtral-8x22B-Instruct-v0.1": {
        "max_tokens": 65536,
        "max_input_tokens": 65536,
        "max_output_tokens": 65536,
        "input_cost_per_token": 0.00000090,
        "output_cost_per_token": 0.00000090,
        "litellm_provider": "anyscale",
        "mode": "chat",
        "supports_function_calling": true,
        "source": "https://docs.anyscale.com/preview/endpoints/text-generation/supported-models/mistralai-Mixtral-8x22B-Instruct-v0.1"
    },
    "anyscale/HuggingFaceH4/zephyr-7b-beta": {
        "max_tokens": 16384,
@@ -3411,6 +3424,16 @@
        "litellm_provider": "anyscale",
        "mode": "chat"
    },
    "anyscale/google/gemma-7b-it": {
        "max_tokens": 8192,
        "max_input_tokens": 8192,
        "max_output_tokens": 8192,
        "input_cost_per_token": 0.00000015,
        "output_cost_per_token": 0.00000015,
        "litellm_provider": "anyscale",
        "mode": "chat",
        "source": "https://docs.anyscale.com/preview/endpoints/text-generation/supported-models/google-gemma-7b-it"
    },
    "anyscale/meta-llama/Llama-2-7b-chat-hf": {
        "max_tokens": 4096,
        "max_input_tokens": 4096,
@@ -3447,6 +3470,36 @@
        "litellm_provider": "anyscale",
        "mode": "chat"
    },
    "anyscale/codellama/CodeLlama-70b-Instruct-hf": {
        "max_tokens": 4096,
        "max_input_tokens": 4096,
        "max_output_tokens": 4096,
        "input_cost_per_token": 0.000001,
        "output_cost_per_token": 0.000001,
        "litellm_provider": "anyscale",
        "mode": "chat",
        "source": "https://docs.anyscale.com/preview/endpoints/text-generation/supported-models/codellama-CodeLlama-70b-Instruct-hf"
    },
    "anyscale/meta-llama/Meta-Llama-3-8B-Instruct": {
        "max_tokens": 8192,
        "max_input_tokens": 8192,
        "max_output_tokens": 8192,
        "input_cost_per_token": 0.00000015,
        "output_cost_per_token": 0.00000015,
        "litellm_provider": "anyscale",
        "mode": "chat",
        "source": "https://docs.anyscale.com/preview/endpoints/text-generation/supported-models/meta-llama-Meta-Llama-3-8B-Instruct"
    },
    "anyscale/meta-llama/Meta-Llama-3-70B-Instruct": {
        "max_tokens": 8192,
        "max_input_tokens": 8192,
        "max_output_tokens": 8192,
        "input_cost_per_token": 0.00000100,
        "output_cost_per_token": 0.00000100,
        "litellm_provider": "anyscale",
        "mode": "chat",
        "source": "https://docs.anyscale.com/preview/endpoints/text-generation/supported-models/meta-llama-Meta-Llama-3-70B-Instruct"
    },
    "cloudflare/@cf/meta/llama-2-7b-chat-fp16": {
        "max_tokens": 3072,
        "max_input_tokens": 3072,


@@ -5,6 +5,7 @@ from typing import Optional, List, Union, Dict, Literal, Any
from datetime import datetime
import uuid, json, sys, os
from litellm.types.router import UpdateRouterConfig
from litellm.types.utils import ProviderField

def hash_token(token: str):

@@ -364,6 +365,11 @@ class ModelInfo(LiteLLMBase):
        return values

class ProviderInfo(LiteLLMBase):
    name: str
    fields: List[ProviderField]

class BlockUsers(LiteLLMBase):
    user_ids: List[str]  # required


@@ -9364,6 +9364,36 @@ async def delete_model(model_info: ModelInfoDelete):
        )

@router.get(
    "/model/settings",
    description="Returns provider name, description, and required parameters for each provider",
    tags=["model management"],
    dependencies=[Depends(user_api_key_auth)],
    include_in_schema=False,
)
async def model_settings():
    """
    Used by UI to generate 'model add' page
    {
        field_name=field_name,
        field_type=allowed_args[field_name]["type"], # string/int
        field_description=field_info.description or "", # human-friendly description
        field_value=general_settings.get(field_name, None), # example value
    }
    """
    returned_list = []
    for provider in litellm.provider_list:
        returned_list.append(
            ProviderInfo(
                name=provider,
                fields=litellm.get_provider_fields(custom_llm_provider=provider),
            )
        )
    return returned_list

#### EXPERIMENTAL QUEUING ####
async def _litellm_chat_completions_worker(data, user_api_key_dict):
    """


@@ -3342,10 +3342,14 @@ class Router:
            non_default_params = litellm.utils.get_non_default_params(
                passed_params=request_kwargs
            )
            special_params = ["response_object"]
            # check if all params are supported
            for k, v in non_default_params.items():
                if k not in supported_openai_params and k in special_params:
                    # if not -> invalid model
                    verbose_router_logger.debug(
                        f"INVALID MODEL INDEX @ REQUEST KWARG FILTERING, k={k}"
                    )
                    invalid_model_indices.append(idx)

        if len(invalid_model_indices) == len(_returned_deployments):

@@ -3420,6 +3424,7 @@ class Router:
        ## get healthy deployments
        ### get all deployments
        healthy_deployments = [m for m in self.model_list if m["model_name"] == model]

        if len(healthy_deployments) == 0:
            # check if the user sent in a deployment name instead
            healthy_deployments = [

@@ -3510,7 +3515,7 @@ class Router:
        if _allowed_model_region is None:
            _allowed_model_region = "n/a"
        raise ValueError(
            f"{RouterErrors.no_deployments_available.value}, Try again in {self.cooldown_time} seconds. Passed model={model}. pre-call-checks={self.enable_pre_call_checks}, allowed_model_region={_allowed_model_region}"
        )

    if (


@@ -1,6 +1,14 @@
from typing import List, Optional, Union, Dict, Tuple, Literal
from typing_extensions import TypedDict

class CostPerToken(TypedDict):
    input_cost_per_token: float
    output_cost_per_token: float

class ProviderField(TypedDict):
    field_name: str
    field_type: Literal["string"]
    field_description: str
    field_value: str


@@ -34,7 +34,7 @@ from dataclasses import (
import litellm._service_logger  # for storing API inputs, outputs, and metadata
from litellm.llms.custom_httpx.http_handler import HTTPHandler
from litellm.caching import DualCache
from litellm.types.utils import CostPerToken, ProviderField

oidc_cache = DualCache()

@@ -7327,6 +7327,15 @@ def load_test_model(
    }

def get_provider_fields(custom_llm_provider: str) -> List[ProviderField]:
    """Return the fields required for each provider"""
    if custom_llm_provider == "databricks":
        return litellm.DatabricksConfig().get_required_params()
    else:
        return []

def validate_environment(model: Optional[str] = None) -> dict:
    """
    Checks if the environment variables are valid for the given model.
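
Illustrative only: how the helper behaves for providers with and without registered fields, assuming get_provider_fields is re-exported at the package level as the __init__.py hunk above indicates.

import litellm

# Databricks is the only provider with UI fields in this commit; everything else falls through to [].
print(litellm.get_provider_fields(custom_llm_provider="databricks"))  # two ProviderField dicts
print(litellm.get_provider_fields(custom_llm_provider="openai"))      # []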


@@ -0,0 +1,47 @@
import React from "react";
import { Form, Input } from "antd";
import { TextInput } from "@tremor/react";

interface Field {
  field_name: string;
  field_type: string;
  field_description: string;
  field_value: string;
}

interface DynamicFieldsProps {
  fields: Field[];
  selectedProvider: string;
}

const getPlaceholder = (provider: string) => {
  // Implement your placeholder logic based on the provider
  return `Enter your ${provider} value here`;
};

const DynamicFields: React.FC<DynamicFieldsProps> = ({
  fields,
  selectedProvider,
}) => {
  if (fields.length === 0) return null;

  return (
    <>
      {fields.map((field) => (
        <Form.Item
          key={field.field_name}
          rules={[{ required: true, message: "Required" }]}
          label={field.field_name
            .replace(/_/g, " ")
            .replace(/\b\w/g, (char) => char.toUpperCase())}
          name={field.field_name}
          tooltip={field.field_description}
          className="mb-2"
        >
          <TextInput placeholder={field.field_value} type="password" />
        </Form.Item>
      ))}
    </>
  );
};

export default DynamicFields;


@@ -48,6 +48,7 @@ import {
  modelMetricsSlowResponsesCall,
  getCallbacksCall,
  setCallbacksCall,
  modelSettingsCall,
} from "./networking";
import { BarChart, AreaChart } from "@tremor/react";
import {

@@ -84,6 +85,7 @@ import { UploadOutlined } from "@ant-design/icons";
import type { UploadProps } from "antd";
import { Upload } from "antd";
import TimeToFirstToken from "./model_metrics/time_to_first_token";
import DynamicFields from "./model_add/dynamic_form";

interface ModelDashboardProps {
  accessToken: string | null;
  token: string | null;

@@ -107,14 +109,27 @@ interface RetryPolicyObject {
//["OpenAI", "Azure OpenAI", "Anthropic", "Gemini (Google AI Studio)", "Amazon Bedrock", "OpenAI-Compatible Endpoints (Groq, Together AI, Mistral AI, etc.)"]

interface ProviderFields {
  field_name: string;
  field_type: string;
  field_description: string;
  field_value: string;
}

interface ProviderSettings {
  name: string;
  fields: ProviderFields[];
}

enum Providers {
  OpenAI = "OpenAI",
  Azure = "Azure",
  Anthropic = "Anthropic",
  Google_AI_Studio = "Google AI Studio",
  Bedrock = "Amazon Bedrock",
  OpenAI_Compatible = "OpenAI-Compatible Endpoints (Groq, Together AI, Mistral AI, etc.)",
  Vertex_AI = "Vertex AI (Anthropic, Gemini, etc.)",
  Databricks = "Databricks",
}

const provider_map: Record<string, string> = {

@@ -125,6 +140,7 @@ const provider_map: Record<string, string> = {
  Bedrock: "bedrock",
  OpenAI_Compatible: "openai",
  Vertex_AI: "vertex_ai",
  Databricks: "databricks",
};

const retry_policy_map: Record<string, string> = {

@@ -247,6 +263,9 @@ const ModelDashboard: React.FC<ModelDashboardProps> = ({
    isNaN(Number(key))
  );

  const [providerSettings, setProviderSettings] = useState<ProviderSettings[]>(
    []
  );
  const [selectedProvider, setSelectedProvider] = useState<String>("OpenAI");
  const [healthCheckResponse, setHealthCheckResponse] = useState<string>("");
  const [editModalVisible, setEditModalVisible] = useState<boolean>(false);

@@ -514,6 +533,9 @@ const ModelDashboard: React.FC<ModelDashboardProps> = ({
    }

    const fetchData = async () => {
      try {
        const _providerSettings = await modelSettingsCall(accessToken);
        setProviderSettings(_providerSettings);

        // Replace with your actual API call for model data
        const modelDataResponse = await modelInfoCall(
          accessToken,

@@ -945,6 +967,18 @@ const ModelDashboard: React.FC<ModelDashboardProps> = ({
  console.log(`selectedProvider: ${selectedProvider}`);
  console.log(`providerModels.length: ${providerModels.length}`);

  const providerKey = Object.keys(Providers).find(
    (key) => (Providers as { [index: string]: any })[key] === selectedProvider
  );

  let dynamicProviderForm: ProviderSettings | undefined = undefined;
  if (providerKey) {
    dynamicProviderForm = providerSettings.find(
      (provider) => provider.name === provider_map[providerKey]
    );
  }

  return (
    <div style={{ width: "100%", height: "100%" }}>
      <TabGroup className="gap-2 p-8 h-[75vh] w-full mt-2">

@@ -1278,6 +1312,7 @@ const ModelDashboard: React.FC<ModelDashboardProps> = ({
                ))}
              </Select>
            </Form.Item>

            <Form.Item
              rules={[{ required: true, message: "Required" }]}
              label="Public Model Name"

@@ -1340,8 +1375,16 @@ const ModelDashboard: React.FC<ModelDashboardProps> = ({
                </Text>
              </Col>
            </Row>
            {dynamicProviderForm !== undefined &&
              dynamicProviderForm.fields.length > 0 && (
                <DynamicFields
                  fields={dynamicProviderForm.fields}
                  selectedProvider={dynamicProviderForm.name}
                />
              )}
            {selectedProvider != Providers.Bedrock &&
              selectedProvider != Providers.Vertex_AI &&
              dynamicProviderForm === undefined && (
                <Form.Item
                  rules={[{ required: true, message: "Required" }]}
                  label="API Key"


@@ -62,6 +62,40 @@ export const modelCreateCall = async (
  }
};

export const modelSettingsCall = async (accessToken: String) => {
  /**
   * Get all configurable params for setting a model
   */
  try {
    let url = proxyBaseUrl
      ? `${proxyBaseUrl}/model/settings`
      : `/model/settings`;

    //message.info("Requesting model data");
    const response = await fetch(url, {
      method: "GET",
      headers: {
        Authorization: `Bearer ${accessToken}`,
        "Content-Type": "application/json",
      },
    });

    if (!response.ok) {
      const errorData = await response.text();
      message.error(errorData, 10);
      throw new Error("Network response was not ok");
    }

    const data = await response.json();
    //message.info("Received model data");
    return data;
    // Handle success - you might want to update some state or UI based on the created key
  } catch (error) {
    console.error("Failed to get callbacks:", error);
    throw error;
  }
};

export const modelDeleteCall = async (
  accessToken: string,
  model_id: string