diff --git a/.gitignore b/.gitignore index 00cd35c5b..de1c7598f 100644 --- a/.gitignore +++ b/.gitignore @@ -40,7 +40,7 @@ ui/litellm-dashboard/node_modules ui/litellm-dashboard/next-env.d.ts ui/litellm-dashboard/package.json ui/litellm-dashboard/package-lock.json -deploy/charts/litellm-helm/*.tgz -deploy/charts/litellm-helm/charts/* +deploy/charts/litellm/*.tgz +deploy/charts/litellm/charts/* deploy/charts/*.tgz litellm/proxy/vertex_key.json diff --git a/deploy/charts/litellm-helm/templates/deployment-ui.yaml b/deploy/charts/litellm-helm/templates/deployment-ui.yaml deleted file mode 100644 index f949e2029..000000000 --- a/deploy/charts/litellm-helm/templates/deployment-ui.yaml +++ /dev/null @@ -1,89 +0,0 @@ -{{- if .Values.ui.enabled -}} -apiVersion: apps/v1 -kind: Deployment -metadata: - name: {{ include "litellm.fullname" . }}-ui - labels: - {{- include "litellm.labels" . | nindent 4 }} -spec: - {{- if not .Values.ui.autoscaling.enabled }} - replicas: {{ .Values.ui.replicaCount }} - {{- end }} - selector: - matchLabels: - {{- include "litellm.ui.selectorLabels" . | nindent 6 }} - template: - metadata: - {{- with .Values.podAnnotations }} - annotations: - {{- toYaml . | nindent 8 }} - {{- end }} - labels: - {{- include "litellm.ui.labels" . | nindent 8 }} - {{- with .Values.ui.podLabels }} - {{- toYaml . | nindent 8 }} - {{- end }} - spec: - {{- with .Values.imagePullSecrets }} - imagePullSecrets: - {{- toYaml . | nindent 8 }} - {{- end }} - serviceAccountName: {{ include "litellm.serviceAccountName" . }} - securityContext: - {{- toYaml .Values.ui.podSecurityContext | nindent 8 }} - containers: - - name: {{ include "litellm.name" . 
}}-ui - securityContext: - {{- toYaml .Values.ui.securityContext | nindent 12 }} - image: "{{ .Values.ui.image.repository }}:{{ .Values.ui.image.tag | default (printf "main-%s" .Chart.AppVersion) }}" - imagePullPolicy: {{ .Values.ui.image.pullPolicy }} - env: - - name: BASE_URL - value: {{ (index .Values.ui.ingress.hosts 0).host | default "example.com" }} - ports: - - name: http - containerPort: {{ .Values.ui.service.port }} - protocol: TCP - livenessProbe: - httpGet: - path: / - port: http - readinessProbe: - httpGet: - path: / - port: http - # Give the container time to start up. Up to 5 minutes (10 * 30 seconds) - startupProbe: - httpGet: - path: / - port: http - failureThreshold: 30 - periodSeconds: 10 - resources: - {{- toYaml .Values.ui.resources | nindent 12 }} - volumeMounts: - - name: tmp - mountPath: /tmp - {{- with .Values.ui.volumeMounts }} - {{- toYaml . | nindent 12 }} - {{- end }} - volumes: - - name: tmp - emptyDir: - sizeLimit: 500Mi - {{- with .Values.ui.volumes }} - {{- toYaml . | nindent 8 }} - {{- end }} - {{- with .Values.ui.nodeSelector }} - nodeSelector: - {{- toYaml . | nindent 8 }} - {{- end }} - {{- with .Values.ui.affinity }} - affinity: - {{- toYaml . | nindent 8 }} - {{- end }} - {{- with .Values.ui.tolerations }} - tolerations: - {{- toYaml . | nindent 8 }} - {{- end }} -{{- end -}} \ No newline at end of file diff --git a/deploy/charts/litellm-helm/templates/ingress-ui.yaml b/deploy/charts/litellm-helm/templates/ingress-ui.yaml deleted file mode 100644 index 791ccf2b0..000000000 --- a/deploy/charts/litellm-helm/templates/ingress-ui.yaml +++ /dev/null @@ -1,61 +0,0 @@ -{{- if .Values.ui.ingress.enabled -}} -{{- $fullName := (printf "%s%s" (include "litellm.fullname" .) 
"-ui") -}} -{{- $svcPort := .Values.ui.service.port -}} -{{- if and .Values.ui.ingress.className (not (semverCompare ">=1.18-0" .Capabilities.KubeVersion.GitVersion)) }} - {{- if not (hasKey .Values.ui.ingress.annotations "kubernetes.io/ingress.class") }} - {{- $_ := set .Values.ui.ingress.annotations "kubernetes.io/ingress.class" .Values.ui.ingress.className}} - {{- end }} -{{- end }} -{{- if semverCompare ">=1.19-0" .Capabilities.KubeVersion.GitVersion -}} -apiVersion: networking.k8s.io/v1 -{{- else if semverCompare ">=1.14-0" .Capabilities.KubeVersion.GitVersion -}} -apiVersion: networking.k8s.io/v1beta1 -{{- else -}} -apiVersion: extensions/v1beta1 -{{- end }} -kind: Ingress -metadata: - name: {{ $fullName }} - labels: - {{- include "litellm.ui.labels" . | nindent 4 }} - {{- with .Values.ui.ingress.annotations }} - annotations: - {{- toYaml . | nindent 4 }} - {{- end }} -spec: - {{- if and .Values.ui.ingress.className (semverCompare ">=1.18-0" .Capabilities.KubeVersion.GitVersion) }} - ingressClassName: {{ .Values.ui.ingress.className }} - {{- end }} - {{- if .Values.ui.ingress.tls }} - tls: - {{- range .Values.ui.ingress.tls }} - - hosts: - {{- range .hosts }} - - {{ . 
| quote }} - {{- end }} - secretName: {{ .secretName }} - {{- end }} - {{- end }} - rules: - {{- range .Values.ui.ingress.hosts }} - - host: {{ .host | quote }} - http: - paths: - {{- range .paths }} - - path: {{ .path }} - {{- if and .pathType (semverCompare ">=1.18-0" $.Capabilities.KubeVersion.GitVersion) }} - pathType: {{ .pathType }} - {{- end }} - backend: - {{- if semverCompare ">=1.19-0" $.Capabilities.KubeVersion.GitVersion }} - service: - name: {{ $fullName }} - port: - number: {{ $svcPort }} - {{- else }} - serviceName: {{ $fullName }} - servicePort: {{ $svcPort }} - {{- end }} - {{- end }} - {{- end }} -{{- end }} diff --git a/deploy/charts/litellm-helm/templates/service-ui.yaml b/deploy/charts/litellm-helm/templates/service-ui.yaml deleted file mode 100644 index 50781899d..000000000 --- a/deploy/charts/litellm-helm/templates/service-ui.yaml +++ /dev/null @@ -1,17 +0,0 @@ -{{- if .Values.ui.enabled -}} -apiVersion: v1 -kind: Service -metadata: - name: {{ include "litellm.fullname" . }}-ui - labels: - {{- include "litellm.labels" . | nindent 4 }} -spec: - type: {{ .Values.ui.service.type }} - ports: - - port: {{ .Values.ui.service.port }} - targetPort: http - protocol: TCP - name: http - selector: - {{- include "litellm.ui.selectorLabels" . 
| nindent 4 }} -{{ end -}} \ No newline at end of file diff --git a/deploy/charts/litellm-helm/.helmignore b/deploy/charts/litellm/.helmignore similarity index 100% rename from deploy/charts/litellm-helm/.helmignore rename to deploy/charts/litellm/.helmignore diff --git a/deploy/charts/litellm-helm/Chart.lock b/deploy/charts/litellm/Chart.lock similarity index 100% rename from deploy/charts/litellm-helm/Chart.lock rename to deploy/charts/litellm/Chart.lock diff --git a/deploy/charts/litellm-helm/Chart.yaml b/deploy/charts/litellm/Chart.yaml similarity index 96% rename from deploy/charts/litellm-helm/Chart.yaml rename to deploy/charts/litellm/Chart.yaml index 80eaf87dd..6ecdebb50 100644 --- a/deploy/charts/litellm-helm/Chart.yaml +++ b/deploy/charts/litellm/Chart.yaml @@ -2,7 +2,7 @@ apiVersion: v2 # We can't call ourselves just "litellm" because then we couldn't publish to the # same OCI repository as the "litellm" OCI image -name: litellm-helm +name: litellm description: Call all LLM APIs using the OpenAI format # A chart can be either an 'application' or a 'library' chart. @@ -18,17 +18,16 @@ type: application # This is the chart version. This version number should be incremented each time you make changes # to the chart and its templates, including the app version. # Versions are expected to follow Semantic Versioning (https://semver.org/) -version: 0.1.0 +version: 0.2.0 # This is the version number of the application being deployed. This version number should be # incremented each time you make changes to the application. Versions are not expected to # follow Semantic Versioning. They should reflect the version the application is using. # It is recommended to use it with quotes. 
-appVersion: v1.18.9 +appVersion: v1.24.5 dependencies: - name: "postgresql" version: ">=13.3.0" repository: oci://registry-1.docker.io/bitnamicharts condition: db.deployStandalone - diff --git a/deploy/charts/litellm-helm/README.md b/deploy/charts/litellm/README.md similarity index 73% rename from deploy/charts/litellm-helm/README.md rename to deploy/charts/litellm/README.md index bf87501b3..daba8aa68 100644 --- a/deploy/charts/litellm-helm/README.md +++ b/deploy/charts/litellm/README.md @@ -43,20 +43,6 @@ data: type: Opaque ``` -### LiteLLM Admin UI Settings - -| Name | Description | Value | -| ---------------------------------------------------------- | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- | ----- | -| `ui.enabled` | Should the LiteLLM Admin UI be deployed | `true` | -| `ui.replicaCount` | The number of LiteLLM Admin UI pods to be deployed | `1` | -| `ui.image.repository` | LiteLLM Admin UI image repository | `ghcr.io/berriai/litellm` | -| `ui.image.pullPolicy` | LiteLLM Admin UI image pull policy | `IfNotPresent` | -| `ui.image.tag` | Overrides the image tag whose default the latest version of LiteLLM at the time this chart was published. | `""` | -| `ui.imagePullSecrets` | Registry credentials for the above images. | `[]` | -| `ui.service.type` | Kubernetes Service type (e.g. `LoadBalancer`, `ClusterIP`, etc.) | `ClusterIP` | -| `ui.service.port` | TCP port that the Kubernetes Service will listen on. Also the TCP port within the Pod that the web server will listen on. 
| `8000` | -| `ui.ingress.*` | See [values.yaml](./values.yaml) for example settings | N/A | - ### Database Settings | Name | Description | Value | | ---------------------------------------------------------- | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- | ----- | @@ -86,18 +72,18 @@ type: Opaque ``` ## Accessing the Admin UI -When browsing to the URL published per the settings in `ui.ingress.*`, you will +When browsing to the URL published per the settings in `ingress.*`, you will be prompted for **Admin Configuration**. The **Proxy Endpoint** is the internal -(from the `litellm-ui` pod's perspective) URL published by the `litellm-proxy` +(from the `litellm` pod's perspective) URL published by the `-litellm` Kubernetes Service. If the deployment uses the default settings for this -service, the **Proxy Endpoint** should be set to `http://litellm-proxy:8000`. +service, the **Proxy Endpoint** should be set to `http://-litellm:8000`. The **Proxy Key** is the value specified for `masterkey` or, if a `masterkey` was not provided to the helm command line, the `masterkey` is a randomly -generated string stored in the `litellm-masterkey` Kubernetes Secret. +generated string stored in the `-litellm-masterkey` Kubernetes Secret. 
```bash -kubectl -n litellm get secret litellm-masterkey -o jsonpath="{.data.masterkey}" +kubectl -n litellm get secret -litellm-masterkey -o jsonpath="{.data.masterkey}" ``` ## Admin UI Limitations diff --git a/deploy/charts/litellm-helm/templates/NOTES.txt b/deploy/charts/litellm/templates/NOTES.txt similarity index 100% rename from deploy/charts/litellm-helm/templates/NOTES.txt rename to deploy/charts/litellm/templates/NOTES.txt diff --git a/deploy/charts/litellm-helm/templates/_helpers.tpl b/deploy/charts/litellm/templates/_helpers.tpl similarity index 79% rename from deploy/charts/litellm-helm/templates/_helpers.tpl rename to deploy/charts/litellm/templates/_helpers.tpl index 7e7aa8f4c..b8893d07c 100644 --- a/deploy/charts/litellm-helm/templates/_helpers.tpl +++ b/deploy/charts/litellm/templates/_helpers.tpl @@ -41,14 +41,6 @@ app.kubernetes.io/version: {{ .Chart.AppVersion | quote }} {{- end }} app.kubernetes.io/managed-by: {{ .Release.Service }} {{- end }} -{{- define "litellm.ui.labels" -}} -helm.sh/chart: {{ include "litellm.chart" . }} -{{ include "litellm.ui.selectorLabels" . }} -{{- if .Chart.AppVersion }} -app.kubernetes.io/version: {{ .Chart.AppVersion | quote }} -{{- end }} -app.kubernetes.io/managed-by: {{ .Release.Service }} -{{- end }} {{/* Selector labels @@ -57,10 +49,6 @@ Selector labels app.kubernetes.io/name: {{ include "litellm.name" . }} app.kubernetes.io/instance: {{ .Release.Name }} {{- end }} -{{- define "litellm.ui.selectorLabels" -}} -app.kubernetes.io/name: {{ include "litellm.name" . 
}}-ui -app.kubernetes.io/instance: {{ .Release.Name }} -{{- end }} {{/* Create the name of the service account to use diff --git a/deploy/charts/litellm-helm/templates/configmap-litellm.yaml b/deploy/charts/litellm/templates/configmap-litellm.yaml similarity index 100% rename from deploy/charts/litellm-helm/templates/configmap-litellm.yaml rename to deploy/charts/litellm/templates/configmap-litellm.yaml diff --git a/deploy/charts/litellm-helm/templates/deployment-proxy.yaml b/deploy/charts/litellm/templates/deployment.yaml similarity index 89% rename from deploy/charts/litellm-helm/templates/deployment-proxy.yaml rename to deploy/charts/litellm/templates/deployment.yaml index cdcd207c0..6ed112dac 100644 --- a/deploy/charts/litellm-helm/templates/deployment-proxy.yaml +++ b/deploy/charts/litellm/templates/deployment.yaml @@ -1,7 +1,7 @@ apiVersion: apps/v1 kind: Deployment metadata: - name: {{ include "litellm.fullname" . }}-proxy + name: {{ include "litellm.fullname" . }} labels: {{- include "litellm.labels" . | nindent 4 }} spec: @@ -41,12 +41,12 @@ spec: - name: DATABASE_USERNAME valueFrom: secretKeyRef: - name: {{ include "litellm.name" . }}-dbcredentials + name: {{ include "litellm.fullname" . }}-dbcredentials key: username - name: PGPASSWORD valueFrom: secretKeyRef: - name: {{ include "litellm.name" . }}-dbcredentials + name: {{ include "litellm.fullname" . }}-dbcredentials key: password - name: DATABASE_HOST value: {{ .Release.Name }}-postgresql @@ -108,12 +108,12 @@ spec: - name: DATABASE_USERNAME valueFrom: secretKeyRef: - name: {{ include "litellm.name" . }}-dbcredentials + name: {{ include "litellm.fullname" . }}-dbcredentials key: username - name: DATABASE_PASSWORD valueFrom: secretKeyRef: - name: {{ include "litellm.name" . }}-dbcredentials + name: {{ include "litellm.fullname" . 
}}-dbcredentials key: password - name: DATABASE_HOST value: {{ .Release.Name }}-postgresql @@ -140,7 +140,7 @@ spec: - name: PROXY_MASTER_KEY valueFrom: secretKeyRef: - name: {{ include "litellm.name" . }}-masterkey + name: {{ include "litellm.fullname" . }}-masterkey key: masterkey envFrom: {{- range .Values.environmentSecrets }} @@ -150,16 +150,7 @@ spec: args: - --config - /etc/litellm/config.yaml - # command: - # - bash - # - -c - # - | - # ls -la /etc/litellm/; cat /etc/litellm/config.yaml; export - # find / 2>/dev/null | grep -v -e '^/proc' -e '^/sys' -e '^/dev' >/tmp/before.list - # prisma generate - # find / 2>/dev/null | grep -v -e '^/proc' -e '^/sys' -e '^/dev' >/tmp/after.list - # diff -ruN /tmp/before.list /tmp/after.list - # sleep 3600 + - --run_gunicorn ports: - name: http containerPort: {{ .Values.service.port }} diff --git a/deploy/charts/litellm-helm/templates/hpa.yaml b/deploy/charts/litellm/templates/hpa.yaml similarity index 100% rename from deploy/charts/litellm-helm/templates/hpa.yaml rename to deploy/charts/litellm/templates/hpa.yaml diff --git a/deploy/charts/litellm-helm/templates/ingress-proxy.yaml b/deploy/charts/litellm/templates/ingress.yaml similarity index 96% rename from deploy/charts/litellm-helm/templates/ingress-proxy.yaml rename to deploy/charts/litellm/templates/ingress.yaml index 95bf83c99..09e8d715a 100644 --- a/deploy/charts/litellm-helm/templates/ingress-proxy.yaml +++ b/deploy/charts/litellm/templates/ingress.yaml @@ -1,5 +1,5 @@ {{- if .Values.ingress.enabled -}} -{{- $fullName := (printf "%s%s" (include "litellm.fullname" .) "-proxy") -}} +{{- $fullName := include "litellm.fullname" . 
-}} {{- $svcPort := .Values.service.port -}} {{- if and .Values.ingress.className (not (semverCompare ">=1.18-0" .Capabilities.KubeVersion.GitVersion)) }} {{- if not (hasKey .Values.ingress.annotations "kubernetes.io/ingress.class") }} diff --git a/deploy/charts/litellm-helm/templates/secret-dbcredentials.yaml b/deploy/charts/litellm/templates/secret-dbcredentials.yaml similarity index 87% rename from deploy/charts/litellm-helm/templates/secret-dbcredentials.yaml rename to deploy/charts/litellm/templates/secret-dbcredentials.yaml index fc688effb..8851f5802 100644 --- a/deploy/charts/litellm-helm/templates/secret-dbcredentials.yaml +++ b/deploy/charts/litellm/templates/secret-dbcredentials.yaml @@ -2,7 +2,7 @@ apiVersion: v1 kind: Secret metadata: - name: {{ include "litellm.name" . }}-dbcredentials + name: {{ include "litellm.fullname" . }}-dbcredentials data: # Password for the "postgres" user postgres-password: {{ ( index .Values.postgresql.auth "postgres-password") | default "litellm" | b64enc }} diff --git a/deploy/charts/litellm-helm/templates/secret-masterkey.yaml b/deploy/charts/litellm/templates/secret-masterkey.yaml similarity index 75% rename from deploy/charts/litellm-helm/templates/secret-masterkey.yaml rename to deploy/charts/litellm/templates/secret-masterkey.yaml index 8b22b476c..57b854cc0 100644 --- a/deploy/charts/litellm-helm/templates/secret-masterkey.yaml +++ b/deploy/charts/litellm/templates/secret-masterkey.yaml @@ -2,7 +2,7 @@ apiVersion: v1 kind: Secret metadata: - name: {{ include "litellm.name" . }}-masterkey + name: {{ include "litellm.fullname" . 
}}-masterkey data: masterkey: {{ $masterkey | b64enc }} type: Opaque \ No newline at end of file diff --git a/deploy/charts/litellm-helm/templates/service-proxy.yaml b/deploy/charts/litellm/templates/service.yaml similarity index 86% rename from deploy/charts/litellm-helm/templates/service-proxy.yaml rename to deploy/charts/litellm/templates/service.yaml index 3c3c744b5..40e7f27f1 100644 --- a/deploy/charts/litellm-helm/templates/service-proxy.yaml +++ b/deploy/charts/litellm/templates/service.yaml @@ -1,7 +1,7 @@ apiVersion: v1 kind: Service metadata: - name: {{ include "litellm.fullname" . }}-proxy + name: {{ include "litellm.fullname" . }} labels: {{- include "litellm.labels" . | nindent 4 }} spec: diff --git a/deploy/charts/litellm-helm/templates/serviceaccount.yaml b/deploy/charts/litellm/templates/serviceaccount.yaml similarity index 100% rename from deploy/charts/litellm-helm/templates/serviceaccount.yaml rename to deploy/charts/litellm/templates/serviceaccount.yaml diff --git a/deploy/charts/litellm-helm/templates/tests/test-connection.yaml b/deploy/charts/litellm/templates/tests/test-connection.yaml similarity index 92% rename from deploy/charts/litellm-helm/templates/tests/test-connection.yaml rename to deploy/charts/litellm/templates/tests/test-connection.yaml index 1f072069c..d2a4034b1 100644 --- a/deploy/charts/litellm-helm/templates/tests/test-connection.yaml +++ b/deploy/charts/litellm/templates/tests/test-connection.yaml @@ -11,5 +11,5 @@ spec: - name: wget image: busybox command: ['wget'] - args: ['{{ include "litellm.fullname" . }}:{{ .Values.service.port }}'] + args: ['{{ include "litellm.fullname" . 
}}:{{ .Values.service.port }}/health/readiness'] restartPolicy: Never diff --git a/deploy/charts/litellm-helm/values.yaml b/deploy/charts/litellm/values.yaml similarity index 80% rename from deploy/charts/litellm-helm/values.yaml rename to deploy/charts/litellm/values.yaml index 3c7131055..1b83fe801 100644 --- a/deploy/charts/litellm-helm/values.yaml +++ b/deploy/charts/litellm/values.yaml @@ -5,7 +5,9 @@ replicaCount: 1 image: - repository: ghcr.io/berriai/litellm + # Use "ghcr.io/berriai/litellm-database" for optimized image with database + # Alternatively, use "ghcr.io/berriai/litellm" for the default image + repository: ghcr.io/berriai/litellm-database pullPolicy: IfNotPresent # Overrides the image tag whose default is the chart appVersion. # tag: "main-latest" @@ -56,7 +58,7 @@ service: port: 8000 ingress: - enabled: true + enabled: false className: "nginx" annotations: {} # kubernetes.io/ingress.class: nginx @@ -71,6 +73,8 @@ ingress: # hosts: # - chart-example.local +# masterkey: changeit + # The elements within proxy_config are rendered as config.yaml for the proxy # Examples: https://github.com/BerriAI/litellm/tree/main/litellm/proxy/example_config_yaml # Reference: https://docs.litellm.ai/docs/proxy/configs @@ -159,61 +163,6 @@ postgresql: # A secret is created by this chart (litellm-helm) with the credentials that # the new Postgres instance should use. - existingSecret: litellm-dbcredentials - secretKeys: - userPasswordKey: password - -ui: - enabled: true - replicaCount: 1 - autoscaling: - enabled: false - image: - repository: ghcr.io/berriai/litellm-ui - pullPolicy: IfNotPresent - # Overrides the image tag whose default is the chart appVersion. 
- # tag: "main-latest" - # TODO: Switch to BerryAI repo and tags if/when they provide a ui image - # https://github.com/BerriAI/litellm/pull/1505 - tag: "" - - service: - type: ClusterIP - port: 8501 - - ingress: - enabled: true - className: "nginx" - annotations: {} - hosts: - - host: ui.example.local - paths: - - path: / - pathType: ImplementationSpecific - tls: [] - - podAnnotations: {} - podLabels: {} - - podSecurityContext: - fsGroup: 1000 - - securityContext: - capabilities: - drop: - - ALL - readOnlyRootFilesystem: true - runAsNonRoot: true - runAsUser: 1000 - - resources: {} - - volumes: [] - - volumeMounts: [] - - nodeSelector: {} - - tolerations: [] - - affinity: {} \ No newline at end of file + # existingSecret: "" + # secretKeys: + # userPasswordKey: password diff --git a/docs/my-website/docs/providers/gemini.md b/docs/my-website/docs/providers/gemini.md index 9d5eb298b..44d744866 100644 --- a/docs/my-website/docs/providers/gemini.md +++ b/docs/my-website/docs/providers/gemini.md @@ -16,6 +16,34 @@ response = completion( ) ``` +## Specifying Safety Settings +In certain use-cases you may need to make calls to the models and pass [safety settings](https://ai.google.dev/docs/safety_setting_gemini) different from the defaults. To do so, simply pass the `safety_settings` argument to `completion` or `acompletion`. 
For example: + +```python +response = completion( + model="gemini/gemini-pro", + messages=[{"role": "user", "content": "write code for saying hi from LiteLLM"}], + safety_settings=[ + { + "category": "HARM_CATEGORY_HARASSMENT", + "threshold": "BLOCK_NONE", + }, + { + "category": "HARM_CATEGORY_HATE_SPEECH", + "threshold": "BLOCK_NONE", + }, + { + "category": "HARM_CATEGORY_SEXUALLY_EXPLICIT", + "threshold": "BLOCK_NONE", + }, + { + "category": "HARM_CATEGORY_DANGEROUS_CONTENT", + "threshold": "BLOCK_NONE", + }, + ] +) +``` + # Gemini-Pro-Vision LiteLLM Supports the following image types passed in `url` - Images with direct links - https://storage.googleapis.com/github-repo/img/gemini/intro/landmark3.jpg diff --git a/docs/my-website/docs/proxy/configs.md b/docs/my-website/docs/proxy/configs.md index 786df59c2..e9fd4cda4 100644 --- a/docs/my-website/docs/proxy/configs.md +++ b/docs/my-website/docs/proxy/configs.md @@ -538,17 +538,13 @@ model_list: # will route requests to the least busy ollama model api_base: "http://127.0.0.1:8003" ``` -## Max Parallel Requests -To rate limit a user based on the number of parallel requests, e.g.: -if user's parallel requests > x, send a 429 error -if user's parallel requests <= x, let them use the API freely. - -set the max parallel request limit on the config.yaml (note: this expects the user to be passing in an api key). 
+## Configure DB Pool Limits + Connection Timeouts ```yaml -general_settings: - max_parallel_requests: 100 # max parallel requests for a user = 100 +general_settings: + database_connection_pool_limit: 100 # sets connection pool for prisma client to postgres db at 100 + database_connection_timeout: 60 # sets a 60s timeout for any connection call to the db ``` ## All settings @@ -577,6 +573,8 @@ general_settings: "key_management_system": "google_kms", # either google_kms or azure_kms "master_key": "string", "database_url": "string", + "database_connection_pool_limit": 0, # default 100 + "database_connection_timeout": 0, # default 60s "database_type": "dynamo_db", "database_args": { "billing_mode": "PROVISIONED_THROUGHPUT", diff --git a/docs/my-website/docs/proxy/deploy.md b/docs/my-website/docs/proxy/deploy.md index c3a84f1ea..7ad7d8387 100644 --- a/docs/my-website/docs/proxy/deploy.md +++ b/docs/my-website/docs/proxy/deploy.md @@ -151,10 +151,54 @@ kubectl port-forward service/litellm-service 4000:4000 Your OpenAI proxy server is now running on `http://0.0.0.0:4000`. + + + +### Step 1. Clone the repository + +```bash +git clone https://github.com/BerriAI/litellm.git +``` + +### Step 2. Deploy with Helm + +```bash +helm install \ + --set masterkey=SuPeRsEcReT \ + mydeploy \ + deploy/charts/litellm +``` + +### Step 3. Expose the service to localhost + +```bash +kubectl \ + port-forward \ + service/mydeploy-litellm \ + 8000:8000 +``` + +Your OpenAI proxy server is now running on `http://127.0.0.1:8000`. + -## Setting SSL Certification +## Advanced Deployment Settings + +### Customization of the server root path + +:::info + +In a Kubernetes deployment, it's possible to utilize a shared DNS to host multiple applications by modifying the virtual service + +::: + +Customize the root path to eliminate the need for employing multiple DNS configurations during deployment. 
+ +👉 Set `SERVER_ROOT_PATH` in your .env and this will be set as your server root path + + +### Setting SSL Certification Use this, If you need to set ssl certificates for your on prem litellm proxy diff --git a/docs/my-website/docs/proxy/pii_masking.md b/docs/my-website/docs/proxy/pii_masking.md index 348ce207d..dafb5876c 100644 --- a/docs/my-website/docs/proxy/pii_masking.md +++ b/docs/my-website/docs/proxy/pii_masking.md @@ -72,3 +72,78 @@ curl --location 'http://0.0.0.0:8000/key/generate' \ ``` +## Turn on/off per request + +The proxy supports 2 request-level PII controls: + +- *no-pii*: Optional(bool) - Allow user to turn off pii masking per request. +- *output_parse_pii*: Optional(bool) - Allow user to turn off pii output parsing per request. + +### Usage + +**Step 1. Create key with pii permissions** + +Set `allow_pii_controls` to true for a given key. This will allow the user to set request-level PII controls. + +```bash +curl --location 'http://0.0.0.0:8000/key/generate' \ +--header 'Authorization: Bearer my-master-key' \ +--header 'Content-Type: application/json' \ +--data '{ + "permissions": {"allow_pii_controls": true} +}' +``` + +**Step 2. 
Turn off pii output parsing** + +```python +import os +from openai import OpenAI + +client = OpenAI( + # This is the default and can be omitted + api_key=os.environ.get("OPENAI_API_KEY"), + base_url="http://0.0.0.0:8000" +) + +chat_completion = client.chat.completions.create( + messages=[ + { + "role": "user", + "content": "My name is Jane Doe, my number is 8382043839", + } + ], + model="gpt-3.5-turbo", + extra_body={ + "content_safety": {"output_parse_pii": False} + } +) +``` + +**Step 3: See response** + +``` +{ + "id": "chatcmpl-8c5qbGTILZa1S4CK3b31yj5N40hFN", + "choices": [ + { + "finish_reason": "stop", + "index": 0, + "message": { + "content": "Hi [PERSON], what can I help you with?", + "role": "assistant" + } + } + ], + "created": 1704089632, + "model": "gpt-35-turbo", + "object": "chat.completion", + "system_fingerprint": null, + "usage": { + "completion_tokens": 47, + "prompt_tokens": 12, + "total_tokens": 59 + }, + "_response_ms": 1753.426 +} +``` \ No newline at end of file diff --git a/docs/my-website/docs/proxy/virtual_keys.md b/docs/my-website/docs/proxy/virtual_keys.md index 2be4b95c1..83994701c 100644 --- a/docs/my-website/docs/proxy/virtual_keys.md +++ b/docs/my-website/docs/proxy/virtual_keys.md @@ -93,6 +93,7 @@ Request Params: - `config`: *Optional[dict]* - any key-specific configs, overrides config in config.yaml - `spend`: *Optional[int]* - Amount spent by key. Default is 0. Will be updated by proxy whenever key is used. https://docs.litellm.ai/docs/proxy/virtual_keys#managing-auth---tracking-spend - `max_budget`: *Optional[float]* - Specify max budget for a given key. +- `model_max_budget`: *Optional[dict[str, float]]* - Specify max budget for each model, `model_max_budget={"gpt4": 0.5, "gpt-5": 0.01}` - `max_parallel_requests`: *Optional[int]* - Rate limit a user based on the number of parallel requests. Raises 429 error, if user's parallel requests > x. - `metadata`: *Optional[dict]* - Metadata for key, store information for key. 
Example metadata = {"team": "core-infra", "app": "app2", "email": "ishaan@berri.ai" } @@ -676,8 +677,6 @@ general_settings: ### [BETA] Dynamo DB -Only live in `v1.16.21.dev1`. - #### Step 1. Save keys to env ```shell diff --git a/docs/my-website/sidebars.js b/docs/my-website/sidebars.js index 83b409969..3badfc53a 100644 --- a/docs/my-website/sidebars.js +++ b/docs/my-website/sidebars.js @@ -129,7 +129,7 @@ const sidebars = { "proxy/caching", { "type": "category", - "label": "Logging, Alerting, Caching", + "label": "Logging, Alerting", "items": [ "proxy/logging", "proxy/alerting", diff --git a/enterprise/README.md b/enterprise/README.md index 483ee1e44..d5c27bab6 100644 --- a/enterprise/README.md +++ b/enterprise/README.md @@ -6,9 +6,4 @@ Code in this folder is licensed under a commercial license. Please review the [L 👉 **Using in an Enterprise / Need specific features ?** Meet with us [here](https://calendly.com/d/4mp-gd3-k5k/litellm-1-1-onboarding-chat?month=2024-02) -## Enterprise Features: - -- Track, View spend per tag https://docs.litellm.ai/docs/proxy/spend -- Custom API / microservice callbacks -- Google Text Moderation API - +See all Enterprise Features here 👉 [Docs](https://docs.litellm.ai/docs/proxy/enterprise) diff --git a/enterprise/enterprise_hooks/llama_guard.py b/enterprise/enterprise_hooks/llama_guard.py index 4d2139cd2..16eb3dcd1 100644 --- a/enterprise/enterprise_hooks/llama_guard.py +++ b/enterprise/enterprise_hooks/llama_guard.py @@ -110,7 +110,6 @@ class _ENTERPRISE_LlamaGuard(CustomLogger): -1 ] # get the last response - llama guard has a 4k token limit self.set_custom_prompt_template(messages=[safety_check_messages]) - # print(f"self.model: {self.model}") response = await litellm.acompletion( model=self.model, messages=[safety_check_messages], diff --git a/litellm/llms/gemini.py b/litellm/llms/gemini.py index 7e98345b3..2db27aeba 100644 --- a/litellm/llms/gemini.py +++ b/litellm/llms/gemini.py @@ -121,6 +121,13 @@ def completion( ## Load 
Config inference_params = copy.deepcopy(optional_params) stream = inference_params.pop("stream", None) + + # Handle safety settings + safety_settings_param = inference_params.pop("safety_settings", None) + safety_settings = None + if safety_settings_param: + safety_settings = [genai.types.SafetySettingDict(x) for x in safety_settings_param] + config = litellm.GeminiConfig.get_config() for k, v in config.items(): if ( @@ -141,11 +148,13 @@ def completion( response = _model.generate_content( contents=prompt, generation_config=genai.types.GenerationConfig(**inference_params), + safety_settings=safety_settings, ) else: response = _model.generate_content( contents=prompt, generation_config=genai.types.GenerationConfig(**inference_params), + safety_settings=safety_settings, stream=True, ) return response diff --git a/litellm/proxy/_experimental/out/404.html b/litellm/proxy/_experimental/out/404.html index 03563194a..0a15886c7 100644 --- a/litellm/proxy/_experimental/out/404.html +++ b/litellm/proxy/_experimental/out/404.html @@ -1 +1 @@ -404: This page could not be found.🚅 LiteLLM

404

This page could not be found.

\ No newline at end of file +404: This page could not be found.🚅 LiteLLM

404

This page could not be found.

\ No newline at end of file diff --git a/litellm/proxy/_experimental/out/_next/static/unBuvDqydg0yodtP5c3nQ/_buildManifest.js b/litellm/proxy/_experimental/out/_next/static/S_8LZOnl2nyURq-NYnh2p/_buildManifest.js similarity index 100% rename from litellm/proxy/_experimental/out/_next/static/unBuvDqydg0yodtP5c3nQ/_buildManifest.js rename to litellm/proxy/_experimental/out/_next/static/S_8LZOnl2nyURq-NYnh2p/_buildManifest.js diff --git a/litellm/proxy/_experimental/out/_next/static/unBuvDqydg0yodtP5c3nQ/_ssgManifest.js b/litellm/proxy/_experimental/out/_next/static/S_8LZOnl2nyURq-NYnh2p/_ssgManifest.js similarity index 100% rename from litellm/proxy/_experimental/out/_next/static/unBuvDqydg0yodtP5c3nQ/_ssgManifest.js rename to litellm/proxy/_experimental/out/_next/static/S_8LZOnl2nyURq-NYnh2p/_ssgManifest.js diff --git a/litellm/proxy/_experimental/out/_next/static/chunks/app/page-2322bcdc2ec71284.js b/litellm/proxy/_experimental/out/_next/static/chunks/app/page-2322bcdc2ec71284.js new file mode 100644 index 000000000..740eb87a2 --- /dev/null +++ b/litellm/proxy/_experimental/out/_next/static/chunks/app/page-2322bcdc2ec71284.js @@ -0,0 +1 @@ +(self.webpackChunk_N_E=self.webpackChunk_N_E||[]).push([[931],{20661:function(e,t,n){Promise.resolve().then(n.bind(n,48016))},48016:function(e,t,n){"use strict";n.r(t),n.d(t,{default:function(){return ec}});var s=n(3827),l=n(64090),r=n(47907),a=n(8792),o=n(2179),i=e=>{let{userID:t,userRole:n,userEmail:l}=e;return console.log("User ID:",t),console.log("userEmail:",l),(0,s.jsxs)("nav",{className:"left-0 right-0 top-0 flex justify-between items-center h-12 mb-4",children:[(0,s.jsx)("div",{className:"text-left mx-4 my-2 absolute top-0 left-0",children:(0,s.jsx)("div",{className:"flex flex-col items-center",children:(0,s.jsx)(a.default,{href:"/",children:(0,s.jsx)("button",{className:"text-gray-800 text-2xl px-4 py-1 rounded text-center",children:"\uD83D\uDE85 LiteLLM"})})})}),(0,s.jsx)("div",{className:"text-right mx-4 my-2 absolute 
top-0 right-0",children:(0,s.jsxs)(o.Z,{variant:"secondary",children:[l,(0,s.jsxs)("p",{children:["Role: ",n]}),(0,s.jsxs)("p",{children:["ID: ",t]})]})})]})},c=n(80588);let d=async(e,t,n)=>{try{if(console.log("Form Values in keyCreateCall:",n),n.description&&(n.metadata||(n.metadata={}),n.metadata.description=n.description,delete n.description,n.metadata=JSON.stringify(n.metadata)),n.metadata){console.log("formValues.metadata:",n.metadata);try{n.metadata=JSON.parse(n.metadata)}catch(e){throw c.ZP.error("Failed to parse metadata: "+e),Error("Failed to parse metadata: "+e)}}console.log("Form Values after check:",n);let s=await fetch("/key/generate",{method:"POST",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"},body:JSON.stringify({user_id:t,...n})});if(!s.ok){let e=await s.text();throw c.ZP.error("Failed to create key: "+e),console.error("Error response from the server:",e),Error("Network response was not ok")}let l=await s.json();return console.log("API Response:",l),l}catch(e){throw console.error("Failed to create key:",e),e}},m=async(e,t)=>{try{console.log("in keyDeleteCall:",t),c.ZP.info("Making key delete request");let n=await fetch("/key/delete",{method:"POST",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"},body:JSON.stringify({keys:[t]})});if(!n.ok){let e=await n.text();throw c.ZP.error("Failed to delete key: "+e),Error("Network response was not ok")}let s=await n.json();return console.log(s),c.ZP.success("API Key Deleted"),s}catch(e){throw console.error("Failed to create key:",e),e}},h=async(e,t,n)=>{try{let s="/user/info";"App Owner"==n&&(s="".concat(s,"/?user_id=").concat(t)),c.ZP.info("Requesting user data");let l=await fetch(s,{method:"GET",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"}});if(!l.ok){let e=await l.text();throw c.ZP.error(e),Error("Network response was not ok")}let r=await l.json();return c.ZP.info("Received user data"),r}catch(e){throw 
console.error("Failed to create key:",e),e}},u=async(e,t,n)=>{try{c.ZP.info("Requesting model data");let t=await fetch("/model/info",{method:"GET",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"}});if(!t.ok){let e=await t.text();throw c.ZP.error(e),Error("Network response was not ok")}let n=await t.json();return c.ZP.info("Received model data"),n}catch(e){throw console.error("Failed to create key:",e),e}},x=async(e,t)=>{try{let n="/spend/logs";console.log("in keySpendLogsCall:",n);let s=await fetch("".concat(n,"/?api_key=").concat(t),{method:"GET",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"}});if(!s.ok){let e=await s.text();throw c.ZP.error(e),Error("Network response was not ok")}let l=await s.json();return console.log(l),l}catch(e){throw console.error("Failed to create key:",e),e}},p=async(e,t,n,s,l,r)=>{try{let t="/spend/logs";t="App Owner"==n?"".concat(t,"/?user_id=").concat(s,"&start_date=").concat(l,"&end_date=").concat(r):"".concat(t,"/?start_date=").concat(l,"&end_date=").concat(r),c.ZP.info("Making spend logs request");let a=await fetch(t,{method:"GET",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"}});if(!a.ok){let e=await a.text();throw c.ZP.error(e),Error("Network response was not ok")}let o=await a.json();return console.log(o),c.ZP.success("Spend Logs received"),o}catch(e){throw console.error("Failed to create key:",e),e}},j=async(e,t)=>{try{let n=await fetch("/v2/key/info",{method:"POST",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"},body:JSON.stringify({keys:t})});if(!n.ok){let e=await n.text();throw c.ZP.error(e),Error("Network response was not ok")}let s=await n.json();return console.log(s),s}catch(e){throw console.error("Failed to create key:",e),e}},g=async(e,t)=>{try{let n="/spend/users";console.log("in spendUsersCall:",n);let s=await fetch("".concat(n,"/?user_id=").concat(t),{method:"GET",headers:{Authorization:"Bearer 
".concat(e),"Content-Type":"application/json"}});if(!s.ok){let e=await s.text();throw c.ZP.error(e),Error("Network response was not ok")}let l=await s.json();return console.log(l),l}catch(e){throw console.error("Failed to get spend for user",e),e}};var y=n(10384),f=n(46453),Z=n(71801),w=n(13969),k=n(12143),_=n(77171),v=n(29714),b=n(88707),S=n(1861);let{Option:N}=w.default;var I=e=>{let{userID:t,userRole:n,accessToken:r,data:a,userModels:i,setData:m}=e,[h]=k.Z.useForm(),[u,x]=(0,l.useState)(!1),[p,j]=(0,l.useState)(null),g=()=>{x(!1),h.resetFields()},I=()=>{x(!1),j(null),h.resetFields()},A=async e=>{try{c.ZP.info("Making API Call"),x(!0);let n=await d(r,t,e);m(e=>e?[...e,n]:[n]),j(n.key),c.ZP.success("API Key Created"),h.resetFields(),localStorage.removeItem("userData"+t)}catch(e){console.error("Error creating the key:",e)}};return(0,s.jsxs)("div",{children:[(0,s.jsx)(o.Z,{className:"mx-auto",onClick:()=>x(!0),children:"+ Create New Key"}),(0,s.jsx)(_.Z,{title:"Create Key",visible:u,width:800,footer:null,onOk:g,onCancel:I,children:(0,s.jsxs)(k.Z,{form:h,onFinish:A,labelCol:{span:6},wrapperCol:{span:16},labelAlign:"left",children:["App Owner"===n||"Admin"===n?(0,s.jsxs)(s.Fragment,{children:[(0,s.jsx)(k.Z.Item,{label:"Key Name",name:"key_alias",children:(0,s.jsx)(v.Z,{})}),(0,s.jsx)(k.Z.Item,{label:"Team ID",name:"team_id",children:(0,s.jsx)(v.Z,{placeholder:"ai_team"})}),(0,s.jsx)(k.Z.Item,{label:"Models",name:"models",children:(0,s.jsx)(w.default,{mode:"multiple",placeholder:"Select models",style:{width:"100%"},children:i.map(e=>(0,s.jsx)(N,{value:e,children:e},e))})}),(0,s.jsx)(k.Z.Item,{label:"Max Budget (USD)",name:"max_budget",children:(0,s.jsx)(b.Z,{step:.01,precision:2,width:200})}),(0,s.jsx)(k.Z.Item,{label:"Duration (eg: 30s, 30h, 30d)",name:"duration",children:(0,s.jsx)(v.Z,{})}),(0,s.jsx)(k.Z.Item,{label:"Metadata",name:"metadata",children:(0,s.jsx)(v.Z.TextArea,{rows:4,placeholder:"Enter metadata as 
JSON"})})]}):(0,s.jsxs)(s.Fragment,{children:[(0,s.jsx)(k.Z.Item,{label:"Key Name",name:"key_alias",children:(0,s.jsx)(v.Z,{})}),(0,s.jsx)(k.Z.Item,{label:"Team ID (Contact Group)",name:"team_id",children:(0,s.jsx)(v.Z,{placeholder:"ai_team"})}),(0,s.jsx)(k.Z.Item,{label:"Description",name:"description",children:(0,s.jsx)(v.Z.TextArea,{placeholder:"Enter description",rows:4})})]}),(0,s.jsx)("div",{style:{textAlign:"right",marginTop:"10px"},children:(0,s.jsx)(S.ZP,{htmlType:"submit",children:"Create Key"})})]})}),p&&(0,s.jsx)(_.Z,{title:"Save your key",visible:u,onOk:g,onCancel:I,footer:null,children:(0,s.jsxs)(f.Z,{numItems:1,className:"gap-2 w-full",children:[(0,s.jsx)(y.Z,{numColSpan:1,children:(0,s.jsxs)("p",{children:["Please save this secret key somewhere safe and accessible. For security reasons, ",(0,s.jsx)("b",{children:"you will not be able to view it again"})," ","through your LiteLLM account. If you lose this secret key, you will need to generate a new one."]})}),(0,s.jsx)(y.Z,{numColSpan:1,children:null!=p?(0,s.jsxs)(Z.Z,{children:["API Key: ",p]}):(0,s.jsx)(Z.Z,{children:"Key being created, this might take 30s"})})]})})]})},A=n(33393),C=n(13810),D=n(61244),T=n(10827),P=n(3851),E=n(2044),O=n(64167),R=n(74480),M=n(7178),U=n(42440),F=n(9853),L=n(67989),K=n(56863),z=e=>{let{token:t,accessToken:n,keySpend:r,keyBudget:a,keyName:i}=e,[c,d]=(0,l.useState)(!1),[m,h]=(0,l.useState)(null),[u,p]=(0,l.useState)(null),j=async()=>{try{if(null==n||null==t)return;console.log("accessToken: ".concat(n,"; token: ").concat(t));let e=await x(n,t);console.log("Response:",e);let s=Object.values(e).reduce((e,t)=>{let n=new Date(t.startTime),s=new Intl.DateTimeFormat("en-US",{day:"2-digit",month:"short"}).format(n);return e[s]=(e[s]||0)+t.spend,e},{}),l=Object.entries(s);l.sort((e,t)=>{let[n]=e,[s]=t,l=new Date(n),r=new Date(s);return l.getTime()-r.getTime()});let r=Object.fromEntries(l);console.log(r);let a=Object.values(e).reduce((e,t)=>{let n=t.user;return 
e[n]=(e[n]||0)+t.spend,e},{});console.log(s),console.log(a);let o=[];for(let[e,t]of Object.entries(r))o.push({day:e,spend:t});let i=Object.entries(a).sort((e,t)=>t[1]-e[1]).slice(0,5).map(e=>{let[t,n]=e;return{name:t,value:n}});h(o),p(i),console.log("arrayBarChart:",o)}catch(e){console.error("There was an error fetching the data",e)}};return t?(0,s.jsxs)("div",{children:[(0,s.jsx)(o.Z,{className:"mx-auto",onClick:()=>{console.log("Show Modal triggered"),d(!0),j()},children:"View Spend Report"}),(0,s.jsxs)(_.Z,{visible:c,width:1e3,onOk:()=>{d(!1)},onCancel:()=>{d(!1)},footer:null,children:[(0,s.jsxs)(U.Z,{style:{textAlign:"left"},children:["Key Name: ",i]}),(0,s.jsxs)(K.Z,{children:["Monthly Spend $",r]}),(0,s.jsx)(C.Z,{className:"mt-6 mb-6",children:m&&(0,s.jsx)(F.Z,{className:"mt-6",data:m,colors:["green"],index:"day",categories:["spend"],yAxisWidth:48})}),(0,s.jsx)(U.Z,{className:"mt-6",children:"Top 5 Users Spend (USD)"}),(0,s.jsx)(C.Z,{className:"mb-6",children:u&&(0,s.jsx)(L.Z,{className:"mt-6",data:u,color:"teal"})})]})]}):null},B=e=>{let{userID:t,accessToken:n,data:r,setData:a}=e,[i,c]=(0,l.useState)(!1),[d,h]=(0,l.useState)(!1),[u,x]=(0,l.useState)(null),p=async e=>{null!=r&&(x(e),localStorage.removeItem("userData"+t),h(!0))},j=async()=>{if(null!=u&&null!=r){try{await m(n,u);let e=r.filter(e=>e.token!==u);a(e)}catch(e){console.error("Error deleting the key:",e)}h(!1),x(null)}};if(null!=r)return console.log("RERENDER TRIGGERED"),(0,s.jsxs)(C.Z,{className:"w-full mx-auto flex-auto overflow-y-auto max-h-[50vh] mb-4",children:[(0,s.jsx)(U.Z,{children:"API Keys"}),(0,s.jsxs)(T.Z,{className:"mt-5",children:[(0,s.jsx)(O.Z,{children:(0,s.jsxs)(M.Z,{children:[(0,s.jsx)(R.Z,{children:"Key Alias"}),(0,s.jsx)(R.Z,{children:"Secret Key"}),(0,s.jsx)(R.Z,{children:"Spend (USD)"}),(0,s.jsx)(R.Z,{children:"Key Budget (USD)"}),(0,s.jsx)(R.Z,{children:"Team ID"}),(0,s.jsx)(R.Z,{children:"Metadata"}),(0,s.jsx)(R.Z,{children:"Models"}),(0,s.jsx)(R.Z,{children:"TPM / RPM 
Limits"}),(0,s.jsx)(R.Z,{children:"Expires"})]})}),(0,s.jsx)(P.Z,{children:r.map(e=>(console.log(e),"litellm-dashboard"===e.team_id)?null:(0,s.jsxs)(M.Z,{children:[(0,s.jsx)(E.Z,{children:null!=e.key_alias?(0,s.jsx)(Z.Z,{children:e.key_alias}):(0,s.jsx)(Z.Z,{children:"Not Set"})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(Z.Z,{children:e.key_name})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(Z.Z,{children:e.spend})}),(0,s.jsx)(E.Z,{children:null!=e.max_budget?(0,s.jsx)(Z.Z,{children:e.max_budget}):(0,s.jsx)(Z.Z,{children:"Unlimited Budget"})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(Z.Z,{children:e.team_id})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(Z.Z,{children:JSON.stringify(e.metadata)})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(Z.Z,{children:JSON.stringify(e.models)})}),(0,s.jsx)(E.Z,{children:(0,s.jsxs)(Z.Z,{children:["TPM Limit: ",e.tpm_limit?e.tpm_limit:"Unlimited"," ",(0,s.jsx)("br",{})," RPM Limit:"," ",e.rpm_limit?e.rpm_limit:"Unlimited"]})}),(0,s.jsx)(E.Z,{children:null!=e.expires?(0,s.jsx)(Z.Z,{children:e.expires}):(0,s.jsx)(Z.Z,{children:"Never expires"})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(D.Z,{onClick:()=>p(e.token),icon:A.Z,size:"sm"})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(z,{token:e.token,accessToken:n,keySpend:e.spend,keyBudget:e.max_budget,keyName:e.key_name})})]},e.token))})]}),d&&(0,s.jsx)("div",{className:"fixed z-10 inset-0 overflow-y-auto",children:(0,s.jsxs)("div",{className:"flex items-end justify-center min-h-screen pt-4 px-4 pb-20 text-center sm:block sm:p-0",children:[(0,s.jsx)("div",{className:"fixed inset-0 transition-opacity","aria-hidden":"true",children:(0,s.jsx)("div",{className:"absolute inset-0 bg-gray-500 opacity-75"})}),(0,s.jsx)("span",{className:"hidden sm:inline-block sm:align-middle sm:h-screen","aria-hidden":"true",children:"​"}),(0,s.jsxs)("div",{className:"inline-block align-bottom bg-white rounded-lg text-left overflow-hidden shadow-xl transform transition-all sm:my-8 sm:align-middle sm:max-w-lg sm:w-full",children:[(0,s.jsx)("div",{className:"bg-white 
px-4 pt-5 pb-4 sm:p-6 sm:pb-4",children:(0,s.jsx)("div",{className:"sm:flex sm:items-start",children:(0,s.jsxs)("div",{className:"mt-3 text-center sm:mt-0 sm:ml-4 sm:text-left",children:[(0,s.jsx)("h3",{className:"text-lg leading-6 font-medium text-gray-900",children:"Delete Key"}),(0,s.jsx)("div",{className:"mt-2",children:(0,s.jsx)("p",{className:"text-sm text-gray-500",children:"Are you sure you want to delete this key ?"})})]})})}),(0,s.jsxs)("div",{className:"bg-gray-50 px-4 py-3 sm:px-6 sm:flex sm:flex-row-reverse",children:[(0,s.jsx)(o.Z,{onClick:j,color:"red",className:"ml-2",children:"Delete"}),(0,s.jsx)(o.Z,{onClick:()=>{h(!1),x(null)},children:"Cancel"})]})]})]})})]})},J=e=>{let{userID:t,userSpendData:n,userRole:r,accessToken:a}=e;console.log("User SpendData:",n);let[o,i]=(0,l.useState)(null==n?void 0:n.spend),[c,d]=(0,l.useState)((null==n?void 0:n.max_budget)||null);return(0,l.useEffect)(()=>{(async()=>{if("Admin"===r)try{let e=await g(a,"litellm-proxy-budget");console.log("Result from callSpendUsers:",e);let t=e[0];i(null==t?void 0:t.spend),d((null==t?void 0:t.max_budget)||null)}catch(e){console.error("Failed to get spend for user",e)}})()},[r,a,t]),(0,s.jsx)(s.Fragment,{children:(0,s.jsxs)(C.Z,{className:"mx-auto mb-4",children:[(0,s.jsxs)(K.Z,{children:["$",o]}),(0,s.jsxs)(U.Z,{children:["/ ",null!==c?"$".concat(c," limit"):"No limit"]})]})})},q=n(37963);console.log("isLocal:",!1);var G=e=>{let{userID:t,userRole:n,setUserRole:a,userEmail:o,setUserEmail:i}=e,[c,d]=(0,l.useState)(null),[m,x]=(0,l.useState)(null),p=(0,r.useSearchParams)();p.get("viewSpend"),(0,r.useRouter)();let j=p.get("token"),[g,Z]=(0,l.useState)(null),[w,k]=(0,l.useState)([]);if(window.addEventListener("beforeunload",function(){sessionStorage.clear()}),(0,l.useEffect)(()=>{if(j){let e=(0,q.o)(j);if(e){if(console.log("Decoded token:",e),console.log("Decoded key:",e.key),Z(e.key),e.user_role){let t=function(e){if(!e)return"Undefined Role";switch(console.log("Received user role: 
".concat(e)),e.toLowerCase()){case"app_owner":case"demo_app_owner":return"App Owner";case"app_admin":return"Admin";case"app_user":return"App User";default:return"Unknown Role"}}(e.user_role);console.log("Decoded user_role:",t),a(t)}else console.log("User role not defined");e.user_email?i(e.user_email):console.log("User Email is not set ".concat(e))}}if(t&&g&&n&&!c){let e=sessionStorage.getItem("userData"+t),s=sessionStorage.getItem("userSpendData"+t),l=sessionStorage.getItem("userModels"+t);e&&s&&l?(d(JSON.parse(e)),x(JSON.parse(s)),k(JSON.parse(l))):(async()=>{try{let e=await h(g,t,n);x(e.user_info),d(e.keys),sessionStorage.setItem("userData"+t,JSON.stringify(e.keys)),sessionStorage.setItem("userSpendData"+t,JSON.stringify(e.user_info));let s=await u(g,t,n);console.log("model_info:",s);let l=s.data.map(e=>e.model_name);console.log("available_model_names:",l),k(l),console.log("userModels:",w),sessionStorage.setItem("userModels"+t,JSON.stringify(l))}catch(e){console.error("There was an error fetching the data",e)}})()}},[t,j,g,c,n]),null==t||null==j){let e="/sso/key/generate";return console.log("Full URL:",e),window.location.href=e,null}return null==g?null:(null==n&&a("App Owner"),(0,s.jsx)("div",{children:(0,s.jsx)(f.Z,{numItems:1,className:"gap-0 p-10 h-[75vh] w-full",children:(0,s.jsxs)(y.Z,{numColSpan:1,children:[(0,s.jsx)(J,{userID:t,userSpendData:m,userRole:n,accessToken:g}),(0,s.jsx)(B,{userID:t,accessToken:g,data:c,setData:d}),(0,s.jsx)(I,{userID:t,userRole:n,userModels:w,accessToken:g,data:c,setData:d})]})})}))},$=e=>{let{accessToken:t,token:n,userRole:r,userID:a}=e,[o,i]=(0,l.useState)({data:[]});if((0,l.useEffect)(()=>{if(!t||!n||!r||!a)return;let e=async()=>{try{let e=await u(t,a,r);console.log("Model data response:",e.data),i(e)}catch(e){console.error("There was an error fetching the model data",e)}};t&&n&&r&&a&&e()},[t,n,r,a]),!o)return(0,s.jsx)("div",{children:"Loading..."});for(let 
e=0;e(0,s.jsxs)(M.Z,{children:[(0,s.jsx)(E.Z,{children:(0,s.jsx)(U.Z,{children:e.model_name})}),(0,s.jsx)(E.Z,{children:e.provider}),(0,s.jsx)(E.Z,{children:e.input_cost}),(0,s.jsx)(E.Z,{children:e.output_cost}),(0,s.jsx)(E.Z,{children:e.max_tokens})]},e.model_name))})]})})})})},V=n(92836),W=n(26734),H=n(41608),Y=n(32126),X=n(23682),Q=n(12968),ee=n(67951);async function et(e,t,n,s){console.log("isLocal:",!1);let l=window.location.origin,r=new Q.ZP.OpenAI({apiKey:s,baseURL:l,dangerouslyAllowBrowser:!0});for await(let s of(await r.chat.completions.create({model:n,stream:!0,messages:[{role:"user",content:e}]})))console.log(s),s.choices[0].delta.content&&t(s.choices[0].delta.content)}var en=e=>{let{accessToken:t,token:n,userRole:r,userID:a}=e,[o,i]=(0,l.useState)(""),[c,d]=(0,l.useState)([]),[m,h]=(0,l.useState)(void 0),[x,p]=(0,l.useState)(null);(0,l.useEffect)(()=>{t&&n&&r&&a&&(async()=>{let e=await u(t,a,r);console.log("model_info:",e),(null==e?void 0:e.data.length)>0&&(p(e),h(e.data[0].model_name))})()},[t,a,r]);let j=(e,t)=>{d(n=>{let s=n[n.length-1];return s&&s.role===e?[...n.slice(0,n.length-1),{role:e,content:s.content+t}]:[...n,{role:e,content:t}]})},g=async()=>{if(""!==o.trim()&&t&&n&&r&&a){d(e=>[...e,{role:"user",content:o}]);try{m&&await et(o,e=>j("assistant",e),m,t)}catch(e){console.error("Error fetching model response",e),j("assistant","Error fetching model response")}i("")}};return(0,s.jsx)("div",{style:{width:"100%",position:"relative"},children:(0,s.jsx)(f.Z,{className:"gap-2 p-10 h-[75vh] w-full",children:(0,s.jsx)(C.Z,{children:(0,s.jsxs)(W.Z,{children:[(0,s.jsxs)(H.Z,{className:"mt-4",children:[(0,s.jsx)(V.Z,{children:"Chat"}),(0,s.jsx)(V.Z,{children:"API Reference"})]}),(0,s.jsxs)(X.Z,{children:[(0,s.jsxs)(Y.Z,{children:[(0,s.jsxs)("div",{children:[(0,s.jsx)("label",{children:"Select Model:"}),(0,s.jsx)("select",{value:m||"",onChange:e=>h(e.target.value),children:null==x?void 
0:x.data.map(e=>(0,s.jsx)("option",{value:e.model_name,children:e.model_name},e.model_name))})]}),(0,s.jsxs)(T.Z,{className:"mt-5",style:{display:"block",maxHeight:"60vh",overflowY:"auto"},children:[(0,s.jsx)(O.Z,{children:(0,s.jsx)(M.Z,{children:(0,s.jsx)(E.Z,{children:(0,s.jsx)(U.Z,{children:"Chat"})})})}),(0,s.jsx)(P.Z,{children:c.map((e,t)=>(0,s.jsx)(M.Z,{children:(0,s.jsx)(E.Z,{children:"".concat(e.role,": ").concat(e.content)})},t))})]}),(0,s.jsx)("div",{className:"mt-3",style:{position:"absolute",bottom:5,width:"95%"},children:(0,s.jsxs)("div",{className:"flex",children:[(0,s.jsx)("input",{type:"text",value:o,onChange:e=>i(e.target.value),className:"flex-1 p-2 border rounded-md mr-2",placeholder:"Type your message..."}),(0,s.jsx)("button",{onClick:g,className:"p-2 bg-blue-500 text-white rounded-md",children:"Send"})]})})]}),(0,s.jsx)(Y.Z,{children:(0,s.jsxs)(W.Z,{children:[(0,s.jsxs)(H.Z,{children:[(0,s.jsx)(V.Z,{children:"OpenAI Python SDK"}),(0,s.jsx)(V.Z,{children:"LlamaIndex"}),(0,s.jsx)(V.Z,{children:"Langchain Py"})]}),(0,s.jsxs)(X.Z,{children:[(0,s.jsx)(Y.Z,{children:(0,s.jsx)(ee.Z,{language:"python",children:'\nimport openai\nclient = openai.OpenAI(\n api_key="your_api_key",\n base_url="http://0.0.0.0:4000" # proxy base url\n)\n\nresponse = client.chat.completions.create(\n model="gpt-3.5-turbo", # model to use from Models Tab\n messages = [\n {\n "role": "user",\n "content": "this is a test request, write a short poem"\n }\n ],\n extra_body={\n "metadata": {\n "generation_name": "ishaan-generation-openai-client",\n "generation_id": "openai-client-gen-id22",\n "trace_id": "openai-client-trace-id22",\n "trace_user_id": "openai-client-user-id2"\n }\n }\n)\n\nprint(response)\n '})}),(0,s.jsx)(Y.Z,{children:(0,s.jsx)(ee.Z,{language:"python",children:'\nimport os, dotenv\n\nfrom llama_index.llms import AzureOpenAI\nfrom llama_index.embeddings import AzureOpenAIEmbedding\nfrom llama_index import VectorStoreIndex, SimpleDirectoryReader, 
ServiceContext\n\nllm = AzureOpenAI(\n engine="azure-gpt-3.5", # model_name on litellm proxy\n temperature=0.0,\n azure_endpoint="http://0.0.0.0:4000", # litellm proxy endpoint\n api_key="sk-1234", # litellm proxy API Key\n api_version="2023-07-01-preview",\n)\n\nembed_model = AzureOpenAIEmbedding(\n deployment_name="azure-embedding-model",\n azure_endpoint="http://0.0.0.0:4000",\n api_key="sk-1234",\n api_version="2023-07-01-preview",\n)\n\n\ndocuments = SimpleDirectoryReader("llama_index_data").load_data()\nservice_context = ServiceContext.from_defaults(llm=llm, embed_model=embed_model)\nindex = VectorStoreIndex.from_documents(documents, service_context=service_context)\n\nquery_engine = index.as_query_engine()\nresponse = query_engine.query("What did the author do growing up?")\nprint(response)\n\n '})}),(0,s.jsx)(Y.Z,{children:(0,s.jsx)(ee.Z,{language:"python",children:'\nfrom langchain.chat_models import ChatOpenAI\nfrom langchain.prompts.chat import (\n ChatPromptTemplate,\n HumanMessagePromptTemplate,\n SystemMessagePromptTemplate,\n)\nfrom langchain.schema import HumanMessage, SystemMessage\n\nchat = ChatOpenAI(\n openai_api_base="http://0.0.0.0:8000",\n model = "gpt-3.5-turbo",\n temperature=0.1,\n extra_body={\n "metadata": {\n "generation_name": "ishaan-generation-langchain-client",\n "generation_id": "langchain-client-gen-id22",\n "trace_id": "langchain-client-trace-id22",\n "trace_user_id": "langchain-client-user-id2"\n }\n }\n)\n\nmessages = [\n SystemMessage(\n content="You are a helpful assistant that im using to make a test request to."\n ),\n HumanMessage(\n content="test from litellm. 
tell me why it\'s amazing in 1 sentence"\n ),\n]\nresponse = chat(messages)\n\nprint(response)\n\n '})})]})]})})]})]})})})})},es=n(33509),el=n(30569);let{Sider:er}=es.default;var ea=e=>{let{setPage:t}=e;return(0,s.jsx)(es.default,{style:{minHeight:"100vh",maxWidth:"120px"},children:(0,s.jsx)(er,{width:120,children:(0,s.jsxs)(el.Z,{mode:"inline",defaultSelectedKeys:["1"],style:{height:"100%",borderRight:0},children:[(0,s.jsx)(el.Z.Item,{onClick:()=>t("api-keys"),children:"API Keys"},"1"),(0,s.jsx)(el.Z.Item,{onClick:()=>t("models"),children:"Models"},"2"),(0,s.jsx)(el.Z.Item,{onClick:()=>t("llm-playground"),children:"Chat UI"},"3"),(0,s.jsx)(el.Z.Item,{onClick:()=>t("usage"),children:"Usage"},"4")]})})})};let eo=e=>{let{payload:t,active:n}=e;if(!n||!t)return null;let l=t[0].payload,r=l.startTime,a=Object.entries(l.models).map(e=>{let[t,n]=e;return[t,n]});a.sort((e,t)=>t[1]-e[1]);let o=a.slice(0,5);return(0,s.jsxs)("div",{className:"w-56 rounded-tremor-default border border-tremor-border bg-tremor-background p-2 text-tremor-default shadow-tremor-dropdown",children:[r,o.map(e=>{let[t,n]=e;return(0,s.jsx)("div",{className:"flex flex-1 space-x-10",children:(0,s.jsx)("div",{className:"p-2",children:(0,s.jsxs)("p",{className:"text-tremor-content text-xs",children:[t,":",(0,s.jsxs)("span",{className:"text-xs text-tremor-content-emphasis",children:[" ",n?n<.01?"<$0.01":n.toFixed(2):""]})]})})},t)})]})};var ei=e=>{let{accessToken:t,token:n,userRole:r,userID:a}=e,o=new Date,[i,c]=(0,l.useState)([]),[d,m]=(0,l.useState)([]),[h,u]=(0,l.useState)([]),x=new Date(o.getFullYear(),o.getMonth(),1),g=new Date(o.getFullYear(),o.getMonth()+1,0),Z=k(x),w=k(g);function k(e){let t=e.getFullYear(),n=e.getMonth()+1,s=e.getDate();return"".concat(t,"-").concat(n<10?"0"+n:n,"-").concat(s<10?"0"+s:s)}return console.log("Start date is ".concat(Z)),console.log("End date is ".concat(w)),(0,l.useEffect)(()=>{t&&n&&r&&a&&(async()=>{try{await p(t,n,r,a,Z,w).then(async e=>{let n=(await 
j(t,function(e){let t=[];e.forEach(e=>{Object.entries(e).forEach(e=>{let[n,s]=e;"spend"!==n&&"startTime"!==n&&"models"!==n&&"users"!==n&&t.push({key:n,spend:s})})}),t.sort((e,t)=>Number(t.spend)-Number(e.spend));let n=t.slice(0,5).map(e=>e.key);return console.log("topKeys: ".concat(Object.keys(n[0]))),n}(e))).info.map(e=>({key:(e.key_name||e.key_alias||e.token).substring(0,7),spend:e.spend}));m(n),u(function(e){let t={};e.forEach(e=>{Object.entries(e.users).forEach(e=>{let[n,s]=e;""!==n&&null!=n&&"None"!=n&&(t[n]||(t[n]=0),t[n]+=s)})});let n=Object.entries(t).map(e=>{let[t,n]=e;return{user_id:t,spend:n}});n.sort((e,t)=>t.spend-e.spend);let s=n.slice(0,5);return console.log("topKeys: ".concat(Object.values(s[0]))),s}(e)),c(e)})}catch(e){console.error("There was an error fetching the data",e)}})()},[t,n,r,a,Z,w]),(0,s.jsx)("div",{style:{width:"100%"},children:(0,s.jsxs)(f.Z,{numItems:2,className:"gap-2 p-10 h-[75vh] w-full",children:[(0,s.jsx)(y.Z,{numColSpan:2,children:(0,s.jsxs)(C.Z,{children:[(0,s.jsx)(U.Z,{children:"Monthly Spend"}),(0,s.jsx)(F.Z,{data:i,index:"startTime",categories:["spend"],colors:["blue"],valueFormatter:e=>"$ ".concat(new Intl.NumberFormat("us").format(e).toString()),yAxisWidth:100,tickGap:5,customTooltip:eo})]})}),(0,s.jsx)(y.Z,{numColSpan:1,children:(0,s.jsxs)(C.Z,{children:[(0,s.jsx)(U.Z,{children:"Top API Keys"}),(0,s.jsx)(F.Z,{className:"mt-4 h-40",data:d,index:"key",categories:["spend"],colors:["blue"],yAxisWidth:80,tickGap:5,layout:"vertical",showXAxis:!1,showLegend:!1})]})}),(0,s.jsx)(y.Z,{numColSpan:1,children:(0,s.jsxs)(C.Z,{children:[(0,s.jsx)(U.Z,{children:"Top Users"}),(0,s.jsx)(F.Z,{className:"mt-4 
h-40",data:h,index:"user_id",categories:["spend"],colors:["blue"],yAxisWidth:200,layout:"vertical",showXAxis:!1,showLegend:!1})]})})]})})},ec=()=>{let[e,t]=(0,l.useState)(null),[n,a]=(0,l.useState)(null),o=(0,r.useSearchParams)(),c=o.get("userID"),d=o.get("token"),[m,h]=(0,l.useState)("api-keys"),[u,x]=(0,l.useState)(null);return(0,l.useEffect)(()=>{if(d){let e=(0,q.o)(d);if(e){if(console.log("Decoded token:",e),console.log("Decoded key:",e.key),x(e.key),e.user_role){let n=function(e){if(!e)return"Undefined Role";switch(console.log("Received user role: ".concat(e)),e.toLowerCase()){case"app_owner":case"demo_app_owner":return"App Owner";case"app_admin":return"Admin";case"app_user":return"App User";default:return"Unknown Role"}}(e.user_role);console.log("Decoded user_role:",n),t(n)}else console.log("User role not defined");e.user_email?a(e.user_email):console.log("User Email is not set ".concat(e))}}},[d]),(0,s.jsx)(l.Suspense,{fallback:(0,s.jsx)("div",{children:"Loading..."}),children:(0,s.jsxs)("div",{className:"flex flex-col min-h-screen",children:[(0,s.jsx)(i,{userID:c,userRole:e,userEmail:n}),(0,s.jsxs)("div",{className:"flex flex-1 overflow-auto",children:[(0,s.jsx)(ea,{setPage:h}),"api-keys"==m?(0,s.jsx)(G,{userID:c,userRole:e,setUserRole:t,userEmail:n,setUserEmail:a}):"models"==m?(0,s.jsx)($,{userID:c,userRole:e,token:d,accessToken:u}):"llm-playground"==m?(0,s.jsx)(en,{userID:c,userRole:e,token:d,accessToken:u}):(0,s.jsx)(ei,{userID:c,userRole:e,token:d,accessToken:u})]})]})})}}},function(e){e.O(0,[145,971,69,744],function(){return e(e.s=20661)}),_N_E=e.O()}]); \ No newline at end of file diff --git a/litellm/proxy/_experimental/out/_next/static/chunks/app/page-7bb820bd6902dbf2.js b/litellm/proxy/_experimental/out/_next/static/chunks/app/page-7bb820bd6902dbf2.js deleted file mode 100644 index 5402c8d1f..000000000 --- a/litellm/proxy/_experimental/out/_next/static/chunks/app/page-7bb820bd6902dbf2.js +++ /dev/null @@ -1 +0,0 @@ 
-(self.webpackChunk_N_E=self.webpackChunk_N_E||[]).push([[931],{20661:function(e,t,n){Promise.resolve().then(n.bind(n,48016))},48016:function(e,t,n){"use strict";n.r(t),n.d(t,{default:function(){return ec}});var s=n(3827),l=n(64090),r=n(47907),a=n(8792),o=n(2179),i=e=>{let{userID:t,userRole:n,userEmail:l}=e;return console.log("User ID:",t),console.log("userEmail:",l),(0,s.jsxs)("nav",{className:"left-0 right-0 top-0 flex justify-between items-center h-12 mb-4",children:[(0,s.jsx)("div",{className:"text-left mx-4 my-2 absolute top-0 left-0",children:(0,s.jsx)("div",{className:"flex flex-col items-center",children:(0,s.jsx)(a.default,{href:"/",children:(0,s.jsx)("button",{className:"text-gray-800 text-2xl px-4 py-1 rounded text-center",children:"\uD83D\uDE85 LiteLLM"})})})}),(0,s.jsx)("div",{className:"text-right mx-4 my-2 absolute top-0 right-0",children:(0,s.jsxs)(o.Z,{variant:"secondary",children:[l,(0,s.jsxs)("p",{children:["Role: ",n]}),(0,s.jsxs)("p",{children:["ID: ",t]})]})})]})},c=n(80588);let d=async(e,t,n)=>{try{if(console.log("Form Values in keyCreateCall:",n),n.description&&(n.metadata||(n.metadata={}),n.metadata.description=n.description,delete n.description,n.metadata=JSON.stringify(n.metadata)),n.metadata){console.log("formValues.metadata:",n.metadata);try{n.metadata=JSON.parse(n.metadata)}catch(e){throw c.ZP.error("Failed to parse metadata: "+e),Error("Failed to parse metadata: "+e)}}console.log("Form Values after check:",n);let s=await fetch("/key/generate",{method:"POST",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"},body:JSON.stringify({user_id:t,...n})});if(!s.ok){let e=await s.text();throw c.ZP.error("Failed to create key: "+e),console.error("Error response from the server:",e),Error("Network response was not ok")}let l=await s.json();return console.log("API Response:",l),l}catch(e){throw console.error("Failed to create key:",e),e}},m=async(e,t)=>{try{console.log("in keyDeleteCall:",t),c.ZP.info("Making key delete 
request");let n=await fetch("/key/delete",{method:"POST",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"},body:JSON.stringify({keys:[t]})});if(!n.ok){let e=await n.text();throw c.ZP.error("Failed to delete key: "+e),Error("Network response was not ok")}let s=await n.json();return console.log(s),c.ZP.success("API Key Deleted"),s}catch(e){throw console.error("Failed to create key:",e),e}},h=async(e,t,n)=>{try{let s="/user/info";"App Owner"==n&&(s="".concat(s,"/?user_id=").concat(t)),c.ZP.info("Requesting user data");let l=await fetch(s,{method:"GET",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"}});if(!l.ok){let e=await l.text();throw c.ZP.error(e),Error("Network response was not ok")}let r=await l.json();return c.ZP.info("Received user data"),r}catch(e){throw console.error("Failed to create key:",e),e}},u=async(e,t,n)=>{try{c.ZP.info("Requesting model data");let t=await fetch("/model/info",{method:"GET",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"}});if(!t.ok){let e=await t.text();throw c.ZP.error(e),Error("Network response was not ok")}let n=await t.json();return c.ZP.info("Received model data"),n}catch(e){throw console.error("Failed to create key:",e),e}},x=async(e,t)=>{try{let n="/spend/logs";console.log("in keySpendLogsCall:",n);let s=await fetch("".concat(n,"/?api_key=").concat(t),{method:"GET",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"}});if(!s.ok){let e=await s.text();throw c.ZP.error(e),Error("Network response was not ok")}let l=await s.json();return console.log(l),l}catch(e){throw console.error("Failed to create key:",e),e}},p=async(e,t,n,s,l,r)=>{try{let t="/spend/logs";t="App Owner"==n?"".concat(t,"/?user_id=").concat(s,"&start_date=").concat(l,"&end_date=").concat(r):"".concat(t,"/?start_date=").concat(l,"&end_date=").concat(r),c.ZP.info("Making spend logs request");let a=await fetch(t,{method:"GET",headers:{Authorization:"Bearer 
".concat(e),"Content-Type":"application/json"}});if(!a.ok){let e=await a.text();throw c.ZP.error(e),Error("Network response was not ok")}let o=await a.json();return console.log(o),c.ZP.success("Spend Logs received"),o}catch(e){throw console.error("Failed to create key:",e),e}},j=async(e,t)=>{try{let n=await fetch("/key/info",{method:"POST",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"},body:JSON.stringify({keys:t})});if(!n.ok){let e=await n.text();throw c.ZP.error(e),Error("Network response was not ok")}let s=await n.json();return console.log(s),s}catch(e){throw console.error("Failed to create key:",e),e}},g=async(e,t)=>{try{let n="/spend/users";console.log("in spendUsersCall:",n);let s=await fetch("".concat(n,"/?user_id=").concat(t),{method:"GET",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"}});if(!s.ok){let e=await s.text();throw c.ZP.error(e),Error("Network response was not ok")}let l=await s.json();return console.log(l),l}catch(e){throw console.error("Failed to get spend for user",e),e}};var y=n(10384),f=n(46453),Z=n(71801),w=n(13969),k=n(12143),_=n(77171),v=n(29714),b=n(88707),S=n(1861);let{Option:N}=w.default;var I=e=>{let{userID:t,userRole:n,accessToken:r,data:a,userModels:i,setData:m}=e,[h]=k.Z.useForm(),[u,x]=(0,l.useState)(!1),[p,j]=(0,l.useState)(null),g=()=>{x(!1),h.resetFields()},I=()=>{x(!1),j(null),h.resetFields()},A=async e=>{try{c.ZP.info("Making API Call"),x(!0);let n=await d(r,t,e);m(e=>e?[...e,n]:[n]),j(n.key),c.ZP.success("API Key Created"),h.resetFields(),localStorage.removeItem("userData"+t)}catch(e){console.error("Error creating the key:",e)}};return(0,s.jsxs)("div",{children:[(0,s.jsx)(o.Z,{className:"mx-auto",onClick:()=>x(!0),children:"+ Create New Key"}),(0,s.jsx)(_.Z,{title:"Create Key",visible:u,width:800,footer:null,onOk:g,onCancel:I,children:(0,s.jsxs)(k.Z,{form:h,onFinish:A,labelCol:{span:6},wrapperCol:{span:16},labelAlign:"left",children:["App 
Owner"===n||"Admin"===n?(0,s.jsxs)(s.Fragment,{children:[(0,s.jsx)(k.Z.Item,{label:"Key Name",name:"key_alias",children:(0,s.jsx)(v.Z,{})}),(0,s.jsx)(k.Z.Item,{label:"Team ID",name:"team_id",children:(0,s.jsx)(v.Z,{placeholder:"ai_team"})}),(0,s.jsx)(k.Z.Item,{label:"Models",name:"models",children:(0,s.jsx)(w.default,{mode:"multiple",placeholder:"Select models",style:{width:"100%"},children:i.map(e=>(0,s.jsx)(N,{value:e,children:e},e))})}),(0,s.jsx)(k.Z.Item,{label:"Max Budget (USD)",name:"max_budget",children:(0,s.jsx)(b.Z,{step:.01,precision:2,width:200})}),(0,s.jsx)(k.Z.Item,{label:"Duration (eg: 30s, 30h, 30d)",name:"duration",children:(0,s.jsx)(v.Z,{})}),(0,s.jsx)(k.Z.Item,{label:"Metadata",name:"metadata",children:(0,s.jsx)(v.Z.TextArea,{rows:4,placeholder:"Enter metadata as JSON"})})]}):(0,s.jsxs)(s.Fragment,{children:[(0,s.jsx)(k.Z.Item,{label:"Key Name",name:"key_alias",children:(0,s.jsx)(v.Z,{})}),(0,s.jsx)(k.Z.Item,{label:"Team ID (Contact Group)",name:"team_id",children:(0,s.jsx)(v.Z,{placeholder:"ai_team"})}),(0,s.jsx)(k.Z.Item,{label:"Description",name:"description",children:(0,s.jsx)(v.Z.TextArea,{placeholder:"Enter description",rows:4})})]}),(0,s.jsx)("div",{style:{textAlign:"right",marginTop:"10px"},children:(0,s.jsx)(S.ZP,{htmlType:"submit",children:"Create Key"})})]})}),p&&(0,s.jsx)(_.Z,{title:"Save your key",visible:u,onOk:g,onCancel:I,footer:null,children:(0,s.jsxs)(f.Z,{numItems:1,className:"gap-2 w-full",children:[(0,s.jsx)(y.Z,{numColSpan:1,children:(0,s.jsxs)("p",{children:["Please save this secret key somewhere safe and accessible. For security reasons, ",(0,s.jsx)("b",{children:"you will not be able to view it again"})," ","through your LiteLLM account. 
If you lose this secret key, you will need to generate a new one."]})}),(0,s.jsx)(y.Z,{numColSpan:1,children:null!=p?(0,s.jsxs)(Z.Z,{children:["API Key: ",p]}):(0,s.jsx)(Z.Z,{children:"Key being created, this might take 30s"})})]})})]})},A=n(33393),C=n(13810),D=n(61244),T=n(10827),P=n(3851),E=n(2044),O=n(64167),R=n(74480),M=n(7178),U=n(42440),F=n(9853),K=n(67989),L=n(56863),z=e=>{let{token:t,accessToken:n,keySpend:r,keyBudget:a,keyName:i}=e,[c,d]=(0,l.useState)(!1),[m,h]=(0,l.useState)(null),[u,p]=(0,l.useState)(null),j=async()=>{try{if(null==n||null==t)return;console.log("accessToken: ".concat(n,"; token: ").concat(t));let e=await x(n,t);console.log("Response:",e);let s=Object.values(e).reduce((e,t)=>{let n=new Date(t.startTime),s=new Intl.DateTimeFormat("en-US",{day:"2-digit",month:"short"}).format(n);return e[s]=(e[s]||0)+t.spend,e},{}),l=Object.entries(s);l.sort((e,t)=>{let[n]=e,[s]=t,l=new Date(n),r=new Date(s);return l.getTime()-r.getTime()});let r=Object.fromEntries(l);console.log(r);let a=Object.values(e).reduce((e,t)=>{let n=t.user;return e[n]=(e[n]||0)+t.spend,e},{});console.log(s),console.log(a);let o=[];for(let[e,t]of Object.entries(r))o.push({day:e,spend:t});let i=Object.entries(a).sort((e,t)=>t[1]-e[1]).slice(0,5).map(e=>{let[t,n]=e;return{name:t,value:n}});h(o),p(i),console.log("arrayBarChart:",o)}catch(e){console.error("There was an error fetching the data",e)}};return t?(0,s.jsxs)("div",{children:[(0,s.jsx)(o.Z,{className:"mx-auto",onClick:()=>{console.log("Show Modal triggered"),d(!0),j()},children:"View Spend Report"}),(0,s.jsxs)(_.Z,{visible:c,width:1e3,onOk:()=>{d(!1)},onCancel:()=>{d(!1)},footer:null,children:[(0,s.jsxs)(U.Z,{style:{textAlign:"left"},children:["Key Name: ",i]}),(0,s.jsxs)(L.Z,{children:["Monthly Spend $",r]}),(0,s.jsx)(C.Z,{className:"mt-6 mb-6",children:m&&(0,s.jsx)(F.Z,{className:"mt-6",data:m,colors:["green"],index:"day",categories:["spend"],yAxisWidth:48})}),(0,s.jsx)(U.Z,{className:"mt-6",children:"Top 5 Users Spend 
(USD)"}),(0,s.jsx)(C.Z,{className:"mb-6",children:u&&(0,s.jsx)(K.Z,{className:"mt-6",data:u,color:"teal"})})]})]}):null},B=e=>{let{userID:t,accessToken:n,data:r,setData:a}=e,[i,c]=(0,l.useState)(!1),[d,h]=(0,l.useState)(!1),[u,x]=(0,l.useState)(null),p=async e=>{null!=r&&(x(e),localStorage.removeItem("userData"+t),h(!0))},j=async()=>{if(null!=u&&null!=r){try{await m(n,u);let e=r.filter(e=>e.token!==u);a(e)}catch(e){console.error("Error deleting the key:",e)}h(!1),x(null)}};if(null!=r)return console.log("RERENDER TRIGGERED"),(0,s.jsxs)(C.Z,{className:"w-full mx-auto flex-auto overflow-y-auto max-h-[50vh] mb-4",children:[(0,s.jsx)(U.Z,{children:"API Keys"}),(0,s.jsxs)(T.Z,{className:"mt-5",children:[(0,s.jsx)(O.Z,{children:(0,s.jsxs)(M.Z,{children:[(0,s.jsx)(R.Z,{children:"Key Alias"}),(0,s.jsx)(R.Z,{children:"Secret Key"}),(0,s.jsx)(R.Z,{children:"Spend (USD)"}),(0,s.jsx)(R.Z,{children:"Key Budget (USD)"}),(0,s.jsx)(R.Z,{children:"Team ID"}),(0,s.jsx)(R.Z,{children:"Metadata"}),(0,s.jsx)(R.Z,{children:"Models"}),(0,s.jsx)(R.Z,{children:"TPM / RPM Limits"}),(0,s.jsx)(R.Z,{children:"Expires"})]})}),(0,s.jsx)(P.Z,{children:r.map(e=>(console.log(e),"litellm-dashboard"===e.team_id)?null:(0,s.jsxs)(M.Z,{children:[(0,s.jsx)(E.Z,{children:null!=e.key_alias?(0,s.jsx)(Z.Z,{children:e.key_alias}):(0,s.jsx)(Z.Z,{children:"Not Set"})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(Z.Z,{children:e.key_name})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(Z.Z,{children:e.spend})}),(0,s.jsx)(E.Z,{children:null!=e.max_budget?(0,s.jsx)(Z.Z,{children:e.max_budget}):(0,s.jsx)(Z.Z,{children:"Unlimited Budget"})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(Z.Z,{children:e.team_id})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(Z.Z,{children:JSON.stringify(e.metadata)})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(Z.Z,{children:JSON.stringify(e.models)})}),(0,s.jsx)(E.Z,{children:(0,s.jsxs)(Z.Z,{children:["TPM Limit: ",e.tpm_limit?e.tpm_limit:"Unlimited"," ",(0,s.jsx)("br",{})," RPM Limit:"," 
",e.rpm_limit?e.rpm_limit:"Unlimited"]})}),(0,s.jsx)(E.Z,{children:null!=e.expires?(0,s.jsx)(Z.Z,{children:e.expires}):(0,s.jsx)(Z.Z,{children:"Never expires"})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(D.Z,{onClick:()=>p(e.token),icon:A.Z,size:"sm"})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(z,{token:e.token,accessToken:n,keySpend:e.spend,keyBudget:e.max_budget,keyName:e.key_name})})]},e.token))})]}),d&&(0,s.jsx)("div",{className:"fixed z-10 inset-0 overflow-y-auto",children:(0,s.jsxs)("div",{className:"flex items-end justify-center min-h-screen pt-4 px-4 pb-20 text-center sm:block sm:p-0",children:[(0,s.jsx)("div",{className:"fixed inset-0 transition-opacity","aria-hidden":"true",children:(0,s.jsx)("div",{className:"absolute inset-0 bg-gray-500 opacity-75"})}),(0,s.jsx)("span",{className:"hidden sm:inline-block sm:align-middle sm:h-screen","aria-hidden":"true",children:"​"}),(0,s.jsxs)("div",{className:"inline-block align-bottom bg-white rounded-lg text-left overflow-hidden shadow-xl transform transition-all sm:my-8 sm:align-middle sm:max-w-lg sm:w-full",children:[(0,s.jsx)("div",{className:"bg-white px-4 pt-5 pb-4 sm:p-6 sm:pb-4",children:(0,s.jsx)("div",{className:"sm:flex sm:items-start",children:(0,s.jsxs)("div",{className:"mt-3 text-center sm:mt-0 sm:ml-4 sm:text-left",children:[(0,s.jsx)("h3",{className:"text-lg leading-6 font-medium text-gray-900",children:"Delete Key"}),(0,s.jsx)("div",{className:"mt-2",children:(0,s.jsx)("p",{className:"text-sm text-gray-500",children:"Are you sure you want to delete this key ?"})})]})})}),(0,s.jsxs)("div",{className:"bg-gray-50 px-4 py-3 sm:px-6 sm:flex sm:flex-row-reverse",children:[(0,s.jsx)(o.Z,{onClick:j,color:"red",className:"ml-2",children:"Delete"}),(0,s.jsx)(o.Z,{onClick:()=>{h(!1),x(null)},children:"Cancel"})]})]})]})})]})},J=e=>{let{userID:t,userSpendData:n,userRole:r,accessToken:a}=e;console.log("User SpendData:",n);let[o,i]=(0,l.useState)(null==n?void 0:n.spend),[c,d]=(0,l.useState)((null==n?void 
0:n.max_budget)||null);return(0,l.useEffect)(()=>{(async()=>{if("Admin"===r)try{let e=await g(a,"litellm-proxy-budget");console.log("Result from callSpendUsers:",e);let t=e[0];i(null==t?void 0:t.spend),d((null==t?void 0:t.max_budget)||null)}catch(e){console.error("Failed to get spend for user",e)}})()},[r,a,t]),(0,s.jsx)(s.Fragment,{children:(0,s.jsxs)(C.Z,{className:"mx-auto mb-4",children:[(0,s.jsxs)(L.Z,{children:["$",o]}),(0,s.jsxs)(U.Z,{children:["/ ",null!==c?"$".concat(c," limit"):"No limit"]})]})})},q=n(37963);console.log("isLocal:",!1);var G=e=>{let{userID:t,userRole:n,setUserRole:a,userEmail:o,setUserEmail:i}=e,[c,d]=(0,l.useState)(null),[m,x]=(0,l.useState)(null),p=(0,r.useSearchParams)();p.get("viewSpend"),(0,r.useRouter)();let j=p.get("token"),[g,Z]=(0,l.useState)(null),[w,k]=(0,l.useState)([]);if((0,l.useEffect)(()=>{if(j){let e=(0,q.o)(j);if(e){if(console.log("Decoded token:",e),console.log("Decoded key:",e.key),Z(e.key),e.user_role){let t=function(e){if(!e)return"Undefined Role";switch(console.log("Received user role: ".concat(e)),e.toLowerCase()){case"app_owner":case"demo_app_owner":return"App Owner";case"app_admin":return"Admin";case"app_user":return"App User";default:return"Unknown Role"}}(e.user_role);console.log("Decoded user_role:",t),a(t)}else console.log("User role not defined");e.user_email?i(e.user_email):console.log("User Email is not set ".concat(e))}}if(t&&g&&n&&!c){let e=localStorage.getItem("userData"+t),s=localStorage.getItem("userSpendData"+t),l=localStorage.getItem("userModels"+t);e&&s&&l?(d(JSON.parse(e)),x(JSON.parse(s)),k(JSON.parse(l))):(async()=>{try{let e=await h(g,t,n);x(e.user_info),d(e.keys),localStorage.setItem("userData"+t,JSON.stringify(e.keys)),localStorage.setItem("userSpendData"+t,JSON.stringify(e.user_info));let s=await u(g,t,n);console.log("model_info:",s);let 
l=s.data.map(e=>e.model_name);console.log("available_model_names:",l),k(l),console.log("userModels:",w),localStorage.setItem("userModels"+t,JSON.stringify(l))}catch(e){console.error("There was an error fetching the data",e)}})()}},[t,j,g,c,n]),null==t||null==j){let e="/sso/key/generate";return console.log("Full URL:",e),window.location.href=e,null}return null==g?null:(null==n&&a("App Owner"),(0,s.jsx)("div",{children:(0,s.jsx)(f.Z,{numItems:1,className:"gap-0 p-10 h-[75vh] w-full",children:(0,s.jsxs)(y.Z,{numColSpan:1,children:[(0,s.jsx)(J,{userID:t,userSpendData:m,userRole:n,accessToken:g}),(0,s.jsx)(B,{userID:t,accessToken:g,data:c,setData:d}),(0,s.jsx)(I,{userID:t,userRole:n,userModels:w,accessToken:g,data:c,setData:d})]})})}))},$=e=>{let{accessToken:t,token:n,userRole:r,userID:a}=e,[o,i]=(0,l.useState)({data:[]});if((0,l.useEffect)(()=>{if(!t||!n||!r||!a)return;let e=async()=>{try{let e=await u(t,a,r);console.log("Model data response:",e.data),i(e)}catch(e){console.error("There was an error fetching the model data",e)}};t&&n&&r&&a&&e()},[t,n,r,a]),!o)return(0,s.jsx)("div",{children:"Loading..."});for(let e=0;e(0,s.jsxs)(M.Z,{children:[(0,s.jsx)(E.Z,{children:(0,s.jsx)(U.Z,{children:e.model_name})}),(0,s.jsx)(E.Z,{children:e.provider}),(0,s.jsx)(E.Z,{children:e.input_cost}),(0,s.jsx)(E.Z,{children:e.output_cost}),(0,s.jsx)(E.Z,{children:e.max_tokens})]},e.model_name))})]})})})})},V=n(92836),W=n(26734),H=n(41608),Y=n(32126),X=n(23682),Q=n(12968),ee=n(67951);async function et(e,t,n,s){console.log("isLocal:",!1);let l=window.location.origin,r=new Q.ZP.OpenAI({apiKey:s,baseURL:l,dangerouslyAllowBrowser:!0});for await(let s of(await r.chat.completions.create({model:n,stream:!0,messages:[{role:"user",content:e}]})))console.log(s),s.choices[0].delta.content&&t(s.choices[0].delta.content)}var en=e=>{let{accessToken:t,token:n,userRole:r,userID:a}=e,[o,i]=(0,l.useState)(""),[c,d]=(0,l.useState)([]),[m,h]=(0,l.useState)(void 
0),[x,p]=(0,l.useState)(null);(0,l.useEffect)(()=>{t&&n&&r&&a&&(async()=>{let e=await u(t,a,r);console.log("model_info:",e),(null==e?void 0:e.data.length)>0&&(p(e),h(e.data[0].model_name))})()},[t,a,r]);let j=(e,t)=>{d(n=>{let s=n[n.length-1];return s&&s.role===e?[...n.slice(0,n.length-1),{role:e,content:s.content+t}]:[...n,{role:e,content:t}]})},g=async()=>{if(""!==o.trim()&&t&&n&&r&&a){d(e=>[...e,{role:"user",content:o}]);try{m&&await et(o,e=>j("assistant",e),m,t)}catch(e){console.error("Error fetching model response",e),j("assistant","Error fetching model response")}i("")}};return(0,s.jsx)("div",{style:{width:"100%",position:"relative"},children:(0,s.jsx)(f.Z,{className:"gap-2 p-10 h-[75vh] w-full",children:(0,s.jsx)(C.Z,{children:(0,s.jsxs)(W.Z,{children:[(0,s.jsxs)(H.Z,{className:"mt-4",children:[(0,s.jsx)(V.Z,{children:"Chat"}),(0,s.jsx)(V.Z,{children:"API Reference"})]}),(0,s.jsxs)(X.Z,{children:[(0,s.jsxs)(Y.Z,{children:[(0,s.jsxs)("div",{children:[(0,s.jsx)("label",{children:"Select Model:"}),(0,s.jsx)("select",{value:m||"",onChange:e=>h(e.target.value),children:null==x?void 0:x.data.map(e=>(0,s.jsx)("option",{value:e.model_name,children:e.model_name},e.model_name))})]}),(0,s.jsxs)(T.Z,{className:"mt-5",style:{display:"block",maxHeight:"60vh",overflowY:"auto"},children:[(0,s.jsx)(O.Z,{children:(0,s.jsx)(M.Z,{children:(0,s.jsx)(E.Z,{children:(0,s.jsx)(U.Z,{children:"Chat"})})})}),(0,s.jsx)(P.Z,{children:c.map((e,t)=>(0,s.jsx)(M.Z,{children:(0,s.jsx)(E.Z,{children:"".concat(e.role,": ").concat(e.content)})},t))})]}),(0,s.jsx)("div",{className:"mt-3",style:{position:"absolute",bottom:5,width:"95%"},children:(0,s.jsxs)("div",{className:"flex",children:[(0,s.jsx)("input",{type:"text",value:o,onChange:e=>i(e.target.value),className:"flex-1 p-2 border rounded-md mr-2",placeholder:"Type your message..."}),(0,s.jsx)("button",{onClick:g,className:"p-2 bg-blue-500 text-white 
rounded-md",children:"Send"})]})})]}),(0,s.jsx)(Y.Z,{children:(0,s.jsxs)(W.Z,{children:[(0,s.jsxs)(H.Z,{children:[(0,s.jsx)(V.Z,{children:"OpenAI Python SDK"}),(0,s.jsx)(V.Z,{children:"LlamaIndex"}),(0,s.jsx)(V.Z,{children:"Langchain Py"})]}),(0,s.jsxs)(X.Z,{children:[(0,s.jsx)(Y.Z,{children:(0,s.jsx)(ee.Z,{language:"python",children:'\nimport openai\nclient = openai.OpenAI(\n api_key="your_api_key",\n base_url="http://0.0.0.0:4000" # proxy base url\n)\n\nresponse = client.chat.completions.create(\n model="gpt-3.5-turbo", # model to use from Models Tab\n messages = [\n {\n "role": "user",\n "content": "this is a test request, write a short poem"\n }\n ],\n extra_body={\n "metadata": {\n "generation_name": "ishaan-generation-openai-client",\n "generation_id": "openai-client-gen-id22",\n "trace_id": "openai-client-trace-id22",\n "trace_user_id": "openai-client-user-id2"\n }\n }\n)\n\nprint(response)\n '})}),(0,s.jsx)(Y.Z,{children:(0,s.jsx)(ee.Z,{language:"python",children:'\nimport os, dotenv\n\nfrom llama_index.llms import AzureOpenAI\nfrom llama_index.embeddings import AzureOpenAIEmbedding\nfrom llama_index import VectorStoreIndex, SimpleDirectoryReader, ServiceContext\n\nllm = AzureOpenAI(\n engine="azure-gpt-3.5", # model_name on litellm proxy\n temperature=0.0,\n azure_endpoint="http://0.0.0.0:4000", # litellm proxy endpoint\n api_key="sk-1234", # litellm proxy API Key\n api_version="2023-07-01-preview",\n)\n\nembed_model = AzureOpenAIEmbedding(\n deployment_name="azure-embedding-model",\n azure_endpoint="http://0.0.0.0:4000",\n api_key="sk-1234",\n api_version="2023-07-01-preview",\n)\n\n\ndocuments = SimpleDirectoryReader("llama_index_data").load_data()\nservice_context = ServiceContext.from_defaults(llm=llm, embed_model=embed_model)\nindex = VectorStoreIndex.from_documents(documents, service_context=service_context)\n\nquery_engine = index.as_query_engine()\nresponse = query_engine.query("What did the author do growing up?")\nprint(response)\n\n 
'})}),(0,s.jsx)(Y.Z,{children:(0,s.jsx)(ee.Z,{language:"python",children:'\nfrom langchain.chat_models import ChatOpenAI\nfrom langchain.prompts.chat import (\n ChatPromptTemplate,\n HumanMessagePromptTemplate,\n SystemMessagePromptTemplate,\n)\nfrom langchain.schema import HumanMessage, SystemMessage\n\nchat = ChatOpenAI(\n openai_api_base="http://0.0.0.0:8000",\n model = "gpt-3.5-turbo",\n temperature=0.1,\n extra_body={\n "metadata": {\n "generation_name": "ishaan-generation-langchain-client",\n "generation_id": "langchain-client-gen-id22",\n "trace_id": "langchain-client-trace-id22",\n "trace_user_id": "langchain-client-user-id2"\n }\n }\n)\n\nmessages = [\n SystemMessage(\n content="You are a helpful assistant that im using to make a test request to."\n ),\n HumanMessage(\n content="test from litellm. tell me why it\'s amazing in 1 sentence"\n ),\n]\nresponse = chat(messages)\n\nprint(response)\n\n '})})]})]})})]})]})})})})},es=n(33509),el=n(30569);let{Sider:er}=es.default;var ea=e=>{let{setPage:t}=e;return(0,s.jsx)(es.default,{style:{minHeight:"100vh",maxWidth:"120px"},children:(0,s.jsx)(er,{width:120,children:(0,s.jsxs)(el.Z,{mode:"inline",defaultSelectedKeys:["1"],style:{height:"100%",borderRight:0},children:[(0,s.jsx)(el.Z.Item,{onClick:()=>t("api-keys"),children:"API Keys"},"1"),(0,s.jsx)(el.Z.Item,{onClick:()=>t("models"),children:"Models"},"2"),(0,s.jsx)(el.Z.Item,{onClick:()=>t("llm-playground"),children:"Chat UI"},"3"),(0,s.jsx)(el.Z.Item,{onClick:()=>t("usage"),children:"Usage"},"4")]})})})};let eo=e=>{let{payload:t,active:n}=e;if(!n||!t)return null;let l=t[0].payload,r=l.startTime,a=Object.entries(l.models).map(e=>{let[t,n]=e;return[t,n]});a.sort((e,t)=>t[1]-e[1]);let o=a.slice(0,5);return(0,s.jsxs)("div",{className:"w-56 rounded-tremor-default border border-tremor-border bg-tremor-background p-2 text-tremor-default shadow-tremor-dropdown",children:[r,o.map(e=>{let[t,n]=e;return(0,s.jsx)("div",{className:"flex flex-1 
space-x-10",children:(0,s.jsx)("div",{className:"p-2",children:(0,s.jsxs)("p",{className:"text-tremor-content text-xs",children:[t,":",(0,s.jsxs)("span",{className:"text-xs text-tremor-content-emphasis",children:[" ",n?n<.01?"<$0.01":n.toFixed(2):""]})]})})},t)})]})};var ei=e=>{let{accessToken:t,token:n,userRole:r,userID:a}=e,o=new Date,[i,c]=(0,l.useState)([]),[d,m]=(0,l.useState)([]),[h,u]=(0,l.useState)([]),x=new Date(o.getFullYear(),o.getMonth(),1),g=new Date(o.getFullYear(),o.getMonth()+1,0),Z=k(x),w=k(g);function k(e){let t=e.getFullYear(),n=e.getMonth()+1,s=e.getDate();return"".concat(t,"-").concat(n<10?"0"+n:n,"-").concat(s<10?"0"+s:s)}return console.log("Start date is ".concat(Z)),console.log("End date is ".concat(w)),(0,l.useEffect)(()=>{t&&n&&r&&a&&(async()=>{try{await p(t,n,r,a,Z,w).then(async e=>{let n=(await j(t,function(e){let t=[];e.forEach(e=>{Object.entries(e).forEach(e=>{let[n,s]=e;"spend"!==n&&"startTime"!==n&&"models"!==n&&"users"!==n&&t.push({key:n,spend:s})})}),t.sort((e,t)=>Number(t.spend)-Number(e.spend));let n=t.slice(0,5).map(e=>e.key);return console.log("topKeys: ".concat(Object.keys(n[0]))),n}(e))).info.map(e=>({key:(e.key_name||e.key_alias||e.token).substring(0,7),spend:e.spend}));m(n),u(function(e){let t={};e.forEach(e=>{Object.entries(e.users).forEach(e=>{let[n,s]=e;""!==n&&null!=n&&"None"!=n&&(t[n]||(t[n]=0),t[n]+=s)})});let n=Object.entries(t).map(e=>{let[t,n]=e;return{user_id:t,spend:n}});n.sort((e,t)=>t.spend-e.spend);let s=n.slice(0,5);return console.log("topKeys: ".concat(Object.values(s[0]))),s}(e)),c(e)})}catch(e){console.error("There was an error fetching the data",e)}})()},[t,n,r,a,Z,w]),(0,s.jsx)("div",{style:{width:"100%"},children:(0,s.jsxs)(f.Z,{numItems:2,className:"gap-2 p-10 h-[75vh] w-full",children:[(0,s.jsx)(y.Z,{numColSpan:2,children:(0,s.jsxs)(C.Z,{children:[(0,s.jsx)(U.Z,{children:"Monthly Spend"}),(0,s.jsx)(F.Z,{data:i,index:"startTime",categories:["spend"],colors:["blue"],valueFormatter:e=>"$ ".concat(new 
Intl.NumberFormat("us").format(e).toString()),yAxisWidth:100,tickGap:5,customTooltip:eo})]})}),(0,s.jsx)(y.Z,{numColSpan:1,children:(0,s.jsxs)(C.Z,{children:[(0,s.jsx)(U.Z,{children:"Top API Keys"}),(0,s.jsx)(F.Z,{className:"mt-4 h-40",data:d,index:"key",categories:["spend"],colors:["blue"],yAxisWidth:80,tickGap:5,layout:"vertical",showXAxis:!1,showLegend:!1})]})}),(0,s.jsx)(y.Z,{numColSpan:1,children:(0,s.jsxs)(C.Z,{children:[(0,s.jsx)(U.Z,{children:"Top Users"}),(0,s.jsx)(F.Z,{className:"mt-4 h-40",data:h,index:"user_id",categories:["spend"],colors:["blue"],yAxisWidth:200,layout:"vertical",showXAxis:!1,showLegend:!1})]})})]})})},ec=()=>{let[e,t]=(0,l.useState)(null),[n,a]=(0,l.useState)(null),o=(0,r.useSearchParams)(),c=o.get("userID"),d=o.get("token"),[m,h]=(0,l.useState)("api-keys"),[u,x]=(0,l.useState)(null);return(0,l.useEffect)(()=>{if(d){let e=(0,q.o)(d);if(e){if(console.log("Decoded token:",e),console.log("Decoded key:",e.key),x(e.key),e.user_role){let n=function(e){if(!e)return"Undefined Role";switch(console.log("Received user role: ".concat(e)),e.toLowerCase()){case"app_owner":case"demo_app_owner":return"App Owner";case"app_admin":return"Admin";case"app_user":return"App User";default:return"Unknown Role"}}(e.user_role);console.log("Decoded user_role:",n),t(n)}else console.log("User role not defined");e.user_email?a(e.user_email):console.log("User Email is not set ".concat(e))}}},[d]),(0,s.jsx)(l.Suspense,{fallback:(0,s.jsx)("div",{children:"Loading..."}),children:(0,s.jsxs)("div",{className:"flex flex-col min-h-screen",children:[(0,s.jsx)(i,{userID:c,userRole:e,userEmail:n}),(0,s.jsxs)("div",{className:"flex flex-1 
overflow-auto",children:[(0,s.jsx)(ea,{setPage:h}),"api-keys"==m?(0,s.jsx)(G,{userID:c,userRole:e,setUserRole:t,userEmail:n,setUserEmail:a}):"models"==m?(0,s.jsx)($,{userID:c,userRole:e,token:d,accessToken:u}):"llm-playground"==m?(0,s.jsx)(en,{userID:c,userRole:e,token:d,accessToken:u}):(0,s.jsx)(ei,{userID:c,userRole:e,token:d,accessToken:u})]})]})})}}},function(e){e.O(0,[145,971,69,744],function(){return e(e.s=20661)}),_N_E=e.O()}]); \ No newline at end of file diff --git a/litellm/proxy/_experimental/out/index.html b/litellm/proxy/_experimental/out/index.html index 80296f4f6..a6994e708 100644 --- a/litellm/proxy/_experimental/out/index.html +++ b/litellm/proxy/_experimental/out/index.html @@ -1 +1 @@ -🚅 LiteLLM \ No newline at end of file +🚅 LiteLLM \ No newline at end of file diff --git a/litellm/proxy/_experimental/out/index.txt b/litellm/proxy/_experimental/out/index.txt index b6bb2c868..2356232b4 100644 --- a/litellm/proxy/_experimental/out/index.txt +++ b/litellm/proxy/_experimental/out/index.txt @@ -1,7 +1,7 @@ 2:I[77831,[],""] -3:I[48016,["145","static/chunks/145-9c160ad5539e000f.js","931","static/chunks/app/page-7bb820bd6902dbf2.js"],""] +3:I[48016,["145","static/chunks/145-9c160ad5539e000f.js","931","static/chunks/app/page-2322bcdc2ec71284.js"],""] 4:I[5613,[],""] 5:I[31778,[],""] 
-0:["unBuvDqydg0yodtP5c3nQ",[[["",{"children":["__PAGE__",{}]},"$undefined","$undefined",true],["",{"children":["__PAGE__",{},["$L1",["$","$L2",null,{"propsForComponent":{"params":{}},"Component":"$3","isStaticGeneration":true}],null]]},[null,["$","html",null,{"lang":"en","children":["$","body",null,{"className":"__className_c23dc8","children":["$","$L4",null,{"parallelRouterKey":"children","segmentPath":["children"],"loading":"$undefined","loadingStyles":"$undefined","loadingScripts":"$undefined","hasLoading":false,"error":"$undefined","errorStyles":"$undefined","errorScripts":"$undefined","template":["$","$L5",null,{}],"templateStyles":"$undefined","templateScripts":"$undefined","notFound":[["$","title",null,{"children":"404: This page could not be found."}],["$","div",null,{"style":{"fontFamily":"system-ui,\"Segoe UI\",Roboto,Helvetica,Arial,sans-serif,\"Apple Color Emoji\",\"Segoe UI Emoji\"","height":"100vh","textAlign":"center","display":"flex","flexDirection":"column","alignItems":"center","justifyContent":"center"},"children":["$","div",null,{"children":[["$","style",null,{"dangerouslySetInnerHTML":{"__html":"body{color:#000;background:#fff;margin:0}.next-error-h1{border-right:1px solid rgba(0,0,0,.3)}@media (prefers-color-scheme:dark){body{color:#fff;background:#000}.next-error-h1{border-right:1px solid rgba(255,255,255,.3)}}"}}],["$","h1",null,{"className":"next-error-h1","style":{"display":"inline-block","margin":"0 20px 0 0","padding":"0 23px 0 0","fontSize":24,"fontWeight":500,"verticalAlign":"top","lineHeight":"49px"},"children":"404"}],["$","div",null,{"style":{"display":"inline-block"},"children":["$","h2",null,{"style":{"fontSize":14,"fontWeight":400,"lineHeight":"49px","margin":0},"children":"This page could not be found."}]}]]}]}]],"notFoundStyles":[],"styles":null}]}]}],null]],[[["$","link","0",{"rel":"stylesheet","href":"/ui/_next/static/css/c18941d97fb7245b.css","precedence":"next","crossOrigin":""}]],"$L6"]]]] 
+0:["S_8LZOnl2nyURq-NYnh2p",[[["",{"children":["__PAGE__",{}]},"$undefined","$undefined",true],["",{"children":["__PAGE__",{},["$L1",["$","$L2",null,{"propsForComponent":{"params":{}},"Component":"$3","isStaticGeneration":true}],null]]},[null,["$","html",null,{"lang":"en","children":["$","body",null,{"className":"__className_c23dc8","children":["$","$L4",null,{"parallelRouterKey":"children","segmentPath":["children"],"loading":"$undefined","loadingStyles":"$undefined","loadingScripts":"$undefined","hasLoading":false,"error":"$undefined","errorStyles":"$undefined","errorScripts":"$undefined","template":["$","$L5",null,{}],"templateStyles":"$undefined","templateScripts":"$undefined","notFound":[["$","title",null,{"children":"404: This page could not be found."}],["$","div",null,{"style":{"fontFamily":"system-ui,\"Segoe UI\",Roboto,Helvetica,Arial,sans-serif,\"Apple Color Emoji\",\"Segoe UI Emoji\"","height":"100vh","textAlign":"center","display":"flex","flexDirection":"column","alignItems":"center","justifyContent":"center"},"children":["$","div",null,{"children":[["$","style",null,{"dangerouslySetInnerHTML":{"__html":"body{color:#000;background:#fff;margin:0}.next-error-h1{border-right:1px solid rgba(0,0,0,.3)}@media (prefers-color-scheme:dark){body{color:#fff;background:#000}.next-error-h1{border-right:1px solid rgba(255,255,255,.3)}}"}}],["$","h1",null,{"className":"next-error-h1","style":{"display":"inline-block","margin":"0 20px 0 0","padding":"0 23px 0 0","fontSize":24,"fontWeight":500,"verticalAlign":"top","lineHeight":"49px"},"children":"404"}],["$","div",null,{"style":{"display":"inline-block"},"children":["$","h2",null,{"style":{"fontSize":14,"fontWeight":400,"lineHeight":"49px","margin":0},"children":"This page could not be found."}]}]]}]}]],"notFoundStyles":[],"styles":null}]}]}],null]],[[["$","link","0",{"rel":"stylesheet","href":"/ui/_next/static/css/c18941d97fb7245b.css","precedence":"next","crossOrigin":""}]],"$L6"]]]] 
6:[["$","meta","0",{"name":"viewport","content":"width=device-width, initial-scale=1"}],["$","meta","1",{"charSet":"utf-8"}],["$","title","2",{"children":"🚅 LiteLLM"}],["$","meta","3",{"name":"description","content":"LiteLLM Proxy Admin UI"}],["$","link","4",{"rel":"icon","href":"/ui/favicon.ico","type":"image/x-icon","sizes":"16x16"}],["$","meta","5",{"name":"next-size-adjust"}]] 1:null diff --git a/litellm/proxy/_types.py b/litellm/proxy/_types.py index 372b953e0..827a25a2b 100644 --- a/litellm/proxy/_types.py +++ b/litellm/proxy/_types.py @@ -155,6 +155,9 @@ class GenerateKeyRequest(GenerateRequestBase): aliases: Optional[dict] = {} config: Optional[dict] = {} permissions: Optional[dict] = {} + model_max_budget: Optional[dict] = ( + {} + ) # {"gpt-4": 5.0, "gpt-3.5-turbo": 5.0}, defaults to {} class GenerateKeyResponse(GenerateKeyRequest): @@ -167,7 +170,13 @@ class GenerateKeyResponse(GenerateKeyRequest): def set_model_info(cls, values): if values.get("token") is not None: values.update({"key": values.get("token")}) - dict_fields = ["metadata", "aliases", "config", "permissions"] + dict_fields = [ + "metadata", + "aliases", + "config", + "permissions", + "model_max_budget", + ] for field in dict_fields: value = values.get(field) if value is not None and isinstance(value, str): @@ -302,6 +311,13 @@ class ConfigGeneralSettings(LiteLLMBase): None, description="connect to a postgres db - needed for generating temporary keys + tracking spend / key", ) + database_connection_pool_limit: Optional[int] = Field( + 100, + description="default connection pool for prisma client connecting to postgres db", + ) + database_connection_timeout: Optional[float] = Field( + 60, description="default timeout for a connection to the database" + ) database_type: Optional[Literal["dynamo_db"]] = Field( None, description="to use dynamodb instead of postgres db" ) @@ -383,6 +399,8 @@ class LiteLLM_VerificationToken(LiteLLMBase): budget_reset_at: Optional[datetime] = None 
allowed_cache_controls: Optional[list] = [] permissions: Dict = {} + model_spend: Dict = {} + model_max_budget: Dict = {} class UserAPIKeyAuth( @@ -410,6 +428,8 @@ class LiteLLM_UserTable(LiteLLMBase): user_id: str max_budget: Optional[float] spend: float = 0.0 + model_max_budget: Optional[Dict] = {} + model_spend: Optional[Dict] = {} user_email: Optional[str] models: list = [] diff --git a/litellm/proxy/db/dynamo_db.py b/litellm/proxy/db/dynamo_db.py index 206fee777..08b365191 100644 --- a/litellm/proxy/db/dynamo_db.py +++ b/litellm/proxy/db/dynamo_db.py @@ -287,6 +287,8 @@ class DynamoDBWrapper(CustomDB): or k == "config" or k == "metadata" or k == "permissions" + or k == "model_spend" + or k == "model_max_budget" ) and v is not None and isinstance(v, str) diff --git a/litellm/proxy/hooks/presidio_pii_masking.py b/litellm/proxy/hooks/presidio_pii_masking.py index 6ea329613..031f4e2d4 100644 --- a/litellm/proxy/hooks/presidio_pii_masking.py +++ b/litellm/proxy/hooks/presidio_pii_masking.py @@ -119,6 +119,9 @@ class _OPTIONAL_PresidioPIIMasking(CustomLogger): call_type: str, ): """ + - Check if request turned off pii + - Check if user allowed to turn off pii (key permissions -> 'allow_pii_controls') + - Take the request data - Call /analyze -> get the results - Call /anonymize w/ the analyze results -> get the redacted text @@ -126,13 +129,59 @@ class _OPTIONAL_PresidioPIIMasking(CustomLogger): For multiple messages in /chat/completions, we'll need to call them in parallel. 
""" permissions = user_api_key_dict.permissions - - if permissions.get("pii", True) == False: # allow key to turn off pii masking - return data - output_parse_pii = permissions.get( "output_parse_pii", litellm.output_parse_pii ) # allow key to turn on/off output parsing for pii + no_pii = permissions.get( + "no-pii", None + ) # allow key to turn on/off pii masking (if user is allowed to set pii controls, then they can override the key defaults) + + if no_pii is None: + # check older way of turning on/off pii + no_pii = not permissions.get("pii", True) + + content_safety = data.get("content_safety", None) + verbose_proxy_logger.debug(f"content_safety: {content_safety}") + ## Request-level turn on/off PII controls ## + if content_safety is not None and isinstance(content_safety, dict): + # pii masking ## + if ( + content_safety.get("no-pii", None) is not None + and content_safety.get("no-pii") == True + ): + # check if user allowed to turn this off + if permissions.get("allow_pii_controls", False) == False: + raise HTTPException( + status_code=400, + detail={"error": "Not allowed to set PII controls per request"}, + ) + else: # user allowed to turn off pii masking + no_pii = content_safety.get("no-pii") + if not isinstance(no_pii, bool): + raise HTTPException( + status_code=400, + detail={"error": "no_pii needs to be a boolean value"}, + ) + ## pii output parsing ## + if content_safety.get("output_parse_pii", None) is not None: + # check if user allowed to turn this off + if permissions.get("allow_pii_controls", False) == False: + raise HTTPException( + status_code=400, + detail={"error": "Not allowed to set PII controls per request"}, + ) + else: # user allowed to turn on/off pii output parsing + output_parse_pii = content_safety.get("output_parse_pii") + if not isinstance(output_parse_pii, bool): + raise HTTPException( + status_code=400, + detail={ + "error": "output_parse_pii needs to be a boolean value" + }, + ) + + if no_pii == False: # turn off pii masking + 
return data if call_type == "completion": # /chat/completions requests messages = data["messages"] diff --git a/litellm/proxy/proxy_cli.py b/litellm/proxy/proxy_cli.py index de21d0147..f6034cba3 100644 --- a/litellm/proxy/proxy_cli.py +++ b/litellm/proxy/proxy_cli.py @@ -409,6 +409,8 @@ def run_server( "uvicorn, gunicorn needs to be imported. Run - `pip install 'litellm[proxy]'`" ) + db_connection_pool_limit = 100 + db_connection_timeout = 60 if config is not None: """ Allow user to pass in db url via config @@ -427,6 +429,12 @@ def run_server( proxy_config.load_config(router=None, config_file_path=config) ) database_url = general_settings.get("database_url", None) + db_connection_pool_limit = general_settings.get( + "database_connection_pool_limit", 100 + ) + db_connection_timeout = general_settings.get( + "database_connection_timeout", 60 + ) if database_url and database_url.startswith("os.environ/"): original_dir = os.getcwd() # set the working directory to where this script is @@ -447,14 +455,19 @@ def run_server( try: if os.getenv("DATABASE_URL", None) is not None: ### add connection pool + pool timeout args - params = {"connection_limit": 100, "pool_timeout": 60} + params = { + "connection_limit": db_connection_pool_limit, + "pool_timeout": db_connection_timeout, + } database_url = os.getenv("DATABASE_URL") modified_url = append_query_params(database_url, params) os.environ["DATABASE_URL"] = modified_url - ### if os.getenv("DIRECT_URL", None) is not None: ### add connection pool + pool timeout args - params = {"connection_limit": 100, "pool_timeout": 60} + params = { + "connection_limit": db_connection_pool_limit, + "pool_timeout": db_connection_timeout, + } database_url = os.getenv("DIRECT_URL") modified_url = append_query_params(database_url, params) os.environ["DIRECT_URL"] = modified_url diff --git a/litellm/proxy/proxy_server.py b/litellm/proxy/proxy_server.py index 3b6393dca..295c80941 100644 --- a/litellm/proxy/proxy_server.py +++ 
b/litellm/proxy/proxy_server.py @@ -93,6 +93,7 @@ from litellm.proxy.utils import ( html_form, _read_request_body, _is_valid_team_configs, + _is_user_proxy_admin, ) from litellm.proxy.secret_managers.google_kms import load_google_kms import pydantic @@ -143,6 +144,9 @@ app = FastAPI( title="LiteLLM API", description=f"Proxy Server to call 100+ LLMs in the OpenAI format\n\n{ui_message}", version=version, + root_path=os.environ.get( + "SERVER_ROOT_PATH", "" + ), # check if user passed root path, FastAPI defaults this value to "" ) @@ -376,6 +380,11 @@ async def user_api_key_auth( # 3. If 'user' passed to /chat/completions, /embeddings endpoint is in budget # 4. If token is expired # 5. If token spend is under Budget for the token + # 6. If token spend per model is under budget per model + + request_data = await _read_request_body( + request=request + ) # request data, used across all checks. Making this easily available # Check 1. If token can call model litellm.model_alias_map = valid_token.aliases @@ -450,7 +459,6 @@ async def user_api_key_auth( if ( litellm.max_user_budget is not None ): # Check if 'user' passed in /chat/completions is in budget, only checked if litellm.max_user_budget is set - request_data = await _read_request_body(request=request) user_passed_to_chat_completions = request_data.get("user", None) if user_passed_to_chat_completions is not None: user_id_list.append(user_passed_to_chat_completions) @@ -496,11 +504,7 @@ async def user_api_key_auth( continue assert isinstance(_user, dict) # check if user is admin # - if ( - _user.get("user_role", None) is not None - and _user.get("user_role") == "proxy_admin" - ): - return UserAPIKeyAuth(api_key=master_key) + # Token exists, not expired now check if its in budget for the user user_max_budget = _user.get("max_budget", None) user_current_spend = _user.get("spend", None) @@ -587,6 +591,25 @@ async def user_api_key_auth( f"ExceededTokenBudget: Current spend for token: {valid_token.spend}; Max Budget for 
Token: {valid_token.max_budget}" ) + # Check 5. Token Model Spend is under Model budget + max_budget_per_model = valid_token.model_max_budget + spend_per_model = valid_token.model_spend + + if max_budget_per_model is not None and spend_per_model is not None: + current_model = request_data.get("model") + if current_model is not None: + current_model_spend = spend_per_model.get(current_model, None) + current_model_budget = max_budget_per_model.get(current_model, None) + + if ( + current_model_spend is not None + and current_model_budget is not None + ): + if current_model_spend > current_model_budget: + raise Exception( + f"ExceededModelBudget: Current spend for model: {current_model_spend}; Max Budget for Model: {current_model_budget}" + ) + # Token passed all checks api_key = valid_token.token @@ -616,11 +639,15 @@ async def user_api_key_auth( ) ) if ( - route.startswith("/key/") - or route.startswith("/user/") - or route.startswith("/model/") - or route.startswith("/spend/") - ) and (not is_master_key_valid): + ( + route.startswith("/key/") + or route.startswith("/user/") + or route.startswith("/model/") + or route.startswith("/spend/") + ) + and (not is_master_key_valid) + and (not _is_user_proxy_admin(user_id_information)) + ): allow_user_auth = False if ( general_settings.get("allow_user_auth", False) == True @@ -712,9 +739,12 @@ async def user_api_key_auth( # Do something if the current route starts with any of the allowed routes pass else: - raise Exception( - f"This key is made for LiteLLM UI, Tried to access route: {route}. Not allowed" - ) + if _is_user_proxy_admin(user_id_information): + pass + else: + raise Exception( + f"This key is made for LiteLLM UI, Tried to access route: {route}. 
Not allowed" + ) return UserAPIKeyAuth(api_key=api_key, **valid_token_dict) except Exception as e: # verbose_proxy_logger.debug(f"An exception occurred - {traceback.format_exc()}") @@ -937,13 +967,26 @@ async def update_database( # Calculate the new cost by adding the existing cost and response_cost existing_spend_obj.spend = existing_spend + response_cost + # track cost per model, for the given user + spend_per_model = existing_spend_obj.model_spend or {} + current_model = kwargs.get("model") + + if current_model is not None and spend_per_model is not None: + if spend_per_model.get(current_model) is None: + spend_per_model[current_model] = response_cost + else: + spend_per_model[current_model] += response_cost + existing_spend_obj.model_spend = spend_per_model + valid_token = user_api_key_cache.get_cache(key=id) if valid_token is not None and isinstance(valid_token, dict): user_api_key_cache.set_cache( key=id, value=existing_spend_obj.json() ) - verbose_proxy_logger.debug(f"new cost: {existing_spend_obj.spend}") + verbose_proxy_logger.debug( + f"user - new cost: {existing_spend_obj.spend}, user_id: {id}" + ) data_list.append(existing_spend_obj) # Update the cost column for the given user id @@ -980,15 +1023,28 @@ async def update_database( # Calculate the new cost by adding the existing cost and response_cost new_spend = existing_spend + response_cost - verbose_proxy_logger.debug(f"new cost: {new_spend}") + # track cost per model, for the given key + spend_per_model = existing_spend_obj.model_spend or {} + current_model = kwargs.get("model") + if current_model is not None and spend_per_model is not None: + if spend_per_model.get(current_model) is None: + spend_per_model[current_model] = response_cost + else: + spend_per_model[current_model] += response_cost + + verbose_proxy_logger.debug( + f"new cost: {new_spend}, new spend per model: {spend_per_model}" + ) # Update the cost column for the given token await prisma_client.update_data( - token=token, data={"spend": 
new_spend} + token=token, + data={"spend": new_spend, "model_spend": spend_per_model}, ) valid_token = user_api_key_cache.get_cache(key=token) if valid_token is not None: valid_token.spend = new_spend + valid_token.model_spend = spend_per_model user_api_key_cache.set_cache(key=token, value=valid_token) elif custom_db_client is not None: # Fetch the existing cost for the given token @@ -1068,10 +1124,21 @@ async def update_database( # Calculate the new cost by adding the existing cost and response_cost new_spend = existing_spend + response_cost + # track cost per model, for the given team + spend_per_model = existing_spend_obj.model_spend or {} + current_model = kwargs.get("model") + if current_model is not None and spend_per_model is not None: + if spend_per_model.get(current_model) is None: + spend_per_model[current_model] = response_cost + else: + spend_per_model[current_model] += response_cost + verbose_proxy_logger.debug(f"new cost: {new_spend}") # Update the cost column for the given token await prisma_client.update_data( - team_id=team_id, data={"spend": new_spend}, table_name="team" + team_id=team_id, + data={"spend": new_spend, "model_spend": spend_per_model}, + table_name="team", ) elif custom_db_client is not None: @@ -1645,6 +1712,7 @@ async def generate_key_helper_fn( key_alias: Optional[str] = None, allowed_cache_controls: Optional[list] = [], permissions: Optional[dict] = {}, + model_max_budget: Optional[dict] = {}, ): global prisma_client, custom_db_client, user_api_key_cache @@ -1678,6 +1746,8 @@ async def generate_key_helper_fn( config_json = json.dumps(config) permissions_json = json.dumps(permissions) metadata_json = json.dumps(metadata) + model_max_budget_json = json.dumps(model_max_budget) + user_id = user_id or str(uuid.uuid4()) user_role = user_role or "app_user" tpm_limit = tpm_limit @@ -1720,6 +1790,7 @@ async def generate_key_helper_fn( "budget_reset_at": key_reset_at, "allowed_cache_controls": allowed_cache_controls, "permissions": 
permissions_json, + "model_max_budget": model_max_budget_json, } if ( general_settings.get("allow_user_auth", False) == True @@ -1735,6 +1806,11 @@ async def generate_key_helper_fn( saved_token["metadata"] = json.loads(saved_token["metadata"]) if isinstance(saved_token["permissions"], str): saved_token["permissions"] = json.loads(saved_token["permissions"]) + if isinstance(saved_token["model_max_budget"], str): + saved_token["model_max_budget"] = json.loads( + saved_token["model_max_budget"] + ) + if saved_token.get("expires", None) is not None and isinstance( saved_token["expires"], datetime ): @@ -3078,6 +3154,20 @@ async def generate_key_fn( - max_parallel_requests: Optional[int] - Rate limit a user based on the number of parallel requests. Raises 429 error, if user's parallel requests > x. - metadata: Optional[dict] - Metadata for key, store information for key. Example metadata = {"team": "core-infra", "app": "app2", "email": "ishaan@berri.ai" } - permissions: Optional[dict] - key-specific permissions. Currently just used for turning off pii masking (if connected). Example - {"pii": false} + - model_max_budget: Optional[dict] - key-specific model budget in USD. Example - {"text-davinci-002": 0.5, "gpt-3.5-turbo": 0.5}. IF null or {} then no model specific budget. + + Examples: + + 1. 
Allow users to turn on/off pii masking + + ```bash + curl --location 'http://0.0.0.0:8000/key/generate' \ + --header 'Authorization: Bearer sk-1234' \ + --header 'Content-Type: application/json' \ + --data '{ + "permissions": {"allow_pii_controls": true} + }' + ``` Returns: - key: (str) The generated api key @@ -4871,7 +4961,7 @@ async def auth_callback(request: Request): if user_id is None: user_id = getattr(result, "first_name", "") + getattr(result, "last_name", "") response = await generate_key_helper_fn( - **{"duration": "1hr", "key_max_budget": 0, "models": [], "aliases": {}, "config": {}, "spend": 0, "user_id": user_id, "team_id": "litellm-dashboard", "user_email": user_email} # type: ignore + **{"duration": "1hr", "key_max_budget": 0.01, "models": [], "aliases": {}, "config": {}, "spend": 0, "user_id": user_id, "team_id": "litellm-dashboard", "user_email": user_email} # type: ignore ) key = response["token"] # type: ignore user_id = response["user_id"] # type: ignore diff --git a/litellm/proxy/schema.prisma b/litellm/proxy/schema.prisma index 5a57b8808..101cf9b7f 100644 --- a/litellm/proxy/schema.prisma +++ b/litellm/proxy/schema.prisma @@ -24,6 +24,8 @@ model LiteLLM_TeamTable { budget_reset_at DateTime? created_at DateTime @default(now()) @map("created_at") updated_at DateTime @default(now()) @updatedAt @map("updated_at") + model_spend Json @default("{}") + model_max_budget Json @default("{}") } // Track spend, rate limit, budget Users @@ -41,6 +43,8 @@ model LiteLLM_UserTable { budget_duration String? budget_reset_at DateTime? allowed_cache_controls String[] @default([]) + model_spend Json @default("{}") + model_max_budget Json @default("{}") } // Generate Tokens for Proxy @@ -64,6 +68,8 @@ model LiteLLM_VerificationToken { budget_duration String? budget_reset_at DateTime? 
allowed_cache_controls String[] @default([]) + model_spend Json @default("{}") + model_max_budget Json @default("{}") } // store proxy config.yaml diff --git a/litellm/proxy/utils.py b/litellm/proxy/utils.py index 7cc0f59f1..1cdacf76f 100644 --- a/litellm/proxy/utils.py +++ b/litellm/proxy/utils.py @@ -1379,19 +1379,22 @@ async def _read_request_body(request): """ import ast, json - request_data = {} - if request is None: - return request_data - body = await request.body() - - if body == b"" or body is None: - return request_data - body_str = body.decode() try: - request_data = ast.literal_eval(body_str) + request_data = {} + if request is None: + return request_data + body = await request.body() + + if body == b"" or body is None: + return request_data + body_str = body.decode() + try: + request_data = ast.literal_eval(body_str) + except: + request_data = json.loads(body_str) + return request_data except: - request_data = json.loads(body_str) - return request_data + return {} def _is_valid_team_configs(team_id=None, team_config=None, request_data=None): @@ -1408,6 +1411,22 @@ def _is_valid_team_configs(team_id=None, team_config=None, request_data=None): return +def _is_user_proxy_admin(user_id_information=None): + if ( + user_id_information == None + or len(user_id_information) == 0 + or user_id_information[0] == None + ): + return False + _user = user_id_information[0] + if ( + _user.get("user_role", None) is not None + and _user.get("user_role") == "proxy_admin" + ): + return True + return False + + # LiteLLM Admin UI - Non SSO Login html_form = """ diff --git a/litellm/tests/test_completion.py b/litellm/tests/test_completion.py index 475364bfa..f2186093a 100644 --- a/litellm/tests/test_completion.py +++ b/litellm/tests/test_completion.py @@ -1912,7 +1912,7 @@ def test_mistral_anyscale_stream(): # test_baseten_wizardLMcompletion_withbase() # def test_baseten_mosaic_ML_completion_withbase(): -# model_name = "31dxrj3" +# model_name = "31dxrj3", # litellm.api_base 
= "https://app.baseten.co" # try: # response = completion(model=model_name, messages=messages) diff --git a/litellm/tests/test_key_generate_prisma.py b/litellm/tests/test_key_generate_prisma.py index 89d4f4d3e..1f5507d3f 100644 --- a/litellm/tests/test_key_generate_prisma.py +++ b/litellm/tests/test_key_generate_prisma.py @@ -1101,6 +1101,116 @@ def test_call_with_key_over_budget(prisma_client): print(vars(e)) +def test_call_with_key_over_model_budget(prisma_client): + # 12. Make a call with a key over budget, expect to fail + setattr(litellm.proxy.proxy_server, "prisma_client", prisma_client) + setattr(litellm.proxy.proxy_server, "master_key", "sk-1234") + try: + + async def test(): + await litellm.proxy.proxy_server.prisma_client.connect() + + # set budget for chatgpt-v-2 to 0.000001, expect the next request to fail + request = GenerateKeyRequest( + max_budget=1000, + model_max_budget={ + "chatgpt-v-2": 0.000001, + }, + metadata={"user_api_key": 0.0001}, + ) + key = await generate_key_fn(request) + print(key) + + generated_key = key.key + user_id = key.user_id + bearer_token = "Bearer " + generated_key + + request = Request(scope={"type": "http"}) + request._url = URL(url="/chat/completions") + + async def return_body(): + return b'{"model": "chatgpt-v-2"}' + + request.body = return_body + + # use generated key to auth in + result = await user_api_key_auth(request=request, api_key=bearer_token) + print("result from user auth with new key", result) + + # update spend using track_cost callback, make 2nd request, it should fail + from litellm.proxy.proxy_server import ( + _PROXY_track_cost_callback as track_cost_callback, + ) + from litellm import ModelResponse, Choices, Message, Usage + from litellm.caching import Cache + + litellm.cache = Cache() + import time + + request_id = f"chatcmpl-e41836bb-bb8b-4df2-8e70-8f3e160155ac{time.time()}" + + resp = ModelResponse( + id=request_id, + choices=[ + Choices( + finish_reason=None, + index=0, + message=Message( + 
content=" Sure! Here is a short poem about the sky:\n\nA canvas of blue, a", + role="assistant", + ), + ) + ], + model="gpt-35-turbo", # azure always has model written like this + usage=Usage(prompt_tokens=210, completion_tokens=200, total_tokens=410), + ) + await track_cost_callback( + kwargs={ + "model": "chatgpt-v-2", + "stream": False, + "litellm_params": { + "metadata": { + "user_api_key": hash_token(generated_key), + "user_api_key_user_id": user_id, + } + }, + "response_cost": 0.00002, + }, + completion_response=resp, + start_time=datetime.now(), + end_time=datetime.now(), + ) + await asyncio.sleep(10) + # test spend_log was written and we can read it + spend_logs = await view_spend_logs(request_id=request_id) + + print("read spend logs", spend_logs) + assert len(spend_logs) == 1 + + spend_log = spend_logs[0] + + assert spend_log.request_id == request_id + assert spend_log.spend == float("2e-05") + assert spend_log.model == "chatgpt-v-2" + assert ( + spend_log.cache_key + == "a61ae14fe4a8b8014a61e6ae01a100c8bc6770ac37c293242afed954bc69207d" + ) + + # use generated key to auth in + result = await user_api_key_auth(request=request, api_key=bearer_token) + print("result from user auth with new key", result) + pytest.fail(f"This should have failed!. 
They key crossed it's budget") + + asyncio.run(test()) + except Exception as e: + # print(f"Error - {str(e)}") + traceback.print_exc() + error_detail = e.message + assert "Authentication Error, ExceededModelBudget:" in error_detail + print(vars(e)) + + @pytest.mark.asyncio() async def test_call_with_key_never_over_budget(prisma_client): # Make a call with a key with budget=None, it should never fail diff --git a/litellm/utils.py b/litellm/utils.py index 194c4e846..faa464448 100644 --- a/litellm/utils.py +++ b/litellm/utils.py @@ -89,7 +89,6 @@ from .exceptions import ( UnprocessableEntityError, ) -verbose_logger.debug(f"sys.path: {sys.path}") try: from .proxy.enterprise.enterprise_callbacks.generic_api_callback import ( GenericAPILogger, diff --git a/pyproject.toml b/pyproject.toml index f44ad2fbb..442c8ed04 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -1,11 +1,16 @@ [tool.poetry] name = "litellm" -version = "1.25.0" +version = "1.25.2" description = "Library to easily interface with LLM API providers" authors = ["BerriAI"] license = "MIT" readme = "README.md" +[tool.poetry.urls] +homepage = "https://litellm.ai" +repository = "https://github.com/BerriAI/litellm" +documentation = "https://docs.litellm.ai" + [tool.poetry.dependencies] python = ">=3.8.1,<4.0, !=3.9.7" openai = ">=1.0.0" @@ -69,7 +74,7 @@ requires = ["poetry-core", "wheel"] build-backend = "poetry.core.masonry.api" [tool.commitizen] -version = "1.25.0" +version = "1.25.2" version_files = [ "pyproject.toml:^version" ] diff --git a/schema.prisma b/schema.prisma index 5a57b8808..101cf9b7f 100644 --- a/schema.prisma +++ b/schema.prisma @@ -24,6 +24,8 @@ model LiteLLM_TeamTable { budget_reset_at DateTime? 
created_at DateTime @default(now()) @map("created_at") updated_at DateTime @default(now()) @updatedAt @map("updated_at") + model_spend Json @default("{}") + model_max_budget Json @default("{}") } // Track spend, rate limit, budget Users @@ -41,6 +43,8 @@ model LiteLLM_UserTable { budget_duration String? budget_reset_at DateTime? allowed_cache_controls String[] @default([]) + model_spend Json @default("{}") + model_max_budget Json @default("{}") } // Generate Tokens for Proxy @@ -64,6 +68,8 @@ model LiteLLM_VerificationToken { budget_duration String? budget_reset_at DateTime? allowed_cache_controls String[] @default([]) + model_spend Json @default("{}") + model_max_budget Json @default("{}") } // store proxy config.yaml diff --git a/ui/litellm-dashboard/out/404.html b/ui/litellm-dashboard/out/404.html index 03563194a..0a15886c7 100644 --- a/ui/litellm-dashboard/out/404.html +++ b/ui/litellm-dashboard/out/404.html @@ -1 +1 @@ -404: This page could not be found.🚅 LiteLLM

404

This page could not be found.

\ No newline at end of file +404: This page could not be found.🚅 LiteLLM

404

This page could not be found.

\ No newline at end of file diff --git a/ui/litellm-dashboard/out/_next/static/unBuvDqydg0yodtP5c3nQ/_buildManifest.js b/ui/litellm-dashboard/out/_next/static/S_8LZOnl2nyURq-NYnh2p/_buildManifest.js similarity index 100% rename from ui/litellm-dashboard/out/_next/static/unBuvDqydg0yodtP5c3nQ/_buildManifest.js rename to ui/litellm-dashboard/out/_next/static/S_8LZOnl2nyURq-NYnh2p/_buildManifest.js diff --git a/ui/litellm-dashboard/out/_next/static/unBuvDqydg0yodtP5c3nQ/_ssgManifest.js b/ui/litellm-dashboard/out/_next/static/S_8LZOnl2nyURq-NYnh2p/_ssgManifest.js similarity index 100% rename from ui/litellm-dashboard/out/_next/static/unBuvDqydg0yodtP5c3nQ/_ssgManifest.js rename to ui/litellm-dashboard/out/_next/static/S_8LZOnl2nyURq-NYnh2p/_ssgManifest.js diff --git a/ui/litellm-dashboard/out/_next/static/chunks/app/page-2322bcdc2ec71284.js b/ui/litellm-dashboard/out/_next/static/chunks/app/page-2322bcdc2ec71284.js new file mode 100644 index 000000000..740eb87a2 --- /dev/null +++ b/ui/litellm-dashboard/out/_next/static/chunks/app/page-2322bcdc2ec71284.js @@ -0,0 +1 @@ +(self.webpackChunk_N_E=self.webpackChunk_N_E||[]).push([[931],{20661:function(e,t,n){Promise.resolve().then(n.bind(n,48016))},48016:function(e,t,n){"use strict";n.r(t),n.d(t,{default:function(){return ec}});var s=n(3827),l=n(64090),r=n(47907),a=n(8792),o=n(2179),i=e=>{let{userID:t,userRole:n,userEmail:l}=e;return console.log("User ID:",t),console.log("userEmail:",l),(0,s.jsxs)("nav",{className:"left-0 right-0 top-0 flex justify-between items-center h-12 mb-4",children:[(0,s.jsx)("div",{className:"text-left mx-4 my-2 absolute top-0 left-0",children:(0,s.jsx)("div",{className:"flex flex-col items-center",children:(0,s.jsx)(a.default,{href:"/",children:(0,s.jsx)("button",{className:"text-gray-800 text-2xl px-4 py-1 rounded text-center",children:"\uD83D\uDE85 LiteLLM"})})})}),(0,s.jsx)("div",{className:"text-right mx-4 my-2 absolute top-0 
right-0",children:(0,s.jsxs)(o.Z,{variant:"secondary",children:[l,(0,s.jsxs)("p",{children:["Role: ",n]}),(0,s.jsxs)("p",{children:["ID: ",t]})]})})]})},c=n(80588);let d=async(e,t,n)=>{try{if(console.log("Form Values in keyCreateCall:",n),n.description&&(n.metadata||(n.metadata={}),n.metadata.description=n.description,delete n.description,n.metadata=JSON.stringify(n.metadata)),n.metadata){console.log("formValues.metadata:",n.metadata);try{n.metadata=JSON.parse(n.metadata)}catch(e){throw c.ZP.error("Failed to parse metadata: "+e),Error("Failed to parse metadata: "+e)}}console.log("Form Values after check:",n);let s=await fetch("/key/generate",{method:"POST",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"},body:JSON.stringify({user_id:t,...n})});if(!s.ok){let e=await s.text();throw c.ZP.error("Failed to create key: "+e),console.error("Error response from the server:",e),Error("Network response was not ok")}let l=await s.json();return console.log("API Response:",l),l}catch(e){throw console.error("Failed to create key:",e),e}},m=async(e,t)=>{try{console.log("in keyDeleteCall:",t),c.ZP.info("Making key delete request");let n=await fetch("/key/delete",{method:"POST",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"},body:JSON.stringify({keys:[t]})});if(!n.ok){let e=await n.text();throw c.ZP.error("Failed to delete key: "+e),Error("Network response was not ok")}let s=await n.json();return console.log(s),c.ZP.success("API Key Deleted"),s}catch(e){throw console.error("Failed to create key:",e),e}},h=async(e,t,n)=>{try{let s="/user/info";"App Owner"==n&&(s="".concat(s,"/?user_id=").concat(t)),c.ZP.info("Requesting user data");let l=await fetch(s,{method:"GET",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"}});if(!l.ok){let e=await l.text();throw c.ZP.error(e),Error("Network response was not ok")}let r=await l.json();return c.ZP.info("Received user data"),r}catch(e){throw 
console.error("Failed to create key:",e),e}},u=async(e,t,n)=>{try{c.ZP.info("Requesting model data");let t=await fetch("/model/info",{method:"GET",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"}});if(!t.ok){let e=await t.text();throw c.ZP.error(e),Error("Network response was not ok")}let n=await t.json();return c.ZP.info("Received model data"),n}catch(e){throw console.error("Failed to create key:",e),e}},x=async(e,t)=>{try{let n="/spend/logs";console.log("in keySpendLogsCall:",n);let s=await fetch("".concat(n,"/?api_key=").concat(t),{method:"GET",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"}});if(!s.ok){let e=await s.text();throw c.ZP.error(e),Error("Network response was not ok")}let l=await s.json();return console.log(l),l}catch(e){throw console.error("Failed to create key:",e),e}},p=async(e,t,n,s,l,r)=>{try{let t="/spend/logs";t="App Owner"==n?"".concat(t,"/?user_id=").concat(s,"&start_date=").concat(l,"&end_date=").concat(r):"".concat(t,"/?start_date=").concat(l,"&end_date=").concat(r),c.ZP.info("Making spend logs request");let a=await fetch(t,{method:"GET",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"}});if(!a.ok){let e=await a.text();throw c.ZP.error(e),Error("Network response was not ok")}let o=await a.json();return console.log(o),c.ZP.success("Spend Logs received"),o}catch(e){throw console.error("Failed to create key:",e),e}},j=async(e,t)=>{try{let n=await fetch("/v2/key/info",{method:"POST",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"},body:JSON.stringify({keys:t})});if(!n.ok){let e=await n.text();throw c.ZP.error(e),Error("Network response was not ok")}let s=await n.json();return console.log(s),s}catch(e){throw console.error("Failed to create key:",e),e}},g=async(e,t)=>{try{let n="/spend/users";console.log("in spendUsersCall:",n);let s=await fetch("".concat(n,"/?user_id=").concat(t),{method:"GET",headers:{Authorization:"Bearer 
".concat(e),"Content-Type":"application/json"}});if(!s.ok){let e=await s.text();throw c.ZP.error(e),Error("Network response was not ok")}let l=await s.json();return console.log(l),l}catch(e){throw console.error("Failed to get spend for user",e),e}};var y=n(10384),f=n(46453),Z=n(71801),w=n(13969),k=n(12143),_=n(77171),v=n(29714),b=n(88707),S=n(1861);let{Option:N}=w.default;var I=e=>{let{userID:t,userRole:n,accessToken:r,data:a,userModels:i,setData:m}=e,[h]=k.Z.useForm(),[u,x]=(0,l.useState)(!1),[p,j]=(0,l.useState)(null),g=()=>{x(!1),h.resetFields()},I=()=>{x(!1),j(null),h.resetFields()},A=async e=>{try{c.ZP.info("Making API Call"),x(!0);let n=await d(r,t,e);m(e=>e?[...e,n]:[n]),j(n.key),c.ZP.success("API Key Created"),h.resetFields(),localStorage.removeItem("userData"+t)}catch(e){console.error("Error creating the key:",e)}};return(0,s.jsxs)("div",{children:[(0,s.jsx)(o.Z,{className:"mx-auto",onClick:()=>x(!0),children:"+ Create New Key"}),(0,s.jsx)(_.Z,{title:"Create Key",visible:u,width:800,footer:null,onOk:g,onCancel:I,children:(0,s.jsxs)(k.Z,{form:h,onFinish:A,labelCol:{span:6},wrapperCol:{span:16},labelAlign:"left",children:["App Owner"===n||"Admin"===n?(0,s.jsxs)(s.Fragment,{children:[(0,s.jsx)(k.Z.Item,{label:"Key Name",name:"key_alias",children:(0,s.jsx)(v.Z,{})}),(0,s.jsx)(k.Z.Item,{label:"Team ID",name:"team_id",children:(0,s.jsx)(v.Z,{placeholder:"ai_team"})}),(0,s.jsx)(k.Z.Item,{label:"Models",name:"models",children:(0,s.jsx)(w.default,{mode:"multiple",placeholder:"Select models",style:{width:"100%"},children:i.map(e=>(0,s.jsx)(N,{value:e,children:e},e))})}),(0,s.jsx)(k.Z.Item,{label:"Max Budget (USD)",name:"max_budget",children:(0,s.jsx)(b.Z,{step:.01,precision:2,width:200})}),(0,s.jsx)(k.Z.Item,{label:"Duration (eg: 30s, 30h, 30d)",name:"duration",children:(0,s.jsx)(v.Z,{})}),(0,s.jsx)(k.Z.Item,{label:"Metadata",name:"metadata",children:(0,s.jsx)(v.Z.TextArea,{rows:4,placeholder:"Enter metadata as 
JSON"})})]}):(0,s.jsxs)(s.Fragment,{children:[(0,s.jsx)(k.Z.Item,{label:"Key Name",name:"key_alias",children:(0,s.jsx)(v.Z,{})}),(0,s.jsx)(k.Z.Item,{label:"Team ID (Contact Group)",name:"team_id",children:(0,s.jsx)(v.Z,{placeholder:"ai_team"})}),(0,s.jsx)(k.Z.Item,{label:"Description",name:"description",children:(0,s.jsx)(v.Z.TextArea,{placeholder:"Enter description",rows:4})})]}),(0,s.jsx)("div",{style:{textAlign:"right",marginTop:"10px"},children:(0,s.jsx)(S.ZP,{htmlType:"submit",children:"Create Key"})})]})}),p&&(0,s.jsx)(_.Z,{title:"Save your key",visible:u,onOk:g,onCancel:I,footer:null,children:(0,s.jsxs)(f.Z,{numItems:1,className:"gap-2 w-full",children:[(0,s.jsx)(y.Z,{numColSpan:1,children:(0,s.jsxs)("p",{children:["Please save this secret key somewhere safe and accessible. For security reasons, ",(0,s.jsx)("b",{children:"you will not be able to view it again"})," ","through your LiteLLM account. If you lose this secret key, you will need to generate a new one."]})}),(0,s.jsx)(y.Z,{numColSpan:1,children:null!=p?(0,s.jsxs)(Z.Z,{children:["API Key: ",p]}):(0,s.jsx)(Z.Z,{children:"Key being created, this might take 30s"})})]})})]})},A=n(33393),C=n(13810),D=n(61244),T=n(10827),P=n(3851),E=n(2044),O=n(64167),R=n(74480),M=n(7178),U=n(42440),F=n(9853),L=n(67989),K=n(56863),z=e=>{let{token:t,accessToken:n,keySpend:r,keyBudget:a,keyName:i}=e,[c,d]=(0,l.useState)(!1),[m,h]=(0,l.useState)(null),[u,p]=(0,l.useState)(null),j=async()=>{try{if(null==n||null==t)return;console.log("accessToken: ".concat(n,"; token: ").concat(t));let e=await x(n,t);console.log("Response:",e);let s=Object.values(e).reduce((e,t)=>{let n=new Date(t.startTime),s=new Intl.DateTimeFormat("en-US",{day:"2-digit",month:"short"}).format(n);return e[s]=(e[s]||0)+t.spend,e},{}),l=Object.entries(s);l.sort((e,t)=>{let[n]=e,[s]=t,l=new Date(n),r=new Date(s);return l.getTime()-r.getTime()});let r=Object.fromEntries(l);console.log(r);let a=Object.values(e).reduce((e,t)=>{let n=t.user;return 
e[n]=(e[n]||0)+t.spend,e},{});console.log(s),console.log(a);let o=[];for(let[e,t]of Object.entries(r))o.push({day:e,spend:t});let i=Object.entries(a).sort((e,t)=>t[1]-e[1]).slice(0,5).map(e=>{let[t,n]=e;return{name:t,value:n}});h(o),p(i),console.log("arrayBarChart:",o)}catch(e){console.error("There was an error fetching the data",e)}};return t?(0,s.jsxs)("div",{children:[(0,s.jsx)(o.Z,{className:"mx-auto",onClick:()=>{console.log("Show Modal triggered"),d(!0),j()},children:"View Spend Report"}),(0,s.jsxs)(_.Z,{visible:c,width:1e3,onOk:()=>{d(!1)},onCancel:()=>{d(!1)},footer:null,children:[(0,s.jsxs)(U.Z,{style:{textAlign:"left"},children:["Key Name: ",i]}),(0,s.jsxs)(K.Z,{children:["Monthly Spend $",r]}),(0,s.jsx)(C.Z,{className:"mt-6 mb-6",children:m&&(0,s.jsx)(F.Z,{className:"mt-6",data:m,colors:["green"],index:"day",categories:["spend"],yAxisWidth:48})}),(0,s.jsx)(U.Z,{className:"mt-6",children:"Top 5 Users Spend (USD)"}),(0,s.jsx)(C.Z,{className:"mb-6",children:u&&(0,s.jsx)(L.Z,{className:"mt-6",data:u,color:"teal"})})]})]}):null},B=e=>{let{userID:t,accessToken:n,data:r,setData:a}=e,[i,c]=(0,l.useState)(!1),[d,h]=(0,l.useState)(!1),[u,x]=(0,l.useState)(null),p=async e=>{null!=r&&(x(e),localStorage.removeItem("userData"+t),h(!0))},j=async()=>{if(null!=u&&null!=r){try{await m(n,u);let e=r.filter(e=>e.token!==u);a(e)}catch(e){console.error("Error deleting the key:",e)}h(!1),x(null)}};if(null!=r)return console.log("RERENDER TRIGGERED"),(0,s.jsxs)(C.Z,{className:"w-full mx-auto flex-auto overflow-y-auto max-h-[50vh] mb-4",children:[(0,s.jsx)(U.Z,{children:"API Keys"}),(0,s.jsxs)(T.Z,{className:"mt-5",children:[(0,s.jsx)(O.Z,{children:(0,s.jsxs)(M.Z,{children:[(0,s.jsx)(R.Z,{children:"Key Alias"}),(0,s.jsx)(R.Z,{children:"Secret Key"}),(0,s.jsx)(R.Z,{children:"Spend (USD)"}),(0,s.jsx)(R.Z,{children:"Key Budget (USD)"}),(0,s.jsx)(R.Z,{children:"Team ID"}),(0,s.jsx)(R.Z,{children:"Metadata"}),(0,s.jsx)(R.Z,{children:"Models"}),(0,s.jsx)(R.Z,{children:"TPM / RPM 
Limits"}),(0,s.jsx)(R.Z,{children:"Expires"})]})}),(0,s.jsx)(P.Z,{children:r.map(e=>(console.log(e),"litellm-dashboard"===e.team_id)?null:(0,s.jsxs)(M.Z,{children:[(0,s.jsx)(E.Z,{children:null!=e.key_alias?(0,s.jsx)(Z.Z,{children:e.key_alias}):(0,s.jsx)(Z.Z,{children:"Not Set"})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(Z.Z,{children:e.key_name})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(Z.Z,{children:e.spend})}),(0,s.jsx)(E.Z,{children:null!=e.max_budget?(0,s.jsx)(Z.Z,{children:e.max_budget}):(0,s.jsx)(Z.Z,{children:"Unlimited Budget"})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(Z.Z,{children:e.team_id})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(Z.Z,{children:JSON.stringify(e.metadata)})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(Z.Z,{children:JSON.stringify(e.models)})}),(0,s.jsx)(E.Z,{children:(0,s.jsxs)(Z.Z,{children:["TPM Limit: ",e.tpm_limit?e.tpm_limit:"Unlimited"," ",(0,s.jsx)("br",{})," RPM Limit:"," ",e.rpm_limit?e.rpm_limit:"Unlimited"]})}),(0,s.jsx)(E.Z,{children:null!=e.expires?(0,s.jsx)(Z.Z,{children:e.expires}):(0,s.jsx)(Z.Z,{children:"Never expires"})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(D.Z,{onClick:()=>p(e.token),icon:A.Z,size:"sm"})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(z,{token:e.token,accessToken:n,keySpend:e.spend,keyBudget:e.max_budget,keyName:e.key_name})})]},e.token))})]}),d&&(0,s.jsx)("div",{className:"fixed z-10 inset-0 overflow-y-auto",children:(0,s.jsxs)("div",{className:"flex items-end justify-center min-h-screen pt-4 px-4 pb-20 text-center sm:block sm:p-0",children:[(0,s.jsx)("div",{className:"fixed inset-0 transition-opacity","aria-hidden":"true",children:(0,s.jsx)("div",{className:"absolute inset-0 bg-gray-500 opacity-75"})}),(0,s.jsx)("span",{className:"hidden sm:inline-block sm:align-middle sm:h-screen","aria-hidden":"true",children:"​"}),(0,s.jsxs)("div",{className:"inline-block align-bottom bg-white rounded-lg text-left overflow-hidden shadow-xl transform transition-all sm:my-8 sm:align-middle sm:max-w-lg sm:w-full",children:[(0,s.jsx)("div",{className:"bg-white 
px-4 pt-5 pb-4 sm:p-6 sm:pb-4",children:(0,s.jsx)("div",{className:"sm:flex sm:items-start",children:(0,s.jsxs)("div",{className:"mt-3 text-center sm:mt-0 sm:ml-4 sm:text-left",children:[(0,s.jsx)("h3",{className:"text-lg leading-6 font-medium text-gray-900",children:"Delete Key"}),(0,s.jsx)("div",{className:"mt-2",children:(0,s.jsx)("p",{className:"text-sm text-gray-500",children:"Are you sure you want to delete this key ?"})})]})})}),(0,s.jsxs)("div",{className:"bg-gray-50 px-4 py-3 sm:px-6 sm:flex sm:flex-row-reverse",children:[(0,s.jsx)(o.Z,{onClick:j,color:"red",className:"ml-2",children:"Delete"}),(0,s.jsx)(o.Z,{onClick:()=>{h(!1),x(null)},children:"Cancel"})]})]})]})})]})},J=e=>{let{userID:t,userSpendData:n,userRole:r,accessToken:a}=e;console.log("User SpendData:",n);let[o,i]=(0,l.useState)(null==n?void 0:n.spend),[c,d]=(0,l.useState)((null==n?void 0:n.max_budget)||null);return(0,l.useEffect)(()=>{(async()=>{if("Admin"===r)try{let e=await g(a,"litellm-proxy-budget");console.log("Result from callSpendUsers:",e);let t=e[0];i(null==t?void 0:t.spend),d((null==t?void 0:t.max_budget)||null)}catch(e){console.error("Failed to get spend for user",e)}})()},[r,a,t]),(0,s.jsx)(s.Fragment,{children:(0,s.jsxs)(C.Z,{className:"mx-auto mb-4",children:[(0,s.jsxs)(K.Z,{children:["$",o]}),(0,s.jsxs)(U.Z,{children:["/ ",null!==c?"$".concat(c," limit"):"No limit"]})]})})},q=n(37963);console.log("isLocal:",!1);var G=e=>{let{userID:t,userRole:n,setUserRole:a,userEmail:o,setUserEmail:i}=e,[c,d]=(0,l.useState)(null),[m,x]=(0,l.useState)(null),p=(0,r.useSearchParams)();p.get("viewSpend"),(0,r.useRouter)();let j=p.get("token"),[g,Z]=(0,l.useState)(null),[w,k]=(0,l.useState)([]);if(window.addEventListener("beforeunload",function(){sessionStorage.clear()}),(0,l.useEffect)(()=>{if(j){let e=(0,q.o)(j);if(e){if(console.log("Decoded token:",e),console.log("Decoded key:",e.key),Z(e.key),e.user_role){let t=function(e){if(!e)return"Undefined Role";switch(console.log("Received user role: 
".concat(e)),e.toLowerCase()){case"app_owner":case"demo_app_owner":return"App Owner";case"app_admin":return"Admin";case"app_user":return"App User";default:return"Unknown Role"}}(e.user_role);console.log("Decoded user_role:",t),a(t)}else console.log("User role not defined");e.user_email?i(e.user_email):console.log("User Email is not set ".concat(e))}}if(t&&g&&n&&!c){let e=sessionStorage.getItem("userData"+t),s=sessionStorage.getItem("userSpendData"+t),l=sessionStorage.getItem("userModels"+t);e&&s&&l?(d(JSON.parse(e)),x(JSON.parse(s)),k(JSON.parse(l))):(async()=>{try{let e=await h(g,t,n);x(e.user_info),d(e.keys),sessionStorage.setItem("userData"+t,JSON.stringify(e.keys)),sessionStorage.setItem("userSpendData"+t,JSON.stringify(e.user_info));let s=await u(g,t,n);console.log("model_info:",s);let l=s.data.map(e=>e.model_name);console.log("available_model_names:",l),k(l),console.log("userModels:",w),sessionStorage.setItem("userModels"+t,JSON.stringify(l))}catch(e){console.error("There was an error fetching the data",e)}})()}},[t,j,g,c,n]),null==t||null==j){let e="/sso/key/generate";return console.log("Full URL:",e),window.location.href=e,null}return null==g?null:(null==n&&a("App Owner"),(0,s.jsx)("div",{children:(0,s.jsx)(f.Z,{numItems:1,className:"gap-0 p-10 h-[75vh] w-full",children:(0,s.jsxs)(y.Z,{numColSpan:1,children:[(0,s.jsx)(J,{userID:t,userSpendData:m,userRole:n,accessToken:g}),(0,s.jsx)(B,{userID:t,accessToken:g,data:c,setData:d}),(0,s.jsx)(I,{userID:t,userRole:n,userModels:w,accessToken:g,data:c,setData:d})]})})}))},$=e=>{let{accessToken:t,token:n,userRole:r,userID:a}=e,[o,i]=(0,l.useState)({data:[]});if((0,l.useEffect)(()=>{if(!t||!n||!r||!a)return;let e=async()=>{try{let e=await u(t,a,r);console.log("Model data response:",e.data),i(e)}catch(e){console.error("There was an error fetching the model data",e)}};t&&n&&r&&a&&e()},[t,n,r,a]),!o)return(0,s.jsx)("div",{children:"Loading..."});for(let 
e=0;e(0,s.jsxs)(M.Z,{children:[(0,s.jsx)(E.Z,{children:(0,s.jsx)(U.Z,{children:e.model_name})}),(0,s.jsx)(E.Z,{children:e.provider}),(0,s.jsx)(E.Z,{children:e.input_cost}),(0,s.jsx)(E.Z,{children:e.output_cost}),(0,s.jsx)(E.Z,{children:e.max_tokens})]},e.model_name))})]})})})})},V=n(92836),W=n(26734),H=n(41608),Y=n(32126),X=n(23682),Q=n(12968),ee=n(67951);async function et(e,t,n,s){console.log("isLocal:",!1);let l=window.location.origin,r=new Q.ZP.OpenAI({apiKey:s,baseURL:l,dangerouslyAllowBrowser:!0});for await(let s of(await r.chat.completions.create({model:n,stream:!0,messages:[{role:"user",content:e}]})))console.log(s),s.choices[0].delta.content&&t(s.choices[0].delta.content)}var en=e=>{let{accessToken:t,token:n,userRole:r,userID:a}=e,[o,i]=(0,l.useState)(""),[c,d]=(0,l.useState)([]),[m,h]=(0,l.useState)(void 0),[x,p]=(0,l.useState)(null);(0,l.useEffect)(()=>{t&&n&&r&&a&&(async()=>{let e=await u(t,a,r);console.log("model_info:",e),(null==e?void 0:e.data.length)>0&&(p(e),h(e.data[0].model_name))})()},[t,a,r]);let j=(e,t)=>{d(n=>{let s=n[n.length-1];return s&&s.role===e?[...n.slice(0,n.length-1),{role:e,content:s.content+t}]:[...n,{role:e,content:t}]})},g=async()=>{if(""!==o.trim()&&t&&n&&r&&a){d(e=>[...e,{role:"user",content:o}]);try{m&&await et(o,e=>j("assistant",e),m,t)}catch(e){console.error("Error fetching model response",e),j("assistant","Error fetching model response")}i("")}};return(0,s.jsx)("div",{style:{width:"100%",position:"relative"},children:(0,s.jsx)(f.Z,{className:"gap-2 p-10 h-[75vh] w-full",children:(0,s.jsx)(C.Z,{children:(0,s.jsxs)(W.Z,{children:[(0,s.jsxs)(H.Z,{className:"mt-4",children:[(0,s.jsx)(V.Z,{children:"Chat"}),(0,s.jsx)(V.Z,{children:"API Reference"})]}),(0,s.jsxs)(X.Z,{children:[(0,s.jsxs)(Y.Z,{children:[(0,s.jsxs)("div",{children:[(0,s.jsx)("label",{children:"Select Model:"}),(0,s.jsx)("select",{value:m||"",onChange:e=>h(e.target.value),children:null==x?void 
0:x.data.map(e=>(0,s.jsx)("option",{value:e.model_name,children:e.model_name},e.model_name))})]}),(0,s.jsxs)(T.Z,{className:"mt-5",style:{display:"block",maxHeight:"60vh",overflowY:"auto"},children:[(0,s.jsx)(O.Z,{children:(0,s.jsx)(M.Z,{children:(0,s.jsx)(E.Z,{children:(0,s.jsx)(U.Z,{children:"Chat"})})})}),(0,s.jsx)(P.Z,{children:c.map((e,t)=>(0,s.jsx)(M.Z,{children:(0,s.jsx)(E.Z,{children:"".concat(e.role,": ").concat(e.content)})},t))})]}),(0,s.jsx)("div",{className:"mt-3",style:{position:"absolute",bottom:5,width:"95%"},children:(0,s.jsxs)("div",{className:"flex",children:[(0,s.jsx)("input",{type:"text",value:o,onChange:e=>i(e.target.value),className:"flex-1 p-2 border rounded-md mr-2",placeholder:"Type your message..."}),(0,s.jsx)("button",{onClick:g,className:"p-2 bg-blue-500 text-white rounded-md",children:"Send"})]})})]}),(0,s.jsx)(Y.Z,{children:(0,s.jsxs)(W.Z,{children:[(0,s.jsxs)(H.Z,{children:[(0,s.jsx)(V.Z,{children:"OpenAI Python SDK"}),(0,s.jsx)(V.Z,{children:"LlamaIndex"}),(0,s.jsx)(V.Z,{children:"Langchain Py"})]}),(0,s.jsxs)(X.Z,{children:[(0,s.jsx)(Y.Z,{children:(0,s.jsx)(ee.Z,{language:"python",children:'\nimport openai\nclient = openai.OpenAI(\n api_key="your_api_key",\n base_url="http://0.0.0.0:4000" # proxy base url\n)\n\nresponse = client.chat.completions.create(\n model="gpt-3.5-turbo", # model to use from Models Tab\n messages = [\n {\n "role": "user",\n "content": "this is a test request, write a short poem"\n }\n ],\n extra_body={\n "metadata": {\n "generation_name": "ishaan-generation-openai-client",\n "generation_id": "openai-client-gen-id22",\n "trace_id": "openai-client-trace-id22",\n "trace_user_id": "openai-client-user-id2"\n }\n }\n)\n\nprint(response)\n '})}),(0,s.jsx)(Y.Z,{children:(0,s.jsx)(ee.Z,{language:"python",children:'\nimport os, dotenv\n\nfrom llama_index.llms import AzureOpenAI\nfrom llama_index.embeddings import AzureOpenAIEmbedding\nfrom llama_index import VectorStoreIndex, SimpleDirectoryReader, 
ServiceContext\n\nllm = AzureOpenAI(\n engine="azure-gpt-3.5", # model_name on litellm proxy\n temperature=0.0,\n azure_endpoint="http://0.0.0.0:4000", # litellm proxy endpoint\n api_key="sk-1234", # litellm proxy API Key\n api_version="2023-07-01-preview",\n)\n\nembed_model = AzureOpenAIEmbedding(\n deployment_name="azure-embedding-model",\n azure_endpoint="http://0.0.0.0:4000",\n api_key="sk-1234",\n api_version="2023-07-01-preview",\n)\n\n\ndocuments = SimpleDirectoryReader("llama_index_data").load_data()\nservice_context = ServiceContext.from_defaults(llm=llm, embed_model=embed_model)\nindex = VectorStoreIndex.from_documents(documents, service_context=service_context)\n\nquery_engine = index.as_query_engine()\nresponse = query_engine.query("What did the author do growing up?")\nprint(response)\n\n '})}),(0,s.jsx)(Y.Z,{children:(0,s.jsx)(ee.Z,{language:"python",children:'\nfrom langchain.chat_models import ChatOpenAI\nfrom langchain.prompts.chat import (\n ChatPromptTemplate,\n HumanMessagePromptTemplate,\n SystemMessagePromptTemplate,\n)\nfrom langchain.schema import HumanMessage, SystemMessage\n\nchat = ChatOpenAI(\n openai_api_base="http://0.0.0.0:8000",\n model = "gpt-3.5-turbo",\n temperature=0.1,\n extra_body={\n "metadata": {\n "generation_name": "ishaan-generation-langchain-client",\n "generation_id": "langchain-client-gen-id22",\n "trace_id": "langchain-client-trace-id22",\n "trace_user_id": "langchain-client-user-id2"\n }\n }\n)\n\nmessages = [\n SystemMessage(\n content="You are a helpful assistant that im using to make a test request to."\n ),\n HumanMessage(\n content="test from litellm. 
tell me why it\'s amazing in 1 sentence"\n ),\n]\nresponse = chat(messages)\n\nprint(response)\n\n '})})]})]})})]})]})})})})},es=n(33509),el=n(30569);let{Sider:er}=es.default;var ea=e=>{let{setPage:t}=e;return(0,s.jsx)(es.default,{style:{minHeight:"100vh",maxWidth:"120px"},children:(0,s.jsx)(er,{width:120,children:(0,s.jsxs)(el.Z,{mode:"inline",defaultSelectedKeys:["1"],style:{height:"100%",borderRight:0},children:[(0,s.jsx)(el.Z.Item,{onClick:()=>t("api-keys"),children:"API Keys"},"1"),(0,s.jsx)(el.Z.Item,{onClick:()=>t("models"),children:"Models"},"2"),(0,s.jsx)(el.Z.Item,{onClick:()=>t("llm-playground"),children:"Chat UI"},"3"),(0,s.jsx)(el.Z.Item,{onClick:()=>t("usage"),children:"Usage"},"4")]})})})};let eo=e=>{let{payload:t,active:n}=e;if(!n||!t)return null;let l=t[0].payload,r=l.startTime,a=Object.entries(l.models).map(e=>{let[t,n]=e;return[t,n]});a.sort((e,t)=>t[1]-e[1]);let o=a.slice(0,5);return(0,s.jsxs)("div",{className:"w-56 rounded-tremor-default border border-tremor-border bg-tremor-background p-2 text-tremor-default shadow-tremor-dropdown",children:[r,o.map(e=>{let[t,n]=e;return(0,s.jsx)("div",{className:"flex flex-1 space-x-10",children:(0,s.jsx)("div",{className:"p-2",children:(0,s.jsxs)("p",{className:"text-tremor-content text-xs",children:[t,":",(0,s.jsxs)("span",{className:"text-xs text-tremor-content-emphasis",children:[" ",n?n<.01?"<$0.01":n.toFixed(2):""]})]})})},t)})]})};var ei=e=>{let{accessToken:t,token:n,userRole:r,userID:a}=e,o=new Date,[i,c]=(0,l.useState)([]),[d,m]=(0,l.useState)([]),[h,u]=(0,l.useState)([]),x=new Date(o.getFullYear(),o.getMonth(),1),g=new Date(o.getFullYear(),o.getMonth()+1,0),Z=k(x),w=k(g);function k(e){let t=e.getFullYear(),n=e.getMonth()+1,s=e.getDate();return"".concat(t,"-").concat(n<10?"0"+n:n,"-").concat(s<10?"0"+s:s)}return console.log("Start date is ".concat(Z)),console.log("End date is ".concat(w)),(0,l.useEffect)(()=>{t&&n&&r&&a&&(async()=>{try{await p(t,n,r,a,Z,w).then(async e=>{let n=(await 
j(t,function(e){let t=[];e.forEach(e=>{Object.entries(e).forEach(e=>{let[n,s]=e;"spend"!==n&&"startTime"!==n&&"models"!==n&&"users"!==n&&t.push({key:n,spend:s})})}),t.sort((e,t)=>Number(t.spend)-Number(e.spend));let n=t.slice(0,5).map(e=>e.key);return console.log("topKeys: ".concat(Object.keys(n[0]))),n}(e))).info.map(e=>({key:(e.key_name||e.key_alias||e.token).substring(0,7),spend:e.spend}));m(n),u(function(e){let t={};e.forEach(e=>{Object.entries(e.users).forEach(e=>{let[n,s]=e;""!==n&&null!=n&&"None"!=n&&(t[n]||(t[n]=0),t[n]+=s)})});let n=Object.entries(t).map(e=>{let[t,n]=e;return{user_id:t,spend:n}});n.sort((e,t)=>t.spend-e.spend);let s=n.slice(0,5);return console.log("topKeys: ".concat(Object.values(s[0]))),s}(e)),c(e)})}catch(e){console.error("There was an error fetching the data",e)}})()},[t,n,r,a,Z,w]),(0,s.jsx)("div",{style:{width:"100%"},children:(0,s.jsxs)(f.Z,{numItems:2,className:"gap-2 p-10 h-[75vh] w-full",children:[(0,s.jsx)(y.Z,{numColSpan:2,children:(0,s.jsxs)(C.Z,{children:[(0,s.jsx)(U.Z,{children:"Monthly Spend"}),(0,s.jsx)(F.Z,{data:i,index:"startTime",categories:["spend"],colors:["blue"],valueFormatter:e=>"$ ".concat(new Intl.NumberFormat("us").format(e).toString()),yAxisWidth:100,tickGap:5,customTooltip:eo})]})}),(0,s.jsx)(y.Z,{numColSpan:1,children:(0,s.jsxs)(C.Z,{children:[(0,s.jsx)(U.Z,{children:"Top API Keys"}),(0,s.jsx)(F.Z,{className:"mt-4 h-40",data:d,index:"key",categories:["spend"],colors:["blue"],yAxisWidth:80,tickGap:5,layout:"vertical",showXAxis:!1,showLegend:!1})]})}),(0,s.jsx)(y.Z,{numColSpan:1,children:(0,s.jsxs)(C.Z,{children:[(0,s.jsx)(U.Z,{children:"Top Users"}),(0,s.jsx)(F.Z,{className:"mt-4 
h-40",data:h,index:"user_id",categories:["spend"],colors:["blue"],yAxisWidth:200,layout:"vertical",showXAxis:!1,showLegend:!1})]})})]})})},ec=()=>{let[e,t]=(0,l.useState)(null),[n,a]=(0,l.useState)(null),o=(0,r.useSearchParams)(),c=o.get("userID"),d=o.get("token"),[m,h]=(0,l.useState)("api-keys"),[u,x]=(0,l.useState)(null);return(0,l.useEffect)(()=>{if(d){let e=(0,q.o)(d);if(e){if(console.log("Decoded token:",e),console.log("Decoded key:",e.key),x(e.key),e.user_role){let n=function(e){if(!e)return"Undefined Role";switch(console.log("Received user role: ".concat(e)),e.toLowerCase()){case"app_owner":case"demo_app_owner":return"App Owner";case"app_admin":return"Admin";case"app_user":return"App User";default:return"Unknown Role"}}(e.user_role);console.log("Decoded user_role:",n),t(n)}else console.log("User role not defined");e.user_email?a(e.user_email):console.log("User Email is not set ".concat(e))}}},[d]),(0,s.jsx)(l.Suspense,{fallback:(0,s.jsx)("div",{children:"Loading..."}),children:(0,s.jsxs)("div",{className:"flex flex-col min-h-screen",children:[(0,s.jsx)(i,{userID:c,userRole:e,userEmail:n}),(0,s.jsxs)("div",{className:"flex flex-1 overflow-auto",children:[(0,s.jsx)(ea,{setPage:h}),"api-keys"==m?(0,s.jsx)(G,{userID:c,userRole:e,setUserRole:t,userEmail:n,setUserEmail:a}):"models"==m?(0,s.jsx)($,{userID:c,userRole:e,token:d,accessToken:u}):"llm-playground"==m?(0,s.jsx)(en,{userID:c,userRole:e,token:d,accessToken:u}):(0,s.jsx)(ei,{userID:c,userRole:e,token:d,accessToken:u})]})]})})}}},function(e){e.O(0,[145,971,69,744],function(){return e(e.s=20661)}),_N_E=e.O()}]); \ No newline at end of file diff --git a/ui/litellm-dashboard/out/_next/static/chunks/app/page-7bb820bd6902dbf2.js b/ui/litellm-dashboard/out/_next/static/chunks/app/page-7bb820bd6902dbf2.js deleted file mode 100644 index 5402c8d1f..000000000 --- a/ui/litellm-dashboard/out/_next/static/chunks/app/page-7bb820bd6902dbf2.js +++ /dev/null @@ -1 +0,0 @@ 
-(self.webpackChunk_N_E=self.webpackChunk_N_E||[]).push([[931],{20661:function(e,t,n){Promise.resolve().then(n.bind(n,48016))},48016:function(e,t,n){"use strict";n.r(t),n.d(t,{default:function(){return ec}});var s=n(3827),l=n(64090),r=n(47907),a=n(8792),o=n(2179),i=e=>{let{userID:t,userRole:n,userEmail:l}=e;return console.log("User ID:",t),console.log("userEmail:",l),(0,s.jsxs)("nav",{className:"left-0 right-0 top-0 flex justify-between items-center h-12 mb-4",children:[(0,s.jsx)("div",{className:"text-left mx-4 my-2 absolute top-0 left-0",children:(0,s.jsx)("div",{className:"flex flex-col items-center",children:(0,s.jsx)(a.default,{href:"/",children:(0,s.jsx)("button",{className:"text-gray-800 text-2xl px-4 py-1 rounded text-center",children:"\uD83D\uDE85 LiteLLM"})})})}),(0,s.jsx)("div",{className:"text-right mx-4 my-2 absolute top-0 right-0",children:(0,s.jsxs)(o.Z,{variant:"secondary",children:[l,(0,s.jsxs)("p",{children:["Role: ",n]}),(0,s.jsxs)("p",{children:["ID: ",t]})]})})]})},c=n(80588);let d=async(e,t,n)=>{try{if(console.log("Form Values in keyCreateCall:",n),n.description&&(n.metadata||(n.metadata={}),n.metadata.description=n.description,delete n.description,n.metadata=JSON.stringify(n.metadata)),n.metadata){console.log("formValues.metadata:",n.metadata);try{n.metadata=JSON.parse(n.metadata)}catch(e){throw c.ZP.error("Failed to parse metadata: "+e),Error("Failed to parse metadata: "+e)}}console.log("Form Values after check:",n);let s=await fetch("/key/generate",{method:"POST",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"},body:JSON.stringify({user_id:t,...n})});if(!s.ok){let e=await s.text();throw c.ZP.error("Failed to create key: "+e),console.error("Error response from the server:",e),Error("Network response was not ok")}let l=await s.json();return console.log("API Response:",l),l}catch(e){throw console.error("Failed to create key:",e),e}},m=async(e,t)=>{try{console.log("in keyDeleteCall:",t),c.ZP.info("Making key delete 
request");let n=await fetch("/key/delete",{method:"POST",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"},body:JSON.stringify({keys:[t]})});if(!n.ok){let e=await n.text();throw c.ZP.error("Failed to delete key: "+e),Error("Network response was not ok")}let s=await n.json();return console.log(s),c.ZP.success("API Key Deleted"),s}catch(e){throw console.error("Failed to create key:",e),e}},h=async(e,t,n)=>{try{let s="/user/info";"App Owner"==n&&(s="".concat(s,"/?user_id=").concat(t)),c.ZP.info("Requesting user data");let l=await fetch(s,{method:"GET",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"}});if(!l.ok){let e=await l.text();throw c.ZP.error(e),Error("Network response was not ok")}let r=await l.json();return c.ZP.info("Received user data"),r}catch(e){throw console.error("Failed to create key:",e),e}},u=async(e,t,n)=>{try{c.ZP.info("Requesting model data");let t=await fetch("/model/info",{method:"GET",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"}});if(!t.ok){let e=await t.text();throw c.ZP.error(e),Error("Network response was not ok")}let n=await t.json();return c.ZP.info("Received model data"),n}catch(e){throw console.error("Failed to create key:",e),e}},x=async(e,t)=>{try{let n="/spend/logs";console.log("in keySpendLogsCall:",n);let s=await fetch("".concat(n,"/?api_key=").concat(t),{method:"GET",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"}});if(!s.ok){let e=await s.text();throw c.ZP.error(e),Error("Network response was not ok")}let l=await s.json();return console.log(l),l}catch(e){throw console.error("Failed to create key:",e),e}},p=async(e,t,n,s,l,r)=>{try{let t="/spend/logs";t="App Owner"==n?"".concat(t,"/?user_id=").concat(s,"&start_date=").concat(l,"&end_date=").concat(r):"".concat(t,"/?start_date=").concat(l,"&end_date=").concat(r),c.ZP.info("Making spend logs request");let a=await fetch(t,{method:"GET",headers:{Authorization:"Bearer 
".concat(e),"Content-Type":"application/json"}});if(!a.ok){let e=await a.text();throw c.ZP.error(e),Error("Network response was not ok")}let o=await a.json();return console.log(o),c.ZP.success("Spend Logs received"),o}catch(e){throw console.error("Failed to create key:",e),e}},j=async(e,t)=>{try{let n=await fetch("/key/info",{method:"POST",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"},body:JSON.stringify({keys:t})});if(!n.ok){let e=await n.text();throw c.ZP.error(e),Error("Network response was not ok")}let s=await n.json();return console.log(s),s}catch(e){throw console.error("Failed to create key:",e),e}},g=async(e,t)=>{try{let n="/spend/users";console.log("in spendUsersCall:",n);let s=await fetch("".concat(n,"/?user_id=").concat(t),{method:"GET",headers:{Authorization:"Bearer ".concat(e),"Content-Type":"application/json"}});if(!s.ok){let e=await s.text();throw c.ZP.error(e),Error("Network response was not ok")}let l=await s.json();return console.log(l),l}catch(e){throw console.error("Failed to get spend for user",e),e}};var y=n(10384),f=n(46453),Z=n(71801),w=n(13969),k=n(12143),_=n(77171),v=n(29714),b=n(88707),S=n(1861);let{Option:N}=w.default;var I=e=>{let{userID:t,userRole:n,accessToken:r,data:a,userModels:i,setData:m}=e,[h]=k.Z.useForm(),[u,x]=(0,l.useState)(!1),[p,j]=(0,l.useState)(null),g=()=>{x(!1),h.resetFields()},I=()=>{x(!1),j(null),h.resetFields()},A=async e=>{try{c.ZP.info("Making API Call"),x(!0);let n=await d(r,t,e);m(e=>e?[...e,n]:[n]),j(n.key),c.ZP.success("API Key Created"),h.resetFields(),localStorage.removeItem("userData"+t)}catch(e){console.error("Error creating the key:",e)}};return(0,s.jsxs)("div",{children:[(0,s.jsx)(o.Z,{className:"mx-auto",onClick:()=>x(!0),children:"+ Create New Key"}),(0,s.jsx)(_.Z,{title:"Create Key",visible:u,width:800,footer:null,onOk:g,onCancel:I,children:(0,s.jsxs)(k.Z,{form:h,onFinish:A,labelCol:{span:6},wrapperCol:{span:16},labelAlign:"left",children:["App 
Owner"===n||"Admin"===n?(0,s.jsxs)(s.Fragment,{children:[(0,s.jsx)(k.Z.Item,{label:"Key Name",name:"key_alias",children:(0,s.jsx)(v.Z,{})}),(0,s.jsx)(k.Z.Item,{label:"Team ID",name:"team_id",children:(0,s.jsx)(v.Z,{placeholder:"ai_team"})}),(0,s.jsx)(k.Z.Item,{label:"Models",name:"models",children:(0,s.jsx)(w.default,{mode:"multiple",placeholder:"Select models",style:{width:"100%"},children:i.map(e=>(0,s.jsx)(N,{value:e,children:e},e))})}),(0,s.jsx)(k.Z.Item,{label:"Max Budget (USD)",name:"max_budget",children:(0,s.jsx)(b.Z,{step:.01,precision:2,width:200})}),(0,s.jsx)(k.Z.Item,{label:"Duration (eg: 30s, 30h, 30d)",name:"duration",children:(0,s.jsx)(v.Z,{})}),(0,s.jsx)(k.Z.Item,{label:"Metadata",name:"metadata",children:(0,s.jsx)(v.Z.TextArea,{rows:4,placeholder:"Enter metadata as JSON"})})]}):(0,s.jsxs)(s.Fragment,{children:[(0,s.jsx)(k.Z.Item,{label:"Key Name",name:"key_alias",children:(0,s.jsx)(v.Z,{})}),(0,s.jsx)(k.Z.Item,{label:"Team ID (Contact Group)",name:"team_id",children:(0,s.jsx)(v.Z,{placeholder:"ai_team"})}),(0,s.jsx)(k.Z.Item,{label:"Description",name:"description",children:(0,s.jsx)(v.Z.TextArea,{placeholder:"Enter description",rows:4})})]}),(0,s.jsx)("div",{style:{textAlign:"right",marginTop:"10px"},children:(0,s.jsx)(S.ZP,{htmlType:"submit",children:"Create Key"})})]})}),p&&(0,s.jsx)(_.Z,{title:"Save your key",visible:u,onOk:g,onCancel:I,footer:null,children:(0,s.jsxs)(f.Z,{numItems:1,className:"gap-2 w-full",children:[(0,s.jsx)(y.Z,{numColSpan:1,children:(0,s.jsxs)("p",{children:["Please save this secret key somewhere safe and accessible. For security reasons, ",(0,s.jsx)("b",{children:"you will not be able to view it again"})," ","through your LiteLLM account. 
If you lose this secret key, you will need to generate a new one."]})}),(0,s.jsx)(y.Z,{numColSpan:1,children:null!=p?(0,s.jsxs)(Z.Z,{children:["API Key: ",p]}):(0,s.jsx)(Z.Z,{children:"Key being created, this might take 30s"})})]})})]})},A=n(33393),C=n(13810),D=n(61244),T=n(10827),P=n(3851),E=n(2044),O=n(64167),R=n(74480),M=n(7178),U=n(42440),F=n(9853),K=n(67989),L=n(56863),z=e=>{let{token:t,accessToken:n,keySpend:r,keyBudget:a,keyName:i}=e,[c,d]=(0,l.useState)(!1),[m,h]=(0,l.useState)(null),[u,p]=(0,l.useState)(null),j=async()=>{try{if(null==n||null==t)return;console.log("accessToken: ".concat(n,"; token: ").concat(t));let e=await x(n,t);console.log("Response:",e);let s=Object.values(e).reduce((e,t)=>{let n=new Date(t.startTime),s=new Intl.DateTimeFormat("en-US",{day:"2-digit",month:"short"}).format(n);return e[s]=(e[s]||0)+t.spend,e},{}),l=Object.entries(s);l.sort((e,t)=>{let[n]=e,[s]=t,l=new Date(n),r=new Date(s);return l.getTime()-r.getTime()});let r=Object.fromEntries(l);console.log(r);let a=Object.values(e).reduce((e,t)=>{let n=t.user;return e[n]=(e[n]||0)+t.spend,e},{});console.log(s),console.log(a);let o=[];for(let[e,t]of Object.entries(r))o.push({day:e,spend:t});let i=Object.entries(a).sort((e,t)=>t[1]-e[1]).slice(0,5).map(e=>{let[t,n]=e;return{name:t,value:n}});h(o),p(i),console.log("arrayBarChart:",o)}catch(e){console.error("There was an error fetching the data",e)}};return t?(0,s.jsxs)("div",{children:[(0,s.jsx)(o.Z,{className:"mx-auto",onClick:()=>{console.log("Show Modal triggered"),d(!0),j()},children:"View Spend Report"}),(0,s.jsxs)(_.Z,{visible:c,width:1e3,onOk:()=>{d(!1)},onCancel:()=>{d(!1)},footer:null,children:[(0,s.jsxs)(U.Z,{style:{textAlign:"left"},children:["Key Name: ",i]}),(0,s.jsxs)(L.Z,{children:["Monthly Spend $",r]}),(0,s.jsx)(C.Z,{className:"mt-6 mb-6",children:m&&(0,s.jsx)(F.Z,{className:"mt-6",data:m,colors:["green"],index:"day",categories:["spend"],yAxisWidth:48})}),(0,s.jsx)(U.Z,{className:"mt-6",children:"Top 5 Users Spend 
(USD)"}),(0,s.jsx)(C.Z,{className:"mb-6",children:u&&(0,s.jsx)(K.Z,{className:"mt-6",data:u,color:"teal"})})]})]}):null},B=e=>{let{userID:t,accessToken:n,data:r,setData:a}=e,[i,c]=(0,l.useState)(!1),[d,h]=(0,l.useState)(!1),[u,x]=(0,l.useState)(null),p=async e=>{null!=r&&(x(e),localStorage.removeItem("userData"+t),h(!0))},j=async()=>{if(null!=u&&null!=r){try{await m(n,u);let e=r.filter(e=>e.token!==u);a(e)}catch(e){console.error("Error deleting the key:",e)}h(!1),x(null)}};if(null!=r)return console.log("RERENDER TRIGGERED"),(0,s.jsxs)(C.Z,{className:"w-full mx-auto flex-auto overflow-y-auto max-h-[50vh] mb-4",children:[(0,s.jsx)(U.Z,{children:"API Keys"}),(0,s.jsxs)(T.Z,{className:"mt-5",children:[(0,s.jsx)(O.Z,{children:(0,s.jsxs)(M.Z,{children:[(0,s.jsx)(R.Z,{children:"Key Alias"}),(0,s.jsx)(R.Z,{children:"Secret Key"}),(0,s.jsx)(R.Z,{children:"Spend (USD)"}),(0,s.jsx)(R.Z,{children:"Key Budget (USD)"}),(0,s.jsx)(R.Z,{children:"Team ID"}),(0,s.jsx)(R.Z,{children:"Metadata"}),(0,s.jsx)(R.Z,{children:"Models"}),(0,s.jsx)(R.Z,{children:"TPM / RPM Limits"}),(0,s.jsx)(R.Z,{children:"Expires"})]})}),(0,s.jsx)(P.Z,{children:r.map(e=>(console.log(e),"litellm-dashboard"===e.team_id)?null:(0,s.jsxs)(M.Z,{children:[(0,s.jsx)(E.Z,{children:null!=e.key_alias?(0,s.jsx)(Z.Z,{children:e.key_alias}):(0,s.jsx)(Z.Z,{children:"Not Set"})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(Z.Z,{children:e.key_name})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(Z.Z,{children:e.spend})}),(0,s.jsx)(E.Z,{children:null!=e.max_budget?(0,s.jsx)(Z.Z,{children:e.max_budget}):(0,s.jsx)(Z.Z,{children:"Unlimited Budget"})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(Z.Z,{children:e.team_id})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(Z.Z,{children:JSON.stringify(e.metadata)})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(Z.Z,{children:JSON.stringify(e.models)})}),(0,s.jsx)(E.Z,{children:(0,s.jsxs)(Z.Z,{children:["TPM Limit: ",e.tpm_limit?e.tpm_limit:"Unlimited"," ",(0,s.jsx)("br",{})," RPM Limit:"," 
",e.rpm_limit?e.rpm_limit:"Unlimited"]})}),(0,s.jsx)(E.Z,{children:null!=e.expires?(0,s.jsx)(Z.Z,{children:e.expires}):(0,s.jsx)(Z.Z,{children:"Never expires"})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(D.Z,{onClick:()=>p(e.token),icon:A.Z,size:"sm"})}),(0,s.jsx)(E.Z,{children:(0,s.jsx)(z,{token:e.token,accessToken:n,keySpend:e.spend,keyBudget:e.max_budget,keyName:e.key_name})})]},e.token))})]}),d&&(0,s.jsx)("div",{className:"fixed z-10 inset-0 overflow-y-auto",children:(0,s.jsxs)("div",{className:"flex items-end justify-center min-h-screen pt-4 px-4 pb-20 text-center sm:block sm:p-0",children:[(0,s.jsx)("div",{className:"fixed inset-0 transition-opacity","aria-hidden":"true",children:(0,s.jsx)("div",{className:"absolute inset-0 bg-gray-500 opacity-75"})}),(0,s.jsx)("span",{className:"hidden sm:inline-block sm:align-middle sm:h-screen","aria-hidden":"true",children:"​"}),(0,s.jsxs)("div",{className:"inline-block align-bottom bg-white rounded-lg text-left overflow-hidden shadow-xl transform transition-all sm:my-8 sm:align-middle sm:max-w-lg sm:w-full",children:[(0,s.jsx)("div",{className:"bg-white px-4 pt-5 pb-4 sm:p-6 sm:pb-4",children:(0,s.jsx)("div",{className:"sm:flex sm:items-start",children:(0,s.jsxs)("div",{className:"mt-3 text-center sm:mt-0 sm:ml-4 sm:text-left",children:[(0,s.jsx)("h3",{className:"text-lg leading-6 font-medium text-gray-900",children:"Delete Key"}),(0,s.jsx)("div",{className:"mt-2",children:(0,s.jsx)("p",{className:"text-sm text-gray-500",children:"Are you sure you want to delete this key ?"})})]})})}),(0,s.jsxs)("div",{className:"bg-gray-50 px-4 py-3 sm:px-6 sm:flex sm:flex-row-reverse",children:[(0,s.jsx)(o.Z,{onClick:j,color:"red",className:"ml-2",children:"Delete"}),(0,s.jsx)(o.Z,{onClick:()=>{h(!1),x(null)},children:"Cancel"})]})]})]})})]})},J=e=>{let{userID:t,userSpendData:n,userRole:r,accessToken:a}=e;console.log("User SpendData:",n);let[o,i]=(0,l.useState)(null==n?void 0:n.spend),[c,d]=(0,l.useState)((null==n?void 
0:n.max_budget)||null);return(0,l.useEffect)(()=>{(async()=>{if("Admin"===r)try{let e=await g(a,"litellm-proxy-budget");console.log("Result from callSpendUsers:",e);let t=e[0];i(null==t?void 0:t.spend),d((null==t?void 0:t.max_budget)||null)}catch(e){console.error("Failed to get spend for user",e)}})()},[r,a,t]),(0,s.jsx)(s.Fragment,{children:(0,s.jsxs)(C.Z,{className:"mx-auto mb-4",children:[(0,s.jsxs)(L.Z,{children:["$",o]}),(0,s.jsxs)(U.Z,{children:["/ ",null!==c?"$".concat(c," limit"):"No limit"]})]})})},q=n(37963);console.log("isLocal:",!1);var G=e=>{let{userID:t,userRole:n,setUserRole:a,userEmail:o,setUserEmail:i}=e,[c,d]=(0,l.useState)(null),[m,x]=(0,l.useState)(null),p=(0,r.useSearchParams)();p.get("viewSpend"),(0,r.useRouter)();let j=p.get("token"),[g,Z]=(0,l.useState)(null),[w,k]=(0,l.useState)([]);if((0,l.useEffect)(()=>{if(j){let e=(0,q.o)(j);if(e){if(console.log("Decoded token:",e),console.log("Decoded key:",e.key),Z(e.key),e.user_role){let t=function(e){if(!e)return"Undefined Role";switch(console.log("Received user role: ".concat(e)),e.toLowerCase()){case"app_owner":case"demo_app_owner":return"App Owner";case"app_admin":return"Admin";case"app_user":return"App User";default:return"Unknown Role"}}(e.user_role);console.log("Decoded user_role:",t),a(t)}else console.log("User role not defined");e.user_email?i(e.user_email):console.log("User Email is not set ".concat(e))}}if(t&&g&&n&&!c){let e=localStorage.getItem("userData"+t),s=localStorage.getItem("userSpendData"+t),l=localStorage.getItem("userModels"+t);e&&s&&l?(d(JSON.parse(e)),x(JSON.parse(s)),k(JSON.parse(l))):(async()=>{try{let e=await h(g,t,n);x(e.user_info),d(e.keys),localStorage.setItem("userData"+t,JSON.stringify(e.keys)),localStorage.setItem("userSpendData"+t,JSON.stringify(e.user_info));let s=await u(g,t,n);console.log("model_info:",s);let 
l=s.data.map(e=>e.model_name);console.log("available_model_names:",l),k(l),console.log("userModels:",w),localStorage.setItem("userModels"+t,JSON.stringify(l))}catch(e){console.error("There was an error fetching the data",e)}})()}},[t,j,g,c,n]),null==t||null==j){let e="/sso/key/generate";return console.log("Full URL:",e),window.location.href=e,null}return null==g?null:(null==n&&a("App Owner"),(0,s.jsx)("div",{children:(0,s.jsx)(f.Z,{numItems:1,className:"gap-0 p-10 h-[75vh] w-full",children:(0,s.jsxs)(y.Z,{numColSpan:1,children:[(0,s.jsx)(J,{userID:t,userSpendData:m,userRole:n,accessToken:g}),(0,s.jsx)(B,{userID:t,accessToken:g,data:c,setData:d}),(0,s.jsx)(I,{userID:t,userRole:n,userModels:w,accessToken:g,data:c,setData:d})]})})}))},$=e=>{let{accessToken:t,token:n,userRole:r,userID:a}=e,[o,i]=(0,l.useState)({data:[]});if((0,l.useEffect)(()=>{if(!t||!n||!r||!a)return;let e=async()=>{try{let e=await u(t,a,r);console.log("Model data response:",e.data),i(e)}catch(e){console.error("There was an error fetching the model data",e)}};t&&n&&r&&a&&e()},[t,n,r,a]),!o)return(0,s.jsx)("div",{children:"Loading..."});for(let e=0;e(0,s.jsxs)(M.Z,{children:[(0,s.jsx)(E.Z,{children:(0,s.jsx)(U.Z,{children:e.model_name})}),(0,s.jsx)(E.Z,{children:e.provider}),(0,s.jsx)(E.Z,{children:e.input_cost}),(0,s.jsx)(E.Z,{children:e.output_cost}),(0,s.jsx)(E.Z,{children:e.max_tokens})]},e.model_name))})]})})})})},V=n(92836),W=n(26734),H=n(41608),Y=n(32126),X=n(23682),Q=n(12968),ee=n(67951);async function et(e,t,n,s){console.log("isLocal:",!1);let l=window.location.origin,r=new Q.ZP.OpenAI({apiKey:s,baseURL:l,dangerouslyAllowBrowser:!0});for await(let s of(await r.chat.completions.create({model:n,stream:!0,messages:[{role:"user",content:e}]})))console.log(s),s.choices[0].delta.content&&t(s.choices[0].delta.content)}var en=e=>{let{accessToken:t,token:n,userRole:r,userID:a}=e,[o,i]=(0,l.useState)(""),[c,d]=(0,l.useState)([]),[m,h]=(0,l.useState)(void 
0),[x,p]=(0,l.useState)(null);(0,l.useEffect)(()=>{t&&n&&r&&a&&(async()=>{let e=await u(t,a,r);console.log("model_info:",e),(null==e?void 0:e.data.length)>0&&(p(e),h(e.data[0].model_name))})()},[t,a,r]);let j=(e,t)=>{d(n=>{let s=n[n.length-1];return s&&s.role===e?[...n.slice(0,n.length-1),{role:e,content:s.content+t}]:[...n,{role:e,content:t}]})},g=async()=>{if(""!==o.trim()&&t&&n&&r&&a){d(e=>[...e,{role:"user",content:o}]);try{m&&await et(o,e=>j("assistant",e),m,t)}catch(e){console.error("Error fetching model response",e),j("assistant","Error fetching model response")}i("")}};return(0,s.jsx)("div",{style:{width:"100%",position:"relative"},children:(0,s.jsx)(f.Z,{className:"gap-2 p-10 h-[75vh] w-full",children:(0,s.jsx)(C.Z,{children:(0,s.jsxs)(W.Z,{children:[(0,s.jsxs)(H.Z,{className:"mt-4",children:[(0,s.jsx)(V.Z,{children:"Chat"}),(0,s.jsx)(V.Z,{children:"API Reference"})]}),(0,s.jsxs)(X.Z,{children:[(0,s.jsxs)(Y.Z,{children:[(0,s.jsxs)("div",{children:[(0,s.jsx)("label",{children:"Select Model:"}),(0,s.jsx)("select",{value:m||"",onChange:e=>h(e.target.value),children:null==x?void 0:x.data.map(e=>(0,s.jsx)("option",{value:e.model_name,children:e.model_name},e.model_name))})]}),(0,s.jsxs)(T.Z,{className:"mt-5",style:{display:"block",maxHeight:"60vh",overflowY:"auto"},children:[(0,s.jsx)(O.Z,{children:(0,s.jsx)(M.Z,{children:(0,s.jsx)(E.Z,{children:(0,s.jsx)(U.Z,{children:"Chat"})})})}),(0,s.jsx)(P.Z,{children:c.map((e,t)=>(0,s.jsx)(M.Z,{children:(0,s.jsx)(E.Z,{children:"".concat(e.role,": ").concat(e.content)})},t))})]}),(0,s.jsx)("div",{className:"mt-3",style:{position:"absolute",bottom:5,width:"95%"},children:(0,s.jsxs)("div",{className:"flex",children:[(0,s.jsx)("input",{type:"text",value:o,onChange:e=>i(e.target.value),className:"flex-1 p-2 border rounded-md mr-2",placeholder:"Type your message..."}),(0,s.jsx)("button",{onClick:g,className:"p-2 bg-blue-500 text-white 
rounded-md",children:"Send"})]})})]}),(0,s.jsx)(Y.Z,{children:(0,s.jsxs)(W.Z,{children:[(0,s.jsxs)(H.Z,{children:[(0,s.jsx)(V.Z,{children:"OpenAI Python SDK"}),(0,s.jsx)(V.Z,{children:"LlamaIndex"}),(0,s.jsx)(V.Z,{children:"Langchain Py"})]}),(0,s.jsxs)(X.Z,{children:[(0,s.jsx)(Y.Z,{children:(0,s.jsx)(ee.Z,{language:"python",children:'\nimport openai\nclient = openai.OpenAI(\n api_key="your_api_key",\n base_url="http://0.0.0.0:4000" # proxy base url\n)\n\nresponse = client.chat.completions.create(\n model="gpt-3.5-turbo", # model to use from Models Tab\n messages = [\n {\n "role": "user",\n "content": "this is a test request, write a short poem"\n }\n ],\n extra_body={\n "metadata": {\n "generation_name": "ishaan-generation-openai-client",\n "generation_id": "openai-client-gen-id22",\n "trace_id": "openai-client-trace-id22",\n "trace_user_id": "openai-client-user-id2"\n }\n }\n)\n\nprint(response)\n '})}),(0,s.jsx)(Y.Z,{children:(0,s.jsx)(ee.Z,{language:"python",children:'\nimport os, dotenv\n\nfrom llama_index.llms import AzureOpenAI\nfrom llama_index.embeddings import AzureOpenAIEmbedding\nfrom llama_index import VectorStoreIndex, SimpleDirectoryReader, ServiceContext\n\nllm = AzureOpenAI(\n engine="azure-gpt-3.5", # model_name on litellm proxy\n temperature=0.0,\n azure_endpoint="http://0.0.0.0:4000", # litellm proxy endpoint\n api_key="sk-1234", # litellm proxy API Key\n api_version="2023-07-01-preview",\n)\n\nembed_model = AzureOpenAIEmbedding(\n deployment_name="azure-embedding-model",\n azure_endpoint="http://0.0.0.0:4000",\n api_key="sk-1234",\n api_version="2023-07-01-preview",\n)\n\n\ndocuments = SimpleDirectoryReader("llama_index_data").load_data()\nservice_context = ServiceContext.from_defaults(llm=llm, embed_model=embed_model)\nindex = VectorStoreIndex.from_documents(documents, service_context=service_context)\n\nquery_engine = index.as_query_engine()\nresponse = query_engine.query("What did the author do growing up?")\nprint(response)\n\n 
'})}),(0,s.jsx)(Y.Z,{children:(0,s.jsx)(ee.Z,{language:"python",children:'\nfrom langchain.chat_models import ChatOpenAI\nfrom langchain.prompts.chat import (\n ChatPromptTemplate,\n HumanMessagePromptTemplate,\n SystemMessagePromptTemplate,\n)\nfrom langchain.schema import HumanMessage, SystemMessage\n\nchat = ChatOpenAI(\n openai_api_base="http://0.0.0.0:8000",\n model = "gpt-3.5-turbo",\n temperature=0.1,\n extra_body={\n "metadata": {\n "generation_name": "ishaan-generation-langchain-client",\n "generation_id": "langchain-client-gen-id22",\n "trace_id": "langchain-client-trace-id22",\n "trace_user_id": "langchain-client-user-id2"\n }\n }\n)\n\nmessages = [\n SystemMessage(\n content="You are a helpful assistant that im using to make a test request to."\n ),\n HumanMessage(\n content="test from litellm. tell me why it\'s amazing in 1 sentence"\n ),\n]\nresponse = chat(messages)\n\nprint(response)\n\n '})})]})]})})]})]})})})})},es=n(33509),el=n(30569);let{Sider:er}=es.default;var ea=e=>{let{setPage:t}=e;return(0,s.jsx)(es.default,{style:{minHeight:"100vh",maxWidth:"120px"},children:(0,s.jsx)(er,{width:120,children:(0,s.jsxs)(el.Z,{mode:"inline",defaultSelectedKeys:["1"],style:{height:"100%",borderRight:0},children:[(0,s.jsx)(el.Z.Item,{onClick:()=>t("api-keys"),children:"API Keys"},"1"),(0,s.jsx)(el.Z.Item,{onClick:()=>t("models"),children:"Models"},"2"),(0,s.jsx)(el.Z.Item,{onClick:()=>t("llm-playground"),children:"Chat UI"},"3"),(0,s.jsx)(el.Z.Item,{onClick:()=>t("usage"),children:"Usage"},"4")]})})})};let eo=e=>{let{payload:t,active:n}=e;if(!n||!t)return null;let l=t[0].payload,r=l.startTime,a=Object.entries(l.models).map(e=>{let[t,n]=e;return[t,n]});a.sort((e,t)=>t[1]-e[1]);let o=a.slice(0,5);return(0,s.jsxs)("div",{className:"w-56 rounded-tremor-default border border-tremor-border bg-tremor-background p-2 text-tremor-default shadow-tremor-dropdown",children:[r,o.map(e=>{let[t,n]=e;return(0,s.jsx)("div",{className:"flex flex-1 
space-x-10",children:(0,s.jsx)("div",{className:"p-2",children:(0,s.jsxs)("p",{className:"text-tremor-content text-xs",children:[t,":",(0,s.jsxs)("span",{className:"text-xs text-tremor-content-emphasis",children:[" ",n?n<.01?"<$0.01":n.toFixed(2):""]})]})})},t)})]})};var ei=e=>{let{accessToken:t,token:n,userRole:r,userID:a}=e,o=new Date,[i,c]=(0,l.useState)([]),[d,m]=(0,l.useState)([]),[h,u]=(0,l.useState)([]),x=new Date(o.getFullYear(),o.getMonth(),1),g=new Date(o.getFullYear(),o.getMonth()+1,0),Z=k(x),w=k(g);function k(e){let t=e.getFullYear(),n=e.getMonth()+1,s=e.getDate();return"".concat(t,"-").concat(n<10?"0"+n:n,"-").concat(s<10?"0"+s:s)}return console.log("Start date is ".concat(Z)),console.log("End date is ".concat(w)),(0,l.useEffect)(()=>{t&&n&&r&&a&&(async()=>{try{await p(t,n,r,a,Z,w).then(async e=>{let n=(await j(t,function(e){let t=[];e.forEach(e=>{Object.entries(e).forEach(e=>{let[n,s]=e;"spend"!==n&&"startTime"!==n&&"models"!==n&&"users"!==n&&t.push({key:n,spend:s})})}),t.sort((e,t)=>Number(t.spend)-Number(e.spend));let n=t.slice(0,5).map(e=>e.key);return console.log("topKeys: ".concat(Object.keys(n[0]))),n}(e))).info.map(e=>({key:(e.key_name||e.key_alias||e.token).substring(0,7),spend:e.spend}));m(n),u(function(e){let t={};e.forEach(e=>{Object.entries(e.users).forEach(e=>{let[n,s]=e;""!==n&&null!=n&&"None"!=n&&(t[n]||(t[n]=0),t[n]+=s)})});let n=Object.entries(t).map(e=>{let[t,n]=e;return{user_id:t,spend:n}});n.sort((e,t)=>t.spend-e.spend);let s=n.slice(0,5);return console.log("topKeys: ".concat(Object.values(s[0]))),s}(e)),c(e)})}catch(e){console.error("There was an error fetching the data",e)}})()},[t,n,r,a,Z,w]),(0,s.jsx)("div",{style:{width:"100%"},children:(0,s.jsxs)(f.Z,{numItems:2,className:"gap-2 p-10 h-[75vh] w-full",children:[(0,s.jsx)(y.Z,{numColSpan:2,children:(0,s.jsxs)(C.Z,{children:[(0,s.jsx)(U.Z,{children:"Monthly Spend"}),(0,s.jsx)(F.Z,{data:i,index:"startTime",categories:["spend"],colors:["blue"],valueFormatter:e=>"$ ".concat(new 
Intl.NumberFormat("us").format(e).toString()),yAxisWidth:100,tickGap:5,customTooltip:eo})]})}),(0,s.jsx)(y.Z,{numColSpan:1,children:(0,s.jsxs)(C.Z,{children:[(0,s.jsx)(U.Z,{children:"Top API Keys"}),(0,s.jsx)(F.Z,{className:"mt-4 h-40",data:d,index:"key",categories:["spend"],colors:["blue"],yAxisWidth:80,tickGap:5,layout:"vertical",showXAxis:!1,showLegend:!1})]})}),(0,s.jsx)(y.Z,{numColSpan:1,children:(0,s.jsxs)(C.Z,{children:[(0,s.jsx)(U.Z,{children:"Top Users"}),(0,s.jsx)(F.Z,{className:"mt-4 h-40",data:h,index:"user_id",categories:["spend"],colors:["blue"],yAxisWidth:200,layout:"vertical",showXAxis:!1,showLegend:!1})]})})]})})},ec=()=>{let[e,t]=(0,l.useState)(null),[n,a]=(0,l.useState)(null),o=(0,r.useSearchParams)(),c=o.get("userID"),d=o.get("token"),[m,h]=(0,l.useState)("api-keys"),[u,x]=(0,l.useState)(null);return(0,l.useEffect)(()=>{if(d){let e=(0,q.o)(d);if(e){if(console.log("Decoded token:",e),console.log("Decoded key:",e.key),x(e.key),e.user_role){let n=function(e){if(!e)return"Undefined Role";switch(console.log("Received user role: ".concat(e)),e.toLowerCase()){case"app_owner":case"demo_app_owner":return"App Owner";case"app_admin":return"Admin";case"app_user":return"App User";default:return"Unknown Role"}}(e.user_role);console.log("Decoded user_role:",n),t(n)}else console.log("User role not defined");e.user_email?a(e.user_email):console.log("User Email is not set ".concat(e))}}},[d]),(0,s.jsx)(l.Suspense,{fallback:(0,s.jsx)("div",{children:"Loading..."}),children:(0,s.jsxs)("div",{className:"flex flex-col min-h-screen",children:[(0,s.jsx)(i,{userID:c,userRole:e,userEmail:n}),(0,s.jsxs)("div",{className:"flex flex-1 
overflow-auto",children:[(0,s.jsx)(ea,{setPage:h}),"api-keys"==m?(0,s.jsx)(G,{userID:c,userRole:e,setUserRole:t,userEmail:n,setUserEmail:a}):"models"==m?(0,s.jsx)($,{userID:c,userRole:e,token:d,accessToken:u}):"llm-playground"==m?(0,s.jsx)(en,{userID:c,userRole:e,token:d,accessToken:u}):(0,s.jsx)(ei,{userID:c,userRole:e,token:d,accessToken:u})]})]})})}}},function(e){e.O(0,[145,971,69,744],function(){return e(e.s=20661)}),_N_E=e.O()}]); \ No newline at end of file diff --git a/ui/litellm-dashboard/out/index.html b/ui/litellm-dashboard/out/index.html index 80296f4f6..a6994e708 100644 --- a/ui/litellm-dashboard/out/index.html +++ b/ui/litellm-dashboard/out/index.html @@ -1 +1 @@ -🚅 LiteLLM \ No newline at end of file +🚅 LiteLLM \ No newline at end of file diff --git a/ui/litellm-dashboard/out/index.txt b/ui/litellm-dashboard/out/index.txt index b6bb2c868..2356232b4 100644 --- a/ui/litellm-dashboard/out/index.txt +++ b/ui/litellm-dashboard/out/index.txt @@ -1,7 +1,7 @@ 2:I[77831,[],""] -3:I[48016,["145","static/chunks/145-9c160ad5539e000f.js","931","static/chunks/app/page-7bb820bd6902dbf2.js"],""] +3:I[48016,["145","static/chunks/145-9c160ad5539e000f.js","931","static/chunks/app/page-2322bcdc2ec71284.js"],""] 4:I[5613,[],""] 5:I[31778,[],""] -0:["unBuvDqydg0yodtP5c3nQ",[[["",{"children":["__PAGE__",{}]},"$undefined","$undefined",true],["",{"children":["__PAGE__",{},["$L1",["$","$L2",null,{"propsForComponent":{"params":{}},"Component":"$3","isStaticGeneration":true}],null]]},[null,["$","html",null,{"lang":"en","children":["$","body",null,{"className":"__className_c23dc8","children":["$","$L4",null,{"parallelRouterKey":"children","segmentPath":["children"],"loading":"$undefined","loadingStyles":"$undefined","loadingScripts":"$undefined","hasLoading":false,"error":"$undefined","errorStyles":"$undefined","errorScripts":"$undefined","template":["$","$L5",null,{}],"templateStyles":"$undefined","templateScripts":"$undefined","notFound":[["$","title",null,{"children":"404: 
This page could not be found."}],["$","div",null,{"style":{"fontFamily":"system-ui,\"Segoe UI\",Roboto,Helvetica,Arial,sans-serif,\"Apple Color Emoji\",\"Segoe UI Emoji\"","height":"100vh","textAlign":"center","display":"flex","flexDirection":"column","alignItems":"center","justifyContent":"center"},"children":["$","div",null,{"children":[["$","style",null,{"dangerouslySetInnerHTML":{"__html":"body{color:#000;background:#fff;margin:0}.next-error-h1{border-right:1px solid rgba(0,0,0,.3)}@media (prefers-color-scheme:dark){body{color:#fff;background:#000}.next-error-h1{border-right:1px solid rgba(255,255,255,.3)}}"}}],["$","h1",null,{"className":"next-error-h1","style":{"display":"inline-block","margin":"0 20px 0 0","padding":"0 23px 0 0","fontSize":24,"fontWeight":500,"verticalAlign":"top","lineHeight":"49px"},"children":"404"}],["$","div",null,{"style":{"display":"inline-block"},"children":["$","h2",null,{"style":{"fontSize":14,"fontWeight":400,"lineHeight":"49px","margin":0},"children":"This page could not be found."}]}]]}]}]],"notFoundStyles":[],"styles":null}]}]}],null]],[[["$","link","0",{"rel":"stylesheet","href":"/ui/_next/static/css/c18941d97fb7245b.css","precedence":"next","crossOrigin":""}]],"$L6"]]]] +0:["S_8LZOnl2nyURq-NYnh2p",[[["",{"children":["__PAGE__",{}]},"$undefined","$undefined",true],["",{"children":["__PAGE__",{},["$L1",["$","$L2",null,{"propsForComponent":{"params":{}},"Component":"$3","isStaticGeneration":true}],null]]},[null,["$","html",null,{"lang":"en","children":["$","body",null,{"className":"__className_c23dc8","children":["$","$L4",null,{"parallelRouterKey":"children","segmentPath":["children"],"loading":"$undefined","loadingStyles":"$undefined","loadingScripts":"$undefined","hasLoading":false,"error":"$undefined","errorStyles":"$undefined","errorScripts":"$undefined","template":["$","$L5",null,{}],"templateStyles":"$undefined","templateScripts":"$undefined","notFound":[["$","title",null,{"children":"404: This page could not be 
found."}],["$","div",null,{"style":{"fontFamily":"system-ui,\"Segoe UI\",Roboto,Helvetica,Arial,sans-serif,\"Apple Color Emoji\",\"Segoe UI Emoji\"","height":"100vh","textAlign":"center","display":"flex","flexDirection":"column","alignItems":"center","justifyContent":"center"},"children":["$","div",null,{"children":[["$","style",null,{"dangerouslySetInnerHTML":{"__html":"body{color:#000;background:#fff;margin:0}.next-error-h1{border-right:1px solid rgba(0,0,0,.3)}@media (prefers-color-scheme:dark){body{color:#fff;background:#000}.next-error-h1{border-right:1px solid rgba(255,255,255,.3)}}"}}],["$","h1",null,{"className":"next-error-h1","style":{"display":"inline-block","margin":"0 20px 0 0","padding":"0 23px 0 0","fontSize":24,"fontWeight":500,"verticalAlign":"top","lineHeight":"49px"},"children":"404"}],["$","div",null,{"style":{"display":"inline-block"},"children":["$","h2",null,{"style":{"fontSize":14,"fontWeight":400,"lineHeight":"49px","margin":0},"children":"This page could not be found."}]}]]}]}]],"notFoundStyles":[],"styles":null}]}]}],null]],[[["$","link","0",{"rel":"stylesheet","href":"/ui/_next/static/css/c18941d97fb7245b.css","precedence":"next","crossOrigin":""}]],"$L6"]]]] 6:[["$","meta","0",{"name":"viewport","content":"width=device-width, initial-scale=1"}],["$","meta","1",{"charSet":"utf-8"}],["$","title","2",{"children":"🚅 LiteLLM"}],["$","meta","3",{"name":"description","content":"LiteLLM Proxy Admin UI"}],["$","link","4",{"rel":"icon","href":"/ui/favicon.ico","type":"image/x-icon","sizes":"16x16"}],["$","meta","5",{"name":"next-size-adjust"}]] 1:null diff --git a/ui/litellm-dashboard/src/components/networking.tsx b/ui/litellm-dashboard/src/components/networking.tsx index 7905ed7db..5874ae2a9 100644 --- a/ui/litellm-dashboard/src/components/networking.tsx +++ b/ui/litellm-dashboard/src/components/networking.tsx @@ -239,7 +239,7 @@ export const userSpendLogsCall = async ( export const keyInfoCall = async (accessToken: String, keys: String[]) => { 
try { - let url = proxyBaseUrl ? `${proxyBaseUrl}/v2/key/info` : `/key/info`; + let url = proxyBaseUrl ? `${proxyBaseUrl}/v2/key/info` : `/v2/key/info`; const response = await fetch(url, { method: "POST", diff --git a/ui/litellm-dashboard/src/components/user_dashboard.tsx b/ui/litellm-dashboard/src/components/user_dashboard.tsx index bf95d09f7..f3f24e444 100644 --- a/ui/litellm-dashboard/src/components/user_dashboard.tsx +++ b/ui/litellm-dashboard/src/components/user_dashboard.tsx @@ -49,6 +49,14 @@ const UserDashboard: React.FC = ({ const [accessToken, setAccessToken] = useState(null); const [userModels, setUserModels] = useState([]); + // check if window is not undefined + if (typeof window !== "undefined") { + window.addEventListener('beforeunload', function() { + // Clear session storage + sessionStorage.clear(); + }); + } + function formatUserRole(userRole: string) { if (!userRole) { return "Undefined Role"; @@ -70,6 +78,7 @@ const UserDashboard: React.FC = ({ // Moved useEffect inside the component and used a condition to run fetch only if the params are available useEffect(() => { + if (token) { const decoded = jwtDecode(token) as { [key: string]: any }; if (decoded) { @@ -97,22 +106,22 @@ const UserDashboard: React.FC = ({ } } if (userID && accessToken && userRole && !data) { - const cachedData = localStorage.getItem("userData" + userID); - const cachedSpendData = localStorage.getItem("userSpendData" + userID); - const cachedUserModels = localStorage.getItem("userModels" + userID); + const cachedData = sessionStorage.getItem("userData" + userID); + const cachedSpendData = sessionStorage.getItem("userSpendData" + userID); + const cachedUserModels = sessionStorage.getItem("userModels" + userID); if (cachedData && cachedSpendData && cachedUserModels) { setData(JSON.parse(cachedData)); setUserSpendData(JSON.parse(cachedSpendData)); setUserModels(JSON.parse(cachedUserModels)); - + } else { const fetchData = async () => { try { const response = await 
userInfoCall(accessToken, userID, userRole); setUserSpendData(response["user_info"]); setData(response["keys"]); // Assuming this is the correct path to your data - localStorage.setItem("userData" + userID, JSON.stringify(response["keys"])); - localStorage.setItem( + sessionStorage.setItem("userData" + userID, JSON.stringify(response["keys"])); + sessionStorage.setItem( "userSpendData" + userID, JSON.stringify(response["user_info"]) ); @@ -126,7 +135,7 @@ const UserDashboard: React.FC = ({ console.log("userModels:", userModels); - localStorage.setItem("userModels" + userID, JSON.stringify(available_model_names)); + sessionStorage.setItem("userModels" + userID, JSON.stringify(available_model_names));