(feat) proxy add openapi.json

2025-04-24 18:24:20 +00:00 · 2023-10-25 08:47:29 -07:00 · 2023-10-25 08:47:29 -07:00 · 9714b85cac
commit 9714b85cac
parent 92e240e474
1 changed files with 219 additions and 0 deletions
--- a/openai-proxy/openapi.json
+++ b/openai-proxy/openapi.json
@@ -0,0 +1,219 @@
+{
+    "openapi": "3.0.0",
+    "info": {
+      "version": "1.0.0",
+      "title": "LiteLLM API",
+      "description": "API for LiteLLM"
+    },
+    "paths": {
+     "/chat/completions": {
+    "post": {
+      "summary": "Create chat completion for 100+ LLM APIs",
+      "requestBody": {
+        "required": true,
+        "content": {
+          "application/json": {
+            "schema": {
+              "type": "object",
+              "properties": {
+                "model": {
+                  "type": "string",
+                  "description": "ID of the model to use"
+                },
+                "messages": {
+                  "type": "array",
+                  "items": {
+                    "type": "object",
+                    "properties": {
+                      "role": {
+                        "type": "string",
+                        "description": "The role of the message's author"
+                      },
+                      "content": {
+                        "type": "string",
+                        "description": "The contents of the message"
+                      },
+                      "name": {
+                        "type": "string",
+                        "description": "The name of the author of the message"
+                      },
+                      "function_call": {
+                        "type": "object",
+                        "description": "The name and arguments of a function that should be called"
+                      }
+                    }
+                  }
+                },
+                "functions": {
+                  "type": "array",
+                  "items": {
+                    "type": "object",
+                    "properties": {
+                      "name": {
+                        "type": "string",
+                        "description": "The name of the function to be called"
+                      },
+                      "description": {
+                        "type": "string",
+                        "description": "A description explaining what the function does"
+                      },
+                      "parameters": {
+                        "type": "object",
+                        "description": "The parameters that the function accepts"
+                      },
+                      "function_call": {
+                        "type": "string",
+                        "description": "Controls how the model responds to function calls"
+                      }
+                    }
+                  }
+                },
+                "temperature": {
+                  "type": "number",
+                  "description": "The sampling temperature to be used"
+                },
+                "top_p": {
+                  "type": "number",
+                  "description": "Nucleus sampling, an alternative to sampling with temperature: only the tokens comprising the top_p probability mass are considered"
+                },
+                "n": {
+                  "type": "integer",
+                  "description": "The number of chat completion choices to generate for each input message"
+                },
+                "stream": {
+                  "type": "boolean",
+                  "description": "If set to true, partial message deltas are sent as the response is generated"
+                },
+                "stop": {
+                  "type": "array",
+                  "items": {
+                    "type": "string"
+                  },
+                  "description": "Up to 4 sequences where the API will stop generating further tokens"
+                },
+                "max_tokens": {
+                  "type": "integer",
+                  "description": "The maximum number of tokens to generate in the chat completion"
+                },
+                "presence_penalty": {
+                  "type": "number",
+                  "description": "Penalizes new tokens based on whether they already appear in the text so far"
+                },
+                "frequency_penalty": {
+                  "type": "number",
+                  "description": "Penalizes new tokens based on how frequently they already appear in the text so far"
+                },
+                "logit_bias": {
+                  "type": "object",
+                  "description": "Used to modify the probability of specific tokens appearing in the completion"
+                },
+                "user": {
+                  "type": "string",
+                  "description": "A unique identifier representing your end-user"
+                }
+              }
+            }
+          }
+        }
+      },
+      "responses": {
+        "200": {
+          "description": "Successful operation",
+          "content": {
+            "application/json": {
+              "schema": {
+                "type": "object",
+                "properties": {
+                  "choices": {
+                    "type": "array",
+                    "items": {
+                      "type": "object",
+                      "properties": {
+                        "finish_reason": {
+                          "type": "string"
+                        },
+                        "index": {
+                          "type": "integer"
+                        },
+                        "message": {
+                          "type": "object",
+                          "properties": {
+                            "role": {
+                              "type": "string"
+                            },
+                            "content": {
+                              "type": "string"
+                            }
+                          }
+                        }
+                      }
+                    }
+                  },
+                  "created": {
+                    "type": "string"
+                  },
+                  "model": {
+                    "type": "string"
+                  },
+                  "usage": {
+                    "type": "object",
+                    "properties": {
+                      "prompt_tokens": {
+                        "type": "integer"
+                      },
+                      "completion_tokens": {
+                        "type": "integer"
+                      },
+                      "total_tokens": {
+                        "type": "integer"
+                      }
+                    }
+                  }
+                }
+              }
+            }
+          }
+        },
+        "500": {
+          "description": "Server error"
+        }
+      }
+    }
+  },
+  
+      "/completions": {
+        "post": {
+          "summary": "Create completion",
+          "responses": {
+            "200": {
+              "description": "Successful operation"
+            },
+            "500": {
+              "description": "Server error"
+            }
+          }
+        }
+      },
+      "/models": {
+        "get": {
+          "summary": "Get models",
+          "responses": {
+            "200": {
+              "description": "Successful operation"
+            }
+          }
+        }
+      },
+      "/": {
+        "get": {
+          "summary": "Swagger docs",
+          "responses": {
+            "200": {
+              "description": "Successful operation"
+            }
+          }
+        }
+      }
+    }
+  }
+