docs - have 1 section for routing +load balancing (#6884)

* docs - have 1 section for routing +load balancing

* remove emoji
This commit is contained in:
Ishaan Jaff 2024-11-23 15:56:57 -08:00 committed by GitHub
parent 50314a66ca
commit afc69761de
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
4 changed files with 14 additions and 9 deletions

View file

@ -1,4 +1,4 @@
# Multiple Instances
# Proxy - Load Balancing
Load balance multiple instances of the same model
The proxy will handle routing requests (using LiteLLM's Router). **Set `rpm` in the config if you want to maximize throughput**

View file

@ -2,7 +2,7 @@ import Image from '@theme/IdealImage';
import Tabs from '@theme/Tabs';
import TabItem from '@theme/TabItem';
# Fallbacks, Load Balancing, Retries
# Proxy - Fallbacks, Retries
- Quick Start [load balancing](#test---load-balancing)
- Quick Start [client side fallbacks](#test---client-side-fallbacks)

View file

@ -1,4 +1,4 @@
# 👥 Team-based Routing
# Team-based Routing
## Routing
Route calls to different model groups based on the team-id

View file

@ -96,11 +96,10 @@ const sidebars = {
label: "Spend Tracking + Budgets",
items: ["proxy/cost_tracking", "proxy/users", "proxy/custom_pricing", "proxy/team_budgets", "proxy/billing", "proxy/customers"],
},
"proxy/reliability",
{
type: "category",
label: "Routing",
items: ["proxy/load_balancing", "proxy/tag_routing", "proxy/provider_budget_routing", "proxy/team_based_routing", "proxy/customer_routing",],
type: "link",
label: "Load Balancing, Routing, Fallbacks",
href: "https://docs.litellm.ai/docs/routing-load-balancing",
},
{
type: "category",
@ -267,8 +266,14 @@ const sidebars = {
},
{
type: "category",
label: "Load Balancing",
items: ["routing", "scheduler"],
label: "Load Balancing & Routing",
link: {
type: "generated-index",
title: "Load Balancing & Routing",
description: "Learn how to load balance, route, and set fallbacks for your LLM requests",
slug: "/routing-load-balancing",
},
items: ["routing", "scheduler", "proxy/load_balancing", "proxy/reliability", "proxy/tag_routing", "proxy/provider_budget_routing", "proxy/team_based_routing", "proxy/customer_routing"],
},
{
type: "category",