From 326ed210973e3f1ac872ff23fee0a8ad90f35524 Mon Sep 17 00:00:00 2001 From: Ishaan Jaff Date: Sat, 23 Nov 2024 12:22:17 -0800 Subject: [PATCH 1/2] docs - have 1 section for routing +load balancing --- docs/my-website/docs/proxy/load_balancing.md | 2 +- docs/my-website/docs/proxy/reliability.md | 2 +- docs/my-website/sidebars.js | 17 +++++++++++------ 3 files changed, 13 insertions(+), 8 deletions(-) diff --git a/docs/my-website/docs/proxy/load_balancing.md b/docs/my-website/docs/proxy/load_balancing.md index 20b803777..dc5724066 100644 --- a/docs/my-website/docs/proxy/load_balancing.md +++ b/docs/my-website/docs/proxy/load_balancing.md @@ -1,4 +1,4 @@ -# Multiple Instances +# Proxy - Load Balancing Load balance multiple instances of the same model The proxy will handle routing requests (using LiteLLM's Router). **Set `rpm` in the config if you want maximize throughput** diff --git a/docs/my-website/docs/proxy/reliability.md b/docs/my-website/docs/proxy/reliability.md index 73f25f817..1e6d0e26c 100644 --- a/docs/my-website/docs/proxy/reliability.md +++ b/docs/my-website/docs/proxy/reliability.md @@ -2,7 +2,7 @@ import Image from '@theme/IdealImage'; import Tabs from '@theme/Tabs'; import TabItem from '@theme/TabItem'; -# Fallbacks, Load Balancing, Retries +# Proxy - Fallbacks, Retries - Quick Start [load balancing](#test---load-balancing) - Quick Start [client side fallbacks](#test---client-side-fallbacks) diff --git a/docs/my-website/sidebars.js b/docs/my-website/sidebars.js index f2bb1c5e9..0821ac257 100644 --- a/docs/my-website/sidebars.js +++ b/docs/my-website/sidebars.js @@ -96,11 +96,10 @@ const sidebars = { label: "Spend Tracking + Budgets", items: ["proxy/cost_tracking", "proxy/users", "proxy/custom_pricing", "proxy/team_budgets", "proxy/billing", "proxy/customers"], }, - "proxy/reliability", { - type: "category", - label: "Routing", - items: ["proxy/load_balancing", "proxy/tag_routing", "proxy/provider_budget_routing", "proxy/team_based_routing", "proxy/customer_routing",], + type: "link", + label: "Load Balancing, Routing, Fallbacks", + href: "https://docs.litellm.ai/docs/routing-load-balancing", }, { type: "category", @@ -267,8 +266,14 @@ const sidebars = { }, { type: "category", - label: "Load Balancing", - items: ["routing", "scheduler"], + label: "Load Balancing & Routing", + link: { + type: "generated-index", + title: "Load Balancing & Routing", + description: "Learn how to load balance, route, and set fallbacks for your LLM requests", + slug: "/routing-load-balancing", + }, + items: ["routing", "scheduler", "proxy/load_balancing", "proxy/reliability", "proxy/tag_routing", "proxy/provider_budget_routing", "proxy/team_based_routing", "proxy/customer_routing"], }, { type: "category", From 1fc3f89f83caa914db5e7f02f1a109597996d5db Mon Sep 17 00:00:00 2001 From: Ishaan Jaff Date: Sat, 23 Nov 2024 12:24:06 -0800 Subject: [PATCH 2/2] remove emoji --- docs/my-website/docs/proxy/team_based_routing.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/my-website/docs/proxy/team_based_routing.md b/docs/my-website/docs/proxy/team_based_routing.md index 89b18ec63..bda286f4a 100644 --- a/docs/my-website/docs/proxy/team_based_routing.md +++ b/docs/my-website/docs/proxy/team_based_routing.md @@ -1,4 +1,4 @@ -# 👥 Team-based Routing +# Team-based Routing ## Routing Route calls to different model groups based on the team-id