diff --git a/docs/my-website/docs/proxy/prometheus.md b/docs/my-website/docs/proxy/prometheus.md
index 34a1034a9..6c856f58b 100644
--- a/docs/my-website/docs/proxy/prometheus.md
+++ b/docs/my-website/docs/proxy/prometheus.md
@@ -75,6 +75,12 @@ http://localhost:4000/metrics
 | `deployment_state`             | The state of the deployment: 0 = healthy, 1 = partial outage, 2 = complete outage. |
 | `litellm_remaining_requests_metric`             | Track `x-ratelimit-remaining-requests` returned from LLM API Deployment |
 | `litellm_remaining_tokens`                | Track `x-ratelimit-remaining-tokens` return from LLM API Deployment |
+ `llm_deployment_success_responses`              |  Total number of successful LLM API calls for deployment                               |
+| `llm_deployment_failure_responses`              | Total number of failed LLM API calls for deployment                                   |
+| `llm_deployment_total_requests`                 | Total number of LLM API calls for deployment - success + failure                      |
+| `llm_deployment_latency_per_output_token`       | Latency per output token for deployment                                                          |
+| `llm_deployment_successful_fallbacks`           |  Number of successful fallback requests from primary model -> fallback model        |
+| `llm_deployment_failed_fallbacks`               | Number of failed fallback requests from primary model -> fallback model            |
 
 
 
diff --git a/litellm/integrations/prometheus.py b/litellm/integrations/prometheus.py
index 8e31bca13..8797807ac 100644
--- a/litellm/integrations/prometheus.py
+++ b/litellm/integrations/prometheus.py
@@ -172,12 +172,12 @@ class PrometheusLogger(CustomLogger):
 
                 self.llm_deployment_successful_fallbacks = Counter(
                     "llm_deployment_successful_fallbacks",
-                    "LLM Deployment Analytics - Number of successful fallback workloads",
+                    "LLM Deployment Analytics - Number of successful fallback requests from primary model -> fallback model",
                     ["primary_model", "fallback_model"],
                 )
                 self.llm_deployment_failed_fallbacks = Counter(
                     "llm_deployment_failed_fallbacks",
-                    "LLM Deployment Analytics - Number of failed fallback workloads",
+                    "LLM Deployment Analytics - Number of failed fallback requests from primary model -> fallback model",
                     ["primary_model", "fallback_model"],
                 )