From c5288800210a0a6ff853ed750eee7534576205ab Mon Sep 17 00:00:00 2001
From: Krrish Dholakia
Date: Wed, 18 Oct 2023 11:27:18 -0700
Subject: [PATCH] docs(redis_cache.md): create a separate file for redis cache
 docs

---
 docs/my-website/docs/caching/caching.md     | 73 ---------------------
 docs/my-website/docs/caching/redis_cache.md | 73 +++++++++++++++++++++
 docs/my-website/sidebars.js                 |  1 +
 3 files changed, 74 insertions(+), 73 deletions(-)
 create mode 100644 docs/my-website/docs/caching/redis_cache.md

diff --git a/docs/my-website/docs/caching/caching.md b/docs/my-website/docs/caching/caching.md
index 069434b20..251b3e583 100644
--- a/docs/my-website/docs/caching/caching.md
+++ b/docs/my-website/docs/caching/caching.md
@@ -32,79 +32,6 @@ response2 = completion(
 # response1 == response2, response 1 is cached
 ```
 
-## Using Redis Cache with LiteLLM
-### Prerequisites
-Install the `redis` Python client:
-```
-pip install redis
-```
-For the hosted version, you can set up your own Redis DB here: https://app.redislabs.com/
-### Usage
-```python
-import litellm
-from litellm import completion
-from litellm.caching import Cache
-litellm.cache = Cache(type="redis", host="<your-redis-host>", port="<your-redis-port>", password="<your-redis-password>")
-
-# Make completion calls
-response1 = completion(
-    model="gpt-3.5-turbo",
-    messages=[{"role": "user", "content": "Tell me a joke."}],
-    caching=True
-)
-response2 = completion(
-    model="gpt-3.5-turbo",
-    messages=[{"role": "user", "content": "Tell me a joke."}],
-    caching=True
-)
-
-# response1 == response2, response 1 is cached
-```
-
-### Custom Cache Keys
-
-Define a function that returns the cache key:
-```python
-# this function takes in *args, **kwargs and returns the key you want to use for caching
-def custom_get_cache_key(*args, **kwargs):
-    # return the key to use for your cache:
-    key = kwargs.get("model", "") + str(kwargs.get("messages", "")) + str(kwargs.get("temperature", "")) + str(kwargs.get("logit_bias", ""))
-    print("key for cache", key)
-    return key
-```
-
-Set your function as `litellm.cache.get_cache_key`:
-```python
-import os
-import litellm
-from litellm.caching import Cache
-
-cache = Cache(type="redis", host=os.environ['REDIS_HOST'], port=os.environ['REDIS_PORT'], password=os.environ['REDIS_PASSWORD'])
-cache.get_cache_key = custom_get_cache_key # set get_cache_key function for your cache
-litellm.cache = cache # set litellm.cache to your cache
-```
-
-### Detecting Cached Responses
-For responses returned as a cache hit, the response includes the param `cache` = True.
-
-Example response with a cache hit:
-```python
-{
-  'cache': True,
-  'id': 'chatcmpl-7wggdzd6OXhgE2YhcLJHJNZsEWzZ2',
-  'created': 1694221467,
-  'model': 'gpt-3.5-turbo-0613',
-  'choices': [
-    {
-      'index': 0,
-      'message': {'role': 'assistant', 'content': 'I\'m sorry, but I couldn\'t find any information about "litellm" or how many stars it has. It is possible that you may be referring to a specific product, service, or platform that I am not familiar with. Can you please provide more context or clarify your question?'},
-      'finish_reason': 'stop'
-    }
-  ],
-  'usage': {'prompt_tokens': 17, 'completion_tokens': 59, 'total_tokens': 76},
-}
-```
 
 ## Caching with Streaming
 LiteLLM can cache your streamed responses for you
diff --git a/docs/my-website/docs/caching/redis_cache.md b/docs/my-website/docs/caching/redis_cache.md
new file mode 100644
index 000000000..f0fcc6952
--- /dev/null
+++ b/docs/my-website/docs/caching/redis_cache.md
@@ -0,0 +1,73 @@
+# Redis Cache
+### Prerequisites
+Install the `redis` Python client:
+```
+pip install redis
+```
+For the hosted version, you can set up your own Redis DB here: https://app.redislabs.com/
+### Usage
+```python
+import litellm
+from litellm import completion
+from litellm.caching import Cache
+litellm.cache = Cache(type="redis", host="<your-redis-host>", port="<your-redis-port>", password="<your-redis-password>")
+
+# Make completion calls
+response1 = completion(
+    model="gpt-3.5-turbo",
+    messages=[{"role": "user", "content": "Tell me a joke."}],
+    caching=True
+)
+response2 = completion(
+    model="gpt-3.5-turbo",
+    messages=[{"role": "user", "content": "Tell me a joke."}],
+    caching=True
+)
+
+# response1 == response2, response 1 is cached
+```
+
+### Custom Cache Keys
+
+Define a function that returns the cache key:
+```python
+# this function takes in *args, **kwargs and returns the key you want to use for caching
+def custom_get_cache_key(*args, **kwargs):
+    # return the key to use for your cache:
+    key = kwargs.get("model", "") + str(kwargs.get("messages", "")) + str(kwargs.get("temperature", "")) + str(kwargs.get("logit_bias", ""))
+    print("key for cache", key)
+    return key
+```
+
+Set your function as `litellm.cache.get_cache_key`:
+```python
+import os
+import litellm
+from litellm.caching import Cache
+
+cache = Cache(type="redis", host=os.environ['REDIS_HOST'], port=os.environ['REDIS_PORT'], password=os.environ['REDIS_PASSWORD'])
+cache.get_cache_key = custom_get_cache_key # set get_cache_key function for your cache
+litellm.cache = cache # set litellm.cache to your cache
+```
+
+### Detecting Cached Responses
+For responses returned as a cache hit, the response includes the param `cache` = True.
+
+Example response with a cache hit:
+```python
+{
+  'cache': True,
+  'id': 'chatcmpl-7wggdzd6OXhgE2YhcLJHJNZsEWzZ2',
+  'created': 1694221467,
+  'model': 'gpt-3.5-turbo-0613',
+  'choices': [
+    {
+      'index': 0,
+      'message': {'role': 'assistant', 'content': 'I\'m sorry, but I couldn\'t find any information about "litellm" or how many stars it has. It is possible that you may be referring to a specific product, service, or platform that I am not familiar with. Can you please provide more context or clarify your question?'},
+      'finish_reason': 'stop'
+    }
+  ],
+  'usage': {'prompt_tokens': 17, 'completion_tokens': 59, 'total_tokens': 76},
+}
+```
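+
+You can branch on this flag in code. Below is a minimal sketch, assuming the response object supports dict-style access as shown in the example above:
+```python
+import litellm
+from litellm import completion
+from litellm.caching import Cache
+
+litellm.cache = Cache(type="redis", host="<your-redis-host>", port="<your-redis-port>", password="<your-redis-password>")
+
+response = completion(
+    model="gpt-3.5-turbo",
+    messages=[{"role": "user", "content": "Tell me a joke."}],
+    caching=True
+)
+
+# the 'cache' param is only present on cache hits (dict-style access assumed)
+if response.get("cache", False):
+    print("cache hit: response served from Redis")
+else:
+    print("cache miss: response came from a new LLM call")
+```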
\ No newline at end of file
diff --git a/docs/my-website/sidebars.js b/docs/my-website/sidebars.js
index addcfe62e..a62e14236 100644
--- a/docs/my-website/sidebars.js
+++ b/docs/my-website/sidebars.js
@@ -130,6 +130,7 @@ const sidebars = {
       label: "Caching",
       items: [
         "caching/caching",
+        "caching/redis_cache",
         "caching/caching_api",
         "caching/gpt_cache",
       ],