forked from phoenix/litellm-mirror
Merge pull request #5402 from ajeetdsouza/patch-1
docs: add time.sleep() between streaming calls
This commit is contained in:
commit
3df1186d72
1 changed file with 4 additions and 1 deletion
|
@@ -51,8 +51,10 @@ LiteLLM can cache your streamed responses for you

### Usage

```python
import litellm
import time
from litellm import completion
from litellm.caching import Cache

litellm.cache = Cache(type="hosted")

# Make completion calls
```
|
@@ -64,6 +66,7 @@ response1 = completion(

```python
for chunk in response1:
    print(chunk)

time.sleep(1)  # cache is updated asynchronously

response2 = completion(
    model="gpt-3.5-turbo",
```
|
Loading…
Add table
Add a link
Reference in a new issue