(feat) ollama raise Exceptions + use LiteLLM stream wrapper

ishaan-jaff 2023-10-11 16:59:28 -07:00
parent 689acb8a08
commit 7b3ee8d129


@@ -131,13 +131,20 @@ def get_ollama_response_stream(
                     for chunk in chunks:
                         if chunk.strip() != "":
                             j = json.loads(chunk)
+                            if "error" in j:
+                                completion_obj = {
+                                    "role": "assistant",
+                                    "content": "",
+                                    "error": j
+                                }
+                                yield completion_obj
                             if "response" in j:
                                 completion_obj = {
                                     "role": "assistant",
                                     "content": "",
                                 }
                                 completion_obj["content"] = j["response"]
-                                yield {"choices": [{"delta": completion_obj}]}
+                                yield completion_obj
                 except Exception as e:
                     traceback.print_exc()
                     print(f"Error decoding JSON: {e}")
@@ -176,6 +183,13 @@ if async_generator_imported:
                         for chunk in chunks:
                             if chunk.strip() != "":
                                 j = json.loads(chunk)
+                                if "error" in j:
+                                    completion_obj = {
+                                        "role": "assistant",
+                                        "content": "",
+                                        "error": j
+                                    }
+                                    await yield_({"choices": [{"delta": completion_obj}]})
                                 if "response" in j:
                                     completion_obj = {
                                         "role": "assistant",