forked from phoenix/litellm-mirror
refactor: add black formatting
parent b87d630b0a
commit 4905929de3
156 changed files with 19723 additions and 10869 deletions
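The diff below is a mechanical reformat: every file is rewritten to Black's default style (double-quoted strings, wrapped call arguments with trailing commas, normalized blank lines and comment spacing). As an illustration only, not part of the commit, a single line from the diff can be pushed through Black's Python API, assuming the black package is installed:

# Sketch: reproduce Black's output for one line from the diff below.
# Assumes `black` is installed; not part of this commit.
import black

source = "models = ['gpt-3.5-turbo', 'claude-2']\n"
formatted = black.format_str(source, mode=black.Mode())
print(formatted, end="")  # models = ["gpt-3.5-turbo", "claude-2"]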
@@ -9,33 +9,37 @@ import os
 # Define the list of models to benchmark
 # select any LLM listed here: https://docs.litellm.ai/docs/providers
-models = ['gpt-3.5-turbo', 'claude-2']
+models = ["gpt-3.5-turbo", "claude-2"]

 # Enter LLM API keys
 # https://docs.litellm.ai/docs/providers
-os.environ['OPENAI_API_KEY'] = ""
-os.environ['ANTHROPIC_API_KEY'] = ""
+os.environ["OPENAI_API_KEY"] = ""
+os.environ["ANTHROPIC_API_KEY"] = ""

 # List of questions to benchmark (replace with your questions)
-questions = [
-    "When will BerriAI IPO?",
-    "When will LiteLLM hit $100M ARR?"
-]
+questions = ["When will BerriAI IPO?", "When will LiteLLM hit $100M ARR?"]

 # Enter your system prompt here
 system_prompt = """
 You are LiteLLMs helpful assistant
 """


 @click.command()
-@click.option('--system-prompt', default="You are a helpful assistant that can answer questions.", help="System prompt for the conversation.")
+@click.option(
+    "--system-prompt",
+    default="You are a helpful assistant that can answer questions.",
+    help="System prompt for the conversation.",
+)
 def main(system_prompt):
     for question in questions:
         data = []  # Data for the current question

         with tqdm(total=len(models)) as pbar:
             for model in models:
-                colored_description = colored(f"Running question: {question} for model: {model}", 'green')
+                colored_description = colored(
+                    f"Running question: {question} for model: {model}", "green"
+                )
                 pbar.set_description(colored_description)
                 start_time = time.time()
@@ -44,35 +48,43 @@ def main(system_prompt):
                     max_tokens=500,
                     messages=[
                         {"role": "system", "content": system_prompt},
-                        {"role": "user", "content": question}
+                        {"role": "user", "content": question},
                     ],
                 )

                 end = time.time()
                 total_time = end - start_time
                 cost = completion_cost(completion_response=response)
-                raw_response = response['choices'][0]['message']['content']
+                raw_response = response["choices"][0]["message"]["content"]

-                data.append({
-                    'Model': colored(model, 'light_blue'),
-                    'Response': raw_response,  # Colorize the response
-                    'ResponseTime': colored(f"{total_time:.2f} seconds", "red"),
-                    'Cost': colored(f"${cost:.6f}", 'green'),  # Colorize the cost
-                })
+                data.append(
+                    {
+                        "Model": colored(model, "light_blue"),
+                        "Response": raw_response,  # Colorize the response
+                        "ResponseTime": colored(f"{total_time:.2f} seconds", "red"),
+                        "Cost": colored(f"${cost:.6f}", "green"),  # Colorize the cost
+                    }
+                )

                 pbar.update(1)

         # Separate headers from the data
-        headers = ['Model', 'Response', 'Response Time (seconds)', 'Cost ($)']
+        headers = ["Model", "Response", "Response Time (seconds)", "Cost ($)"]
         colwidths = [15, 80, 15, 10]

         # Create a nicely formatted table for the current question
-        table = tabulate([list(d.values()) for d in data], headers, tablefmt="grid", maxcolwidths=colwidths)
+        table = tabulate(
+            [list(d.values()) for d in data],
+            headers,
+            tablefmt="grid",
+            maxcolwidths=colwidths,
+        )

         # Print the table for the current question
-        colored_question = colored(question, 'green')
+        colored_question = colored(question, "green")
         click.echo(f"\nBenchmark Results for '{colored_question}':")
         click.echo(table)  # Display the formatted table

-if __name__ == '__main__':
+
+if __name__ == "__main__":
     main()
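The hunks above come from a Click-based benchmark script. For orientation only (not part of the commit), the measurement its inner loop performs for each model reduces to roughly this pattern; the model, question, and system prompt here are placeholders, and the matching API key is assumed to be set:

# Sketch of the per-model measurement in the benchmark loop above.
# Placeholder values only; assumes OPENAI_API_KEY is exported.
import time

from litellm import completion, completion_cost

start_time = time.time()
response = completion(
    model="gpt-3.5-turbo",
    max_tokens=500,
    messages=[
        {"role": "system", "content": "You are a helpful assistant."},
        {"role": "user", "content": "When will BerriAI IPO?"},
    ],
)
total_time = time.time() - start_time
cost = completion_cost(completion_response=response)
print(response["choices"][0]["message"]["content"])
print(f"{total_time:.2f} seconds, ${cost:.6f}")

The second changed file, shown next, is a cookbook script that runs a litellm completion and grades it with autoevals.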
@@ -1,25 +1,22 @@
 import sys, os
 import traceback
 from dotenv import load_dotenv

 load_dotenv()

 import litellm
 from litellm import embedding, completion, completion_cost

 from autoevals.llm import *

 ###################
 import litellm

 # litellm completion call
 question = "which country has the highest population"
 response = litellm.completion(
-    model = "gpt-3.5-turbo",
-    messages = [
-        {
-            "role": "user",
-            "content": question
-        }
-    ],
+    model="gpt-3.5-turbo",
+    messages=[{"role": "user", "content": question}],
 )
 print(response)
 # use the auto eval Factuality() evaluator
@@ -27,9 +24,11 @@ print(response)
 print("calling evaluator")
 evaluator = Factuality()
 result = evaluator(
-    output=response.choices[0]["message"]["content"], # response from litellm.completion()
-    expected="India", # expected output
-    input=question # question passed to litellm.completion
+    output=response.choices[0]["message"][
+        "content"
+    ],  # response from litellm.completion()
+    expected="India",  # expected output
+    input=question,  # question passed to litellm.completion
 )

 print(result)
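For readers unfamiliar with autoevals: Factuality() is an LLM-based grader, so the result printed above is a structured score object rather than a plain string. A hedged sketch of inspecting it follows; the attribute names come from autoevals' Score type as I understand it, not from this diff, so verify against the installed version:

# Sketch: inspect the Factuality result; attribute names are assumptions
# based on autoevals' Score type, not taken from this commit.
print(result.score)     # typically a float between 0 and 1
print(result.metadata)  # grader details such as the chosen rating and rationale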