From ea55551001e8280a92973e54c99e1d25cfb75ba3 Mon Sep 17 00:00:00 2001 From: Xi Yan Date: Tue, 4 Mar 2025 14:00:51 -0800 Subject: [PATCH] genfiles --- .../recorded_responses/chat_completion.json | 2638 +++++++++++++++-- .../recorded_responses/chat_completion.pickle | Bin 541735 -> 620451 bytes .../recorded_responses/invoke_tool.json | 49 +- .../recorded_responses/invoke_tool.pickle | Bin 52685 -> 53549 bytes 4 files changed, 2359 insertions(+), 328 deletions(-) diff --git a/tests/integration/fixtures/recorded_responses/chat_completion.json b/tests/integration/fixtures/recorded_responses/chat_completion.json index 8a4bae93d..9168b121a 100644 --- a/tests/integration/fixtures/recorded_responses/chat_completion.json +++ b/tests/integration/fixtures/recorded_responses/chat_completion.json @@ -10665,7 +10665,7 @@ { "event": { "delta": { - "text": " provided function definitions are", + "text": " provided function definitions are not suitable for", "type": "text" }, "event_type": { @@ -10680,7 +10680,7 @@ { "event": { "delta": { - "text": " not suitable", + "text": " this task", "type": "text" }, "event_type": { @@ -10695,7 +10695,7 @@ { "event": { "delta": { - "text": " for this task. Please re", + "text": ". Please re", "type": "text" }, "event_type": { @@ -10793,7 +10793,7 @@ { "event": { "delta": { - "text": "get_boiling_point(liquid_name='polyjuice', celcius", + "text": "get_boiling_point(liquid_name='polyjuice", "type": "text" }, "event_type": { @@ -10808,7 +10808,7 @@ { "event": { "delta": { - "text": "=True)]", + "text": "', celcius=True)]", "type": "text" }, "event_type": { @@ -10832,7 +10832,7 @@ "celcius": true, "liquid_name": "polyjuice" }, - "call_id": "3cb5e131-c553-494b-ae31-7d3836fbb4d8", + "call_id": "1fc2d874-894e-4857-ae2b-7aacc75c330e", "tool_name": "get_boiling_point" }, "type": "tool_call" @@ -10905,7 +10905,7 @@ { "event": { "delta": { - "text": " function call returned an", + "text": " function call returned an error", "type": "text" }, "event_type": { @@ -10920,7 +10920,7 @@ { "event": { "delta": { - "text": " error since \"", + "text": " since \"polyjuice\" is", "type": "text" }, "event_type": { @@ -10935,7 +10935,7 @@ { "event": { "delta": { - "text": "polyjuice\" is not a real liquid. Polyju", + "text": " not a real liquid. Polyjuice is a fictional substance", "type": "text" }, "event_type": { @@ -10950,7 +10950,7 @@ { "event": { "delta": { - "text": "ice is a fictional substance from the", + "text": " from the Harry Potter series. The boiling", "type": "text" }, "event_type": { @@ -10965,7 +10965,7 @@ { "event": { "delta": { - "text": " Harry Potter series. The boiling", + "text": " point of a liquid is a physical", "type": "text" }, "event_type": { @@ -10980,7 +10980,7 @@ { "event": { "delta": { - "text": " point of a substance is a physical", + "text": " property that can be measured and", "type": "text" }, "event_type": { @@ -10995,7 +10995,7 @@ { "event": { "delta": { - "text": " property that can be measured, but it", + "text": " quantified, but it only applies", "type": "text" }, "event_type": { @@ -11010,52 +11010,7 @@ { "event": { "delta": { - "text": " only applies to real substances. 
If you", - "type": "text" - }, - "event_type": { - "__enum__": "ChatCompletionResponseEventType", - "value": "progress" - }, - "logprobs": null, - "stop_reason": null - }, - "metrics": null - }, - { - "event": { - "delta": { - "text": "'d like to know the boiling point of a different", - "type": "text" - }, - "event_type": { - "__enum__": "ChatCompletionResponseEventType", - "value": "progress" - }, - "logprobs": null, - "stop_reason": null - }, - "metrics": null - }, - { - "event": { - "delta": { - "text": " liquid, I can", - "type": "text" - }, - "event_type": { - "__enum__": "ChatCompletionResponseEventType", - "value": "progress" - }, - "logprobs": null, - "stop_reason": null - }, - "metrics": null - }, - { - "event": { - "delta": { - "text": " try to help with that.", + "text": " to real substances that exist in the physical world.", "type": "text" }, "event_type": { @@ -11123,7 +11078,7 @@ { "event": { "delta": { - "text": "get_boiling_point(liquid", + "text": "get_boiling_point(liquid_name='polyjuice", "type": "text" }, "event_type": { @@ -11138,22 +11093,7 @@ { "event": { "delta": { - "text": "_name='polyjuice', celcius=True", - "type": "text" - }, - "event_type": { - "__enum__": "ChatCompletionResponseEventType", - "value": "progress" - }, - "logprobs": null, - "stop_reason": null - }, - "metrics": null - }, - { - "event": { - "delta": { - "text": ")]", + "text": "', celcius=True)]", "type": "text" }, "event_type": { @@ -11177,7 +11117,7 @@ "celcius": true, "liquid_name": "polyjuice" }, - "call_id": "4c62a314-448c-4cd5-a921-610583007faa", + "call_id": "7d72d1ae-9f52-40c7-8dc5-48fff52b253a", "tool_name": "get_boiling_point" }, "type": "tool_call" @@ -11250,7 +11190,7 @@ { "event": { "delta": { - "text": " I answered the", + "text": " I answered the phone, the friendly", "type": "text" }, "event_type": { @@ -11265,22 +11205,7 @@ { "event": { "delta": { - "text": " phone, the friendly voice on the other end said", - "type": "text" - }, - "event_type": { - "__enum__": "ChatCompletionResponseEventType", - "value": "progress" - }, - "logprobs": null, - "stop_reason": null - }, - "metrics": null - }, - { - "event": { - "delta": { - "text": " \"hello\" and asked how I was doing", + "text": " voice on the other end said \"hello\" and asked how I was doing", "type": "text" }, "event_type": { @@ -11423,7 +11348,7 @@ { "event": { "delta": { - "text": " the file path is correct", + "text": " the file path is correct and the file exists in the specified location. If", "type": "text" }, "event_type": { @@ -11438,7 +11363,7 @@ { "event": { "delta": { - "text": " and the file exists in the specified location. If", + "text": " the file is located in a different directory, you should", "type": "text" }, "event_type": { @@ -11453,7 +11378,7 @@ { "event": { "delta": { - "text": " the file is located in a different directory,", + "text": " provide the correct file path.\n\nAdditionally, you can", "type": "text" }, "event_type": { @@ -11468,7 +11393,7 @@ { "event": { "delta": { - "text": " you should provide the correct path to the", + "text": " use the `os` module to check if the file exists before attempting", "type": "text" }, "event_type": { @@ -11483,7 +11408,7 @@ { "event": { "delta": { - "text": " file.\n\nAdditionally, you can use the `os`", + "text": " to read it. 
Here", "type": "text" }, "event_type": { @@ -11498,7 +11423,7 @@ { "event": { "delta": { - "text": " module to check if the file exists before attempting to", + "text": "'s an example:\n\n```python\nimport os\nimport", "type": "text" }, "event_type": { @@ -11513,7 +11438,7 @@ { "event": { "delta": { - "text": " read it. Here's an example:\n\n```", + "text": " pandas as pd\n\nfile_path = \"/var/folders", "type": "text" }, "event_type": { @@ -11528,7 +11453,7 @@ { "event": { "delta": { - "text": "python\nimport os\nimport pandas as pd\n\nfile", + "text": "/rb/qv8vwgyj6yjd3t4p", "type": "text" }, "event_type": { @@ -11543,7 +11468,7 @@ { "event": { "delta": { - "text": "_path", + "text": "wsy9t0rm0000gn/T/tmp4n_d_h", "type": "text" }, "event_type": { @@ -11558,7 +11483,7 @@ { "event": { "delta": { - "text": " = \"/var/folders/rb/qvq", + "text": "5o/u4yh2j11inflation.csv\"\n\nif", "type": "text" }, "event_type": { @@ -11573,7 +11498,7 @@ { "event": { "delta": { - "text": "vwgyj6yjd3t4pwsy9t0", + "text": " os.path.isfile(file_path):\n df =", "type": "text" }, "event_type": { @@ -11588,7 +11513,7 @@ { "event": { "delta": { - "text": "rm0000gn/T/tmpdcpkc9", + "text": " pd.read_csv(file_path)\n print", "type": "text" }, "event_type": { @@ -11603,37 +11528,7 @@ { "event": { "delta": { - "text": "_f/15dhK1rDinflation.csv\"\n\nif", - "type": "text" - }, - "event_type": { - "__enum__": "ChatCompletionResponseEventType", - "value": "progress" - }, - "logprobs": null, - "stop_reason": null - }, - "metrics": null - }, - { - "event": { - "delta": { - "text": " os.path.isfile(file_path):\n df = pd.read_csv(file_path", - "type": "text" - }, - "event_type": { - "__enum__": "ChatCompletionResponseEventType", - "value": "progress" - }, - "logprobs": null, - "stop_reason": null - }, - "metrics": null - }, - { - "event": { - "delta": { - "text": ")\n print(\"Number of rows and columns in the", + "text": "(\"Number of rows and columns in the", "type": "text" }, "event_type": { @@ -11852,7 +11747,7 @@ "__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": "qvwgyj6yjd3", + "tool_call": "8vwgyj6yjd3t4pwsy9t", "type": "tool_call" }, "event_type": { @@ -11871,7 +11766,7 @@ "__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": "t4pwsy9t0rm0000gn/T/tmpd", + "tool_call": "0rm0000gn/T/tmp4n_d_h5o/u4", "type": "tool_call" }, "event_type": { @@ -11890,7 +11785,7 @@ "__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": "cpkc9_f/15dhK1rDinflation.csv\")\n", + "tool_call": "yh2j11inflation.csv\")\n# Rows\nprint(\"Number of", "type": "tool_call" }, "event_type": { @@ -11909,7 +11804,7 @@ "__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": "# Rows\nprint(\"Number of rows and columns in the data:\", df", + "tool_call": " rows and columns in the data:\", df.shape)\n# Columns\nprint(\"", "type": "tool_call" }, "event_type": { @@ -11928,7 +11823,7 @@ "__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": ".shape)\n# Columns\nprint(\"Columns of the data are:\", len(df", + "tool_call": "Columns of the data are:\", len(df.columns))\n# Column names\nprint", "type": "tool_call" }, "event_type": { @@ -11947,7 +11842,7 @@ "__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": ".columns))\n# Column names\nprint(\"Columns of the data are:\", df", + "tool_call": "(\"Columns of the data are:\", df.columns)\n# Column dtypes\n", "type": "tool_call" }, "event_type": { @@ -11966,7 +11861,7 @@ "__enum__": 
"ToolCallParseStatus", "value": "in_progress" }, - "tool_call": ".columns)\n# Column dtypes\nprint(\"Datatype of the columns are", + "tool_call": "print(\"Datatype of the columns are:\", df.dtypes)\n#", "type": "tool_call" }, "event_type": { @@ -11985,26 +11880,7 @@ "__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": ":\", df.dtypes)\n# Sample of data\nprint", - "type": "tool_call" - }, - "event_type": { - "__enum__": "ChatCompletionResponseEventType", - "value": "progress" - }, - "logprobs": null, - "stop_reason": null - }, - "metrics": null - }, - { - "event": { - "delta": { - "parse_status": { - "__enum__": "ToolCallParseStatus", - "value": "in_progress" - }, - "tool_call": "(\"Data sample from file:\")\nprint(df.head())", + "tool_call": " Sample of data\nprint(\"Data sample from file:\")\nprint(df.head())", "type": "tool_call" }, "event_type": { @@ -12025,9 +11901,866 @@ }, "tool_call": { "arguments": { - "code": "import pandas as pd\n# Load data\ndf = pd.read_csv(\"/var/folders/rb/qvqvwgyj6yjd3t4pwsy9t0rm0000gn/T/tmpdcpkc9_f/15dhK1rDinflation.csv\")\n# Rows\nprint(\"Number of rows and columns in the data:\", df.shape)\n# Columns\nprint(\"Columns of the data are:\", len(df.columns))\n# Column names\nprint(\"Columns of the data are:\", df.columns)\n# Column dtypes\nprint(\"Datatype of the columns are:\", df.dtypes)\n# Sample of data\nprint(\"Data sample from file:\")\nprint(df.head())" + "code": "import pandas as pd\n# Load data\ndf = pd.read_csv(\"/var/folders/rb/qv8vwgyj6yjd3t4pwsy9t0rm0000gn/T/tmp4n_d_h5o/u4yh2j11inflation.csv\")\n# Rows\nprint(\"Number of rows and columns in the data:\", df.shape)\n# Columns\nprint(\"Columns of the data are:\", len(df.columns))\n# Column names\nprint(\"Columns of the data are:\", df.columns)\n# Column dtypes\nprint(\"Datatype of the columns are:\", df.dtypes)\n# Sample of data\nprint(\"Data sample from file:\")\nprint(df.head())" }, - "call_id": "bdb9c5e1-2082-49c8-ab7a-15aae2135656", + "call_id": "517038eb-c373-441b-96fe-3a0e2f063fc0", + "tool_name": { + "__enum__": "BuiltinTool", + "value": "code_interpreter" + } + }, + "type": "tool_call" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": { + "__enum__": "StopReason", + "value": "end_of_turn" + } + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "complete" + }, + "logprobs": null, + "stop_reason": { + "__enum__": "StopReason", + "value": "end_of_turn" + } + }, + "metrics": null + } + ], + "type": "generator" + }, + "('meta-llama/Llama-3.3-70B-Instruct', [SystemMessage(role='system', content='You are a helpful assistant'), UserMessage(role='user', content='Here is a csv, can you describe it?', context=None), CompletionMessage(role='assistant', content='', stop_reason=, tool_calls=[ToolCall(call_id='', tool_name=, arguments={'code': 'import pandas as pd\\n\\n# Load the CSV file\\ndf = pd.read_csv(\"\")\\n\\n# Print the first few rows of the dataframe\\nprint(df.head())\\n\\n# Print information about the dataframe\\nprint(df.info())\\n\\n# Print summary statistics about the dataframe\\nprint(df.describe())'})]), ToolResponseMessage(role='tool', call_id='', tool_name=, content=\"error\\n[stdout]\\n[Errno 2] No such file or directory: 'bwrap'\\n[/stdout]\\n[stderr]\\n[Errno 2] No such file or directory: 'bwrap'\\n[/stderr]\"), CompletionMessage(role='assistant', content='The 
error message indicates that the file \"\" does not exist. This could be due to a number of reasons such as the file being deleted, the path being incorrect, or the file being moved to a different location.\\n\\nTo resolve this issue, you should ensure that the file exists and the path is correct. If the file does exist, you can try to load it using the correct path. If the file does not exist, you will need to create it or obtain it from the relevant source.\\n\\nHere is an example of how you can modify the code to handle this situation:\\n\\n```\\nimport pandas as pd\\n\\n# Define the path to the CSV file\\nfile_path = \"\"\\n\\n# Check if the file exists\\nimport os\\nif os.path.isfile(file_path):\\n # Load the CSV file\\n df = pd.read_csv(file_path)\\n\\n # Print the first few rows of the dataframe\\n print(df.head())\\n\\n # Print information about the dataframe\\n print(df.info())\\n\\n # Print summary statistics about the dataframe\\n print(df.describe())\\nelse:\\n print(\"The file does not exist.\")\\n```\\n\\nThis code will check if the file exists before attempting to load it. If the file does not exist, it will print a message indicating that the file does not exist.', stop_reason=, tool_calls=[]), UserMessage(role='user', content='Plot average yearly inflation as a time series', context=None), CompletionMessage(role='assistant', content='', stop_reason=, tool_calls=[ToolCall(call_id='', tool_name=, arguments={'code': 'import pandas as pd\\nimport matplotlib.pyplot as plt\\n\\n# Load the CSV file\\ndf = pd.read_csv(\"\")\\n\\n# Convert the \\'Year\\' column to datetime\\ndf[\\'Year\\'] = pd.to_datetime(df[\\'Year\\'], format=\\'%Y\\')\\n\\n# Group by \\'Year\\' and calculate the average inflation\\ndf_avg_inflation = df.groupby(\\'Year\\')[\\'Inflation\\'].mean().reset_index()\\n\\n# Plot the average yearly inflation as a time series\\nplt.figure(figsize=(10,6))\\nplt.plot(df_avg_inflation[\\'Year\\'], df_avg_inflation[\\'Inflation\\'], marker=\\'o\\')\\nplt.title(\\'Average Yearly Inflation\\')\\nplt.xlabel(\\'Year\\')\\nplt.ylabel(\\'Inflation\\')\\nplt.grid(True)\\nplt.show()'})]), ToolResponseMessage(role='tool', call_id='', tool_name=, content=\"error\\n[stdout]\\n[Errno 2] No such file or directory: 'bwrap'\\n[/stdout]\\n[stderr]\\n[Errno 2] No such file or directory: 'bwrap'\\n[/stderr]\")])_[('response_format', None), ('sampling_params', SamplingParams(strategy=TopPSamplingStrategy(type='top_p', temperature=0.0001, top_p=0.9), max_tokens=0, repetition_penalty=1.0)), ('stream', True), ('tool_config', ToolConfig(tool_choice=, tool_prompt_format=None, system_message_behavior=)), ('tool_prompt_format', None), ('tools', [ToolDefinition(tool_name=, description='Execute code', parameters={'code': ToolParamDefinition(param_type='string', description='The code to execute', required=True, default=None)})])]": { + "chunks": [ + { + "event": { + "delta": { + "text": "", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "start" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "The", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " error message indicates that the file \"/var/folders/rb/qv8", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": 
"progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "vwgyj6yjd3t4pwsy9t0", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "rm0000gn/T/tmpbb210725/duWDtjG", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "ninflation.csv\" does not exist. This could be due to a number", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " of reasons such as the file being deleted, the path being incorrect, or", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " the file being moved to a different location.\n\nTo resolve this issue, you", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " should ensure that the file exists and the path is correct. If the file", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " does exist, you can try to load it using the correct path. 
If", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " the file does not exist, you will need to create it or obtain it", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " from the relevant source.\n\nHere is an example of how you can modify the", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " code to handle this situation:\n\n```\nimport pandas as pd\nimport matplotlib", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": ".pyplot as plt\n\n# Define the path to the CSV file\nfile_path", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " = \"/var/folders/rb/qv8vwgyj6y", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "jd3t4pwsy9t0rm0000gn/T", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "/tmpbb210725/duWDtjGninflation.csv\"\n\n#", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " Check if the file exists\nimport os\nif os.path.isfile(file_path", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "):\n # Load the CSV file\n df = pd.read_csv(file", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "_path)\n\n # Convert the 'Year' column to datetime\n df", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "['Year'] = pd.to_datetime(df['Year'], format='%Y')\n\n", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " # Group by 'Year' and calculate the average inflation\n df", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, 
+ "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "_avg_inflation = df.groupby('Year')['Inflation'].mean().reset", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "_index()\n\n # Plot the average yearly inflation as a time series\n ", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " plt.figure(figsize=(10,6))\n plt.plot(df_avg_inflation", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "['Year'], df_avg_inflation['Inflation'], marker='o')\n", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " plt.title('Average Yearly Inflation')\n plt.xlabel('Year", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "')\n plt.ylabel('Inflation')\n plt.grid(True)\n plt", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": ".show()\nelse:\n print(\"The file does not exist.\")\n```\n\n", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "This code will check if the file exists before attempting to load it. 
If", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " the file does not exist, it will print a message indicating that the file", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " does not exist.", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "complete" + }, + "logprobs": null, + "stop_reason": { + "__enum__": "StopReason", + "value": "end_of_turn" + } + }, + "metrics": null + } + ], + "type": "generator" + }, + "('meta-llama/Llama-3.3-70B-Instruct', [SystemMessage(role='system', content='You are a helpful assistant'), UserMessage(role='user', content='Here is a csv, can you describe it?', context=None), CompletionMessage(role='assistant', content='', stop_reason=, tool_calls=[ToolCall(call_id='', tool_name=, arguments={'code': 'import pandas as pd\\n\\n# Load the CSV file\\ndf = pd.read_csv(\"\")\\n\\n# Print the first few rows of the dataframe\\nprint(df.head())\\n\\n# Print information about the dataframe\\nprint(df.info())\\n\\n# Print summary statistics about the dataframe\\nprint(df.describe())'})]), ToolResponseMessage(role='tool', call_id='', tool_name=, content=\"error\\n[stdout]\\n[Errno 2] No such file or directory: 'bwrap'\\n[/stdout]\\n[stderr]\\n[Errno 2] No such file or directory: 'bwrap'\\n[/stderr]\"), CompletionMessage(role='assistant', content='The error message indicates that the file \"\" does not exist. This could be due to a number of reasons such as the file being deleted, the path being incorrect, or the file being moved to a different location.\\n\\nTo resolve this issue, you should ensure that the file exists and the path is correct. If the file does exist, you can try to load it using the correct path. If the file does not exist, you will need to create it or obtain it from the relevant source.\\n\\nHere is an example of how you can modify the code to handle this situation:\\n\\n```\\nimport pandas as pd\\n\\n# Define the path to the CSV file\\nfile_path = \"\"\\n\\n# Check if the file exists\\nimport os\\nif os.path.isfile(file_path):\\n # Load the CSV file\\n df = pd.read_csv(file_path)\\n\\n # Print the first few rows of the dataframe\\n print(df.head())\\n\\n # Print information about the dataframe\\n print(df.info())\\n\\n # Print summary statistics about the dataframe\\n print(df.describe())\\nelse:\\n print(\"The file does not exist.\")\\n```\\n\\nThis code will check if the file exists before attempting to load it. 
If the file does not exist, it will print a message indicating that the file does not exist.', stop_reason=, tool_calls=[]), UserMessage(role='user', content='Plot average yearly inflation as a time series', context=None)])_[('response_format', None), ('sampling_params', SamplingParams(strategy=TopPSamplingStrategy(type='top_p', temperature=0.0001, top_p=0.9), max_tokens=0, repetition_penalty=1.0)), ('stream', True), ('tool_config', ToolConfig(tool_choice=, tool_prompt_format=None, system_message_behavior=)), ('tool_prompt_format', None), ('tools', [ToolDefinition(tool_name=, description='Execute code', parameters={'code': ToolParamDefinition(param_type='string', description='The code to execute', required=True, default=None)})])]": { + "chunks": [ + { + "event": { + "delta": { + "text": "", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "start" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "parse_status": { + "__enum__": "ToolCallParseStatus", + "value": "started" + }, + "tool_call": "", + "type": "tool_call" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "parse_status": { + "__enum__": "ToolCallParseStatus", + "value": "in_progress" + }, + "tool_call": "import pandas as pd\nimport matplotlib.pyplot as plt\n\n# Load the CSV", + "type": "tool_call" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "parse_status": { + "__enum__": "ToolCallParseStatus", + "value": "in_progress" + }, + "tool_call": " file\ndf = pd.read_csv(\"/var/folders/rb/qv", + "type": "tool_call" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "parse_status": { + "__enum__": "ToolCallParseStatus", + "value": "in_progress" + }, + "tool_call": "8vwgyj6yjd3t4pwsy9t", + "type": "tool_call" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "parse_status": { + "__enum__": "ToolCallParseStatus", + "value": "in_progress" + }, + "tool_call": "0rm0000gn/T/tmpbb210725/duWDtj", + "type": "tool_call" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "parse_status": { + "__enum__": "ToolCallParseStatus", + "value": "in_progress" + }, + "tool_call": "Gninflation.csv\")\n\n# Convert the 'Year' column to datetime\n", + "type": "tool_call" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "parse_status": { + "__enum__": "ToolCallParseStatus", + "value": "in_progress" + }, + "tool_call": "df['Year'] = pd.to_datetime(df['Year'], format", + "type": "tool_call" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + 
"event": { + "delta": { + "parse_status": { + "__enum__": "ToolCallParseStatus", + "value": "in_progress" + }, + "tool_call": "='%Y')\n\n# Group by 'Year' and calculate", + "type": "tool_call" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "parse_status": { + "__enum__": "ToolCallParseStatus", + "value": "in_progress" + }, + "tool_call": " the average inflation\ndf_avg_inflation = df.groupby('", + "type": "tool_call" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "parse_status": { + "__enum__": "ToolCallParseStatus", + "value": "in_progress" + }, + "tool_call": "Year')['Inflation'].mean().reset_index()\n\n# Plot the average yearly", + "type": "tool_call" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "parse_status": { + "__enum__": "ToolCallParseStatus", + "value": "in_progress" + }, + "tool_call": " inflation as a time series\nplt.figure(figsize=(10", + "type": "tool_call" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "parse_status": { + "__enum__": "ToolCallParseStatus", + "value": "in_progress" + }, + "tool_call": ",6))\nplt.plot(df_avg_inflation['Year'], df_avg_in", + "type": "tool_call" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "parse_status": { + "__enum__": "ToolCallParseStatus", + "value": "in_progress" + }, + "tool_call": "flation['Inflation'], marker='o')\nplt.title('Average Yearly", + "type": "tool_call" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "parse_status": { + "__enum__": "ToolCallParseStatus", + "value": "in_progress" + }, + "tool_call": " Inflation')\nplt.xlabel('Year')\nplt.ylabel('Inflation')\nplt", + "type": "tool_call" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "parse_status": { + "__enum__": "ToolCallParseStatus", + "value": "in_progress" + }, + "tool_call": ".grid(True)\nplt.show()", + "type": "tool_call" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "parse_status": { + "__enum__": "ToolCallParseStatus", + "value": "succeeded" + }, + "tool_call": { + "arguments": { + "code": "import pandas as pd\nimport matplotlib.pyplot as plt\n\n# Load the CSV file\ndf = pd.read_csv(\"/var/folders/rb/qv8vwgyj6yjd3t4pwsy9t0rm0000gn/T/tmpbb210725/duWDtjGninflation.csv\")\n\n# Convert the 'Year' column to datetime\ndf['Year'] = pd.to_datetime(df['Year'], format='%Y')\n\n# Group by 'Year' and calculate the average inflation\ndf_avg_inflation = 
df.groupby('Year')['Inflation'].mean().reset_index()\n\n# Plot the average yearly inflation as a time series\nplt.figure(figsize=(10,6))\nplt.plot(df_avg_inflation['Year'], df_avg_inflation['Inflation'], marker='o')\nplt.title('Average Yearly Inflation')\nplt.xlabel('Year')\nplt.ylabel('Inflation')\nplt.grid(True)\nplt.show()" + }, + "call_id": "a6646608-a943-4849-884e-1852d5ef4a7e", "tool_name": { "__enum__": "BuiltinTool", "value": "code_interpreter" @@ -14650,6 +15383,494 @@ ], "type": "generator" }, + "('meta-llama/Llama-3.3-70B-Instruct', [SystemMessage(role='system', content='You are a helpful assistant'), UserMessage(role='user', content='Here is a csv, can you describe it?', context=None), ToolResponseMessage(role='tool', call_id='', tool_name=, content=[TextContentItem(type='text', text='# User provided a file accessible to you at \"\"\\nYou can use code_interpreter to load and inspect it.')]), CompletionMessage(role='assistant', content='', stop_reason=, tool_calls=[ToolCall(call_id='', tool_name=, arguments={'code': 'import pandas as pd\\n\\n# Load the CSV file\\ndf = pd.read_csv(\"\")\\n\\n# Print the first few rows of the dataframe\\nprint(df.head())\\n\\n# Print information about the dataframe\\nprint(df.info())\\n\\n# Print summary statistics about the dataframe\\nprint(df.describe())'})]), ToolResponseMessage(role='tool', call_id='', tool_name=, content=\"error\\n[stdout]\\n[Errno 2] No such file or directory: 'bwrap'\\n[/stdout]\\n[stderr]\\n[Errno 2] No such file or directory: 'bwrap'\\n[/stderr]\")])_[('response_format', None), ('sampling_params', SamplingParams(strategy=TopPSamplingStrategy(type='top_p', temperature=0.0001, top_p=0.9), max_tokens=0, repetition_penalty=1.0)), ('stream', True), ('tool_config', ToolConfig(tool_choice=, tool_prompt_format=None, system_message_behavior=)), ('tool_prompt_format', None), ('tools', [ToolDefinition(tool_name=, description='Execute code', parameters={'code': ToolParamDefinition(param_type='string', description='The code to execute', required=True, default=None)})])]": { + "chunks": [ + { + "event": { + "delta": { + "text": "", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "start" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "The", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " error message indicates that the file \"/var/folders/rb/qv8", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "vwgyj6yjd3t4pwsy9t0", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "rm0000gn/T/tmpbb210725/duWDtjG", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "ninflation.csv\" does not exist. 
This could be", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " due to a number of reasons such as the file being deleted,", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " the path being", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " incorrect, or the file being moved to a different location.\n\nTo", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " resolve this issue, you should ensure that", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " the file exists and the path is correct. If the", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " file does exist, you can try to load", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " it using the correct path. 
If the file does", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " not exist, you will need to create it or obtain", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " it from the relevant", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " source.\n\nHere is an example of", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " how you can modify the code to handle this situation:\n\n", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "```\nimport pandas as pd\n\n# Define the path to the CSV file", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "\nfile_path = \"/var/folders/rb/qv8", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "vwgyj6yjd3t4pwsy9t0", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "rm0000gn/T/tmpbb210725/duWDtjG", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "ninflation.csv\"\n\n# Check if the file exists\nimport os", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "\nif os.path.isfile(file_path):\n # Load", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " the CSV file\n df = pd.read_csv(file_path)\n\n ", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " # Print the first few rows of the dataframe\n print(df.head())\n\n", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " # Print information about", + 
"type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " the dataframe\n print(df.info())\n\n # Print summary statistics about the", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " dataframe\n print(df.describe())\nelse:\n print(\"The file does", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " not exist.\")\n```\n\nThis code will check if the file exists before", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " attempting to load it. If the file does not exist, it will print", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " a message indicating that the file does not exist.", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "complete" + }, + "logprobs": null, + "stop_reason": { + "__enum__": "StopReason", + "value": "end_of_turn" + } + }, + "metrics": null + } + ], + "type": "generator" + }, "('meta-llama/Llama-3.3-70B-Instruct', [SystemMessage(role='system', content='You are a helpful assistant'), UserMessage(role='user', content='Here is a csv, can you describe it?', context=None), ToolResponseMessage(role='tool', call_id='', tool_name=, content=[TextContentItem(type='text', text='# User provided a file accessible to you at \"\"\\nYou can use code_interpreter to load and inspect it.')]), CompletionMessage(role='assistant', content='', stop_reason=, tool_calls=[ToolCall(call_id='', tool_name=, arguments={'code': 'import pandas as pd\\n\\n# Load the CSV file\\ndf = pd.read_csv(\"\")\\n\\n# Print the first few rows of the dataframe\\nprint(df.head())\\n\\n# Print information about the dataframe\\nprint(df.info())\\n\\n# Print summary statistics of the dataframe\\nprint(df.describe())'})]), ToolResponseMessage(role='tool', call_id='', tool_name=, content=\"error\\n[stdout]\\n[Errno 2] No such file or directory: 'bwrap'\\n[/stdout]\\n[stderr]\\n[Errno 2] No such file or directory: 'bwrap'\\n[/stderr]\")])_[('response_format', None), ('sampling_params', SamplingParams(strategy=TopPSamplingStrategy(type='top_p', temperature=0.0001, top_p=0.9), max_tokens=0, repetition_penalty=1.0)), ('stream', True), ('tool_config', ToolConfig(tool_choice=, tool_prompt_format=, system_message_behavior=)), ('tool_prompt_format', ), ('tools', [ToolDefinition(tool_name=, description='Execute code', parameters={'code': ToolParamDefinition(param_type='string', description='The code to execute', required=True, default=None)})])]": { "chunks": [ { @@ -15669,7 +16890,7 @@ 
"__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": "import pandas as pd\n\n# Load the CSV file\ndf = pd.read", + "tool_call": "import pandas as pd\n\n# Load the CSV file\ndf = pd.read_csv(\"/var/folders", "type": "tool_call" }, "event_type": { @@ -15688,7 +16909,7 @@ "__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": "_csv(\"/var/folders/rb/qv8vwgyj6y", + "tool_call": "/rb/qv8vwgyj6yjd3t4pwsy9t0", "type": "tool_call" }, "event_type": { @@ -15707,7 +16928,7 @@ "__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": "jd3t4pwsy9t0rm0000gn/T", + "tool_call": "rm0000gn/T/tmpbb210725/duWDtjGninflation.csv\")\n\n#", "type": "tool_call" }, "event_type": { @@ -15726,7 +16947,7 @@ "__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": "/tmpdcpkc9_f/FKWQnYoVinflation.csv\")\n\n", + "tool_call": " Print the first few rows of the dataframe\nprint(df.head())\n\n#", "type": "tool_call" }, "event_type": { @@ -15745,7 +16966,7 @@ "__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": "# Print the first few rows of the dataframe\n", + "tool_call": " Print information about", "type": "tool_call" }, "event_type": { @@ -15764,7 +16985,7 @@ "__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": "print(df.head())\n\n# Print information about", + "tool_call": " the dataframe\nprint(df.info())\n\n# Print summary statistics about the", "type": "tool_call" }, "event_type": { @@ -15783,45 +17004,7 @@ "__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": " the dataframe\nprint(df", - "type": "tool_call" - }, - "event_type": { - "__enum__": "ChatCompletionResponseEventType", - "value": "progress" - }, - "logprobs": null, - "stop_reason": null - }, - "metrics": null - }, - { - "event": { - "delta": { - "parse_status": { - "__enum__": "ToolCallParseStatus", - "value": "in_progress" - }, - "tool_call": ".info())\n\n# Print summary statistics of the dataframe\nprint(df.describe", - "type": "tool_call" - }, - "event_type": { - "__enum__": "ChatCompletionResponseEventType", - "value": "progress" - }, - "logprobs": null, - "stop_reason": null - }, - "metrics": null - }, - { - "event": { - "delta": { - "parse_status": { - "__enum__": "ToolCallParseStatus", - "value": "in_progress" - }, - "tool_call": "())", + "tool_call": " dataframe\nprint(df.describe())", "type": "tool_call" }, "event_type": { @@ -15842,9 +17025,9 @@ }, "tool_call": { "arguments": { - "code": "import pandas as pd\n\n# Load the CSV file\ndf = pd.read_csv(\"/var/folders/rb/qv8vwgyj6yjd3t4pwsy9t0rm0000gn/T/tmpdcpkc9_f/FKWQnYoVinflation.csv\")\n\n# Print the first few rows of the dataframe\nprint(df.head())\n\n# Print information about the dataframe\nprint(df.info())\n\n# Print summary statistics of the dataframe\nprint(df.describe())" + "code": "import pandas as pd\n\n# Load the CSV file\ndf = pd.read_csv(\"/var/folders/rb/qv8vwgyj6yjd3t4pwsy9t0rm0000gn/T/tmpbb210725/duWDtjGninflation.csv\")\n\n# Print the first few rows of the dataframe\nprint(df.head())\n\n# Print information about the dataframe\nprint(df.info())\n\n# Print summary statistics about the dataframe\nprint(df.describe())" }, - "call_id": "4208ff16-c9e6-4754-8566-8aeb587afcb3", + "call_id": "3ab348fd-a9b8-47d7-be10-7d38159c9a0d", "tool_name": { "__enum__": "BuiltinTool", "value": "code_interpreter" @@ -16477,6 +17660,673 @@ ], "type": "generator" }, + "('meta-llama/Llama-3.3-70B-Instruct', [SystemMessage(role='system', content='You are a helpful 
assistant'), UserMessage(role='user', content='I am attaching some documentation for Torchtune. Help me answer questions I will ask next.', context=None), CompletionMessage(role='assistant', content='', stop_reason=, tool_calls=[ToolCall(call_id='', tool_name='knowledge_search', arguments={'query': 'Torchtune documentation'})]), ToolResponseMessage(role='tool', call_id='', tool_name='knowledge_search', content=[TextContentItem(type='text', text='knowledge_search tool found 5 chunks:\\nBEGIN of knowledge_search tool results.\\n'), TextContentItem(type='text', text='Result 1:\\nDocument_id:f76dc\\nContent: conversational data, :func:`~torchtune.datasets.chat_dataset` seems to be a good fit. For any\\ncustom local dataset we always need to specify ``source``, ``data_files``, and ``split`` for any dataset\\nbuilder in torchtune. For :func:`~torchtune.datasets.chat_dataset`, we additionally need to specify\\n``conversation_column`` and ``conversation_style``. Our data follows the ``\"sharegpt\"`` format, so\\nwe can specify that here. Altogether, our :func:`~torchtune.datasets.chat_dataset` call should\\nlook like so:\\n\\n.. code-block:: python\\n\\n from torchtune.datasets import chat_dataset\\n from torchtune.models.llama3 import llama3_tokenizer\\n\\n tokenizer = llama3_tokenizer(\"/tmp/Meta-Llama-3-8B-Instruct/original/tokenizer.model\")\\n ds = chat_dataset(\\n tokenizer=tokenizer,\\n source=\"json\",\\n data_files=\"data/my_data.json\",\\n split=\"train\",\\n conversation_column=\"dialogue\",\\n conversation_style=\"sharegpt\",\\n )\\n\\n.. code-block:: yaml\\n\\n # In config\\n tokenizer:\\n _component_: torchtune.models.llama3.llama3_tokenizer\\n path: /tmp/Meta-Llama-3-8B-Instruct/original/tokenizer.model\\n\\n dataset:\\n _component_: torchtune.datasets.chat_dataset\\n source: json\\n data_files: data/my_data.json\\n split: train\\n conversation_column: dialogue\\n conversation_style: sharegpt\\n\\n.. note::\\n You can pass in any keyword argument for `load_dataset `_ into all our\\n Dataset classes and they will honor them. This is useful for common parameters\\n such as specifying the data split with :code:`split` or configuration with\\n :code:`name`\\n\\nIf you needed to add a prompt template, you would simply pass it into the tokenizer.\\nSince we\\'re fine-tuning Llama3, the tokenizer will handle all formatting for\\nus and prompt templates are optional. Other models such as Mistral\\'s :class:`~torchtune.models.mistral._tokenizer.MistralTokenizer`,\\nuse a chat template by default (:class:`~torchtune.models.mistral.MistralChatTemplate`) to format\\nall messages according to their `recommendations `_, a parameter-efficient finetuning technique,\\nand show you how you can use torchtune to finetune a Llama2 model with LoRA.\\nIf you already know what LoRA is and want to get straight to running\\nyour own LoRA finetune in torchtune, you can jump to :ref:`LoRA finetuning recipe in torchtune`.\\n\\n.. grid:: 2\\n\\n .. grid-item-card:: :octicon:`mortar-board;1em;` What you will learn\\n\\n * What LoRA is and how it saves memory during finetuning\\n * An overview of LoRA components in torchtune\\n * How to run a LoRA finetune using torchtune\\n * How to experiment with different LoRA configurations\\n\\n .. 
grid-item-card:: :octicon:`list-unordered;1em;` Prerequisites\\n\\n * Be familiar with :ref:`torchtune`\\n * Make sure to :ref:`install torchtune`\\n * Make sure you have downloaded the :ref:`Llama2-7B model weights`\\n\\nWhat is LoRA?\\n-------------\\n\\n`LoRA `_ is an adapter-based method for\\nparameter-efficient finetuning that adds trainable low-rank decomposition matrices to different layers of a neural network,\\nthen freezes the network's remaining parameters. LoRA is most commonly applied to\\ntransformer models, in which case it is common to add the low-rank matrices\\nto some of the linear projections in each transformer layer's self-attention.\\n\\n.. note::\\n\\n If you're unfamiliar, check out these references for the `definition of rank `_\\n and discussion of `low-rank approximations `_.\\n\\nBy finetuning with LoRA (as opposed to finetuning all model parameters),\\nyou can expect to see memory savings due to a substantial reduction in the\\nnumber of parameters with gradients. When using an optimizer with momentum,\\nlike `AdamW `_.\\nMake sure that you have first downloaded the Llama2 weights and tokenizer by following :ref:`these instructions`.\\nYou can then run the following command to perform a LoRA finetune of Llama2-7B with two GPUs (each having VRAM of at least 16GB):\\n\\n.. code-block:: bash\\n\\n tune run --nnodes 1 --nproc_per_node 2 lora_finetune_distributed --config llama2/7B_lora\\n\\n.. note::\\n Make sure to point to the location of your Llama2 weights and tokenizer. This can be done\\n either by adding :code:`checkpointer.checkpoint_files=[my_model_checkpoint_path] tokenizer_checkpoint=my_tokenizer_checkpoint_path`\\n or by directly modifying the :code:`7B_lora.yaml` file. See our \"\":ref:`config_tutorial_label`\" recipe\\n for more details on how you can easily clone and modify torchtune configs.\\n\\n.. note::\\n You can modify the value of :code:`nproc_per_node` depending on (a) the number of GPUs you have available,\\n and (b) the memory constraints of your hardware.\\n\\nThe preceding command will run a LoRA finetune with torchtune\\'s factory settings, but we may want to experiment a bit.\\nLet\\'s take a closer look at some of the :code:`lora_finetune_distributed` config.\\n\\n.. code-block:: yaml\\n\\n # Model Arguments\\n model:\\n _component_: lora_llama2_7b\\n lora_attn_modules: [\\'q_proj\\', \\'v_proj\\']\\n lora_rank: 8\\n lora_alpha: 16\\n ...\\n\\nWe see that the\\n'), TextContentItem(type='text', text='Result 5:\\nDocument_id:de2d4\\nContent: etune\\n:func:`torchtune.models.llama3.llama3_8b` with DoRA, you would use :func:`torchtune.models.llama3.lora_llama3_8b` with ``use_dora=True``:\\n\\n.. code-block:: bash\\n\\n tune run lora_finetune_single_device --config llama3/8B_lora_single_device \\\\\\n model.use_dora=True\\n\\n.. code-block:: yaml\\n\\n model:\\n _component_: torchtune.models.lora_llama3_8b\\n use_dora: True\\n\\nSince DoRA extends LoRA, the parameters for :ref:`customizing LoRA ` are identical. You can also quantize the base model weights like in :ref:`glossary_qlora` by using ``quantize=True`` to reap\\neven more memory savings!\\n\\n.. code-block:: bash\\n\\n tune run lora_finetune_single_device --config llama3/8B_lora_single_device \\\\\\n model.apply_lora_to_mlp=True \\\\\\n model.lora_attn_modules=[\"q_proj\",\"k_proj\",\"v_proj\"] \\\\\\n model.lora_rank=16 \\\\\\n model.lora_alpha=32 \\\\\\n model.use_dora=True \\\\\\n model.quantize_base=True\\n\\n.. 
code-block:: yaml\\n\\n model:\\n _component_: torchtune.models.lora_llama3_8b\\n apply_lora_to_mlp: True\\n lora_attn_modules: [\"q_proj\", \"k_proj\", \"v_proj\"]\\n lora_rank: 16\\n lora_alpha: 32\\n use_dora: True\\n quantize_base: True\\n\\n\\n.. note::\\n\\n Under the hood, we\\'ve enabled DoRA by adding the :class:`~torchtune.modules.peft.DoRALinear` module, which we swap\\n out for :class:`~torchtune.modules.peft.LoRALinear` when ``use_dora=True``.\\n\\n.. _glossary_distrib:\\n\\n\\n.. TODO\\n\\n.. Distributed\\n.. -----------\\n\\n.. .. _glossary_fsdp:\\n\\n.. Fully Sharded Data Parallel (FSDP)\\n.. ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\\n\\n.. All our ``_distributed`` recipes use `FSDP `.\\n.. .. _glossary_fsdp2:\\n\\n'), TextContentItem(type='text', text='END of knowledge_search tool results.\\n')]), CompletionMessage(role='assistant', content=\"I'm ready to help. What's your first question about Torchtune?\", stop_reason=, tool_calls=[]), UserMessage(role='user', content='Tell me how to use LoRA', context=None), CompletionMessage(role='assistant', content='', stop_reason=, tool_calls=[ToolCall(call_id='', tool_name='knowledge_search', arguments={'query': 'using LoRA in Torchtune'})]), ToolResponseMessage(role='tool', call_id='', tool_name='knowledge_search', content=[TextContentItem(type='text', text='knowledge_search tool found 5 chunks:\\nBEGIN of knowledge_search tool results.\\n'), TextContentItem(type='text', text=\"Result 1:\\nDocument_id:c4fc3\\nContent: .. _lora_finetune_label:\\n\\n============================\\nFine-Tuning Llama2 with LoRA\\n============================\\n\\nThis guide will teach you about `LoRA `_, a parameter-efficient finetuning technique,\\nand show you how you can use torchtune to finetune a Llama2 model with LoRA.\\nIf you already know what LoRA is and want to get straight to running\\nyour own LoRA finetune in torchtune, you can jump to :ref:`LoRA finetuning recipe in torchtune`.\\n\\n.. grid:: 2\\n\\n .. grid-item-card:: :octicon:`mortar-board;1em;` What you will learn\\n\\n * What LoRA is and how it saves memory during finetuning\\n * An overview of LoRA components in torchtune\\n * How to run a LoRA finetune using torchtune\\n * How to experiment with different LoRA configurations\\n\\n .. grid-item-card:: :octicon:`list-unordered;1em;` Prerequisites\\n\\n * Be familiar with :ref:`torchtune`\\n * Make sure to :ref:`install torchtune`\\n * Make sure you have downloaded the :ref:`Llama2-7B model weights`\\n\\nWhat is LoRA?\\n-------------\\n\\n`LoRA `_ is an adapter-based method for\\nparameter-efficient finetuning that adds trainable low-rank decomposition matrices to different layers of a neural network,\\nthen freezes the network's remaining parameters. LoRA is most commonly applied to\\ntransformer models, in which case it is common to add the low-rank matrices\\nto some of the linear projections in each transformer layer's self-attention.\\n\\n.. note::\\n\\n If you're unfamiliar, check out these references for the `definition of rank `_\\n and discussion of `low-rank approximations `_.\\n\\nBy finetuning with LoRA (as opposed to finetuning all model parameters),\\nyou can expect to see memory savings due to a substantial reduction in the\\nnumber of parameters with gradients. When using an optimizer with momentum,\\nlike `AdamW ` alone will not handle the definition of which parameters are trainable.\\n See :ref:`below` for how to do this.\\n\\nLet\\'s inspect each of these models a bit more closely.\\n\\n.. 
code-block:: bash\\n\\n # Print the first layer\\'s self-attention in the usual Llama2 model\\n >>> print(base_model.layers[0].attn)\\n MultiHeadAttention(\\n (q_proj): Linear(in_features=4096, out_features=4096, bias=False)\\n (k_proj): Linear(in_features=4096, out_features=4096, bias=False)\\n (v_proj): Linear(in_features=4096, out_features=4096, bias=False)\\n (output_proj): Linear(in_features=4096, out_features=4096, bias=False)\\n (pos_embeddings): RotaryPositionalEmbeddings()\\n )\\n\\n # Print the same for Llama2 with LoRA weights\\n >>> print(lora_model.layers[0].attn)\\n MultiHeadAttention(\\n (q_proj): LoRALinear(\\n (dropout): Dropout(p=0.0, inplace=False)\\n \\n'), TextContentItem(type='text', text='Result 3:\\nDocument_id:c4fc3\\nContent: 06% of all params are trainable.\\n\\n.. note::\\n If you are directly using the LoRA recipe (as detailed :ref:`here`), you need only pass the\\n relevant checkpoint path. Loading model weights and setting trainable parameters will be taken care\\n of in the recipe.\\n\\n\\n.. _lora_recipe_label:\\n\\nLoRA finetuning recipe in torchtune\\n-----------------------------------\\n\\nFinally, we can put it all together and finetune a model using torchtune\\'s `LoRA recipe `_.\\nMake sure that you have first downloaded the Llama2 weights and tokenizer by following :ref:`these instructions`.\\nYou can then run the following command to perform a LoRA finetune of Llama2-7B with two GPUs (each having VRAM of at least 16GB):\\n\\n.. code-block:: bash\\n\\n tune run --nnodes 1 --nproc_per_node 2 lora_finetune_distributed --config llama2/7B_lora\\n\\n.. note::\\n Make sure to point to the location of your Llama2 weights and tokenizer. This can be done\\n either by adding :code:`checkpointer.checkpoint_files=[my_model_checkpoint_path] tokenizer_checkpoint=my_tokenizer_checkpoint_path`\\n or by directly modifying the :code:`7B_lora.yaml` file. See our \"\":ref:`config_tutorial_label`\" recipe\\n for more details on how you can easily clone and modify torchtune configs.\\n\\n.. note::\\n You can modify the value of :code:`nproc_per_node` depending on (a) the number of GPUs you have available,\\n and (b) the memory constraints of your hardware.\\n\\nThe preceding command will run a LoRA finetune with torchtune\\'s factory settings, but we may want to experiment a bit.\\nLet\\'s take a closer look at some of the :code:`lora_finetune_distributed` config.\\n\\n.. code-block:: yaml\\n\\n # Model Arguments\\n model:\\n _component_: lora_llama2_7b\\n lora_attn_modules: [\\'q_proj\\', \\'v_proj\\']\\n lora_rank: 8\\n lora_alpha: 16\\n ...\\n\\nWe see that the\\n'), TextContentItem(type='text', text='Result 4:\\nDocument_id:c4fc3\\nContent: from our Llama2\\nmodel without any wrappers or custom checkpoint conversion logic.\\n\\n.. code-block:: python\\n\\n # Assuming that base_model already has the pretrained Llama2 weights,\\n # this will directly load them into your LoRA model without any conversion necessary.\\n lora_model.load_state_dict(base_model.state_dict(), strict=False)\\n\\n.. note::\\n Whenever loading weights with :code:`strict=False`, you should verify that any missing or extra keys in\\n the loaded :code:`state_dict` are as expected. torchtune\\'s LoRA recipes do this by default via\\n :func:`validate_missing_and_unexpected_for_lora() `.\\n\\nOnce we\\'ve loaded the base model weights, we also want to set only LoRA parameters to trainable.\\n\\n.. _setting_trainable_params:\\n\\n.. 
code-block:: python\\n\\n from torchtune.modules.peft.peft_utils import get_adapter_params, set_trainable_params\\n\\n # Fetch all params from the model that are associated with LoRA.\\n lora_params = get_adapter_params(lora_model)\\n\\n # Set requires_grad=True on lora_params, and requires_grad=False on all others.\\n set_trainable_params(lora_model, lora_params)\\n\\n # Print the total number of parameters\\n total_params = sum([p.numel() for p in lora_model.parameters()])\\n trainable_params = sum([p.numel() for p in lora_model.parameters() if p.requires_grad])\\n print(\\n f\"\"\"\\n {total_params} total params,\\n {trainable_params}\" trainable params,\\n {(100.0 * trainable_params / total_params):.2f}% of all params are trainable.\\n \"\"\"\\n )\\n\\n 6742609920 total params,\\n 4194304 trainable params,\\n 0.06% of all params are trainable.\\n\\n.. note::\\n If you are directly using the LoRA recipe (as detailed :ref:`here`), you need only pass the\\n relevant checkpoint path. Loading model weights and setting trainable parameters will be taken care\\n of in the recipe.\\n\\n\\n.. _lora_recipe_label:\\n\\nLoRA finetuning recipe in torchtune\\n-----------------------------------\\n\\nFinally, we can put it all together and finetune a model using torchtune\\'s `LoRA recipe , tool_prompt_format=None, system_message_behavior=)), ('tool_prompt_format', None), ('tools', [ToolDefinition(tool_name='knowledge_search', description='Search for information in a database.', parameters={'query': ToolParamDefinition(param_type='string', description='The query to search for. Can be a natural language sentence or keywords.', required=True, default=None)})])]": { + "chunks": [ + { + "event": { + "delta": { + "text": "", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "start" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "To", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " use LoRA in Torchtune, you can follow", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " these steps:\n\n1. Import the necessary modules: `", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "from torch", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "tune.models.llama2 import llama2_7b", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": ", lora_llama2_7b`\n2. 
Create a", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " Llama2 model with LoRA: `lora", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "_model = lora_ll", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "ama2_7b", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "(lora_attn_modules=[\"q_proj\", \"v_proj\"])`\n3", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": ". Load the pre-trained Llama2 weights into", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " the LoRA model: `lora_model.load_state", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "_dict(base_model.state_dict(), strict=False)`\n4. Set only Lo", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "RA parameters to trainable: `from torchtune.modules.peft", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": ".peft_utils import get_adapter_params,", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " set_trainable_params`\n5. 
Run the", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " LoRA finetune using torchtune's Lo", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "RA recipe: `tune run --", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "nnodes 1 --nproc_per_node 2 lora_finet", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "une_distributed --config llama2/7B_lora`\n\nYou can", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " also experiment with different LoRA configurations, such as applying Lo", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "RA to all linear layers in the self-attention, increasing the rank,", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " and scaling alpha and rank together.\n\n", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "Note: You need to have the pre-trained", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " Llama2 weights and tokenizer downloaded and installed before running the LoRA fin", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "etune. 
Additionally, you can use torch", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "tune's `WandBLogger` to generate", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " loss curves and track the experiment's", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " progress.", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "complete" + }, + "logprobs": null, + "stop_reason": { + "__enum__": "StopReason", + "value": "end_of_turn" + } + }, + "metrics": null + } + ], + "type": "generator" + }, + "('meta-llama/Llama-3.3-70B-Instruct', [SystemMessage(role='system', content='You are a helpful assistant'), UserMessage(role='user', content='I am attaching some documentation for Torchtune. Help me answer questions I will ask next.', context=None), CompletionMessage(role='assistant', content='', stop_reason=, tool_calls=[ToolCall(call_id='', tool_name='knowledge_search', arguments={'query': 'Torchtune documentation'})]), ToolResponseMessage(role='tool', call_id='', tool_name='knowledge_search', content=[TextContentItem(type='text', text='knowledge_search tool found 5 chunks:\\nBEGIN of knowledge_search tool results.\\n'), TextContentItem(type='text', text='Result 1:\\nDocument_id:f76dc\\nContent: conversational data, :func:`~torchtune.datasets.chat_dataset` seems to be a good fit. For any\\ncustom local dataset we always need to specify ``source``, ``data_files``, and ``split`` for any dataset\\nbuilder in torchtune. For :func:`~torchtune.datasets.chat_dataset`, we additionally need to specify\\n``conversation_column`` and ``conversation_style``. Our data follows the ``\"sharegpt\"`` format, so\\nwe can specify that here. Altogether, our :func:`~torchtune.datasets.chat_dataset` call should\\nlook like so:\\n\\n.. code-block:: python\\n\\n from torchtune.datasets import chat_dataset\\n from torchtune.models.llama3 import llama3_tokenizer\\n\\n tokenizer = llama3_tokenizer(\"/tmp/Meta-Llama-3-8B-Instruct/original/tokenizer.model\")\\n ds = chat_dataset(\\n tokenizer=tokenizer,\\n source=\"json\",\\n data_files=\"data/my_data.json\",\\n split=\"train\",\\n conversation_column=\"dialogue\",\\n conversation_style=\"sharegpt\",\\n )\\n\\n.. code-block:: yaml\\n\\n # In config\\n tokenizer:\\n _component_: torchtune.models.llama3.llama3_tokenizer\\n path: /tmp/Meta-Llama-3-8B-Instruct/original/tokenizer.model\\n\\n dataset:\\n _component_: torchtune.datasets.chat_dataset\\n source: json\\n data_files: data/my_data.json\\n split: train\\n conversation_column: dialogue\\n conversation_style: sharegpt\\n\\n.. note::\\n You can pass in any keyword argument for `load_dataset `_ into all our\\n Dataset classes and they will honor them. 
This is useful for common parameters\\n such as specifying the data split with :code:`split` or configuration with\\n :code:`name`\\n\\nIf you needed to add a prompt template, you would simply pass it into the tokenizer.\\nSince we\\'re fine-tuning Llama3, the tokenizer will handle all formatting for\\nus and prompt templates are optional. Other models such as Mistral\\'s :class:`~torchtune.models.mistral._tokenizer.MistralTokenizer`,\\nuse a chat template by default (:class:`~torchtune.models.mistral.MistralChatTemplate`) to format\\nall messages according to their `recommendations `_, a parameter-efficient finetuning technique,\\nand show you how you can use torchtune to finetune a Llama2 model with LoRA.\\nIf you already know what LoRA is and want to get straight to running\\nyour own LoRA finetune in torchtune, you can jump to :ref:`LoRA finetuning recipe in torchtune`.\\n\\n.. grid:: 2\\n\\n .. grid-item-card:: :octicon:`mortar-board;1em;` What you will learn\\n\\n * What LoRA is and how it saves memory during finetuning\\n * An overview of LoRA components in torchtune\\n * How to run a LoRA finetune using torchtune\\n * How to experiment with different LoRA configurations\\n\\n .. grid-item-card:: :octicon:`list-unordered;1em;` Prerequisites\\n\\n * Be familiar with :ref:`torchtune`\\n * Make sure to :ref:`install torchtune`\\n * Make sure you have downloaded the :ref:`Llama2-7B model weights`\\n\\nWhat is LoRA?\\n-------------\\n\\n`LoRA `_ is an adapter-based method for\\nparameter-efficient finetuning that adds trainable low-rank decomposition matrices to different layers of a neural network,\\nthen freezes the network's remaining parameters. LoRA is most commonly applied to\\ntransformer models, in which case it is common to add the low-rank matrices\\nto some of the linear projections in each transformer layer's self-attention.\\n\\n.. note::\\n\\n If you're unfamiliar, check out these references for the `definition of rank `_\\n and discussion of `low-rank approximations `_.\\n\\nBy finetuning with LoRA (as opposed to finetuning all model parameters),\\nyou can expect to see memory savings due to a substantial reduction in the\\nnumber of parameters with gradients. When using an optimizer with momentum,\\nlike `AdamW `_.\\nMake sure that you have first downloaded the Llama2 weights and tokenizer by following :ref:`these instructions`.\\nYou can then run the following command to perform a LoRA finetune of Llama2-7B with two GPUs (each having VRAM of at least 16GB):\\n\\n.. code-block:: bash\\n\\n tune run --nnodes 1 --nproc_per_node 2 lora_finetune_distributed --config llama2/7B_lora\\n\\n.. note::\\n Make sure to point to the location of your Llama2 weights and tokenizer. This can be done\\n either by adding :code:`checkpointer.checkpoint_files=[my_model_checkpoint_path] tokenizer_checkpoint=my_tokenizer_checkpoint_path`\\n or by directly modifying the :code:`7B_lora.yaml` file. See our \"\":ref:`config_tutorial_label`\" recipe\\n for more details on how you can easily clone and modify torchtune configs.\\n\\n.. note::\\n You can modify the value of :code:`nproc_per_node` depending on (a) the number of GPUs you have available,\\n and (b) the memory constraints of your hardware.\\n\\nThe preceding command will run a LoRA finetune with torchtune\\'s factory settings, but we may want to experiment a bit.\\nLet\\'s take a closer look at some of the :code:`lora_finetune_distributed` config.\\n\\n.. 
code-block:: yaml\\n\\n # Model Arguments\\n model:\\n _component_: lora_llama2_7b\\n lora_attn_modules: [\\'q_proj\\', \\'v_proj\\']\\n lora_rank: 8\\n lora_alpha: 16\\n ...\\n\\nWe see that the\\n'), TextContentItem(type='text', text='Result 5:\\nDocument_id:de2d4\\nContent: etune\\n:func:`torchtune.models.llama3.llama3_8b` with DoRA, you would use :func:`torchtune.models.llama3.lora_llama3_8b` with ``use_dora=True``:\\n\\n.. code-block:: bash\\n\\n tune run lora_finetune_single_device --config llama3/8B_lora_single_device \\\\\\n model.use_dora=True\\n\\n.. code-block:: yaml\\n\\n model:\\n _component_: torchtune.models.lora_llama3_8b\\n use_dora: True\\n\\nSince DoRA extends LoRA, the parameters for :ref:`customizing LoRA ` are identical. You can also quantize the base model weights like in :ref:`glossary_qlora` by using ``quantize=True`` to reap\\neven more memory savings!\\n\\n.. code-block:: bash\\n\\n tune run lora_finetune_single_device --config llama3/8B_lora_single_device \\\\\\n model.apply_lora_to_mlp=True \\\\\\n model.lora_attn_modules=[\"q_proj\",\"k_proj\",\"v_proj\"] \\\\\\n model.lora_rank=16 \\\\\\n model.lora_alpha=32 \\\\\\n model.use_dora=True \\\\\\n model.quantize_base=True\\n\\n.. code-block:: yaml\\n\\n model:\\n _component_: torchtune.models.lora_llama3_8b\\n apply_lora_to_mlp: True\\n lora_attn_modules: [\"q_proj\", \"k_proj\", \"v_proj\"]\\n lora_rank: 16\\n lora_alpha: 32\\n use_dora: True\\n quantize_base: True\\n\\n\\n.. note::\\n\\n Under the hood, we\\'ve enabled DoRA by adding the :class:`~torchtune.modules.peft.DoRALinear` module, which we swap\\n out for :class:`~torchtune.modules.peft.LoRALinear` when ``use_dora=True``.\\n\\n.. _glossary_distrib:\\n\\n\\n.. TODO\\n\\n.. Distributed\\n.. -----------\\n\\n.. .. _glossary_fsdp:\\n\\n.. Fully Sharded Data Parallel (FSDP)\\n.. ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\\n\\n.. All our ``_distributed`` recipes use `FSDP `.\\n.. .. _glossary_fsdp2:\\n\\n'), TextContentItem(type='text', text='END of knowledge_search tool results.\\n')]), CompletionMessage(role='assistant', content=\"I'm ready to help. What's your first question about Torchtune?\", stop_reason=, tool_calls=[]), UserMessage(role='user', content='Tell me how to use LoRA', context=None)])_[('response_format', None), ('sampling_params', SamplingParams(strategy=TopPSamplingStrategy(type='top_p', temperature=0.0001, top_p=0.9), max_tokens=0, repetition_penalty=1.0)), ('stream', True), ('tool_config', ToolConfig(tool_choice=, tool_prompt_format=None, system_message_behavior=)), ('tool_prompt_format', None), ('tools', [ToolDefinition(tool_name='knowledge_search', description='Search for information in a database.', parameters={'query': ToolParamDefinition(param_type='string', description='The query to search for. 
Can be a natural language sentence or keywords.', required=True, default=None)})])]": { + "chunks": [ + { + "event": { + "delta": { + "text": "", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "start" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "[k", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "nowledge_search(query=\"using LoRA in Torchtune", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "\")]", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "parse_status": { + "__enum__": "ToolCallParseStatus", + "value": "succeeded" + }, + "tool_call": { + "arguments": { + "query": "using LoRA in Torchtune" + }, + "call_id": "8413a252-8372-4061-a4a1-0a1d165dd373", + "tool_name": "knowledge_search" + }, + "type": "tool_call" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": { + "__enum__": "StopReason", + "value": "end_of_turn" + } + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "complete" + }, + "logprobs": null, + "stop_reason": { + "__enum__": "StopReason", + "value": "end_of_turn" + } + }, + "metrics": null + } + ], + "type": "generator" + }, + "('meta-llama/Llama-3.3-70B-Instruct', [SystemMessage(role='system', content='You are a helpful assistant'), UserMessage(role='user', content='I am attaching some documentation for Torchtune. Help me answer questions I will ask next.', context=None), CompletionMessage(role='assistant', content='', stop_reason=, tool_calls=[ToolCall(call_id='', tool_name='knowledge_search', arguments={'query': 'Torchtune documentation'})]), ToolResponseMessage(role='tool', call_id='', tool_name='knowledge_search', content=[TextContentItem(type='text', text='knowledge_search tool found 5 chunks:\\nBEGIN of knowledge_search tool results.\\n'), TextContentItem(type='text', text='Result 1:\\nDocument_id:f76dc\\nContent: conversational data, :func:`~torchtune.datasets.chat_dataset` seems to be a good fit. For any\\ncustom local dataset we always need to specify ``source``, ``data_files``, and ``split`` for any dataset\\nbuilder in torchtune. For :func:`~torchtune.datasets.chat_dataset`, we additionally need to specify\\n``conversation_column`` and ``conversation_style``. Our data follows the ``\"sharegpt\"`` format, so\\nwe can specify that here. Altogether, our :func:`~torchtune.datasets.chat_dataset` call should\\nlook like so:\\n\\n.. 
code-block:: python\\n\\n from torchtune.datasets import chat_dataset\\n from torchtune.models.llama3 import llama3_tokenizer\\n\\n tokenizer = llama3_tokenizer(\"/tmp/Meta-Llama-3-8B-Instruct/original/tokenizer.model\")\\n ds = chat_dataset(\\n tokenizer=tokenizer,\\n source=\"json\",\\n data_files=\"data/my_data.json\",\\n split=\"train\",\\n conversation_column=\"dialogue\",\\n conversation_style=\"sharegpt\",\\n )\\n\\n.. code-block:: yaml\\n\\n # In config\\n tokenizer:\\n _component_: torchtune.models.llama3.llama3_tokenizer\\n path: /tmp/Meta-Llama-3-8B-Instruct/original/tokenizer.model\\n\\n dataset:\\n _component_: torchtune.datasets.chat_dataset\\n source: json\\n data_files: data/my_data.json\\n split: train\\n conversation_column: dialogue\\n conversation_style: sharegpt\\n\\n.. note::\\n You can pass in any keyword argument for `load_dataset `_ into all our\\n Dataset classes and they will honor them. This is useful for common parameters\\n such as specifying the data split with :code:`split` or configuration with\\n :code:`name`\\n\\nIf you needed to add a prompt template, you would simply pass it into the tokenizer.\\nSince we\\'re fine-tuning Llama3, the tokenizer will handle all formatting for\\nus and prompt templates are optional. Other models such as Mistral\\'s :class:`~torchtune.models.mistral._tokenizer.MistralTokenizer`,\\nuse a chat template by default (:class:`~torchtune.models.mistral.MistralChatTemplate`) to format\\nall messages according to their `recommendations `_, a parameter-efficient finetuning technique,\\nand show you how you can use torchtune to finetune a Llama2 model with LoRA.\\nIf you already know what LoRA is and want to get straight to running\\nyour own LoRA finetune in torchtune, you can jump to :ref:`LoRA finetuning recipe in torchtune`.\\n\\n.. grid:: 2\\n\\n .. grid-item-card:: :octicon:`mortar-board;1em;` What you will learn\\n\\n * What LoRA is and how it saves memory during finetuning\\n * An overview of LoRA components in torchtune\\n * How to run a LoRA finetune using torchtune\\n * How to experiment with different LoRA configurations\\n\\n .. grid-item-card:: :octicon:`list-unordered;1em;` Prerequisites\\n\\n * Be familiar with :ref:`torchtune`\\n * Make sure to :ref:`install torchtune`\\n * Make sure you have downloaded the :ref:`Llama2-7B model weights`\\n\\nWhat is LoRA?\\n-------------\\n\\n`LoRA `_ is an adapter-based method for\\nparameter-efficient finetuning that adds trainable low-rank decomposition matrices to different layers of a neural network,\\nthen freezes the network's remaining parameters. LoRA is most commonly applied to\\ntransformer models, in which case it is common to add the low-rank matrices\\nto some of the linear projections in each transformer layer's self-attention.\\n\\n.. note::\\n\\n If you're unfamiliar, check out these references for the `definition of rank `_\\n and discussion of `low-rank approximations `_.\\n\\nBy finetuning with LoRA (as opposed to finetuning all model parameters),\\nyou can expect to see memory savings due to a substantial reduction in the\\nnumber of parameters with gradients. When using an optimizer with momentum,\\nlike `AdamW `_.\\nMake sure that you have first downloaded the Llama2 weights and tokenizer by following :ref:`these instructions`.\\nYou can then run the following command to perform a LoRA finetune of Llama2-7B with two GPUs (each having VRAM of at least 16GB):\\n\\n.. 
code-block:: bash\\n\\n tune run --nnodes 1 --nproc_per_node 2 lora_finetune_distributed --config llama2/7B_lora\\n\\n.. note::\\n Make sure to point to the location of your Llama2 weights and tokenizer. This can be done\\n either by adding :code:`checkpointer.checkpoint_files=[my_model_checkpoint_path] tokenizer_checkpoint=my_tokenizer_checkpoint_path`\\n or by directly modifying the :code:`7B_lora.yaml` file. See our \"\":ref:`config_tutorial_label`\" recipe\\n for more details on how you can easily clone and modify torchtune configs.\\n\\n.. note::\\n You can modify the value of :code:`nproc_per_node` depending on (a) the number of GPUs you have available,\\n and (b) the memory constraints of your hardware.\\n\\nThe preceding command will run a LoRA finetune with torchtune\\'s factory settings, but we may want to experiment a bit.\\nLet\\'s take a closer look at some of the :code:`lora_finetune_distributed` config.\\n\\n.. code-block:: yaml\\n\\n # Model Arguments\\n model:\\n _component_: lora_llama2_7b\\n lora_attn_modules: [\\'q_proj\\', \\'v_proj\\']\\n lora_rank: 8\\n lora_alpha: 16\\n ...\\n\\nWe see that the\\n'), TextContentItem(type='text', text='Result 5:\\nDocument_id:de2d4\\nContent: etune\\n:func:`torchtune.models.llama3.llama3_8b` with DoRA, you would use :func:`torchtune.models.llama3.lora_llama3_8b` with ``use_dora=True``:\\n\\n.. code-block:: bash\\n\\n tune run lora_finetune_single_device --config llama3/8B_lora_single_device \\\\\\n model.use_dora=True\\n\\n.. code-block:: yaml\\n\\n model:\\n _component_: torchtune.models.lora_llama3_8b\\n use_dora: True\\n\\nSince DoRA extends LoRA, the parameters for :ref:`customizing LoRA ` are identical. You can also quantize the base model weights like in :ref:`glossary_qlora` by using ``quantize=True`` to reap\\neven more memory savings!\\n\\n.. code-block:: bash\\n\\n tune run lora_finetune_single_device --config llama3/8B_lora_single_device \\\\\\n model.apply_lora_to_mlp=True \\\\\\n model.lora_attn_modules=[\"q_proj\",\"k_proj\",\"v_proj\"] \\\\\\n model.lora_rank=16 \\\\\\n model.lora_alpha=32 \\\\\\n model.use_dora=True \\\\\\n model.quantize_base=True\\n\\n.. code-block:: yaml\\n\\n model:\\n _component_: torchtune.models.lora_llama3_8b\\n apply_lora_to_mlp: True\\n lora_attn_modules: [\"q_proj\", \"k_proj\", \"v_proj\"]\\n lora_rank: 16\\n lora_alpha: 32\\n use_dora: True\\n quantize_base: True\\n\\n\\n.. note::\\n\\n Under the hood, we\\'ve enabled DoRA by adding the :class:`~torchtune.modules.peft.DoRALinear` module, which we swap\\n out for :class:`~torchtune.modules.peft.LoRALinear` when ``use_dora=True``.\\n\\n.. _glossary_distrib:\\n\\n\\n.. TODO\\n\\n.. Distributed\\n.. -----------\\n\\n.. .. _glossary_fsdp:\\n\\n.. Fully Sharded Data Parallel (FSDP)\\n.. ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\\n\\n.. All our ``_distributed`` recipes use `FSDP `.\\n.. .. _glossary_fsdp2:\\n\\n'), TextContentItem(type='text', text='END of knowledge_search tool results.\\n')])])_[('response_format', None), ('sampling_params', SamplingParams(strategy=TopPSamplingStrategy(type='top_p', temperature=0.0001, top_p=0.9), max_tokens=0, repetition_penalty=1.0)), ('stream', True), ('tool_config', ToolConfig(tool_choice=, tool_prompt_format=None, system_message_behavior=)), ('tool_prompt_format', None), ('tools', [ToolDefinition(tool_name='knowledge_search', description='Search for information in a database.', parameters={'query': ToolParamDefinition(param_type='string', description='The query to search for. 
Can be a natural language sentence or keywords.', required=True, default=None)})])]": { + "chunks": [ + { + "event": { + "delta": { + "text": "", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "start" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "I", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "'m ready to help. What's", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " your first question about Torchtune?", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "complete" + }, + "logprobs": null, + "stop_reason": { + "__enum__": "StopReason", + "value": "end_of_turn" + } + }, + "metrics": null + } + ], + "type": "generator" + }, "('meta-llama/Llama-3.3-70B-Instruct', [SystemMessage(role='system', content='You are a helpful assistant'), UserMessage(role='user', content='I am attaching some documentation for Torchtune. Help me answer questions I will ask next.', context=None)])_[('response_format', None), ('sampling_params', SamplingParams(strategy=TopPSamplingStrategy(type='top_p', temperature=0.0001, top_p=0.9), max_tokens=0, repetition_penalty=1.0)), ('stream', True), ('tool_config', ToolConfig(tool_choice=, tool_prompt_format=None, system_message_behavior=)), ('tool_prompt_format', None), ('tools', [ToolDefinition(tool_name='knowledge_search', description='Search for information in a database.', parameters={'query': ToolParamDefinition(param_type='string', description='The query to search for. 
Can be a natural language sentence or keywords.', required=True, default=None)})])]": { "chunks": [ { @@ -16535,7 +18385,7 @@ "arguments": { "query": "Torchtune documentation" }, - "call_id": "42e0a687-a52e-4208-8181-db6e7a84faeb", + "call_id": "f21015ed-e70b-4a2b-a038-9335acbe0c53", "tool_name": "knowledge_search" }, "type": "tool_call" @@ -16872,7 +18722,22 @@ { "event": { "delta": { - "text": " the standard multi-head attention.", + "text": " the standard", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " multi-head attention.", "type": "text" }, "event_type": { @@ -16940,7 +18805,7 @@ { "event": { "delta": { - "text": "nowledge_search(query=\"Llama3-8", + "text": "nowledge_search(query=\"Llama", "type": "text" }, "event_type": { @@ -16955,7 +18820,7 @@ { "event": { "delta": { - "text": "B attention type\")]", + "text": "3-8B attention type\")]", "type": "text" }, "event_type": { @@ -16978,7 +18843,7 @@ "arguments": { "query": "Llama3-8B attention type" }, - "call_id": "b3019313-870b-42e5-a2a3-02f933f153b1", + "call_id": "bf3bf9f9-0e56-4720-a6a9-be8ad9e8dfcb", "tool_name": "knowledge_search" }, "type": "tool_call" @@ -17051,7 +18916,7 @@ { "event": { "delta": { - "text": "nowledge_search(query=\"Llama3-8B attention", + "text": "nowledge_search(query=\"Llama", "type": "text" }, "event_type": { @@ -17066,7 +18931,7 @@ { "event": { "delta": { - "text": " type\")]", + "text": "3-8B attention type\")]", "type": "text" }, "event_type": { @@ -17089,7 +18954,7 @@ "arguments": { "query": "Llama3-8B attention type" }, - "call_id": "e4659511-69a4-412b-b995-fa90f43a25c7", + "call_id": "9c9a922f-afd6-4bc8-83ba-28211bb3fd29", "tool_name": "knowledge_search" }, "type": "tool_call" @@ -17329,7 +19194,7 @@ "arguments": { "query": "current CEO of Meta" }, - "call_id": "ccadcdbb-cfa1-4f69-9c60-0fc50ae35f11", + "call_id": "2039dce8-afbe-4517-bb4a-43c92dab8cff", "tool_name": { "__enum__": "BuiltinTool", "value": "brave_search" @@ -17405,7 +19270,22 @@ { "event": { "delta": { - "text": " boiling point of polyjuice is -100\u00b0C.", + "text": " boiling point of polyjuice is", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " -100\u00b0C.", "type": "text" }, "event_type": { @@ -17541,7 +19421,157 @@ { "event": { "delta": { - "text": " boiling point of polyjuice is -100 degrees Celsius.", + "text": " provided function \"get_boiling_point\" is", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " not sufficient to", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " answer the question as it does not contain information", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " about the boiling point of \"poly", + "type": "text" + }, + 
"event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "juice\". Polyjuice is not a", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " real liquid and does", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " not have a known boiling point. If you", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " have any other questions or need", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " information about a different liquid,", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " I would be happy to try and", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": " assist you.", "type": "text" }, "event_type": { @@ -17609,7 +19639,7 @@ { "event": { "delta": { - "text": "get_boiling_point(liquid_name='polyjuice", + "text": "get", "type": "text" }, "event_type": { @@ -17624,7 +19654,22 @@ { "event": { "delta": { - "text": "', celcius=True)]", + "text": "_boiling_point(liquid", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "_name='polyjuice', celcius=True)]", "type": "text" }, "event_type": { @@ -17648,7 +19693,7 @@ "celcius": true, "liquid_name": "polyjuice" }, - "call_id": "cbea2158-ad0a-4faf-a2ec-3e411bd5aa50", + "call_id": "302993c2-3c56-48cf-8891-afac1f20723e", "tool_name": "get_boiling_point" }, "type": "tool_call" @@ -17760,7 +19805,7 @@ "celcius": true, "liquid_name": "polyjuice" }, - "call_id": "ac3bf39b-16e7-46e9-a243-130939094e24", + "call_id": "9544e61b-5e69-427b-b30c-874fdbcf53f7", "tool_name": "get_boiling_point" }, "type": "tool_call" @@ -17863,7 +19908,7 @@ { "event": { "delta": { - "text": "'s not a real substance, it doesn't have a boiling point", + "text": "'s not a real substance, it doesn", "type": "text" }, "event_type": { @@ -17878,7 +19923,7 @@ { "event": { "delta": { - "text": ". Polyjuice Potion is a magical concoction", + "text": "'t have a boiling point. 
Polyjuice Potion is", "type": "text" }, "event_type": { @@ -17893,7 +19938,7 @@ { "event": { "delta": { - "text": " that allows the drinker to assume the form and", + "text": " a magical concoction that allows the drinker to assume the", "type": "text" }, "event_type": { @@ -17908,7 +19953,7 @@ { "event": { "delta": { - "text": " appearance of another person, but", + "text": " form and appearance of another person, but it's not", "type": "text" }, "event_type": { @@ -17923,7 +19968,7 @@ { "event": { "delta": { - "text": " it's not a physical substance that can", + "text": " a physical substance that can be measured or analyzed in the same", "type": "text" }, "event_type": { @@ -17938,7 +19983,7 @@ { "event": { "delta": { - "text": " be measured or analyzed in the same way as real-world", + "text": " way as real-world chemicals.\n\nIf", "type": "text" }, "event_type": { @@ -17953,7 +19998,7 @@ { "event": { "delta": { - "text": " chemicals.\n\nIf you have any other questions or if there", + "text": " you have any other questions or if there's anything else I can help you", "type": "text" }, "event_type": { @@ -17968,22 +20013,7 @@ { "event": { "delta": { - "text": "'s anything else I can help you with, feel free to ask", - "type": "text" - }, - "event_type": { - "__enum__": "ChatCompletionResponseEventType", - "value": "progress" - }, - "logprobs": null, - "stop_reason": null - }, - "metrics": null - }, - { - "event": { - "delta": { - "text": "!", + "text": " with, feel free to ask!", "type": "text" }, "event_type": { @@ -18090,7 +20120,7 @@ "celcius": true, "liquid_name": "polyjuice" }, - "call_id": "fc32cf9f-db3f-42a8-baad-da88903b53be", + "call_id": "ce595f0c-86f3-4055-b675-09e00007dc97", "tool_name": "get_boiling_point" }, "type": "tool_call" @@ -18246,7 +20276,7 @@ { "event": { "delta": { - "text": " 100th prime number is ", + "text": " 100th prime number is 541", "type": "text" }, "event_type": { @@ -18261,7 +20291,7 @@ { "event": { "delta": { - "text": "541.", + "text": ".", "type": "text" }, "event_type": { @@ -18356,7 +20386,7 @@ "__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": "\n if n <= 3:\n return True", + "tool_call": "\n if n <=", "type": "tool_call" }, "event_type": { @@ -18375,7 +20405,7 @@ "__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": "\n if n % 2 == 0 or n %", + "tool_call": " ", "type": "tool_call" }, "event_type": { @@ -18394,7 +20424,7 @@ "__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": " 3 == 0:\n ", + "tool_call": "3:\n return True\n if n % 2 == 0", "type": "tool_call" }, "event_type": { @@ -18413,7 +20443,7 @@ "__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": " return False\n i", + "tool_call": " or n % 3 == 0:\n return False\n i", "type": "tool_call" }, "event_type": { @@ -18432,7 +20462,7 @@ "__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": " = 5\n while i * i <= n:\n if n", + "tool_call": " = 5\n while i * i <=", "type": "tool_call" }, "event_type": { @@ -18451,7 +20481,7 @@ "__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": " % i == 0 or n % (i + 2) ==", + "tool_call": " n:\n if n % i == 0 or n % (i", "type": "tool_call" }, "event_type": { @@ -18470,7 +20500,7 @@ "__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": " 0:\n return False\n i +=", + "tool_call": " + 2) == 0:\n return False\n i +=", "type": "tool_call" }, "event_type": { @@ -18489,7 +20519,7 @@ "__enum__": 
"ToolCallParseStatus", "value": "in_progress" }, - "tool_call": " 6\n return", + "tool_call": " 6\n return True\n\ndef nth_prime(n):\n count =", "type": "tool_call" }, "event_type": { @@ -18508,7 +20538,7 @@ "__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": " True\n\ndef nth_prime(n):\n count = ", + "tool_call": " 0\n num = 2\n while True:\n if", "type": "tool_call" }, "event_type": { @@ -18527,45 +20557,7 @@ "__enum__": "ToolCallParseStatus", "value": "in_progress" }, - "tool_call": "0\n num = 2\n ", - "type": "tool_call" - }, - "event_type": { - "__enum__": "ChatCompletionResponseEventType", - "value": "progress" - }, - "logprobs": null, - "stop_reason": null - }, - "metrics": null - }, - { - "event": { - "delta": { - "parse_status": { - "__enum__": "ToolCallParseStatus", - "value": "in_progress" - }, - "tool_call": " while True:\n if is_prime(num):\n ", - "type": "tool_call" - }, - "event_type": { - "__enum__": "ChatCompletionResponseEventType", - "value": "progress" - }, - "logprobs": null, - "stop_reason": null - }, - "metrics": null - }, - { - "event": { - "delta": { - "parse_status": { - "__enum__": "ToolCallParseStatus", - "value": "in_progress" - }, - "tool_call": " count += 1\n if count == n", + "tool_call": " is_prime(num):\n count += 1\n if count == n", "type": "tool_call" }, "event_type": { @@ -18626,7 +20618,7 @@ "arguments": { "code": "def is_prime(n):\n if n <= 1:\n return False\n if n <= 3:\n return True\n if n % 2 == 0 or n % 3 == 0:\n return False\n i = 5\n while i * i <= n:\n if n % i == 0 or n % (i + 2) == 0:\n return False\n i += 6\n return True\n\ndef nth_prime(n):\n count = 0\n num = 2\n while True:\n if is_prime(num):\n count += 1\n if count == n:\n return num\n num += 1\n\nprint(nth_prime(100))" }, - "call_id": "11645d4d-35d0-4542-bc8d-d01ed1758163", + "call_id": "63d06ce7-5266-4ee8-a620-0e81cf5108a1", "tool_name": { "__enum__": "BuiltinTool", "value": "code_interpreter" @@ -18702,7 +20694,22 @@ { "event": { "delta": { - "text": "plexity the company was founded in 2022.", + "text": "plexity the company was founded in 202", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": "2.", "type": "text" }, "event_type": { @@ -18808,7 +20815,7 @@ "arguments": { "query": "Perplexity the company founding date" }, - "call_id": "42bca45b-e3d6-40a8-b110-d9d77328089e", + "call_id": "3804eaba-07f8-448c-8dd4-8ee14d748a05", "tool_name": "knowledge_search" }, "type": "tool_call" @@ -18896,7 +20903,7 @@ { "event": { "delta": { - "text": " the merger of the Basketball Association of America (BAA) and the National", + "text": " the merger of the Basketball", "type": "text" }, "event_type": { @@ -18911,7 +20918,22 @@ { "event": { "delta": { - "text": " Basketball League (NBL).", + "text": " Association of America (BAA) and the National Basketball League (NBL", + "type": "text" + }, + "event_type": { + "__enum__": "ChatCompletionResponseEventType", + "value": "progress" + }, + "logprobs": null, + "stop_reason": null + }, + "metrics": null + }, + { + "event": { + "delta": { + "text": ").", "type": "text" }, "event_type": { @@ -19002,7 +21024,7 @@ "arguments": { "query": "NBA creation date" }, - "call_id": "bc879653-70ed-4c38-8a7f-fa8a4621b088", + "call_id": "d94006c1-5692-4ada-8f1a-d09ef2d46dab", "tool_name": "knowledge_search" }, "type": "tool_call" diff --git 
a/tests/integration/fixtures/recorded_responses/chat_completion.pickle b/tests/integration/fixtures/recorded_responses/chat_completion.pickle
index aef1aa45db1fbad744a507b0f021e2d2009e06f8..c4f1c7efdc966d90b11b6df1c5f7d19982624c80 100644
GIT binary patch
delta 77771
[base85-encoded binary delta omitted]

delta 40639
[base85-encoded binary delta omitted]
z_GD0cC5=8@&#nSQA|!rBMKA4w^2SvXxO!yY<<0jur+Hj5f#x#3aZklhPi)!_Rg14!j?XK3>UXbx5tH@X6;&6LA&b9B&&GoHc5oJ^1!`)PxFLLXY z^G$oGyL>6%*M%IDu2!k~_Vo#)=|Z*2&yhkDD@d&I8&lM3y;fJIEmLZAWh$jsr_EKG zErv2>nM!RfQ|IXnYQ3hJGYluNM*V>3(&fSC3C)$K9P9Q`SBcwWIR5+=^|UmYRpHlg zuh(Jg7`l7g%B_e0%FUYr5E&#XYll0vMauWfB7tHR)A!dfM7K8Bm1C(cU0h}&h_%A3 zQ{t1oP7C*DuiF-&U)?%x_<)*DLDLla1nU5{%T9`vjt&MT$zx#7QL1;l6_x^a4v@#f z%>qW|TV1E#T6&p^Z>Nvi*avpK%k=TB9}#|8usof~j0^Hf;fd;HLgXtyL!QZIF*|j8QWDa#*z>=?xiSTXr;dc;qf{;IeV0jr zZ;w)IU5LSR6Xn6M^bu=ov8S2&X(@6}1j69YR(FfpS$Xc}6z41NW)4cwlJcr&^qFkur7)Kzd)I0<=QyCq+KILG-`p|E)G@4XauUzT|nrB}WKJA>(N#9I*AkB%AoCQ2Gt`4+C=wiEjfPSIB48s*Ey z8x3qf+?KP&R8`enc{BxYfM*^>B`c4i55E!n0Sb<*{1AU#^L0-E26YGk)G6u>e;S8? z`dwzo;AXaO@eX@C0K$!ZC?<>FP-Q^r2zf?;p&H;1t>9b;-J=jQC{RT551gH$bYeik z@tbG4P!vn&2AF4lL#2gt`ugZz?aLSRh8=H^G(;R= zx^+76V0#>`?`%*N+KGFWuyQahhjW9Npa6sC=TJTKHlqxv1@I3Z`hN=0;hu66%He5#7`csv}8rEO}tnVjF{b^>k}ZUZ}Z?8n`^6JT^X zU9G_2)NJr-Fda<1iIuDo72^V+Z4E6-mH1DCd z4GZs~wn3?uX9Y0{Z|$ODT43L`sT}?mOo#EX_#|Mh!U9Fn@==-X=wIxS`s8f2)-`Na z(lH(F*-xa;9cOxWv}^y6zLZU8bhKxmjA(1*Msm}rgW_1a8-#pM^@ejL35KT%-;5D5R6p~|CGcZ?ai zc!wqvHYd_j=xgXWNBkqfKMb_Cqa^UJ=SCwvtfM{qErqGjBU!F^q>!Oub-z1B`^^4y zN=GT+AMH=}r~BTSo*x@PkL+mAeset!!XssIus;7zVP7BKumhoOQaB8Qtv=+O7kyY3)Gv=E+5YXdMu+Fm^Q z^_H174X0BX;r1-Pa0}XT^f>pFpT^N+g%o@tcKEH1#G5P{vrS_(E7f{yo>Hr~8kMG8 ztwyQVsEit;%BZ#GYSDEkI5VD(rSN%pFfF6f@*Zw*?MU91o3eKo(^jc~3X86K8f_I) zJTBNe&;{EuH2F*#oLt4Ig>vl8^joxN9Ys(D$EwPW&&_Wn@lOVnFUntTjpI1}0sIsBL zg04awMhTw8OhtqabSWI4e&_mc-I;E>(p=puA zREKU7o2rxxYig^!^b%%JSjw$)G0=6{K|%0zjwB&Sfn>VEhTl1WlXK`?H{1zyXlflg zm$}@I$m0$hQo|&=LE)CzihMUW)Bm}R@@+9&O}T2FL1`*enb1QACL2=ZR*O<&)vDFz zGM&k!Q*|Qwes3c^TO{9z$M&Q{J>h0|i4?}$$uM{&2s8OQ^^HgT!5?FOeWuo>~xi+IlV^brSK+UVnuQLQEuJU${?ySS~@Be>vi_bfH zys6^#BDQiBvH^*X}Wy?|P%F0KpYll`;+p0`>8j)?OTaeV(x7Q51x*F`4te8-;>|sn&yX&UH%VCU<5B`YQlnL{1NP9p`2-D3M z$-3p!3Fb1h(SnvdlxWc9q6H5NnrN8wOiDGHSXgt_8l7IJ=ZBuh(+PjaPbb8{q)}3)Y#DKMO}lruHJ;e zfV5<0pj$zr4}6-;^p<5Q%nkL5ih557`lc&ts;kg~!@PM_6;`w!R>LklxEig?R*bYM z7S%Mk*TqjOhNqP&sw(DKaiuxcH49;@MiMJ8tFYP7Q;gMKItvR!<>xn4lx3kO8@;W8 z#Kb7-YZu}6%B@xN6bmcr%h7s<2{n}}S`ckzD!r-?b2zATPb-J`@|=g;MH}{^Me#+O z2r%U`io%F&;CdLMFZw6Yz|I8E_j3=pT1KGBU$EEpU7KF{3*za69`mhE5Ay(*S1h zZ3ND5t=Hea@4hTpJxU&aTL-RxhV7Bz^7z|GME`(eFZv8FV7@2ke2RUk&++FA^x+*U z)*g#4`n2xRh%ecAEcN{_c(StJ5ayBa&h0n1y%Koqmq%M(|7q{jqu!qi_elWVu7`*p zFlR3U1!ketPeA?;zI^8=MRt`i!vez^pEP}|GJ>X9V`1%ZW^CtsdTJOfQ=^CY5=Jmm zczJf#!vpl9a1V6VnB;c~;=ipP! 
zU?vBKcYXpQyN4<66o8z*hsg^JAbzVOBdANz;q6amGMRya$WI=voy7#`)mFbr(*q(4 znH~WjO(T3+zG=&X=td8oGpI_v7`6_ev!TDK)9C7SAkyRt_{GF@3yduJ%|b1lFOX-z z8?opn+Gl1aEHGgCDdLMP%&5Qs;x~PaaHfD(!tctMn7}~fCu!7HW<;j|B*eyy3=ANC z^JoAp8%*~E>1?KRyuSO7*-U`WgZL>dTgn6FSNP4Nfp9~Kw(5Gt$^zsHwmm`q)qe%U zQOTT&aodT6;1!|+@U86N<@}aeA#A5gDT7DNiRz;@@$?TqMD8z@!V!dSa0Cg<7p@g>l8Bcg%@S{wsmrA`M@*}1< z`+_>$Gp=P{qSwsfCLwPDiRfi<&$?jV$c%5%Av%H#BR8R)QV*;kVl!iK?*i}O!tu>a ze<-*nbMF~;Y(cx#o{f}lWptj&1Tx{@qQ}WbJkErB!b$XmJ>M}sLH-02>{%C{dji4b z(GxkOAM7obbcgUy(8cgqpJc*dV=AJr=!f~{5NcTdH-zh&r@S_-dYZ9#HcS*ju!G5m z+0P)RcytRrpJfugB!B!Ylk1r*W!Te4UiP_R@N-`2_v3R+Hr(Hceo{n?2$RnqAA*xt zDFqz;3%ZEs3E28=%yiFWD!vpQ{!e^`i394%7RNbY$P3I6&noCAbLYQ;E*&1bf~e+3 zQ}1JvTo?@M2&TzV_&k|TIGRpUQW8GUk~#34)7mv1MR#6NUqaGf%%N0-QaIAbCfk<^BElu$HwP1ZBb=z(&)A246wZxB+ww_=VUXs07J#2)!f91^x5xKA= zPM+_jneC^L8S+q!uOuU++<2pS!X>esRerZt%+?+y{MbXU*n&^(Jt@PbA>?06R$Y>)23 z!iuY>)s#4owR+xBV|sC>YE3>J>scM%I?s6Vs9;~UJR1~U(es0ce`LCPfhP}&2O+70 zpU`tSo%p@<#Z(e3bdr5xs3NzFfYw7sx zD)UYcP-$fp8j{x_LML^NN#t-H6dV2$`FfInRTKtQ(oux#R*dWJp?9n7I36pt#)})9 z125~OW870}_0kF)jj1femU%K4#Kbnb3aln+OP?rMUInxMAxner z=F437(^~1_R4w1b$|T2*ho##je|t=p?Q+Gjrh?5IWwQiGQA!oe+a%KnDflRAd|Nsg z9#|vI=*r%Fb-(6f-YmOKr{gf zmt^jjF(K%(Y>I#!OMs6r%Ul-;*p#mSks4vy)s~)l^fg(F3-gDr$;P`kR{Fivo12~k z=e{PQVen~biWd?8`LwjJm*m%fkhYv9IKZ`w(qW!Z!r@D( zw1`p#*8v7NE zUKo6hK{DoPdLEFwG@S)ur&(q9IhQd}+Wrge@G`%jJ!30Ta>PkJEL^rt$Mxt5YJiR>BGdC#_ zpHD7BXPL7VBhWG9G<1KvT4BA{G$BX{nbcr5W=U)uUg5hbb4S6!19t&d{?k z(4L)1Vift1_(!HYI`i*AEKtSBy%<;U?kV-|)#|;Gpr8tyXY)iqI7y*(JjGQ?4)Qd4 zv}X}%c3<`htb zG;CtyWG2eff)GmfdL^h5WG#&qR#)F9$a=x*Z6X&8o0MDL7}4gMEheqbth8#%(2s4Z z@Pi9#wMtoLEX&K&Nu~-#Z;P43uRyB$R>CpEqtPr<#`fsT3hxQP|xd diff --git a/tests/integration/fixtures/recorded_responses/invoke_tool.json b/tests/integration/fixtures/recorded_responses/invoke_tool.json index 2dde8c83c..77995f72f 100644 --- a/tests/integration/fixtures/recorded_responses/invoke_tool.json +++ b/tests/integration/fixtures/recorded_responses/invoke_tool.json @@ -44,6 +44,15 @@ "metadata": null } }, + "()_[('kwargs', {'session_id': '', 'code': 'import pandas as pd\\n\\n# Load the CSV file\\ndf = pd.read_csv(\"\")\\n\\n# Print the first few rows of the dataframe\\nprint(df.head())\\n\\n# Print information about the dataframe\\nprint(df.info())\\n\\n# Print summary statistics about the dataframe\\nprint(df.describe())'}), ('tool_name', 'code_interpreter')]": { + "type": "value", + "value": { + "content": "error\n[stdout]\n[Errno 2] No such file or directory: 'bwrap'\n[/stdout]\n[stderr]\n[Errno 2] No such file or directory: 'bwrap'\n[/stderr]", + "error_code": null, + "error_message": null, + "metadata": null + } + }, "()_[('kwargs', {'session_id': '', 'code': 'import pandas as pd\\n\\n# Load the CSV file\\ndf = pd.read_csv(\"\")\\n\\n# Print the first few rows of the dataframe\\nprint(df.head())\\n\\n# Print information about the dataframe\\nprint(df.info())\\n\\n# Print summary statistics of the dataframe\\nprint(df.describe())'}), ('tool_name', 'code_interpreter')]": { "type": "value", "value": { @@ -298,23 +307,23 @@ "type": "text" }, { - "text": "Result 1:\nDocument_id:3e3a0\nContent: conversational data, :func:`~torchtune.datasets.chat_dataset` seems to be a good fit. For any\ncustom local dataset we always need to specify ``source``, ``data_files``, and ``split`` for any dataset\nbuilder in torchtune. For :func:`~torchtune.datasets.chat_dataset`, we additionally need to specify\n``conversation_column`` and ``conversation_style``. Our data follows the ``\"sharegpt\"`` format, so\nwe can specify that here. 
Altogether, our :func:`~torchtune.datasets.chat_dataset` call should\nlook like so:\n\n.. code-block:: python\n\n from torchtune.datasets import chat_dataset\n from torchtune.models.llama3 import llama3_tokenizer\n\n tokenizer = llama3_tokenizer(\"/tmp/Meta-Llama-3-8B-Instruct/original/tokenizer.model\")\n ds = chat_dataset(\n tokenizer=tokenizer,\n source=\"json\",\n data_files=\"data/my_data.json\",\n split=\"train\",\n conversation_column=\"dialogue\",\n conversation_style=\"sharegpt\",\n )\n\n.. code-block:: yaml\n\n # In config\n tokenizer:\n _component_: torchtune.models.llama3.llama3_tokenizer\n path: /tmp/Meta-Llama-3-8B-Instruct/original/tokenizer.model\n\n dataset:\n _component_: torchtune.datasets.chat_dataset\n source: json\n data_files: data/my_data.json\n split: train\n conversation_column: dialogue\n conversation_style: sharegpt\n\n.. note::\n You can pass in any keyword argument for `load_dataset `_ into all our\n Dataset classes and they will honor them. This is useful for common parameters\n such as specifying the data split with :code:`split` or configuration with\n :code:`name`\n\nIf you needed to add a prompt template, you would simply pass it into the tokenizer.\nSince we're fine-tuning Llama3, the tokenizer will handle all formatting for\nus and prompt templates are optional. Other models such as Mistral's :class:`~torchtune.models.mistral._tokenizer.MistralTokenizer`,\nuse a chat template by default (:class:`~torchtune.models.mistral.MistralChatTemplate`) to format\nall messages according to their `recommendations `_ into all our\n Dataset classes and they will honor them. This is useful for common parameters\n such as specifying the data split with :code:`split` or configuration with\n :code:`name`\n\nIf you needed to add a prompt template, you would simply pass it into the tokenizer.\nSince we're fine-tuning Llama3, the tokenizer will handle all formatting for\nus and prompt templates are optional. Other models such as Mistral's :class:`~torchtune.models.mistral._tokenizer.MistralTokenizer`,\nuse a chat template by default (:class:`~torchtune.models.mistral.MistralChatTemplate`) to format\nall messages according to their `recommendations `_, a parameter-efficient finetuning technique,\nand show you how you can use torchtune to finetune a Llama2 model with LoRA.\nIf you already know what LoRA is and want to get straight to running\nyour own LoRA finetune in torchtune, you can jump to :ref:`LoRA finetuning recipe in torchtune`.\n\n.. grid:: 2\n\n .. grid-item-card:: :octicon:`mortar-board;1em;` What you will learn\n\n * What LoRA is and how it saves memory during finetuning\n * An overview of LoRA components in torchtune\n * How to run a LoRA finetune using torchtune\n * How to experiment with different LoRA configurations\n\n .. grid-item-card:: :octicon:`list-unordered;1em;` Prerequisites\n\n * Be familiar with :ref:`torchtune`\n * Make sure to :ref:`install torchtune`\n * Make sure you have downloaded the :ref:`Llama2-7B model weights`\n\nWhat is LoRA?\n-------------\n\n`LoRA `_ is an adapter-based method for\nparameter-efficient finetuning that adds trainable low-rank decomposition matrices to different layers of a neural network,\nthen freezes the network's remaining parameters. LoRA is most commonly applied to\ntransformer models, in which case it is common to add the low-rank matrices\nto some of the linear projections in each transformer layer's self-attention.\n\n.. 
note::\n\n If you're unfamiliar, check out these references for the `definition of rank `_\n and discussion of `low-rank approximations `_.\n\nBy finetuning with LoRA (as opposed to finetuning all model parameters),\nyou can expect to see memory savings due to a substantial reduction in the\nnumber of parameters with gradients. When using an optimizer with momentum,\nlike `AdamW `_, a parameter-efficient finetuning technique,\nand show you how you can use torchtune to finetune a Llama2 model with LoRA.\nIf you already know what LoRA is and want to get straight to running\nyour own LoRA finetune in torchtune, you can jump to :ref:`LoRA finetuning recipe in torchtune`.\n\n.. grid:: 2\n\n .. grid-item-card:: :octicon:`mortar-board;1em;` What you will learn\n\n * What LoRA is and how it saves memory during finetuning\n * An overview of LoRA components in torchtune\n * How to run a LoRA finetune using torchtune\n * How to experiment with different LoRA configurations\n\n .. grid-item-card:: :octicon:`list-unordered;1em;` Prerequisites\n\n * Be familiar with :ref:`torchtune`\n * Make sure to :ref:`install torchtune`\n * Make sure you have downloaded the :ref:`Llama2-7B model weights`\n\nWhat is LoRA?\n-------------\n\n`LoRA `_ is an adapter-based method for\nparameter-efficient finetuning that adds trainable low-rank decomposition matrices to different layers of a neural network,\nthen freezes the network's remaining parameters. LoRA is most commonly applied to\ntransformer models, in which case it is common to add the low-rank matrices\nto some of the linear projections in each transformer layer's self-attention.\n\n.. note::\n\n If you're unfamiliar, check out these references for the `definition of rank `_\n and discussion of `low-rank approximations `_.\n\nBy finetuning with LoRA (as opposed to finetuning all model parameters),\nyou can expect to see memory savings due to a substantial reduction in the\nnumber of parameters with gradients. When using an optimizer with momentum,\nlike `AdamW `.\n.. .. _glossary_fsdp2:\n\n", + "text": "Result 3:\nDocument_id:de2d4\nContent: ` module, which we swap\n out for :class:`~torchtune.modules.peft.LoRALinear` when ``use_dora=True``.\n\n.. _glossary_distrib:\n\n\n.. TODO\n\n.. Distributed\n.. -----------\n\n.. .. _glossary_fsdp:\n\n.. Fully Sharded Data Parallel (FSDP)\n.. ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n\n.. All our ``_distributed`` recipes use `FSDP `.\n.. .. _glossary_fsdp2:\n\n", "type": "text" }, { - "text": "Result 4:\nDocument_id:7da0c\nContent: 06% of all params are trainable.\n\n.. note::\n If you are directly using the LoRA recipe (as detailed :ref:`here`), you need only pass the\n relevant checkpoint path. Loading model weights and setting trainable parameters will be taken care\n of in the recipe.\n\n\n.. _lora_recipe_label:\n\nLoRA finetuning recipe in torchtune\n-----------------------------------\n\nFinally, we can put it all together and finetune a model using torchtune's `LoRA recipe `_.\nMake sure that you have first downloaded the Llama2 weights and tokenizer by following :ref:`these instructions`.\nYou can then run the following command to perform a LoRA finetune of Llama2-7B with two GPUs (each having VRAM of at least 16GB):\n\n.. code-block:: bash\n\n tune run --nnodes 1 --nproc_per_node 2 lora_finetune_distributed --config llama2/7B_lora\n\n.. note::\n Make sure to point to the location of your Llama2 weights and tokenizer. 
This can be done\n either by adding :code:`checkpointer.checkpoint_files=[my_model_checkpoint_path] tokenizer_checkpoint=my_tokenizer_checkpoint_path`\n or by directly modifying the :code:`7B_lora.yaml` file. See our \"\":ref:`config_tutorial_label`\" recipe\n for more details on how you can easily clone and modify torchtune configs.\n\n.. note::\n You can modify the value of :code:`nproc_per_node` depending on (a) the number of GPUs you have available,\n and (b) the memory constraints of your hardware.\n\nThe preceding command will run a LoRA finetune with torchtune's factory settings, but we may want to experiment a bit.\nLet's take a closer look at some of the :code:`lora_finetune_distributed` config.\n\n.. code-block:: yaml\n\n # Model Arguments\n model:\n _component_: lora_llama2_7b\n lora_attn_modules: ['q_proj', 'v_proj']\n lora_rank: 8\n lora_alpha: 16\n ...\n\nWe see that the\n", + "text": "Result 4:\nDocument_id:c4fc3\nContent: 06% of all params are trainable.\n\n.. note::\n If you are directly using the LoRA recipe (as detailed :ref:`here`), you need only pass the\n relevant checkpoint path. Loading model weights and setting trainable parameters will be taken care\n of in the recipe.\n\n\n.. _lora_recipe_label:\n\nLoRA finetuning recipe in torchtune\n-----------------------------------\n\nFinally, we can put it all together and finetune a model using torchtune's `LoRA recipe `_.\nMake sure that you have first downloaded the Llama2 weights and tokenizer by following :ref:`these instructions`.\nYou can then run the following command to perform a LoRA finetune of Llama2-7B with two GPUs (each having VRAM of at least 16GB):\n\n.. code-block:: bash\n\n tune run --nnodes 1 --nproc_per_node 2 lora_finetune_distributed --config llama2/7B_lora\n\n.. note::\n Make sure to point to the location of your Llama2 weights and tokenizer. This can be done\n either by adding :code:`checkpointer.checkpoint_files=[my_model_checkpoint_path] tokenizer_checkpoint=my_tokenizer_checkpoint_path`\n or by directly modifying the :code:`7B_lora.yaml` file. See our \"\":ref:`config_tutorial_label`\" recipe\n for more details on how you can easily clone and modify torchtune configs.\n\n.. note::\n You can modify the value of :code:`nproc_per_node` depending on (a) the number of GPUs you have available,\n and (b) the memory constraints of your hardware.\n\nThe preceding command will run a LoRA finetune with torchtune's factory settings, but we may want to experiment a bit.\nLet's take a closer look at some of the :code:`lora_finetune_distributed` config.\n\n.. code-block:: yaml\n\n # Model Arguments\n model:\n _component_: lora_llama2_7b\n lora_attn_modules: ['q_proj', 'v_proj']\n lora_rank: 8\n lora_alpha: 16\n ...\n\nWe see that the\n", "type": "text" }, { - "text": "Result 5:\nDocument_id:fd0f6\nContent: etune\n:func:`torchtune.models.llama3.llama3_8b` with DoRA, you would use :func:`torchtune.models.llama3.lora_llama3_8b` with ``use_dora=True``:\n\n.. code-block:: bash\n\n tune run lora_finetune_single_device --config llama3/8B_lora_single_device \\\n model.use_dora=True\n\n.. code-block:: yaml\n\n model:\n _component_: torchtune.models.lora_llama3_8b\n use_dora: True\n\nSince DoRA extends LoRA, the parameters for :ref:`customizing LoRA ` are identical. You can also quantize the base model weights like in :ref:`glossary_qlora` by using ``quantize=True`` to reap\neven more memory savings!\n\n.. 
code-block:: bash\n\n tune run lora_finetune_single_device --config llama3/8B_lora_single_device \\\n model.apply_lora_to_mlp=True \\\n model.lora_attn_modules=[\"q_proj\",\"k_proj\",\"v_proj\"] \\\n model.lora_rank=16 \\\n model.lora_alpha=32 \\\n model.use_dora=True \\\n model.quantize_base=True\n\n.. code-block:: yaml\n\n model:\n _component_: torchtune.models.lora_llama3_8b\n apply_lora_to_mlp: True\n lora_attn_modules: [\"q_proj\", \"k_proj\", \"v_proj\"]\n lora_rank: 16\n lora_alpha: 32\n use_dora: True\n quantize_base: True\n\n\n.. note::\n\n Under the hood, we've enabled DoRA by adding the :class:`~torchtune.modules.peft.DoRALinear` module, which we swap\n out for :class:`~torchtune.modules.peft.LoRALinear` when ``use_dora=True``.\n\n.. _glossary_distrib:\n\n\n.. TODO\n\n.. Distributed\n.. -----------\n\n.. .. _glossary_fsdp:\n\n.. Fully Sharded Data Parallel (FSDP)\n.. ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n\n.. All our ``_distributed`` recipes use `FSDP `.\n.. .. _glossary_fsdp2:\n\n", + "text": "Result 5:\nDocument_id:de2d4\nContent: etune\n:func:`torchtune.models.llama3.llama3_8b` with DoRA, you would use :func:`torchtune.models.llama3.lora_llama3_8b` with ``use_dora=True``:\n\n.. code-block:: bash\n\n tune run lora_finetune_single_device --config llama3/8B_lora_single_device \\\n model.use_dora=True\n\n.. code-block:: yaml\n\n model:\n _component_: torchtune.models.lora_llama3_8b\n use_dora: True\n\nSince DoRA extends LoRA, the parameters for :ref:`customizing LoRA ` are identical. You can also quantize the base model weights like in :ref:`glossary_qlora` by using ``quantize=True`` to reap\neven more memory savings!\n\n.. code-block:: bash\n\n tune run lora_finetune_single_device --config llama3/8B_lora_single_device \\\n model.apply_lora_to_mlp=True \\\n model.lora_attn_modules=[\"q_proj\",\"k_proj\",\"v_proj\"] \\\n model.lora_rank=16 \\\n model.lora_alpha=32 \\\n model.use_dora=True \\\n model.quantize_base=True\n\n.. code-block:: yaml\n\n model:\n _component_: torchtune.models.lora_llama3_8b\n apply_lora_to_mlp: True\n lora_attn_modules: [\"q_proj\", \"k_proj\", \"v_proj\"]\n lora_rank: 16\n lora_alpha: 32\n use_dora: True\n quantize_base: True\n\n\n.. note::\n\n Under the hood, we've enabled DoRA by adding the :class:`~torchtune.modules.peft.DoRALinear` module, which we swap\n out for :class:`~torchtune.modules.peft.LoRALinear` when ``use_dora=True``.\n\n.. _glossary_distrib:\n\n\n.. TODO\n\n.. Distributed\n.. -----------\n\n.. .. _glossary_fsdp:\n\n.. Fully Sharded Data Parallel (FSDP)\n.. ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n\n.. All our ``_distributed`` recipes use `FSDP `.\n.. .. _glossary_fsdp2:\n\n", "type": "text" }, { @@ -326,11 +335,11 @@ "error_message": null, "metadata": { "document_ids": [ - "3e3a05a7-23d4-461e-a304-8aa7cb35a4f5", - "7da0c755-7ffa-4c1a-9ab0-cfdda7cce00f", - "fd0f6ee9-15d2-43b3-8500-25bc5bdfd365", - "7da0c755-7ffa-4c1a-9ab0-cfdda7cce00f", - "fd0f6ee9-15d2-43b3-8500-25bc5bdfd365" + "f76dc7f5-9648-4272-a579-c8387fb1408a", + "c4fc3cb6-6172-489e-90a7-b39d343e14c0", + "de2d49de-55de-44dd-9bca-6f4f6d633b0a", + "c4fc3cb6-6172-489e-90a7-b39d343e14c0", + "de2d49de-55de-44dd-9bca-6f4f6d633b0a" ] } } @@ -353,23 +362,23 @@ "type": "text" }, { - "text": "Result 1:\nDocument_id:7da0c\nContent: .. 
_lora_finetune_label:\n\n============================\nFine-Tuning Llama2 with LoRA\n============================\n\nThis guide will teach you about `LoRA `_, a parameter-efficient finetuning technique,\nand show you how you can use torchtune to finetune a Llama2 model with LoRA.\nIf you already know what LoRA is and want to get straight to running\nyour own LoRA finetune in torchtune, you can jump to :ref:`LoRA finetuning recipe in torchtune`.\n\n.. grid:: 2\n\n .. grid-item-card:: :octicon:`mortar-board;1em;` What you will learn\n\n * What LoRA is and how it saves memory during finetuning\n * An overview of LoRA components in torchtune\n * How to run a LoRA finetune using torchtune\n * How to experiment with different LoRA configurations\n\n .. grid-item-card:: :octicon:`list-unordered;1em;` Prerequisites\n\n * Be familiar with :ref:`torchtune`\n * Make sure to :ref:`install torchtune`\n * Make sure you have downloaded the :ref:`Llama2-7B model weights`\n\nWhat is LoRA?\n-------------\n\n`LoRA `_ is an adapter-based method for\nparameter-efficient finetuning that adds trainable low-rank decomposition matrices to different layers of a neural network,\nthen freezes the network's remaining parameters. LoRA is most commonly applied to\ntransformer models, in which case it is common to add the low-rank matrices\nto some of the linear projections in each transformer layer's self-attention.\n\n.. note::\n\n If you're unfamiliar, check out these references for the `definition of rank `_\n and discussion of `low-rank approximations `_.\n\nBy finetuning with LoRA (as opposed to finetuning all model parameters),\nyou can expect to see memory savings due to a substantial reduction in the\nnumber of parameters with gradients. When using an optimizer with momentum,\nlike `AdamW `_, a parameter-efficient finetuning technique,\nand show you how you can use torchtune to finetune a Llama2 model with LoRA.\nIf you already know what LoRA is and want to get straight to running\nyour own LoRA finetune in torchtune, you can jump to :ref:`LoRA finetuning recipe in torchtune`.\n\n.. grid:: 2\n\n .. grid-item-card:: :octicon:`mortar-board;1em;` What you will learn\n\n * What LoRA is and how it saves memory during finetuning\n * An overview of LoRA components in torchtune\n * How to run a LoRA finetune using torchtune\n * How to experiment with different LoRA configurations\n\n .. grid-item-card:: :octicon:`list-unordered;1em;` Prerequisites\n\n * Be familiar with :ref:`torchtune`\n * Make sure to :ref:`install torchtune`\n * Make sure you have downloaded the :ref:`Llama2-7B model weights`\n\nWhat is LoRA?\n-------------\n\n`LoRA `_ is an adapter-based method for\nparameter-efficient finetuning that adds trainable low-rank decomposition matrices to different layers of a neural network,\nthen freezes the network's remaining parameters. LoRA is most commonly applied to\ntransformer models, in which case it is common to add the low-rank matrices\nto some of the linear projections in each transformer layer's self-attention.\n\n.. note::\n\n If you're unfamiliar, check out these references for the `definition of rank `_\n and discussion of `low-rank approximations `_.\n\nBy finetuning with LoRA (as opposed to finetuning all model parameters),\nyou can expect to see memory savings due to a substantial reduction in the\nnumber of parameters with gradients. 
When using an optimizer with momentum,\nlike `AdamW ` alone will not handle the definition of which parameters are trainable.\n See :ref:`below` for how to do this.\n\nLet's inspect each of these models a bit more closely.\n\n.. code-block:: bash\n\n # Print the first layer's self-attention in the usual Llama2 model\n >>> print(base_model.layers[0].attn)\n MultiHeadAttention(\n (q_proj): Linear(in_features=4096, out_features=4096, bias=False)\n (k_proj): Linear(in_features=4096, out_features=4096, bias=False)\n (v_proj): Linear(in_features=4096, out_features=4096, bias=False)\n (output_proj): Linear(in_features=4096, out_features=4096, bias=False)\n (pos_embeddings): RotaryPositionalEmbeddings()\n )\n\n # Print the same for Llama2 with LoRA weights\n >>> print(lora_model.layers[0].attn)\n MultiHeadAttention(\n (q_proj): LoRALinear(\n (dropout): Dropout(p=0.0, inplace=False)\n \n", + "text": "Result 2:\nDocument_id:c4fc3\nContent: LoRA to Llama2 models\n------------------------------\n\nWith torchtune, we can easily apply LoRA to Llama2 with a variety of different configurations.\nLet's take a look at how to construct Llama2 models in torchtune with and without LoRA.\n\n.. code-block:: python\n\n from torchtune.models.llama2 import llama2_7b, lora_llama2_7b\n\n # Build Llama2 without any LoRA layers\n base_model = llama2_7b()\n\n # The default settings for lora_llama2_7b will match those for llama2_7b\n # We just need to define which layers we want LoRA applied to.\n # Within each self-attention, we can choose from [\"q_proj\", \"k_proj\", \"v_proj\", and \"output_proj\"].\n # We can also set apply_lora_to_mlp=True or apply_lora_to_output=True to apply LoRA to other linear\n # layers outside of the self-attention.\n lora_model = lora_llama2_7b(lora_attn_modules=[\"q_proj\", \"v_proj\"])\n\n.. note::\n\n Calling :func:`lora_llama_2_7b ` alone will not handle the definition of which parameters are trainable.\n See :ref:`below` for how to do this.\n\nLet's inspect each of these models a bit more closely.\n\n.. code-block:: bash\n\n # Print the first layer's self-attention in the usual Llama2 model\n >>> print(base_model.layers[0].attn)\n MultiHeadAttention(\n (q_proj): Linear(in_features=4096, out_features=4096, bias=False)\n (k_proj): Linear(in_features=4096, out_features=4096, bias=False)\n (v_proj): Linear(in_features=4096, out_features=4096, bias=False)\n (output_proj): Linear(in_features=4096, out_features=4096, bias=False)\n (pos_embeddings): RotaryPositionalEmbeddings()\n )\n\n # Print the same for Llama2 with LoRA weights\n >>> print(lora_model.layers[0].attn)\n MultiHeadAttention(\n (q_proj): LoRALinear(\n (dropout): Dropout(p=0.0, inplace=False)\n \n", "type": "text" }, { - "text": "Result 3:\nDocument_id:7da0c\nContent: 06% of all params are trainable.\n\n.. note::\n If you are directly using the LoRA recipe (as detailed :ref:`here`), you need only pass the\n relevant checkpoint path. Loading model weights and setting trainable parameters will be taken care\n of in the recipe.\n\n\n.. _lora_recipe_label:\n\nLoRA finetuning recipe in torchtune\n-----------------------------------\n\nFinally, we can put it all together and finetune a model using torchtune's `LoRA recipe `_.\nMake sure that you have first downloaded the Llama2 weights and tokenizer by following :ref:`these instructions`.\nYou can then run the following command to perform a LoRA finetune of Llama2-7B with two GPUs (each having VRAM of at least 16GB):\n\n.. 
code-block:: bash\n\n tune run --nnodes 1 --nproc_per_node 2 lora_finetune_distributed --config llama2/7B_lora\n\n.. note::\n Make sure to point to the location of your Llama2 weights and tokenizer. This can be done\n either by adding :code:`checkpointer.checkpoint_files=[my_model_checkpoint_path] tokenizer_checkpoint=my_tokenizer_checkpoint_path`\n or by directly modifying the :code:`7B_lora.yaml` file. See our \"\":ref:`config_tutorial_label`\" recipe\n for more details on how you can easily clone and modify torchtune configs.\n\n.. note::\n You can modify the value of :code:`nproc_per_node` depending on (a) the number of GPUs you have available,\n and (b) the memory constraints of your hardware.\n\nThe preceding command will run a LoRA finetune with torchtune's factory settings, but we may want to experiment a bit.\nLet's take a closer look at some of the :code:`lora_finetune_distributed` config.\n\n.. code-block:: yaml\n\n # Model Arguments\n model:\n _component_: lora_llama2_7b\n lora_attn_modules: ['q_proj', 'v_proj']\n lora_rank: 8\n lora_alpha: 16\n ...\n\nWe see that the\n", + "text": "Result 3:\nDocument_id:c4fc3\nContent: 06% of all params are trainable.\n\n.. note::\n If you are directly using the LoRA recipe (as detailed :ref:`here`), you need only pass the\n relevant checkpoint path. Loading model weights and setting trainable parameters will be taken care\n of in the recipe.\n\n\n.. _lora_recipe_label:\n\nLoRA finetuning recipe in torchtune\n-----------------------------------\n\nFinally, we can put it all together and finetune a model using torchtune's `LoRA recipe `_.\nMake sure that you have first downloaded the Llama2 weights and tokenizer by following :ref:`these instructions`.\nYou can then run the following command to perform a LoRA finetune of Llama2-7B with two GPUs (each having VRAM of at least 16GB):\n\n.. code-block:: bash\n\n tune run --nnodes 1 --nproc_per_node 2 lora_finetune_distributed --config llama2/7B_lora\n\n.. note::\n Make sure to point to the location of your Llama2 weights and tokenizer. This can be done\n either by adding :code:`checkpointer.checkpoint_files=[my_model_checkpoint_path] tokenizer_checkpoint=my_tokenizer_checkpoint_path`\n or by directly modifying the :code:`7B_lora.yaml` file. See our \"\":ref:`config_tutorial_label`\" recipe\n for more details on how you can easily clone and modify torchtune configs.\n\n.. note::\n You can modify the value of :code:`nproc_per_node` depending on (a) the number of GPUs you have available,\n and (b) the memory constraints of your hardware.\n\nThe preceding command will run a LoRA finetune with torchtune's factory settings, but we may want to experiment a bit.\nLet's take a closer look at some of the :code:`lora_finetune_distributed` config.\n\n.. code-block:: yaml\n\n # Model Arguments\n model:\n _component_: lora_llama2_7b\n lora_attn_modules: ['q_proj', 'v_proj']\n lora_rank: 8\n lora_alpha: 16\n ...\n\nWe see that the\n", "type": "text" }, { - "text": "Result 4:\nDocument_id:7da0c\nContent: from our Llama2\nmodel without any wrappers or custom checkpoint conversion logic.\n\n.. code-block:: python\n\n # Assuming that base_model already has the pretrained Llama2 weights,\n # this will directly load them into your LoRA model without any conversion necessary.\n lora_model.load_state_dict(base_model.state_dict(), strict=False)\n\n.. note::\n Whenever loading weights with :code:`strict=False`, you should verify that any missing or extra keys in\n the loaded :code:`state_dict` are as expected. 
torchtune's LoRA recipes do this by default via\n :func:`validate_missing_and_unexpected_for_lora() `.\n\nOnce we've loaded the base model weights, we also want to set only LoRA parameters to trainable.\n\n.. _setting_trainable_params:\n\n.. code-block:: python\n\n from torchtune.modules.peft.peft_utils import get_adapter_params, set_trainable_params\n\n # Fetch all params from the model that are associated with LoRA.\n lora_params = get_adapter_params(lora_model)\n\n # Set requires_grad=True on lora_params, and requires_grad=False on all others.\n set_trainable_params(lora_model, lora_params)\n\n # Print the total number of parameters\n total_params = sum([p.numel() for p in lora_model.parameters()])\n trainable_params = sum([p.numel() for p in lora_model.parameters() if p.requires_grad])\n print(\n f\"\"\"\n {total_params} total params,\n {trainable_params}\" trainable params,\n {(100.0 * trainable_params / total_params):.2f}% of all params are trainable.\n \"\"\"\n )\n\n 6742609920 total params,\n 4194304 trainable params,\n 0.06% of all params are trainable.\n\n.. note::\n If you are directly using the LoRA recipe (as detailed :ref:`here`), you need only pass the\n relevant checkpoint path. Loading model weights and setting trainable parameters will be taken care\n of in the recipe.\n\n\n.. _lora_recipe_label:\n\nLoRA finetuning recipe in torchtune\n-----------------------------------\n\nFinally, we can put it all together and finetune a model using torchtune's `LoRA recipe `.\n\nOnce we've loaded the base model weights, we also want to set only LoRA parameters to trainable.\n\n.. _setting_trainable_params:\n\n.. code-block:: python\n\n from torchtune.modules.peft.peft_utils import get_adapter_params, set_trainable_params\n\n # Fetch all params from the model that are associated with LoRA.\n lora_params = get_adapter_params(lora_model)\n\n # Set requires_grad=True on lora_params, and requires_grad=False on all others.\n set_trainable_params(lora_model, lora_params)\n\n # Print the total number of parameters\n total_params = sum([p.numel() for p in lora_model.parameters()])\n trainable_params = sum([p.numel() for p in lora_model.parameters() if p.requires_grad])\n print(\n f\"\"\"\n {total_params} total params,\n {trainable_params}\" trainable params,\n {(100.0 * trainable_params / total_params):.2f}% of all params are trainable.\n \"\"\"\n )\n\n 6742609920 total params,\n 4194304 trainable params,\n 0.06% of all params are trainable.\n\n.. note::\n If you are directly using the LoRA recipe (as detailed :ref:`here`), you need only pass the\n relevant checkpoint path. Loading model weights and setting trainable parameters will be taken care\n of in the recipe.\n\n\n.. 
_lora_recipe_label:\n\nLoRA finetuning recipe in torchtune\n-----------------------------------\n\nFinally, we can put it all together and finetune a model using torchtune's `LoRA recipe r1*qUS~`vH1u@gPLKNG~e;$#jsmU;-irTQHK+ zU_WN1qEMp|p@+7X@z_fXUX&hs(M$acym)F46>)a+wY8!QJl>o4d-LY^n|V7gy{m7$ z?3C}>`P~gR$umLxs(hJb`96j~oIRRDlx`6aggJ z;N-X>aw;$DJm8H4(Bc&4w3Bs%OQom*K-W20)f7%Jfhp($&#Q68f^%@*xR-@z(y+}x zXZ6D%Y$lsGi-X>CFiNgY=K{8aKhKmG9t4F0=pUH2aujxwnxbEu7|$5v8S56^kz5(L zU-V^+`xy&0F-=W)@@)@B`AcjiQf5M@_8qqpx6E!eGA*vmXuyNldppTq{wLEwoOU6K zk8!Ecj`#AdI8qpEV2+%BcPiQJbee~ubXGO+TH7FAp9jOVjfmnW{WEe!6g3m z;$i%6#~fGBrOrRKBU||nPlNU!(ronpPnzX|OM2uI7KJI1IuEyc$LQuP)J?&Z1hU1f zm>Bhr%UV@qbO&>10l8i(d2k`z>OrP0v=7l5^16JdHXZfZ8D5R}>_1QZ7iYa>DD%$i zjMUnPNPUjJ_;Go&7H)5@)aGyU$Y${FVi$&3=tXh+-iewy d^2jJfx9xWxKqB?hNOG)f+lD?isM;bs^c%v@LQ?<$ delta 539 zcmZ3xi23YnX4VFlsfW&PWHmBo=E)G4ynl)H=2Bx7Mpolg<3xka^GptMu$reN8YFL) zjZop3d{q`nJtybPv6*~FR+_12>*R}b#3p-nuLN>s zm^hdwuUC|qEI*%r^Xt}kj6fetG4-@eUeF;16srK~n7r(q^5mv|Ibl&o1_qdgF#ERk zYj7}XOuj$;I-}0!?K8eJPPUq|eRAIH4U_L1dqC}!*?g!~oC#*~Mn#0l^EwWJgh4jQ zWr2)`5F%JC`nKRM(`3sjJ2oF%5&??@coZeAlY+)e