From edd9aaac3b22fe91e8f45e7c6bc6e3d9f97cb250 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?S=C3=A9bastien=20Han?= <seb@redhat.com>
Date: Thu, 10 Apr 2025 22:39:20 +0200
Subject: [PATCH] fix: use torchao 0.8.0 for inference (#1925)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

# What does this PR do?

While building the "experimental-post-training" distribution, we
encountered a torchao version conflict: inference pinned version 0.5.0,
while training currently depends on version 0.8.0. This change bumps the
inference pin to 0.8.0 so that both resolve to the same version.

Resolves this error:

```
  × No solution found when resolving dependencies:
  ╰─▶ Because you require torchao==0.5.0 and torchao==0.8.0, we can conclude that your requirements are unsatisfiable.
ERROR    2025-04-10 10:41:22,597 llama_stack.distribution.build:128 uncategorized: Failed to build target test with
         return code 1
```

Signed-off-by: Sébastien Han <seb@redhat.com>
---
 llama_stack/providers/registry/inference.py | 2 +-
 llama_stack/templates/dependencies.json     | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/llama_stack/providers/registry/inference.py b/llama_stack/providers/registry/inference.py
index aabb3bbdf..3c54cabcf 100644
--- a/llama_stack/providers/registry/inference.py
+++ b/llama_stack/providers/registry/inference.py
@@ -24,7 +24,7 @@ META_REFERENCE_DEPS = [
     "zmq",
     "lm-format-enforcer",
     "sentence-transformers",
-    "torchao==0.5.0",
+    "torchao==0.8.0",
     "fbgemm-gpu-genai==1.1.2",
 ]
 
diff --git a/llama_stack/templates/dependencies.json b/llama_stack/templates/dependencies.json
index 053d6ef8a..b96191752 100644
--- a/llama_stack/templates/dependencies.json
+++ b/llama_stack/templates/dependencies.json
@@ -381,7 +381,7 @@
     "sentence-transformers",
     "sentencepiece",
     "torch",
-    "torchao==0.5.0",
+    "torchao==0.8.0",
     "torchvision",
     "tqdm",
     "transformers",