From edd9aaac3b22fe91e8f45e7c6bc6e3d9f97cb250 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?S=C3=A9bastien=20Han?= Date: Thu, 10 Apr 2025 22:39:20 +0200 Subject: [PATCH] fix: use torchao 0.8.0 for inference (#1925) MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit # What does this PR do? While building the "experimental-post-training" distribution, we encountered a torchao version conflict: inference required version 0.5.0, while training currently depends on version 0.8.0. Pinning inference to torchao 0.8.0 as well resolves this error: ``` × No solution found when resolving dependencies: ╰─▶ Because you require torchao==0.5.0 and torchao==0.8.0, we can conclude that your requirements are unsatisfiable. ERROR 2025-04-10 10:41:22,597 llama_stack.distribution.build:128 uncategorized: Failed to build target test with return code 1 ``` Signed-off-by: Sébastien Han --- llama_stack/providers/registry/inference.py | 2 +- llama_stack/templates/dependencies.json | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/llama_stack/providers/registry/inference.py b/llama_stack/providers/registry/inference.py index aabb3bbdf..3c54cabcf 100644 --- a/llama_stack/providers/registry/inference.py +++ b/llama_stack/providers/registry/inference.py @@ -24,7 +24,7 @@ META_REFERENCE_DEPS = [ "zmq", "lm-format-enforcer", "sentence-transformers", - "torchao==0.5.0", + "torchao==0.8.0", "fbgemm-gpu-genai==1.1.2", ] diff --git a/llama_stack/templates/dependencies.json b/llama_stack/templates/dependencies.json index 053d6ef8a..b96191752 100644 --- a/llama_stack/templates/dependencies.json +++ b/llama_stack/templates/dependencies.json @@ -381,7 +381,7 @@ "sentence-transformers", "sentencepiece", "torch", - "torchao==0.5.0", + "torchao==0.8.0", "torchvision", "tqdm", "transformers",