Nuke fp8_requirements, fold fbgemm into common requirements

2025-12-05 10:23:44 +00:00 · 2024-08-07 13:58:13 -07:00 · 2024-08-07 13:58:13 -07:00 · 66412b932b
commit 66412b932b
parent cc697c59e5
4 changed files with 5 additions and 42 deletions
--- a/README.md
+++ b/README.md
@@ -28,15 +28,3 @@ pip install -e .
 ## The Llama CLI

 The `llama` CLI makes it easy to configure and run the Llama toolchain. Read the [CLI reference](docs/cli_reference.md) for details.
-
-## Appendix: Running FP8
-
-If you want to run FP8, you need the `fbgemm-gpu` package which requires `torch >= 2.4.0` (currently only in nightly, but releasing shortly...)
-
-```bash
-ENV=fp8_env
-conda create -n $ENV python=3.10
-conda activate $ENV
-
-pip3 install -r fp8_requirements.txt
-```
--- a/fp8_requirements.txt
+++ b/fp8_requirements.txt
@@ -1,28 +0,0 @@
-torch>=2.4.0
-accelerate
-black==24.4.2
-codeshield
-fairscale
-fastapi
-fire
-flake8
-huggingface-hub
-httpx
-json-strong-typing
-matplotlib
-omegaconf
-pandas
-Pillow
-pre-commit
-pydantic==1.10.13
-pydantic_core==2.18.2
-python-dotenv
-python-openapi
-requests
-tiktoken
-transformers
-ufmt==2.7.0
-usort==1.0.8
-uvicorn
-zmq
-fbgemm-gpu==0.8.0
--- a/llama_toolchain/distribution/registry.py
+++ b/llama_toolchain/distribution/registry.py
@@ -26,7 +26,6 @@ COMMON_DEPENDENCIES = [
    "huggingface-hub",
    "json-strong-typing",
    "llama-models",
-    "omegaconf",
    "pandas",
    "Pillow",
    "pydantic==1.10.13",
@@ -60,7 +59,10 @@ def available_distribution_specs() -> List[DistributionSpec]:
        DistributionSpec(
            spec_id="inline",
            description="Use code from `llama_toolchain` itself to serve all llama stack APIs",
-            additional_pip_packages=COMMON_DEPENDENCIES,
+            additional_pip_packages=COMMON_DEPENDENCIES
+            + [
+                "fbgemm-gpu==0.8.0",
+            ],
            provider_specs={
                Api.inference: providers[Api.inference]["meta-reference"],
                Api.safety: providers[Api.safety]["meta-reference"],
--- a/requirements.txt
+++ b/requirements.txt
@@ -1,5 +1,6 @@
 black==24.4.2
 fastapi
+fbgemm-gpu==0.8.0
 fire
 flake8
 httpx