mirror of https://github.com/meta-llama/llama-stack.git
synced 2025-07-29 15:23:51 +00:00
Nuke fp8_requirements, fold fbgemm into common requirements
This commit is contained in:
parent cc697c59e5
commit 66412b932b
4 changed files with 5 additions and 42 deletions
README.md (12 deletions)

```diff
@@ -28,15 +28,3 @@ pip install -e .
 ## The Llama CLI
 
 The `llama` CLI makes it easy to configure and run the Llama toolchain. Read the [CLI reference](docs/cli_reference.md) for details.
-
-## Appendix: Running FP8
-
-If you want to run FP8, you need the `fbgemm-gpu` package which requires `torch >= 2.4.0` (currently only in nightly, but releasing shortly...)
-
-```bash
-ENV=fp8_env
-conda create -n $ENV python=3.10
-conda activate $ENV
-
-pip3 install -r fp8_requirements.txt
-```
```
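With the appendix gone, the FP8 path no longer needs its own requirements file. A minimal sketch of the equivalent post-commit setup, assuming the folded requirements.txt at the repository root (the environment name is illustrative, not from the repo):

```bash
# FP8 setup after this commit: fbgemm-gpu==0.8.0 now ships in the common
# requirements, so there is no separate fp8_requirements.txt to install.
ENV=llama_env  # illustrative name; any conda env works
conda create -n $ENV python=3.10
conda activate $ENV

# fbgemm-gpu still requires torch >= 2.4.0, per the removed appendix.
pip install -r requirements.txt
```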
fp8_requirements.txt (deleted, 28 lines)

```diff
@@ -1,28 +0,0 @@
-torch>=2.4.0
-accelerate
-black==24.4.2
-codeshield
-fairscale
-fastapi
-fire
-flake8
-huggingface-hub
-httpx
-json-strong-typing
-matplotlib
-omegaconf
-pandas
-Pillow
-pre-commit
-pydantic==1.10.13
-pydantic_core==2.18.2
-python-dotenv
-python-openapi
-requests
-tiktoken
-transformers
-ufmt==2.7.0
-usort==1.0.8
-uvicorn
-zmq
-fbgemm-gpu==0.8.0
```
```diff
@@ -26,7 +26,6 @@ COMMON_DEPENDENCIES = [
     "huggingface-hub",
     "json-strong-typing",
     "llama-models",
-    "omegaconf",
     "pandas",
     "Pillow",
     "pydantic==1.10.13",
@@ -60,7 +59,10 @@ def available_distribution_specs() -> List[DistributionSpec]:
         DistributionSpec(
             spec_id="inline",
             description="Use code from `llama_toolchain` itself to serve all llama stack APIs",
-            additional_pip_packages=COMMON_DEPENDENCIES,
+            additional_pip_packages=COMMON_DEPENDENCIES
+            + [
+                "fbgemm-gpu==0.8.0",
+            ],
             provider_specs={
                 Api.inference: providers[Api.inference]["meta-reference"],
                 Api.safety: providers[Api.safety]["meta-reference"],
```
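The net effect of the second hunk is plain list concatenation: the `inline` distribution's `additional_pip_packages` becomes `COMMON_DEPENDENCIES` plus the FP8 extra, so only that distribution pulls in `fbgemm-gpu`. A hypothetical sketch of what resolving that spec's package set amounts to (dependency list abridged to the names visible in the hunks above; not an actual toolchain command):

```bash
# Hypothetical expansion of the inline spec's package set:
# COMMON_DEPENDENCIES (abridged) + ["fbgemm-gpu==0.8.0"]
pip install \
    huggingface-hub json-strong-typing llama-models \
    pandas Pillow "pydantic==1.10.13" \
    "fbgemm-gpu==0.8.0"
```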
requirements.txt (1 addition)

```diff
@@ -1,5 +1,6 @@
 black==24.4.2
 fastapi
+fbgemm-gpu==0.8.0
 fire
 flake8
 httpx
```
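A quick sanity check of the fold, assuming a checkout at this commit (the `fbgemm-gpu` wheel installs the module `fbgemm_gpu`, and importing it needs a compatible torch already present):

```bash
# Expect the pin to appear in the common file: fbgemm-gpu==0.8.0
grep fbgemm requirements.txt

# After `pip install -r requirements.txt`, the FP8 kernels should import.
python -c "import fbgemm_gpu"
```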