mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-07-29 07:14:20 +00:00
Nuke fp8_requirements, fold fbgemm into common requirements
This commit is contained in:
parent
cc697c59e5
commit
66412b932b
4 changed files with 5 additions and 42 deletions
12
README.md
12
README.md
|
@@ -28,15 +28,3 @@ pip install -e .
|
|||
## The Llama CLI
|
||||
|
||||
The `llama` CLI makes it easy to configure and run the Llama toolchain. Read the [CLI reference](docs/cli_reference.md) for details.
|
||||
|
||||
## Appendix: Running FP8
|
||||
|
||||
If you want to run FP8, you need the `fbgemm-gpu` package, which requires `torch >= 2.4.0` (currently available only in nightly builds, but due to be released shortly).
|
||||
|
||||
```bash
|
||||
ENV=fp8_env
|
||||
conda create -n $ENV python=3.10
|
||||
conda activate $ENV
|
||||
|
||||
pip3 install -r fp8_requirements.txt
|
||||
```
|
||||
|
|
|
@@ -1,28 +0,0 @@
|
|||
torch>=2.4.0
|
||||
accelerate
|
||||
black==24.4.2
|
||||
codeshield
|
||||
fairscale
|
||||
fastapi
|
||||
fire
|
||||
flake8
|
||||
huggingface-hub
|
||||
httpx
|
||||
json-strong-typing
|
||||
matplotlib
|
||||
omegaconf
|
||||
pandas
|
||||
Pillow
|
||||
pre-commit
|
||||
pydantic==1.10.13
|
||||
pydantic_core==2.18.2
|
||||
python-dotenv
|
||||
python-openapi
|
||||
requests
|
||||
tiktoken
|
||||
transformers
|
||||
ufmt==2.7.0
|
||||
usort==1.0.8
|
||||
uvicorn
|
||||
zmq
|
||||
fbgemm-gpu==0.8.0
|
|
@@ -26,7 +26,6 @@ COMMON_DEPENDENCIES = [
|
|||
"huggingface-hub",
|
||||
"json-strong-typing",
|
||||
"llama-models",
|
||||
"omegaconf",
|
||||
"pandas",
|
||||
"Pillow",
|
||||
"pydantic==1.10.13",
|
||||
|
@@ -60,7 +59,10 @@ def available_distribution_specs() -> List[DistributionSpec]:
|
|||
DistributionSpec(
|
||||
spec_id="inline",
|
||||
description="Use code from `llama_toolchain` itself to serve all llama stack APIs",
|
||||
additional_pip_packages=COMMON_DEPENDENCIES,
|
||||
additional_pip_packages=COMMON_DEPENDENCIES
|
||||
+ [
|
||||
"fbgemm-gpu==0.8.0",
|
||||
],
|
||||
provider_specs={
|
||||
Api.inference: providers[Api.inference]["meta-reference"],
|
||||
Api.safety: providers[Api.safety]["meta-reference"],
|
||||
|
|
|
@@ -1,5 +1,6 @@
|
|||
black==24.4.2
|
||||
fastapi
|
||||
fbgemm-gpu==0.8.0
|
||||
fire
|
||||
flake8
|
||||
httpx
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue