Mirror of https://github.com/meta-llama/llama-stack.git (synced 2025-10-12 13:57:57 +00:00)

Commit 0068d059db (parent: 3802d5acdc)
move distribution to yaml files

9 changed files with 78 additions and 49 deletions
@@ -1,7 +1,7 @@
 name: local-tgi-conda-example
 distribution_spec:
   distribution_type: local-plus-tgi-inference
-  description: Use TGI for running LLM inference
+  description: Use TGI (local or with Hugging Face Inference Endpoints for running LLM inference. When using HF Inference Endpoints, you must provide the name of the endpoint).
   docker_image: null
   providers:
     inference: remote::tgi
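
The example config above wraps a full distribution_spec under a top-level name. As a minimal sketch (assuming PyYAML and a hypothetical filename for the config shown above), reading it back and inspecting the provider mapping looks like:

    import yaml

    # Hypothetical filename for the example config shown above.
    with open("local-tgi-conda-example.yaml") as f:
        config = yaml.safe_load(f)

    spec = config["distribution_spec"]
    print(spec["distribution_type"])       # local-plus-tgi-inference
    print(spec["providers"]["inference"])  # remote::tgi
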
@@ -0,0 +1,9 @@
+distribution_type: local-ollama
+description: Like local, but use ollama for running LLM inference
+docker_image: null
+providers:
+  inference: remote::ollama
+  safety: meta-reference
+  agentic_system: meta-reference
+  memory: meta-reference-faiss
+  telemetry: console
@@ -0,0 +1,9 @@
+distribution_type: local-plus-fireworks-inference
+description: Use Fireworks.ai for running LLM inference
+docker_image: null
+providers:
+  inference: remote::fireworks
+  safety: meta-reference
+  agentic_system: meta-reference
+  memory: meta-reference-faiss
+  telemetry: console
@@ -0,0 +1,8 @@
+distribution_type: local-plus-tgi-inference
+description: Use TGI (local or with Hugging Face Inference Endpoints for running LLM inference. When using HF Inference Endpoints, you must provide the name of the endpoint).
+docker_image: null
+providers:
+  inference: remote::tgi
+  safety: meta-reference
+  agentic_system: meta-reference
+  memory: meta-reference-faiss
@@ -0,0 +1,9 @@
+distribution_type: local-plus-together-inference
+description: Use Together.ai for running LLM inference
+docker_image: null
+providers:
+  inference: remote::together
+  safety: meta-reference
+  agentic_system: meta-reference
+  memory: meta-reference-faiss
+  telemetry: console
@@ -0,0 +1,9 @@
+distribution_type: local
+description: Use code from `llama_toolchain` itself to serve all llama stack APIs
+docker_image: null
+providers:
+  inference: meta-reference
+  memory: meta-reference-faiss
+  safety: meta-reference
+  agentic_system: meta-reference
+  telemetry: console
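
Each registry file above is a single YAML document describing one distribution. A small sketch (assuming PyYAML, and assuming the generated files live in a distribution_registry/ directory as the generator script below suggests) of reading them back and listing the inference provider for each distribution:

    from pathlib import Path

    import yaml

    # Assumed output directory of the generator script shown below.
    registry_dir = Path("configs/distributions/distribution_registry")

    for path in sorted(registry_dir.glob("*.yaml")):
        spec = yaml.safe_load(path.read_text())
        print(f"{spec['distribution_type']}: inference via {spec['providers']['inference']}")
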
llama_toolchain/configs/distributions/run.py (new file, +21 lines)
@@ -0,0 +1,21 @@
+from llama_toolchain.core.distribution_registry import *
+import json
+
+import fire
+import yaml
+from llama_toolchain.common.serialize import EnumEncoder
+
+
+def main():
+    for d in available_distribution_specs():
+        file_path = "./configs/distributions/distribution_registry/{}.yaml".format(
+            d.distribution_type
+        )
+
+        with open(file_path, "w") as f:
+            to_write = json.loads(json.dumps(d.dict(), cls=EnumEncoder))
+            f.write(yaml.dump(to_write, sort_keys=False))
+
+
+if __name__ == "__main__":
+    fire.Fire(main)
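
The script round-trips each spec through json.dumps with EnumEncoder before calling yaml.dump, presumably so enum values are flattened to plain strings and the emitted YAML stays readable. Assuming it is invoked from the llama_toolchain directory (so the relative ./configs/distributions/... path resolves to the registry directory containing the files above), regenerating the YAML files might look like:

    python configs/distributions/run.py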