init: first remote llamacpp implementation

2025-12-26 23:12:00 +00:00 · 2025-07-12 16:28:08 -07:00 · 2025-07-12 16:28:08 -07:00 · ec73d0d55b
commit ec73d0d55b
parent 8374d4cefd
9 changed files with 675 additions and 0 deletions
--- a/llama_stack/templates/llamacpp/build.yaml
+++ b/llama_stack/templates/llamacpp/build.yaml
@@ -0,0 +1,38 @@
+version: "2"  # quoted, so it parses as the string "2" rather than an integer
+distribution_spec:  # contents of the llama.cpp distribution described below
+  description: Use llama.cpp server for running LLM inference
+  providers:  # provider IDs grouped by category; each is prefixed inline:: or remote::
+    inference:
+      - remote::llamacpp  # presumably the llama.cpp server named in the description
+      - inline::sentence-transformers  # NOTE(review): presumably for embeddings; confirm
+    vector_io:
+      - inline::faiss
+      - remote::chromadb
+      - remote::pgvector
+    safety:
+      - inline::llama-guard
+    agents:
+      - inline::meta-reference
+    telemetry:
+      - inline::meta-reference
+    eval:
+      - inline::meta-reference
+    datasetio:
+      - remote::huggingface
+      - inline::localfs
+    scoring:
+      - inline::basic
+      - inline::llm-as-judge
+      - inline::braintrust
+    files:
+      - inline::localfs
+    tool_runtime:
+      - remote::brave-search
+      - remote::tavily-search
+      - remote::wolfram-alpha
+      - inline::rag-runtime
+      - remote::model-context-protocol
+image_type: conda  # NOTE(review): presumably builds into a conda environment; confirm
+additional_pip_packages:  # pip packages listed explicitly for this build
+  - aiosqlite
+  - sqlalchemy[asyncio]  # sqlalchemy with its "asyncio" extra; '[' is mid-scalar, so no quoting needed