mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-12-04 18:13:44 +00:00
refactor(k8s): update run configs to v2 storage and registered_resources structure
Some checks failed
Python Package Build Test / build (3.13) (push) Failing after 1s
SqlStore Integration Tests / test-postgres (3.12) (push) Failing after 0s
Integration Auth Tests / test-matrix (oauth2_token) (push) Failing after 1s
SqlStore Integration Tests / test-postgres (3.13) (push) Failing after 1s
Integration Tests (Replay) / Integration Tests (, , , client=, ) (push) Failing after 3s
Test External Providers Installed via Module / test-external-providers-from-module (venv) (push) Has been skipped
Test Llama Stack Build / generate-matrix (push) Successful in 3s
Test Llama Stack Build / build-single-provider (push) Failing after 3s
Python Package Build Test / build (3.12) (push) Failing after 3s
Vector IO Integration Tests / test-matrix (push) Failing after 5s
Test Llama Stack Build / build-custom-container-distribution (push) Failing after 4s
Test Llama Stack Build / build-ubi9-container-distribution (push) Failing after 4s
Test Llama Stack Build / build (push) Failing after 3s
Unit Tests / unit-tests (3.13) (push) Failing after 3s
Test External API and Providers / test-external (venv) (push) Failing after 4s
Unit Tests / unit-tests (3.12) (push) Failing after 5s
API Conformance Tests / check-schema-compatibility (push) Successful in 12s
UI Tests / ui-tests (22) (push) Successful in 42s
Pre-commit / pre-commit (push) Successful in 1m30s
Some checks failed
Python Package Build Test / build (3.13) (push) Failing after 1s
SqlStore Integration Tests / test-postgres (3.12) (push) Failing after 0s
Integration Auth Tests / test-matrix (oauth2_token) (push) Failing after 1s
SqlStore Integration Tests / test-postgres (3.13) (push) Failing after 1s
Integration Tests (Replay) / Integration Tests (, , , client=, ) (push) Failing after 3s
Test External Providers Installed via Module / test-external-providers-from-module (venv) (push) Has been skipped
Test Llama Stack Build / generate-matrix (push) Successful in 3s
Test Llama Stack Build / build-single-provider (push) Failing after 3s
Python Package Build Test / build (3.12) (push) Failing after 3s
Vector IO Integration Tests / test-matrix (push) Failing after 5s
Test Llama Stack Build / build-custom-container-distribution (push) Failing after 4s
Test Llama Stack Build / build-ubi9-container-distribution (push) Failing after 4s
Test Llama Stack Build / build (push) Failing after 3s
Unit Tests / unit-tests (3.13) (push) Failing after 3s
Test External API and Providers / test-external (venv) (push) Failing after 4s
Unit Tests / unit-tests (3.12) (push) Failing after 5s
API Conformance Tests / check-schema-compatibility (push) Successful in 12s
UI Tests / ui-tests (22) (push) Successful in 42s
Pre-commit / pre-commit (push) Successful in 1m30s
Migrates the k8s run configs to match the updated run config structure:
- Replace storage.references with storage.stores
- Wrap resources under the registered_resources section
- Update provider configs to use persistence with namespace/backend
- Add telemetry and vector_stores top-level sections
- Simplify agent/files metadata store configuration
This commit is contained in:
parent
0e57233a0a
commit
658fb2c777
2 changed files with 107 additions and 99 deletions
|
|
@ -27,28 +27,24 @@ providers:
|
||||||
config:
|
config:
|
||||||
storage_dir: ${env.FILES_STORAGE_DIR:=~/.llama/distributions/starter/files}
|
storage_dir: ${env.FILES_STORAGE_DIR:=~/.llama/distributions/starter/files}
|
||||||
metadata_store:
|
metadata_store:
|
||||||
type: sqlite
|
table_name: files_metadata
|
||||||
db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/files_metadata.db
|
backend: sql_default
|
||||||
vector_io:
|
vector_io:
|
||||||
- provider_id: ${env.ENABLE_CHROMADB:+chromadb}
|
- provider_id: ${env.ENABLE_CHROMADB:+chromadb}
|
||||||
provider_type: remote::chromadb
|
provider_type: remote::chromadb
|
||||||
config:
|
config:
|
||||||
url: ${env.CHROMADB_URL:=}
|
url: ${env.CHROMADB_URL:=}
|
||||||
kvstore:
|
persistence:
|
||||||
type: postgres
|
namespace: vector_io::chroma_remote
|
||||||
host: ${env.POSTGRES_HOST:=localhost}
|
backend: kv_default
|
||||||
port: ${env.POSTGRES_PORT:=5432}
|
|
||||||
db: ${env.POSTGRES_DB:=llamastack}
|
|
||||||
user: ${env.POSTGRES_USER:=llamastack}
|
|
||||||
password: ${env.POSTGRES_PASSWORD:=llamastack}
|
|
||||||
files:
|
files:
|
||||||
- provider_id: meta-reference-files
|
- provider_id: meta-reference-files
|
||||||
provider_type: inline::localfs
|
provider_type: inline::localfs
|
||||||
config:
|
config:
|
||||||
storage_dir: ${env.FILES_STORAGE_DIR:=~/.llama/distributions/starter/files}
|
storage_dir: ${env.FILES_STORAGE_DIR:=~/.llama/distributions/starter/files}
|
||||||
metadata_store:
|
metadata_store:
|
||||||
type: sqlite
|
table_name: files_metadata
|
||||||
db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/files_metadata.db
|
backend: sql_default
|
||||||
safety:
|
safety:
|
||||||
- provider_id: llama-guard
|
- provider_id: llama-guard
|
||||||
provider_type: inline::llama-guard
|
provider_type: inline::llama-guard
|
||||||
|
|
@ -58,20 +54,15 @@ providers:
|
||||||
- provider_id: meta-reference
|
- provider_id: meta-reference
|
||||||
provider_type: inline::meta-reference
|
provider_type: inline::meta-reference
|
||||||
config:
|
config:
|
||||||
persistence_store:
|
persistence:
|
||||||
type: postgres
|
agent_state:
|
||||||
host: ${env.POSTGRES_HOST:=localhost}
|
namespace: agents
|
||||||
port: ${env.POSTGRES_PORT:=5432}
|
backend: kv_default
|
||||||
db: ${env.POSTGRES_DB:=llamastack}
|
responses:
|
||||||
user: ${env.POSTGRES_USER:=llamastack}
|
table_name: responses
|
||||||
password: ${env.POSTGRES_PASSWORD:=llamastack}
|
backend: sql_default
|
||||||
responses_store:
|
max_write_queue_size: 10000
|
||||||
type: postgres
|
num_writers: 4
|
||||||
host: ${env.POSTGRES_HOST:=localhost}
|
|
||||||
port: ${env.POSTGRES_PORT:=5432}
|
|
||||||
db: ${env.POSTGRES_DB:=llamastack}
|
|
||||||
user: ${env.POSTGRES_USER:=llamastack}
|
|
||||||
password: ${env.POSTGRES_PASSWORD:=llamastack}
|
|
||||||
telemetry:
|
telemetry:
|
||||||
- provider_id: meta-reference
|
- provider_id: meta-reference
|
||||||
provider_type: inline::meta-reference
|
provider_type: inline::meta-reference
|
||||||
|
|
@ -112,32 +103,45 @@ storage:
|
||||||
db: ${env.POSTGRES_DB:=llamastack}
|
db: ${env.POSTGRES_DB:=llamastack}
|
||||||
user: ${env.POSTGRES_USER:=llamastack}
|
user: ${env.POSTGRES_USER:=llamastack}
|
||||||
password: ${env.POSTGRES_PASSWORD:=llamastack}
|
password: ${env.POSTGRES_PASSWORD:=llamastack}
|
||||||
references:
|
stores:
|
||||||
metadata:
|
metadata:
|
||||||
backend: kv_default
|
|
||||||
namespace: registry
|
namespace: registry
|
||||||
|
backend: kv_default
|
||||||
inference:
|
inference:
|
||||||
backend: sql_default
|
|
||||||
table_name: inference_store
|
table_name: inference_store
|
||||||
models:
|
backend: sql_default
|
||||||
- metadata:
|
max_write_queue_size: 10000
|
||||||
embedding_dimension: 768
|
num_writers: 4
|
||||||
model_id: nomic-embed-text-v1.5
|
conversations:
|
||||||
provider_id: sentence-transformers
|
table_name: openai_conversations
|
||||||
model_type: embedding
|
backend: sql_default
|
||||||
- model_id: ${env.INFERENCE_MODEL}
|
registered_resources:
|
||||||
provider_id: vllm-inference
|
models:
|
||||||
model_type: llm
|
- metadata:
|
||||||
shields:
|
embedding_dimension: 768
|
||||||
- shield_id: ${env.SAFETY_MODEL:=meta-llama/Llama-Guard-3-1B}
|
model_id: nomic-embed-text-v1.5
|
||||||
vector_dbs: []
|
provider_id: sentence-transformers
|
||||||
datasets: []
|
model_type: embedding
|
||||||
scoring_fns: []
|
- model_id: ${env.INFERENCE_MODEL}
|
||||||
benchmarks: []
|
provider_id: vllm-inference
|
||||||
tool_groups:
|
model_type: llm
|
||||||
- toolgroup_id: builtin::websearch
|
shields:
|
||||||
provider_id: tavily-search
|
- shield_id: ${env.SAFETY_MODEL:=meta-llama/Llama-Guard-3-1B}
|
||||||
- toolgroup_id: builtin::rag
|
vector_dbs: []
|
||||||
provider_id: rag-runtime
|
datasets: []
|
||||||
|
scoring_fns: []
|
||||||
|
benchmarks: []
|
||||||
|
tool_groups:
|
||||||
|
- toolgroup_id: builtin::websearch
|
||||||
|
provider_id: tavily-search
|
||||||
|
- toolgroup_id: builtin::rag
|
||||||
|
provider_id: rag-runtime
|
||||||
server:
|
server:
|
||||||
port: 8323
|
port: 8323
|
||||||
|
telemetry:
|
||||||
|
enabled: true
|
||||||
|
vector_stores:
|
||||||
|
default_provider_id: chromadb
|
||||||
|
default_embedding_model:
|
||||||
|
provider_id: sentence-transformers
|
||||||
|
model_id: nomic-ai/nomic-embed-text-v1.5
|
||||||
|
|
|
||||||
|
|
@ -32,21 +32,17 @@ providers:
|
||||||
provider_type: remote::chromadb
|
provider_type: remote::chromadb
|
||||||
config:
|
config:
|
||||||
url: ${env.CHROMADB_URL:=}
|
url: ${env.CHROMADB_URL:=}
|
||||||
kvstore:
|
persistence:
|
||||||
type: postgres
|
namespace: vector_io::chroma_remote
|
||||||
host: ${env.POSTGRES_HOST:=localhost}
|
backend: kv_default
|
||||||
port: ${env.POSTGRES_PORT:=5432}
|
|
||||||
db: ${env.POSTGRES_DB:=llamastack}
|
|
||||||
user: ${env.POSTGRES_USER:=llamastack}
|
|
||||||
password: ${env.POSTGRES_PASSWORD:=llamastack}
|
|
||||||
files:
|
files:
|
||||||
- provider_id: meta-reference-files
|
- provider_id: meta-reference-files
|
||||||
provider_type: inline::localfs
|
provider_type: inline::localfs
|
||||||
config:
|
config:
|
||||||
storage_dir: ${env.FILES_STORAGE_DIR:=~/.llama/distributions/starter/files}
|
storage_dir: ${env.FILES_STORAGE_DIR:=~/.llama/distributions/starter/files}
|
||||||
metadata_store:
|
metadata_store:
|
||||||
type: sqlite
|
table_name: files_metadata
|
||||||
db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/files_metadata.db
|
backend: sql_default
|
||||||
safety:
|
safety:
|
||||||
- provider_id: llama-guard
|
- provider_id: llama-guard
|
||||||
provider_type: inline::llama-guard
|
provider_type: inline::llama-guard
|
||||||
|
|
@ -56,20 +52,15 @@ providers:
|
||||||
- provider_id: meta-reference
|
- provider_id: meta-reference
|
||||||
provider_type: inline::meta-reference
|
provider_type: inline::meta-reference
|
||||||
config:
|
config:
|
||||||
persistence_store:
|
persistence:
|
||||||
type: postgres
|
agent_state:
|
||||||
host: ${env.POSTGRES_HOST:=localhost}
|
namespace: agents
|
||||||
port: ${env.POSTGRES_PORT:=5432}
|
backend: kv_default
|
||||||
db: ${env.POSTGRES_DB:=llamastack}
|
responses:
|
||||||
user: ${env.POSTGRES_USER:=llamastack}
|
table_name: responses
|
||||||
password: ${env.POSTGRES_PASSWORD:=llamastack}
|
backend: sql_default
|
||||||
responses_store:
|
max_write_queue_size: 10000
|
||||||
type: postgres
|
num_writers: 4
|
||||||
host: ${env.POSTGRES_HOST:=localhost}
|
|
||||||
port: ${env.POSTGRES_PORT:=5432}
|
|
||||||
db: ${env.POSTGRES_DB:=llamastack}
|
|
||||||
user: ${env.POSTGRES_USER:=llamastack}
|
|
||||||
password: ${env.POSTGRES_PASSWORD:=llamastack}
|
|
||||||
telemetry:
|
telemetry:
|
||||||
- provider_id: meta-reference
|
- provider_id: meta-reference
|
||||||
provider_type: inline::meta-reference
|
provider_type: inline::meta-reference
|
||||||
|
|
@ -110,40 +101,53 @@ storage:
|
||||||
db: ${env.POSTGRES_DB:=llamastack}
|
db: ${env.POSTGRES_DB:=llamastack}
|
||||||
user: ${env.POSTGRES_USER:=llamastack}
|
user: ${env.POSTGRES_USER:=llamastack}
|
||||||
password: ${env.POSTGRES_PASSWORD:=llamastack}
|
password: ${env.POSTGRES_PASSWORD:=llamastack}
|
||||||
references:
|
stores:
|
||||||
metadata:
|
metadata:
|
||||||
backend: kv_default
|
|
||||||
namespace: registry
|
namespace: registry
|
||||||
|
backend: kv_default
|
||||||
inference:
|
inference:
|
||||||
backend: sql_default
|
|
||||||
table_name: inference_store
|
table_name: inference_store
|
||||||
models:
|
backend: sql_default
|
||||||
- metadata:
|
max_write_queue_size: 10000
|
||||||
embedding_dimension: 768
|
num_writers: 4
|
||||||
model_id: nomic-embed-text-v1.5
|
conversations:
|
||||||
provider_id: sentence-transformers
|
table_name: openai_conversations
|
||||||
model_type: embedding
|
backend: sql_default
|
||||||
- metadata: {}
|
registered_resources:
|
||||||
model_id: ${env.INFERENCE_MODEL}
|
models:
|
||||||
provider_id: vllm-inference
|
- metadata:
|
||||||
model_type: llm
|
embedding_dimension: 768
|
||||||
- metadata: {}
|
model_id: nomic-embed-text-v1.5
|
||||||
model_id: ${env.SAFETY_MODEL:=meta-llama/Llama-Guard-3-1B}
|
provider_id: sentence-transformers
|
||||||
provider_id: vllm-safety
|
model_type: embedding
|
||||||
model_type: llm
|
- metadata: {}
|
||||||
shields:
|
model_id: ${env.INFERENCE_MODEL}
|
||||||
- shield_id: ${env.SAFETY_MODEL:=meta-llama/Llama-Guard-3-1B}
|
provider_id: vllm-inference
|
||||||
vector_dbs: []
|
model_type: llm
|
||||||
datasets: []
|
- metadata: {}
|
||||||
scoring_fns: []
|
model_id: ${env.SAFETY_MODEL:=meta-llama/Llama-Guard-3-1B}
|
||||||
benchmarks: []
|
provider_id: vllm-safety
|
||||||
tool_groups:
|
model_type: llm
|
||||||
- toolgroup_id: builtin::websearch
|
shields:
|
||||||
provider_id: tavily-search
|
- shield_id: ${env.SAFETY_MODEL:=meta-llama/Llama-Guard-3-1B}
|
||||||
- toolgroup_id: builtin::rag
|
vector_dbs: []
|
||||||
provider_id: rag-runtime
|
datasets: []
|
||||||
|
scoring_fns: []
|
||||||
|
benchmarks: []
|
||||||
|
tool_groups:
|
||||||
|
- toolgroup_id: builtin::websearch
|
||||||
|
provider_id: tavily-search
|
||||||
|
- toolgroup_id: builtin::rag
|
||||||
|
provider_id: rag-runtime
|
||||||
server:
|
server:
|
||||||
port: 8321
|
port: 8321
|
||||||
auth:
|
auth:
|
||||||
provider_config:
|
provider_config:
|
||||||
type: github_token
|
type: github_token
|
||||||
|
telemetry:
|
||||||
|
enabled: true
|
||||||
|
vector_stores:
|
||||||
|
default_provider_id: chromadb
|
||||||
|
default_embedding_model:
|
||||||
|
provider_id: sentence-transformers
|
||||||
|
model_id: nomic-ai/nomic-embed-text-v1.5
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue