diff --git a/.github/workflows/integration-tests.yml b/.github/workflows/integration-tests.yml index 808984368..e6d0475d3 100644 --- a/.github/workflows/integration-tests.yml +++ b/.github/workflows/integration-tests.yml @@ -91,7 +91,7 @@ jobs: - name: Build Llama Stack run: | - uv run llama stack build --template ci-tests --image-type venv + uv run llama stack build --template starter --image-type venv - name: Check Storage and Memory Available Before Tests if: ${{ always() }} @@ -108,9 +108,9 @@ jobs: shell: bash run: | if [ "${{ matrix.client-type }}" == "library" ]; then - stack_config="ci-tests" + stack_config="starter" else - stack_config="server:ci-tests" + stack_config="server:starter" fi EXCLUDE_TESTS="builtin_tool or safety_with_image or code_interpreter or test_rag" diff --git a/.github/workflows/integration-vector-io-tests.yml b/.github/workflows/integration-vector-io-tests.yml index 525c17d46..e1aeafddc 100644 --- a/.github/workflows/integration-vector-io-tests.yml +++ b/.github/workflows/integration-vector-io-tests.yml @@ -93,7 +93,7 @@ jobs: - name: Build Llama Stack run: | - uv run llama stack build --template ci-tests --image-type venv + uv run llama stack build --template starter --image-type venv - name: Check Storage and Memory Available Before Tests if: ${{ always() }} diff --git a/.github/workflows/providers-build.yml b/.github/workflows/providers-build.yml index 392fddda6..6de72cd60 100644 --- a/.github/workflows/providers-build.yml +++ b/.github/workflows/providers-build.yml @@ -97,9 +97,9 @@ jobs: - name: Build a single provider run: | - yq -i '.image_type = "container"' llama_stack/templates/ci-tests/build.yaml - yq -i '.image_name = "test"' llama_stack/templates/ci-tests/build.yaml - USE_COPY_NOT_MOUNT=true LLAMA_STACK_DIR=. uv run llama stack build --config llama_stack/templates/ci-tests/build.yaml + yq -i '.image_type = "container"' llama_stack/templates/starter/build.yaml + yq -i '.image_name = "test"' llama_stack/templates/starter/build.yaml + USE_COPY_NOT_MOUNT=true LLAMA_STACK_DIR=. uv run llama stack build --config llama_stack/templates/starter/build.yaml - name: Inspect the container image entrypoint run: | @@ -126,14 +126,14 @@ jobs: .image_type = "container" | .image_name = "ubi9-test" | .distribution_spec.container_image = "registry.access.redhat.com/ubi9:latest" - ' llama_stack/templates/ci-tests/build.yaml + ' llama_stack/templates/starter/build.yaml - name: Build dev container (UBI9) env: USE_COPY_NOT_MOUNT: "true" LLAMA_STACK_DIR: "." run: | - uv run llama stack build --config llama_stack/templates/ci-tests/build.yaml + uv run llama stack build --config llama_stack/templates/starter/build.yaml - name: Inspect UBI9 image run: | diff --git a/llama_stack/templates/ci-tests/__init__.py b/llama_stack/templates/ci-tests/__init__.py deleted file mode 100644 index b309587f5..000000000 --- a/llama_stack/templates/ci-tests/__init__.py +++ /dev/null @@ -1,7 +0,0 @@ -# Copyright (c) Meta Platforms, Inc. and affiliates. -# All rights reserved. -# -# This source code is licensed under the terms described in the LICENSE file in -# the root directory of this source tree. - -from .ci_tests import get_distribution_template # noqa: F401 diff --git a/llama_stack/templates/ci-tests/build.yaml b/llama_stack/templates/ci-tests/build.yaml deleted file mode 100644 index 625e36e4f..000000000 --- a/llama_stack/templates/ci-tests/build.yaml +++ /dev/null @@ -1,60 +0,0 @@ -version: 2 -distribution_spec: - description: CI tests for Llama Stack - providers: - inference: - - remote::cerebras - - remote::ollama - - remote::vllm - - remote::tgi - - remote::hf::serverless - - remote::hf::endpoint - - remote::fireworks - - remote::together - - remote::bedrock - - remote::databricks - - remote::nvidia - - remote::runpod - - remote::openai - - remote::anthropic - - remote::gemini - - remote::groq - - remote::llama-openai-compat - - remote::sambanova - - remote::passthrough - - inline::sentence-transformers - vector_io: - - inline::faiss - - inline::sqlite-vec - - inline::milvus - - remote::chromadb - - remote::pgvector - files: - - inline::localfs - safety: - - inline::llama-guard - agents: - - inline::meta-reference - telemetry: - - inline::meta-reference - post_training: - - inline::huggingface - eval: - - inline::meta-reference - datasetio: - - remote::huggingface - - inline::localfs - scoring: - - inline::basic - - inline::llm-as-judge - - inline::braintrust - tool_runtime: - - remote::brave-search - - remote::tavily-search - - inline::rag-runtime - - remote::model-context-protocol -image_type: conda -additional_pip_packages: -- aiosqlite -- asyncpg -- sqlalchemy[asyncio] diff --git a/llama_stack/templates/ci-tests/ci_tests.py b/llama_stack/templates/ci-tests/ci_tests.py deleted file mode 100644 index 49cb36e39..000000000 --- a/llama_stack/templates/ci-tests/ci_tests.py +++ /dev/null @@ -1,19 +0,0 @@ -# Copyright (c) Meta Platforms, Inc. and affiliates. -# All rights reserved. -# -# This source code is licensed under the terms described in the LICENSE file in -# the root directory of this source tree. - - -from llama_stack.templates.template import DistributionTemplate - -from ..starter.starter import get_distribution_template as get_starter_distribution_template - - -def get_distribution_template() -> DistributionTemplate: - template = get_starter_distribution_template() - name = "ci-tests" - template.name = name - template.description = "CI tests for Llama Stack" - - return template diff --git a/llama_stack/templates/ci-tests/run.yaml b/llama_stack/templates/ci-tests/run.yaml deleted file mode 100644 index 1396d54a8..000000000 --- a/llama_stack/templates/ci-tests/run.yaml +++ /dev/null @@ -1,1138 +0,0 @@ -version: 2 -image_name: ci-tests -apis: -- agents -- datasetio -- eval -- files -- inference -- post_training -- safety -- scoring -- telemetry -- tool_runtime -- vector_io -providers: - inference: - - provider_id: ${env.ENABLE_CEREBRAS:=__disabled__} - provider_type: remote::cerebras - config: - base_url: https://api.cerebras.ai - api_key: ${env.CEREBRAS_API_KEY} - - provider_id: ${env.ENABLE_OLLAMA:=__disabled__} - provider_type: remote::ollama - config: - url: ${env.OLLAMA_URL:=http://localhost:11434} - - provider_id: ${env.ENABLE_VLLM:=__disabled__} - provider_type: remote::vllm - config: - url: ${env.VLLM_URL:=} - max_tokens: ${env.VLLM_MAX_TOKENS:=4096} - api_token: ${env.VLLM_API_TOKEN:=fake} - tls_verify: ${env.VLLM_TLS_VERIFY:=true} - - provider_id: ${env.ENABLE_TGI:=__disabled__} - provider_type: remote::tgi - config: - url: ${env.TGI_URL} - - provider_id: ${env.ENABLE_HF_SERVERLESS:=__disabled__} - provider_type: remote::hf::serverless - config: - huggingface_repo: ${env.INFERENCE_MODEL} - api_token: ${env.HF_API_TOKEN} - - provider_id: ${env.ENABLE_HF_ENDPOINT:=__disabled__} - provider_type: remote::hf::endpoint - config: - endpoint_name: ${env.INFERENCE_ENDPOINT_NAME} - api_token: ${env.HF_API_TOKEN} - - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_type: remote::fireworks - config: - url: https://api.fireworks.ai/inference/v1 - api_key: ${env.FIREWORKS_API_KEY} - - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_type: remote::together - config: - url: https://api.together.xyz/v1 - api_key: ${env.TOGETHER_API_KEY} - - provider_id: ${env.ENABLE_BEDROCK:=__disabled__} - provider_type: remote::bedrock - config: {} - - provider_id: ${env.ENABLE_DATABRICKS:=__disabled__} - provider_type: remote::databricks - config: - url: ${env.DATABRICKS_URL} - api_token: ${env.DATABRICKS_API_TOKEN} - - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_type: remote::nvidia - config: - url: ${env.NVIDIA_BASE_URL:=https://integrate.api.nvidia.com} - api_key: ${env.NVIDIA_API_KEY:=} - append_api_version: ${env.NVIDIA_APPEND_API_VERSION:=True} - - provider_id: ${env.ENABLE_RUNPOD:=__disabled__} - provider_type: remote::runpod - config: - url: ${env.RUNPOD_URL:=} - api_token: ${env.RUNPOD_API_TOKEN} - - provider_id: ${env.ENABLE_OPENAI:=__disabled__} - provider_type: remote::openai - config: - api_key: ${env.OPENAI_API_KEY} - - provider_id: ${env.ENABLE_ANTHROPIC:=__disabled__} - provider_type: remote::anthropic - config: - api_key: ${env.ANTHROPIC_API_KEY} - - provider_id: ${env.ENABLE_GEMINI:=__disabled__} - provider_type: remote::gemini - config: - api_key: ${env.GEMINI_API_KEY} - - provider_id: ${env.ENABLE_GROQ:=__disabled__} - provider_type: remote::groq - config: - url: https://api.groq.com - api_key: ${env.GROQ_API_KEY} - - provider_id: ${env.ENABLE_LLAMA_OPENAI_COMPAT:=__disabled__} - provider_type: remote::llama-openai-compat - config: - openai_compat_api_base: https://api.llama.com/compat/v1/ - api_key: ${env.LLAMA_API_KEY} - - provider_id: ${env.ENABLE_SAMBANOVA:=__disabled__} - provider_type: remote::sambanova - config: - url: https://api.sambanova.ai/v1 - api_key: ${env.SAMBANOVA_API_KEY} - - provider_id: ${env.ENABLE_PASSTHROUGH:=__disabled__} - provider_type: remote::passthrough - config: - url: ${env.PASSTHROUGH_URL} - api_key: ${env.PASSTHROUGH_API_KEY} - - provider_id: ${env.ENABLE_SENTENCE_TRANSFORMERS:=sentence-transformers} - provider_type: inline::sentence-transformers - config: {} - vector_io: - - provider_id: ${env.ENABLE_FAISS:=faiss} - provider_type: inline::faiss - config: - kvstore: - type: sqlite - db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/faiss_store.db - - provider_id: ${env.ENABLE_SQLITE_VEC:=__disabled__} - provider_type: inline::sqlite-vec - config: - db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/sqlite_vec.db - kvstore: - type: sqlite - db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/sqlite_vec_registry.db - - provider_id: ${env.ENABLE_MILVUS:=__disabled__} - provider_type: inline::milvus - config: - db_path: ${env.MILVUS_DB_PATH:=~/.llama/distributions/starter}/milvus.db - kvstore: - type: sqlite - db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/milvus_registry.db - - provider_id: ${env.ENABLE_CHROMADB:=__disabled__} - provider_type: remote::chromadb - config: - url: ${env.CHROMADB_URL:=} - kvstore: - type: sqlite - db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter/}/chroma_remote_registry.db - - provider_id: ${env.ENABLE_PGVECTOR:=__disabled__} - provider_type: remote::pgvector - config: - host: ${env.PGVECTOR_HOST:=localhost} - port: ${env.PGVECTOR_PORT:=5432} - db: ${env.PGVECTOR_DB:=} - user: ${env.PGVECTOR_USER:=} - password: ${env.PGVECTOR_PASSWORD:=} - kvstore: - type: sqlite - db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/pgvector_registry.db - files: - - provider_id: meta-reference-files - provider_type: inline::localfs - config: - storage_dir: ${env.FILES_STORAGE_DIR:=~/.llama/distributions/starter/files} - metadata_store: - type: sqlite - db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/files_metadata.db - safety: - - provider_id: llama-guard - provider_type: inline::llama-guard - config: - excluded_categories: [] - agents: - - provider_id: meta-reference - provider_type: inline::meta-reference - config: - persistence_store: - type: sqlite - db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/ci-tests}/agents_store.db - responses_store: - type: sqlite - db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/ci-tests}/responses_store.db - telemetry: - - provider_id: meta-reference - provider_type: inline::meta-reference - config: - service_name: "${env.OTEL_SERVICE_NAME:=\u200B}" - sinks: ${env.TELEMETRY_SINKS:=console,sqlite} - sqlite_db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/ci-tests}/trace_store.db - otel_exporter_otlp_endpoint: ${env.OTEL_EXPORTER_OTLP_ENDPOINT:=} - post_training: - - provider_id: huggingface - provider_type: inline::huggingface - config: - checkpoint_format: huggingface - distributed_backend: null - device: cpu - eval: - - provider_id: meta-reference - provider_type: inline::meta-reference - config: - kvstore: - type: sqlite - db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/ci-tests}/meta_reference_eval.db - datasetio: - - provider_id: huggingface - provider_type: remote::huggingface - config: - kvstore: - type: sqlite - db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/ci-tests}/huggingface_datasetio.db - - provider_id: localfs - provider_type: inline::localfs - config: - kvstore: - type: sqlite - db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/ci-tests}/localfs_datasetio.db - scoring: - - provider_id: basic - provider_type: inline::basic - config: {} - - provider_id: llm-as-judge - provider_type: inline::llm-as-judge - config: {} - - provider_id: braintrust - provider_type: inline::braintrust - config: - openai_api_key: ${env.OPENAI_API_KEY:=} - tool_runtime: - - provider_id: brave-search - provider_type: remote::brave-search - config: - api_key: ${env.BRAVE_SEARCH_API_KEY:=} - max_results: 3 - - provider_id: tavily-search - provider_type: remote::tavily-search - config: - api_key: ${env.TAVILY_SEARCH_API_KEY:=} - max_results: 3 - - provider_id: rag-runtime - provider_type: inline::rag-runtime - config: {} - - provider_id: model-context-protocol - provider_type: remote::model-context-protocol - config: {} -metadata_store: - type: sqlite - db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/ci-tests}/registry.db -inference_store: - type: sqlite - db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/ci-tests}/inference_store.db -models: -- metadata: - embedding_dimension: 384 - model_id: all-MiniLM-L6-v2 - provider_id: ${env.ENABLE_SENTENCE_TRANSFORMERS:=sentence-transformers} - model_type: embedding -- metadata: {} - model_id: ${env.ENABLE_CEREBRAS:=__disabled__}/llama3.1-8b - provider_id: ${env.ENABLE_CEREBRAS:=__disabled__} - provider_model_id: llama3.1-8b - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_CEREBRAS:=__disabled__}/meta-llama/Llama-3.1-8B-Instruct - provider_id: ${env.ENABLE_CEREBRAS:=__disabled__} - provider_model_id: llama3.1-8b - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_CEREBRAS:=__disabled__}/llama-3.3-70b - provider_id: ${env.ENABLE_CEREBRAS:=__disabled__} - provider_model_id: llama-3.3-70b - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_CEREBRAS:=__disabled__}/meta-llama/Llama-3.3-70B-Instruct - provider_id: ${env.ENABLE_CEREBRAS:=__disabled__} - provider_model_id: llama-3.3-70b - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_CEREBRAS:=__disabled__}/llama-4-scout-17b-16e-instruct - provider_id: ${env.ENABLE_CEREBRAS:=__disabled__} - provider_model_id: llama-4-scout-17b-16e-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_CEREBRAS:=__disabled__}/meta-llama/Llama-4-Scout-17B-16E-Instruct - provider_id: ${env.ENABLE_CEREBRAS:=__disabled__} - provider_model_id: llama-4-scout-17b-16e-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_OLLAMA:=__disabled__}/${env.OLLAMA_INFERENCE_MODEL:=__disabled__} - provider_id: ${env.ENABLE_OLLAMA:=__disabled__} - provider_model_id: ${env.OLLAMA_INFERENCE_MODEL:=__disabled__} - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_OLLAMA:=__disabled__}/${env.SAFETY_MODEL:=__disabled__} - provider_id: ${env.ENABLE_OLLAMA:=__disabled__} - provider_model_id: ${env.SAFETY_MODEL:=__disabled__} - model_type: llm -- metadata: - embedding_dimension: ${env.OLLAMA_EMBEDDING_DIMENSION:=384} - model_id: ${env.ENABLE_OLLAMA:=__disabled__}/${env.OLLAMA_EMBEDDING_MODEL:=__disabled__} - provider_id: ${env.ENABLE_OLLAMA:=__disabled__} - provider_model_id: ${env.OLLAMA_EMBEDDING_MODEL:=__disabled__} - model_type: embedding -- metadata: {} - model_id: ${env.ENABLE_VLLM:=__disabled__}/${env.VLLM_INFERENCE_MODEL:=__disabled__} - provider_id: ${env.ENABLE_VLLM:=__disabled__} - provider_model_id: ${env.VLLM_INFERENCE_MODEL:=__disabled__} - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/accounts/fireworks/models/llama-v3p1-8b-instruct - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: accounts/fireworks/models/llama-v3p1-8b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/meta-llama/Llama-3.1-8B-Instruct - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: accounts/fireworks/models/llama-v3p1-8b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/accounts/fireworks/models/llama-v3p1-70b-instruct - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: accounts/fireworks/models/llama-v3p1-70b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/meta-llama/Llama-3.1-70B-Instruct - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: accounts/fireworks/models/llama-v3p1-70b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/accounts/fireworks/models/llama-v3p1-405b-instruct - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: accounts/fireworks/models/llama-v3p1-405b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/meta-llama/Llama-3.1-405B-Instruct-FP8 - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: accounts/fireworks/models/llama-v3p1-405b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/accounts/fireworks/models/llama-v3p2-3b-instruct - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: accounts/fireworks/models/llama-v3p2-3b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/meta-llama/Llama-3.2-3B-Instruct - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: accounts/fireworks/models/llama-v3p2-3b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/accounts/fireworks/models/llama-v3p2-11b-vision-instruct - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: accounts/fireworks/models/llama-v3p2-11b-vision-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/meta-llama/Llama-3.2-11B-Vision-Instruct - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: accounts/fireworks/models/llama-v3p2-11b-vision-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/accounts/fireworks/models/llama-v3p2-90b-vision-instruct - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: accounts/fireworks/models/llama-v3p2-90b-vision-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/meta-llama/Llama-3.2-90B-Vision-Instruct - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: accounts/fireworks/models/llama-v3p2-90b-vision-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/accounts/fireworks/models/llama-v3p3-70b-instruct - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: accounts/fireworks/models/llama-v3p3-70b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/meta-llama/Llama-3.3-70B-Instruct - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: accounts/fireworks/models/llama-v3p3-70b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/accounts/fireworks/models/llama4-scout-instruct-basic - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: accounts/fireworks/models/llama4-scout-instruct-basic - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/meta-llama/Llama-4-Scout-17B-16E-Instruct - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: accounts/fireworks/models/llama4-scout-instruct-basic - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/accounts/fireworks/models/llama4-maverick-instruct-basic - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: accounts/fireworks/models/llama4-maverick-instruct-basic - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/meta-llama/Llama-4-Maverick-17B-128E-Instruct - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: accounts/fireworks/models/llama4-maverick-instruct-basic - model_type: llm -- metadata: - embedding_dimension: 768 - context_length: 8192 - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/nomic-ai/nomic-embed-text-v1.5 - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: nomic-ai/nomic-embed-text-v1.5 - model_type: embedding -- metadata: {} - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/accounts/fireworks/models/llama-guard-3-8b - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: accounts/fireworks/models/llama-guard-3-8b - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/meta-llama/Llama-Guard-3-8B - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: accounts/fireworks/models/llama-guard-3-8b - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/accounts/fireworks/models/llama-guard-3-11b-vision - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: accounts/fireworks/models/llama-guard-3-11b-vision - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_FIREWORKS:=__disabled__}/meta-llama/Llama-Guard-3-11B-Vision - provider_id: ${env.ENABLE_FIREWORKS:=__disabled__} - provider_model_id: accounts/fireworks/models/llama-guard-3-11b-vision - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/meta-llama/Llama-3.1-8B-Instruct - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/meta-llama/Llama-3.1-70B-Instruct - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/meta-llama/Llama-3.1-405B-Instruct-FP8 - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/meta-llama/Llama-3.2-3B-Instruct-Turbo - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Llama-3.2-3B-Instruct-Turbo - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/meta-llama/Llama-3.2-3B-Instruct - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Llama-3.2-3B-Instruct-Turbo - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/meta-llama/Llama-3.2-11B-Vision-Instruct-Turbo - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Llama-3.2-11B-Vision-Instruct-Turbo - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/meta-llama/Llama-3.2-11B-Vision-Instruct - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Llama-3.2-11B-Vision-Instruct-Turbo - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/meta-llama/Llama-3.2-90B-Vision-Instruct-Turbo - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Llama-3.2-90B-Vision-Instruct-Turbo - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/meta-llama/Llama-3.2-90B-Vision-Instruct - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Llama-3.2-90B-Vision-Instruct-Turbo - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/meta-llama/Llama-3.3-70B-Instruct-Turbo - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Llama-3.3-70B-Instruct-Turbo - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/meta-llama/Llama-3.3-70B-Instruct - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Llama-3.3-70B-Instruct-Turbo - model_type: llm -- metadata: - embedding_dimension: 768 - context_length: 8192 - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/togethercomputer/m2-bert-80M-8k-retrieval - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: togethercomputer/m2-bert-80M-8k-retrieval - model_type: embedding -- metadata: - embedding_dimension: 768 - context_length: 32768 - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/togethercomputer/m2-bert-80M-32k-retrieval - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: togethercomputer/m2-bert-80M-32k-retrieval - model_type: embedding -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/meta-llama/Llama-4-Scout-17B-16E-Instruct - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Llama-4-Scout-17B-16E-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/meta-llama/Llama-4-Scout-17B-16E-Instruct - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Llama-4-Scout-17B-16E-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/together/meta-llama/Llama-4-Scout-17B-16E-Instruct - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Llama-4-Scout-17B-16E-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8 - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8 - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/meta-llama/Llama-4-Maverick-17B-128E-Instruct - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8 - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/together/meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8 - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8 - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/meta-llama/Llama-Guard-3-8B - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Llama-Guard-3-8B - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/meta-llama/Llama-Guard-3-8B - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Llama-Guard-3-8B - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/meta-llama/Llama-Guard-3-11B-Vision-Turbo - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Llama-Guard-3-11B-Vision-Turbo - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_TOGETHER:=__disabled__}/meta-llama/Llama-Guard-3-11B-Vision - provider_id: ${env.ENABLE_TOGETHER:=__disabled__} - provider_model_id: meta-llama/Llama-Guard-3-11B-Vision-Turbo - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_BEDROCK:=__disabled__}/meta.llama3-1-8b-instruct-v1:0 - provider_id: ${env.ENABLE_BEDROCK:=__disabled__} - provider_model_id: meta.llama3-1-8b-instruct-v1:0 - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_BEDROCK:=__disabled__}/meta-llama/Llama-3.1-8B-Instruct - provider_id: ${env.ENABLE_BEDROCK:=__disabled__} - provider_model_id: meta.llama3-1-8b-instruct-v1:0 - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_BEDROCK:=__disabled__}/meta.llama3-1-70b-instruct-v1:0 - provider_id: ${env.ENABLE_BEDROCK:=__disabled__} - provider_model_id: meta.llama3-1-70b-instruct-v1:0 - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_BEDROCK:=__disabled__}/meta-llama/Llama-3.1-70B-Instruct - provider_id: ${env.ENABLE_BEDROCK:=__disabled__} - provider_model_id: meta.llama3-1-70b-instruct-v1:0 - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_BEDROCK:=__disabled__}/meta.llama3-1-405b-instruct-v1:0 - provider_id: ${env.ENABLE_BEDROCK:=__disabled__} - provider_model_id: meta.llama3-1-405b-instruct-v1:0 - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_BEDROCK:=__disabled__}/meta-llama/Llama-3.1-405B-Instruct-FP8 - provider_id: ${env.ENABLE_BEDROCK:=__disabled__} - provider_model_id: meta.llama3-1-405b-instruct-v1:0 - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_DATABRICKS:=__disabled__}/databricks-meta-llama-3-1-70b-instruct - provider_id: ${env.ENABLE_DATABRICKS:=__disabled__} - provider_model_id: databricks-meta-llama-3-1-70b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_DATABRICKS:=__disabled__}/meta-llama/Llama-3.1-70B-Instruct - provider_id: ${env.ENABLE_DATABRICKS:=__disabled__} - provider_model_id: databricks-meta-llama-3-1-70b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_DATABRICKS:=__disabled__}/databricks-meta-llama-3-1-405b-instruct - provider_id: ${env.ENABLE_DATABRICKS:=__disabled__} - provider_model_id: databricks-meta-llama-3-1-405b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_DATABRICKS:=__disabled__}/meta-llama/Llama-3.1-405B-Instruct-FP8 - provider_id: ${env.ENABLE_DATABRICKS:=__disabled__} - provider_model_id: databricks-meta-llama-3-1-405b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/meta/llama3-8b-instruct - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: meta/llama3-8b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/meta-llama/Llama-3-8B-Instruct - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: meta/llama3-8b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/meta/llama3-70b-instruct - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: meta/llama3-70b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/meta-llama/Llama-3-70B-Instruct - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: meta/llama3-70b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/meta/llama-3.1-8b-instruct - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: meta/llama-3.1-8b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/meta-llama/Llama-3.1-8B-Instruct - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: meta/llama-3.1-8b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/meta/llama-3.1-70b-instruct - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: meta/llama-3.1-70b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/meta-llama/Llama-3.1-70B-Instruct - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: meta/llama-3.1-70b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/meta/llama-3.1-405b-instruct - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: meta/llama-3.1-405b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/meta-llama/Llama-3.1-405B-Instruct-FP8 - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: meta/llama-3.1-405b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/meta/llama-3.2-1b-instruct - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: meta/llama-3.2-1b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/meta-llama/Llama-3.2-1B-Instruct - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: meta/llama-3.2-1b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/meta/llama-3.2-3b-instruct - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: meta/llama-3.2-3b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/meta-llama/Llama-3.2-3B-Instruct - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: meta/llama-3.2-3b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/meta/llama-3.2-11b-vision-instruct - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: meta/llama-3.2-11b-vision-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/meta-llama/Llama-3.2-11B-Vision-Instruct - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: meta/llama-3.2-11b-vision-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/meta/llama-3.2-90b-vision-instruct - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: meta/llama-3.2-90b-vision-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/meta-llama/Llama-3.2-90B-Vision-Instruct - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: meta/llama-3.2-90b-vision-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/meta/llama-3.3-70b-instruct - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: meta/llama-3.3-70b-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/meta-llama/Llama-3.3-70B-Instruct - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: meta/llama-3.3-70b-instruct - model_type: llm -- metadata: - embedding_dimension: 2048 - context_length: 8192 - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/nvidia/llama-3.2-nv-embedqa-1b-v2 - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: nvidia/llama-3.2-nv-embedqa-1b-v2 - model_type: embedding -- metadata: - embedding_dimension: 1024 - context_length: 512 - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/nvidia/nv-embedqa-e5-v5 - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: nvidia/nv-embedqa-e5-v5 - model_type: embedding -- metadata: - embedding_dimension: 4096 - context_length: 512 - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/nvidia/nv-embedqa-mistral-7b-v2 - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: nvidia/nv-embedqa-mistral-7b-v2 - model_type: embedding -- metadata: - embedding_dimension: 1024 - context_length: 512 - model_id: ${env.ENABLE_NVIDIA:=__disabled__}/snowflake/arctic-embed-l - provider_id: ${env.ENABLE_NVIDIA:=__disabled__} - provider_model_id: snowflake/arctic-embed-l - model_type: embedding -- metadata: {} - model_id: ${env.ENABLE_RUNPOD:=__disabled__}/Llama3.1-8B - provider_id: ${env.ENABLE_RUNPOD:=__disabled__} - provider_model_id: Llama3.1-8B - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_RUNPOD:=__disabled__}/Llama3.1-70B - provider_id: ${env.ENABLE_RUNPOD:=__disabled__} - provider_model_id: Llama3.1-70B - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_RUNPOD:=__disabled__}/Llama3.1-405B:bf16-mp8 - provider_id: ${env.ENABLE_RUNPOD:=__disabled__} - provider_model_id: Llama3.1-405B:bf16-mp8 - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_RUNPOD:=__disabled__}/Llama3.1-405B - provider_id: ${env.ENABLE_RUNPOD:=__disabled__} - provider_model_id: Llama3.1-405B - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_RUNPOD:=__disabled__}/Llama3.1-405B:bf16-mp16 - provider_id: ${env.ENABLE_RUNPOD:=__disabled__} - provider_model_id: Llama3.1-405B:bf16-mp16 - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_RUNPOD:=__disabled__}/Llama3.1-8B-Instruct - provider_id: ${env.ENABLE_RUNPOD:=__disabled__} - provider_model_id: Llama3.1-8B-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_RUNPOD:=__disabled__}/Llama3.1-70B-Instruct - provider_id: ${env.ENABLE_RUNPOD:=__disabled__} - provider_model_id: Llama3.1-70B-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_RUNPOD:=__disabled__}/Llama3.1-405B-Instruct:bf16-mp8 - provider_id: ${env.ENABLE_RUNPOD:=__disabled__} - provider_model_id: Llama3.1-405B-Instruct:bf16-mp8 - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_RUNPOD:=__disabled__}/Llama3.1-405B-Instruct - provider_id: ${env.ENABLE_RUNPOD:=__disabled__} - provider_model_id: Llama3.1-405B-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_RUNPOD:=__disabled__}/Llama3.1-405B-Instruct:bf16-mp16 - provider_id: ${env.ENABLE_RUNPOD:=__disabled__} - provider_model_id: Llama3.1-405B-Instruct:bf16-mp16 - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_RUNPOD:=__disabled__}/Llama3.2-1B - provider_id: ${env.ENABLE_RUNPOD:=__disabled__} - provider_model_id: Llama3.2-1B - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_RUNPOD:=__disabled__}/Llama3.2-3B - provider_id: ${env.ENABLE_RUNPOD:=__disabled__} - provider_model_id: Llama3.2-3B - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_OPENAI:=__disabled__}/gpt-3.5-turbo-0125 - provider_id: ${env.ENABLE_OPENAI:=__disabled__} - provider_model_id: gpt-3.5-turbo-0125 - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_OPENAI:=__disabled__}/gpt-3.5-turbo - provider_id: ${env.ENABLE_OPENAI:=__disabled__} - provider_model_id: gpt-3.5-turbo - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_OPENAI:=__disabled__}/gpt-3.5-turbo-instruct - provider_id: ${env.ENABLE_OPENAI:=__disabled__} - provider_model_id: gpt-3.5-turbo-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_OPENAI:=__disabled__}/gpt-4 - provider_id: ${env.ENABLE_OPENAI:=__disabled__} - provider_model_id: gpt-4 - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_OPENAI:=__disabled__}/gpt-4-turbo - provider_id: ${env.ENABLE_OPENAI:=__disabled__} - provider_model_id: gpt-4-turbo - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_OPENAI:=__disabled__}/gpt-4o - provider_id: ${env.ENABLE_OPENAI:=__disabled__} - provider_model_id: gpt-4o - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_OPENAI:=__disabled__}/gpt-4o-2024-08-06 - provider_id: ${env.ENABLE_OPENAI:=__disabled__} - provider_model_id: gpt-4o-2024-08-06 - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_OPENAI:=__disabled__}/gpt-4o-mini - provider_id: ${env.ENABLE_OPENAI:=__disabled__} - provider_model_id: gpt-4o-mini - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_OPENAI:=__disabled__}/gpt-4o-audio-preview - provider_id: ${env.ENABLE_OPENAI:=__disabled__} - provider_model_id: gpt-4o-audio-preview - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_OPENAI:=__disabled__}/chatgpt-4o-latest - provider_id: ${env.ENABLE_OPENAI:=__disabled__} - provider_model_id: chatgpt-4o-latest - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_OPENAI:=__disabled__}/o1 - provider_id: ${env.ENABLE_OPENAI:=__disabled__} - provider_model_id: o1 - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_OPENAI:=__disabled__}/o1-mini - provider_id: ${env.ENABLE_OPENAI:=__disabled__} - provider_model_id: o1-mini - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_OPENAI:=__disabled__}/o3-mini - provider_id: ${env.ENABLE_OPENAI:=__disabled__} - provider_model_id: o3-mini - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_OPENAI:=__disabled__}/o4-mini - provider_id: ${env.ENABLE_OPENAI:=__disabled__} - provider_model_id: o4-mini - model_type: llm -- metadata: - embedding_dimension: 1536 - context_length: 8192 - model_id: ${env.ENABLE_OPENAI:=__disabled__}/text-embedding-3-small - provider_id: ${env.ENABLE_OPENAI:=__disabled__} - provider_model_id: text-embedding-3-small - model_type: embedding -- metadata: - embedding_dimension: 3072 - context_length: 8192 - model_id: ${env.ENABLE_OPENAI:=__disabled__}/text-embedding-3-large - provider_id: ${env.ENABLE_OPENAI:=__disabled__} - provider_model_id: text-embedding-3-large - model_type: embedding -- metadata: {} - model_id: ${env.ENABLE_ANTHROPIC:=__disabled__}/anthropic/claude-3-5-sonnet-latest - provider_id: ${env.ENABLE_ANTHROPIC:=__disabled__} - provider_model_id: anthropic/claude-3-5-sonnet-latest - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_ANTHROPIC:=__disabled__}/anthropic/claude-3-7-sonnet-latest - provider_id: ${env.ENABLE_ANTHROPIC:=__disabled__} - provider_model_id: anthropic/claude-3-7-sonnet-latest - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_ANTHROPIC:=__disabled__}/anthropic/claude-3-5-haiku-latest - provider_id: ${env.ENABLE_ANTHROPIC:=__disabled__} - provider_model_id: anthropic/claude-3-5-haiku-latest - model_type: llm -- metadata: - embedding_dimension: 1024 - context_length: 32000 - model_id: ${env.ENABLE_ANTHROPIC:=__disabled__}/anthropic/voyage-3 - provider_id: ${env.ENABLE_ANTHROPIC:=__disabled__} - provider_model_id: anthropic/voyage-3 - model_type: embedding -- metadata: - embedding_dimension: 512 - context_length: 32000 - model_id: ${env.ENABLE_ANTHROPIC:=__disabled__}/anthropic/voyage-3-lite - provider_id: ${env.ENABLE_ANTHROPIC:=__disabled__} - provider_model_id: anthropic/voyage-3-lite - model_type: embedding -- metadata: - embedding_dimension: 1024 - context_length: 32000 - model_id: ${env.ENABLE_ANTHROPIC:=__disabled__}/anthropic/voyage-code-3 - provider_id: ${env.ENABLE_ANTHROPIC:=__disabled__} - provider_model_id: anthropic/voyage-code-3 - model_type: embedding -- metadata: {} - model_id: ${env.ENABLE_GEMINI:=__disabled__}/gemini/gemini-1.5-flash - provider_id: ${env.ENABLE_GEMINI:=__disabled__} - provider_model_id: gemini/gemini-1.5-flash - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_GEMINI:=__disabled__}/gemini/gemini-1.5-pro - provider_id: ${env.ENABLE_GEMINI:=__disabled__} - provider_model_id: gemini/gemini-1.5-pro - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_GEMINI:=__disabled__}/gemini/gemini-2.0-flash - provider_id: ${env.ENABLE_GEMINI:=__disabled__} - provider_model_id: gemini/gemini-2.0-flash - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_GEMINI:=__disabled__}/gemini/gemini-2.5-flash - provider_id: ${env.ENABLE_GEMINI:=__disabled__} - provider_model_id: gemini/gemini-2.5-flash - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_GEMINI:=__disabled__}/gemini/gemini-2.5-pro - provider_id: ${env.ENABLE_GEMINI:=__disabled__} - provider_model_id: gemini/gemini-2.5-pro - model_type: llm -- metadata: - embedding_dimension: 768 - context_length: 2048 - model_id: ${env.ENABLE_GEMINI:=__disabled__}/gemini/text-embedding-004 - provider_id: ${env.ENABLE_GEMINI:=__disabled__} - provider_model_id: gemini/text-embedding-004 - model_type: embedding -- metadata: {} - model_id: ${env.ENABLE_GROQ:=__disabled__}/groq/llama3-8b-8192 - provider_id: ${env.ENABLE_GROQ:=__disabled__} - provider_model_id: groq/llama3-8b-8192 - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_GROQ:=__disabled__}/meta-llama/Llama-3.1-8B-Instruct - provider_id: ${env.ENABLE_GROQ:=__disabled__} - provider_model_id: groq/llama3-8b-8192 - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_GROQ:=__disabled__}/groq/llama-3.1-8b-instant - provider_id: ${env.ENABLE_GROQ:=__disabled__} - provider_model_id: groq/llama-3.1-8b-instant - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_GROQ:=__disabled__}/groq/llama3-70b-8192 - provider_id: ${env.ENABLE_GROQ:=__disabled__} - provider_model_id: groq/llama3-70b-8192 - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_GROQ:=__disabled__}/meta-llama/Llama-3-70B-Instruct - provider_id: ${env.ENABLE_GROQ:=__disabled__} - provider_model_id: groq/llama3-70b-8192 - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_GROQ:=__disabled__}/groq/llama-3.3-70b-versatile - provider_id: ${env.ENABLE_GROQ:=__disabled__} - provider_model_id: groq/llama-3.3-70b-versatile - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_GROQ:=__disabled__}/meta-llama/Llama-3.3-70B-Instruct - provider_id: ${env.ENABLE_GROQ:=__disabled__} - provider_model_id: groq/llama-3.3-70b-versatile - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_GROQ:=__disabled__}/groq/llama-3.2-3b-preview - provider_id: ${env.ENABLE_GROQ:=__disabled__} - provider_model_id: groq/llama-3.2-3b-preview - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_GROQ:=__disabled__}/meta-llama/Llama-3.2-3B-Instruct - provider_id: ${env.ENABLE_GROQ:=__disabled__} - provider_model_id: groq/llama-3.2-3b-preview - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_GROQ:=__disabled__}/groq/llama-4-scout-17b-16e-instruct - provider_id: ${env.ENABLE_GROQ:=__disabled__} - provider_model_id: groq/llama-4-scout-17b-16e-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_GROQ:=__disabled__}/meta-llama/Llama-4-Scout-17B-16E-Instruct - provider_id: ${env.ENABLE_GROQ:=__disabled__} - provider_model_id: groq/llama-4-scout-17b-16e-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_GROQ:=__disabled__}/groq/meta-llama/llama-4-scout-17b-16e-instruct - provider_id: ${env.ENABLE_GROQ:=__disabled__} - provider_model_id: groq/meta-llama/llama-4-scout-17b-16e-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_GROQ:=__disabled__}/meta-llama/Llama-4-Scout-17B-16E-Instruct - provider_id: ${env.ENABLE_GROQ:=__disabled__} - provider_model_id: groq/meta-llama/llama-4-scout-17b-16e-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_GROQ:=__disabled__}/groq/llama-4-maverick-17b-128e-instruct - provider_id: ${env.ENABLE_GROQ:=__disabled__} - provider_model_id: groq/llama-4-maverick-17b-128e-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_GROQ:=__disabled__}/meta-llama/Llama-4-Maverick-17B-128E-Instruct - provider_id: ${env.ENABLE_GROQ:=__disabled__} - provider_model_id: groq/llama-4-maverick-17b-128e-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_GROQ:=__disabled__}/groq/meta-llama/llama-4-maverick-17b-128e-instruct - provider_id: ${env.ENABLE_GROQ:=__disabled__} - provider_model_id: groq/meta-llama/llama-4-maverick-17b-128e-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_GROQ:=__disabled__}/meta-llama/Llama-4-Maverick-17B-128E-Instruct - provider_id: ${env.ENABLE_GROQ:=__disabled__} - provider_model_id: groq/meta-llama/llama-4-maverick-17b-128e-instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_SAMBANOVA:=__disabled__}/sambanova/Meta-Llama-3.1-8B-Instruct - provider_id: ${env.ENABLE_SAMBANOVA:=__disabled__} - provider_model_id: sambanova/Meta-Llama-3.1-8B-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_SAMBANOVA:=__disabled__}/meta-llama/Llama-3.1-8B-Instruct - provider_id: ${env.ENABLE_SAMBANOVA:=__disabled__} - provider_model_id: sambanova/Meta-Llama-3.1-8B-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_SAMBANOVA:=__disabled__}/sambanova/Meta-Llama-3.1-405B-Instruct - provider_id: ${env.ENABLE_SAMBANOVA:=__disabled__} - provider_model_id: sambanova/Meta-Llama-3.1-405B-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_SAMBANOVA:=__disabled__}/meta-llama/Llama-3.1-405B-Instruct-FP8 - provider_id: ${env.ENABLE_SAMBANOVA:=__disabled__} - provider_model_id: sambanova/Meta-Llama-3.1-405B-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_SAMBANOVA:=__disabled__}/sambanova/Meta-Llama-3.2-1B-Instruct - provider_id: ${env.ENABLE_SAMBANOVA:=__disabled__} - provider_model_id: sambanova/Meta-Llama-3.2-1B-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_SAMBANOVA:=__disabled__}/meta-llama/Llama-3.2-1B-Instruct - provider_id: ${env.ENABLE_SAMBANOVA:=__disabled__} - provider_model_id: sambanova/Meta-Llama-3.2-1B-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_SAMBANOVA:=__disabled__}/sambanova/Meta-Llama-3.2-3B-Instruct - provider_id: ${env.ENABLE_SAMBANOVA:=__disabled__} - provider_model_id: sambanova/Meta-Llama-3.2-3B-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_SAMBANOVA:=__disabled__}/meta-llama/Llama-3.2-3B-Instruct - provider_id: ${env.ENABLE_SAMBANOVA:=__disabled__} - provider_model_id: sambanova/Meta-Llama-3.2-3B-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_SAMBANOVA:=__disabled__}/sambanova/Meta-Llama-3.3-70B-Instruct - provider_id: ${env.ENABLE_SAMBANOVA:=__disabled__} - provider_model_id: sambanova/Meta-Llama-3.3-70B-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_SAMBANOVA:=__disabled__}/meta-llama/Llama-3.3-70B-Instruct - provider_id: ${env.ENABLE_SAMBANOVA:=__disabled__} - provider_model_id: sambanova/Meta-Llama-3.3-70B-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_SAMBANOVA:=__disabled__}/sambanova/Llama-3.2-11B-Vision-Instruct - provider_id: ${env.ENABLE_SAMBANOVA:=__disabled__} - provider_model_id: sambanova/Llama-3.2-11B-Vision-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_SAMBANOVA:=__disabled__}/meta-llama/Llama-3.2-11B-Vision-Instruct - provider_id: ${env.ENABLE_SAMBANOVA:=__disabled__} - provider_model_id: sambanova/Llama-3.2-11B-Vision-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_SAMBANOVA:=__disabled__}/sambanova/Llama-3.2-90B-Vision-Instruct - provider_id: ${env.ENABLE_SAMBANOVA:=__disabled__} - provider_model_id: sambanova/Llama-3.2-90B-Vision-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_SAMBANOVA:=__disabled__}/meta-llama/Llama-3.2-90B-Vision-Instruct - provider_id: ${env.ENABLE_SAMBANOVA:=__disabled__} - provider_model_id: sambanova/Llama-3.2-90B-Vision-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_SAMBANOVA:=__disabled__}/sambanova/Llama-4-Scout-17B-16E-Instruct - provider_id: ${env.ENABLE_SAMBANOVA:=__disabled__} - provider_model_id: sambanova/Llama-4-Scout-17B-16E-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_SAMBANOVA:=__disabled__}/meta-llama/Llama-4-Scout-17B-16E-Instruct - provider_id: ${env.ENABLE_SAMBANOVA:=__disabled__} - provider_model_id: sambanova/Llama-4-Scout-17B-16E-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_SAMBANOVA:=__disabled__}/sambanova/Llama-4-Maverick-17B-128E-Instruct - provider_id: ${env.ENABLE_SAMBANOVA:=__disabled__} - provider_model_id: sambanova/Llama-4-Maverick-17B-128E-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_SAMBANOVA:=__disabled__}/meta-llama/Llama-4-Maverick-17B-128E-Instruct - provider_id: ${env.ENABLE_SAMBANOVA:=__disabled__} - provider_model_id: sambanova/Llama-4-Maverick-17B-128E-Instruct - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_SAMBANOVA:=__disabled__}/sambanova/Meta-Llama-Guard-3-8B - provider_id: ${env.ENABLE_SAMBANOVA:=__disabled__} - provider_model_id: sambanova/Meta-Llama-Guard-3-8B - model_type: llm -- metadata: {} - model_id: ${env.ENABLE_SAMBANOVA:=__disabled__}/meta-llama/Llama-Guard-3-8B - provider_id: ${env.ENABLE_SAMBANOVA:=__disabled__} - provider_model_id: sambanova/Meta-Llama-Guard-3-8B - model_type: llm -shields: -- shield_id: ${env.SAFETY_MODEL:=__disabled__} - provider_shield_id: ${env.ENABLE_OLLAMA:=__disabled__}/${env.SAFETY_MODEL:=__disabled__} -vector_dbs: [] -datasets: [] -scoring_fns: [] -benchmarks: [] -tool_groups: -- toolgroup_id: builtin::websearch - provider_id: tavily-search -- toolgroup_id: builtin::rag - provider_id: rag-runtime -server: - port: 8321