From 6e03c3fb69cc928d78a19a728f6271da9740f371 Mon Sep 17 00:00:00 2001 From: Ashwin Bharambe Date: Thu, 20 Feb 2025 16:58:06 -0800 Subject: [PATCH] Run distro codegen for real --- docs/source/distributions/remote_hosted_distro/nvidia.md | 1 + llama_stack/templates/nvidia/run.yaml | 6 +++--- 2 files changed, 4 insertions(+), 3 deletions(-) diff --git a/docs/source/distributions/remote_hosted_distro/nvidia.md b/docs/source/distributions/remote_hosted_distro/nvidia.md index f352f737e..a1f70e450 100644 --- a/docs/source/distributions/remote_hosted_distro/nvidia.md +++ b/docs/source/distributions/remote_hosted_distro/nvidia.md @@ -36,6 +36,7 @@ The following models are available by default: - `meta-llama/Llama-3.2-3B-Instruct (meta/llama-3.2-3b-instruct)` - `meta-llama/Llama-3.2-11B-Vision-Instruct (meta/llama-3.2-11b-vision-instruct)` - `meta-llama/Llama-3.2-90B-Vision-Instruct (meta/llama-3.2-90b-vision-instruct)` +- `baai/bge-m3 (baai/bge-m3)` ### Prerequisite: API Keys diff --git a/llama_stack/templates/nvidia/run.yaml b/llama_stack/templates/nvidia/run.yaml index f3ffab169..891fd112a 100644 --- a/llama_stack/templates/nvidia/run.yaml +++ b/llama_stack/templates/nvidia/run.yaml @@ -135,9 +135,9 @@ models: provider_id: nvidia provider_model_id: meta/llama-3.2-90b-vision-instruct model_type: llm -- metadata: { - embedding_dimension: 1024 - } +- metadata: + embedding_dimensions: 1024 + context_length: 8192 model_id: baai/bge-m3 provider_id: nvidia provider_model_id: baai/bge-m3