diff --git a/docs/source/distributions/self_hosted_distro/sambanova.md b/docs/source/distributions/self_hosted_distro/sambanova.md index 1b98840fe..6b6663502 100644 --- a/docs/source/distributions/self_hosted_distro/sambanova.md +++ b/docs/source/distributions/self_hosted_distro/sambanova.md @@ -42,8 +42,9 @@ The following models are available by default: - `sambanova/Meta-Llama-3.3-70B-Instruct (aliases: meta-llama/Llama-3.3-70B-Instruct)` - `sambanova/Llama-3.2-11B-Vision-Instruct (aliases: meta-llama/Llama-3.2-11B-Vision-Instruct)` - `sambanova/Llama-3.2-90B-Vision-Instruct (aliases: meta-llama/Llama-3.2-90B-Vision-Instruct)` -- `sambanova/Meta-Llama-Guard-3-8B (aliases: meta-llama/Llama-Guard-3-8B)` - `sambanova/Llama-4-Scout-17B-16E-Instruct (aliases: meta-llama/Llama-4-Scout-17B-16E-Instruct)` +- `sambanova/Llama-4-Maverick-17B-128E-Instruct (aliases: meta-llama/Llama-4-Maverick-17B-128E-Instruct)` +- `sambanova/Meta-Llama-Guard-3-8B (aliases: meta-llama/Llama-Guard-3-8B)` ### Prerequisite: API Keys diff --git a/llama_stack/providers/remote/inference/sambanova/models.py b/llama_stack/providers/remote/inference/sambanova/models.py index 95d521288..f7b4184f8 100644 --- a/llama_stack/providers/remote/inference/sambanova/models.py +++ b/llama_stack/providers/remote/inference/sambanova/models.py @@ -42,12 +42,16 @@ MODEL_ENTRIES = [ "sambanova/Llama-3.2-90B-Vision-Instruct", CoreModelId.llama3_2_90b_vision_instruct.value, ), - build_hf_repo_model_entry( - "sambanova/Meta-Llama-Guard-3-8B", - CoreModelId.llama_guard_3_8b.value, - ), build_hf_repo_model_entry( "sambanova/Llama-4-Scout-17B-16E-Instruct", CoreModelId.llama4_scout_17b_16e_instruct.value, ), + build_hf_repo_model_entry( + "sambanova/Llama-4-Maverick-17B-128E-Instruct", + CoreModelId.llama4_maverick_17b_128e_instruct.value, + ), + build_hf_repo_model_entry( + "sambanova/Meta-Llama-Guard-3-8B", + CoreModelId.llama_guard_3_8b.value, + ), ] diff --git a/llama_stack/templates/dev/run.yaml b/llama_stack/templates/dev/run.yaml index 0ce5f1291..b19a1f243 100644 --- a/llama_stack/templates/dev/run.yaml +++ b/llama_stack/templates/dev/run.yaml @@ -481,16 +481,6 @@ models: provider_id: sambanova provider_model_id: sambanova/Llama-3.2-90B-Vision-Instruct model_type: llm -- metadata: {} - model_id: sambanova/Meta-Llama-Guard-3-8B - provider_id: sambanova - provider_model_id: sambanova/Meta-Llama-Guard-3-8B - model_type: llm -- metadata: {} - model_id: meta-llama/Llama-Guard-3-8B - provider_id: sambanova - provider_model_id: sambanova/Meta-Llama-Guard-3-8B - model_type: llm - metadata: {} model_id: sambanova/Llama-4-Scout-17B-16E-Instruct provider_id: sambanova @@ -501,6 +491,26 @@ models: provider_id: sambanova provider_model_id: sambanova/Llama-4-Scout-17B-16E-Instruct model_type: llm +- metadata: {} + model_id: sambanova/Llama-4-Maverick-17B-128E-Instruct + provider_id: sambanova + provider_model_id: sambanova/Llama-4-Maverick-17B-128E-Instruct + model_type: llm +- metadata: {} + model_id: meta-llama/Llama-4-Maverick-17B-128E-Instruct + provider_id: sambanova + provider_model_id: sambanova/Llama-4-Maverick-17B-128E-Instruct + model_type: llm +- metadata: {} + model_id: sambanova/Meta-Llama-Guard-3-8B + provider_id: sambanova + provider_model_id: sambanova/Meta-Llama-Guard-3-8B + model_type: llm +- metadata: {} + model_id: meta-llama/Llama-Guard-3-8B + provider_id: sambanova + provider_model_id: sambanova/Meta-Llama-Guard-3-8B + model_type: llm - metadata: embedding_dimension: 384 model_id: all-MiniLM-L6-v2 diff --git a/llama_stack/templates/sambanova/run.yaml b/llama_stack/templates/sambanova/run.yaml index 099310da5..91693917e 100644 --- a/llama_stack/templates/sambanova/run.yaml +++ b/llama_stack/templates/sambanova/run.yaml @@ -165,16 +165,6 @@ models: provider_id: sambanova provider_model_id: sambanova/Llama-3.2-90B-Vision-Instruct model_type: llm -- metadata: {} - model_id: sambanova/Meta-Llama-Guard-3-8B - provider_id: sambanova - provider_model_id: sambanova/Meta-Llama-Guard-3-8B - model_type: llm -- metadata: {} - model_id: meta-llama/Llama-Guard-3-8B - provider_id: sambanova - provider_model_id: sambanova/Meta-Llama-Guard-3-8B - model_type: llm - metadata: {} model_id: sambanova/Llama-4-Scout-17B-16E-Instruct provider_id: sambanova @@ -185,6 +175,26 @@ models: provider_id: sambanova provider_model_id: sambanova/Llama-4-Scout-17B-16E-Instruct model_type: llm +- metadata: {} + model_id: sambanova/Llama-4-Maverick-17B-128E-Instruct + provider_id: sambanova + provider_model_id: sambanova/Llama-4-Maverick-17B-128E-Instruct + model_type: llm +- metadata: {} + model_id: meta-llama/Llama-4-Maverick-17B-128E-Instruct + provider_id: sambanova + provider_model_id: sambanova/Llama-4-Maverick-17B-128E-Instruct + model_type: llm +- metadata: {} + model_id: sambanova/Meta-Llama-Guard-3-8B + provider_id: sambanova + provider_model_id: sambanova/Meta-Llama-Guard-3-8B + model_type: llm +- metadata: {} + model_id: meta-llama/Llama-Guard-3-8B + provider_id: sambanova + provider_model_id: sambanova/Meta-Llama-Guard-3-8B + model_type: llm - metadata: embedding_dimension: 384 model_id: all-MiniLM-L6-v2 diff --git a/llama_stack/templates/verification/run.yaml b/llama_stack/templates/verification/run.yaml index 7334bf865..b3c47234b 100644 --- a/llama_stack/templates/verification/run.yaml +++ b/llama_stack/templates/verification/run.yaml @@ -564,16 +564,6 @@ models: provider_id: sambanova-openai-compat provider_model_id: sambanova/Llama-3.2-90B-Vision-Instruct model_type: llm -- metadata: {} - model_id: sambanova/Meta-Llama-Guard-3-8B - provider_id: sambanova-openai-compat - provider_model_id: sambanova/Meta-Llama-Guard-3-8B - model_type: llm -- metadata: {} - model_id: meta-llama/Llama-Guard-3-8B - provider_id: sambanova-openai-compat - provider_model_id: sambanova/Meta-Llama-Guard-3-8B - model_type: llm - metadata: {} model_id: sambanova/Llama-4-Scout-17B-16E-Instruct provider_id: sambanova-openai-compat @@ -584,6 +574,26 @@ models: provider_id: sambanova-openai-compat provider_model_id: sambanova/Llama-4-Scout-17B-16E-Instruct model_type: llm +- metadata: {} + model_id: sambanova/Llama-4-Maverick-17B-128E-Instruct + provider_id: sambanova-openai-compat + provider_model_id: sambanova/Llama-4-Maverick-17B-128E-Instruct + model_type: llm +- metadata: {} + model_id: meta-llama/Llama-4-Maverick-17B-128E-Instruct + provider_id: sambanova-openai-compat + provider_model_id: sambanova/Llama-4-Maverick-17B-128E-Instruct + model_type: llm +- metadata: {} + model_id: sambanova/Meta-Llama-Guard-3-8B + provider_id: sambanova-openai-compat + provider_model_id: sambanova/Meta-Llama-Guard-3-8B + model_type: llm +- metadata: {} + model_id: meta-llama/Llama-Guard-3-8B + provider_id: sambanova-openai-compat + provider_model_id: sambanova/Meta-Llama-Guard-3-8B + model_type: llm - metadata: {} model_id: llama3.1-8b provider_id: cerebras-openai-compat