From 532f607941d1582dfaed353841f1f3d93af84e02 Mon Sep 17 00:00:00 2001 From: Xi Yan Date: Sat, 15 Feb 2025 14:52:07 -0800 Subject: [PATCH] rm short context emb models --- .../templates/together/run-with-safety.yaml | 24 ---------------- llama_stack/templates/together/run.yaml | 24 ---------------- llama_stack/templates/together/together.py | 28 ------------------- 3 files changed, 76 deletions(-) diff --git a/llama_stack/templates/together/run-with-safety.yaml b/llama_stack/templates/together/run-with-safety.yaml index 0c72d4986..6d73f6042 100644 --- a/llama_stack/templates/together/run-with-safety.yaml +++ b/llama_stack/templates/together/run-with-safety.yaml @@ -150,36 +150,12 @@ models: provider_id: together provider_model_id: togethercomputer/m2-bert-80M-8k-retrieval model_type: embedding -- metadata: - embedding_dimension: 768 - model_id: togethercomputer/m2-bert-80M-2k-retrieval - provider_id: together - provider_model_id: togethercomputer/m2-bert-80M-2k-retrieval - model_type: embedding - metadata: embedding_dimension: 768 model_id: togethercomputer/m2-bert-80M-32k-retrieval provider_id: together provider_model_id: togethercomputer/m2-bert-80M-32k-retrieval model_type: embedding -- metadata: - embedding_dimension: 1024 - model_id: WhereIsAI/UAE-Large-V1 - provider_id: together - provider_model_id: WhereIsAI/UAE-Large-V1 - model_type: embedding -- metadata: - embedding_dimension: 1024 - model_id: BAAI/bge-large-en-v1.5 - provider_id: together - provider_model_id: BAAI/bge-large-en-v1.5 - model_type: embedding -- metadata: - embedding_dimension: 768 - model_id: BAAI/bge-base-en-v1.5 - provider_id: together - provider_model_id: BAAI/bge-base-en-v1.5 - model_type: embedding shields: - shield_id: meta-llama/Llama-Guard-3-8B provider_id: llama-guard diff --git a/llama_stack/templates/together/run.yaml b/llama_stack/templates/together/run.yaml index 88aee0da3..521ff23a9 100644 --- a/llama_stack/templates/together/run.yaml +++ b/llama_stack/templates/together/run.yaml @@ -144,36 +144,12 @@ models: provider_id: together provider_model_id: togethercomputer/m2-bert-80M-8k-retrieval model_type: embedding -- metadata: - embedding_dimension: 768 - model_id: togethercomputer/m2-bert-80M-2k-retrieval - provider_id: together - provider_model_id: togethercomputer/m2-bert-80M-2k-retrieval - model_type: embedding - metadata: embedding_dimension: 768 model_id: togethercomputer/m2-bert-80M-32k-retrieval provider_id: together provider_model_id: togethercomputer/m2-bert-80M-32k-retrieval model_type: embedding -- metadata: - embedding_dimension: 1024 - model_id: WhereIsAI/UAE-Large-V1 - provider_id: together - provider_model_id: WhereIsAI/UAE-Large-V1 - model_type: embedding -- metadata: - embedding_dimension: 1024 - model_id: BAAI/bge-large-en-v1.5 - provider_id: together - provider_model_id: BAAI/bge-large-en-v1.5 - model_type: embedding -- metadata: - embedding_dimension: 768 - model_id: BAAI/bge-base-en-v1.5 - provider_id: together - provider_model_id: BAAI/bge-base-en-v1.5 - model_type: embedding shields: - shield_id: meta-llama/Llama-Guard-3-8B vector_dbs: [] diff --git a/llama_stack/templates/together/together.py b/llama_stack/templates/together/together.py index 3ba443e39..083a4ef34 100644 --- a/llama_stack/templates/together/together.py +++ b/llama_stack/templates/together/together.py @@ -89,13 +89,6 @@ def get_distribution_template() -> DistributionTemplate: provider_model_id="togethercomputer/m2-bert-80M-8k-retrieval", metadata={"embedding_dimension": 768}, ), - ModelInput( - model_id="togethercomputer/m2-bert-80M-2k-retrieval", - provider_id="together", - model_type=ModelType.embedding, - provider_model_id="togethercomputer/m2-bert-80M-2k-retrieval", - metadata={"embedding_dimension": 768}, - ), ModelInput( model_id="togethercomputer/m2-bert-80M-32k-retrieval", provider_id="together", @@ -103,27 +96,6 @@ def get_distribution_template() -> DistributionTemplate: provider_model_id="togethercomputer/m2-bert-80M-32k-retrieval", metadata={"embedding_dimension": 768}, ), - ModelInput( - model_id="WhereIsAI/UAE-Large-V1", - provider_id="together", - model_type=ModelType.embedding, - provider_model_id="WhereIsAI/UAE-Large-V1", - metadata={"embedding_dimension": 1024}, - ), - ModelInput( - model_id="BAAI/bge-large-en-v1.5", - provider_id="together", - model_type=ModelType.embedding, - provider_model_id="BAAI/bge-large-en-v1.5", - metadata={"embedding_dimension": 1024}, - ), - ModelInput( - model_id="BAAI/bge-base-en-v1.5", - provider_id="together", - model_type=ModelType.embedding, - provider_model_id="BAAI/bge-base-en-v1.5", - metadata={"embedding_dimension": 768}, - ), ] return DistributionTemplate(