feat: allow user to register model alias explicitly, tests

# What does this PR do?

Context: https://github.com/llamastack/llama-stack/discussions/3483

This PR enables registering `provider_model_id` as the model identifier without breaking backward compatibility.


## Test Plan
todo
# What does this PR do?


## Test Plan
This commit is contained in:
Eric Huang 2025-09-18 15:47:20 -07:00
parent ac1414b571
commit 83a229554b
20 changed files with 236 additions and 92 deletions

View file

@ -79,15 +79,15 @@ def get_distribution_template() -> DistributionTemplate:
)
inference_model = ModelInput(
model_id="${env.INFERENCE_MODEL}",
provider_model_id="${env.INFERENCE_MODEL}",
provider_id="tgi0",
)
safety_model = ModelInput(
model_id="${env.SAFETY_MODEL}",
provider_model_id="${env.SAFETY_MODEL}",
provider_id="tgi1",
)
embedding_model = ModelInput(
model_id="all-MiniLM-L6-v2",
provider_model_id="all-MiniLM-L6-v2",
provider_id="sentence-transformers",
model_type=ModelType.embedding,
metadata={

View file

@ -103,18 +103,21 @@ inference_store:
db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/dell}/inference_store.db
models:
- metadata: {}
model_id: ${env.INFERENCE_MODEL}
provider_model_id: ${env.INFERENCE_MODEL}
provider_id: tgi0
model_type: llm
use_provider_model_id_as_id: false
- metadata: {}
model_id: ${env.SAFETY_MODEL}
provider_model_id: ${env.SAFETY_MODEL}
provider_id: tgi1
model_type: llm
use_provider_model_id_as_id: false
- metadata:
embedding_dimension: 384
model_id: all-MiniLM-L6-v2
provider_model_id: all-MiniLM-L6-v2
provider_id: sentence-transformers
model_type: embedding
use_provider_model_id_as_id: false
shields:
- shield_id: ${env.SAFETY_MODEL}
vector_dbs: []

View file

@ -99,14 +99,16 @@ inference_store:
db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/dell}/inference_store.db
models:
- metadata: {}
model_id: ${env.INFERENCE_MODEL}
provider_model_id: ${env.INFERENCE_MODEL}
provider_id: tgi0
model_type: llm
use_provider_model_id_as_id: false
- metadata:
embedding_dimension: 384
model_id: all-MiniLM-L6-v2
provider_model_id: all-MiniLM-L6-v2
provider_id: sentence-transformers
model_type: embedding
use_provider_model_id_as_id: false
shields: []
vector_dbs: []
datasets: []