mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-06-28 02:53:30 +00:00
Fix fireworks run-with-safety template (#766)
Summary: Fixing issue reported in https://github.com/meta-llama/llama-stack/pull/755/files#r1915696188

Test Plan: Re-run the config gen

```
pip install .
python3 llama_stack/scripts/distro_codegen.py
```
This commit is contained in:
parent
472feea8d4
commit
89e3f81520
3 changed files with 27 additions and 22 deletions
|
@ -71,14 +71,6 @@ def get_distribution_template() -> DistributionTemplate:
|
||||||
)
|
)
|
||||||
for m in MODEL_ALIASES
|
for m in MODEL_ALIASES
|
||||||
]
|
]
|
||||||
inference_model = ModelInput(
|
|
||||||
model_id="${env.INFERENCE_MODEL}",
|
|
||||||
provider_id="fireworks",
|
|
||||||
)
|
|
||||||
safety_model = ModelInput(
|
|
||||||
model_id="${env.SAFETY_MODEL}",
|
|
||||||
provider_id="fireworks",
|
|
||||||
)
|
|
||||||
embedding_model = ModelInput(
|
embedding_model = ModelInput(
|
||||||
model_id="all-MiniLM-L6-v2",
|
model_id="all-MiniLM-L6-v2",
|
||||||
provider_id="sentence-transformers",
|
provider_id="sentence-transformers",
|
||||||
|
@ -133,6 +125,11 @@ def get_distribution_template() -> DistributionTemplate:
|
||||||
provider_type="inline::llama-guard",
|
provider_type="inline::llama-guard",
|
||||||
config={},
|
config={},
|
||||||
),
|
),
|
||||||
|
Provider(
|
||||||
|
provider_id="llama-guard-vision",
|
||||||
|
provider_type="inline::llama-guard",
|
||||||
|
config={},
|
||||||
|
),
|
||||||
Provider(
|
Provider(
|
||||||
provider_id="code-scanner",
|
provider_id="code-scanner",
|
||||||
provider_type="inline::code-scanner",
|
provider_type="inline::code-scanner",
|
||||||
|
@ -141,15 +138,18 @@ def get_distribution_template() -> DistributionTemplate:
|
||||||
],
|
],
|
||||||
},
|
},
|
||||||
default_models=[
|
default_models=[
|
||||||
inference_model,
|
*default_models,
|
||||||
safety_model,
|
|
||||||
embedding_model,
|
embedding_model,
|
||||||
],
|
],
|
||||||
default_shields=[
|
default_shields=[
|
||||||
ShieldInput(
|
ShieldInput(
|
||||||
shield_id="${env.SAFETY_MODEL}",
|
shield_id="meta-llama/Llama-Guard-3-8B",
|
||||||
provider_id="llama-guard",
|
provider_id="llama-guard",
|
||||||
),
|
),
|
||||||
|
ShieldInput(
|
||||||
|
shield_id="meta-llama/Llama-Guard-3-11B-Vision",
|
||||||
|
provider_id="llama-guard-vision",
|
||||||
|
),
|
||||||
ShieldInput(
|
ShieldInput(
|
||||||
shield_id="CodeScanner",
|
shield_id="CodeScanner",
|
||||||
provider_id="code-scanner",
|
provider_id="code-scanner",
|
||||||
|
|
|
@ -33,6 +33,9 @@ providers:
|
||||||
- provider_id: llama-guard
|
- provider_id: llama-guard
|
||||||
provider_type: inline::llama-guard
|
provider_type: inline::llama-guard
|
||||||
config: {}
|
config: {}
|
||||||
|
- provider_id: llama-guard-vision
|
||||||
|
provider_type: inline::llama-guard
|
||||||
|
config: {}
|
||||||
- provider_id: code-scanner
|
- provider_id: code-scanner
|
||||||
provider_type: inline::code-scanner
|
provider_type: inline::code-scanner
|
||||||
config: {}
|
config: {}
|
||||||
|
@ -97,52 +100,52 @@ models:
|
||||||
- metadata: {}
|
- metadata: {}
|
||||||
model_id: meta-llama/Llama-3.1-8B-Instruct
|
model_id: meta-llama/Llama-3.1-8B-Instruct
|
||||||
provider_id: fireworks
|
provider_id: fireworks
|
||||||
provider_model_id: fireworks/llama-v3p1-8b-instruct
|
provider_model_id: accounts/fireworks/models/llama-v3p1-8b-instruct
|
||||||
model_type: llm
|
model_type: llm
|
||||||
- metadata: {}
|
- metadata: {}
|
||||||
model_id: meta-llama/Llama-3.1-70B-Instruct
|
model_id: meta-llama/Llama-3.1-70B-Instruct
|
||||||
provider_id: fireworks
|
provider_id: fireworks
|
||||||
provider_model_id: fireworks/llama-v3p1-70b-instruct
|
provider_model_id: accounts/fireworks/models/llama-v3p1-70b-instruct
|
||||||
model_type: llm
|
model_type: llm
|
||||||
- metadata: {}
|
- metadata: {}
|
||||||
model_id: meta-llama/Llama-3.1-405B-Instruct-FP8
|
model_id: meta-llama/Llama-3.1-405B-Instruct-FP8
|
||||||
provider_id: fireworks
|
provider_id: fireworks
|
||||||
provider_model_id: fireworks/llama-v3p1-405b-instruct
|
provider_model_id: accounts/fireworks/models/llama-v3p1-405b-instruct
|
||||||
model_type: llm
|
model_type: llm
|
||||||
- metadata: {}
|
- metadata: {}
|
||||||
model_id: meta-llama/Llama-3.2-1B-Instruct
|
model_id: meta-llama/Llama-3.2-1B-Instruct
|
||||||
provider_id: fireworks
|
provider_id: fireworks
|
||||||
provider_model_id: fireworks/llama-v3p2-1b-instruct
|
provider_model_id: accounts/fireworks/models/llama-v3p2-1b-instruct
|
||||||
model_type: llm
|
model_type: llm
|
||||||
- metadata: {}
|
- metadata: {}
|
||||||
model_id: meta-llama/Llama-3.2-3B-Instruct
|
model_id: meta-llama/Llama-3.2-3B-Instruct
|
||||||
provider_id: fireworks
|
provider_id: fireworks
|
||||||
provider_model_id: fireworks/llama-v3p2-3b-instruct
|
provider_model_id: accounts/fireworks/models/llama-v3p2-3b-instruct
|
||||||
model_type: llm
|
model_type: llm
|
||||||
- metadata: {}
|
- metadata: {}
|
||||||
model_id: meta-llama/Llama-3.2-11B-Vision-Instruct
|
model_id: meta-llama/Llama-3.2-11B-Vision-Instruct
|
||||||
provider_id: fireworks
|
provider_id: fireworks
|
||||||
provider_model_id: fireworks/llama-v3p2-11b-vision-instruct
|
provider_model_id: accounts/fireworks/models/llama-v3p2-11b-vision-instruct
|
||||||
model_type: llm
|
model_type: llm
|
||||||
- metadata: {}
|
- metadata: {}
|
||||||
model_id: meta-llama/Llama-3.2-90B-Vision-Instruct
|
model_id: meta-llama/Llama-3.2-90B-Vision-Instruct
|
||||||
provider_id: fireworks
|
provider_id: fireworks
|
||||||
provider_model_id: fireworks/llama-v3p2-90b-vision-instruct
|
provider_model_id: accounts/fireworks/models/llama-v3p2-90b-vision-instruct
|
||||||
model_type: llm
|
model_type: llm
|
||||||
- metadata: {}
|
- metadata: {}
|
||||||
model_id: meta-llama/Llama-3.3-70B-Instruct
|
model_id: meta-llama/Llama-3.3-70B-Instruct
|
||||||
provider_id: fireworks
|
provider_id: fireworks
|
||||||
provider_model_id: fireworks/llama-v3p3-70b-instruct
|
provider_model_id: accounts/fireworks/models/llama-v3p3-70b-instruct
|
||||||
model_type: llm
|
model_type: llm
|
||||||
- metadata: {}
|
- metadata: {}
|
||||||
model_id: meta-llama/Llama-Guard-3-8B
|
model_id: meta-llama/Llama-Guard-3-8B
|
||||||
provider_id: fireworks
|
provider_id: fireworks
|
||||||
provider_model_id: fireworks/llama-guard-3-8b
|
provider_model_id: accounts/fireworks/models/llama-guard-3-8b
|
||||||
model_type: llm
|
model_type: llm
|
||||||
- metadata: {}
|
- metadata: {}
|
||||||
model_id: meta-llama/Llama-Guard-3-11B-Vision
|
model_id: meta-llama/Llama-Guard-3-11B-Vision
|
||||||
provider_id: fireworks
|
provider_id: fireworks
|
||||||
provider_model_id: fireworks/llama-guard-3-11b-vision
|
provider_model_id: accounts/fireworks/models/llama-guard-3-11b-vision
|
||||||
model_type: llm
|
model_type: llm
|
||||||
- metadata:
|
- metadata:
|
||||||
embedding_dimension: 384
|
embedding_dimension: 384
|
||||||
|
@ -152,6 +155,8 @@ models:
|
||||||
shields:
|
shields:
|
||||||
- shield_id: meta-llama/Llama-Guard-3-8B
|
- shield_id: meta-llama/Llama-Guard-3-8B
|
||||||
provider_id: llama-guard
|
provider_id: llama-guard
|
||||||
|
- shield_id: meta-llama/Llama-Guard-3-11B-Vision
|
||||||
|
provider_id: llama-guard-vision
|
||||||
- shield_id: CodeScanner
|
- shield_id: CodeScanner
|
||||||
provider_id: code-scanner
|
provider_id: code-scanner
|
||||||
memory_banks: []
|
memory_banks: []
|
||||||
|
|
|
@ -47,7 +47,7 @@ providers:
|
||||||
config:
|
config:
|
||||||
service_name: ${env.OTEL_SERVICE_NAME:llama-stack}
|
service_name: ${env.OTEL_SERVICE_NAME:llama-stack}
|
||||||
sinks: ${env.TELEMETRY_SINKS:console,sqlite}
|
sinks: ${env.TELEMETRY_SINKS:console,sqlite}
|
||||||
sqlite_db_path: ${env.SQLITE_DB_PATH:~/.llama/distributions/accounts/fireworks/models/trace_store.db}
|
sqlite_db_path: ${env.SQLITE_DB_PATH:~/.llama/distributions/fireworks/trace_store.db}
|
||||||
eval:
|
eval:
|
||||||
- provider_id: meta-reference
|
- provider_id: meta-reference
|
||||||
provider_type: inline::meta-reference
|
provider_type: inline::meta-reference
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue