mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-12-31 07:50:00 +00:00
Updated the configuration templates to include the builtin preprocessors.
This commit is contained in:
parent
e895bb111c
commit
3f15349c9d
72 changed files with 632 additions and 25 deletions
|
|
@@ -7,6 +7,7 @@
|
|||
from pathlib import Path
|
||||
|
||||
from llama_stack.apis.models.models import ModelType
|
||||
from llama_stack.apis.preprocessing.preprocessors import PreprocessorInput
|
||||
from llama_stack.distribution.datatypes import (
|
||||
ModelInput,
|
||||
Provider,
|
||||
|
|
@@ -38,6 +39,7 @@ def get_distribution_template() -> DistributionTemplate:
|
|||
"inline::rag-runtime",
|
||||
"remote::model-context-protocol",
|
||||
],
|
||||
"preprocessing": ["inline::basic", "inline::simple_chunking"],
|
||||
}
|
||||
name = "remote-vllm"
|
||||
inference_provider = Provider(
|
||||
|
|
@@ -88,6 +90,16 @@ def get_distribution_template() -> DistributionTemplate:
|
|||
provider_id="code-interpreter",
|
||||
),
|
||||
]
|
||||
default_preprocessors = [
|
||||
PreprocessorInput(
|
||||
preprocessor_id="builtin::basic",
|
||||
provider_id="basic",
|
||||
),
|
||||
PreprocessorInput(
|
||||
preprocessor_id="builtin::chunking",
|
||||
provider_id="simple_chunking",
|
||||
),
|
||||
]
|
||||
|
||||
return DistributionTemplate(
|
||||
name=name,
|
||||
|
|
@@ -103,6 +115,7 @@ def get_distribution_template() -> DistributionTemplate:
|
|||
},
|
||||
default_models=[inference_model, embedding_model],
|
||||
default_tool_groups=default_tool_groups,
|
||||
default_preprocessors=default_preprocessors,
|
||||
),
|
||||
"run-with-safety.yaml": RunConfigSettings(
|
||||
provider_overrides={
|
||||
|
|
@@ -126,6 +139,7 @@ def get_distribution_template() -> DistributionTemplate:
|
|||
],
|
||||
default_shields=[ShieldInput(shield_id="${env.SAFETY_MODEL}")],
|
||||
default_tool_groups=default_tool_groups,
|
||||
default_preprocessors=default_preprocessors,
|
||||
),
|
||||
},
|
||||
run_config_env_vars={
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue