mirror of
https://github.com/meta-llama/llama-stack.git
synced 2026-01-03 13:12:18 +00:00
Updated the configuration templates to include the built-in preprocessors (`builtin::basic` and `builtin::chunking`).
This commit is contained in:
parent
e895bb111c
commit
3f15349c9d
72 changed files with 632 additions and 25 deletions
|
|
@ -5,6 +5,7 @@
|
|||
# the root directory of this source tree.
|
||||
|
||||
from llama_stack.apis.models.models import ModelType
|
||||
from llama_stack.apis.preprocessing.preprocessors import PreprocessorInput
|
||||
from llama_stack.distribution.datatypes import ModelInput, Provider
|
||||
from llama_stack.providers.inline.inference.sentence_transformers import (
|
||||
SentenceTransformersInferenceConfig,
|
||||
|
|
@ -35,6 +36,7 @@ def get_distribution_template() -> DistributionTemplate:
|
|||
"inline::rag-runtime",
|
||||
"remote::model-context-protocol",
|
||||
],
|
||||
"preprocessing": ["inline::basic", "inline::simple_chunking"],
|
||||
}
|
||||
|
||||
name = "vllm-gpu"
|
||||
|
|
@ -80,6 +82,16 @@ def get_distribution_template() -> DistributionTemplate:
|
|||
provider_id="code-interpreter",
|
||||
),
|
||||
]
|
||||
default_preprocessors = [
|
||||
PreprocessorInput(
|
||||
preprocessor_id="builtin::basic",
|
||||
provider_id="basic",
|
||||
),
|
||||
PreprocessorInput(
|
||||
preprocessor_id="builtin::chunking",
|
||||
provider_id="simple_chunking",
|
||||
),
|
||||
]
|
||||
|
||||
return DistributionTemplate(
|
||||
name=name,
|
||||
|
|
@ -96,6 +108,7 @@ def get_distribution_template() -> DistributionTemplate:
|
|||
},
|
||||
default_models=[inference_model, embedding_model],
|
||||
default_tool_groups=default_tool_groups,
|
||||
default_preprocessors=default_preprocessors,
|
||||
),
|
||||
},
|
||||
run_config_env_vars={
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue