Updated the configuration templates to include the builtin preprocessors.

2026-01-03 13:12:18 +00:00 · 2025-03-07 16:08:14 +01:00 · 2025-03-07 16:08:14 +01:00 · 3f15349c9d
commit 3f15349c9d
parent e895bb111c
72 changed files with 632 additions and 25 deletions
--- a/llama_stack/templates/vllm-gpu/vllm.py
+++ b/llama_stack/templates/vllm-gpu/vllm.py
@@ -5,6 +5,7 @@
 # the root directory of this source tree.

 from llama_stack.apis.models.models import ModelType
+from llama_stack.apis.preprocessing.preprocessors import PreprocessorInput
 from llama_stack.distribution.datatypes import ModelInput, Provider
 from llama_stack.providers.inline.inference.sentence_transformers import (
    SentenceTransformersInferenceConfig,
@@ -35,6 +36,7 @@ def get_distribution_template() -> DistributionTemplate:
            "inline::rag-runtime",
            "remote::model-context-protocol",
        ],
+        "preprocessing": ["inline::basic", "inline::simple_chunking"],
    }

    name = "vllm-gpu"
@@ -80,6 +82,16 @@ def get_distribution_template() -> DistributionTemplate:
            provider_id="code-interpreter",
        ),
    ]
+    default_preprocessors = [
+        PreprocessorInput(
+            preprocessor_id="builtin::basic",
+            provider_id="basic",
+        ),
+        PreprocessorInput(
+            preprocessor_id="builtin::chunking",
+            provider_id="simple_chunking",
+        ),
+    ]

    return DistributionTemplate(
        name=name,
@@ -96,6 +108,7 @@ def get_distribution_template() -> DistributionTemplate:
                },
                default_models=[inference_model, embedding_model],
                default_tool_groups=default_tool_groups,
+                default_preprocessors=default_preprocessors,
            ),
        },
        run_config_env_vars={