Added draft implementation of built-in preprocessing for RAG.

2025-12-31 15:00:08 +00:00 · 2025-03-04 15:22:29 +01:00 · 2025-03-04 15:22:29 +01:00 · 1a6e71c61f
commit 1a6e71c61f
parent 5014de434e
9 changed files with 299 additions and 4 deletions
--- a/llama_stack/apis/preprocessing/preprocessing.py
+++ b/llama_stack/apis/preprocessing/preprocessing.py
@@ -26,8 +26,8 @@ class PreprocessingDataType(Enum):
 @json_schema_type
 class PreprocessingInput(BaseModel):
     preprocessor_input_id: str
-    preprocessor_input_type: Optional[PreprocessingDataType]
-    path_or_content: str | URL
+    preprocessor_input_type: Optional[PreprocessingDataType] = None
+    path_or_content: str | InterleavedContent | URL


 PreprocessorOptions = Dict[str, Any]
@@ -36,7 +36,7 @@ PreprocessorOptions = Dict[str, Any]
 @json_schema_type
 class PreprocessingResponse(BaseModel):
     status: bool
-    results: Optional[List[str | InterleavedContent | Chunk]]
+    results: Optional[List[str | InterleavedContent | Chunk]] = None


 class PreprocessorStore(Protocol):