Added lazy initialization to the docling provider.

This commit is contained in:
ilya-kolchinsky 2025-03-07 15:38:34 +01:00
parent 275fdbc23f
commit e895bb111c

View file

@ -36,13 +36,10 @@ class InclineDoclingPreprocessorImpl(Preprocessing, PreprocessorsProtocolPrivate
def __init__(self, config: InlineDoclingConfig) -> None:
    """Store the provider config; heavy resources are set up lazily (see preprocess)."""
    self.config = config
    # NOTE(review): this span is a commit-diff rendering whose +/- markers were lost.
    # The next line is the PRE-commit eager construction that this commit removes...
    self.converter = DocumentConverter()
    # ...and these are the POST-commit lazy placeholders, populated on first use
    # inside preprocess(). Only one of the two converter assignments exists in any
    # real version of the file — TODO confirm against the repository history.
    self.converter = None
    self.chunker = None
async def initialize(self) -> None:
    # NOTE(review): PRE-commit version, deleted by this commit — the chunker was
    # built eagerly at provider startup; the commit moves this into preprocess().
    if self.config.chunk:
        # TODO: docling should use Llama Stack's inference API instead of handling tokenization by itself
        self.chunker = HybridChunker()
# POST-commit lifecycle hook: intentionally a no-op — initialization is now
# deferred to the first preprocess() call (lazy initialization, per the commit title).
async def initialize(self) -> None: ...
# Lifecycle teardown hook: no-op — nothing visible here holds resources that
# require explicit release. TODO confirm the docling converter needs no cleanup.
async def shutdown(self) -> None: ...
@ -56,6 +53,13 @@ class InclineDoclingPreprocessorImpl(Preprocessing, PreprocessorsProtocolPrivate
preprocessor_inputs: List[PreprocessingDataElement],
options: Optional[PreprocessorOptions] = None,
) -> PreprocessorResponse:
if self.converter is None:
# this is the first time this method is called
self.converter = DocumentConverter()
if self.config.chunk and self.chunker is None:
# TODO: docling should use Llama Stack's inference API instead of handling tokenization by itself
self.chunker = HybridChunker()
results = []
for inp in preprocessor_inputs: