Fix server to conditionally await coroutines

This commit is contained in:
Ashwin Bharambe 2024-10-08 17:03:31 -07:00
parent 216e7eb4d5
commit 8eee5b9adc
2 changed files with 9 additions and 5 deletions

View file

@ -34,6 +34,7 @@ class MetaReferenceInferenceImpl(Inference):
# TODO: verify that the checkpoint actually matches this model
async def initialize(self) -> None:
print(f"Loading model `{self.model.descriptor()}`")
self.generator = LlamaModelParallelGenerator(self.config)
self.generator.start()