From 9b3d7e85ff16617a977dbbc8fe2d49aed186ebd6 Mon Sep 17 00:00:00 2001 From: Young Han Date: Sat, 12 Jul 2025 16:28:22 -0700 Subject: [PATCH] feat: add llamacpp in registry --- llama_stack/providers/registry/inference.py | 10 ++++++++++ 1 file changed, 10 insertions(+) diff --git a/llama_stack/providers/registry/inference.py b/llama_stack/providers/registry/inference.py index 217870ec9..38276a2be 100644 --- a/llama_stack/providers/registry/inference.py +++ b/llama_stack/providers/registry/inference.py @@ -333,4 +333,14 @@ def available_providers() -> list[ProviderSpec]: description="IBM WatsonX inference provider for accessing AI models on IBM's WatsonX platform.", ), ), + remote_provider_spec( + api=Api.inference, + adapter=AdapterSpec( + adapter_type="llamacpp", + pip_packages=["litellm"], + module="llama_stack.providers.remote.inference.llamacpp", + config_class="llama_stack.providers.remote.inference.llamacpp.config.LlamaCppImplConfig", + provider_data_validator="llama_stack.providers.remote.inference.llamacpp.config.LlamaCppProviderDataValidator", + ), + ), ]