chore: make OpenAIMixin maintainable, turn OpenAIMixin into a pydantic.BaseModel

- implement get_api_key instead of relying on LiteLLMOpenAIMixin.get_api_key
- remove use of LiteLLMOpenAIMixin
- add default initialize/shutdown methods to OpenAIMixin
- remove __init__ methods to allow proper pydantic construction
- remove dead code from vllm adapter and associated / duplicate unit tests
- update vllm adapter to use OpenAIMixin for model registration
- remove ModelRegistryHelper from fireworks & together adapters
- remove Inference from nvidia adapter
- complete type hints on embedding_model_metadata
- allow extra fields on OpenAIMixin, for model_store, __provider_id__, etc.
- new recordings for ollama
- enhance the list models error handling with new tests
- update cerebras (remove cerebras-cloud-sdk) and anthropic (custom model listing) inference adapters
- parametrize test_inference_client_caching
- remove cerebras, databricks, fireworks, together from blanket mypy exclude
2025-12-14 17:02:38 +00:00 · 2025-10-02 20:47:54 -04:00 · 2025-10-02 20:47:54 -04:00 · fd06717d87
commit fd06717d87
parent 351c4b98e4
64 changed files with 12901 additions and 1734 deletions
--- a/tests/integration/suites.py
+++ b/tests/integration/suites.py
@@ -131,6 +131,27 @@ SETUP_DEFINITIONS: dict[str, Setup] = {
            "embedding_model": "fireworks/accounts/fireworks/models/qwen3-embedding-8b",
        },
    ),
+    "anthropic": Setup(
+        name="anthropic",
+        description="Anthropic Claude models",
+        defaults={
+            "text_model": "anthropic/claude-3-5-haiku-20241022",
+        },
+    ),
+    "llama-api": Setup(
+        name="llama-openai-compat",
+        description="Llama models from https://api.llama.com",
+        defaults={
+            "text_model": "llama_openai_compat/Llama-3.3-8B-Instruct",
+        },
+    ),
+    "groq": Setup(
+        name="groq",
+        description="Groq models",
+        defaults={
+            "text_model": "groq/llama-3.3-70b-versatile",
+        },
+    ),
 }