Mirror of https://github.com/meta-llama/llama-stack.git (synced 2026-01-03 01:12:16 +00:00)

Commit 967dd0aa08 (parent 3298e50105): Resolved merge conflicts
82 changed files with 66055 additions and 0 deletions
5  tests/integration/fixtures/__init__.py  Normal file
@@ -0,0 +1,5 @@
# Copyright (c) Meta Platforms, Inc. and affiliates.
# All rights reserved.
#
# This source code is licensed under the terms described in the LICENSE file in
# the root directory of this source tree.
207  tests/integration/fixtures/common.py  Normal file
@@ -0,0 +1,207 @@
# Copyright (c) Meta Platforms, Inc. and affiliates.
# All rights reserved.
#
# This source code is licensed under the terms described in the LICENSE file in
# the root directory of this source tree.

import copy
import inspect
import logging
import os
import tempfile
from pathlib import Path

import pytest
import yaml
from llama_stack_client import LlamaStackClient

from llama_stack import LlamaStackAsLibraryClient
from llama_stack.apis.datatypes import Api
from llama_stack.distribution.stack import run_config_from_adhoc_config_spec
from llama_stack.env import get_env_or_fail

from .recordable_mock import RecordableMock


@pytest.fixture(scope="session")
def provider_data():
    # TODO: this needs to be generalized so each provider can have a sample provider data just
    # like sample run config on which we can do replace_env_vars()
    keymap = {
        "TAVILY_SEARCH_API_KEY": "tavily_search_api_key",
        "BRAVE_SEARCH_API_KEY": "brave_search_api_key",
        "FIREWORKS_API_KEY": "fireworks_api_key",
        "GEMINI_API_KEY": "gemini_api_key",
        "OPENAI_API_KEY": "openai_api_key",
        "TOGETHER_API_KEY": "together_api_key",
        "ANTHROPIC_API_KEY": "anthropic_api_key",
        "GROQ_API_KEY": "groq_api_key",
        "WOLFRAM_ALPHA_API_KEY": "wolfram_alpha_api_key",
    }
    provider_data = {}
    for key, value in keymap.items():
        if os.environ.get(key):
            provider_data[value] = os.environ[key]
    return provider_data
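
As a quick illustration (not part of the commit): with only TOGETHER_API_KEY and TAVILY_SEARCH_API_KEY exported, the fixture returns a two-entry dict keyed by the lower-cased names in the keymap. The values below are invented.

# Illustration only: the env-var -> provider_data translation performed above.
import os

os.environ["TOGETHER_API_KEY"] = "together-key-example"        # invented value
os.environ["TAVILY_SEARCH_API_KEY"] = "tavily-key-example"     # invented value

keymap = {"TOGETHER_API_KEY": "together_api_key", "TAVILY_SEARCH_API_KEY": "tavily_search_api_key"}
print({v: os.environ[k] for k, v in keymap.items() if os.environ.get(k)})
# -> {'together_api_key': 'together-key-example', 'tavily_search_api_key': 'tavily-key-example'}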

@pytest.fixture(scope="session")
def llama_stack_client_with_mocked_inference(llama_stack_client, request):
    """
    Returns a client with mocked inference APIs and tool runtime APIs that use recorded responses by default.

    If --record-responses is passed, it will call the real APIs and record the responses.
    """
    if not isinstance(llama_stack_client, LlamaStackAsLibraryClient):
        logging.warning(
            "llama_stack_client_with_mocked_inference is not supported for this client, returning original client without mocking"
        )
        return llama_stack_client

    record_responses = request.config.getoption("--record-responses")
    cache_dir = Path(__file__).parent / "recorded_responses"

    # Create a shallow copy of the client to avoid modifying the original
    client = copy.copy(llama_stack_client)

    # Get the inference API used by the agents implementation
    agents_impl = client.async_client.impls[Api.agents]
    original_inference = agents_impl.inference_api

    # Create a new inference object with the same attributes
    inference_mock = copy.copy(original_inference)

    # Replace the methods with recordable mocks
    inference_mock.chat_completion = RecordableMock(
        original_inference.chat_completion, cache_dir, "chat_completion", record=record_responses
    )
    inference_mock.completion = RecordableMock(
        original_inference.completion, cache_dir, "text_completion", record=record_responses
    )
    inference_mock.embeddings = RecordableMock(
        original_inference.embeddings, cache_dir, "embeddings", record=record_responses
    )

    # Replace the inference API in the agents implementation
    agents_impl.inference_api = inference_mock

    original_tool_runtime_api = agents_impl.tool_runtime_api
    tool_runtime_mock = copy.copy(original_tool_runtime_api)

    # Replace the methods with recordable mocks
    tool_runtime_mock.invoke_tool = RecordableMock(
        original_tool_runtime_api.invoke_tool, cache_dir, "invoke_tool", record=record_responses
    )
    agents_impl.tool_runtime_api = tool_runtime_mock

    # Also update the client.inference for consistency
    client.inference = inference_mock

    return client
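
A sketch of how a test might consume this fixture (illustrative, not taken from this commit). By default the RecordableMock wrappers replay from tests/integration/fixtures/recorded_responses/; passing --record-responses makes them call the real providers and refresh the cache.

# Hypothetical test (illustration only): the fixture hands back a library client
# whose inference and tool-runtime calls go through RecordableMock.
def test_agent_replay(llama_stack_client_with_mocked_inference):
    client = llama_stack_client_with_mocked_inference
    # chat_completion / completion / embeddings / invoke_tool issued via the
    # agents implementation now replay from recorded_responses/*.json unless
    # pytest was started with --record-responses.
    assert client is not None

# Refresh the recordings (real provider calls):
#   pytest tests/integration --record-responses --stack-config=<distro or run.yaml>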

@pytest.fixture(scope="session")
def inference_provider_type(llama_stack_client):
    providers = llama_stack_client.providers.list()
    inference_providers = [p for p in providers if p.api == "inference"]
    assert len(inference_providers) > 0, "No inference providers found"
    return inference_providers[0].provider_type


@pytest.fixture(scope="session")
def client_with_models(
    llama_stack_client,
    text_model_id,
    vision_model_id,
    embedding_model_id,
    embedding_dimension,
    judge_model_id,
):
    client = llama_stack_client

    providers = [p for p in client.providers.list() if p.api == "inference"]
    assert len(providers) > 0, "No inference providers found"
    inference_providers = [p.provider_id for p in providers if p.provider_type != "inline::sentence-transformers"]

    model_ids = {m.identifier for m in client.models.list()}
    model_ids.update(m.provider_resource_id for m in client.models.list())

    if text_model_id and text_model_id not in model_ids:
        client.models.register(model_id=text_model_id, provider_id=inference_providers[0])
    if vision_model_id and vision_model_id not in model_ids:
        client.models.register(model_id=vision_model_id, provider_id=inference_providers[0])
    if judge_model_id and judge_model_id not in model_ids:
        client.models.register(model_id=judge_model_id, provider_id=inference_providers[0])

    if embedding_model_id and embedding_model_id not in model_ids:
        # try to find a provider that supports embeddings, if sentence-transformers is not available
        selected_provider = None
        for p in providers:
            if p.provider_type == "inline::sentence-transformers":
                selected_provider = p
                break

        selected_provider = selected_provider or providers[0]
        client.models.register(
            model_id=embedding_model_id,
            provider_id=selected_provider.provider_id,
            model_type="embedding",
            metadata={"embedding_dimension": embedding_dimension or 384},
        )
    return client
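
A sketch of a test that leans on this fixture (illustrative, not from this diff); the chat_completion call shape and the response attribute are assumed from the llama-stack client API of this period, not prescribed by this commit.

# Hypothetical test: client_with_models has already registered text_model_id
# with an inference provider, so no registration boilerplate is needed here.
def test_simple_chat(client_with_models, text_model_id):
    response = client_with_models.inference.chat_completion(
        model_id=text_model_id,
        messages=[{"role": "user", "content": "Say hello in one word."}],
    )
    assert response.completion_message.content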

@pytest.fixture(scope="session")
def available_shields(llama_stack_client):
    return [shield.identifier for shield in llama_stack_client.shields.list()]


@pytest.fixture(scope="session")
def model_providers(llama_stack_client):
    return {x.provider_id for x in llama_stack_client.providers.list() if x.api == "inference"}


@pytest.fixture(autouse=True)
def skip_if_no_model(request):
    model_fixtures = ["text_model_id", "vision_model_id", "embedding_model_id", "judge_model_id"]
    test_func = request.node.function

    actual_params = inspect.signature(test_func).parameters.keys()
    for fixture in model_fixtures:
        # Only check fixtures that are actually in the test function's signature
        if fixture in actual_params and fixture in request.fixturenames and not request.getfixturevalue(fixture):
            pytest.skip(f"{fixture} empty - skipping test")


@pytest.fixture(scope="session")
def llama_stack_client(request, provider_data, text_model_id):
    config = request.config.getoption("--stack-config")
    if not config:
        config = get_env_or_fail("LLAMA_STACK_CONFIG")

    if not config:
        raise ValueError("You must specify either --stack-config or LLAMA_STACK_CONFIG")

    # check if this looks like a URL
    if config.startswith("http") or "//" in config:
        return LlamaStackClient(
            base_url=config,
            provider_data=provider_data,
        )

    if "=" in config:
        run_config = run_config_from_adhoc_config_spec(config)
        run_config_file = tempfile.NamedTemporaryFile(delete=False, suffix=".yaml")
        with open(run_config_file.name, "w") as f:
            yaml.dump(run_config.model_dump(), f)
        config = run_config_file.name

    client = LlamaStackAsLibraryClient(
        config,
        provider_data=provider_data,
        skip_logger_removal=True,
    )
    if not client.initialize():
        raise RuntimeError("Initialization failed")

    return client
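
For orientation (not part of the diff), the fixture accepts three shapes of --stack-config / LLAMA_STACK_CONFIG; the sketch below mirrors the dispatch above, and the adhoc api=provider spelling plus the provider and template names are assumptions rather than values taken from this commit.

# Illustration only: how the fixture above interprets the config string.
for config in ("http://localhost:8321", "inference=fireworks,safety=llama-guard", "together"):
    if config.startswith("http") or "//" in config:
        kind = "remote stack -> LlamaStackClient(base_url=config)"
    elif "=" in config:
        kind = "adhoc spec -> run_config_from_adhoc_config_spec(), dumped to a temp YAML, loaded as a library client"
    else:
        kind = "template name or run.yaml path -> LlamaStackAsLibraryClient(config)"
    print(f"{config!r}: {kind}")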
221  tests/integration/fixtures/recordable_mock.py  Normal file
@@ -0,0 +1,221 @@
# Copyright (c) Meta Platforms, Inc. and affiliates.
# All rights reserved.
#
# This source code is licensed under the terms described in the LICENSE file in
# the root directory of this source tree.
import importlib
import json
import os
import re
from datetime import datetime
from enum import Enum
from pathlib import Path


class RecordableMock:
    """A mock that can record and replay API responses."""

    def __init__(self, real_func, cache_dir, func_name, record=False):
        self.real_func = real_func
        self.json_path = Path(cache_dir) / f"{func_name}.json"
        self.record = record
        self.cache = {}

        # Load existing cache if available and not recording
        if self.json_path.exists():
            try:
                with open(self.json_path, "r") as f:
                    self.cache = json.load(f)
            except Exception as e:
                print(f"Error loading cache from {self.json_path}: {e}")
                raise

    async def __call__(self, *args, **kwargs):
        """
        Returns a coroutine that when awaited returns the result or an async generator,
        matching the behavior of the original function.
        """
        # Create a cache key from the arguments
        key = self._create_cache_key(args, kwargs)

        if self.record:
            # In record mode, always call the real function
            real_result = self.real_func(*args, **kwargs)

            # If it's a coroutine, we need to create a wrapper coroutine
            if hasattr(real_result, "__await__"):
                # Define a coroutine function that will record the result
                async def record_coroutine():
                    try:
                        # Await the real coroutine
                        result = await real_result

                        # Check if the result is an async generator
                        if hasattr(result, "__aiter__"):
                            # It's an async generator, so we need to record its chunks
                            chunks = []

                            # Create and return a new async generator that records chunks
                            async def recording_generator():
                                nonlocal chunks
                                async for chunk in result:
                                    chunks.append(chunk)
                                    yield chunk
                                # After all chunks are yielded, save to cache
                                self.cache[key] = {"type": "generator", "chunks": chunks}
                                self._save_cache()

                            return recording_generator()
                        else:
                            # It's a regular result, save it to cache
                            self.cache[key] = {"type": "value", "value": result}
                            self._save_cache()
                            return result
                    except Exception as e:
                        print(f"Error in recording mode: {e}")
                        raise

                return await record_coroutine()
            else:
                # It's already an async generator, so we need to record its chunks
                async def record_generator():
                    chunks = []
                    async for chunk in real_result:
                        chunks.append(chunk)
                        yield chunk
                    # After all chunks are yielded, save to cache
                    self.cache[key] = {"type": "generator", "chunks": chunks}
                    self._save_cache()

                return record_generator()
        elif key not in self.cache:
            # In replay mode, if the key is not in the cache, throw an error
            raise KeyError(
                f"No cached response found for key: {key}\nRun with --record-responses to record this response."
            )
        else:
            # In replay mode with a cached response
            cached_data = self.cache[key]

            # Check if it's a value or chunks
            if cached_data.get("type") == "value":
                # It's a regular value
                return self._reconstruct_object(cached_data["value"])
            else:
                # It's chunks from an async generator
                async def replay_generator():
                    for chunk in cached_data["chunks"]:
                        yield self._reconstruct_object(chunk)

                return replay_generator()

    def _create_cache_key(self, args, kwargs):
        """Create a hashable key from the function arguments, ignoring auto-generated IDs."""
        # Convert to JSON strings with sorted keys
        key = json.dumps((args, kwargs), sort_keys=True, default=self._json_default)

        # Post-process the key with regex to replace IDs with placeholders
        # Replace UUIDs and similar patterns
        key = re.sub(r"[0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12}", "<UUID>", key)

        # Replace temporary file paths created by tempfile.mkdtemp()
        key = re.sub(r"/var/folders/[^,'\"\s]+", "<TEMP_FILE>", key)

        # Replace /tmp/ paths which are also commonly used for temporary files
        key = re.sub(r"/tmp/[^,'\"\s]+", "<TEMP_FILE>", key)

        return key

    def _save_cache(self):
        """Save the cache to disk in JSON format."""
        os.makedirs(self.json_path.parent, exist_ok=True)

        # Write the JSON file with pretty formatting
        try:
            with open(self.json_path, "w") as f:
                json.dump(self.cache, f, indent=2, sort_keys=True, default=self._json_default)
                # write another empty line at the end of the file to make pre-commit happy
                f.write("\n")
        except Exception as e:
            print(f"Error saving JSON cache: {e}")

    def _json_default(self, obj):
        """Default function for JSON serialization of objects."""

        if isinstance(obj, datetime):
            return {
                "__datetime__": obj.isoformat(),
                "__module__": obj.__class__.__module__,
                "__class__": obj.__class__.__name__,
            }

        if isinstance(obj, Enum):
            return {
                "__enum__": obj.__class__.__name__,
                "value": obj.value,
                "__module__": obj.__class__.__module__,
            }

        # Handle Pydantic models
        if hasattr(obj, "model_dump"):
            model_data = obj.model_dump()
            return {
                "__pydantic__": obj.__class__.__name__,
                "__module__": obj.__class__.__module__,
                "data": model_data,
            }

    def _reconstruct_object(self, data):
        """Reconstruct an object from its JSON representation."""
        if isinstance(data, dict):
            # Check if this is a serialized datetime
            if "__datetime__" in data:
                try:
                    module_name = data.get("__module__", "datetime")
                    class_name = data.get("__class__", "datetime")

                    # Try to import the specific datetime class
                    module = importlib.import_module(module_name)
                    dt_class = getattr(module, class_name)

                    # Parse the ISO format string
                    dt = dt_class.fromisoformat(data["__datetime__"])
                    return dt
                except (ImportError, AttributeError, ValueError) as e:
                    print(f"Error reconstructing datetime: {e}")
                    return data

            # Check if this is a serialized enum
            elif "__enum__" in data:
                try:
                    module_name = data.get("__module__", "builtins")
                    enum_class = self._import_class(module_name, data["__enum__"])
                    return enum_class(data["value"])
                except (ImportError, AttributeError) as e:
                    print(f"Error reconstructing enum: {e}")
                    return data

            # Check if this is a serialized Pydantic model
            elif "__pydantic__" in data:
                try:
                    module_name = data.get("__module__", "builtins")
                    model_class = self._import_class(module_name, data["__pydantic__"])
                    return model_class(**self._reconstruct_object(data["data"]))
                except (ImportError, AttributeError) as e:
                    print(f"Error reconstructing Pydantic model: {e}")
                    return data

            # Regular dictionary
            return {k: self._reconstruct_object(v) for k, v in data.items()}

        # Handle lists
        elif isinstance(data, list):
            return [self._reconstruct_object(item) for item in data]

        # Return primitive types as is
        return data

    def _import_class(self, module_name, class_name):
        """Import a class from a module."""
        module = __import__(module_name, fromlist=[class_name])
        return getattr(module, class_name)
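
To make the record/replay contract concrete, here is a small self-contained sketch (not part of the commit) that wraps a stand-in async function with RecordableMock, records one call into a temporary cache directory, and then replays it from the JSON file. The fake_chat function, the import path, and the temporary directory are all invented for the example.

# Illustration only: exercising RecordableMock outside the llama-stack fixtures.
import asyncio
import tempfile

from recordable_mock import RecordableMock  # i.e. tests/integration/fixtures/recordable_mock.py


async def fake_chat(prompt):
    # Stand-in for a real provider call (e.g. inference.chat_completion).
    return {"role": "assistant", "content": f"echo: {prompt}"}


async def main():
    cache_dir = tempfile.mkdtemp()

    # Record mode: calls fake_chat and writes chat_completion.json into cache_dir.
    recorder = RecordableMock(fake_chat, cache_dir, "chat_completion", record=True)
    first = await recorder("hello")

    # Replay mode: fake_chat is never called again; the cached JSON entry is
    # returned (via _reconstruct_object), keyed by the normalized arguments.
    replayer = RecordableMock(fake_chat, cache_dir, "chat_completion", record=False)
    second = await replayer("hello")

    assert first == second


asyncio.run(main())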
52345  tests/integration/fixtures/recorded_responses/chat_completion.json  Normal file
File diff suppressed because one or more lines are too long
852  tests/integration/fixtures/recorded_responses/invoke_tool.json  Normal file
File diff suppressed because one or more lines are too long