mirror of
				https://github.com/meta-llama/llama-stack.git
				synced 2025-10-26 17:23:00 +00:00 
			
		
		
		
	a bunch of logger.info()s are good for server code to help debug in production, but we don't want them killing our unit test output :) --------- Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com>
		
			
				
	
	
		
			357 lines
		
	
	
	
		
			11 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			357 lines
		
	
	
	
		
			11 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| # Copyright (c) Meta Platforms, Inc. and affiliates.
 | |
| # All rights reserved.
 | |
| #
 | |
| # This source code is licensed under the terms described in the LICENSE file in
 | |
| # the root directory of this source tree.
 | |
| 
 | |
| import os
 | |
| from typing import Any
 | |
| from unittest.mock import AsyncMock, MagicMock, patch
 | |
| 
 | |
| import pytest
 | |
| 
 | |
| from llama_stack.apis.inference import CompletionMessage, UserMessage
 | |
| from llama_stack.apis.resource import ResourceType
 | |
| from llama_stack.apis.safety import RunShieldResponse, ViolationLevel
 | |
| from llama_stack.apis.shields import Shield
 | |
| from llama_stack.models.llama.datatypes import StopReason
 | |
| from llama_stack.providers.remote.safety.nvidia.config import NVIDIASafetyConfig
 | |
| from llama_stack.providers.remote.safety.nvidia.nvidia import NVIDIASafetyAdapter
 | |
| 
 | |
| 
 | |
| class FakeNVIDIASafetyAdapter(NVIDIASafetyAdapter):
 | |
|     """Test implementation that provides the required shield_store."""
 | |
| 
 | |
|     def __init__(self, config: NVIDIASafetyConfig, shield_store):
 | |
|         super().__init__(config)
 | |
|         self.shield_store = shield_store
 | |
| 
 | |
| 
 | |
| @pytest.fixture
 | |
| def nvidia_adapter():
 | |
|     """Set up the NVIDIASafetyAdapter for testing."""
 | |
|     os.environ["NVIDIA_GUARDRAILS_URL"] = "http://nemo.test"
 | |
| 
 | |
|     # Initialize the adapter
 | |
|     config = NVIDIASafetyConfig(
 | |
|         guardrails_service_url=os.environ["NVIDIA_GUARDRAILS_URL"],
 | |
|     )
 | |
| 
 | |
|     # Create a mock shield store that implements the ShieldStore protocol
 | |
|     shield_store = AsyncMock()
 | |
|     shield_store.get_shield = AsyncMock()
 | |
| 
 | |
|     adapter = FakeNVIDIASafetyAdapter(config=config, shield_store=shield_store)
 | |
| 
 | |
|     return adapter
 | |
| 
 | |
| 
 | |
| @pytest.fixture
 | |
| def mock_guardrails_post():
 | |
|     """Mock the HTTP request methods."""
 | |
|     with patch("llama_stack.providers.remote.safety.nvidia.nvidia.NeMoGuardrails._guardrails_post") as mock_post:
 | |
|         mock_post.return_value = {"status": "allowed"}
 | |
|         yield mock_post
 | |
| 
 | |
| 
 | |
| def _assert_request(
 | |
|     mock_call: MagicMock,
 | |
|     expected_url: str,
 | |
|     expected_headers: dict[str, str] | None = None,
 | |
|     expected_json: dict[str, Any] | None = None,
 | |
| ) -> None:
 | |
|     """
 | |
|     Helper method to verify request details in mock API calls.
 | |
| 
 | |
|     Args:
 | |
|         mock_call: The MagicMock object that was called
 | |
|         expected_url: The expected URL to which the request was made
 | |
|         expected_headers: Optional dictionary of expected request headers
 | |
|         expected_json: Optional dictionary of expected JSON payload
 | |
|     """
 | |
|     call_args = mock_call.call_args
 | |
| 
 | |
|     # Check URL
 | |
|     assert call_args[0][0] == expected_url
 | |
| 
 | |
|     # Check headers if provided
 | |
|     if expected_headers:
 | |
|         for key, value in expected_headers.items():
 | |
|             assert call_args[1]["headers"][key] == value
 | |
| 
 | |
|     # Check JSON if provided
 | |
|     if expected_json:
 | |
|         for key, value in expected_json.items():
 | |
|             if isinstance(value, dict):
 | |
|                 for nested_key, nested_value in value.items():
 | |
|                     assert call_args[1]["json"][key][nested_key] == nested_value
 | |
|             else:
 | |
|                 assert call_args[1]["json"][key] == value
 | |
| 
 | |
| 
 | |
| async def test_register_shield_with_valid_id(nvidia_adapter):
 | |
|     adapter = nvidia_adapter
 | |
| 
 | |
|     shield = Shield(
 | |
|         provider_id="nvidia",
 | |
|         type=ResourceType.shield,
 | |
|         identifier="test-shield",
 | |
|         provider_resource_id="test-model",
 | |
|     )
 | |
| 
 | |
|     # Register the shield
 | |
|     await adapter.register_shield(shield)
 | |
| 
 | |
| 
 | |
| async def test_register_shield_without_id(nvidia_adapter):
 | |
|     adapter = nvidia_adapter
 | |
| 
 | |
|     shield = Shield(
 | |
|         provider_id="nvidia",
 | |
|         type=ResourceType.shield,
 | |
|         identifier="test-shield",
 | |
|         provider_resource_id="",
 | |
|     )
 | |
| 
 | |
|     # Register the shield should raise a ValueError
 | |
|     with pytest.raises(ValueError):
 | |
|         await adapter.register_shield(shield)
 | |
| 
 | |
| 
 | |
| async def test_run_shield_allowed(nvidia_adapter, mock_guardrails_post):
 | |
|     adapter = nvidia_adapter
 | |
| 
 | |
|     # Set up the shield
 | |
|     shield_id = "test-shield"
 | |
|     shield = Shield(
 | |
|         provider_id="nvidia",
 | |
|         type=ResourceType.shield,
 | |
|         identifier=shield_id,
 | |
|         provider_resource_id="test-model",
 | |
|     )
 | |
|     adapter.shield_store.get_shield.return_value = shield
 | |
| 
 | |
|     # Mock Guardrails API response
 | |
|     mock_guardrails_post.return_value = {"status": "allowed"}
 | |
| 
 | |
|     # Run the shield
 | |
|     messages = [
 | |
|         UserMessage(role="user", content="Hello, how are you?"),
 | |
|         CompletionMessage(
 | |
|             role="assistant",
 | |
|             content="I'm doing well, thank you for asking!",
 | |
|             stop_reason=StopReason.end_of_message,
 | |
|             tool_calls=[],
 | |
|         ),
 | |
|     ]
 | |
|     result = await adapter.run_shield(shield_id, messages)
 | |
| 
 | |
|     # Verify the shield store was called
 | |
|     adapter.shield_store.get_shield.assert_called_once_with(shield_id)
 | |
| 
 | |
|     # Verify the Guardrails API was called correctly
 | |
|     mock_guardrails_post.assert_called_once_with(
 | |
|         path="/v1/guardrail/checks",
 | |
|         data={
 | |
|             "model": shield_id,
 | |
|             "messages": [
 | |
|                 {"role": "user", "content": "Hello, how are you?"},
 | |
|                 {"role": "assistant", "content": "I'm doing well, thank you for asking!"},
 | |
|             ],
 | |
|             "temperature": 1.0,
 | |
|             "top_p": 1,
 | |
|             "frequency_penalty": 0,
 | |
|             "presence_penalty": 0,
 | |
|             "max_tokens": 160,
 | |
|             "stream": False,
 | |
|             "guardrails": {
 | |
|                 "config_id": "self-check",
 | |
|             },
 | |
|         },
 | |
|     )
 | |
| 
 | |
|     # Verify the result
 | |
|     assert isinstance(result, RunShieldResponse)
 | |
|     assert result.violation is None
 | |
| 
 | |
| 
 | |
| async def test_run_shield_blocked(nvidia_adapter, mock_guardrails_post):
 | |
|     adapter = nvidia_adapter
 | |
| 
 | |
|     # Set up the shield
 | |
|     shield_id = "test-shield"
 | |
|     shield = Shield(
 | |
|         provider_id="nvidia",
 | |
|         type=ResourceType.shield,
 | |
|         identifier=shield_id,
 | |
|         provider_resource_id="test-model",
 | |
|     )
 | |
|     adapter.shield_store.get_shield.return_value = shield
 | |
| 
 | |
|     # Mock Guardrails API response
 | |
|     mock_guardrails_post.return_value = {"status": "blocked", "rails_status": {"reason": "harmful_content"}}
 | |
| 
 | |
|     # Run the shield
 | |
|     messages = [
 | |
|         UserMessage(role="user", content="Hello, how are you?"),
 | |
|         CompletionMessage(
 | |
|             role="assistant",
 | |
|             content="I'm doing well, thank you for asking!",
 | |
|             stop_reason=StopReason.end_of_message,
 | |
|             tool_calls=[],
 | |
|         ),
 | |
|     ]
 | |
|     result = await adapter.run_shield(shield_id, messages)
 | |
| 
 | |
|     # Verify the shield store was called
 | |
|     adapter.shield_store.get_shield.assert_called_once_with(shield_id)
 | |
| 
 | |
|     # Verify the Guardrails API was called correctly
 | |
|     mock_guardrails_post.assert_called_once_with(
 | |
|         path="/v1/guardrail/checks",
 | |
|         data={
 | |
|             "model": shield_id,
 | |
|             "messages": [
 | |
|                 {"role": "user", "content": "Hello, how are you?"},
 | |
|                 {"role": "assistant", "content": "I'm doing well, thank you for asking!"},
 | |
|             ],
 | |
|             "temperature": 1.0,
 | |
|             "top_p": 1,
 | |
|             "frequency_penalty": 0,
 | |
|             "presence_penalty": 0,
 | |
|             "max_tokens": 160,
 | |
|             "stream": False,
 | |
|             "guardrails": {
 | |
|                 "config_id": "self-check",
 | |
|             },
 | |
|         },
 | |
|     )
 | |
| 
 | |
|     # Verify the result
 | |
|     assert result.violation is not None
 | |
|     assert isinstance(result, RunShieldResponse)
 | |
|     assert result.violation.user_message == "Sorry I cannot do this."
 | |
|     assert result.violation.violation_level == ViolationLevel.ERROR
 | |
|     assert result.violation.metadata == {"reason": "harmful_content"}
 | |
| 
 | |
| 
 | |
| async def test_run_shield_not_found(nvidia_adapter, mock_guardrails_post):
 | |
|     adapter = nvidia_adapter
 | |
| 
 | |
|     # Set up shield store to return None
 | |
|     shield_id = "non-existent-shield"
 | |
|     adapter.shield_store.get_shield.return_value = None
 | |
| 
 | |
|     messages = [
 | |
|         UserMessage(role="user", content="Hello, how are you?"),
 | |
|     ]
 | |
| 
 | |
|     with pytest.raises(ValueError):
 | |
|         await adapter.run_shield(shield_id, messages)
 | |
| 
 | |
|     # Verify the shield store was called
 | |
|     adapter.shield_store.get_shield.assert_called_once_with(shield_id)
 | |
| 
 | |
|     # Verify the Guardrails API was not called
 | |
|     mock_guardrails_post.assert_not_called()
 | |
| 
 | |
| 
 | |
| async def test_run_shield_http_error(nvidia_adapter, mock_guardrails_post):
 | |
|     adapter = nvidia_adapter
 | |
| 
 | |
|     shield_id = "test-shield"
 | |
|     shield = Shield(
 | |
|         provider_id="nvidia",
 | |
|         type=ResourceType.shield,
 | |
|         identifier=shield_id,
 | |
|         provider_resource_id="test-model",
 | |
|     )
 | |
|     adapter.shield_store.get_shield.return_value = shield
 | |
| 
 | |
|     # Mock Guardrails API to raise an exception
 | |
|     error_msg = "API Error: 500 Internal Server Error"
 | |
|     mock_guardrails_post.side_effect = Exception(error_msg)
 | |
| 
 | |
|     # Running the shield should raise an exception
 | |
|     messages = [
 | |
|         UserMessage(role="user", content="Hello, how are you?"),
 | |
|         CompletionMessage(
 | |
|             role="assistant",
 | |
|             content="I'm doing well, thank you for asking!",
 | |
|             stop_reason=StopReason.end_of_message,
 | |
|             tool_calls=[],
 | |
|         ),
 | |
|     ]
 | |
|     with pytest.raises(Exception) as exc_info:
 | |
|         await adapter.run_shield(shield_id, messages)
 | |
| 
 | |
|     # Verify the shield store was called
 | |
|     adapter.shield_store.get_shield.assert_called_once_with(shield_id)
 | |
| 
 | |
|     # Verify the Guardrails API was called correctly
 | |
|     mock_guardrails_post.assert_called_once_with(
 | |
|         path="/v1/guardrail/checks",
 | |
|         data={
 | |
|             "model": shield_id,
 | |
|             "messages": [
 | |
|                 {"role": "user", "content": "Hello, how are you?"},
 | |
|                 {"role": "assistant", "content": "I'm doing well, thank you for asking!"},
 | |
|             ],
 | |
|             "temperature": 1.0,
 | |
|             "top_p": 1,
 | |
|             "frequency_penalty": 0,
 | |
|             "presence_penalty": 0,
 | |
|             "max_tokens": 160,
 | |
|             "stream": False,
 | |
|             "guardrails": {
 | |
|                 "config_id": "self-check",
 | |
|             },
 | |
|         },
 | |
|     )
 | |
|     # Verify the exception message
 | |
|     assert error_msg in str(exc_info.value)
 | |
| 
 | |
| 
 | |
| def test_init_nemo_guardrails():
 | |
|     from llama_stack.providers.remote.safety.nvidia.nvidia import NeMoGuardrails
 | |
| 
 | |
|     os.environ["NVIDIA_GUARDRAILS_URL"] = "http://nemo.test"
 | |
| 
 | |
|     test_config_id = "test-custom-config-id"
 | |
|     config = NVIDIASafetyConfig(
 | |
|         guardrails_service_url=os.environ["NVIDIA_GUARDRAILS_URL"],
 | |
|         config_id=test_config_id,
 | |
|     )
 | |
|     # Initialize with default parameters
 | |
|     test_model = "test-model"
 | |
|     guardrails = NeMoGuardrails(config, test_model)
 | |
| 
 | |
|     # Verify the attributes are set correctly
 | |
|     assert guardrails.config_id == test_config_id
 | |
|     assert guardrails.model == test_model
 | |
|     assert guardrails.threshold == 0.9  # Default value
 | |
|     assert guardrails.temperature == 1.0  # Default value
 | |
|     assert guardrails.guardrails_service_url == os.environ["NVIDIA_GUARDRAILS_URL"]
 | |
| 
 | |
|     # Initialize with custom parameters
 | |
|     guardrails = NeMoGuardrails(config, test_model, threshold=0.8, temperature=0.7)
 | |
| 
 | |
|     # Verify the attributes are set correctly
 | |
|     assert guardrails.config_id == test_config_id
 | |
|     assert guardrails.model == test_model
 | |
|     assert guardrails.threshold == 0.8
 | |
|     assert guardrails.temperature == 0.7
 | |
|     assert guardrails.guardrails_service_url == os.environ["NVIDIA_GUARDRAILS_URL"]
 | |
| 
 | |
| 
 | |
| def test_init_nemo_guardrails_invalid_temperature():
 | |
|     from llama_stack.providers.remote.safety.nvidia.nvidia import NeMoGuardrails
 | |
| 
 | |
|     os.environ["NVIDIA_GUARDRAILS_URL"] = "http://nemo.test"
 | |
| 
 | |
|     config = NVIDIASafetyConfig(
 | |
|         guardrails_service_url=os.environ["NVIDIA_GUARDRAILS_URL"],
 | |
|         config_id="test-custom-config-id",
 | |
|     )
 | |
|     with pytest.raises(ValueError):
 | |
|         NeMoGuardrails(config, "test-model", temperature=0)
 |