forked from phoenix-oss/llama-stack-mirror
		
	docs: Add NVIDIA platform distro docs (#1971)
# What does this PR do? Add NVIDIA platform docs that serve as a starting point for Llama Stack users and explains all supported microservices. [//]: # (If resolving an issue, uncomment and update the line below) [//]: # (Closes #[issue-number]) ## Test Plan [Describe the tests you ran to verify your changes with result summaries. *Provide clear instructions so the plan can be easily re-executed.*] [//]: # (## Documentation) --------- Co-authored-by: Jash Gulabrai <jgulabrai@nvidia.com>
This commit is contained in:
		
							parent
							
								
									45e08ff417
								
							
						
					
					
						commit
						2ae1d7f4e6
					
				
					 6 changed files with 347 additions and 97 deletions
				
			
		
							
								
								
									
										77
									
								
								llama_stack/providers/remote/safety/nvidia/README.md
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										77
									
								
								llama_stack/providers/remote/safety/nvidia/README.md
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,77 @@ | |||
| # NVIDIA Safety Provider for LlamaStack | ||||
| 
 | ||||
| This provider enables safety checks and guardrails for LLM interactions using NVIDIA's NeMo Guardrails service. | ||||
| 
 | ||||
| ## Features | ||||
| 
 | ||||
| - Run safety checks for messages | ||||
| 
 | ||||
| ## Getting Started | ||||
| 
 | ||||
| ### Prerequisites | ||||
| 
 | ||||
| - LlamaStack with NVIDIA configuration | ||||
| - Access to NVIDIA NeMo Guardrails service | ||||
| - NIM for model to use for safety check is deployed | ||||
| 
 | ||||
| ### Setup | ||||
| 
 | ||||
| Build the NVIDIA environment: | ||||
| 
 | ||||
| ```bash | ||||
| llama stack build --template nvidia --image-type conda | ||||
| ``` | ||||
| 
 | ||||
| ### Basic Usage using the LlamaStack Python Client | ||||
| 
 | ||||
| #### Initialize the client | ||||
| 
 | ||||
| ```python | ||||
| import os | ||||
| 
 | ||||
| os.environ["NVIDIA_API_KEY"] = "your-api-key" | ||||
| os.environ["NVIDIA_GUARDRAILS_URL"] = "http://guardrails.test" | ||||
| 
 | ||||
| from llama_stack.distribution.library_client import LlamaStackAsLibraryClient | ||||
| 
 | ||||
| client = LlamaStackAsLibraryClient("nvidia") | ||||
| client.initialize() | ||||
| ``` | ||||
| 
 | ||||
| #### Create a safety shield | ||||
| 
 | ||||
| ```python | ||||
| from llama_stack.apis.safety import Shield | ||||
| from llama_stack.apis.inference import Message | ||||
| 
 | ||||
| # Create a safety shield | ||||
| shield = Shield( | ||||
|     shield_id="your-shield-id", | ||||
|     provider_resource_id="safety-model-id",  # The model to use for safety checks | ||||
|     description="Safety checks for content moderation", | ||||
| ) | ||||
| 
 | ||||
| # Register the shield | ||||
| await client.safety.register_shield(shield) | ||||
| ``` | ||||
| 
 | ||||
| #### Run safety checks | ||||
| 
 | ||||
| ```python | ||||
| # Messages to check | ||||
| messages = [Message(role="user", content="Your message to check")] | ||||
| 
 | ||||
| # Run safety check | ||||
| response = await client.safety.run_shield( | ||||
|     shield_id="your-shield-id", | ||||
|     messages=messages, | ||||
| ) | ||||
| 
 | ||||
| # Check for violations | ||||
| if response.violation: | ||||
|     print(f"Safety violation detected: {response.violation.user_message}") | ||||
|     print(f"Violation level: {response.violation.violation_level}") | ||||
|     print(f"Metadata: {response.violation.metadata}") | ||||
| else: | ||||
|     print("No safety violations detected") | ||||
| ``` | ||||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue