forked from phoenix-oss/llama-stack-mirror
		
	# What does this PR do?
	* Added support for a PostgreSQL inference store
	* Added an 'oracle' template that demonstrates how to configure PostgreSQL stores (except for telemetry, which is not currently supported)
	## Test Plan
	llama stack build --template oracle --image-type conda --run
	LLAMA_STACK_CONFIG=http://localhost:8321 pytest -s -v tests/integration/ --text-model accounts/fireworks/models/llama-v3p3-70b-instruct -k 'inference_store'
		
			
				
	
	
		
			34 lines
		
	
	
	
		
			782 B
		
	
	
	
		
			YAML
		
	
	
	
	
	
			
		
		
	
	
			34 lines
		
	
	
	
		
			782 B
		
	
	
	
		
			YAML
		
	
	
	
	
	
| version: '2'
 | |
| distribution_spec:
 | |
|   description: Use (an external) Hugging Face Inference Endpoint for running LLM inference
 | |
|   providers:
 | |
|     inference:
 | |
|     - remote::hf::endpoint
 | |
|     vector_io:
 | |
|     - inline::faiss
 | |
|     - remote::chromadb
 | |
|     - remote::pgvector
 | |
|     safety:
 | |
|     - inline::llama-guard
 | |
|     agents:
 | |
|     - inline::meta-reference
 | |
|     telemetry:
 | |
|     - inline::meta-reference
 | |
|     eval:
 | |
|     - inline::meta-reference
 | |
|     datasetio:
 | |
|     - remote::huggingface
 | |
|     - inline::localfs
 | |
|     scoring:
 | |
|     - inline::basic
 | |
|     - inline::llm-as-judge
 | |
|     - inline::braintrust
 | |
|     tool_runtime:
 | |
|     - remote::brave-search
 | |
|     - remote::tavily-search
 | |
|     - inline::rag-runtime
 | |
|     - remote::model-context-protocol
 | |
| image_type: conda
 | |
| additional_pip_packages:
 | |
| - aiosqlite
 | |
| - sqlalchemy[asyncio]
 |