forked from phoenix-oss/llama-stack-mirror
		
	feat(providers): sambanova updated to use LiteLLM openai-compat (#1596)
# What does this PR do?

Switch the SambaNova inference adaptor to use LiteLLM, to simplify the integration and to solve issues with the current adaptor when streaming and tool calling. Models and templates are updated.

## Test Plan

pytest -s -v tests/integration/inference/test_text_inference.py --stack-config=sambanova --text-model=sambanova/Meta-Llama-3.3-70B-Instruct

pytest -s -v tests/integration/inference/test_vision_inference.py --stack-config=sambanova --vision-model=sambanova/Llama-3.2-11B-Vision-Instruct
This commit is contained in:
		
							parent
							
								
									dd49ef31f1
								
							
						
					
					
						commit
						b2b00a216b
					
				
					 15 changed files with 529 additions and 404 deletions
				
			
		|  | @ -38,6 +38,10 @@ from llama_stack.providers.remote.inference.openai.config import OpenAIConfig | |||
| from llama_stack.providers.remote.inference.openai.models import ( | ||||
|     MODEL_ENTRIES as OPENAI_MODEL_ENTRIES, | ||||
| ) | ||||
| from llama_stack.providers.remote.inference.sambanova.config import SambaNovaImplConfig | ||||
| from llama_stack.providers.remote.inference.sambanova.models import ( | ||||
|     MODEL_ENTRIES as SAMBANOVA_MODEL_ENTRIES, | ||||
| ) | ||||
| from llama_stack.providers.remote.vector_io.chroma.config import ChromaVectorIOConfig | ||||
| from llama_stack.providers.remote.vector_io.pgvector.config import ( | ||||
|     PGVectorVectorIOConfig, | ||||
|  | @ -77,6 +81,11 @@ def get_inference_providers() -> tuple[list[Provider], list[ModelInput]]: | |||
|             GROQ_MODEL_ENTRIES, | ||||
|             GroqConfig.sample_run_config(api_key="${env.GROQ_API_KEY:}"), | ||||
|         ), | ||||
|         ( | ||||
|             "sambanova", | ||||
|             SAMBANOVA_MODEL_ENTRIES, | ||||
|             SambaNovaImplConfig.sample_run_config(api_key="${env.SAMBANOVA_API_KEY:}"), | ||||
|         ), | ||||
|     ] | ||||
|     inference_providers = [] | ||||
|     available_models = {} | ||||
|  |  | |||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue