mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-12-17 19:59:47 +00:00
Update Bedrock provider configuration
- Remove unnecessary provider file since Bedrock is in-tree
- Add Bedrock runtime configuration to run.yaml with optional AWS env vars
This commit is contained in:
parent
3ee3746462
commit
8f62870b01
2 changed files with 13 additions and 7 deletions
|
|
@@ -1,7 +0,0 @@
|
||||||
adapter:
|
|
||||||
adapter_type: bedrock
|
|
||||||
pip_packages: ["boto3>=1.26.137", "botocore"]
|
|
||||||
config_class: llama_stack.providers.remote.inference.bedrock.config.BedrockConfig
|
|
||||||
module: llama_stack.providers.remote.inference.bedrock
|
|
||||||
api_dependencies: ["inference"]
|
|
||||||
optional_api_dependencies: []
|
|
||||||
|
|
@@ -19,6 +19,19 @@ providers:
|
||||||
max_tokens: ${env.VLLM_MAX_TOKENS:=4096}
|
max_tokens: ${env.VLLM_MAX_TOKENS:=4096}
|
||||||
api_token: ${env.VLLM_API_TOKEN:=fake}
|
api_token: ${env.VLLM_API_TOKEN:=fake}
|
||||||
tls_verify: ${env.VLLM_TLS_VERIFY:=true}
|
tls_verify: ${env.VLLM_TLS_VERIFY:=true}
|
||||||
|
- provider_id: bedrock-inference
|
||||||
|
provider_type: remote::bedrock
|
||||||
|
config:
|
||||||
|
aws_access_key_id: ${env.AWS_ACCESS_KEY_ID:=}
|
||||||
|
aws_secret_access_key: ${env.AWS_SECRET_ACCESS_KEY:=}
|
||||||
|
aws_session_token: ${env.AWS_SESSION_TOKEN:=}
|
||||||
|
region_name: ${env.AWS_DEFAULT_REGION:=}
|
||||||
|
profile_name: ${env.AWS_PROFILE:=}
|
||||||
|
total_max_attempts: ${env.AWS_MAX_ATTEMPTS:=}
|
||||||
|
retry_mode: ${env.AWS_RETRY_MODE:=}
|
||||||
|
connect_timeout: ${env.AWS_CONNECT_TIMEOUT:=}
|
||||||
|
read_timeout: ${env.AWS_READ_TIMEOUT:=}
|
||||||
|
session_ttl: ${env.AWS_SESSION_TTL:=}
|
||||||
- provider_id: sentence-transformers
|
- provider_id: sentence-transformers
|
||||||
provider_type: inline::sentence-transformers
|
provider_type: inline::sentence-transformers
|
||||||
config: {}
|
config: {}
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue