mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-07-30 23:51:00 +00:00
refreshable boto credentials
This commit is contained in:
parent
7d28dc380e
commit
6697ca3d3a
5 changed files with 171 additions and 44 deletions
|
@ -18,6 +18,7 @@ from llama_stack.providers.utils.inference.model_registry import ModelRegistryHe
|
||||||
from llama_stack.apis.inference import * # noqa: F403
|
from llama_stack.apis.inference import * # noqa: F403
|
||||||
|
|
||||||
from llama_stack.providers.adapters.inference.bedrock.config import BedrockConfig
|
from llama_stack.providers.adapters.inference.bedrock.config import BedrockConfig
|
||||||
|
from llama_stack.providers.utils.refreshable_boto_session import RefreshableBotoSession
|
||||||
|
|
||||||
|
|
||||||
BEDROCK_SUPPORTED_MODELS = {
|
BEDROCK_SUPPORTED_MODELS = {
|
||||||
|
@ -441,38 +442,47 @@ class BedrockInferenceAdapter(ModelRegistryHelper, Inference):
|
||||||
|
|
||||||
|
|
||||||
def _create_bedrock_client(config: BedrockConfig) -> BaseClient:
|
def _create_bedrock_client(config: BedrockConfig) -> BaseClient:
|
||||||
retries_config = {
|
if config.aws_access_key_id and config.aws_secret_access_key:
|
||||||
k: v
|
retries_config = {
|
||||||
for k, v in dict(
|
k: v
|
||||||
total_max_attempts=config.total_max_attempts,
|
for k, v in dict(
|
||||||
mode=config.retry_mode,
|
total_max_attempts=config.total_max_attempts,
|
||||||
).items()
|
mode=config.retry_mode,
|
||||||
if v is not None
|
).items()
|
||||||
}
|
if v is not None
|
||||||
|
}
|
||||||
|
|
||||||
config_args = {
|
config_args = {
|
||||||
k: v
|
k: v
|
||||||
for k, v in dict(
|
for k, v in dict(
|
||||||
region_name=config.region_name,
|
region_name=config.region_name,
|
||||||
retries=retries_config if retries_config else None,
|
retries=retries_config if retries_config else None,
|
||||||
connect_timeout=config.connect_timeout,
|
connect_timeout=config.connect_timeout,
|
||||||
read_timeout=config.read_timeout,
|
read_timeout=config.read_timeout,
|
||||||
).items()
|
).items()
|
||||||
if v is not None
|
if v is not None
|
||||||
}
|
}
|
||||||
|
|
||||||
boto3_config = Config(**config_args)
|
boto3_config = Config(**config_args)
|
||||||
|
|
||||||
session_args = {
|
session_args = {
|
||||||
"aws_access_key_id": config.aws_access_key_id,
|
"aws_access_key_id": config.aws_access_key_id,
|
||||||
"aws_secret_access_key": config.aws_secret_access_key,
|
"aws_secret_access_key": config.aws_secret_access_key,
|
||||||
"aws_session_token": config.aws_session_token,
|
"aws_session_token": config.aws_session_token,
|
||||||
"region_name": config.region_name,
|
"region_name": config.region_name,
|
||||||
"profile_name": config.profile_name,
|
"profile_name": config.profile_name,
|
||||||
}
|
}
|
||||||
|
|
||||||
# Remove None values
|
# Remove None values
|
||||||
session_args = {k: v for k, v in session_args.items() if v is not None}
|
session_args = {k: v for k, v in session_args.items() if v is not None}
|
||||||
|
|
||||||
boto3_session = boto3.session.Session(**session_args)
|
boto3_session = boto3.session.Session(**session_args)
|
||||||
return boto3_session.client("bedrock-runtime", config=boto3_config)
|
return boto3_session.client("bedrock-runtime", config=boto3_config)
|
||||||
|
else:
|
||||||
|
return (
|
||||||
|
RefreshableBotoSession(
|
||||||
|
region_name=config.region_name, profile_name=config.profile_name
|
||||||
|
)
|
||||||
|
.refreshable_session()
|
||||||
|
.client("bedrock-runtime")
|
||||||
|
)
|
||||||
|
|
|
@ -14,6 +14,7 @@ import boto3
|
||||||
from llama_stack.apis.safety import * # noqa
|
from llama_stack.apis.safety import * # noqa
|
||||||
from llama_models.llama3.api.datatypes import * # noqa: F403
|
from llama_models.llama3.api.datatypes import * # noqa: F403
|
||||||
from llama_stack.providers.datatypes import ShieldsProtocolPrivate
|
from llama_stack.providers.datatypes import ShieldsProtocolPrivate
|
||||||
|
from llama_stack.providers.utils.refreshable_boto_session import RefreshableBotoSession
|
||||||
|
|
||||||
from .config import BedrockSafetyConfig
|
from .config import BedrockSafetyConfig
|
||||||
|
|
||||||
|
@ -27,19 +28,27 @@ BEDROCK_SUPPORTED_SHIELDS = [
|
||||||
|
|
||||||
|
|
||||||
def _create_bedrock_client(config: BedrockSafetyConfig, name: str):
|
def _create_bedrock_client(config: BedrockSafetyConfig, name: str):
|
||||||
session_args = {
|
if config.aws_access_key_id and config.aws_secret_access_key:
|
||||||
"aws_access_key_id": config.aws_access_key_id,
|
session_args = {
|
||||||
"aws_secret_access_key": config.aws_secret_access_key,
|
"aws_access_key_id": config.aws_access_key_id,
|
||||||
"aws_session_token": config.aws_session_token,
|
"aws_secret_access_key": config.aws_secret_access_key,
|
||||||
"region_name": config.region_name,
|
"aws_session_token": config.aws_session_token,
|
||||||
"profile_name": config.profile_name,
|
"region_name": config.region_name,
|
||||||
}
|
"profile_name": config.profile_name,
|
||||||
|
}
|
||||||
|
# Remove None values
|
||||||
|
session_args = {k: v for k, v in session_args.items() if v is not None}
|
||||||
|
|
||||||
# Remove None values
|
boto3_session = boto3.session.Session(**session_args)
|
||||||
session_args = {k: v for k, v in session_args.items() if v is not None}
|
return boto3_session.client(name)
|
||||||
|
else:
|
||||||
boto3_session = boto3.session.Session(**session_args)
|
return (
|
||||||
return boto3_session.client(name)
|
RefreshableBotoSession(
|
||||||
|
region_name=config.region_name, profile_name=config.profile_name
|
||||||
|
)
|
||||||
|
.refreshable_session()
|
||||||
|
.client(name)
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
class BedrockSafetyAdapter(Safety, ShieldsProtocolPrivate):
|
class BedrockSafetyAdapter(Safety, ShieldsProtocolPrivate):
|
||||||
|
|
|
@ -124,7 +124,7 @@ def available_providers() -> List[ProviderSpec]:
|
||||||
api=Api.inference,
|
api=Api.inference,
|
||||||
adapter=AdapterSpec(
|
adapter=AdapterSpec(
|
||||||
adapter_type="bedrock",
|
adapter_type="bedrock",
|
||||||
pip_packages=["boto3"],
|
pip_packages=["boto3", "pytz"],
|
||||||
module="llama_stack.providers.adapters.inference.bedrock",
|
module="llama_stack.providers.adapters.inference.bedrock",
|
||||||
config_class="llama_stack.providers.adapters.inference.bedrock.BedrockConfig",
|
config_class="llama_stack.providers.adapters.inference.bedrock.BedrockConfig",
|
||||||
),
|
),
|
||||||
|
|
|
@ -43,7 +43,7 @@ def available_providers() -> List[ProviderSpec]:
|
||||||
api=Api.safety,
|
api=Api.safety,
|
||||||
adapter=AdapterSpec(
|
adapter=AdapterSpec(
|
||||||
adapter_type="bedrock",
|
adapter_type="bedrock",
|
||||||
pip_packages=["boto3"],
|
pip_packages=["boto3", "pytz"],
|
||||||
module="llama_stack.providers.adapters.safety.bedrock",
|
module="llama_stack.providers.adapters.safety.bedrock",
|
||||||
config_class="llama_stack.providers.adapters.safety.bedrock.BedrockSafetyConfig",
|
config_class="llama_stack.providers.adapters.safety.bedrock.BedrockSafetyConfig",
|
||||||
),
|
),
|
||||||
|
|
108
llama_stack/providers/utils/refreshable_boto_session.py
Normal file
108
llama_stack/providers/utils/refreshable_boto_session.py
Normal file
|
@ -0,0 +1,108 @@
|
||||||
|
# Copyright (c) Meta Platforms, Inc. and affiliates.
|
||||||
|
# All rights reserved.
|
||||||
|
#
|
||||||
|
# This source code is licensed under the terms described in the LICENSE file in
|
||||||
|
# the root directory of this source tree.
|
||||||
|
|
||||||
|
import os
|
||||||
|
from datetime import datetime
|
||||||
|
from time import time
|
||||||
|
|
||||||
|
import pytz
|
||||||
|
from boto3 import Session
|
||||||
|
from botocore.credentials import RefreshableCredentials
|
||||||
|
from botocore.session import get_session
|
||||||
|
|
||||||
|
|
||||||
|
class RefreshableBotoSession:
    """
    Boto helper class that builds a boto3 session backed by refreshable
    credentials, so that clients or resources created from it can be cached.

    Usage
    -----
    session = RefreshableBotoSession().refreshable_session()

    client = session.client("bedrock-runtime")  # this client can be cached without worrying about expiring credentials
    """

    def __init__(
        self,
        region_name: str = None,
        profile_name: str = None,
        session_ttl: int = 30000,
    ):
        """
        Initialize `RefreshableBotoSession`

        Parameters
        ----------
        region_name : str (optional)
            Default region when creating a new connection. Falls back to the
            AWS_REGION, then AWS_DEFAULT_REGION, env vars if not provided.

        profile_name : str (optional)
            The name of a profile to use. Only consulted when credentials are
            not found in environment variables.

        session_ttl : int (optional)
            Number of seconds added to the current time to compute the
            `expiry_time` reported with each set of credentials.
        """
        # Explicit argument wins; otherwise check environment variables for region
        self.region_name = (
            region_name
            or os.environ.get("AWS_REGION")
            or os.environ.get("AWS_DEFAULT_REGION")
        )
        self.profile_name = profile_name
        self.session_ttl = session_ttl

    def _default_expiry_time(self) -> str:
        """
        Return `now + session_ttl` as a timezone-aware UTC ISO-8601 string.
        """
        # Function-scope import keeps this block self-contained.
        from datetime import timezone

        # Convert the epoch timestamp straight to UTC. Building a naive local
        # datetime and then stamping it with a UTC tzinfo would shift the
        # expiry by the host's UTC offset.
        return datetime.fromtimestamp(
            time() + self.session_ttl, tz=timezone.utc
        ).isoformat()

    def __get_session_credentials(self):
        """
        Get session credentials from environment variables or session

        Returns
        -------
        dict with keys `access_key`, `secret_key`, `token` and `expiry_time`.

        Raises
        ------
        botocore.exceptions.NoCredentialsError
            If no environment credentials are set and the profile-based
            session cannot resolve any credentials either.
        """
        # Check for credentials in environment variables first
        if all(
            key in os.environ for key in ["AWS_ACCESS_KEY_ID", "AWS_SECRET_ACCESS_KEY"]
        ):
            # An EXPIRY_TIME env var, when set, is used verbatim.
            expiry_time = os.environ.get("EXPIRY_TIME") or self._default_expiry_time()
            return {
                "access_key": os.environ["AWS_ACCESS_KEY_ID"],
                "secret_key": os.environ["AWS_SECRET_ACCESS_KEY"],
                "token": os.environ.get("AWS_SESSION_TOKEN"),  # Optional
                "expiry_time": expiry_time,
            }

        # Fall back to profile-based credentials
        session = Session(region_name=self.region_name, profile_name=self.profile_name)

        resolved = session.get_credentials()
        if resolved is None:
            # get_credentials() returns None when nothing could be resolved;
            # fail with an explicit error instead of an AttributeError below.
            from botocore.exceptions import NoCredentialsError

            raise NoCredentialsError()

        session_credentials = resolved.get_frozen_credentials()
        return {
            "access_key": session_credentials.access_key,
            "secret_key": session_credentials.secret_key,
            "token": session_credentials.token,
            "expiry_time": self._default_expiry_time(),
        }

    def refreshable_session(self) -> "Session":
        """
        Get refreshable boto3 session.

        The initial credentials and the refresh callback both come from
        `__get_session_credentials`.
        """
        # Get refreshable credentials
        refreshable_credentials = RefreshableCredentials.create_from_metadata(
            metadata=self.__get_session_credentials(),
            refresh_using=self.__get_session_credentials,
            method="sts-assume-role",
        )

        # Attach the refreshable credentials to a fresh botocore session
        session = get_session()
        session._credentials = refreshable_credentials
        session.set_config_variable("region", self.region_name)
        autorefresh_session = Session(botocore_session=session)

        return autorefresh_session
|
Loading…
Add table
Add a link
Reference in a new issue