mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-06-27 18:50:41 +00:00
# What does this PR do? start_stack.sh was using --yaml-config which is deprecated. a bunch of distro docs also mentioned --yaml-config. Replaces all instances and logic for --yaml-config with --config resolves #2189 Signed-off-by: Charlie Doern <cdoern@redhat.com>
194 lines
5 KiB
Bash
Executable file
194 lines
5 KiB
Bash
Executable file
#!/usr/bin/env bash
|
|
|
|
# Copyright (c) Meta Platforms, Inc. and affiliates.
|
|
# All rights reserved.
|
|
#
|
|
# This source code is licensed under the terms described in the LICENSE file in
|
|
# the root directory of this source tree.
|
|
|
|
|
|
CONTAINER_BINARY=${CONTAINER_BINARY:-docker}
|
|
CONTAINER_OPTS=${CONTAINER_OPTS:-}
|
|
LLAMA_CHECKPOINT_DIR=${LLAMA_CHECKPOINT_DIR:-}
|
|
LLAMA_STACK_DIR=${LLAMA_STACK_DIR:-}
|
|
TEST_PYPI_VERSION=${TEST_PYPI_VERSION:-}
|
|
PYPI_VERSION=${PYPI_VERSION:-}
|
|
VIRTUAL_ENV=${VIRTUAL_ENV:-}
|
|
|
|
set -euo pipefail
|
|
|
|
RED='\033[0;31m'
|
|
GREEN='\033[0;32m'
|
|
NC='\033[0m' # No Color
|
|
|
|
error_handler() {
|
|
echo "Error occurred in script at line: ${1}" >&2
|
|
exit 1
|
|
}
|
|
|
|
trap 'error_handler ${LINENO}' ERR
|
|
|
|
if [ $# -lt 3 ]; then
|
|
echo "Usage: $0 <env_type> <env_path_or_name> <port> [--config <yaml_config>] [--env KEY=VALUE]..."
|
|
exit 1
|
|
fi
|
|
|
|
env_type="$1"
|
|
shift
|
|
|
|
env_path_or_name="$1"
|
|
container_image="localhost/$env_path_or_name"
|
|
shift
|
|
|
|
port="$1"
|
|
shift
|
|
|
|
SCRIPT_DIR=$(dirname "$(readlink -f "$0")")
|
|
source "$SCRIPT_DIR/common.sh"
|
|
|
|
# Initialize variables
|
|
yaml_config=""
|
|
env_vars=""
|
|
other_args=""
|
|
|
|
# Process remaining arguments
|
|
while [[ $# -gt 0 ]]; do
|
|
case "$1" in
|
|
--config)
|
|
if [[ -n "$2" ]]; then
|
|
yaml_config="$2"
|
|
shift 2
|
|
else
|
|
echo -e "${RED}Error: $1 requires a CONFIG argument${NC}" >&2
|
|
exit 1
|
|
fi
|
|
;;
|
|
--env)
|
|
if [[ -n "$2" ]]; then
|
|
env_vars="$env_vars --env $2"
|
|
shift 2
|
|
else
|
|
echo -e "${RED}Error: --env requires a KEY=VALUE argument${NC}" >&2
|
|
exit 1
|
|
fi
|
|
;;
|
|
*)
|
|
other_args="$other_args $1"
|
|
shift
|
|
;;
|
|
esac
|
|
done
|
|
|
|
# Check if yaml_config is required based on env_type
|
|
if [[ "$env_type" == "venv" || "$env_type" == "conda" ]] && [ -z "$yaml_config" ]; then
|
|
echo -e "${RED}Error: --config is required for venv and conda environments${NC}" >&2
|
|
exit 1
|
|
fi
|
|
|
|
PYTHON_BINARY="python"
|
|
case "$env_type" in
|
|
"venv")
|
|
if [ -n "$VIRTUAL_ENV" ] && [ "$VIRTUAL_ENV" == "$env_path_or_name" ]; then
|
|
echo -e "${GREEN}Virtual environment already activated${NC}" >&2
|
|
else
|
|
# Activate virtual environment
|
|
if [ ! -d "$env_path_or_name" ]; then
|
|
echo -e "${RED}Error: Virtual environment not found at $env_path_or_name${NC}" >&2
|
|
exit 1
|
|
fi
|
|
|
|
if [ ! -f "$env_path_or_name/bin/activate" ]; then
|
|
echo -e "${RED}Error: Virtual environment activate binary not found at $env_path_or_name/bin/activate" >&2
|
|
exit 1
|
|
fi
|
|
|
|
source "$env_path_or_name/bin/activate"
|
|
fi
|
|
;;
|
|
"conda")
|
|
if ! is_command_available conda; then
|
|
echo -e "${RED}Error: conda not found" >&2
|
|
exit 1
|
|
fi
|
|
eval "$(conda shell.bash hook)"
|
|
conda deactivate && conda activate "$env_path_or_name"
|
|
PYTHON_BINARY="$CONDA_PREFIX/bin/python"
|
|
;;
|
|
*)
|
|
esac
|
|
|
|
if [[ "$env_type" == "venv" || "$env_type" == "conda" ]]; then
|
|
set -x
|
|
|
|
if [ -n "$yaml_config" ]; then
|
|
yaml_config_arg="--config $yaml_config"
|
|
else
|
|
yaml_config_arg=""
|
|
fi
|
|
|
|
$PYTHON_BINARY -m llama_stack.distribution.server.server \
|
|
$yaml_config_arg \
|
|
--port "$port" \
|
|
$env_vars \
|
|
$other_args
|
|
elif [[ "$env_type" == "container" ]]; then
|
|
set -x
|
|
|
|
# Check if container command is available
|
|
if ! is_command_available $CONTAINER_BINARY; then
|
|
printf "${RED}Error: ${CONTAINER_BINARY} command not found. Is ${CONTAINER_BINARY} installed and in your PATH?${NC}" >&2
|
|
exit 1
|
|
fi
|
|
|
|
if is_command_available selinuxenabled &> /dev/null && selinuxenabled; then
|
|
# Disable SELinux labels
|
|
CONTAINER_OPTS="$CONTAINER_OPTS --security-opt label=disable"
|
|
fi
|
|
|
|
mounts=""
|
|
if [ -n "$LLAMA_STACK_DIR" ]; then
|
|
mounts="$mounts -v $(readlink -f $LLAMA_STACK_DIR):/app/llama-stack-source"
|
|
fi
|
|
if [ -n "$LLAMA_CHECKPOINT_DIR" ]; then
|
|
mounts="$mounts -v $LLAMA_CHECKPOINT_DIR:/root/.llama"
|
|
CONTAINER_OPTS="$CONTAINER_OPTS --gpus=all"
|
|
fi
|
|
|
|
if [ -n "$PYPI_VERSION" ]; then
|
|
version_tag="$PYPI_VERSION"
|
|
elif [ -n "$LLAMA_STACK_DIR" ]; then
|
|
version_tag="dev"
|
|
elif [ -n "$TEST_PYPI_VERSION" ]; then
|
|
version_tag="test-$TEST_PYPI_VERSION"
|
|
else
|
|
if ! is_command_available jq; then
|
|
echo -e "${RED}Error: jq not found" >&2
|
|
exit 1
|
|
fi
|
|
URL="https://pypi.org/pypi/llama-stack/json"
|
|
version_tag=$(curl -s $URL | jq -r '.info.version')
|
|
fi
|
|
|
|
# Build the command with optional yaml config
|
|
cmd="$CONTAINER_BINARY run $CONTAINER_OPTS -it \
|
|
-p $port:$port \
|
|
$env_vars \
|
|
$mounts \
|
|
--env LLAMA_STACK_PORT=$port \
|
|
--entrypoint python \
|
|
$container_image:$version_tag \
|
|
-m llama_stack.distribution.server.server"
|
|
|
|
# Add yaml config if provided, otherwise use default
|
|
if [ -n "$yaml_config" ]; then
|
|
cmd="$cmd -v $yaml_config:/app/run.yaml --config /app/run.yaml"
|
|
else
|
|
cmd="$cmd --config /app/run.yaml"
|
|
fi
|
|
|
|
# Add any other args
|
|
cmd="$cmd $other_args"
|
|
|
|
# Execute the command
|
|
eval $cmd
|
|
fi
|