mirror of https://github.com/meta-llama/llama-stack.git (synced 2025-10-05 20:27:35 +00:00)
llama distribution -> llama stack + containers (WIP)
This commit is contained in:
parent 45987996c4
commit fd3b65b718
16 changed files with 204 additions and 80 deletions
@@ -1,44 +1,113 @@
 #!/bin/bash

-if [ "$#" -ne 3 ]; then
-  echo "Usage: $0 <image_name> <base_image> <pip_dependencies>"
-  echo "Example: $0 my-fastapi-app python:3.9-slim 'fastapi uvicorn'"
+LLAMA_MODELS_DIR=${LLAMA_MODELS_DIR:-}
+LLAMA_TOOLCHAIN_DIR=${LLAMA_TOOLCHAIN_DIR:-}
+TEST_PYPI_VERSION=${TEST_PYPI_VERSION:-}
+
+if [ "$#" -ne 4 ]; then
+  echo "Usage: $0 [api|stack] <image_name> <docker_base> <pip_dependencies>"
+  echo "Example: $0 agentic_system my-fastapi-app python:3.9-slim 'fastapi uvicorn'"
   exit 1
 fi

-IMAGE_NAME=$1
-BASE_IMAGE=$2
-PIP_DEPENDENCIES=$3
+api_or_stack=$1
+image_name=$2
+docker_base=$3
+pip_dependencies=$4
+
+# Define color codes
+RED='\033[0;31m'
+GREEN='\033[0;32m'
+NC='\033[0m' # No Color

 set -euo pipefail

 PORT=8001

 SCRIPT_DIR=$(dirname "$(readlink -f "$0")")
-SOURCE_DIR=$(dirname $(dirname $(dirname "$SCRIPT_DIR")))
-echo $SOURCE_DIR
+REPO_DIR=$(dirname $(dirname "$SCRIPT_DIR"))

 TEMP_DIR=$(mktemp -d)
 echo "Created temporary directory: $TEMP_DIR"

-cat <<EOF >"$TEMP_DIR/Dockerfile"
-FROM $BASE_IMAGE
+add_to_docker() {
+  local input
+  output_file="$TEMP_DIR/Dockerfile"
+  if [ -t 0 ]; then
+    printf '%s\n' "$1" >> "$output_file"
+  else
+    # If stdin is not a terminal, read from it (heredoc)
+    cat >> "$output_file"
+  fi
+}
+
+add_to_docker <<EOF
+FROM $docker_base
 WORKDIR /app
-COPY llama-stack/llama_toolchain /app/llama_toolchain
-COPY llama-models/models /app/llama_models
-
-RUN pip install $PIP_DEPENDENCIES
-
-EXPOSE $PORT
-ENTRYPOINT ["python3", "-m", "llama_toolchain.distribution.server", "--port", "$PORT"]
+
+RUN apt-get update && apt-get install -y \
+       iputils-ping net-tools iproute2 dnsutils telnet \
+       curl wget telnet \
+       procps psmisc lsof \
+       traceroute \
+       && rm -rf /var/lib/apt/lists/*

 EOF

echo "Dockerfile created successfully in $TEMP_DIR/Dockerfile"
|
||||
toolchain_mount="/app/llama-toolchain-source"
|
||||
models_mount="/app/llama-models-source"
|
||||
|
||||
podman build -t $IMAGE_NAME -f "$TEMP_DIR/Dockerfile" "$SOURCE_DIR"
|
||||
if [ -n "$LLAMA_TOOLCHAIN_DIR" ]; then
|
||||
if [ ! -d "$LLAMA_TOOLCHAIN_DIR" ]; then
|
||||
echo "${RED}Warning: LLAMA_TOOLCHAIN_DIR is set but directory does not exist: $LLAMA_TOOLCHAIN_DIR${NC}" >&2
|
||||
exit 1
|
||||
fi
|
||||
add_to_docker "RUN pip install $toolchain_mount"
|
||||
else
|
||||
add_to_docker "RUN pip install llama-toolchain"
|
||||
fi
|
||||
|
||||
echo "Podman image '$IMAGE_NAME' built successfully."
|
||||
echo "You can run it with: podman run -p 8000:8000 $IMAGE_NAME"
|
||||
if [ -n "$LLAMA_MODELS_DIR" ]; then
|
||||
if [ ! -d "$LLAMA_MODELS_DIR" ]; then
|
||||
echo "${RED}Warning: LLAMA_MODELS_DIR is set but directory does not exist: $LLAMA_MODELS_DIR${NC}" >&2
|
||||
exit 1
|
||||
fi
|
||||
|
||||
rm -rf "$TEMP_DIR"
|
||||
add_to_docker <<EOF
|
||||
RUN pip uninstall -y llama-models
|
||||
RUN pip install $models_mount
|
||||
|
||||
EOF
|
||||
fi
|
||||
|
||||
if [ -n "$pip_dependencies" ]; then
|
||||
add_to_docker "RUN pip install $pip_dependencies"
|
||||
fi
|
||||
|
||||
add_to_docker <<EOF
|
||||
|
||||
# This would be good in production but for debugging flexibility lets not add it right now
|
||||
# We need a more solid production ready entrypoint.sh anyway
|
||||
#
|
||||
# ENTRYPOINT ["python", "-m", "llama_toolchain.distribution.server"]
|
||||
|
||||
EOF
|
||||
|
||||
printf "Dockerfile created successfully in $TEMP_DIR/Dockerfile"
|
||||
cat $TEMP_DIR/Dockerfile
|
||||
printf "\n"
|
||||
|
||||
mounts=""
|
||||
if [ -n "$LLAMA_TOOLCHAIN_DIR" ]; then
|
||||
mounts="$mounts -v $(readlink -f $LLAMA_TOOLCHAIN_DIR):$toolchain_mount"
|
||||
fi
|
||||
if [ -n "$LLAMA_MODELS_DIR" ]; then
|
||||
mounts="$mounts -v $(readlink -f $LLAMA_MODELS_DIR):$models_mount"
|
||||
fi
|
||||
set -x
|
||||
podman build -t $image_name -f "$TEMP_DIR/Dockerfile" "$REPO_DIR" $mounts
|
||||
set +x
|
||||
|
||||
printf "${GREEN}Succesfully setup Podman image. Configuring build...${NC}"
|
||||
echo "You can run it with: podman run -p 8000:8000 $image_name"
|
||||
|
||||
$CONDA_PREFIX/bin/python3 -m llama_toolchain.cli.llama api configure "$api_or_stack" --name "$image_name"
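
For reference, an invocation of the updated script might look like the sketch below. The script filename and the local checkout paths are illustrative assumptions; the positional arguments follow the usage string in the diff, and the two environment variables opt into installing llama-toolchain and llama-models from bind-mounted local sources instead of PyPI.

# Hypothetical invocation (script name and paths assumed, not part of this diff).
# Arguments: [api|stack] <image_name> <docker_base> <pip_dependencies>
./build_image.sh agentic_system my-fastapi-app python:3.9-slim 'fastapi uvicorn'

# Optional: build against local checkouts; the script bind-mounts these into the
# podman build and pip-installs from the mounted paths instead of PyPI.
LLAMA_TOOLCHAIN_DIR=~/src/llama-toolchain \
LLAMA_MODELS_DIR=~/src/llama-models \
  ./build_image.sh agentic_system my-fastapi-app python:3.9-slim 'fastapi uvicorn'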
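
The add_to_docker helper introduced here appends to the generated Dockerfile in two modes: called with an argument it writes that single line, while called with a heredoc it copies everything from stdin (the [ -t 0 ] test checks whether stdin is a terminal). A minimal standalone sketch of the same pattern, assuming it is run from an interactive shell:

#!/bin/bash
# Standalone sketch of the add_to_docker pattern used in this diff; run it from an
# interactive shell so stdin is a terminal when the single-argument form is used.
TEMP_DIR=$(mktemp -d)

add_to_docker() {
  output_file="$TEMP_DIR/Dockerfile"
  if [ -t 0 ]; then
    printf '%s\n' "$1" >> "$output_file"   # single-line form
  else
    cat >> "$output_file"                  # heredoc / stdin form
  fi
}

add_to_docker "RUN pip install fastapi"    # appends one line

add_to_docker <<EOF
FROM python:3.9-slim
WORKDIR /app
EOF

cat "$TEMP_DIR/Dockerfile"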
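
Because the ENTRYPOINT is deliberately left commented out for debugging flexibility, the built image does not start the server on its own. A sketch of running it by hand, assuming the image name from the example above and the server module named in the commented-out ENTRYPOINT (the exact flags may differ):

# Port mapping follows the hint printed by the script; the module path and --port
# flag come from the ENTRYPOINT lines shown in this diff.
podman run -it -p 8000:8000 my-fastapi-app \
  python3 -m llama_toolchain.distribution.server --port 8000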