Xi Yan 2024-09-27 13:52:23 -07:00
parent ecd17ce9e9
commit ebb57a0c67
5 changed files with 123 additions and 12 deletions


@@ -78,15 +78,31 @@ class StackConfigure(Subcommand):
             self._configure_llama_distribution(build_config, args.output_dir)
             return
 
-        # if we get here, we need to prompt user to try configure inside docker image
-        self.parser.error(
-            f"""
-            Could not find {build_config_file}. Did you download a docker image?
-            Try running `docker run -it --entrypoint "/bin/bash" <image_name>`
-            `llama stack configure llamastack-build.yaml --output-dir ./`
-            to set a new run configuration file.
-            """,
-        )
+        # if we get here, we need to try to find the docker image
+        cprint(
+            f"Could not find {build_config_file}. Trying docker image name instead...",
+            color="green",
+        )
+
+        docker_image = args.config
+        builds_dir = BUILDS_BASE_DIR / ImageType.docker.value
+        if args.output_dir:
+            builds_dir = Path(args.output_dir)
+        os.makedirs(builds_dir, exist_ok=True)
+
+        script = pkg_resources.resource_filename(
+            "llama_stack", "distribution/configure_container.sh"
+        )
+        script_args = [script, docker_image, str(builds_dir)]
+
+        return_code = run_with_pty(script_args)
+
+        # the configure script regenerates the build config file; bail out if it failed
+        if return_code != 0:
+            self.parser.error(
+                f"Failed to configure container {docker_image} with return code {return_code}. Please run `llama stack build` first."
+            )
+            return
         return
 
     def _configure_llama_distribution(
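With this change, `llama stack configure` falls back to treating its config argument as a docker image name when no build config file exists on disk, and re-runs configuration inside that container. A hypothetical invocation of the new path (image name assumed):

    # no llamastack-build.yaml on disk, so the argument is treated as an image name
    llama stack configure llamastack-my-build --output-dir ./builds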


@@ -102,7 +102,7 @@ add_to_docker <<EOF
 # This would be good in production but for debugging flexibility let's not add it right now
 # We need a more solid production-ready entrypoint.sh anyway
 #
-ENTRYPOINT ["python", "-m", "llama_stack.distribution.server.server", "./llamastack-run.yaml"]
+CMD ["python", "-m", "llama_stack.distribution.server.server", "./llamastack-run.yaml"]
 EOF
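The ENTRYPOINT to CMD switch is what makes the container-side configure flow possible: a command appended to `docker run` replaces CMD entirely, whereas with ENTRYPOINT it would only be passed as extra arguments to the server. A sketch (image name hypothetical):

    # default command: start the server
    docker run -it llamastack-my-build
    # override: run configure instead, which ENTRYPOINT would not have allowed
    docker run -it llamastack-my-build llama stack configure ./llamastack-build.yaml --output-dir /app/builds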


@@ -0,0 +1,34 @@
#!/bin/bash

# Copyright (c) Meta Platforms, Inc. and affiliates.
# All rights reserved.
#
# This source code is licensed under the terms described in the LICENSE file in
# the root directory of this source tree.

DOCKER_BINARY=${DOCKER_BINARY:-docker}
DOCKER_OPTS=${DOCKER_OPTS:-}

set -euo pipefail

error_handler() {
  echo "Error occurred in script at line: ${1}" >&2
  exit 1
}

trap 'error_handler ${LINENO}' ERR

if [ $# -lt 2 ]; then
  echo "Usage: $0 <docker_image> <host_build_dir>"
  exit 1
fi

docker_image="$1"
host_build_dir="$2"
container_build_dir="/app/builds"

set -x
$DOCKER_BINARY run $DOCKER_OPTS -it \
  -v "$host_build_dir:$container_build_dir" \
  $docker_image \
  llama stack configure ./llamastack-build.yaml --output-dir $container_build_dir
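The script mounts the host build directory over /app/builds and runs `llama stack configure` inside the image, so the regenerated run config lands back on the host. A hypothetical direct invocation (image name and build dir assumed; DOCKER_BINARY lets you substitute podman):

    DOCKER_BINARY=podman ./configure_container.sh llamastack-my-build ./builds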


@@ -410,9 +410,8 @@ async def resolve_impls_with_routing(run_config: StackRunConfig) -> Dict[Api, An
     return impls, specs
 
 
-def main(default_yaml: str, port: int = 5000, disable_ipv6: bool = False, config: Optional[str] = None):
-    config_file = config or default_yaml
-    with open(config_file, "r") as fp:
+def main(yaml_config: str, port: int = 5000, disable_ipv6: bool = False):
+    with open(yaml_config, "r") as fp:
         config = StackRunConfig(**yaml.safe_load(fp))
 
     app = FastAPI()
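main() now takes the config path as a required positional instead of falling back to a packaged default, so every caller must name the YAML explicitly. The container scripts in this commit pass it in flag form, e.g.:

    python -m llama_stack.distribution.server.server \
        --yaml_config ./llamastack-run.yaml \
        --port 5000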


@@ -0,0 +1,62 @@
#!/bin/bash

# Copyright (c) Meta Platforms, Inc. and affiliates.
# All rights reserved.
#
# This source code is licensed under the terms described in the LICENSE file in
# the root directory of this source tree.

DOCKER_BINARY=${DOCKER_BINARY:-docker}
DOCKER_OPTS=${DOCKER_OPTS:-}
LLAMA_CHECKPOINT_DIR=${LLAMA_CHECKPOINT_DIR:-}

set -euo pipefail

RED='\033[0;31m'
NC='\033[0m' # No Color

error_handler() {
  echo "Error occurred in script at line: ${1}" >&2
  exit 1
}

trap 'error_handler ${LINENO}' ERR

if [ $# -lt 3 ]; then
  echo "Usage: $0 <build_name> <yaml_config> <port> <other_args...>"
  exit 1
fi

build_name="$1"
docker_image="llamastack-$build_name"
shift

yaml_config="$1"
shift

port="$1"
shift

set -x

if [ -n "$LLAMA_CHECKPOINT_DIR" ]; then
  $DOCKER_BINARY run $DOCKER_OPTS -it \
    -p $port:$port \
    -v "$yaml_config:/app/config.yaml" \
    -v "$LLAMA_CHECKPOINT_DIR:/root/.llama" \
    --gpus=all \
    $docker_image \
    python -m llama_stack.distribution.server.server \
    --yaml_config /app/config.yaml \
    --port $port "$@"
fi

if [ -z "$LLAMA_CHECKPOINT_DIR" ]; then
  $DOCKER_BINARY run $DOCKER_OPTS -it \
    -p $port:$port \
    -v "$yaml_config:/app/config.yaml" \
    $docker_image \
    python -m llama_stack.distribution.server.server \
    --yaml_config /app/config.yaml \
    --port $port "$@"
fi
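The script derives the image name from the build name (llamastack-<build_name>), mounts the run config at /app/config.yaml, and forwards any remaining arguments to the server; setting LLAMA_CHECKPOINT_DIR additionally mounts local checkpoints and turns on --gpus=all. A hypothetical invocation (build name and paths assumed):

    LLAMA_CHECKPOINT_DIR=~/.llama ./start_container.sh my-build ./llamastack-run.yaml 5000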