diff --git a/distributions/ssambanova/build.yaml b/distributions/ssambanova/build.yaml
new file mode 120000
index 000000000..32a5bd869
--- /dev/null
+++ b/distributions/ssambanova/build.yaml
@@ -0,0 +1 @@
+../../llama_stack/templates/fireworks/build.yaml
\ No newline at end of file
diff --git a/distributions/ssambanova/compose.yaml b/distributions/ssambanova/compose.yaml
new file mode 100644
index 000000000..34ec14323
--- /dev/null
+++ b/distributions/ssambanova/compose.yaml
@@ -0,0 +1,18 @@
+services:
+  llamastack:
+    image: llamastack/distribution-ssambanova
+    # Host networking shares the host's network stack with the container, so
+    # no `ports` mapping is declared: Compose does not allow published ports
+    # in this mode. NOTE(review): server presumably listens on 5000 — confirm.
+    network_mode: "host"
+    volumes:
+      - ~/.llama:/root/.llama
+      # Mounts the adjacent run.yaml at the path given to --yaml_config below.
+      - ./run.yaml:/root/llamastack-run-ssambanova.yaml
+    entrypoint: bash -c "python -m llama_stack.distribution.server.server --yaml_config /root/llamastack-run-ssambanova.yaml"
+    deploy:
+      restart_policy:
+        condition: on-failure
+        delay: 3s
+        max_attempts: 5
+        window: 60s
diff --git a/distributions/ssambanova/run.yaml b/distributions/ssambanova/run.yaml
new file mode 100644
index 000000000..b2db276f4
--- /dev/null
+++ b/distributions/ssambanova/run.yaml
@@ -0,0 +1,75 @@
+# Run configuration for the ssambanova distribution.
+version: "2"
+image_name: ssambanova
+docker_image: null
+conda_env: ssambanova
+apis:
+  - inference
+  - safety
+  - agents
+  - memory
+  - datasetio
+  - scoring
+  - eval
+  - telemetry
+providers:
+  inference:
+    - provider_id: ssambanova
+      provider_type: remote::ssambanova
+      config:
+        url: https://api.sambanova.ai/v1
+        # NOTE(review): presumably resolved from the SSAMBANOVA_API_KEY env var — confirm.
+        api_key: ${env.SSAMBANOVA_API_KEY}
+  safety:
+    - provider_id: llama-guard
+      provider_type: inline::llama-guard
+      config: {}
+  agents:
+    - provider_id: meta-reference
+      provider_type: inline::meta-reference
+      config:
+        persistence_store:
+          type: sqlite
+          namespace: null
+          # NOTE(review): looks like a "VAR:default" substitution form — confirm with the loader.
+          db_path: ${env.SQLITE_STORE_DIR:~/.llama/distributions/ssambanova}/agents_store.db
+  memory:
+    - provider_id: faiss
+      provider_type: inline::faiss
+      config:
+        kvstore:
+          type: sqlite
+          namespace: null
+          db_path: ${env.SQLITE_STORE_DIR:~/.llama/distributions/ssambanova}/faiss_store.db
+  datasetio:
+    - provider_id: localfs
+      provider_type: inline::localfs
+      config: {}
+  scoring:
+    - provider_id: basic
+      provider_type: inline::basic
+      config: {}
+  eval:
+    - provider_id: meta-reference
+      provider_type: inline::meta-reference
+      config: {}
+  telemetry:
+    - provider_id: meta-reference
+      provider_type: inline::meta-reference
+      config: {}
+metadata_store: null
+models:
+  # NOTE(review): model_id is presumably the stack-facing name and provider_model_id the provider's name — confirm.
+  - metadata: {}
+    model_id: meta-llama/Llama-3.1-8B-Instruct
+    provider_id: null
+    provider_model_id: Meta-Llama-3.1-8B-Instruct
+shields:
+  - params: null
+    shield_id: meta-llama/Llama-Guard-3-8B
+    provider_id: null
+    provider_shield_id: null
+memory_banks: []
+datasets: []
+scoring_fns: []
+eval_tasks: []