mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-08-15 14:08:00 +00:00
feat(ci): introduce workflow for re-recording inference outputs
This commit is contained in:
parent
369286f95b
commit
ae6d240444
2 changed files with 96 additions and 0 deletions
1
.github/workflows/README.md
vendored
1
.github/workflows/README.md
vendored
|
@ -13,6 +13,7 @@ Llama Stack uses GitHub Actions for Continuous Integration (CI). Below is a tabl
|
||||||
| Pre-commit | [pre-commit.yml](pre-commit.yml) | Run pre-commit checks |
|
| Pre-commit | [pre-commit.yml](pre-commit.yml) | Run pre-commit checks |
|
||||||
| Test Llama Stack Build | [providers-build.yml](providers-build.yml) | Test llama stack build |
|
| Test Llama Stack Build | [providers-build.yml](providers-build.yml) | Test llama stack build |
|
||||||
| Python Package Build Test | [python-build-test.yml](python-build-test.yml) | Test building the llama-stack PyPI project |
|
| Python Package Build Test | [python-build-test.yml](python-build-test.yml) | Test building the llama-stack PyPI project |
|
||||||
|
| Integration Tests (Record) | [record-integration-tests.yml](record-integration-tests.yml) | Run the integration test suite from tests/integration |
|
||||||
| Check semantic PR titles | [semantic-pr.yml](semantic-pr.yml) | Ensure that PR titles follow the conventional commit spec |
|
| Check semantic PR titles | [semantic-pr.yml](semantic-pr.yml) | Ensure that PR titles follow the conventional commit spec |
|
||||||
| Close stale issues and PRs | [stale_bot.yml](stale_bot.yml) | Run the Stale Bot action |
|
| Close stale issues and PRs | [stale_bot.yml](stale_bot.yml) | Run the Stale Bot action |
|
||||||
| Test External Providers Installed via Module | [test-external-provider-module.yml](test-external-provider-module.yml) | Test External Provider installation via Python module |
|
| Test External Providers Installed via Module | [test-external-provider-module.yml](test-external-provider-module.yml) | Test External Provider installation via Python module |
|
||||||
|
|
95
.github/workflows/record-integration-tests.yml
vendored
Normal file
95
.github/workflows/record-integration-tests.yml
vendored
Normal file
|
@ -0,0 +1,95 @@
|
||||||
|
# Workflow header: display name, trigger rules and run de-duplication.
name: Integration Tests (Record)

run-name: Run the integration test suite from tests/integration

on:
  # Pull requests against main; `labeled` is included so that attaching a
  # label to an already-open PR starts a run.
  pull_request:
    branches:
      - main
    types:
      - opened
      - synchronize
      - labeled
    # Only changes under these paths trigger the workflow.
    paths:
      - "llama_stack/**"
      - "tests/**"
      - "uv.lock"
      - "pyproject.toml"
      - ".github/workflows/record-integration-tests.yml"  # This workflow
      - ".github/actions/setup-ollama/action.yml"
      - ".github/actions/setup-test-environment/action.yml"
      - ".github/actions/run-and-record-tests/action.yml"
  # Manual trigger with an optional provider override.
  workflow_dispatch:
    inputs:
      test-provider:
        description: "Test against a specific provider"
        type: string
        default: "ollama"

# One active run per workflow and ref; a newer run cancels the one in progress.
concurrency:
  group: ${{ github.workflow }}-${{ github.ref }}
  cancel-in-progress: true
|
||||||
|
|
||||||
|
jobs:
  # Builds the list of integration test directories and the recording modes
  # (vision / non-vision) requested through PR labels.
  discover-tests:
    # NOTE(review): this guard only matches PR labels, so a manual
    # `workflow_dispatch` run skips both jobs even though a `test-provider`
    # input is declared -- confirm whether manual runs are meant to record.
    if: contains(github.event.pull_request.labels.*.name, 're-record-tests') ||
      contains(github.event.pull_request.labels.*.name, 're-record-vision-tests')
    runs-on: ubuntu-latest
    outputs:
      test-types: ${{ steps.generate-test-types.outputs.test-types }}
      matrix-modes: ${{ steps.generate-test-types.outputs.matrix-modes }}

    steps:
      - name: Checkout repository
        uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2

      - name: Generate test types
        id: generate-test-types
        env:
          # Evaluate the label checks in the expression engine and hand the
          # script plain "true"/"false" strings. The `labels.*.name` filter
          # yields an array, which does not interpolate into a script as a
          # searchable list of names, and inlining event data into shell code
          # is an injection risk.
          RECORD_VISION: ${{ contains(github.event.pull_request.labels.*.name, 're-record-vision-tests') }}
          RECORD_NON_VISION: ${{ contains(github.event.pull_request.labels.*.name, 're-record-tests') }}
        run: |
          # Get test directories dynamically, excluding non-test directories
          TEST_TYPES=$(find tests/integration -maxdepth 1 -mindepth 1 -type d -printf "%f\n" |
            grep -Ev "^(__pycache__|fixtures|test_cases|recordings|post_training)$" |
            sort | jq -R -s -c 'split("\n")[:-1]')
          echo "test-types=$TEST_TYPES" >> "$GITHUB_OUTPUT"

          # One matrix entry per requested recording mode.
          modes_array=()
          if [[ "$RECORD_VISION" == "true" ]]; then
            modes_array+=("vision")
          fi
          if [[ "$RECORD_NON_VISION" == "true" ]]; then
            modes_array+=("non-vision")
          fi
          # --args passes the mode names as plain strings; --jsonargs would try
          # to parse each one as JSON and reject bare words such as `vision`.
          matrix_modes=$(jq -n -c '$ARGS.positional' --args -- "${modes_array[@]}")
          echo "matrix-modes=$matrix_modes" >> "$GITHUB_OUTPUT"

  # Runs the integration tests in record mode, once per requested mode.
  record-tests:
    needs: discover-tests
    runs-on: ubuntu-latest

    # NOTE(review): presumably needed so the recording action can push updated
    # recordings back to the PR branch -- confirm against run-and-record-tests.
    permissions:
      contents: write

    strategy:
      fail-fast: false
      matrix:
        mode: ${{ fromJSON(needs.discover-tests.outputs.matrix-modes) }}

    steps:
      - name: Checkout repository
        uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
        with:
          # Check out the PR head branch with full history.
          ref: ${{ github.event.pull_request.head.ref }}
          fetch-depth: 0

      - name: Setup test environment
        uses: ./.github/actions/setup-test-environment
        with:
          python-version: "3.12" # Use single Python version for recording
          client-version: "latest"
          provider: ${{ inputs.test-provider || 'ollama' }}
          run-vision-tests: ${{ matrix.mode == 'vision' && 'true' || 'false' }}

      - name: Run and record tests
        uses: ./.github/actions/run-and-record-tests
        with:
          test-types: ${{ needs.discover-tests.outputs.test-types }}
          stack-config: 'server:ci-tests' # recording must be done with server since more tests are run
          provider: ${{ inputs.test-provider || 'ollama' }}
          inference-mode: 'record'
          run-vision-tests: ${{ matrix.mode == 'vision' && 'true' || 'false' }}
|
Loading…
Add table
Add a link
Reference in a new issue