feat: use chunk data in NIAH and QA evals #1490
Workflow file for this run
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# End-to-end testing that deploys Supabase and the API, then deploys and tests whisper
name: e2e-whisper

on:
  pull_request:
    types:
      - opened  # default trigger
      - reopened  # default trigger
      - synchronize  # default trigger
      - ready_for_review  # fires when a draft PR is marked ready; drafts are skipped by the job-level `if`
      - milestoned  # allows us to trigger on bot PRs
    paths:
      # Order matters: a later pattern overrides an earlier one for the same path.
      # Catch-all
      - "**"

      # Ignore updates to the .github directory, except this workflow file and
      # the local composite actions that its job runs
      - "!.github/**"
      - ".github/workflows/e2e-whisper.yaml"
      - ".github/actions/lfai-core/**"
      - ".github/actions/python/**"
      - ".github/actions/uds-cluster/action.yaml"

      # Ignore docs and website things
      - "!**.md"
      - "!docs/**"
      - "!adr/**"
      - "!website/**"
      - "!netlify.toml"

      # Ignore updates to generic github metadata files
      - "!CODEOWNERS"
      - "!.gitignore"
      - "!LICENSE"

      # Ignore local development files
      - "!.pre-commit-config.yaml"
      - "!tasks.yaml"

      # Ignore non e2e tests changes
      - "!tests/pytest/**"

      # Ignore LFAI-UI source code changes
      - "!src/leapfrogai_ui/**"

      # Ignore changes to unrelated packages
      - "!packages/k3d-gpu/**"
      - "!packages/llama-cpp-python/**"
      - "!packages/repeater/**"
      - "!packages/text-embeddings/**"
      - "!packages/ui/**"
      - "!packages/vllm/**"
# Runs are grouped per git ref; a newly started run cancels any run from the
# same group that is still in progress.
concurrency:
  cancel-in-progress: true
  group: "e2e-whisper-${{ github.ref }}"
jobs:
  e2e_whisper:
    # Skip the whole job while the pull request is still a draft.
    if: ${{ !github.event.pull_request.draft }}
    runs-on: ai-ubuntu-big-boy-8-core

    permissions:
      contents: read
      packages: read
      id-token: write  # This is needed for OIDC federation.

    steps:
      - name: Checkout Repo
        uses: actions/checkout@b4ffde65f46336ab88eb53be808477a3936bae11  # v4.1.1

      # Local composite action; installs the `dev-whisper` optional dependency set.
      - name: Setup Python
        uses: ./.github/actions/python
        with:
          additionalOptionalDep: dev-whisper

      # Local composite action; receives registry, GitHub and Chainguard credentials from secrets.
      - name: Setup UDS Cluster
        uses: ./.github/actions/uds-cluster
        with:
          registry1Username: ${{ secrets.IRON_BANK_ROBOT_USERNAME }}
          registry1Password: ${{ secrets.IRON_BANK_ROBOT_PASSWORD }}
          ghToken: ${{ secrets.GITHUB_TOKEN }}
          chainguardIdentity: ${{ secrets.CHAINGUARD_IDENTITY }}

      - name: Setup LFAI-API and Supabase
        uses: ./.github/actions/lfai-core

      # ---------------------------------------------------------------
      # whisper: build the package, deploy it, then run its e2e test
      # ---------------------------------------------------------------

      # Build the e2e-test package, prune unused docker images, deploy the
      # package archive, then delete the archive.
      # NOTE(review): the prune and rm presumably free runner disk space - confirm.
      - name: Deploy whisper
        run: |
          make build-whisper LOCAL_VERSION=e2e-test
          docker image prune -af
          uds zarf package deploy packages/whisper/zarf-package-whisper-amd64-e2e-test.tar.zst -l=trace --confirm
          rm packages/whisper/zarf-package-whisper-amd64-e2e-test.tar.zst

      - name: Test whisper
        run: |
          python -m pytest ./tests/e2e/test_whisper.py -v