-
Notifications
You must be signed in to change notification settings - Fork 901
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
add inital e2e test workflow for evals
- Loading branch information
Showing
1 changed file
with
104 additions
and
0 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,104 @@ | ||
name: promptflow-evals-e2e-test | ||
|
||
on: | ||
schedule: | ||
- cron: "40 10 * * *" # 2:40 PST every day | ||
pull_request: | ||
paths: | ||
- src/promptflow-evals/** | ||
- .github/workflows/promptflow-evals-e2e-test.yml | ||
workflow_dispatch: | ||
|
||
env: | ||
IS_IN_CI_PIPELINE: "true" | ||
WORKING_DIRECTORY: ${{ github.workspace }}/src/promptflow-evals | ||
RECORD_DIRECTORY: ${{ github.workspace }}/src/promptflow-recording | ||
|
||
jobs: | ||
build: | ||
runs-on: ubuntu-latest | ||
steps: | ||
- uses: actions/checkout@v4 | ||
- uses: snok/install-poetry@v1 | ||
- name: build | ||
run: poetry build | ||
working-directory: ${{ env.WORKING_DIRECTORY }} | ||
- uses: actions/upload-artifact@v4 | ||
with: | ||
name: promptflow-evals | ||
path: ${{ env.WORKING_DIRECTORY }}/dist/promptflow_evals-*.whl | ||
|
||
test: | ||
needs: build | ||
strategy: | ||
matrix: | ||
os: [ubuntu-latest, windows-latest, macos-latest] | ||
python-version: ['3.8', '3.9', '3.10', '3.11'] | ||
fail-fast: false | ||
# snok/install-poetry need this to support Windows | ||
defaults: | ||
run: | ||
shell: bash | ||
runs-on: ${{ matrix.os }} | ||
steps: | ||
- uses: actions/checkout@v4 | ||
- name: set test mode | ||
run: echo "PROMPT_FLOW_TEST_MODE=$(if [[ "${{ github.event_name }}" == "pull_request" ]]; then echo replay; else echo live; fi)" >> $GITHUB_ENV | ||
- uses: actions/setup-python@v5 | ||
with: | ||
python-version: ${{ matrix.python-version }} | ||
- uses: snok/install-poetry@v1 | ||
- uses: actions/download-artifact@v4 | ||
with: | ||
name: promptflow-evals | ||
path: ${{ env.WORKING_DIRECTORY }} | ||
- name: install promptflow-evals from wheel | ||
# wildcard expansion (*) does not work in Windows, so leverage python to find and install | ||
run: poetry run pip install $(python -c "import glob; print(glob.glob('promptflow_evals-*.whl')[0])") | ||
working-directory: ${{ env.WORKING_DIRECTORY }} | ||
- name: install test dependency group | ||
run: poetry install --only test | ||
working-directory: ${{ env.WORKING_DIRECTORY }} | ||
- name: install recording | ||
run: poetry install | ||
working-directory: ${{ env.RECORD_DIRECTORY }} | ||
- name: generate end-to-end test config from secret | ||
run: echo '${{ secrets.PF_TRACING_E2E_TEST_CONFIG }}' >> connections.json | ||
working-directory: ${{ env.WORKING_DIRECTORY }} | ||
- name: run e2e tests | ||
run: poetry run pytest -m e2etest --cov=promptflow --cov-config=pyproject.toml --cov-report=term --cov-report=html --cov-report=xml | ||
working-directory: ${{ env.WORKING_DIRECTORY }} | ||
- name: upload coverage report | ||
uses: actions/upload-artifact@v4 | ||
with: | ||
name: report-${{ matrix.os }}-py${{ matrix.python-version }} | ||
path: | | ||
${{ env.WORKING_DIRECTORY }}/*.xml | ||
${{ env.WORKING_DIRECTORY }}/htmlcov/ | ||
report: | ||
needs: test | ||
runs-on: ubuntu-latest | ||
permissions: | ||
checks: write | ||
pull-requests: write | ||
contents: read | ||
issues: read | ||
steps: | ||
- uses: actions/download-artifact@v4 | ||
with: | ||
path: artifacts | ||
- uses: EnricoMi/publish-unit-test-result-action@v2 | ||
with: | ||
check_name: promptflow-evals test result | ||
comment_title: promptflow-evals test result | ||
files: "artifacts/**/test-results.xml" # align with `--junit-xml` in pyproject.toml | ||
- uses: irongut/CodeCoverageSummary@v1.3.0 | ||
with: | ||
filename: "artifacts/report-ubuntu-latest-py3.9/coverage.xml" | ||
badge: true | ||
fail_below_min: true | ||
format: markdown | ||
hide_complexity: true | ||
output: both | ||
thresholds: 40 80 |