Run Eval Benchmark Prod #199
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| name: Run Eval Benchmark Prod | |
| env: | |
| EVAL_API_URL: ${{ secrets.EVAL_API_URL }} | |
| EVAL_API_KEY: ${{ secrets.EVAL_API_KEY }} | |
| EVAL_EXPERIMENT_ID: ${{ secrets.EVAL_BENCHMARK_EXPERIMENT_ID }} | |
| on: | |
| workflow_run: | |
| workflows: ["Deploy Images to GHCR"] | |
| types: | |
| - completed | |
| branches: | |
| - main | |
| workflow_dispatch: | |
| jobs: | |
| run-eval-benchmark-prod: | |
| runs-on: ubuntu-latest | |
| if: ${{ github.event.workflow_run.conclusion == 'success' || github.event_name == 'workflow_dispatch' }} | |
| steps: | |
| - name: Checkout repository | |
| uses: actions/checkout@v3 | |
| - name: 'Install dependencies' | |
| run: | | |
| python -m pip install --upgrade pip | |
| pip install requests | |
| # make sure the image is deployed before running the eval benchmark | |
| - name: Wait for 2 minutes | |
| run: sleep 120 | |
| - name: 'Run Eval Benchmark Prod' | |
| run: | | |
| python .github/scripts/eval_run.py --label prod.${{ github.sha }} --api-url ${{ env.EVAL_API_URL }} --api-key ${{ env.EVAL_API_KEY }} --experiment-id ${{ env.EVAL_EXPERIMENT_ID }} |