Install Harbor and litellm with `uv pip install --system` instead of into a
local .venv, drop the `source .venv/bin/activate` lines, and invoke report.py
with plain `python` rather than `uv run python`.

NOTE(review): this patch was recovered from a copy whose newlines and leading
whitespace had been collapsed. Line structure and hunk counts are verified
against the hunk headers; the YAML indentation is reconstructed from the
conventional workflow layout. Confirm against the target file, or apply with
`git apply --ignore-whitespace`.

diff --git a/.github/workflows/terminal-bench-regression.yml b/.github/workflows/terminal-bench-regression.yml
index 8ed0265..68d6002 100644
--- a/.github/workflows/terminal-bench-regression.yml
+++ b/.github/workflows/terminal-bench-regression.yml
@@ -27,11 +27,8 @@ jobs:
       - name: Setup Python + uv
         uses: astral-sh/setup-uv@v6
 
-      - name: Create venv and install deps
-        run: |
-          uv venv .venv
-          source .venv/bin/activate
-          uv pip install "harbor>=0.1.45" "litellm>=1.0.0"
+      - name: Install Harbor
+        run: uv pip install --system "harbor>=0.1.45" "litellm>=1.0.0"
 
       - name: Configure Modal
         env:
@@ -47,8 +44,6 @@ jobs:
           ANTHROPIC_API_KEY: ${{ secrets.ANTHROPIC_API_KEY }}
           OPENAI_API_KEY: ${{ secrets.OPENAI_API_KEY }}
         run: |
-          source .venv/bin/activate
-
           # Build --task-name flags from regression-tasks.txt
           TASK_FLAGS=""
           while IFS= read -r task; do
@@ -98,7 +93,7 @@ jobs:
           GITHUB_RUN_ID: ${{ github.run_id }}
           GITHUB_SERVER_URL: ${{ github.server_url }}
         run: |
-          uv run python benchmarks/terminal_bench/report.py \
+          python benchmarks/terminal_bench/report.py \
             --results-dir results/ \
             --baseline benchmarks/terminal_bench/baseline.json \
             --repo "${{ github.repository }}"