diff --git a/.github/workflows/evals.yml b/.github/workflows/evals.yml index 3ca708d5..e9962069 100644 --- a/.github/workflows/evals.yml +++ b/.github/workflows/evals.yml @@ -115,6 +115,10 @@ jobs: OPENAI_API_KEY: ${{ secrets.OPENAI_API_KEY }} GEMINI_API_KEY: ${{ secrets.GEMINI_API_KEY }} EVALS_CONCURRENCY: "40" + # Blank out the CI markers (set to empty string, not truly unset) so Claude CLI behaves like a local environment + # (CI=true changes Claude's routing/tool selection behavior). NOTE(review): GitHub docs say default GITHUB_* variables cannot be overwritten via env, so the GITHUB_ACTIONS override may be ignored - confirm, or unset both in the run command instead. + CI: "" + GITHUB_ACTIONS: "" run: EVALS=1 bun test --retry 2 --concurrent --max-concurrency 40 ${{ matrix.suite.file }} - name: Upload eval results