From 8cf23ba61ad1ceee4d293e2b729e5b381314929c Mon Sep 17 00:00:00 2001 From: Garry Tan Date: Mon, 23 Mar 2026 07:50:03 -0700 Subject: [PATCH] =?UTF-8?q?revert:=20remove=20CI=20env=20unset=20=E2=80=94?= =?UTF-8?q?=20didn't=20fix=20routing?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Unsetting CI/GITHUB_ACTIONS didn't improve routing test results (still 1/11 in container). The issue is model behavior in containerized environments, not env vars. Routing tests will be tracked as a known CI gap. Co-Authored-By: Claude Opus 4.6 (1M context) --- .github/workflows/evals.yml | 4 ---- 1 file changed, 4 deletions(-) diff --git a/.github/workflows/evals.yml b/.github/workflows/evals.yml index e9962069..3ca708d5 100644 --- a/.github/workflows/evals.yml +++ b/.github/workflows/evals.yml @@ -115,10 +115,6 @@ jobs: OPENAI_API_KEY: ${{ secrets.OPENAI_API_KEY }} GEMINI_API_KEY: ${{ secrets.GEMINI_API_KEY }} EVALS_CONCURRENCY: "40" - # Unset CI markers so Claude CLI behaves like a local environment - # (CI=true changes Claude's routing/tool selection behavior) - CI: "" - GITHUB_ACTIONS: "" run: EVALS=1 bun test --retry 2 --concurrent --max-concurrency 40 ${{ matrix.suite.file }} - name: Upload eval results