mirror of
https://github.com/garrytan/gstack.git
synced 2026-05-06 21:46:40 +02:00
feat: add E2E evals for /review pre-existing bug + /ship reverted QA detection
Two new E2E tests:

- review-pre-existing-bug: plants SQL injection in base branch, verifies Step 5.7 classifies it as INFORMATIONAL and recommends /debug
- ship-reverted-qa-commits: creates branch with reverted fix(qa): commits, verifies /ship detects them and recommends /debug

Also fixes qa-debug-prompt-logic to use the correct workingDirectory, and ensures test repo init uses -b main for portability.

All 4 debug-related evals pass: $0.34 total, 94s.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
This commit is contained in:
@@ -92,8 +92,10 @@ export const E2E_TOUCHFILES: Record<string, string[]> = {
|
||||
'gstack-upgrade-happy-path': ['gstack-upgrade/**'],
|
||||
|
||||
// Debug escalation
|
||||
'qa-debug-prompt-logic': ['qa/**', 'debug/**'],
|
||||
'qa-debug-escalation': ['qa/**', 'debug/**', 'browse/src/**'],
|
||||
'qa-debug-prompt-logic': ['qa/**', 'debug/**'],
|
||||
'qa-debug-escalation': ['qa/**', 'debug/**', 'browse/src/**'],
|
||||
'review-pre-existing-bug': ['review/**', 'debug/**'],
|
||||
'ship-reverted-qa-commits': ['ship/**', 'debug/**'],
|
||||
};
|
||||
|
||||
/**
|
||||
|
||||
Reference in New Issue
Block a user