mirror of
https://github.com/garrytan/gstack.git
synced 2026-05-01 19:25:10 +02:00
dc0bae82d3
* fix: sidebar agent uses extension's activeTabUrl instead of stale Playwright URL When the user navigates manually in headed Chrome, Playwright's page.url() stays on the old page. The sidebar agent was using this stale URL in its system prompt, causing it to navigate to the wrong page (e.g., Hacker News instead of the user's current page). The Chrome extension now captures the active tab URL via chrome.tabs.query() and sends it as activeTabUrl in the /sidebar-command POST body. The server prefers this over Playwright's URL. The URL is sanitized (http/https only, control chars stripped, 2048 char limit) to prevent prompt injection. Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com> * feat: connect-chrome pre-flight cleanup + improved onboarding docs Adds Step 0 pre-flight cleanup that kills stale browse servers and cleans Chromium profile locks before connecting. Improves the onboarding flow with clearer instructions for finding the extension, opening the Side Panel, and troubleshooting connection issues. Fixes Mode check from cdp to headed. Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com> * test: sidebar agent test suite (layers 1-2) Layer 1 (unit): 18 tests for URL sanitization in sidebar-utils.ts — http/https pass, chrome:// rejected, javascript: rejected, control chars stripped, truncation. Layer 2 (integration): 13 tests for server HTTP endpoints — auth, sidebar-command queue writes, activeTabUrl override/fallback, event relay to chat buffer, message queuing, queue overflow (429), chat clear, agent kill. Source changes for testability: - Extract sanitizeExtensionUrl() to browse/src/sidebar-utils.ts - Add BROWSE_HEADLESS_SKIP env var to skip browser launch in HTTP-only tests - Add SIDEBAR_QUEUE_PATH env var to both server.ts and sidebar-agent.ts - Add SIDEBAR_AGENT_TIMEOUT env var to sidebar-agent.ts - Sync package.json version to match VERSION (0.12.2.0) Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com> * test: sidebar agent round-trip tests with mock claude (layer 3) Starts server + sidebar-agent together with a mock claude binary (shell script outputting canned stream-json). Verifies the full queue-based message flow: - Full round-trip: POST /sidebar-command → queue → agent → mock claude → events → chat - Claude crash recovery: mock exits 1, agent_error appears, status returns to idle - Sequential queue drain: two rapid messages both process in order Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com> * test: sidebar agent E2E tests with real Claude (layer 4) Two E2E tests that exercise the full sidebar agent flow with real Claude: - sidebar-navigate: POST /sidebar-command asking Claude to describe a fixture page, verify it responds with page content through the chat buffer - sidebar-url-accuracy: POST with activeTabUrl differing from Playwright URL, verify the queue prompt uses the extension URL (the core bug fix) Both registered as periodic tier (~$0.80 total, non-deterministic). Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com> * fix: sidebar E2E tests — sequential execution + eval collector fix Both tests now pass: - sidebar-url-accuracy: deterministic queue file check (no Claude needed) - sidebar-navigate: real Claude responds through sidebar agent queue Fixed: testIfSelected (sequential, not concurrent) to avoid queue file conflicts. Added cost_usd field for eval collector compatibility. Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com> * fix: kill stale sidebar-agent processes before starting new one Each /connect-chrome starts a new sidebar-agent subprocess with unref() but never kills the previous one. Old agents accumulate as zombies with stale auth tokens. When they pick up queue entries, their event relay fails (401), so the server never receives agent_done and marks the agent as "hung". The user sees the sidebar freeze. Fix: pkill any existing sidebar-agent.ts processes before spawning. Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com> * chore: bump version and changelog (v0.12.6.0) Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com> * docs: add P1 TODO for sidebar Write tool + error visibility Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com> --------- Co-authored-by: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
321 lines
9.8 KiB
TypeScript
321 lines
9.8 KiB
TypeScript
/**
|
|
* Layer 2: Server HTTP integration tests for sidebar endpoints.
|
|
* Starts the browse server as a subprocess (no browser via BROWSE_HEADLESS_SKIP),
|
|
* exercises sidebar HTTP endpoints with fetch(). No Chrome, no Claude, no sidebar-agent.
|
|
*/
|
|
|
|
import { describe, test, expect, beforeAll, afterAll, beforeEach } from 'bun:test';
|
|
import { spawn, type Subprocess } from 'bun';
|
|
import * as fs from 'fs';
|
|
import * as os from 'os';
|
|
import * as path from 'path';
|
|
|
|
let serverProc: Subprocess | null = null;
|
|
let serverPort: number = 0;
|
|
let authToken: string = '';
|
|
let tmpDir: string = '';
|
|
let stateFile: string = '';
|
|
let queueFile: string = '';
|
|
|
|
async function api(pathname: string, opts: RequestInit & { noAuth?: boolean } = {}): Promise<Response> {
|
|
const { noAuth, ...fetchOpts } = opts;
|
|
const headers: Record<string, string> = {
|
|
'Content-Type': 'application/json',
|
|
...(fetchOpts.headers as Record<string, string> || {}),
|
|
};
|
|
if (!noAuth && !headers['Authorization'] && authToken) {
|
|
headers['Authorization'] = `Bearer ${authToken}`;
|
|
}
|
|
return fetch(`http://127.0.0.1:${serverPort}${pathname}`, { ...fetchOpts, headers });
|
|
}
|
|
|
|
beforeAll(async () => {
|
|
tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), 'sidebar-integ-'));
|
|
stateFile = path.join(tmpDir, 'browse.json');
|
|
queueFile = path.join(tmpDir, 'sidebar-queue.jsonl');
|
|
|
|
// Ensure queue dir exists
|
|
fs.mkdirSync(path.dirname(queueFile), { recursive: true });
|
|
|
|
const serverScript = path.resolve(__dirname, '..', 'src', 'server.ts');
|
|
serverProc = spawn(['bun', 'run', serverScript], {
|
|
env: {
|
|
...process.env,
|
|
BROWSE_STATE_FILE: stateFile,
|
|
BROWSE_HEADLESS_SKIP: '1',
|
|
BROWSE_PORT: '0',
|
|
SIDEBAR_QUEUE_PATH: queueFile,
|
|
BROWSE_IDLE_TIMEOUT: '300',
|
|
},
|
|
stdio: ['ignore', 'pipe', 'pipe'],
|
|
});
|
|
|
|
// Wait for state file
|
|
const deadline = Date.now() + 15000;
|
|
while (Date.now() < deadline) {
|
|
if (fs.existsSync(stateFile)) {
|
|
try {
|
|
const state = JSON.parse(fs.readFileSync(stateFile, 'utf-8'));
|
|
if (state.port && state.token) {
|
|
serverPort = state.port;
|
|
authToken = state.token;
|
|
break;
|
|
}
|
|
} catch {}
|
|
}
|
|
await new Promise(r => setTimeout(r, 100));
|
|
}
|
|
if (!serverPort) throw new Error('Server did not start in time');
|
|
}, 20000);
|
|
|
|
afterAll(() => {
|
|
if (serverProc) { try { serverProc.kill(); } catch {} }
|
|
try { fs.rmSync(tmpDir, { recursive: true, force: true }); } catch {}
|
|
});
|
|
|
|
// Reset state between tests — creates a fresh session, clears all queues
|
|
async function resetState() {
|
|
await api('/sidebar-session/new', { method: 'POST' });
|
|
fs.writeFileSync(queueFile, '');
|
|
}
|
|
|
|
describe('sidebar auth', () => {
|
|
test('rejects request without auth token', async () => {
|
|
const resp = await api('/sidebar-command', {
|
|
method: 'POST',
|
|
noAuth: true,
|
|
body: JSON.stringify({ message: 'test' }),
|
|
});
|
|
expect(resp.status).toBe(401);
|
|
});
|
|
|
|
test('rejects request with wrong token', async () => {
|
|
const resp = await api('/sidebar-command', {
|
|
method: 'POST',
|
|
headers: { 'Authorization': 'Bearer wrong-token' },
|
|
body: JSON.stringify({ message: 'test' }),
|
|
});
|
|
expect(resp.status).toBe(401);
|
|
});
|
|
|
|
test('accepts request with correct token', async () => {
|
|
const resp = await api('/sidebar-command', {
|
|
method: 'POST',
|
|
body: JSON.stringify({ message: 'hello' }),
|
|
});
|
|
expect(resp.status).toBe(200);
|
|
// Clean up
|
|
await api('/sidebar-agent/kill', { method: 'POST' });
|
|
});
|
|
});
|
|
|
|
describe('sidebar-command → queue', () => {
|
|
test('writes queue entry with activeTabUrl', async () => {
|
|
await resetState();
|
|
|
|
const resp = await api('/sidebar-command', {
|
|
method: 'POST',
|
|
body: JSON.stringify({
|
|
message: 'what is on this page?',
|
|
activeTabUrl: 'https://example.com/test-page',
|
|
}),
|
|
});
|
|
expect(resp.status).toBe(200);
|
|
const data = await resp.json();
|
|
expect(data.ok).toBe(true);
|
|
|
|
// Give server a moment to write queue
|
|
await new Promise(r => setTimeout(r, 100));
|
|
|
|
const content = fs.readFileSync(queueFile, 'utf-8').trim();
|
|
const lines = content.split('\n').filter(Boolean);
|
|
expect(lines.length).toBeGreaterThan(0);
|
|
const entry = JSON.parse(lines[lines.length - 1]);
|
|
expect(entry.pageUrl).toBe('https://example.com/test-page');
|
|
expect(entry.prompt).toContain('https://example.com/test-page');
|
|
|
|
await api('/sidebar-agent/kill', { method: 'POST' });
|
|
});
|
|
|
|
test('falls back when activeTabUrl is null', async () => {
|
|
await resetState();
|
|
|
|
await api('/sidebar-command', {
|
|
method: 'POST',
|
|
body: JSON.stringify({ message: 'test', activeTabUrl: null }),
|
|
});
|
|
await new Promise(r => setTimeout(r, 100));
|
|
|
|
const lines = fs.readFileSync(queueFile, 'utf-8').trim().split('\n').filter(Boolean);
|
|
expect(lines.length).toBeGreaterThan(0);
|
|
const entry = JSON.parse(lines[lines.length - 1]);
|
|
// No browser → playwright URL is 'about:blank'
|
|
expect(entry.pageUrl).toBe('about:blank');
|
|
|
|
await api('/sidebar-agent/kill', { method: 'POST' });
|
|
});
|
|
|
|
test('rejects chrome:// activeTabUrl and falls back', async () => {
|
|
await resetState();
|
|
|
|
await api('/sidebar-command', {
|
|
method: 'POST',
|
|
body: JSON.stringify({ message: 'test', activeTabUrl: 'chrome://extensions' }),
|
|
});
|
|
await new Promise(r => setTimeout(r, 100));
|
|
|
|
const lines = fs.readFileSync(queueFile, 'utf-8').trim().split('\n').filter(Boolean);
|
|
expect(lines.length).toBeGreaterThan(0);
|
|
const entry = JSON.parse(lines[lines.length - 1]);
|
|
expect(entry.pageUrl).toBe('about:blank');
|
|
|
|
await api('/sidebar-agent/kill', { method: 'POST' });
|
|
});
|
|
|
|
test('rejects empty message', async () => {
|
|
const resp = await api('/sidebar-command', {
|
|
method: 'POST',
|
|
body: JSON.stringify({ message: '' }),
|
|
});
|
|
expect(resp.status).toBe(400);
|
|
});
|
|
});
|
|
|
|
describe('sidebar-agent/event → chat buffer', () => {
|
|
test('agent events appear in /sidebar-chat', async () => {
|
|
await resetState();
|
|
|
|
// Post mock agent events using Claude's streaming format
|
|
await api('/sidebar-agent/event', {
|
|
method: 'POST',
|
|
body: JSON.stringify({
|
|
type: 'assistant',
|
|
message: { content: [{ type: 'text', text: 'Hello from mock agent' }] },
|
|
}),
|
|
});
|
|
|
|
const chatData = await (await api('/sidebar-chat?after=0')).json();
|
|
const textEntry = chatData.entries.find((e: any) => e.type === 'text');
|
|
expect(textEntry).toBeDefined();
|
|
expect(textEntry.text).toBe('Hello from mock agent');
|
|
});
|
|
|
|
test('agent_done transitions status to idle', async () => {
|
|
await resetState();
|
|
// Start a command so agent is processing
|
|
await api('/sidebar-command', {
|
|
method: 'POST',
|
|
body: JSON.stringify({ message: 'test' }),
|
|
});
|
|
|
|
// Verify processing
|
|
let session = await (await api('/sidebar-session')).json();
|
|
expect(session.agent.status).toBe('processing');
|
|
|
|
// Send agent_done
|
|
await api('/sidebar-agent/event', {
|
|
method: 'POST',
|
|
body: JSON.stringify({ type: 'agent_done' }),
|
|
});
|
|
|
|
session = await (await api('/sidebar-session')).json();
|
|
expect(session.agent.status).toBe('idle');
|
|
});
|
|
});
|
|
|
|
describe('message queuing', () => {
|
|
test('queues message when agent is processing', async () => {
|
|
await resetState();
|
|
|
|
// First message starts processing
|
|
await api('/sidebar-command', {
|
|
method: 'POST',
|
|
body: JSON.stringify({ message: 'first' }),
|
|
});
|
|
|
|
// Second message gets queued
|
|
const resp = await api('/sidebar-command', {
|
|
method: 'POST',
|
|
body: JSON.stringify({ message: 'second' }),
|
|
});
|
|
const data = await resp.json();
|
|
expect(data.ok).toBe(true);
|
|
expect(data.queued).toBe(true);
|
|
expect(data.position).toBe(1);
|
|
|
|
await api('/sidebar-agent/kill', { method: 'POST' });
|
|
});
|
|
|
|
test('returns 429 when queue is full', async () => {
|
|
await resetState();
|
|
|
|
// First message starts processing
|
|
await api('/sidebar-command', {
|
|
method: 'POST',
|
|
body: JSON.stringify({ message: 'first' }),
|
|
});
|
|
|
|
// Fill queue (max 5)
|
|
for (let i = 0; i < 5; i++) {
|
|
await api('/sidebar-command', {
|
|
method: 'POST',
|
|
body: JSON.stringify({ message: `fill-${i}` }),
|
|
});
|
|
}
|
|
|
|
// 7th message should be rejected
|
|
const resp = await api('/sidebar-command', {
|
|
method: 'POST',
|
|
body: JSON.stringify({ message: 'overflow' }),
|
|
});
|
|
expect(resp.status).toBe(429);
|
|
|
|
await api('/sidebar-agent/kill', { method: 'POST' });
|
|
});
|
|
});
|
|
|
|
describe('chat clear', () => {
|
|
test('clears chat buffer', async () => {
|
|
await resetState();
|
|
// Add some entries
|
|
await api('/sidebar-agent/event', {
|
|
method: 'POST',
|
|
body: JSON.stringify({ type: 'text', text: 'to be cleared' }),
|
|
});
|
|
|
|
await api('/sidebar-chat/clear', { method: 'POST' });
|
|
|
|
const data = await (await api('/sidebar-chat?after=0')).json();
|
|
expect(data.entries.length).toBe(0);
|
|
expect(data.total).toBe(0);
|
|
});
|
|
});
|
|
|
|
describe('agent kill', () => {
|
|
test('kill adds error entry and returns to idle', async () => {
|
|
await resetState();
|
|
|
|
// Start a command so agent is processing
|
|
await api('/sidebar-command', {
|
|
method: 'POST',
|
|
body: JSON.stringify({ message: 'kill me' }),
|
|
});
|
|
|
|
let session = await (await api('/sidebar-session')).json();
|
|
expect(session.agent.status).toBe('processing');
|
|
|
|
// Kill the agent
|
|
const killResp = await api('/sidebar-agent/kill', { method: 'POST' });
|
|
expect(killResp.status).toBe(200);
|
|
|
|
// Check chat for error entry
|
|
const chatData = await (await api('/sidebar-chat?after=0')).json();
|
|
const errorEntry = chatData.entries.find((e: any) => e.error === 'Killed by user');
|
|
expect(errorEntry).toBeDefined();
|
|
|
|
// Agent should be idle (no queue items to auto-process)
|
|
session = await (await api('/sidebar-session')).json();
|
|
expect(session.agent.status).toBe('idle');
|
|
});
|
|
});
|