Initial import from garrytan/gstack@026751e (main snapshot via local relay)

Source: https://github.com/garrytan/gstack/commit/026751e
2026-05-19 21:18:17 +02:00
commit 834c6db075
797 changed files with 267839 additions and 0 deletions
--- a/browse/test/security-adversarial-fixes.test.ts
+++ b/browse/test/security-adversarial-fixes.test.ts
@@ -0,0 +1,113 @@
+/**
+ * Regression tests for the 4 adversarial findings fixed during /ship:
+ *
+ * 1. Canary stream-chunk split bypass — rolling-buffer detection across
+ *    consecutive text_delta / input_json_delta events. Test removed, see below.
+ * 2. Tool-output ensemble rule — single ML classifier >= BLOCK blocks
+ *    directly when the content is tool output (not user input).
+ * 3. escapeHtml quote escaping (unit-level check on the shape we expect).
+ * 4. snapshot command added to PAGE_CONTENT_COMMANDS.
+ *
+ * These tests pin the fixes so future refactors don't silently re-open
+ * the bypasses both adversarial reviewers (Claude + Codex) flagged.
+ */
+import { describe, test, expect } from 'bun:test';
+import * as fs from 'fs';
+import * as path from 'path';
+import { combineVerdict, THRESHOLDS } from '../src/security';
+import { PAGE_CONTENT_COMMANDS } from '../src/commands';
+
+const REPO_ROOT = path.resolve(__dirname, '..', '..'); // two levels up from browse/test/ = repository root
+
+// Finding 1 (canary stream-chunk split detection) is not tested here: the old
+// test exercised detectCanaryLeak inside sidebar-agent.ts, and both the chat-stream
+// pipeline and that function are gone (the Terminal pane uses an interactive PTY;
+// user keystrokes are the trust source, so no chunked LLM stream to canary-scan).
+
+describe('tool-output ensemble rule (single-layer BLOCK)', () => {
+  test('user-input context: single layer at BLOCK degrades to WARN', () => {
+    const { verdict, reason } = combineVerdict([
+      { layer: 'testsavant_content', confidence: 0.95 },
+      { layer: 'transcript_classifier', confidence: 0 }, // second layer reports nothing
+    ]); // no options argument: this is the user-input case named in the title
+    expect(verdict).toBe('warn');
+    expect(reason).toBe('single_layer_high');
+  });
+
+  test('tool-output context: single layer at BLOCK blocks directly', () => {
+    const { verdict, reason } = combineVerdict(
+      [
+        { layer: 'testsavant_content', confidence: 0.95 },
+        { layer: 'transcript_classifier', confidence: 0, meta: { degraded: true } },
+      ],
+      { toolOutput: true }, // content is tool output, not user input
+    );
+    expect(verdict).toBe('block'); // one high-confidence layer is enough here
+    expect(reason).toBe('single_layer_tool_output');
+  });
+
+  test('tool-output context still respects ensemble path when 2 agree', () => {
+    const { verdict, reason } = combineVerdict(
+      [
+        { layer: 'testsavant_content', confidence: 0.80 },
+        { layer: 'transcript_classifier', confidence: 0.75, meta: { verdict: 'block' } },
+      ],
+      { toolOutput: true }, // same tool-output flag as the single-layer case
+    );
+    expect(verdict).toBe('block');
+    expect(reason).toBe('ensemble_agreement'); // reported reason is the ensemble one
+  });
+
+  test('tool-output context: below BLOCK threshold still WARN, not BLOCK', () => {
+    const { verdict } = combineVerdict(
+      [{ layer: 'testsavant_content', confidence: THRESHOLDS.WARN }], // exactly at WARN
+      { toolOutput: true },
+    );
+    expect(verdict).toBe('warn'); // only the verdict is pinned, not the reason
+  });
+});
+
+describe('sidepanel escapeHtml quote escaping', () => {
+  test('escapeHtml helper replaces double + single quotes', () => {
+    // Source-text check: sidepanel.js must still contain both quote replacements.
+    const sidepanelPath = path.join(REPO_ROOT, 'extension', 'sidepanel.js');
+    const sidepanelSource = fs.readFileSync(sidepanelPath, 'utf-8');
+    for (const needle of [".replace(/\"/g, '&quot;')", ".replace(/'/g, '&#39;')"]) {
+      expect(sidepanelSource).toContain(needle);
+    }
+  });
+});
+
+describe('snapshot in PAGE_CONTENT_COMMANDS', () => {
+  test('snapshot is wrapped by untrusted-content envelope', () => {
+    expect(PAGE_CONTENT_COMMANDS.has('snapshot')).toBe(true); // checks membership only, not the wrapping itself
+  });
+});
+
+describe('transcript classifier tool_output parameter', () => {
+  test('checkTranscript accepts optional tool_output', () => {
+    const src = fs.readFileSync(
+      path.join(REPO_ROOT, 'browse', 'src', 'security-classifier.ts'),
+      'utf-8',
+    );
+    // Source-text pin: the optional parameter must stay declared. The bare
+    // 'tool_output' checks that used to follow (one labelled as a Haiku-prompt
+    // check) were implied by this match and could never fail on their own.
+    expect(src).toContain('tool_output?: string');
+  });
+
+  // sidebar-agent passed tool text to the transcript classifier on
+  // tool-result scans. That whole pipeline is gone — Terminal pane has
+  // no LLM stream to scan, and security-classifier.ts is dead code with
+  // no production caller (a separate v1.1+ cleanup TODO).
+});
+
+describe('GSTACK_SECURITY_OFF kill switch', () => {
+  test('loadTestsavant honors env var early', () => {
+    // Text-level pin only: confirms the comparison appears in the file, not when it runs.
+    const classifierPath = path.join(REPO_ROOT, 'browse', 'src', 'security-classifier.ts');
+    const classifierSource = fs.readFileSync(classifierPath, 'utf-8');
+    const killSwitchCheck = "process.env.GSTACK_SECURITY_OFF === '1'";
+    expect(classifierSource).toContain(killSwitchCheck);
+  });
+});