optave · carlos-alm · May 17, 2026 · May 15, 2026 · May 15, 2026 · May 15, 2026
diff --git a/scripts/benchmark.ts b/scripts/benchmark.ts
@@ -15,7 +15,7 @@ import path from 'node:path';
 import { performance } from 'node:perf_hooks';
 import { fileURLToPath } from 'node:url';
 import Database from 'better-sqlite3';
-import { resolveBenchmarkSource, srcImport } from './lib/bench-config.js';
+import { BENCHMARK_EXCLUDES, resolveBenchmarkSource, srcImport } from './lib/bench-config.js';
 import { isWorker, workerEngine, workerTargets, forkEngines } from './lib/fork-engine.js';
 
 // ── Parent process: fork one child per engine, assemble final output ─────
@@ -130,7 +130,7 @@ console.log = (...args) => console.error(...args);
 if (fs.existsSync(dbPath)) fs.unlinkSync(dbPath);
 
 const buildStart = performance.now();
-const buildResult = await buildGraph(root, { engine, incremental: false });
+const buildResult = await buildGraph(root, { engine, incremental: false, exclude: [...BENCHMARK_EXCLUDES] });
 const buildTimeMs = performance.now() - buildStart;
 
 const queryStart = performance.now();
@@ -150,7 +150,7 @@ try {
 	const noopTimings = [];
 	for (let i = 0; i < INCREMENTAL_RUNS; i++) {
 		const start = performance.now();
-		await buildGraph(root, { engine, incremental: true });
+		await buildGraph(root, { engine, incremental: true, exclude: [...BENCHMARK_EXCLUDES] });
 		noopTimings.push(performance.now() - start);
 	}
 	noopRebuildMs = Math.round(median(noopTimings));
@@ -167,7 +167,7 @@ try {
 	for (let i = 0; i < INCREMENTAL_RUNS; i++) {
 		fs.writeFileSync(PROBE_FILE, original + `\n// probe-${i}\n`);
 		const start = performance.now();
-		const res = await buildGraph(root, { engine, incremental: true });
+		const res = await buildGraph(root, { engine, incremental: true, exclude: [...BENCHMARK_EXCLUDES] });
 		oneFileRuns.push({ ms: performance.now() - start, phases: res?.phases || null });
 	}
 	oneFileRuns.sort((a, b) => a.ms - b.ms);
@@ -179,7 +179,7 @@ try {
 } finally {
 	fs.writeFileSync(PROBE_FILE, original);
 	try {
-		await buildGraph(root, { engine, incremental: true });
+		await buildGraph(root, { engine, incremental: true, exclude: [...BENCHMARK_EXCLUDES] });
 	} catch {
 		// Cleanup rebuild failed — probe file is already restored, move on
 	}

diff --git a/scripts/incremental-benchmark.ts b/scripts/incremental-benchmark.ts
@@ -14,7 +14,7 @@ import fs from 'node:fs';
 import path from 'node:path';
 import { performance } from 'node:perf_hooks';
 import { fileURLToPath } from 'node:url';
-import { resolveBenchmarkSource, srcImport } from './lib/bench-config.js';
+import { BENCHMARK_EXCLUDES, resolveBenchmarkSource, srcImport } from './lib/bench-config.js';
 import { isWorker, workerEngine, forkEngines } from './lib/fork-engine.js';
 
 // ── Parent process: fork one child per engine, assemble final output ─────
@@ -194,7 +194,7 @@ const fullTimings = [];
 for (let i = 0; i < RUNS; i++) {
 	if (fs.existsSync(dbPath)) fs.unlinkSync(dbPath);
 	const start = performance.now();
-	await buildGraph(root, { engine, incremental: false });
+	await buildGraph(root, { engine, incremental: false, exclude: [...BENCHMARK_EXCLUDES] });
 	fullTimings.push(performance.now() - start);
 }
 const fullBuildMs = Math.round(median(fullTimings));
@@ -203,12 +203,12 @@ const fullBuildMs = Math.round(median(fullTimings));
 let noopRebuildMs = null;
 try {
 	for (let i = 0; i < WARMUP_RUNS; i++) {
-		await buildGraph(root, { engine, incremental: true });
+		await buildGraph(root, { engine, incremental: true, exclude: [...BENCHMARK_EXCLUDES] });
 	}
 	const noopTimings = [];
 	for (let i = 0; i < RUNS; i++) {
 		const start = performance.now();
-		await buildGraph(root, { engine, incremental: true });
+		await buildGraph(root, { engine, incremental: true, exclude: [...BENCHMARK_EXCLUDES] });
 		noopTimings.push(performance.now() - start);
 	}
 	noopRebuildMs = Math.round(median(noopTimings));
@@ -223,13 +223,13 @@ let oneFilePhases = null;
 try {
 	for (let i = 0; i < WARMUP_RUNS; i++) {
 		fs.writeFileSync(PROBE_FILE, original + `\n// warmup-${i}\n`);
-		await buildGraph(root, { engine, incremental: true });
+		await buildGraph(root, { engine, incremental: true, exclude: [...BENCHMARK_EXCLUDES] });
 	}
 	const oneFileRuns = [];
 	for (let i = 0; i < RUNS; i++) {
 		fs.writeFileSync(PROBE_FILE, original + `\n// probe-${i}\n`);
 		const start = performance.now();
-		const res = await buildGraph(root, { engine, incremental: true });
+		const res = await buildGraph(root, { engine, incremental: true, exclude: [...BENCHMARK_EXCLUDES] });
 		oneFileRuns.push({ ms: performance.now() - start, phases: res?.phases || null });
 	}
 	oneFileRuns.sort((a, b) => a.ms - b.ms);
@@ -241,7 +241,7 @@ try {
 } finally {
 	fs.writeFileSync(PROBE_FILE, original);
 	try {
-		await buildGraph(root, { engine, incremental: true });
+		await buildGraph(root, { engine, incremental: true, exclude: [...BENCHMARK_EXCLUDES] });
 	} catch {
 		// Cleanup rebuild failed — probe file is already restored, move on
 	}

diff --git a/scripts/lib/bench-config.ts b/scripts/lib/bench-config.ts
@@ -15,6 +15,21 @@ import { pathToFileURL } from 'node:url';
 
 import { getBenchmarkVersion } from '../bench-version.js';
 
+/**
+ * Globs excluded from every benchmark's `buildGraph(root, ...)` invocation.
+ *
+ * Resolution-benchmark fixtures (`tests/benchmarks/resolution/fixtures/**`)
+ * are hand-annotated scaffolding for the static-resolution test suite, not
+ * representative source code. They inflate dogfooding timing measurements
+ * disproportionately whenever a new-language PR lands a heavyweight grammar
+ * (e.g. tree-sitter-verilog added ~850ms to native fullBuildMs in #1107).
+ * Excluding them here keeps build/query/incremental benchmarks measuring
+ * codegraph's own source rather than its test fixtures.
+ */
+export const BENCHMARK_EXCLUDES: readonly string[] = [
+	'tests/benchmarks/resolution/fixtures/**',
+];
+
 // On Windows, `npm` is `npm.cmd` and Node refuses to spawn `.cmd`/`.bat`
 // without `shell: true` (since Node 18.20 / 20.15). When `shell: true`, the
 // Windows `cmd.exe` shell resolves bare `npm` to `npm.cmd` automatically, so

diff --git a/scripts/query-benchmark.ts b/scripts/query-benchmark.ts
@@ -16,7 +16,7 @@ import path from 'node:path';
 import { performance } from 'node:perf_hooks';
 import { fileURLToPath } from 'node:url';
 import Database from 'better-sqlite3';
-import { resolveBenchmarkSource, srcImport } from './lib/bench-config.js';
+import { BENCHMARK_EXCLUDES, resolveBenchmarkSource, srcImport } from './lib/bench-config.js';
 import { isWorker, workerEngine, workerTargets, forkEngines } from './lib/fork-engine.js';
 
 // ── Parent process: fork one child per engine, assemble final output ─────
@@ -254,7 +254,7 @@ function benchDiffImpact(hubName) {
 
 // Build graph for this engine
 if (fs.existsSync(dbPath)) fs.unlinkSync(dbPath);
-await buildGraph(root, { engine, incremental: false });
+await buildGraph(root, { engine, incremental: false, exclude: [...BENCHMARK_EXCLUDES] });
 
 const targets = workerTargets() || selectTargets();
 console.error(`Targets: hub=${targets.hub}, mid=${targets.mid}, leaf=${targets.leaf}`);

diff --git a/src/domain/graph/builder/pipeline.ts b/src/domain/graph/builder/pipeline.ts
@@ -183,6 +183,13 @@ function setupPipeline(ctx: PipelineContext): void {
   initSchema(ctx.db);
 
   ctx.config = loadConfig(ctx.rootDir);
+  // Merge caller-supplied excludes on top of the file-config excludes so
+  // programmatic callers (e.g. benchmark scripts) can extend exclusion
+  // without mutating .codegraphrc.json. Native orchestrator picks this up
+  // automatically — it reads exclude off the serialized ctx.config below.
+  if (ctx.opts.exclude?.length) {
+    ctx.config.exclude = [...(ctx.config.exclude ?? []), ...ctx.opts.exclude];
+  }
   ctx.incremental =
     ctx.opts.incremental !== false && ctx.config.build && ctx.config.build.incremental !== false;
 

diff --git a/src/types.ts b/src/types.ts
@@ -1063,6 +1063,13 @@ export interface BuildGraphOpts {
   complexity?: boolean;
   cfg?: boolean;
   scope?: string[];
+  /**
+   * Glob patterns merged on top of `config.exclude` for this build only.
+   * Lets callers extend exclusion programmatically without writing a config
+   * file — used by the benchmark scripts to skip resolution-benchmark
+   * fixtures that aren't representative of real code.
+   */
+  exclude?: string[];
   skipRegistry?: boolean;
 }
 

diff --git a/tests/benchmarks/regression-guard.test.ts b/tests/benchmarks/regression-guard.test.ts
@@ -176,18 +176,6 @@
  *   absolute delta 10.4ms exactly at the MIN_ABSOLUTE_DELTA floor. Exempt
  *   this release; remove once 3.11.0+ data confirms stabilization.
  *
- * - 3.10.0:Full build — adding native Verilog support (#1107) pulled the
- *   4 `.v` resolution-benchmark fixtures into the corpus the incremental
- *   benchmark sweeps (it runs against the repo root). tree-sitter-verilog
- *   is a large grammar (SystemVerilog is one of the heaviest in the
- *   tree-sitter ecosystem) so each file costs noticeably more than the
- *   other fixture languages. Local measurement: 1959 → 2809 (+43%, run
- *   25716010487). The cost is real and structural — not a regression in
- *   shared code paths. Resolution: either exclude `tests/benchmarks/
- *   resolution/fixtures/verilog/**` from the benchmark sweep or accept the
- *   one-time bump as the cost of supporting Verilog. Tracked separately;
- *   exempt this release.
- *
  * - 3.10.0:Query time — cumulative effect of adding two native extractors
  *   (Solidity #1100 + R #1102) in quick succession. Neither tripped the
  *   threshold individually (Solidity PR's Query time stayed at 49ms, R PR
@@ -230,7 +218,6 @@
   '3.10.0:fnDeps depth 1',
   '3.10.0:fnDeps depth 3',
   '3.10.0:fnDeps depth 5',
-  '3.10.0:Full build',
   '3.10.0:Query time',
 ]);
 
@@ -447,7 +434,7 @@
          `  ${r.label}: ${r.previous} → ${r.current} (+${Math.round(r.pctChange * 100)}%, threshold ${Math.round(thresholdFor(r.label) * 100)}%)`,
      )
      .join('\n');
    expect.fail(`Benchmark regressions exceed threshold:\n${details}`);
  }
 }


diff --git a/tests/integration/config-include-exclude.test.ts b/tests/integration/config-include-exclude.test.ts
@@ -178,4 +178,37 @@ describe('config.include / config.exclude (issue #981)', () => {
     // Paths are already relative to each run's own tmpDir so they compare directly.
     expect(nativeFiles).toEqual(wasmFiles);
   });
+
+  // ── opts.exclude (programmatic, no on-disk config) ───────────────
+
+  async function buildWithOptsExclude(
+    root: string,
+    engine: EngineName,
+    optsExclude: string[],
+  ): Promise<string[]> {
+    clearConfigCache();
+    const dbDir = path.join(root, '.codegraph');
+    if (fs.existsSync(dbDir)) fs.rmSync(dbDir, { recursive: true, force: true });
+    await buildGraph(root, { engine, exclude: optsExclude, skipRegistry: true });
+    const files = readFileRows(path.join(dbDir, 'graph.db'));
+    return files.map((f) => f.replace(/\\/g, '/')).sort();
+  }
+
+  it('wasm: opts.exclude rejects matching files without writing config', async () => {
+    const root = fs.mkdtempSync(path.join(tmpDir, 'opts-wasm-'));
+    writeFixture(root);
+    const files = await buildWithOptsExclude(root, 'wasm', ['**/*.test.js', '**/*.spec.js']);
+    expect(files).toContain('src/math.js');
+    expect(files).not.toContain('src/math.test.js');
+    expect(files).not.toContain('src/util.spec.js');
+  });
+
+  itNative('native: opts.exclude rejects matching files without writing config', async () => {
+    const root = fs.mkdtempSync(path.join(tmpDir, 'opts-native-'));
+    writeFixture(root);
+    const files = await buildWithOptsExclude(root, 'native', ['**/*.test.js', '**/*.spec.js']);
+    expect(files).toContain('src/math.js');
+    expect(files).not.toContain('src/math.test.js');
+    expect(files).not.toContain('src/util.spec.js');
+  });
 });