hai 1 mes · 93e53e7c69
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -7,6 +7,28 @@ a [GitHub Release](https://github.com/colbymchenry/codegraph/releases) tagged
 
															 This project follows [Keep a Changelog](https://keepachangelog.com/en/1.1.0/)
														
 
															 and adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
														
 
															+## [Unreleased]
														
 
															+
														
 
															+### Changed
														
 
															+- **MCP / explore**: `codegraph_explore` output is now adaptive to project
														
 
															+  size. The tool used to apply a fixed 35KB cap regardless of how large the
														
 
															+  codebase was, which on small projects (~100 files) produced bigger
														
 
															+  responses than the agent's native grep+Read flow would have — exactly the
														
 
															+  scenario reported in
														
 
															+  [#185](https://github.com/colbymchenry/codegraph/issues/185). The budget
														
 
															+  now scales with indexed file count: small projects (<500 files) cap at
														
 
															+  ~18KB and skip the "Additional relevant files" / completeness / explore-
														
 
															+  budget reminders that earn their keep on bigger codebases; medium
														
 
															+  (<5,000) caps at ~28KB; large (<15,000) keeps the historical ~35KB; very
														
 
															+  large goes up to ~38KB. A new per-file char cap also prevents a single
														
 
															+  file with many adjacent symbols from collapsing into one whole-file dump
														
 
															+  (the Alamofire `Session.swift` case from #185). Measured against the
														
 
															+  same repos used in the README benchmark: Alamofire ~62% smaller per call,
														
 
															+  Excalidraw ~35%, VS Code ~14%. Agent-trust floor still holds — the
														
 
															+  Relationships section, scored cluster selection, and structured-source
														
 
															+  output are all retained. Thanks to
														
 
															+  [@essopsp](https://github.com/essopsp) for the repro.
														
 
															+
														
 
															 ## [0.7.10] - 2026-05-19
														
 
															 ### Fixed
														
--- a/__tests__/explore-output-budget.test.ts
+++ b/__tests__/explore-output-budget.test.ts
@@ -0,0 +1,191 @@
 
															+/**
														
 
															+ * Adaptive output budget for codegraph_explore (#185).
														
 
															+ *
														
 
															+ * The explore tool used to apply a fixed 35KB output cap regardless of
														
 
															+ * project size, which on small codebases was a net loss vs. native
														
 
															+ * grep+Read. These tests pin the per-tier budget shape so future tuning
														
 
															+ * doesn't silently drift the small-project case back into bloat.
														
 
															+ */
														
 
															+import { describe, it, expect, beforeAll, afterAll } from 'vitest';
														
 
															+import * as fs from 'fs';
														
 
															+import * as path from 'path';
														
 
															+import * as os from 'os';
														
 
															+import { getExploreOutputBudget, getExploreBudget, ToolHandler } from '../src/mcp/tools';
														
 
															+import CodeGraph from '../src/index';
														
 
															+
														
 
															+describe('getExploreOutputBudget', () => {
														
 
															+  it('returns a strictly smaller total cap for small projects than for huge ones', () => {
														
 
															+    const small = getExploreOutputBudget(100);
														
 
															+    const huge = getExploreOutputBudget(30000);
														
 
															+    expect(small.maxOutputChars).toBeLessThan(huge.maxOutputChars);
														
 
															+    expect(small.defaultMaxFiles).toBeLessThan(huge.defaultMaxFiles);
														
 
															+    expect(small.maxCharsPerFile).toBeLessThan(huge.maxCharsPerFile);
														
 
															+  });
														
 
															+
														
 
															+  it('caps total output well under 8000 tokens (~32k chars) on small projects', () => {
														
 
															+    const small = getExploreOutputBudget(100);
														
 
															+    expect(small.maxOutputChars).toBeLessThanOrEqual(20000);
														
 
															+  });
														
 
															+
														
 
															+  it('keeps the historical 35k+ ceiling for medium-large projects so existing benchmarks do not regress', () => {
														
 
															+    const large = getExploreOutputBudget(10000);
														
 
															+    expect(large.maxOutputChars).toBeGreaterThanOrEqual(35000);
														
 
															+  });
														
 
															+
														
 
															+  it('uses tier breakpoints matching getExploreBudget so call-count and output-budget agree on a project', () => {
														
 
															+    // Anything in the same tier should pick the same total-output cap.
														
 
															+    const tier1a = getExploreOutputBudget(50);
														
 
															+    const tier1b = getExploreOutputBudget(499);
														
 
															+    expect(tier1a.maxOutputChars).toBe(tier1b.maxOutputChars);
														
 
															+    expect(getExploreBudget(50)).toBe(getExploreBudget(499));
														
 
															+
														
 
															+    const tier2a = getExploreOutputBudget(500);
														
 
															+    const tier2b = getExploreOutputBudget(4999);
														
 
															+    expect(tier2a.maxOutputChars).toBe(tier2b.maxOutputChars);
														
 
															+    expect(getExploreBudget(500)).toBe(getExploreBudget(4999));
														
 
															+
														
 
															+    const tier3a = getExploreOutputBudget(5000);
														
 
															+    const tier3b = getExploreOutputBudget(14999);
														
 
															+    expect(tier3a.maxOutputChars).toBe(tier3b.maxOutputChars);
														
 
															+
														
 
															+    // And crossing a breakpoint changes the cap.
														
 
															+    expect(tier1a.maxOutputChars).not.toBe(tier2a.maxOutputChars);
														
 
															+    expect(tier2a.maxOutputChars).not.toBe(tier3a.maxOutputChars);
														
 
															+  });
														
 
															+
														
 
															+  it('gates off "Additional relevant files", completeness signal, and budget note on small projects', () => {
														
 
															+    const small = getExploreOutputBudget(100);
														
 
															+    expect(small.includeAdditionalFiles).toBe(false);
														
 
															+    expect(small.includeCompletenessSignal).toBe(false);
														
 
															+    expect(small.includeBudgetNote).toBe(false);
														
 
															+  });
														
 
															+
														
 
															+  it('keeps all meta-text on for projects that earn the breadth signal (>=500 files)', () => {
														
 
															+    const medium = getExploreOutputBudget(1000);
														
 
															+    expect(medium.includeAdditionalFiles).toBe(true);
														
 
															+    expect(medium.includeCompletenessSignal).toBe(true);
														
 
															+    expect(medium.includeBudgetNote).toBe(true);
														
 
															+  });
														
 
															+
														
 
															+  it('keeps the Relationships section on for every tier — it is the cheapest structural signal', () => {
														
 
															+    expect(getExploreOutputBudget(50).includeRelationships).toBe(true);
														
 
															+    expect(getExploreOutputBudget(1000).includeRelationships).toBe(true);
														
 
															+    expect(getExploreOutputBudget(10000).includeRelationships).toBe(true);
														
 
															+    expect(getExploreOutputBudget(30000).includeRelationships).toBe(true);
														
 
															+  });
														
 
															+
														
 
															+  it('caps the per-file header symbol list more tightly on small projects', () => {
														
 
															+    // Without this cap, a file like Alamofire's Session.swift produced
														
 
															+    // a 3.4KB symbol list in the `#### path — sym, sym, ...` header,
														
 
															+    // dwarfing the per-file body cap.
														
 
															+    const small = getExploreOutputBudget(100);
														
 
															+    const huge = getExploreOutputBudget(30000);
														
 
															+    expect(small.maxSymbolsInFileHeader).toBeLessThan(huge.maxSymbolsInFileHeader);
														
 
															+    expect(small.maxSymbolsInFileHeader).toBeGreaterThan(0);
														
 
															+  });
														
 
															+
														
 
															+  it('uses a tighter clustering gap threshold on small projects to break runaway single clusters', () => {
														
 
															+    const small = getExploreOutputBudget(100);
														
 
															+    const huge = getExploreOutputBudget(30000);
														
 
															+    expect(small.gapThreshold).toBeLessThanOrEqual(huge.gapThreshold);
														
 
															+  });
														
 
															+
														
 
															+  it('handles the boundary file counts exactly (off-by-one regression guard)', () => {
														
 
															+    // 499 -> small tier, 500 -> medium tier
														
 
															+    expect(getExploreOutputBudget(499).maxOutputChars).toBe(getExploreOutputBudget(100).maxOutputChars);
														
 
															+    expect(getExploreOutputBudget(500).maxOutputChars).toBe(getExploreOutputBudget(1000).maxOutputChars);
														
 
															+    // 4999 -> medium, 5000 -> large
														
 
															+    expect(getExploreOutputBudget(4999).maxOutputChars).toBe(getExploreOutputBudget(1000).maxOutputChars);
														
 
															+    expect(getExploreOutputBudget(5000).maxOutputChars).toBe(getExploreOutputBudget(10000).maxOutputChars);
														
 
															+    // 14999 -> large, 15000 -> xlarge
														
 
															+    expect(getExploreOutputBudget(14999).maxOutputChars).toBe(getExploreOutputBudget(10000).maxOutputChars);
														
 
															+    expect(getExploreOutputBudget(15000).maxOutputChars).toBe(getExploreOutputBudget(30000).maxOutputChars);
														
 
															+  });
														
 
															+});
														
 
															+
														
 
															+/**
														
 
															+ * End-to-end check that the budget is actually applied by handleExplore.
														
 
															+ *
														
 
															+ * Builds a tiny synthetic project (<500 files, so the small tier), indexes
														
 
															+ * it, and confirms the output:
														
 
															+ *   - stays under the small-tier maxOutputChars cap
														
 
															+ *   - omits the meta-text the small tier gates off (completeness signal,
														
 
															+ *     budget note, "Additional relevant files")
														
 
															+ *
														
 
															+ * Regression guard for #185 — protects against future edits to handleExplore
														
 
															+ * silently re-introducing the fixed 35KB cap on small projects.
														
 
															+ */
														
 
															+describe('codegraph_explore output respects the adaptive budget', () => {
														
 
															+  let testDir: string;
														
 
															+  let cg: CodeGraph;
														
 
															+  let handler: ToolHandler;
														
 
															+
														
 
															+  beforeAll(async () => {
														
 
															+    testDir = fs.mkdtempSync(path.join(os.tmpdir(), 'codegraph-explore-budget-'));
														
 
															+    const srcDir = path.join(testDir, 'src');
														
 
															+    fs.mkdirSync(srcDir);
														
 
															+
														
 
															+    // A handful of files with one fat target file. The fat file mimics the
														
 
															+    // Alamofire Session.swift case: many methods stacked on top of each other,
														
 
															+    // which collapsed into one giant cluster pre-#185.
														
 
															+    const fatLines: string[] = ['export class Session {'];
														
 
															+    for (let i = 0; i < 30; i++) {
														
 
															+      fatLines.push(`  method${i}(arg: string): string {`);
														
 
															+      fatLines.push(`    return this.helper${i}(arg) + "${i}";`);
														
 
															+      fatLines.push(`  }`);
														
 
															+      fatLines.push(`  private helper${i}(arg: string): string {`);
														
 
															+      fatLines.push(`    return arg.repeat(${i + 1});`);
														
 
															+      fatLines.push(`  }`);
														
 
															+    }
														
 
															+    fatLines.push('}');
														
 
															+    fs.writeFileSync(path.join(srcDir, 'session.ts'), fatLines.join('\n'));
														
 
															+
														
 
															+    // A few small supporting files so the project has >1 indexed file.
														
 
															+    for (let i = 0; i < 5; i++) {
														
 
															+      fs.writeFileSync(
														
 
															+        path.join(srcDir, `support${i}.ts`),
														
 
															+        `import { Session } from './session';\nexport function callSession${i}(s: Session) { return s.method${i}('hi'); }\n`
														
 
															+      );
														
 
															+    }
														
 
															+
														
 
															+    cg = CodeGraph.initSync(testDir, {
														
 
															+      config: { include: ['**/*.ts'], exclude: [] },
														
 
															+    });
														
 
															+    await cg.indexAll();
														
 
															+    handler = new ToolHandler(cg);
														
 
															+  });
														
 
															+
														
 
															+  afterAll(() => {
														
 
															+    if (cg) cg.destroy();
														
 
															+    if (testDir && fs.existsSync(testDir)) {
														
 
															+      fs.rmSync(testDir, { recursive: true, force: true });
														
 
															+    }
														
 
															+  });
														
 
															+
														
 
															+  it('keeps total output under the small-project cap', async () => {
														
 
															+    const result = await handler.execute('codegraph_explore', { query: 'Session method helper' });
														
 
															+    const text = result.content?.[0]?.text ?? '';
														
 
															+    const smallBudget = getExploreOutputBudget(100);
														
 
															+    // Allow a small overshoot for the trailing markers — the cap is enforced
														
 
															+    // per-file rather than as an absolute output ceiling.
														
 
															+    expect(text.length).toBeLessThan(smallBudget.maxOutputChars + 500);
														
 
															+  });
														
 
															+
														
 
															+  it('omits the meta-text gated off for small projects', async () => {
														
 
															+    const result = await handler.execute('codegraph_explore', { query: 'Session method helper' });
														
 
															+    const text = result.content?.[0]?.text ?? '';
														
 
															+    expect(text).not.toContain('### Additional relevant files');
														
 
															+    expect(text).not.toContain('Complete source code is included above');
														
 
															+    expect(text).not.toContain('Explore budget:');
														
 
															+  });
														
 
															+
														
 
															+  it('still includes the Relationships section — it is the cheapest structural signal', async () => {
														
 
															+    const result = await handler.execute('codegraph_explore', { query: 'Session method helper' });
														
 
															+    const text = result.content?.[0]?.text ?? '';
														
 
															+    // Either there are relationships, or no edges were significant — both are fine.
														
 
															+    // We just want to confirm we did not accidentally gate it off.
														
 
															+    const hasRelationships = text.includes('### Relationships');
														
 
															+    const sourceFollowsHeader = text.indexOf('### Source Code') > 0;
														
 
															+    expect(hasRelationships || sourceFollowsHeader).toBe(true);
														
 
															+  });
														
 
															+});
														
--- a/src/mcp/tools.ts
+++ b/src/mcp/tools.ts
@@ -44,6 +44,104 @@ export function getExploreBudget(fileCount: number): number {
 
															   return 5;
														
 
															 }
														
 
															+/**
														
 
															+ * Adaptive output budget for `codegraph_explore`, scaled to project size.
														
 
															+ *
														
 
															+ * Smaller codebases get a tighter total cap, fewer default files, smaller
														
 
															+ * per-file cap, and tighter clustering — so a focused query on a 100-file
														
 
															+ * project doesn't dump a whole file's worth of source into the agent's
														
 
															+ * context. Larger codebases keep the generous defaults because the
														
 
															+ * agent's native discovery cost (grep + find + many Reads) genuinely
														
 
															+ * dwarfs a fat explore call at that scale.
														
 
															+ *
														
 
															+ * Meta-text (relationships map, "additional relevant files" list,
														
 
															+ * completeness signal, budget note) is gated off for tiny projects
														
 
															+ * where one rich call is the whole story and the extra prose is just
														
 
															+ * overhead.
														
 
															+ *
														
 
															+ * Tier breakpoints mirror `getExploreBudget` so a project sits in the
														
 
															+ * same tier across both knobs.
														
 
															+ */
														
 
															+export interface ExploreOutputBudget {
														
 
															+  /** Hard cap on total output characters. */
														
 
															+  maxOutputChars: number;
														
 
															+  /** Default `maxFiles` when the caller didn't specify one. */
														
 
															+  defaultMaxFiles: number;
														
 
															+  /** Cap on contiguous source returned per file (across all its clusters). */
														
 
															+  maxCharsPerFile: number;
														
 
															+  /** Cluster gap threshold in lines — tighter clustering on small projects. */
														
 
															+  gapThreshold: number;
														
 
															+  /** Max symbols listed in the per-file header (`#### path — sym(kind), ...`). */
														
 
															+  maxSymbolsInFileHeader: number;
														
 
															+  /** Max edges shown per relationship kind in the Relationships section. */
														
 
															+  maxEdgesPerRelationshipKind: number;
														
 
															+  /** Include the "Relationships" section. */
														
 
															+  includeRelationships: boolean;
														
 
															+  /** Include the "Additional relevant files (not shown)" trailing list. */
														
 
															+  includeAdditionalFiles: boolean;
														
 
															+  /** Include the "Complete source code is included above…" reminder. */
														
 
															+  includeCompletenessSignal: boolean;
														
 
															+  /** Include the explore-budget reminder at the end. */
														
 
															+  includeBudgetNote: boolean;
														
 
															+}
														
 
															+
														
 
															+export function getExploreOutputBudget(fileCount: number): ExploreOutputBudget {
														
 
															+  if (fileCount < 500) {
														
 
															+    return {
														
 
															+      maxOutputChars: 18000,
														
 
															+      defaultMaxFiles: 5,
														
 
															+      maxCharsPerFile: 3800,
														
 
															+      gapThreshold: 8,
														
 
															+      maxSymbolsInFileHeader: 6,
														
 
															+      maxEdgesPerRelationshipKind: 6,
														
 
															+      includeRelationships: true,
														
 
															+      includeAdditionalFiles: false,
														
 
															+      includeCompletenessSignal: false,
														
 
															+      includeBudgetNote: false,
														
 
															+    };
														
 
															+  }
														
 
															+  if (fileCount < 5000) {
														
 
															+    return {
														
 
															+      maxOutputChars: 28000,
														
 
															+      defaultMaxFiles: 9,
														
 
															+      maxCharsPerFile: 5000,
														
 
															+      gapThreshold: 12,
														
 
															+      maxSymbolsInFileHeader: 10,
														
 
															+      maxEdgesPerRelationshipKind: 10,
														
 
															+      includeRelationships: true,
														
 
															+      includeAdditionalFiles: true,
														
 
															+      includeCompletenessSignal: true,
														
 
															+      includeBudgetNote: true,
														
 
															+    };
														
 
															+  }
														
 
															+  if (fileCount < 15000) {
														
 
															+    return {
														
 
															+      maxOutputChars: 35000,
														
 
															+      defaultMaxFiles: 12,
														
 
															+      maxCharsPerFile: 7000,
														
 
															+      gapThreshold: 15,
														
 
															+      maxSymbolsInFileHeader: 15,
														
 
															+      maxEdgesPerRelationshipKind: 15,
														
 
															+      includeRelationships: true,
														
 
															+      includeAdditionalFiles: true,
														
 
															+      includeCompletenessSignal: true,
														
 
															+      includeBudgetNote: true,
														
 
															+    };
														
 
															+  }
														
 
															+  return {
														
 
															+    maxOutputChars: 38000,
														
 
															+    defaultMaxFiles: 14,
														
 
															+    maxCharsPerFile: 7000,
														
 
															+    gapThreshold: 15,
														
 
															+    maxSymbolsInFileHeader: 15,
														
 
															+    maxEdgesPerRelationshipKind: 15,
														
 
															+    includeRelationships: true,
														
 
															+    includeAdditionalFiles: true,
														
 
															+    includeCompletenessSignal: true,
														
 
															+    includeBudgetNote: true,
														
 
															+  };
														
 
															+}
														
 
															+
														
 
															 /**
														
 
															  * Mark a Claude session as having consulted MCP tools.
														
 
															  * This enables Grep/Glob/Bash commands that would otherwise be blocked.
														
@@ -656,24 +754,35 @@ export class ToolHandler {
 
															     return this.textResult(this.truncateOutput(formatted));
														
 
															   }
														
 
															-  /** Maximum output for explore tool — sized to stay under MCP client token limits (~10k tokens) */
														
 
															-  private static readonly EXPLORE_MAX_OUTPUT = 35000;
														
 
															-
														
 
															   /**
														
 
															    * Handle codegraph_explore — deep exploration in a single call
														
 
															    *
														
 
															    * Strategy: find relevant symbols via graph traversal, group by file,
														
 
															    * then read contiguous file sections covering all symbols per file.
														
 
															    * This replaces multiple codegraph_node + Read calls.
														
 
															+   *
														
 
															+   * Output size is adaptive to project file count via
														
 
															+   * `getExploreOutputBudget` — see #185 for why a fixed 35k cap was a
														
 
															+   * tax on small projects while earning its keep on large ones.
														
 
															    */
														
 
															   private async handleExplore(args: Record<string, unknown>): Promise<ToolResult> {
														
 
															     const query = this.validateString(args.query, 'query');
														
 
															     if (typeof query !== 'string') return query;
														
 
															     const cg = this.getCodeGraph(args.projectPath as string | undefined);
														
 
															-    const maxFiles = clamp((args.maxFiles as number) || 12, 1, 20);
														
 
															     const projectRoot = cg.getProjectRoot();
														
 
															+    // Resolve adaptive output budget from project size. Falls back to the
														
 
															+    // largest-tier defaults if stats aren't available, which preserves
														
 
															+    // pre-#185 behavior for callers that hit the rare stats failure.
														
 
															+    let budget: ExploreOutputBudget;
														
 
															+    try {
														
 
															+      budget = getExploreOutputBudget(cg.getStats().fileCount);
														
 
															+    } catch {
														
 
															+      budget = getExploreOutputBudget(Infinity);
														
 
															+    }
														
 
															+    const maxFiles = clamp((args.maxFiles as number) || budget.defaultMaxFiles, 1, 20);
														
 
															+
														
 
															     // Step 1: Find relevant context with generous parameters.
														
 
															     // Use a large maxNodes budget — explore has its own 35k char output limit
														
 
															     // that prevents context bloat, so more nodes just means better coverage
														
@@ -765,7 +874,7 @@ export class ToolHandler {
 
															       e.kind !== 'contains' // skip contains — it's implied by file grouping
														
 
															     );
														
 
															-    if (significantEdges.length > 0) {
														
 
															+    if (budget.includeRelationships && significantEdges.length > 0) {
														
 
															       lines.push('### Relationships');
														
 
															       lines.push('');
														
@@ -782,14 +891,14 @@ export class ToolHandler {
 
															       }
														
 
															       for (const [kind, edges] of byKind) {
														
 
															-        // Show up to 15 relationships per kind
														
 
															-        const shown = edges.slice(0, 15);
														
 
															+        const cap = budget.maxEdgesPerRelationshipKind;
														
 
															+        const shown = edges.slice(0, cap);
														
 
															         lines.push(`**${kind}:**`);
														
 
															         for (const e of shown) {
														
 
															           lines.push(`- ${e.source} → ${e.target}`);
														
 
															         }
														
 
															-        if (edges.length > 15) {
														
 
															-          lines.push(`- ... and ${edges.length - 15} more`);
														
 
															+        if (edges.length > cap) {
														
 
															+          lines.push(`- ... and ${edges.length - cap} more`);
														
 
															         }
														
 
															         lines.push('');
														
 
															       }
														
@@ -801,10 +910,11 @@ export class ToolHandler {
 
															     let totalChars = lines.join('\n').length;
														
 
															     let filesIncluded = 0;
														
 
															+    let anyFileTrimmed = false;
														
 
															     for (const [filePath, group] of sortedFiles) {
														
 
															       if (filesIncluded >= maxFiles) break;
														
 
															-      if (totalChars > ToolHandler.EXPLORE_MAX_OUTPUT * 0.9) break;
														
 
															+      if (totalChars > budget.maxOutputChars * 0.9) break;
														
 
															       const absPath = validatePathWithinRoot(projectRoot, filePath);
														
 
															       if (!absPath || !existsSync(absPath)) continue;
														
@@ -820,14 +930,26 @@ export class ToolHandler {
 
															       const lang = group.nodes[0]?.language || '';
														
 
															       // Cluster nearby symbols to avoid reading huge gaps between distant symbols.
														
 
															-      // Sort by start line, then merge overlapping/adjacent ranges (within 15 lines).
														
 
															-      // Include both node ranges AND edge source locations so template sections
														
 
															-      // with component usages/calls are covered (not just script block symbols).
														
 
															-      const ranges: Array<{ start: number; end: number; name: string; kind: string }> = group.nodes
														
 
															+      // Sort by start line, then merge overlapping/adjacent ranges (within the
														
 
															+      // adaptive gap threshold). Include both node ranges AND edge source
														
 
															+      // locations so template sections with component usages/calls are
														
 
															+      // covered (not just script block symbols).
														
 
															+      //
														
 
															+      // Each range carries an `importance` score so we can rank clusters
														
 
															+      // when the per-file budget forces us to drop some: entry-point nodes
														
 
															+      // are worth 10, directly-connected nodes 3, peripheral nodes 1, and
														
 
															+      // bare edge-source lines 2 (less than a connected node but more than
														
 
															+      // a peripheral one — they hint at a reference but aren't a definition).
														
 
															+      const ranges: Array<{ start: number; end: number; name: string; kind: string; importance: number }> = group.nodes
														
 
															         .filter(n => n.startLine > 0 && n.endLine > 0)
														
 
															         // Skip file/component nodes that span the entire file — they'd create one giant cluster
														
 
															         .filter(n => !(n.kind === 'component' && n.startLine === 1 && n.endLine >= fileLines.length - 1))
														
 
															-        .map(n => ({ start: n.startLine, end: n.endLine, name: n.name, kind: n.kind }));
														
 
															+        .map(n => {
														
 
															+          let importance = 1;
														
 
															+          if (entryNodeIds.has(n.id)) importance = 10;
														
 
															+          else if (connectedToEntry.has(n.id)) importance = 3;
														
 
															+          return { start: n.startLine, end: n.endLine, name: n.name, kind: n.kind, importance };
														
 
															+        });
														
 
															       // Add edge source locations in this file — captures template references
														
 
															       // (component usages, event handlers) that aren't nodes themselves.
														
@@ -844,7 +966,7 @@ export class ToolHandler {
 
															           // Look up target name from subgraph first, fall back to edge kind
														
 
															           const targetNode = subgraph.nodes.get(edge.target);
														
 
															           const targetName = targetNode?.name ?? edge.kind;
														
 
															-          ranges.push({ start: edge.line, end: edge.line, name: targetName, kind: edge.kind });
														
 
															+          ranges.push({ start: edge.line, end: edge.line, name: targetName, kind: edge.kind, importance: 2 });
														
 
															         }
														
 
															       }
														
@@ -852,46 +974,129 @@ export class ToolHandler {
 
															       if (ranges.length === 0) continue;
														
 
															-      const GAP_THRESHOLD = 15; // merge sections within 15 lines of each other
														
 
															-      const clusters: Array<{ start: number; end: number; symbols: string[] }> = [];
														
 
															-      let current = { start: ranges[0]!.start, end: ranges[0]!.end, symbols: [`${ranges[0]!.name}(${ranges[0]!.kind})`] };
														
 
															+      const gapThreshold = budget.gapThreshold;
														
 
															+      const clusters: Array<{ start: number; end: number; symbols: string[]; score: number }> = [];
														
 
															+      let current = {
														
 
															+        start: ranges[0]!.start,
														
 
															+        end: ranges[0]!.end,
														
 
															+        symbols: [`${ranges[0]!.name}(${ranges[0]!.kind})`],
														
 
															+        score: ranges[0]!.importance,
														
 
															+      };
														
 
															       for (let i = 1; i < ranges.length; i++) {
														
 
															         const r = ranges[i]!;
														
 
															-        if (r.start <= current.end + GAP_THRESHOLD) {
														
 
															+        if (r.start <= current.end + gapThreshold) {
														
 
															           current.end = Math.max(current.end, r.end);
														
 
															           current.symbols.push(`${r.name}(${r.kind})`);
														
 
															+          current.score += r.importance;
														
 
															         } else {
														
 
															           clusters.push(current);
														
 
															-          current = { start: r.start, end: r.end, symbols: [`${r.name}(${r.kind})`] };
														
 
															+          current = {
														
 
															+            start: r.start,
														
 
															+            end: r.end,
														
 
															+            symbols: [`${r.name}(${r.kind})`],
														
 
															+            score: r.importance,
														
 
															+          };
														
 
															         }
														
 
															       }
														
 
															       clusters.push(current);
														
 
															-      // Build file section output from clusters
														
 
															+      // Build file section output from clusters, capped by per-file budget.
														
 
															+      // The pathological case (#185): a file like Session.swift where every
														
 
															+      // method is adjacent collapses into one cluster spanning the whole
														
 
															+      // file, and dumping that into the agent's context is most of the
														
 
															+      // token cost on small projects. We pick clusters in score order
														
 
															+      // (importance per line, so we don't prefer one giant low-density
														
 
															+      // cluster over several focused ones) until the per-file char cap is
														
 
															+      // hit. Truly enormous single clusters get tail-trimmed with a marker.
														
 
															       const contextPadding = 3;
														
 
															+      const buildSection = (c: { start: number; end: number }): string => {
														
 
															+        const startIdx = Math.max(0, c.start - 1 - contextPadding);
														
 
															+        const endIdx = Math.min(fileLines.length, c.end + contextPadding);
														
 
															+        return fileLines.slice(startIdx, endIdx).join('\n');
														
 
															+      };
														
 
															+      const GAP_MARKER = '\n\n// ... (gap) ...\n\n';
														
 
															+
														
 
															+      // Score clusters by score-per-line (density) so a 30-line cluster
														
 
															+      // with two entry symbols outranks a 400-line cluster with two
														
 
															+      // peripheral symbols. Stable tiebreak by score, then by smaller
														
 
															+      // span (cheaper to include).
														
 
															+      const rankedClusters = clusters
														
 
															+        .map((c, i) => ({ idx: i, span: c.end - c.start + 1, c }))
														
 
															+        .sort((a, b) => {
														
 
															+          const densityA = a.c.score / a.span;
														
 
															+          const densityB = b.c.score / b.span;
														
 
															+          if (densityB !== densityA) return densityB - densityA;
														
 
															+          if (b.c.score !== a.c.score) return b.c.score - a.c.score;
														
 
															+          return a.span - b.span;
														
 
															+        });
														
 
															+
														
 
															+      const chosenIndices = new Set<number>();
														
 
															+      let projectedChars = 0;
														
 
															+      for (const rc of rankedClusters) {
														
 
															+        const sectionLen = buildSection(rc.c).length + (chosenIndices.size > 0 ? GAP_MARKER.length : 0);
														
 
															+        // Always take the top-ranked cluster, even if oversize, so we don't
														
 
															+        // return an empty file section (agent would then re-Read the file,
														
 
															+        // negating the savings).
														
 
															+        if (chosenIndices.size === 0) {
														
 
															+          chosenIndices.add(rc.idx);
														
 
															+          projectedChars += sectionLen;
														
 
															+          continue;
														
 
															+        }
														
 
															+        if (projectedChars + sectionLen > budget.maxCharsPerFile) continue;
														
 
															+        chosenIndices.add(rc.idx);
														
 
															+        projectedChars += sectionLen;
														
 
															+      }
														
 
															+
														
 
															+      // Emit chosen clusters in source order so the file reads top-to-bottom.
														
 
															       let fileSection = '';
														
 
															       const allSymbols: string[] = [];
														
 
															-
														
 
															-      for (const cluster of clusters) {
														
 
															-        const startIdx = Math.max(0, cluster.start - 1 - contextPadding);
														
 
															-        const endIdx = Math.min(fileLines.length, cluster.end + contextPadding);
														
 
															-        const section = fileLines.slice(startIdx, endIdx).join('\n');
														
 
															-
														
 
															-        if (fileSection.length > 0) {
														
 
															-          fileSection += '\n\n// ... (gap) ...\n\n';
														
 
															-        }
														
 
															+      let fileTrimmed = false;
														
 
															+      for (let i = 0; i < clusters.length; i++) {
														
 
															+        if (!chosenIndices.has(i)) continue;
														
 
															+        const cluster = clusters[i]!;
														
 
															+        const section = buildSection(cluster);
														
 
															+        if (fileSection.length > 0) fileSection += GAP_MARKER;
														
 
															         fileSection += section;
														
 
															         allSymbols.push(...cluster.symbols);
														
 
															       }
														
 
															-      // Skip if this section would blow the output limit
														
 
															-      if (totalChars + fileSection.length + 200 > ToolHandler.EXPLORE_MAX_OUTPUT) {
														
 
															-        const budget = ToolHandler.EXPLORE_MAX_OUTPUT - totalChars - 200;
														
 
															-        if (budget < 500) break;
														
 
															-        const trimmed = fileSection.slice(0, budget) + '\n// ... trimmed ...';
														
 
															+      // If a single chosen cluster is still oversize (long monolithic
														
 
															+      // function), tail-trim it. Better one trimmed view than nothing.
														
 
															+      if (fileSection.length > budget.maxCharsPerFile) {
														
 
															+        fileSection = fileSection.slice(0, budget.maxCharsPerFile) + '\n// ... trimmed ...';
														
 
															+        fileTrimmed = true;
														
 
															+      }
														
 
															+      if (chosenIndices.size < clusters.length || fileTrimmed) {
														
 
															+        anyFileTrimmed = true;
														
 
															+      }
														
 
															-        lines.push(`#### ${filePath} — ${allSymbols.join(', ')}`);
														
 
															+      // Dedupe + cap the symbols list shown in the per-file header. Some
														
 
															+      // files (Session.swift in Alamofire) produced 3.4KB symbol lists
														
 
															+      // from cluster scoring + edge-source lines, dwarfing the per-file
														
 
															+      // body cap. Show top names by frequency, with a "+N more" tail.
														
 
															+      const symbolCounts = new Map<string, number>();
														
 
															+      for (const s of allSymbols) {
														
 
															+        symbolCounts.set(s, (symbolCounts.get(s) ?? 0) + 1);
														
 
															+      }
														
 
															+      const sortedSymbols = [...symbolCounts.entries()]
														
 
															+        .sort((a, b) => b[1] - a[1])
														
 
															+        .map(([name]) => name);
														
 
															+      const headerCap = budget.maxSymbolsInFileHeader;
														
 
															+      const headerSymbols = sortedSymbols.slice(0, headerCap);
														
 
															+      const omittedCount = sortedSymbols.length - headerSymbols.length;
														
 
															+      const headerSuffix = omittedCount > 0
														
 
															+        ? `${headerSymbols.join(', ')}, +${omittedCount} more`
														
 
															+        : headerSymbols.join(', ');
														
 
															+      const fileHeader = `#### ${filePath} — ${headerSuffix}`;
														
 
															+
														
 
															+      // Respect the total output cap on a file-by-file basis.
														
 
															+      if (totalChars + fileSection.length + 200 > budget.maxOutputChars) {
														
 
															+        const remaining = budget.maxOutputChars - totalChars - 200;
														
 
															+        if (remaining < 500) break;
														
 
															+        const trimmed = fileSection.slice(0, remaining) + '\n// ... trimmed ...';
														
 
															+
														
 
															+        lines.push(fileHeader);
														
 
															         lines.push('');
														
 
															         lines.push('```' + lang);
														
 
															         lines.push(trimmed);
														
@@ -899,10 +1104,11 @@ export class ToolHandler {
 
															         lines.push('');
														
 
															         totalChars += trimmed.length + 200;
														
 
															         filesIncluded++;
														
 
															+        anyFileTrimmed = true;
														
 
															         break;
														
 
															       }
														
 
															-      lines.push(`#### ${filePath} — ${allSymbols.join(', ')}`);
														
 
															+      lines.push(fileHeader);
														
 
															       lines.push('');
														
 
															       lines.push('```' + lang);
														
 
															       lines.push(fileSection);
														
@@ -913,37 +1119,51 @@ export class ToolHandler {
 
															       filesIncluded++;
														
 
															     }
														
 
															-    // Add remaining files as references (from both relevant and peripheral files)
														
 
															-    const remainingRelevant = sortedFiles.slice(filesIncluded);
														
 
															-    const peripheralFiles = [...fileGroups.entries()]
														
 
															-      .filter(([, group]) => group.score < 3)
														
 
															-      .sort((a, b) => b[1].score - a[1].score);
														
 
															-    const remainingFiles = [...remainingRelevant, ...peripheralFiles];
														
 
															-    if (remainingFiles.length > 0) {
														
 
															-      lines.push('### Additional relevant files (not shown)');
														
 
															-      lines.push('');
														
 
															-      for (const [filePath, group] of remainingFiles.slice(0, 10)) {
														
 
															-        const symbols = group.nodes.map(n => `${n.name}:${n.startLine}`).join(', ');
														
 
															-        lines.push(`- ${filePath}: ${symbols}`);
														
 
															-      }
														
 
															-      if (remainingFiles.length > 10) {
														
 
															-        lines.push(`- ... and ${remainingFiles.length - 10} more files`);
														
 
															+    // Add remaining files as references (from both relevant and peripheral files).
														
 
															+    // Small projects (per budget) skip this — the relevant story already fits
														
 
															+    // in the source section, and a trailing pointer list is pure overhead.
														
 
															+    if (budget.includeAdditionalFiles) {
														
 
															+      const remainingRelevant = sortedFiles.slice(filesIncluded);
														
 
															+      const peripheralFiles = [...fileGroups.entries()]
														
 
															+        .filter(([, group]) => group.score < 3)
														
 
															+        .sort((a, b) => b[1].score - a[1].score);
														
 
															+      const remainingFiles = [...remainingRelevant, ...peripheralFiles];
														
 
															+      if (remainingFiles.length > 0) {
														
 
															+        lines.push('### Additional relevant files (not shown)');
														
 
															+        lines.push('');
														
 
															+        for (const [filePath, group] of remainingFiles.slice(0, 10)) {
														
 
															+          const symbols = group.nodes.map(n => `${n.name}:${n.startLine}`).join(', ');
														
 
															+          lines.push(`- ${filePath}: ${symbols}`);
														
 
															+        }
														
 
															+        if (remainingFiles.length > 10) {
														
 
															+          lines.push(`- ... and ${remainingFiles.length - 10} more files`);
														
 
															+        }
														
 
															       }
														
 
															     }
														
 
															-    // Add completeness signal so agents know they don't need to re-read these files
														
 
															-    lines.push('');
														
 
															-    lines.push('---');
														
 
															-    lines.push(`> **Complete source code is included above for ${filesIncluded} files.** You do NOT need to re-read these files — the relevant sections are already shown in full. Only use Read/Grep for files listed under "Additional relevant files" if you need more detail.`);
														
 
															+    // Add completeness signal so agents know they don't need to re-read these files.
														
 
															+    // On small projects the budget gates this off — but if we actually had to
														
 
															+    // trim or drop clusters, surface a brief note so the agent knows it can
														
 
															+    // still Read for more detail.
														
 
															+    if (budget.includeCompletenessSignal) {
														
 
															+      lines.push('');
														
 
															+      lines.push('---');
														
 
															+      lines.push(`> **Complete source code is included above for ${filesIncluded} files.** You do NOT need to re-read these files — the relevant sections are already shown in full. Only use Read/Grep for files listed under "Additional relevant files" if you need more detail.`);
														
 
															+    } else if (anyFileTrimmed) {
														
 
															+      lines.push('');
														
 
															+      lines.push(`> Some file sections were trimmed for size. Use \`codegraph_node\` or Read for the full source if needed.`);
														
 
															+    }
														
 
															     // Add explore budget note based on project size
														
 
															-    try {
														
 
															-      const stats = cg.getStats();
														
 
															-      const budget = getExploreBudget(stats.fileCount);
														
 
															-      lines.push('');
														
 
															-      lines.push(`> **Explore budget: ${budget} calls max for this project (${stats.fileCount.toLocaleString()} files indexed).** Stop exploring and synthesize your answer once you've used ${budget} calls — do NOT make additional explore calls beyond this budget.`);
														
 
															-    } catch {
														
 
															-      // Stats unavailable — skip budget note
														
 
															+    if (budget.includeBudgetNote) {
														
 
															+      try {
														
 
															+        const stats = cg.getStats();
														
 
															+        const callBudget = getExploreBudget(stats.fileCount);
														
 
															+        lines.push('');
														
 
															+        lines.push(`> **Explore budget: ${callBudget} calls max for this project (${stats.fileCount.toLocaleString()} files indexed).** Stop exploring and synthesize your answer once you've used ${callBudget} calls — do NOT make additional explore calls beyond this budget.`);
														
 
															+      } catch {
														
 
															+        // Stats unavailable — skip budget note
														
 
															+      }
														
 
															     }
														
 
															     return this.textResult(lines.join('\n'));