| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373 |
- /**
- * Regression test for adaptive `codegraph_explore` sizing — sibling
- * skeletonization (branch `feat/adaptive-explore-sizing`, commit d6d059f).
- *
- * Feature: when a file is BOTH (1) off the synthesized flow spine AND (2) a
- * polymorphic sibling — its class implements/extends a supertype shared by
- * >= MIN_SIBLINGS (3) implementers — `codegraph_explore` renders it as a
- * class + member *signature* skeleton (bodies elided) instead of full source,
- * keeping the on-spine exemplar and the mechanism full. This sizes the
- * response to the answer rather than the budget cap on sibling-heavy flows
- * (OkHttp's interceptor chain) without starving diffuse ones (distinct
- * pipeline steps stay full). Default ON; CODEGRAPH_ADAPTIVE_EXPLORE=0 disables.
- *
- * The fixture is OkHttp's interceptor chain in miniature:
- * - `Interceptor` interface with FIVE implementers (>= 3 => a sibling family)
- * - a 3-hop call spine `dispatch -> proceed -> handleLogging` that passes
- * THROUGH LoggingInterceptor — so that file is the on-spine exemplar
- * - Bridge/Cache/RetryInterceptor: off-spine members of the sibling family
- * => skeletonize
- * - ResponseFormatter implements `Formatter`, which has only ONE impl (< 3)
- * => a distinct step: off-spine but NOT a sibling => stays full
- *
- * Guards the two ways the feature can silently regress: skeletonizing too much
- * (a distinct step or the on-spine exemplar) or too little (the off-spine
- * siblings), plus the escape hatch.
- */
- import { describe, it, expect, beforeAll, afterAll, beforeEach } from 'vitest';
- import * as fs from 'fs';
- import * as path from 'path';
- import * as os from 'os';
- import { ToolHandler } from '../src/mcp/tools';
- import CodeGraph from '../src/index';
/** Text the tests look for inside a file's section to tell it was rendered as a skeleton. */
const SKELETON_MARK: string = '· skeleton (signatures only; Read for a full body)';
/**
 * Return the `#### <path> ...` section for a file basename: the header line
 * through the line before the next `###`/`####` header (or end of output).
 *
 * The basename has to appear in the header as a whole file-name component, so
 * asking for `formatter.ts` does not pick up a `response-formatter.ts` header
 * and `codec.ts` does not pick up `codec.tsx`.
 *
 * @param text - the full explore output to search
 * @param basename - file name to look for in the `#### ` header lines
 * @returns the section text, or `''` when no `#### ` header names the file
 */
function sectionFor(text: string, basename: string): string {
  const lines = text.split('\n');

  // True when `header` contains `basename` bounded on both sides by something
  // that cannot be part of the same file name (path separator, space, EOL...).
  const namesFile = (header: string): boolean => {
    // An empty basename matches every header, same as String#includes('').
    if (basename === '') return true;
    let at = header.indexOf(basename);
    while (at !== -1) {
      const before = header.charAt(at - 1); // '' at the start of the line
      const after = header.charAt(at + basename.length); // '' at the end
      if (!/[\w.-]/.test(before) && !/\w/.test(after)) return true;
      at = header.indexOf(basename, at + 1);
    }
    return false;
  };

  const start = lines.findIndex((line) => line.startsWith('#### ') && namesFile(line));
  if (start < 0) return '';

  // The section stops right before the next header of either level.
  const next = lines.findIndex(
    (line, i) => i > start && (line.startsWith('### ') || line.startsWith('#### '))
  );
  const end = next === -1 ? lines.length : next;
  return lines.slice(start, end).join('\n');
}
describe('adaptive codegraph_explore sizing — sibling skeletonization', () => {
  /** Env flag for the feature: unset means ON (the default), '0' disables it. */
  const ADAPTIVE_FLAG = 'CODEGRAPH_ADAPTIVE_EXPLORE';

  let testDir: string;
  let cg: CodeGraph;
  let handler: ToolHandler;
  /** Value the flag had before this suite touched it; put back in afterAll. */
  let flagBeforeSuite: string | undefined;

  // Names the spine (dispatch/proceed/handleLogging), the on-spine exemplar,
  // the three off-spine siblings, and the distinct step — so every file we
  // assert on is gathered as relevant. maxFiles overrides the very-tiny tier's
  // 4-file default so all of them land in one call.
  const QUERY =
    'dispatch proceed handleLogging LoggingInterceptor BridgeInterceptor CacheInterceptor RetryInterceptor ResponseFormatter';

  // Names AuthInterceptor's `authenticate` and Codec's `encode` (both methods),
  // plus the spine tokens so a spine still forms. Same Interceptor family as the
  // skeleton test, plus the Codec base+subclasses family.
  const SPARE_QUERY = `${QUERY} authenticate encode AuthInterceptor Codec JsonCodec`;

  /** Run `codegraph_explore` and return the first content item's text ('' when absent). */
  const explore = async (query: string, maxFiles: number): Promise<string> => {
    const result = await handler.execute('codegraph_explore', { query, maxFiles });
    return result.content?.[0]?.text ?? '';
  };

  beforeAll(async () => {
    // Remember whatever the developer/CI had set so the suite can restore it.
    flagBeforeSuite = process.env[ADAPTIVE_FLAG];

    testDir = fs.mkdtempSync(path.join(os.tmpdir(), 'codegraph-adaptive-explore-'));
    const srcDir = path.join(testDir, 'src');
    fs.mkdirSync(srcDir);

    // trimStart drops the newline that follows each opening backtick below.
    const write = (name: string, body: string) =>
      fs.writeFileSync(path.join(srcDir, name), body.trimStart());

    // The interchangeable contract — 5 implementers below (Logging, Bridge,
    // Cache, Retry, Auth) => sibling family.
    write(
      'interceptor.ts',
      `
export interface Interceptor {
intercept(request: string): string;
}
`
    );

    // The mechanism + the spine: dispatch -> proceed -> (LoggingInterceptor) handleLogging.
    // Unique method names so the call edges resolve unambiguously.
    write(
      'dispatcher.ts',
      `
import { LoggingInterceptor } from './logging-interceptor';
export class RequestDispatcher {
dispatch(): string {
const chain = new InterceptorChain();
return chain.proceed();
}
}
export class InterceptorChain {
proceed(): string {
const exemplar = new LoggingInterceptor();
return exemplar.handleLogging();
}
}
`
    );

    // On-spine exemplar: handleLogging is the spine's tail, so this whole file
    // is on-spine and must stay FULL even though it's a sibling (implements Interceptor).
    write(
      'logging-interceptor.ts',
      `
import { Interceptor } from './interceptor';
export class LoggingInterceptor implements Interceptor {
handleLogging(): string {
const tag = 'LOGGING_BODY_MARKER';
return this.intercept(tag);
}
intercept(request: string): string {
return 'logged:' + request;
}
}
`
    );

    // Off-spine siblings — interchangeable impls of Interceptor => SKELETONIZE.
    // Each body carries a unique marker that must NOT survive skeletonization.
    write(
      'bridge-interceptor.ts',
      `
import { Interceptor } from './interceptor';
export class BridgeInterceptor implements Interceptor {
intercept(request: string): string {
const detail = 'BRIDGE_BODY_MARKER';
return 'bridged:' + request + detail;
}
}
`
    );
    write(
      'cache-interceptor.ts',
      `
import { Interceptor } from './interceptor';
export class CacheInterceptor implements Interceptor {
intercept(request: string): string {
const detail = 'CACHE_BODY_MARKER';
return 'cached:' + request + detail;
}
}
`
    );
    write(
      'retry-interceptor.ts',
      `
import { Interceptor } from './interceptor';
export class RetryInterceptor implements Interceptor {
intercept(request: string): string {
const detail = 'RETRY_BODY_MARKER';
return 'retried:' + request + detail;
}
}
`
    );

    // A 1:1 interface->impl pair: off-spine, implements something, but the
    // supertype has only ONE impl (< MIN_SIBLINGS) => a DISTINCT step => FULL.
    write(
      'formatter.ts',
      `
export interface Formatter {
format(input: string): string;
}
`
    );
    write(
      'response-formatter.ts',
      `
import { Formatter } from './formatter';
import { JsonCodec } from './codec';
export class ResponseFormatter implements Formatter {
format(input: string): string {
const detail = 'FORMATTER_BODY_MARKER';
// Calls into the Codec family from OFF the dispatch spine, so codec.ts is
// gathered as relevant but stays off-spine (mirrors Django: compiler.py is
// referenced by the flow yet off the QuerySet-iteration spine).
return new JsonCodec().encode(input) + detail;
}
}
`
    );

    // An off-spine sibling (implements Interceptor) the agent would otherwise
    // skeletonize — BUT it owns a uniquely-named method `authenticate` the agent
    // names in the query. Mirrors OkHttp's RealCall (named getResponseWith-
    // InterceptorChain): a named callable means "show me this", so it stays full.
    write(
      'auth-interceptor.ts',
      `
import { Interceptor } from './interceptor';
export class AuthInterceptor implements Interceptor {
authenticate(token: string): string {
const detail = 'AUTH_BODY_MARKER';
return 'auth:' + token + detail;
}
intercept(request: string): string {
return this.authenticate(request);
}
}
`
    );

    // A base class that DEFINES a >=3-impl supertype AND co-locates its
    // subclasses in the same file — mirrors Django's compiler.py (SQLCompiler +
    // SQLInsertCompiler/SQLUpdateCompiler/...). The last test in this suite
    // expects this "family" file to be skeletonized even when the agent names
    // `encode`, so the base body marker must not survive.
    write(
      'codec.ts',
      `
export class Codec {
encode(input: string): string {
const detail = 'CODEC_BASE_MARKER';
return input + detail;
}
}
export class JsonCodec extends Codec {
encode(input: string): string { return '{' + input + '}'; }
}
export class XmlCodec extends Codec {
encode(input: string): string { return '<' + input + '>'; }
}
export class YamlCodec extends Codec {
encode(input: string): string { return '- ' + input; }
}
`
    );

    cg = CodeGraph.initSync(testDir, { config: { include: ['**/*.ts'], exclude: [] } });
    await cg.indexAll();
    handler = new ToolHandler(cg);
  });

  afterAll(() => {
    // Restore the flag first so a failure during teardown cannot leak our change.
    // `delete` rather than assigning undefined: process.env stringifies values,
    // so an assignment would leave the literal string "undefined" behind.
    if (flagBeforeSuite === undefined) {
      delete process.env[ADAPTIVE_FLAG];
    } else {
      process.env[ADAPTIVE_FLAG] = flagBeforeSuite;
    }

    if (cg) cg.destroy();
    if (testDir && fs.existsSync(testDir)) {
      fs.rmSync(testDir, { recursive: true, force: true });
    }
  });

  beforeEach(() => {
    // Each test asserts against the default (ON) behaviour unless it opts out.
    delete process.env[ADAPTIVE_FLAG];
  });

  it('fixture sanity: Interceptor has >=3 implementers, Formatter has <3', () => {
    const find = (name: string, kind: string) =>
      cg
        .searchNodes(name)
        .map((r) => r.node)
        .find((n) => n.name === name && n.kind === kind);

    const interceptor = find('Interceptor', 'interface');
    const formatter = find('Formatter', 'interface');
    expect(interceptor).toBeTruthy();
    expect(formatter).toBeTruthy();

    const implementers = (id: string) =>
      cg.getIncomingEdges(id).filter((e) => e.kind === 'implements' || e.kind === 'extends').length;

    // The whole gate hinges on this signal — assert the fixture actually
    // produces the >=3 / <3 split, so a TS-extraction change fails here loudly
    // rather than silently flipping the skeletonization downstream.
    expect(implementers(interceptor!.id)).toBeGreaterThanOrEqual(3);
    expect(implementers(formatter!.id)).toBeLessThan(3);
  });

  it('skeletonizes off-spine polymorphic siblings (bodies elided, signatures kept)', async () => {
    const text = await explore(QUERY, 12);

    // Precondition: the spine must have formed, or nothing skeletonizes.
    expect(text).toContain('## Flow (call path among the symbols you queried)');

    for (const [file, marker] of [
      ['bridge-interceptor.ts', 'BRIDGE_BODY_MARKER'],
      ['cache-interceptor.ts', 'CACHE_BODY_MARKER'],
      ['retry-interceptor.ts', 'RETRY_BODY_MARKER'],
    ] as const) {
      const section = sectionFor(text, file);
      expect(section, `${file} should be present in the explore output`).not.toBe('');
      expect(section, `${file} should be skeletonized`).toContain(SKELETON_MARK);
      // The signature line survives; the body (with its marker) is elided.
      expect(section).toContain('intercept(request');
      expect(section, `${file} body marker must NOT survive skeletonization`).not.toContain(marker);
    }
  });

  it('keeps the on-spine exemplar full even though it is a sibling', async () => {
    const text = await explore(QUERY, 12);

    const section = sectionFor(text, 'logging-interceptor.ts');
    expect(section, 'logging-interceptor.ts should be present').not.toBe('');
    expect(section, 'on-spine exemplar must NOT be skeletonized').not.toContain(SKELETON_MARK);
    // Full source => the body marker is present.
    expect(section).toContain('LOGGING_BODY_MARKER');
  });

  it('keeps a distinct step full (off-spine but supertype has < 3 implementers)', async () => {
    const text = await explore(QUERY, 12);

    const section = sectionFor(text, 'response-formatter.ts');
    expect(section, 'response-formatter.ts should be present').not.toBe('');
    expect(section, 'a 1:1 interface impl is not a sibling and must stay full').not.toContain(SKELETON_MARK);
    expect(section).toContain('FORMATTER_BODY_MARKER');
  });

  it('CODEGRAPH_ADAPTIVE_EXPLORE=0 disables skeletonization (siblings render full)', async () => {
    process.env[ADAPTIVE_FLAG] = '0';
    try {
      const text = await explore(QUERY, 12);
      expect(text, 'no file should be skeletonized with the flag off').not.toContain(SKELETON_MARK);
      // The previously-skeletonized siblings now render their full bodies.
      const section = sectionFor(text, 'bridge-interceptor.ts');
      expect(section).not.toBe('');
      expect(section).toContain('BRIDGE_BODY_MARKER');
    } finally {
      delete process.env[ADAPTIVE_FLAG];
    }
  });

  it('spares an off-spine sibling when the agent NAMED a callable in it (RealCall fix)', async () => {
    const text = await explore(SPARE_QUERY, 15);
    expect(text).toContain('## Flow (call path among the symbols you queried)');

    // auth-interceptor.ts is an off-spine Interceptor sibling — would skeletonize —
    // but the agent named its method `authenticate`, so it stays FULL.
    const auth = sectionFor(text, 'auth-interceptor.ts');
    expect(auth, 'auth-interceptor.ts should be present').not.toBe('');
    expect(auth, 'a file holding an agent-named callable must NOT be skeletonized').not.toContain(SKELETON_MARK);
    expect(auth).toContain('AUTH_BODY_MARKER');

    // Contrast: bridge-interceptor.ts — same family, named only by TYPE — still skeletonizes.
    const bridge = sectionFor(text, 'bridge-interceptor.ts');
    expect(bridge, 'a sibling named only by type still skeletonizes').toContain(SKELETON_MARK);
    expect(bridge).not.toContain('BRIDGE_BODY_MARKER');
  });

  it('skeletonizes a base+subclasses family file even when named (compiler.py: family override beats the named spare)', async () => {
    const text = await explore(SPARE_QUERY, 15);

    // codec.ts defines the base Codec (>=3 subclasses extend it) and co-locates the
    // subclasses — a redundant, Read-anyway "family" file (Django's compiler.py). Even
    // though the agent named `encode`, it STILL skeletonizes: a full one would eat the
    // explore budget and starve the sibling files. Contrast auth-interceptor.ts, which
    // is named AND not a family file → spared. This is the override that keeps
    // Django from regressing (sparing the family file cost more and Read more).
    const codec = sectionFor(text, 'codec.ts');
    expect(codec, 'codec.ts should be present').not.toBe('');
    expect(codec, 'a named base+subclasses family file still skeletonizes (budget)').toContain(SKELETON_MARK);
    expect(codec, 'the elided base body marker must NOT survive').not.toContain('CODEC_BASE_MARKER');
  });
});
|