| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245 |
- /**
- * Database Layer
- *
- * Handles SQLite database initialization and connection management.
- */
- import { SqliteDatabase, SqliteBackend, createDatabase } from './sqlite-adapter';
- import * as fs from 'fs';
- import * as path from 'path';
- import { SchemaVersion } from '../types';
- import { runMigrations, getCurrentVersion, CURRENT_SCHEMA_VERSION } from './migrations';
- import { getCodeGraphDir } from '../directory';
- export { SqliteDatabase, SqliteBackend } from './sqlite-adapter';
- /**
- * Apply connection-level PRAGMAs. Shared by `initialize` and `open` so the two
- * paths can't drift.
- *
- * `busy_timeout` is set FIRST, before any pragma that might touch the database
- * file (notably `journal_mode`). If another process holds a write lock at open
- * time, the later pragmas — and the connection's first query — then wait out
- * the lock instead of throwing "database is locked" immediately. See issue #238.
- *
- * The 5s window (was 120s) rides out a normal incremental sync; the old
- * 2-minute wait presented as a frozen, hung agent. With WAL, reads never block
- * on a writer, so this timeout only governs cross-process write contention
- * (e.g. the git-hook `codegraph sync` running while the MCP server writes).
- */
- function configureConnection(db: SqliteDatabase): void {
- db.pragma('busy_timeout = 5000'); // MUST be first — see above
- db.pragma('foreign_keys = ON');
- db.pragma('journal_mode = WAL'); // node:sqlite supports WAL on every platform
- db.pragma('synchronous = NORMAL'); // safe with WAL mode
- db.pragma('cache_size = -64000'); // 64 MB page cache
- db.pragma('temp_store = MEMORY'); // temp tables in memory
- db.pragma('mmap_size = 268435456'); // 256 MB memory-mapped I/O
- }
- /**
- * Database connection wrapper with lifecycle management
- */
- export class DatabaseConnection {
- private db: SqliteDatabase;
- private dbPath: string;
- private backend: SqliteBackend;
- private constructor(db: SqliteDatabase, dbPath: string, backend: SqliteBackend) {
- this.db = db;
- this.dbPath = dbPath;
- this.backend = backend;
- }
- /**
- * Initialize a new database at the given path
- */
- static initialize(dbPath: string): DatabaseConnection {
- // Ensure parent directory exists
- const dir = path.dirname(dbPath);
- if (!fs.existsSync(dir)) {
- fs.mkdirSync(dir, { recursive: true });
- }
- // Create and configure database
- const { db, backend } = createDatabase(dbPath);
- configureConnection(db);
- // Run schema initialization
- const schemaPath = path.join(__dirname, 'schema.sql');
- const schema = fs.readFileSync(schemaPath, 'utf-8');
- db.exec(schema);
- // Record current schema version so migrations aren't re-applied on open
- const currentVersion = getCurrentVersion(db);
- if (currentVersion < CURRENT_SCHEMA_VERSION) {
- db.prepare(
- 'INSERT OR IGNORE INTO schema_versions (version, applied_at, description) VALUES (?, ?, ?)'
- ).run(CURRENT_SCHEMA_VERSION, Date.now(), 'Initial schema includes all migrations');
- }
- return new DatabaseConnection(db, dbPath, backend);
- }
- /**
- * Open an existing database
- */
- static open(dbPath: string): DatabaseConnection {
- if (!fs.existsSync(dbPath)) {
- throw new Error(`Database not found: ${dbPath}`);
- }
- const { db, backend } = createDatabase(dbPath);
- configureConnection(db);
- // Check and run migrations if needed
- const conn = new DatabaseConnection(db, dbPath, backend);
- const currentVersion = getCurrentVersion(db);
- if (currentVersion < CURRENT_SCHEMA_VERSION) {
- runMigrations(db, currentVersion);
- }
- return conn;
- }
- /**
- * Get the underlying database instance
- */
- getDb(): SqliteDatabase {
- return this.db;
- }
- /**
- * Get the SQLite backend serving this connection. Per-instance so
- * MCP cross-project queries report the right backend even when
- * multiple project DBs are open in the same process.
- */
- getBackend(): SqliteBackend {
- return this.backend;
- }
- /**
- * Get database file path
- */
- getPath(): string {
- return this.dbPath;
- }
- /**
- * The journal mode actually in effect (e.g. 'wal', 'delete').
- *
- * SQLite silently keeps the prior mode if WAL can't be enabled — e.g. on
- * filesystems without shared-memory support (some network/virtualized mounts,
- * WSL2 /mnt), and always on the wasm backend. So the effective mode can differ
- * from what `configureConnection` requested. Surfaced in `codegraph status` so
- * a "database is locked" report is triageable: 'wal' ⇒ readers never block on a
- * writer; anything else ⇒ they can. See issue #238.
- */
- getJournalMode(): string {
- const raw = this.db.pragma('journal_mode');
- const row = Array.isArray(raw) ? raw[0] : raw;
- const mode = row && typeof row === 'object'
- ? (row as Record<string, unknown>).journal_mode
- : row;
- return String(mode ?? '').toLowerCase();
- }
- /**
- * Get current schema version
- */
- getSchemaVersion(): SchemaVersion | null {
- const row = this.db
- .prepare('SELECT version, applied_at, description FROM schema_versions ORDER BY version DESC LIMIT 1')
- .get() as { version: number; applied_at: number; description: string | null } | undefined;
- if (!row) return null;
- return {
- version: row.version,
- appliedAt: row.applied_at,
- description: row.description ?? undefined,
- };
- }
- /**
- * Execute a function within a transaction
- */
- transaction<T>(fn: () => T): T {
- return this.db.transaction(fn)();
- }
- /**
- * Get database file size in bytes
- */
- getSize(): number {
- const stats = fs.statSync(this.dbPath);
- return stats.size;
- }
- /**
- * Optimize database (vacuum and analyze)
- */
- optimize(): void {
- this.db.exec('VACUUM');
- this.db.exec('ANALYZE');
- }
- /**
- * Lightweight, non-blocking maintenance to run after bulk writes
- * (indexAll, sync). Two operations:
- *
- * - `PRAGMA optimize` — incremental ANALYZE; SQLite only re-analyzes
- * tables whose row counts changed materially since the last
- * ANALYZE. Without it, the query planner has no statistics on the
- * freshly-bulk-loaded tables and can pick suboptimal indexes.
- *
- * - `PRAGMA wal_checkpoint(PASSIVE)` — fold pending WAL pages back
- * into the main database file so the WAL file doesn't grow
- * unboundedly between automatic checkpoints (auto-fires at 1000
- * pages by default; large indexAll runs blow past that).
- *
- * Both operations are silently swallowed on failure — they're a
- * best-effort optimization, never load-bearing for correctness.
- */
- runMaintenance(): void {
- try {
- this.db.exec('PRAGMA optimize');
- } catch {
- // ignore
- }
- try {
- this.db.exec('PRAGMA wal_checkpoint(PASSIVE)');
- } catch {
- // ignore (e.g., not in WAL mode)
- }
- }
- /**
- * Close the database connection
- */
- close(): void {
- this.db.close();
- }
- /**
- * Check if the database connection is open
- */
- isOpen(): boolean {
- return this.db.open;
- }
- }
- /**
- * Default database filename
- */
- export const DATABASE_FILENAME = 'codegraph.db';
- /**
- * Get the default database path for a project
- */
- export function getDatabasePath(projectRoot: string): string {
- return path.join(getCodeGraphDir(projectRoot), DATABASE_FILENAME);
- }
|