sql_state_manager.py 20 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594
  1. #!/usr/bin/env python3
  2. # -*- coding: utf-8 -*-
  3. """
  4. SQL State Manager - SQLite 状态管理模块 (v5.4)
  5. 基于 IndexManager 扩展,提供与 StateManager 兼容的高级接口,
  6. 将大数据(实体、别名、状态变化、关系)存储到 SQLite 而非 JSON。
  7. 目标(v5.1 引入,v5.4 沿用):
  8. - 替代 state.json 中的大数据字段
  9. - 保持与 Data Agent / Context Agent 的接口兼容
  10. - 支持增量写入和按需查询
  11. """
  12. import json
  13. from typing import Dict, List, Optional, Any
  14. from dataclasses import dataclass, field
  15. from datetime import datetime
  16. from .index_manager import (
  17. IndexManager,
  18. EntityMeta,
  19. StateChangeMeta,
  20. RelationshipMeta,
  21. RelationshipEventMeta,
  22. )
  23. from .config import get_config
  24. from .observability import safe_log_tool_call
  25. @dataclass
  26. class EntityData:
  27. """实体数据(用于 Data Agent 输入)"""
  28. id: str
  29. type: str # 角色/地点/物品/势力/招式
  30. name: str
  31. tier: str = "装饰"
  32. desc: str = ""
  33. current: Dict[str, Any] = field(default_factory=dict)
  34. aliases: List[str] = field(default_factory=list)
  35. first_appearance: int = 0
  36. last_appearance: int = 0
  37. is_protagonist: bool = False
  38. class SQLStateManager:
  39. """
  40. SQLite 状态管理器(v5.1 引入,v5.4 沿用)
  41. 提供与 StateManager 兼容的接口,但数据存储在 SQLite (index.db) 中。
  42. 用于替代 state.json 中膨胀的数据结构。
  43. 用法:
  44. ```python
  45. manager = SQLStateManager(config)
  46. # 写入实体
  47. manager.upsert_entity(EntityData(
  48. id="xiaoyan",
  49. type="角色",
  50. name="萧炎",
  51. tier="核心",
  52. current={"realm": "斗师", "location": "天云宗"},
  53. aliases=["小炎子", "废柴"],
  54. is_protagonist=True
  55. ))
  56. # 写入状态变化
  57. manager.record_state_change(
  58. entity_id="xiaoyan",
  59. field="realm",
  60. old_value="斗者",
  61. new_value="斗师",
  62. reason="闭关突破",
  63. chapter=100
  64. )
  65. # 写入关系
  66. manager.upsert_relationship(
  67. from_entity="xiaoyan",
  68. to_entity="yaolao",
  69. type="师徒",
  70. description="药老收萧炎为徒",
  71. chapter=5
  72. )
  73. # 读取
  74. protagonist = manager.get_protagonist()
  75. core_entities = manager.get_core_entities()
  76. changes = manager.get_recent_state_changes(limit=50)
  77. ```
  78. """
  79. # v5.0 引入的实体类型
  80. ENTITY_TYPES = ["角色", "地点", "物品", "势力", "招式"]
  81. def __init__(self, config=None):
  82. self.config = config or get_config()
  83. self._index_manager = IndexManager(config)
  84. # ==================== 实体操作 ====================
  85. def upsert_entity(self, entity: EntityData) -> bool:
  86. """
  87. 插入或更新实体
  88. 自动处理:
  89. - 实体基本信息写入 entities 表
  90. - 别名写入 aliases 表
  91. - canonical_name 自动添加为别名
  92. 返回: 是否为新实体
  93. """
  94. # 构建 EntityMeta
  95. meta = EntityMeta(
  96. id=entity.id,
  97. type=entity.type,
  98. canonical_name=entity.name,
  99. tier=entity.tier,
  100. desc=entity.desc,
  101. current=entity.current,
  102. first_appearance=entity.first_appearance,
  103. last_appearance=entity.last_appearance,
  104. is_protagonist=entity.is_protagonist,
  105. is_archived=False
  106. )
  107. is_new = self._index_manager.upsert_entity(meta)
  108. # 注册别名
  109. # 1. canonical_name 本身作为别名
  110. self._index_manager.register_alias(entity.name, entity.id, entity.type)
  111. # 2. 其他别名
  112. for alias in entity.aliases:
  113. if alias and alias != entity.name:
  114. self._index_manager.register_alias(alias, entity.id, entity.type)
  115. return is_new
  116. def get_entity(self, entity_id: str) -> Optional[Dict]:
  117. """获取实体详情"""
  118. entity = self._index_manager.get_entity(entity_id)
  119. if entity:
  120. # 添加别名
  121. entity["aliases"] = self._index_manager.get_entity_aliases(entity_id)
  122. return entity
  123. def get_entities_by_type(self, entity_type: str, include_archived: bool = False) -> List[Dict]:
  124. """按类型获取实体"""
  125. entities = self._index_manager.get_entities_by_type(entity_type, include_archived)
  126. for e in entities:
  127. e["aliases"] = self._index_manager.get_entity_aliases(e["id"])
  128. return entities
  129. def get_core_entities(self) -> List[Dict]:
  130. """
  131. 获取核心实体(用于 Context Agent 全量加载)
  132. 返回所有 tier=核心/重要 或 is_protagonist=1 的实体
  133. (次要/装饰实体按需查询,不全量加载)
  134. """
  135. entities = self._index_manager.get_core_entities()
  136. for e in entities:
  137. e["aliases"] = self._index_manager.get_entity_aliases(e["id"])
  138. return entities
  139. def get_protagonist(self) -> Optional[Dict]:
  140. """获取主角实体"""
  141. protagonist = self._index_manager.get_protagonist()
  142. if protagonist:
  143. protagonist["aliases"] = self._index_manager.get_entity_aliases(protagonist["id"])
  144. return protagonist
  145. def update_entity_current(self, entity_id: str, updates: Dict) -> bool:
  146. """增量更新实体的 current 字段"""
  147. return self._index_manager.update_entity_current(entity_id, updates)
  148. def resolve_alias(self, alias: str) -> List[Dict]:
  149. """
  150. 根据别名解析实体(一对多)
  151. 返回所有匹配的实体
  152. """
  153. return self._index_manager.get_entities_by_alias(alias)
  154. def register_alias(self, alias: str, entity_id: str, entity_type: str) -> bool:
  155. """注册别名"""
  156. return self._index_manager.register_alias(alias, entity_id, entity_type)
  157. # ==================== 状态变化操作 ====================
  158. def record_state_change(
  159. self,
  160. entity_id: str,
  161. field: str,
  162. old_value: Any,
  163. new_value: Any,
  164. reason: str,
  165. chapter: int
  166. ) -> int:
  167. """
  168. 记录状态变化
  169. 返回: 记录 ID
  170. """
  171. change = StateChangeMeta(
  172. entity_id=entity_id,
  173. field=field,
  174. old_value=str(old_value) if old_value is not None else "",
  175. new_value=str(new_value),
  176. reason=reason,
  177. chapter=chapter
  178. )
  179. return self._index_manager.record_state_change(change)
  180. def get_entity_state_changes(self, entity_id: str, limit: int = 20) -> List[Dict]:
  181. """获取实体的状态变化历史"""
  182. return self._index_manager.get_entity_state_changes(entity_id, limit)
  183. def get_recent_state_changes(self, limit: int = 50) -> List[Dict]:
  184. """获取最近的状态变化"""
  185. return self._index_manager.get_recent_state_changes(limit)
  186. def get_chapter_state_changes(self, chapter: int) -> List[Dict]:
  187. """获取某章的所有状态变化"""
  188. return self._index_manager.get_chapter_state_changes(chapter)
  189. # ==================== 关系操作 ====================
  190. def upsert_relationship(
  191. self,
  192. from_entity: str,
  193. to_entity: str,
  194. type: str,
  195. description: str,
  196. chapter: int
  197. ) -> bool:
  198. """
  199. 插入或更新关系
  200. 返回: 是否为新关系
  201. """
  202. rel = RelationshipMeta(
  203. from_entity=from_entity,
  204. to_entity=to_entity,
  205. type=type,
  206. description=description,
  207. chapter=chapter
  208. )
  209. return self._index_manager.upsert_relationship(rel)
  210. def get_entity_relationships(self, entity_id: str, direction: str = "both") -> List[Dict]:
  211. """获取实体的关系"""
  212. return self._index_manager.get_entity_relationships(entity_id, direction)
  213. def get_relationship_between(self, entity1: str, entity2: str) -> List[Dict]:
  214. """获取两个实体之间的所有关系"""
  215. return self._index_manager.get_relationship_between(entity1, entity2)
  216. def get_recent_relationships(self, limit: int = 30) -> List[Dict]:
  217. """获取最近建立的关系"""
  218. return self._index_manager.get_recent_relationships(limit)
  219. # ==================== 批量写入(供 Data Agent 使用) ====================
  220. def process_chapter_entities(
  221. self,
  222. chapter: int,
  223. entities_appeared: List[Dict],
  224. entities_new: List[Dict],
  225. state_changes: List[Dict],
  226. relationships_new: List[Dict]
  227. ) -> Dict[str, int]:
  228. """
  229. 处理章节的实体数据(Data Agent 主入口)
  230. 参数:
  231. - chapter: 章节号
  232. - entities_appeared: 出场的已有实体
  233. [{"id": "xiaoyan", "type": "角色", "mentions": ["萧炎", "他"], "confidence": 0.95}]
  234. - entities_new: 新发现的实体
  235. [{"suggested_id": "hongyi_girl", "name": "红衣女子", "type": "角色", "tier": "装饰"}]
  236. - state_changes: 状态变化
  237. [{"entity_id": "xiaoyan", "field": "realm", "old": "斗者", "new": "斗师", "reason": "突破"}]
  238. - relationships_new: 新关系
  239. [{"from": "xiaoyan", "to": "hongyi_girl", "type": "相识", "description": "初次见面"}]
  240. 返回: 写入统计
  241. """
  242. stats = {
  243. "entities_updated": 0,
  244. "entities_created": 0,
  245. "state_changes": 0,
  246. "relationships": 0,
  247. "aliases": 0
  248. }
  249. # 1. 处理出场实体(更新 last_appearance)
  250. for entity in entities_appeared:
  251. entity_id = entity.get("id")
  252. if not entity_id:
  253. continue
  254. self._index_manager.update_entity_current(entity_id, {}) # 触发 updated_at
  255. # 更新 last_appearance
  256. existing = self._index_manager.get_entity(entity_id)
  257. if existing:
  258. # 使用 SQL 直接更新 last_appearance
  259. self._update_last_appearance(entity_id, chapter)
  260. stats["entities_updated"] += 1
  261. # 记录出场(保留原有逻辑)
  262. self._index_manager.record_appearance(
  263. entity_id=entity_id,
  264. chapter=chapter,
  265. mentions=entity.get("mentions", []),
  266. confidence=entity.get("confidence", 1.0)
  267. )
  268. # 2. 处理新实体
  269. for entity in entities_new:
  270. suggested_id = entity.get("suggested_id") or entity.get("id")
  271. if not suggested_id:
  272. continue
  273. entity_data = EntityData(
  274. id=suggested_id,
  275. type=entity.get("type", "角色"),
  276. name=entity.get("name", suggested_id),
  277. tier=entity.get("tier", "装饰"),
  278. desc=entity.get("desc", ""),
  279. current=entity.get("current", {}),
  280. aliases=entity.get("aliases", []),
  281. first_appearance=chapter,
  282. last_appearance=chapter,
  283. is_protagonist=entity.get("is_protagonist", False)
  284. )
  285. is_new = self.upsert_entity(entity_data)
  286. if is_new:
  287. stats["entities_created"] += 1
  288. else:
  289. stats["entities_updated"] += 1
  290. # 统计别名
  291. stats["aliases"] += 1 + len(entity_data.aliases)
  292. # 记录新实体的首次出场(解决 appearances 缺失问题)
  293. mentions = entity.get("mentions", [])
  294. if not mentions:
  295. mentions = [entity_data.name] # 至少包含实体名
  296. self._index_manager.record_appearance(
  297. entity_id=suggested_id,
  298. chapter=chapter,
  299. mentions=mentions,
  300. confidence=entity.get("confidence", 1.0)
  301. )
  302. # 3. 处理状态变化
  303. for change in state_changes:
  304. entity_id = change.get("entity_id")
  305. if not entity_id:
  306. continue
  307. self.record_state_change(
  308. entity_id=entity_id,
  309. field=change.get("field", ""),
  310. old_value=change.get("old", change.get("old_value", "")),
  311. new_value=change.get("new", change.get("new_value", "")),
  312. reason=change.get("reason", ""),
  313. chapter=chapter
  314. )
  315. stats["state_changes"] += 1
  316. # 同步更新实体的 current
  317. field_name = change.get("field")
  318. new_value = change.get("new", change.get("new_value"))
  319. # 注意:new_value 可能是 0/""/False 等 falsy 值,需要用 is not None 判断
  320. if field_name and new_value is not None:
  321. self._index_manager.update_entity_current(entity_id, {field_name: new_value})
  322. # 4. 处理新关系
  323. for rel in relationships_new:
  324. from_entity = rel.get("from", rel.get("from_entity"))
  325. to_entity = rel.get("to", rel.get("to_entity"))
  326. if not from_entity or not to_entity:
  327. continue
  328. rel_type = rel.get("type", "相识")
  329. description = rel.get("description", "")
  330. # v5.5: 先记录关系事件,再更新关系快照
  331. self._index_manager.record_relationship_event(
  332. RelationshipEventMeta(
  333. from_entity=from_entity,
  334. to_entity=to_entity,
  335. type=rel_type,
  336. chapter=chapter,
  337. action=rel.get("action", "update"),
  338. polarity=rel.get("polarity", 0),
  339. strength=rel.get("strength", 0.5),
  340. description=description,
  341. scene_index=rel.get("scene_index", 0),
  342. evidence=rel.get("evidence", ""),
  343. confidence=rel.get("confidence", 1.0),
  344. )
  345. )
  346. self.upsert_relationship(
  347. from_entity=from_entity,
  348. to_entity=to_entity,
  349. type=rel_type,
  350. description=description,
  351. chapter=chapter
  352. )
  353. stats["relationships"] += 1
  354. return stats
  355. def _update_last_appearance(self, entity_id: str, chapter: int):
  356. """更新实体的 last_appearance"""
  357. with self._index_manager._get_conn() as conn:
  358. cursor = conn.cursor()
  359. cursor.execute("""
  360. UPDATE entities SET
  361. last_appearance = MAX(last_appearance, ?),
  362. updated_at = CURRENT_TIMESTAMP
  363. WHERE id = ?
  364. """, (chapter, entity_id))
  365. conn.commit()
  366. # ==================== 统计 ====================
  367. def get_stats(self) -> Dict[str, int]:
  368. """获取统计信息"""
  369. return self._index_manager.get_stats()
  370. # ==================== 格式转换(兼容性) ====================
  371. def export_to_entities_v3_format(self) -> Dict[str, Dict[str, Dict]]:
  372. """
  373. 导出为 entities_v3 格式(用于兼容性)
  374. 返回: {"角色": {"xiaoyan": {...}}, "地点": {...}, ...}
  375. """
  376. result = {t: {} for t in self.ENTITY_TYPES}
  377. for entity_type in self.ENTITY_TYPES:
  378. entities = self.get_entities_by_type(entity_type, include_archived=True)
  379. for e in entities:
  380. entity_dict = {
  381. "canonical_name": e.get("canonical_name"),
  382. "name": e.get("canonical_name"), # 兼容性别名
  383. "tier": e.get("tier", "装饰"),
  384. "aliases": e.get("aliases", []),
  385. "desc": e.get("desc", ""),
  386. "current": e.get("current_json", {}),
  387. "history": [], # 历史记录需要从 state_changes 表查询
  388. "first_appearance": e.get("first_appearance", 0),
  389. "last_appearance": e.get("last_appearance", 0)
  390. }
  391. if e.get("is_protagonist"):
  392. entity_dict["is_protagonist"] = True
  393. result[entity_type][e["id"]] = entity_dict
  394. return result
  395. def export_to_alias_index_format(self) -> Dict[str, List[Dict[str, str]]]:
  396. """
  397. 导出为 alias_index 格式(用于兼容性)
  398. 返回: {"萧炎": [{"type": "角色", "id": "xiaoyan"}], ...}
  399. """
  400. result = {}
  401. with self._index_manager._get_conn() as conn:
  402. cursor = conn.cursor()
  403. cursor.execute("SELECT alias, entity_id, entity_type FROM aliases")
  404. for row in cursor.fetchall():
  405. alias = row["alias"]
  406. if alias not in result:
  407. result[alias] = []
  408. result[alias].append({
  409. "type": row["entity_type"],
  410. "id": row["entity_id"]
  411. })
  412. return result
  413. # ==================== CLI 接口 ====================
  414. def main():
  415. import argparse
  416. import sys
  417. from .cli_output import print_success, print_error
  418. from .cli_args import normalize_global_project_root, load_json_arg
  419. from .index_manager import IndexManager
  420. parser = argparse.ArgumentParser(description="SQL State Manager CLI (v5.4)")
  421. parser.add_argument("--project-root", type=str, help="项目根目录")
  422. subparsers = parser.add_subparsers(dest="command")
  423. # 获取统计
  424. subparsers.add_parser("stats")
  425. # 获取主角
  426. subparsers.add_parser("get-protagonist")
  427. # 获取核心实体
  428. subparsers.add_parser("get-core-entities")
  429. # 导出 entities_v3 格式
  430. subparsers.add_parser("export-entities-v3")
  431. # 导出 alias_index 格式
  432. subparsers.add_parser("export-alias-index")
  433. # 处理章节数据
  434. process_parser = subparsers.add_parser("process-chapter")
  435. process_parser.add_argument("--chapter", type=int, required=True)
  436. process_parser.add_argument("--data", required=True, help="JSON 格式的章节数据")
  437. argv = normalize_global_project_root(sys.argv[1:])
  438. args = parser.parse_args(argv)
  439. # 初始化
  440. config = None
  441. if args.project_root:
  442. # 允许传入“工作区根目录”,统一解析到真正的 book project_root(必须包含 .webnovel/state.json)
  443. from project_locator import resolve_project_root
  444. from .config import DataModulesConfig
  445. resolved_root = resolve_project_root(args.project_root)
  446. config = DataModulesConfig.from_project_root(resolved_root)
  447. manager = SQLStateManager(config)
  448. logger = IndexManager(config)
  449. tool_name = f"sql_state_manager:{args.command or 'unknown'}"
  450. def emit_success(data=None, message: str = "ok"):
  451. print_success(data, message=message)
  452. safe_log_tool_call(logger, tool_name=tool_name, success=True)
  453. def emit_error(code: str, message: str, suggestion: str | None = None):
  454. print_error(code, message, suggestion=suggestion)
  455. safe_log_tool_call(
  456. logger,
  457. tool_name=tool_name,
  458. success=False,
  459. error_code=code,
  460. error_message=message,
  461. )
  462. if args.command == "stats":
  463. stats = manager.get_stats()
  464. emit_success(stats, message="stats")
  465. elif args.command == "get-protagonist":
  466. protagonist = manager.get_protagonist()
  467. if protagonist:
  468. emit_success(protagonist, message="protagonist")
  469. else:
  470. emit_error("NOT_FOUND", "未设置主角")
  471. elif args.command == "get-core-entities":
  472. entities = manager.get_core_entities()
  473. emit_success(entities, message="core_entities")
  474. elif args.command == "export-entities-v3":
  475. data = manager.export_to_entities_v3_format()
  476. emit_success(data, message="entities_v3")
  477. elif args.command == "export-alias-index":
  478. data = manager.export_to_alias_index_format()
  479. emit_success(data, message="alias_index")
  480. elif args.command == "process-chapter":
  481. data = load_json_arg(args.data)
  482. stats = manager.process_chapter_entities(
  483. chapter=args.chapter,
  484. entities_appeared=data.get("entities_appeared", []),
  485. entities_new=data.get("entities_new", []),
  486. state_changes=data.get("state_changes", []),
  487. relationships_new=data.get("relationships_new", []),
  488. )
  489. emit_success(stats, message="chapter_processed")
  490. else:
  491. emit_error("UNKNOWN_COMMAND", "未指定有效命令", suggestion="请查看 --help")
  492. if __name__ == "__main__":
  493. main()