sql_state_manager.py 19 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566
  1. #!/usr/bin/env python3
  2. # -*- coding: utf-8 -*-
  3. """
  4. SQL State Manager - SQLite 状态管理模块 (v5.4)
  5. 基于 IndexManager 扩展,提供与 StateManager 兼容的高级接口,
  6. 将大数据(实体、别名、状态变化、关系)存储到 SQLite 而非 JSON。
  7. 目标(v5.1 引入,v5.4 沿用):
  8. - 替代 state.json 中的大数据字段
  9. - 保持与 Data Agent / Context Agent 的接口兼容
  10. - 支持增量写入和按需查询
  11. """
  12. import json
  13. from typing import Dict, List, Optional, Any
  14. from dataclasses import dataclass, field
  15. from datetime import datetime
  16. from .index_manager import (
  17. IndexManager,
  18. EntityMeta,
  19. StateChangeMeta,
  20. RelationshipMeta
  21. )
  22. from .config import get_config
  23. @dataclass
  24. class EntityData:
  25. """实体数据(用于 Data Agent 输入)"""
  26. id: str
  27. type: str # 角色/地点/物品/势力/招式
  28. name: str
  29. tier: str = "装饰"
  30. desc: str = ""
  31. current: Dict[str, Any] = field(default_factory=dict)
  32. aliases: List[str] = field(default_factory=list)
  33. first_appearance: int = 0
  34. last_appearance: int = 0
  35. is_protagonist: bool = False
  36. class SQLStateManager:
  37. """
  38. SQLite 状态管理器(v5.1 引入,v5.4 沿用)
  39. 提供与 StateManager 兼容的接口,但数据存储在 SQLite (index.db) 中。
  40. 用于替代 state.json 中膨胀的数据结构。
  41. 用法:
  42. ```python
  43. manager = SQLStateManager(config)
  44. # 写入实体
  45. manager.upsert_entity(EntityData(
  46. id="xiaoyan",
  47. type="角色",
  48. name="萧炎",
  49. tier="核心",
  50. current={"realm": "斗师", "location": "天云宗"},
  51. aliases=["小炎子", "废柴"],
  52. is_protagonist=True
  53. ))
  54. # 写入状态变化
  55. manager.record_state_change(
  56. entity_id="xiaoyan",
  57. field="realm",
  58. old_value="斗者",
  59. new_value="斗师",
  60. reason="闭关突破",
  61. chapter=100
  62. )
  63. # 写入关系
  64. manager.upsert_relationship(
  65. from_entity="xiaoyan",
  66. to_entity="yaolao",
  67. type="师徒",
  68. description="药老收萧炎为徒",
  69. chapter=5
  70. )
  71. # 读取
  72. protagonist = manager.get_protagonist()
  73. core_entities = manager.get_core_entities()
  74. changes = manager.get_recent_state_changes(limit=50)
  75. ```
  76. """
  77. # v5.0 引入的实体类型
  78. ENTITY_TYPES = ["角色", "地点", "物品", "势力", "招式"]
  79. def __init__(self, config=None):
  80. self.config = config or get_config()
  81. self._index_manager = IndexManager(config)
  82. # ==================== 实体操作 ====================
  83. def upsert_entity(self, entity: EntityData) -> bool:
  84. """
  85. 插入或更新实体
  86. 自动处理:
  87. - 实体基本信息写入 entities 表
  88. - 别名写入 aliases 表
  89. - canonical_name 自动添加为别名
  90. 返回: 是否为新实体
  91. """
  92. # 构建 EntityMeta
  93. meta = EntityMeta(
  94. id=entity.id,
  95. type=entity.type,
  96. canonical_name=entity.name,
  97. tier=entity.tier,
  98. desc=entity.desc,
  99. current=entity.current,
  100. first_appearance=entity.first_appearance,
  101. last_appearance=entity.last_appearance,
  102. is_protagonist=entity.is_protagonist,
  103. is_archived=False
  104. )
  105. is_new = self._index_manager.upsert_entity(meta)
  106. # 注册别名
  107. # 1. canonical_name 本身作为别名
  108. self._index_manager.register_alias(entity.name, entity.id, entity.type)
  109. # 2. 其他别名
  110. for alias in entity.aliases:
  111. if alias and alias != entity.name:
  112. self._index_manager.register_alias(alias, entity.id, entity.type)
  113. return is_new
  114. def get_entity(self, entity_id: str) -> Optional[Dict]:
  115. """获取实体详情"""
  116. entity = self._index_manager.get_entity(entity_id)
  117. if entity:
  118. # 添加别名
  119. entity["aliases"] = self._index_manager.get_entity_aliases(entity_id)
  120. return entity
  121. def get_entities_by_type(self, entity_type: str, include_archived: bool = False) -> List[Dict]:
  122. """按类型获取实体"""
  123. entities = self._index_manager.get_entities_by_type(entity_type, include_archived)
  124. for e in entities:
  125. e["aliases"] = self._index_manager.get_entity_aliases(e["id"])
  126. return entities
  127. def get_core_entities(self) -> List[Dict]:
  128. """
  129. 获取核心实体(用于 Context Agent 全量加载)
  130. 返回所有 tier=核心/重要 或 is_protagonist=1 的实体
  131. (次要/装饰实体按需查询,不全量加载)
  132. """
  133. entities = self._index_manager.get_core_entities()
  134. for e in entities:
  135. e["aliases"] = self._index_manager.get_entity_aliases(e["id"])
  136. return entities
  137. def get_protagonist(self) -> Optional[Dict]:
  138. """获取主角实体"""
  139. protagonist = self._index_manager.get_protagonist()
  140. if protagonist:
  141. protagonist["aliases"] = self._index_manager.get_entity_aliases(protagonist["id"])
  142. return protagonist
  143. def update_entity_current(self, entity_id: str, updates: Dict) -> bool:
  144. """增量更新实体的 current 字段"""
  145. return self._index_manager.update_entity_current(entity_id, updates)
  146. def resolve_alias(self, alias: str) -> List[Dict]:
  147. """
  148. 根据别名解析实体(一对多)
  149. 返回所有匹配的实体
  150. """
  151. return self._index_manager.get_entities_by_alias(alias)
  152. def register_alias(self, alias: str, entity_id: str, entity_type: str) -> bool:
  153. """注册别名"""
  154. return self._index_manager.register_alias(alias, entity_id, entity_type)
  155. # ==================== 状态变化操作 ====================
  156. def record_state_change(
  157. self,
  158. entity_id: str,
  159. field: str,
  160. old_value: Any,
  161. new_value: Any,
  162. reason: str,
  163. chapter: int
  164. ) -> int:
  165. """
  166. 记录状态变化
  167. 返回: 记录 ID
  168. """
  169. change = StateChangeMeta(
  170. entity_id=entity_id,
  171. field=field,
  172. old_value=str(old_value) if old_value is not None else "",
  173. new_value=str(new_value),
  174. reason=reason,
  175. chapter=chapter
  176. )
  177. return self._index_manager.record_state_change(change)
  178. def get_entity_state_changes(self, entity_id: str, limit: int = 20) -> List[Dict]:
  179. """获取实体的状态变化历史"""
  180. return self._index_manager.get_entity_state_changes(entity_id, limit)
  181. def get_recent_state_changes(self, limit: int = 50) -> List[Dict]:
  182. """获取最近的状态变化"""
  183. return self._index_manager.get_recent_state_changes(limit)
  184. def get_chapter_state_changes(self, chapter: int) -> List[Dict]:
  185. """获取某章的所有状态变化"""
  186. return self._index_manager.get_chapter_state_changes(chapter)
  187. # ==================== 关系操作 ====================
  188. def upsert_relationship(
  189. self,
  190. from_entity: str,
  191. to_entity: str,
  192. type: str,
  193. description: str,
  194. chapter: int
  195. ) -> bool:
  196. """
  197. 插入或更新关系
  198. 返回: 是否为新关系
  199. """
  200. rel = RelationshipMeta(
  201. from_entity=from_entity,
  202. to_entity=to_entity,
  203. type=type,
  204. description=description,
  205. chapter=chapter
  206. )
  207. return self._index_manager.upsert_relationship(rel)
  208. def get_entity_relationships(self, entity_id: str, direction: str = "both") -> List[Dict]:
  209. """获取实体的关系"""
  210. return self._index_manager.get_entity_relationships(entity_id, direction)
  211. def get_relationship_between(self, entity1: str, entity2: str) -> List[Dict]:
  212. """获取两个实体之间的所有关系"""
  213. return self._index_manager.get_relationship_between(entity1, entity2)
  214. def get_recent_relationships(self, limit: int = 30) -> List[Dict]:
  215. """获取最近建立的关系"""
  216. return self._index_manager.get_recent_relationships(limit)
  217. # ==================== 批量写入(供 Data Agent 使用) ====================
  218. def process_chapter_entities(
  219. self,
  220. chapter: int,
  221. entities_appeared: List[Dict],
  222. entities_new: List[Dict],
  223. state_changes: List[Dict],
  224. relationships_new: List[Dict]
  225. ) -> Dict[str, int]:
  226. """
  227. 处理章节的实体数据(Data Agent 主入口)
  228. 参数:
  229. - chapter: 章节号
  230. - entities_appeared: 出场的已有实体
  231. [{"id": "xiaoyan", "type": "角色", "mentions": ["萧炎", "他"], "confidence": 0.95}]
  232. - entities_new: 新发现的实体
  233. [{"suggested_id": "hongyi_girl", "name": "红衣女子", "type": "角色", "tier": "装饰"}]
  234. - state_changes: 状态变化
  235. [{"entity_id": "xiaoyan", "field": "realm", "old": "斗者", "new": "斗师", "reason": "突破"}]
  236. - relationships_new: 新关系
  237. [{"from": "xiaoyan", "to": "hongyi_girl", "type": "相识", "description": "初次见面"}]
  238. 返回: 写入统计
  239. """
  240. stats = {
  241. "entities_updated": 0,
  242. "entities_created": 0,
  243. "state_changes": 0,
  244. "relationships": 0,
  245. "aliases": 0
  246. }
  247. # 1. 处理出场实体(更新 last_appearance)
  248. for entity in entities_appeared:
  249. entity_id = entity.get("id")
  250. if not entity_id:
  251. continue
  252. self._index_manager.update_entity_current(entity_id, {}) # 触发 updated_at
  253. # 更新 last_appearance
  254. existing = self._index_manager.get_entity(entity_id)
  255. if existing:
  256. # 使用 SQL 直接更新 last_appearance
  257. self._update_last_appearance(entity_id, chapter)
  258. stats["entities_updated"] += 1
  259. # 记录出场(保留原有逻辑)
  260. self._index_manager.record_appearance(
  261. entity_id=entity_id,
  262. chapter=chapter,
  263. mentions=entity.get("mentions", []),
  264. confidence=entity.get("confidence", 1.0)
  265. )
  266. # 2. 处理新实体
  267. for entity in entities_new:
  268. suggested_id = entity.get("suggested_id") or entity.get("id")
  269. if not suggested_id:
  270. continue
  271. entity_data = EntityData(
  272. id=suggested_id,
  273. type=entity.get("type", "角色"),
  274. name=entity.get("name", suggested_id),
  275. tier=entity.get("tier", "装饰"),
  276. desc=entity.get("desc", ""),
  277. current=entity.get("current", {}),
  278. aliases=entity.get("aliases", []),
  279. first_appearance=chapter,
  280. last_appearance=chapter,
  281. is_protagonist=entity.get("is_protagonist", False)
  282. )
  283. is_new = self.upsert_entity(entity_data)
  284. if is_new:
  285. stats["entities_created"] += 1
  286. else:
  287. stats["entities_updated"] += 1
  288. # 统计别名
  289. stats["aliases"] += 1 + len(entity_data.aliases)
  290. # 记录新实体的首次出场(解决 appearances 缺失问题)
  291. mentions = entity.get("mentions", [])
  292. if not mentions:
  293. mentions = [entity_data.name] # 至少包含实体名
  294. self._index_manager.record_appearance(
  295. entity_id=suggested_id,
  296. chapter=chapter,
  297. mentions=mentions,
  298. confidence=entity.get("confidence", 1.0)
  299. )
  300. # 3. 处理状态变化
  301. for change in state_changes:
  302. entity_id = change.get("entity_id")
  303. if not entity_id:
  304. continue
  305. self.record_state_change(
  306. entity_id=entity_id,
  307. field=change.get("field", ""),
  308. old_value=change.get("old", change.get("old_value", "")),
  309. new_value=change.get("new", change.get("new_value", "")),
  310. reason=change.get("reason", ""),
  311. chapter=chapter
  312. )
  313. stats["state_changes"] += 1
  314. # 同步更新实体的 current
  315. field_name = change.get("field")
  316. new_value = change.get("new", change.get("new_value"))
  317. # 注意:new_value 可能是 0/""/False 等 falsy 值,需要用 is not None 判断
  318. if field_name and new_value is not None:
  319. self._index_manager.update_entity_current(entity_id, {field_name: new_value})
  320. # 4. 处理新关系
  321. for rel in relationships_new:
  322. from_entity = rel.get("from", rel.get("from_entity"))
  323. to_entity = rel.get("to", rel.get("to_entity"))
  324. if not from_entity or not to_entity:
  325. continue
  326. self.upsert_relationship(
  327. from_entity=from_entity,
  328. to_entity=to_entity,
  329. type=rel.get("type", "相识"),
  330. description=rel.get("description", ""),
  331. chapter=chapter
  332. )
  333. stats["relationships"] += 1
  334. return stats
  335. def _update_last_appearance(self, entity_id: str, chapter: int):
  336. """更新实体的 last_appearance"""
  337. with self._index_manager._get_conn() as conn:
  338. cursor = conn.cursor()
  339. cursor.execute("""
  340. UPDATE entities SET
  341. last_appearance = MAX(last_appearance, ?),
  342. updated_at = CURRENT_TIMESTAMP
  343. WHERE id = ?
  344. """, (chapter, entity_id))
  345. conn.commit()
  346. # ==================== 统计 ====================
  347. def get_stats(self) -> Dict[str, int]:
  348. """获取统计信息"""
  349. return self._index_manager.get_stats()
  350. # ==================== 格式转换(兼容性) ====================
  351. def export_to_entities_v3_format(self) -> Dict[str, Dict[str, Dict]]:
  352. """
  353. 导出为 entities_v3 格式(用于兼容性)
  354. 返回: {"角色": {"xiaoyan": {...}}, "地点": {...}, ...}
  355. """
  356. result = {t: {} for t in self.ENTITY_TYPES}
  357. for entity_type in self.ENTITY_TYPES:
  358. entities = self.get_entities_by_type(entity_type, include_archived=True)
  359. for e in entities:
  360. entity_dict = {
  361. "canonical_name": e.get("canonical_name"),
  362. "name": e.get("canonical_name"), # 兼容性别名
  363. "tier": e.get("tier", "装饰"),
  364. "aliases": e.get("aliases", []),
  365. "desc": e.get("desc", ""),
  366. "current": e.get("current_json", {}),
  367. "history": [], # 历史记录需要从 state_changes 表查询
  368. "first_appearance": e.get("first_appearance", 0),
  369. "last_appearance": e.get("last_appearance", 0)
  370. }
  371. if e.get("is_protagonist"):
  372. entity_dict["is_protagonist"] = True
  373. result[entity_type][e["id"]] = entity_dict
  374. return result
  375. def export_to_alias_index_format(self) -> Dict[str, List[Dict[str, str]]]:
  376. """
  377. 导出为 alias_index 格式(用于兼容性)
  378. 返回: {"萧炎": [{"type": "角色", "id": "xiaoyan"}], ...}
  379. """
  380. result = {}
  381. with self._index_manager._get_conn() as conn:
  382. cursor = conn.cursor()
  383. cursor.execute("SELECT alias, entity_id, entity_type FROM aliases")
  384. for row in cursor.fetchall():
  385. alias = row["alias"]
  386. if alias not in result:
  387. result[alias] = []
  388. result[alias].append({
  389. "type": row["entity_type"],
  390. "id": row["entity_id"]
  391. })
  392. return result
  393. # ==================== CLI 接口 ====================
  394. def main():
  395. import argparse
  396. from .cli_output import print_success, print_error
  397. from .index_manager import IndexManager
  398. parser = argparse.ArgumentParser(description="SQL State Manager CLI (v5.4)")
  399. parser.add_argument("--project-root", type=str, help="项目根目录")
  400. subparsers = parser.add_subparsers(dest="command")
  401. # 获取统计
  402. subparsers.add_parser("stats")
  403. # 获取主角
  404. subparsers.add_parser("get-protagonist")
  405. # 获取核心实体
  406. subparsers.add_parser("get-core-entities")
  407. # 导出 entities_v3 格式
  408. subparsers.add_parser("export-entities-v3")
  409. # 导出 alias_index 格式
  410. subparsers.add_parser("export-alias-index")
  411. # 处理章节数据
  412. process_parser = subparsers.add_parser("process-chapter")
  413. process_parser.add_argument("--chapter", type=int, required=True)
  414. process_parser.add_argument("--data", required=True, help="JSON 格式的章节数据")
  415. args = parser.parse_args()
  416. # 初始化
  417. config = None
  418. if args.project_root:
  419. from .config import DataModulesConfig
  420. config = DataModulesConfig.from_project_root(args.project_root)
  421. manager = SQLStateManager(config)
  422. logger = IndexManager(config)
  423. tool_name = f"sql_state_manager:{args.command or 'unknown'}"
  424. def emit_success(data=None, message: str = "ok"):
  425. print_success(data, message=message)
  426. try:
  427. logger.log_tool_call(tool_name, True)
  428. except Exception:
  429. pass
  430. def emit_error(code: str, message: str, suggestion: str | None = None):
  431. print_error(code, message, suggestion=suggestion)
  432. try:
  433. logger.log_tool_call(tool_name, False, error_code=code, error_message=message)
  434. except Exception:
  435. pass
  436. if args.command == "stats":
  437. stats = manager.get_stats()
  438. emit_success(stats, message="stats")
  439. elif args.command == "get-protagonist":
  440. protagonist = manager.get_protagonist()
  441. if protagonist:
  442. emit_success(protagonist, message="protagonist")
  443. else:
  444. emit_error("NOT_FOUND", "未设置主角")
  445. elif args.command == "get-core-entities":
  446. entities = manager.get_core_entities()
  447. emit_success(entities, message="core_entities")
  448. elif args.command == "export-entities-v3":
  449. data = manager.export_to_entities_v3_format()
  450. emit_success(data, message="entities_v3")
  451. elif args.command == "export-alias-index":
  452. data = manager.export_to_alias_index_format()
  453. emit_success(data, message="alias_index")
  454. elif args.command == "process-chapter":
  455. data = json.loads(args.data)
  456. stats = manager.process_chapter_entities(
  457. chapter=args.chapter,
  458. entities_appeared=data.get("entities_appeared", []),
  459. entities_new=data.get("entities_new", []),
  460. state_changes=data.get("state_changes", []),
  461. relationships_new=data.get("relationships_new", []),
  462. )
  463. emit_success(stats, message="chapter_processed")
  464. else:
  465. emit_error("UNKNOWN_COMMAND", "未指定有效命令", suggestion="请查看 --help")
  466. if __name__ == "__main__":
  467. main()