test_context_manager.py 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528
  1. #!/usr/bin/env python3
  2. # -*- coding: utf-8 -*-
  3. """
  4. ContextManager and SnapshotManager tests
  5. """
  6. import json
  7. import logging
  8. import pytest
  9. from data_modules.config import DataModulesConfig
  10. from data_modules.index_manager import (
  11. IndexManager,
  12. EntityMeta,
  13. ChapterReadingPowerMeta,
  14. ReviewMetrics,
  15. )
  16. from data_modules.context_manager import ContextManager
  17. from data_modules.snapshot_manager import SnapshotManager, SnapshotVersionMismatch
  18. from data_modules.query_router import QueryRouter
  19. @pytest.fixture
  20. def temp_project(tmp_path):
  21. cfg = DataModulesConfig.from_project_root(tmp_path)
  22. cfg.ensure_dirs()
  23. return cfg
  24. def test_snapshot_manager_roundtrip(temp_project):
  25. manager = SnapshotManager(temp_project)
  26. payload = {"hello": "world"}
  27. manager.save_snapshot(1, payload)
  28. loaded = manager.load_snapshot(1)
  29. assert loaded["payload"] == payload
  30. def test_snapshot_version_mismatch(temp_project):
  31. manager = SnapshotManager(temp_project, version="1.0")
  32. manager.save_snapshot(1, {"a": 1})
  33. other = SnapshotManager(temp_project, version="2.0")
  34. with pytest.raises(SnapshotVersionMismatch):
  35. other.load_snapshot(1)
  36. def test_context_manager_build_and_filter(temp_project):
  37. state = {
  38. "protagonist_state": {"name": "萧炎", "location": {"current": "天云宗"}},
  39. "chapter_meta": {"0001": {"hook": "测试"}},
  40. }
  41. temp_project.state_file.write_text(json.dumps(state, ensure_ascii=False), encoding="utf-8")
  42. # preferences and memory
  43. (temp_project.webnovel_dir / "preferences.json").write_text(json.dumps({"tone": "热血"}, ensure_ascii=False), encoding="utf-8")
  44. (temp_project.webnovel_dir / "project_memory.json").write_text(json.dumps({"patterns": []}, ensure_ascii=False), encoding="utf-8")
  45. idx = IndexManager(temp_project)
  46. idx.upsert_entity(
  47. EntityMeta(
  48. id="xiaoyan",
  49. type="角色",
  50. canonical_name="萧炎",
  51. current={},
  52. first_appearance=1,
  53. last_appearance=1,
  54. )
  55. )
  56. idx.upsert_entity(
  57. EntityMeta(
  58. id="bad",
  59. type="角色",
  60. canonical_name="坏人",
  61. current={},
  62. first_appearance=1,
  63. last_appearance=1,
  64. )
  65. )
  66. idx.record_appearance("xiaoyan", 1, ["萧炎"], 1.0)
  67. idx.record_appearance("bad", 1, ["坏人"], 1.0)
  68. invalid_id = idx.mark_invalid_fact("entity", "bad", "错误")
  69. idx.resolve_invalid_fact(invalid_id, "confirm")
  70. manager = ContextManager(temp_project)
  71. payload = manager.build_context(1, use_snapshot=False, save_snapshot=False)
  72. characters = payload["sections"]["scene"]["content"]["appearing_characters"]
  73. assert any(c.get("entity_id") == "xiaoyan" for c in characters)
  74. assert not any(c.get("entity_id") == "bad" for c in characters)
  75. assert payload["sections"]["preferences"]["content"].get("tone") == "热血"
  76. def test_query_router():
  77. router = QueryRouter()
  78. assert router.route("角色是谁") == "entity"
  79. assert router.route("发生了什么剧情") == "plot"
  80. assert "A" in router.split("A, B;C")
  81. def test_context_snapshot_respects_template(temp_project):
  82. state = {
  83. "protagonist_state": {"name": "萧炎"},
  84. "chapter_meta": {},
  85. "disambiguation_warnings": [],
  86. "disambiguation_pending": [],
  87. }
  88. temp_project.state_file.write_text(json.dumps(state, ensure_ascii=False), encoding="utf-8")
  89. manager = ContextManager(temp_project)
  90. plot_payload = manager.build_context(1, template="plot", use_snapshot=True, save_snapshot=True)
  91. battle_payload = manager.build_context(1, template="battle", use_snapshot=True, save_snapshot=True)
  92. assert plot_payload.get("template") == "plot"
  93. assert battle_payload.get("template") == "battle"
  94. def test_context_manager_applies_ranker_and_contract_meta(temp_project):
  95. state = {
  96. "protagonist_state": {"name": "萧炎"},
  97. "chapter_meta": {
  98. "0002": {"hook": "平稳"},
  99. "0003": {"hook": "留下悬念"},
  100. },
  101. "disambiguation_warnings": [
  102. {"chapter": 1, "message": "普通告警"},
  103. {"chapter": 3, "message": "critical 冲突告警", "severity": "high"},
  104. ],
  105. "disambiguation_pending": [],
  106. }
  107. temp_project.state_file.write_text(json.dumps(state, ensure_ascii=False), encoding="utf-8")
  108. manager = ContextManager(temp_project)
  109. payload = manager.build_context(4, use_snapshot=False, save_snapshot=False)
  110. assert payload["meta"].get("context_contract_version") == "v2"
  111. recent_meta = payload["sections"]["core"]["content"]["recent_meta"]
  112. if recent_meta:
  113. assert recent_meta[0]["chapter"] == 3
  114. warnings = payload["sections"]["alerts"]["content"]["disambiguation_warnings"]
  115. if warnings and isinstance(warnings[0], dict):
  116. assert "critical" in str(warnings[0].get("message", "")) or warnings[0].get("severity") == "high"
  117. def test_context_manager_includes_reader_signal_and_genre_profile(temp_project):
  118. state = {
  119. "project": {"genre": "xuanhuan"},
  120. "protagonist_state": {"name": "萧炎"},
  121. "chapter_meta": {},
  122. "disambiguation_warnings": [],
  123. "disambiguation_pending": [],
  124. }
  125. temp_project.state_file.write_text(json.dumps(state, ensure_ascii=False), encoding="utf-8")
  126. idx = IndexManager(temp_project)
  127. idx.save_chapter_reading_power(
  128. ChapterReadingPowerMeta(
  129. chapter=3,
  130. hook_type="悬念钩",
  131. hook_strength="strong",
  132. coolpoint_patterns=["身份掉马"],
  133. )
  134. )
  135. idx.save_review_metrics(
  136. ReviewMetrics(
  137. start_chapter=1,
  138. end_chapter=3,
  139. overall_score=72,
  140. dimension_scores={"plot": 72},
  141. severity_counts={"high": 1},
  142. critical_issues=["节奏拖沓"],
  143. )
  144. )
  145. manager = ContextManager(temp_project)
  146. payload = manager.build_context(4, use_snapshot=False, save_snapshot=False)
  147. reader_signal = payload["sections"]["reader_signal"]["content"]
  148. assert "recent_reading_power" in reader_signal
  149. assert "pattern_usage" in reader_signal
  150. assert "hook_type_usage" in reader_signal
  151. assert "review_trend" in reader_signal
  152. assert isinstance(reader_signal.get("low_score_ranges"), list)
  153. genre_profile = payload["sections"]["genre_profile"]["content"]
  154. assert genre_profile.get("genre") == "xuanhuan"
  155. assert "profile_excerpt" in genre_profile
  156. assert "taxonomy_excerpt" in genre_profile
  157. def test_context_manager_genre_section_and_refs_extraction(temp_project):
  158. refs_dir = temp_project.project_root / ".claude" / "references"
  159. refs_dir.mkdir(parents=True, exist_ok=True)
  160. (refs_dir / "genre-profiles.md").write_text(
  161. """
  162. ## shuangwen
  163. - 节奏快
  164. - 打脸密集
  165. ## xuanhuan
  166. - 升级线清晰
  167. - 资源争夺
  168. """.strip(),
  169. encoding="utf-8",
  170. )
  171. (refs_dir / "reading-power-taxonomy.md").write_text(
  172. """
  173. ## xuanhuan
  174. - 钩子强度优先 strong
  175. - 爽点使用战力跨级
  176. """.strip(),
  177. encoding="utf-8",
  178. )
  179. manager = ContextManager(temp_project)
  180. profile = manager._load_genre_profile({"project": {"genre": "xuanhuan"}})
  181. assert profile["genre"] == "xuanhuan"
  182. assert "升级线清晰" in profile["profile_excerpt"]
  183. assert "钩子强度" in profile["taxonomy_excerpt"]
  184. assert isinstance(profile["reference_hints"], list)
  185. assert profile["reference_hints"]
  186. fallback_excerpt = manager._extract_genre_section("## a\n1\n## b\n2", "unknown")
  187. assert fallback_excerpt.startswith("## a")
  188. def test_context_manager_reader_signal_with_debt_and_disable_switch(temp_project):
  189. manager = ContextManager(temp_project)
  190. manager.config.context_reader_signal_include_debt = True
  191. signal = manager._load_reader_signal(chapter=5)
  192. assert "debt_summary" in signal
  193. manager.config.context_reader_signal_enabled = False
  194. assert manager._load_reader_signal(chapter=5) == {}
  195. manager.config.context_genre_profile_enabled = False
  196. assert manager._load_genre_profile({"project": {"genre": "xuanhuan"}}) == {}
  197. def test_context_manager_includes_writing_guidance(temp_project):
  198. state = {
  199. "project": {"genre": "xuanhuan"},
  200. "protagonist_state": {"name": "萧炎"},
  201. "chapter_meta": {},
  202. "disambiguation_warnings": [],
  203. "disambiguation_pending": [],
  204. }
  205. temp_project.state_file.write_text(json.dumps(state, ensure_ascii=False), encoding="utf-8")
  206. idx = IndexManager(temp_project)
  207. idx.save_chapter_reading_power(
  208. ChapterReadingPowerMeta(
  209. chapter=3,
  210. hook_type="悬念钩",
  211. hook_strength="strong",
  212. coolpoint_patterns=["身份掉马"],
  213. )
  214. )
  215. idx.save_review_metrics(
  216. ReviewMetrics(
  217. start_chapter=1,
  218. end_chapter=3,
  219. overall_score=70,
  220. dimension_scores={"plot": 70},
  221. severity_counts={"high": 1},
  222. critical_issues=["节奏拖沓"],
  223. )
  224. )
  225. manager = ContextManager(temp_project)
  226. payload = manager.build_context(4, use_snapshot=False, save_snapshot=False)
  227. guidance = payload["sections"]["writing_guidance"]["content"]
  228. assert guidance.get("chapter") == 4
  229. items = guidance.get("guidance_items") or []
  230. assert isinstance(items, list)
  231. assert items
  232. assert guidance.get("signals_used", {}).get("genre") == "xuanhuan"
  233. checklist = guidance.get("checklist") or []
  234. assert isinstance(checklist, list)
  235. assert checklist
  236. checklist_score = guidance.get("checklist_score") or {}
  237. assert isinstance(checklist_score, dict)
  238. assert "score" in checklist_score
  239. assert "completion_rate" in checklist_score
  240. first_item = checklist[0]
  241. assert isinstance(first_item, dict)
  242. assert {"id", "label", "weight", "required", "source", "verify_hint"}.issubset(first_item.keys())
  243. persisted = idx.get_writing_checklist_score(4)
  244. assert isinstance(persisted, dict)
  245. assert persisted.get("chapter") == 4
  246. assert persisted.get("score") is not None
  247. def test_context_manager_dynamic_weights_and_composite_genre(temp_project):
  248. refs_dir = temp_project.project_root / ".claude" / "references"
  249. refs_dir.mkdir(parents=True, exist_ok=True)
  250. (refs_dir / "genre-profiles.md").write_text(
  251. """
  252. ## xuanhuan
  253. - 升级线清晰
  254. ## realistic
  255. - 社会议题映射
  256. """.strip(),
  257. encoding="utf-8",
  258. )
  259. (refs_dir / "reading-power-taxonomy.md").write_text(
  260. """
  261. ## xuanhuan
  262. - 钩子强度优先
  263. ## realistic
  264. - 人物动机一致
  265. """.strip(),
  266. encoding="utf-8",
  267. )
  268. state = {
  269. "project": {"genre": "xuanhuan+realistic"},
  270. "protagonist_state": {"name": "萧炎"},
  271. "chapter_meta": {},
  272. "disambiguation_warnings": [],
  273. "disambiguation_pending": [],
  274. }
  275. temp_project.state_file.write_text(json.dumps(state, ensure_ascii=False), encoding="utf-8")
  276. manager = ContextManager(temp_project)
  277. payload_early = manager.build_context(10, template="plot", use_snapshot=False, save_snapshot=False)
  278. payload_late = manager.build_context(150, template="plot", use_snapshot=False, save_snapshot=False)
  279. assert payload_early.get("weights", {}).get("core") >= payload_late.get("weights", {}).get("core")
  280. assert payload_late.get("weights", {}).get("global") >= payload_early.get("weights", {}).get("global")
  281. assert payload_early.get("meta", {}).get("context_weight_stage") == "early"
  282. assert payload_late.get("meta", {}).get("context_weight_stage") == "late"
  283. profile = payload_early["sections"]["genre_profile"]["content"]
  284. assert profile.get("composite") is True
  285. assert profile.get("genre") == "xuanhuan"
  286. assert isinstance(profile.get("genres"), list)
  287. assert "realistic" in (profile.get("genres") or [])
  288. assert isinstance(profile.get("composite_hints"), list)
  289. assert profile.get("composite_hints")
  290. def test_context_manager_genre_alias_guidance_and_heading_extraction(temp_project):
  291. refs_dir = temp_project.project_root / ".claude" / "references"
  292. refs_dir.mkdir(parents=True, exist_ok=True)
  293. (refs_dir / "genre-profiles.md").write_text(
  294. """
  295. ### 电竞
  296. - 联赛升级
  297. ### 直播文
  298. - 反馈闭环
  299. ### 克苏鲁
  300. - 真相代价
  301. """.strip(),
  302. encoding="utf-8",
  303. )
  304. (refs_dir / "reading-power-taxonomy.md").write_text(
  305. """
  306. ### 电竞
  307. - 战术决策点
  308. """.strip(),
  309. encoding="utf-8",
  310. )
  311. state = {
  312. "project": {"genre": "电竞"},
  313. "protagonist_state": {"name": "林燃"},
  314. "chapter_meta": {},
  315. "disambiguation_warnings": [],
  316. "disambiguation_pending": [],
  317. }
  318. temp_project.state_file.write_text(json.dumps(state, ensure_ascii=False), encoding="utf-8")
  319. manager = ContextManager(temp_project)
  320. payload = manager.build_context(12, template="plot", use_snapshot=False, save_snapshot=False)
  321. guidance = payload["sections"]["writing_guidance"]["content"]
  322. items = guidance.get("guidance_items") or []
  323. assert any("战术决策点" in str(text) for text in items)
  324. assert any("网文节奏基线" in str(text) for text in items)
  325. assert any("兑现密度基线" in str(text) for text in items)
  326. def test_context_manager_genre_aliases_normalized_for_profile_lookup(temp_project):
  327. refs_dir = temp_project.project_root / ".claude" / "references"
  328. refs_dir.mkdir(parents=True, exist_ok=True)
  329. (refs_dir / "genre-profiles.md").write_text(
  330. """
  331. ## 电竞
  332. - 联赛升级
  333. ## 直播文
  334. - 实时反馈
  335. ## 克苏鲁
  336. - 真相代价
  337. """.strip(),
  338. encoding="utf-8",
  339. )
  340. (refs_dir / "reading-power-taxonomy.md").write_text(
  341. """
  342. ## 电竞
  343. - 决策后果
  344. ## 直播文
  345. - 数据闭环
  346. ## 克苏鲁
  347. - 规则优先
  348. """.strip(),
  349. encoding="utf-8",
  350. )
  351. manager = ContextManager(temp_project)
  352. assert manager._parse_genre_tokens("电竞文") == ["电竞"]
  353. assert manager._parse_genre_tokens("直播") == ["直播文"]
  354. assert manager._parse_genre_tokens("克系") == ["克苏鲁"]
  355. assert manager._parse_genre_tokens("修仙/玄幻") == ["修仙"]
  356. assert manager._parse_genre_tokens("都市修真") == ["都市异能"]
  357. assert manager._parse_genre_tokens("古言脑洞") == ["古言"]
  358. state = {
  359. "project": {"genre": "电竞文+直播"},
  360. "protagonist_state": {"name": "叶修"},
  361. "chapter_meta": {},
  362. "disambiguation_warnings": [],
  363. "disambiguation_pending": [],
  364. }
  365. temp_project.state_file.write_text(json.dumps(state, ensure_ascii=False), encoding="utf-8")
  366. payload = manager.build_context(20, template="plot", use_snapshot=False, save_snapshot=False)
  367. profile = payload["sections"]["genre_profile"]["content"]
  368. assert profile.get("genre") == "电竞"
  369. assert "直播文" in (profile.get("genres") or [])
  370. def test_context_manager_compact_text_truncation(temp_project):
  371. manager = ContextManager(temp_project)
  372. manager.config.context_compact_text_enabled = True
  373. manager.config.context_compact_min_budget = 80
  374. manager.config.context_compact_head_ratio = 0.6
  375. content = {"a": "x" * 200, "b": "y" * 200}
  376. compact = manager._compact_json_text(content, budget=120)
  377. assert len(compact) <= 120
  378. assert "[TRUNCATED]" in compact
  379. manager.config.context_compact_text_enabled = False
  380. raw_cut = manager._compact_json_text(content, budget=100)
  381. assert len(raw_cut) <= 100
  382. def test_context_manager_persist_writing_checklist_score_logs_failure(temp_project, monkeypatch, caplog):
  383. manager = ContextManager(temp_project)
  384. def _raise_save_error(_meta):
  385. raise RuntimeError("simulated save failure")
  386. monkeypatch.setattr(manager.index_manager, "save_writing_checklist_score", _raise_save_error)
  387. with caplog.at_level(logging.WARNING):
  388. manager._persist_writing_checklist_score(
  389. {
  390. "chapter": 6,
  391. "score": 70.0,
  392. "total_items": 3,
  393. "required_items": 1,
  394. "completed_items": 1,
  395. "completed_required": 1,
  396. "total_weight": 3.0,
  397. "completed_weight": 1.0,
  398. "completion_rate": 0.33,
  399. "pending_items": ["test"],
  400. }
  401. )
  402. message_text = "\n".join(record.getMessage() for record in caplog.records)
  403. assert "failed to persist writing checklist score" in message_text
  404. def test_context_manager_composite_genre_boundary_three_plus(temp_project):
  405. manager = ContextManager(temp_project)
  406. manager.config.context_genre_profile_support_composite = True
  407. manager.config.context_genre_profile_max_genres = 3
  408. genre_raw = "电竞文+直播+克系+修仙/玄幻+电竞文"
  409. tokens = manager._parse_genre_tokens(genre_raw)
  410. assert tokens[:4] == ["电竞", "直播文", "克苏鲁", "修仙"]
  411. state = {
  412. "project": {"genre": genre_raw},
  413. "protagonist_state": {"name": "主角"},
  414. "chapter_meta": {},
  415. "disambiguation_warnings": [],
  416. "disambiguation_pending": [],
  417. }
  418. profile = manager._load_genre_profile(state)
  419. assert profile.get("composite") is True
  420. assert profile.get("genres") == ["电竞", "直播文", "克苏鲁"]
  421. assert profile.get("secondary_genres") == ["直播文", "克苏鲁"]
  422. profile_again = manager._load_genre_profile(state)
  423. assert profile_again.get("genres") == profile.get("genres")
  424. def test_context_manager_dynamic_weights_from_config_override(temp_project):
  425. manager = ContextManager(temp_project)
  426. manager.config.context_dynamic_budget_enabled = True
  427. manager.config.context_template_weights_dynamic = {
  428. "early": {
  429. "plot": {"core": 0.60, "scene": 0.20, "global": 0.20},
  430. }
  431. }
  432. weights = manager._resolve_template_weights("plot", chapter=1)
  433. assert weights == {"core": 0.60, "scene": 0.20, "global": 0.20}