test_context_manager.py 19 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559
  1. #!/usr/bin/env python3
  2. # -*- coding: utf-8 -*-
  3. """
  4. ContextManager and SnapshotManager tests
  5. """
  6. import json
  7. import logging
  8. import pytest
  9. from data_modules.config import DataModulesConfig
  10. from data_modules.index_manager import (
  11. IndexManager,
  12. EntityMeta,
  13. ChapterReadingPowerMeta,
  14. ReviewMetrics,
  15. )
  16. from data_modules.context_manager import ContextManager
  17. from data_modules.snapshot_manager import SnapshotManager, SnapshotVersionMismatch
  18. from data_modules.query_router import QueryRouter
  19. @pytest.fixture
  20. def temp_project(tmp_path):
  21. cfg = DataModulesConfig.from_project_root(tmp_path)
  22. cfg.ensure_dirs()
  23. return cfg
  24. def test_snapshot_manager_roundtrip(temp_project):
  25. manager = SnapshotManager(temp_project)
  26. payload = {"hello": "world"}
  27. manager.save_snapshot(1, payload)
  28. loaded = manager.load_snapshot(1)
  29. assert loaded["payload"] == payload
  30. def test_snapshot_version_mismatch(temp_project):
  31. manager = SnapshotManager(temp_project, version="1.0")
  32. manager.save_snapshot(1, {"a": 1})
  33. other = SnapshotManager(temp_project, version="2.0")
  34. with pytest.raises(SnapshotVersionMismatch):
  35. other.load_snapshot(1)
  36. def test_snapshot_delete_roundtrip(temp_project):
  37. manager = SnapshotManager(temp_project)
  38. manager.save_snapshot(2, {"x": 1})
  39. assert manager.delete_snapshot(2) is True
  40. assert manager.load_snapshot(2) is None
  41. def test_context_manager_build_and_filter(temp_project):
  42. state = {
  43. "protagonist_state": {"name": "萧炎", "location": {"current": "天云宗"}},
  44. "chapter_meta": {"0001": {"hook": "测试"}},
  45. }
  46. temp_project.state_file.write_text(json.dumps(state, ensure_ascii=False), encoding="utf-8")
  47. # preferences and memory
  48. (temp_project.webnovel_dir / "preferences.json").write_text(json.dumps({"tone": "热血"}, ensure_ascii=False), encoding="utf-8")
  49. (temp_project.webnovel_dir / "project_memory.json").write_text(json.dumps({"patterns": []}, ensure_ascii=False), encoding="utf-8")
  50. idx = IndexManager(temp_project)
  51. idx.upsert_entity(
  52. EntityMeta(
  53. id="xiaoyan",
  54. type="角色",
  55. canonical_name="萧炎",
  56. current={},
  57. first_appearance=1,
  58. last_appearance=1,
  59. )
  60. )
  61. idx.upsert_entity(
  62. EntityMeta(
  63. id="bad",
  64. type="角色",
  65. canonical_name="坏人",
  66. current={},
  67. first_appearance=1,
  68. last_appearance=1,
  69. )
  70. )
  71. idx.record_appearance("xiaoyan", 1, ["萧炎"], 1.0)
  72. idx.record_appearance("bad", 1, ["坏人"], 1.0)
  73. invalid_id = idx.mark_invalid_fact("entity", "bad", "错误")
  74. idx.resolve_invalid_fact(invalid_id, "confirm")
  75. manager = ContextManager(temp_project)
  76. payload = manager.build_context(1, use_snapshot=False, save_snapshot=False)
  77. characters = payload["sections"]["scene"]["content"]["appearing_characters"]
  78. assert any(c.get("entity_id") == "xiaoyan" for c in characters)
  79. assert not any(c.get("entity_id") == "bad" for c in characters)
  80. assert payload["sections"]["preferences"]["content"].get("tone") == "热血"
  81. def test_query_router():
  82. router = QueryRouter()
  83. assert router.route("角色是谁") == "entity"
  84. assert router.route("发生了什么剧情") == "plot"
  85. assert "A" in router.split("A, B;C")
  86. def test_context_snapshot_respects_template(temp_project):
  87. state = {
  88. "protagonist_state": {"name": "萧炎"},
  89. "chapter_meta": {},
  90. "disambiguation_warnings": [],
  91. "disambiguation_pending": [],
  92. }
  93. temp_project.state_file.write_text(json.dumps(state, ensure_ascii=False), encoding="utf-8")
  94. manager = ContextManager(temp_project)
  95. plot_payload = manager.build_context(1, template="plot", use_snapshot=True, save_snapshot=True)
  96. battle_payload = manager.build_context(1, template="battle", use_snapshot=True, save_snapshot=True)
  97. assert plot_payload.get("template") == "plot"
  98. assert battle_payload.get("template") == "battle"
  99. def test_context_manager_applies_ranker_and_contract_meta(temp_project):
  100. state = {
  101. "protagonist_state": {"name": "萧炎"},
  102. "chapter_meta": {
  103. "0002": {"hook": "平稳"},
  104. "0003": {"hook": "留下悬念"},
  105. },
  106. "disambiguation_warnings": [
  107. {"chapter": 1, "message": "普通告警"},
  108. {"chapter": 3, "message": "critical 冲突告警", "severity": "high"},
  109. ],
  110. "disambiguation_pending": [],
  111. }
  112. temp_project.state_file.write_text(json.dumps(state, ensure_ascii=False), encoding="utf-8")
  113. manager = ContextManager(temp_project)
  114. payload = manager.build_context(4, use_snapshot=False, save_snapshot=False)
  115. assert payload["meta"].get("context_contract_version") == "v2"
  116. recent_meta = payload["sections"]["core"]["content"]["recent_meta"]
  117. if recent_meta:
  118. assert recent_meta[0]["chapter"] == 3
  119. warnings = payload["sections"]["alerts"]["content"]["disambiguation_warnings"]
  120. if warnings and isinstance(warnings[0], dict):
  121. assert "critical" in str(warnings[0].get("message", "")) or warnings[0].get("severity") == "high"
  122. def test_context_manager_includes_reader_signal_and_genre_profile(temp_project):
  123. state = {
  124. "project": {"genre": "xuanhuan"},
  125. "protagonist_state": {"name": "萧炎"},
  126. "chapter_meta": {},
  127. "disambiguation_warnings": [],
  128. "disambiguation_pending": [],
  129. }
  130. temp_project.state_file.write_text(json.dumps(state, ensure_ascii=False), encoding="utf-8")
  131. idx = IndexManager(temp_project)
  132. idx.save_chapter_reading_power(
  133. ChapterReadingPowerMeta(
  134. chapter=3,
  135. hook_type="悬念钩",
  136. hook_strength="strong",
  137. coolpoint_patterns=["身份掉马"],
  138. )
  139. )
  140. idx.save_review_metrics(
  141. ReviewMetrics(
  142. start_chapter=1,
  143. end_chapter=3,
  144. overall_score=72,
  145. dimension_scores={"plot": 72},
  146. severity_counts={"high": 1},
  147. critical_issues=["节奏拖沓"],
  148. )
  149. )
  150. manager = ContextManager(temp_project)
  151. payload = manager.build_context(4, use_snapshot=False, save_snapshot=False)
  152. reader_signal = payload["sections"]["reader_signal"]["content"]
  153. assert "recent_reading_power" in reader_signal
  154. assert "pattern_usage" in reader_signal
  155. assert "hook_type_usage" in reader_signal
  156. assert "review_trend" in reader_signal
  157. assert isinstance(reader_signal.get("low_score_ranges"), list)
  158. genre_profile = payload["sections"]["genre_profile"]["content"]
  159. assert genre_profile.get("genre") == "xuanhuan"
  160. assert "profile_excerpt" in genre_profile
  161. assert "taxonomy_excerpt" in genre_profile
  162. def test_context_manager_genre_section_and_refs_extraction(temp_project):
  163. refs_dir = temp_project.project_root / ".claude" / "references"
  164. refs_dir.mkdir(parents=True, exist_ok=True)
  165. (refs_dir / "genre-profiles.md").write_text(
  166. """
  167. ## shuangwen
  168. - 节奏快
  169. - 打脸密集
  170. ## xuanhuan
  171. - 升级线清晰
  172. - 资源争夺
  173. """.strip(),
  174. encoding="utf-8",
  175. )
  176. (refs_dir / "reading-power-taxonomy.md").write_text(
  177. """
  178. ## xuanhuan
  179. - 钩子强度优先 strong
  180. - 爽点使用战力跨级
  181. """.strip(),
  182. encoding="utf-8",
  183. )
  184. manager = ContextManager(temp_project)
  185. profile = manager._load_genre_profile({"project": {"genre": "xuanhuan"}})
  186. assert profile["genre"] == "xuanhuan"
  187. assert "升级线清晰" in profile["profile_excerpt"]
  188. assert "钩子强度" in profile["taxonomy_excerpt"]
  189. assert isinstance(profile["reference_hints"], list)
  190. assert profile["reference_hints"]
  191. fallback_excerpt = manager._extract_genre_section("## a\n1\n## b\n2", "unknown")
  192. assert fallback_excerpt.startswith("## a")
  193. def test_context_manager_reader_signal_with_debt_and_disable_switch(temp_project):
  194. manager = ContextManager(temp_project)
  195. manager.config.context_reader_signal_include_debt = True
  196. signal = manager._load_reader_signal(chapter=5)
  197. assert "debt_summary" in signal
  198. manager.config.context_reader_signal_enabled = False
  199. assert manager._load_reader_signal(chapter=5) == {}
  200. manager.config.context_genre_profile_enabled = False
  201. assert manager._load_genre_profile({"project": {"genre": "xuanhuan"}}) == {}
  202. def test_context_manager_includes_writing_guidance(temp_project):
  203. state = {
  204. "project": {"genre": "xuanhuan"},
  205. "protagonist_state": {"name": "萧炎"},
  206. "chapter_meta": {},
  207. "disambiguation_warnings": [],
  208. "disambiguation_pending": [],
  209. }
  210. temp_project.state_file.write_text(json.dumps(state, ensure_ascii=False), encoding="utf-8")
  211. idx = IndexManager(temp_project)
  212. idx.save_chapter_reading_power(
  213. ChapterReadingPowerMeta(
  214. chapter=3,
  215. hook_type="悬念钩",
  216. hook_strength="strong",
  217. coolpoint_patterns=["身份掉马"],
  218. )
  219. )
  220. idx.save_review_metrics(
  221. ReviewMetrics(
  222. start_chapter=1,
  223. end_chapter=3,
  224. overall_score=70,
  225. dimension_scores={"plot": 70},
  226. severity_counts={"high": 1},
  227. critical_issues=["节奏拖沓"],
  228. )
  229. )
  230. manager = ContextManager(temp_project)
  231. payload = manager.build_context(4, use_snapshot=False, save_snapshot=False)
  232. guidance = payload["sections"]["writing_guidance"]["content"]
  233. assert guidance.get("chapter") == 4
  234. items = guidance.get("guidance_items") or []
  235. assert isinstance(items, list)
  236. assert items
  237. assert guidance.get("signals_used", {}).get("genre") == "xuanhuan"
  238. checklist = guidance.get("checklist") or []
  239. assert isinstance(checklist, list)
  240. assert checklist
  241. checklist_score = guidance.get("checklist_score") or {}
  242. assert isinstance(checklist_score, dict)
  243. assert "score" in checklist_score
  244. assert "completion_rate" in checklist_score
  245. first_item = checklist[0]
  246. assert isinstance(first_item, dict)
  247. assert {"id", "label", "weight", "required", "source", "verify_hint"}.issubset(first_item.keys())
  248. persisted = idx.get_writing_checklist_score(4)
  249. assert isinstance(persisted, dict)
  250. assert persisted.get("chapter") == 4
  251. assert persisted.get("score") is not None
  252. def test_context_manager_dynamic_weights_and_composite_genre(temp_project):
  253. refs_dir = temp_project.project_root / ".claude" / "references"
  254. refs_dir.mkdir(parents=True, exist_ok=True)
  255. (refs_dir / "genre-profiles.md").write_text(
  256. """
  257. ## xuanhuan
  258. - 升级线清晰
  259. ## realistic
  260. - 社会议题映射
  261. """.strip(),
  262. encoding="utf-8",
  263. )
  264. (refs_dir / "reading-power-taxonomy.md").write_text(
  265. """
  266. ## xuanhuan
  267. - 钩子强度优先
  268. ## realistic
  269. - 人物动机一致
  270. """.strip(),
  271. encoding="utf-8",
  272. )
  273. state = {
  274. "project": {"genre": "xuanhuan+realistic"},
  275. "protagonist_state": {"name": "萧炎"},
  276. "chapter_meta": {},
  277. "disambiguation_warnings": [],
  278. "disambiguation_pending": [],
  279. }
  280. temp_project.state_file.write_text(json.dumps(state, ensure_ascii=False), encoding="utf-8")
  281. manager = ContextManager(temp_project)
  282. payload_early = manager.build_context(10, template="plot", use_snapshot=False, save_snapshot=False)
  283. payload_late = manager.build_context(150, template="plot", use_snapshot=False, save_snapshot=False)
  284. assert payload_early.get("weights", {}).get("core") >= payload_late.get("weights", {}).get("core")
  285. assert payload_late.get("weights", {}).get("global") >= payload_early.get("weights", {}).get("global")
  286. assert payload_early.get("meta", {}).get("context_weight_stage") == "early"
  287. assert payload_late.get("meta", {}).get("context_weight_stage") == "late"
  288. profile = payload_early["sections"]["genre_profile"]["content"]
  289. assert profile.get("composite") is True
  290. assert profile.get("genre") == "xuanhuan"
  291. assert isinstance(profile.get("genres"), list)
  292. assert "realistic" in (profile.get("genres") or [])
  293. assert isinstance(profile.get("composite_hints"), list)
  294. assert profile.get("composite_hints")
  295. def test_context_manager_genre_alias_guidance_and_heading_extraction(temp_project):
  296. refs_dir = temp_project.project_root / ".claude" / "references"
  297. refs_dir.mkdir(parents=True, exist_ok=True)
  298. (refs_dir / "genre-profiles.md").write_text(
  299. """
  300. ### 电竞
  301. - 联赛升级
  302. ### 直播文
  303. - 反馈闭环
  304. ### 克苏鲁
  305. - 真相代价
  306. """.strip(),
  307. encoding="utf-8",
  308. )
  309. (refs_dir / "reading-power-taxonomy.md").write_text(
  310. """
  311. ### 电竞
  312. - 战术决策点
  313. """.strip(),
  314. encoding="utf-8",
  315. )
  316. state = {
  317. "project": {"genre": "电竞"},
  318. "protagonist_state": {"name": "林燃"},
  319. "chapter_meta": {},
  320. "disambiguation_warnings": [],
  321. "disambiguation_pending": [],
  322. }
  323. temp_project.state_file.write_text(json.dumps(state, ensure_ascii=False), encoding="utf-8")
  324. manager = ContextManager(temp_project)
  325. payload = manager.build_context(12, template="plot", use_snapshot=False, save_snapshot=False)
  326. guidance = payload["sections"]["writing_guidance"]["content"]
  327. items = guidance.get("guidance_items") or []
  328. assert any("战术决策点" in str(text) for text in items)
  329. assert any("网文节奏基线" in str(text) for text in items)
  330. assert any("兑现密度基线" in str(text) for text in items)
  331. def test_context_manager_genre_aliases_normalized_for_profile_lookup(temp_project):
  332. refs_dir = temp_project.project_root / ".claude" / "references"
  333. refs_dir.mkdir(parents=True, exist_ok=True)
  334. (refs_dir / "genre-profiles.md").write_text(
  335. """
  336. ## 电竞
  337. - 联赛升级
  338. ## 直播文
  339. - 实时反馈
  340. ## 克苏鲁
  341. - 真相代价
  342. """.strip(),
  343. encoding="utf-8",
  344. )
  345. (refs_dir / "reading-power-taxonomy.md").write_text(
  346. """
  347. ## 电竞
  348. - 决策后果
  349. ## 直播文
  350. - 数据闭环
  351. ## 克苏鲁
  352. - 规则优先
  353. """.strip(),
  354. encoding="utf-8",
  355. )
  356. manager = ContextManager(temp_project)
  357. assert manager._parse_genre_tokens("电竞文") == ["电竞"]
  358. assert manager._parse_genre_tokens("直播") == ["直播文"]
  359. assert manager._parse_genre_tokens("克系") == ["克苏鲁"]
  360. assert manager._parse_genre_tokens("修仙/玄幻") == ["修仙"]
  361. assert manager._parse_genre_tokens("都市修真") == ["都市异能"]
  362. assert manager._parse_genre_tokens("古言脑洞") == ["古言"]
  363. state = {
  364. "project": {"genre": "电竞文+直播"},
  365. "protagonist_state": {"name": "叶修"},
  366. "chapter_meta": {},
  367. "disambiguation_warnings": [],
  368. "disambiguation_pending": [],
  369. }
  370. temp_project.state_file.write_text(json.dumps(state, ensure_ascii=False), encoding="utf-8")
  371. payload = manager.build_context(20, template="plot", use_snapshot=False, save_snapshot=False)
  372. profile = payload["sections"]["genre_profile"]["content"]
  373. assert profile.get("genre") == "电竞"
  374. assert "直播文" in (profile.get("genres") or [])
  375. def test_context_manager_compact_text_truncation(temp_project):
  376. manager = ContextManager(temp_project)
  377. manager.config.context_compact_text_enabled = True
  378. manager.config.context_compact_min_budget = 80
  379. manager.config.context_compact_head_ratio = 0.6
  380. content = {"a": "x" * 200, "b": "y" * 200}
  381. compact = manager._compact_json_text(content, budget=120)
  382. assert len(compact) <= 120
  383. assert "[TRUNCATED]" in compact
  384. manager.config.context_compact_text_enabled = False
  385. raw_cut = manager._compact_json_text(content, budget=100)
  386. assert len(raw_cut) <= 100
  387. def test_context_manager_persist_writing_checklist_score_logs_failure(temp_project, monkeypatch, caplog):
  388. manager = ContextManager(temp_project)
  389. def _raise_save_error(_meta):
  390. raise RuntimeError("simulated save failure")
  391. monkeypatch.setattr(manager.index_manager, "save_writing_checklist_score", _raise_save_error)
  392. with caplog.at_level(logging.WARNING):
  393. manager._persist_writing_checklist_score(
  394. {
  395. "chapter": 6,
  396. "score": 70.0,
  397. "total_items": 3,
  398. "required_items": 1,
  399. "completed_items": 1,
  400. "completed_required": 1,
  401. "total_weight": 3.0,
  402. "completed_weight": 1.0,
  403. "completion_rate": 0.33,
  404. "pending_items": ["test"],
  405. }
  406. )
  407. message_text = "\n".join(record.getMessage() for record in caplog.records)
  408. assert "failed to persist writing checklist score" in message_text
  409. def test_context_manager_composite_genre_boundary_three_plus(temp_project):
  410. manager = ContextManager(temp_project)
  411. manager.config.context_genre_profile_support_composite = True
  412. manager.config.context_genre_profile_max_genres = 3
  413. genre_raw = "电竞文+直播+克系+修仙/玄幻+电竞文"
  414. tokens = manager._parse_genre_tokens(genre_raw)
  415. assert tokens[:4] == ["电竞", "直播文", "克苏鲁", "修仙"]
  416. state = {
  417. "project": {"genre": genre_raw},
  418. "protagonist_state": {"name": "主角"},
  419. "chapter_meta": {},
  420. "disambiguation_warnings": [],
  421. "disambiguation_pending": [],
  422. }
  423. profile = manager._load_genre_profile(state)
  424. assert profile.get("composite") is True
  425. assert profile.get("genres") == ["电竞", "直播文", "克苏鲁"]
  426. assert profile.get("secondary_genres") == ["直播文", "克苏鲁"]
  427. profile_again = manager._load_genre_profile(state)
  428. assert profile_again.get("genres") == profile.get("genres")
  429. def test_context_manager_dynamic_weights_from_config_override(temp_project):
  430. manager = ContextManager(temp_project)
  431. manager.config.context_dynamic_budget_enabled = True
  432. manager.config.context_template_weights_dynamic = {
  433. "early": {
  434. "plot": {"core": 0.60, "scene": 0.20, "global": 0.20},
  435. }
  436. }
  437. weights = manager._resolve_template_weights("plot", chapter=1)
  438. assert weights == {"core": 0.60, "scene": 0.20, "global": 0.20}
  439. def test_context_manager_genre_profile_fallbacks_to_project_info(temp_project):
  440. manager = ContextManager(temp_project)
  441. profile = manager._load_genre_profile({"project_info": {"genre": "xuanhuan"}})
  442. assert profile.get("genre_raw") == "xuanhuan"
  443. assert profile.get("genre") == "xuanhuan"
  444. def test_context_manager_genre_profile_prefers_project_over_project_info(temp_project):
  445. manager = ContextManager(temp_project)
  446. profile = manager._load_genre_profile(
  447. {
  448. "project": {"genre": "xuanhuan"},
  449. "project_info": {"genre": "dushi"},
  450. }
  451. )
  452. assert profile.get("genre_raw") == "xuanhuan"
  453. assert profile.get("genre") == "xuanhuan"