# test_semantic_logic.py
  1. """
Semantic-logic review module - call-chain tests.
Exercises the full call chain of SemanticLogicReviewer in semantic_logic.py.
Chain: prompt_loader -> ChatPromptTemplate.format_messages() -> generate_model_client.get_model_generate_invoke() -> ReviewResult
  5. """
  6. import pytest
  7. import asyncio
  8. import sys
  9. import os
  10. from unittest.mock import Mock, patch, AsyncMock, MagicMock, PropertyMock
  11. from core.construction_review.component.reviewers.semantic_logic import (
  12. SemanticLogicReviewer,
  13. semantic_logic_reviewer,
  14. )
  15. from core.construction_review.component.reviewers.base_reviewer import ReviewResult
  16. # ─── helpers ───────────────────────────────────────────────────────────────────
  17. def _make_mock_prompt_template(messages=None):
  18. """构造一个模拟的 ChatPromptTemplate,format_messages() 返回指定消息列表"""
  19. from langchain_core.messages import SystemMessage, HumanMessage
  20. if messages is None:
  21. messages = [
  22. SystemMessage(content="你是语义逻辑审查专家"),
  23. HumanMessage(content="请审查:测试施工方案内容"),
  24. ]
  25. tmpl = MagicMock()
  26. tmpl.format_messages.return_value = messages
  27. return tmpl
  28. def _make_mock_state():
  29. """构造模拟的 state 字典(含 progress_manager)"""
  30. pm = AsyncMock()
  31. pm.update_stage_progress = AsyncMock()
  32. return {
  33. "progress_manager": pm,
  34. "callback_task_id": "test_callback_001",
  35. }
  36. # ─── 单元测试:初始化 ──────────────────────────────────────────────────────────
  37. class TestInit:
  38. """审查器初始化测试"""
  39. def test_init_model_client_set(self):
  40. """初始化后 model_client 应为 GenerateModelClient 实例"""
  41. r = SemanticLogicReviewer()
  42. from foundation.ai.agent.generate.model_generate import GenerateModelClient
  43. assert isinstance(r.model_client, GenerateModelClient)
  44. def test_global_singleton(self):
  45. """全局单例实例"""
  46. assert isinstance(semantic_logic_reviewer, SemanticLogicReviewer)
  47. # ─── 单元测试:成功路径 ────────────────────────────────────────────────────────
  48. class TestCheckSemanticLogicSuccess:
  49. """检查语义逻辑 — 成功路径"""
  50. @pytest.mark.asyncio
  51. async def test_success_path(self):
  52. """
  53. 验证完整成功链路:
  54. prompt_loader.get_prompt_template → format_messages → model_client.get_model_generate_invoke → ReviewResult
  55. """
  56. reviewer = SemanticLogicReviewer()
  57. mock_tmpl = _make_mock_prompt_template()
  58. fake_response = '{"issue_point": "无", "location": "", "suggestion": "", "reason": "", "risk_level": ""}'
  59. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke, \
  60. patch('core.construction_review.component.reviewers.semantic_logic.prompt_loader.get_prompt_template') as mock_get_prompt:
  61. mock_invoke.return_value = fake_response
  62. mock_get_prompt.return_value = mock_tmpl
  63. result = await reviewer.check_semantic_logic(
  64. trace_id="trace_001",
  65. review_content="测试施工方案内容",
  66. )
  67. # 链路1: prompt_loader 被正确调用
  68. mock_get_prompt.assert_called_once_with(
  69. "basic", "semantic_logic_check",
  70. review_content="测试施工方案内容",
  71. review_references="",
  72. )
  73. # 链路2: format_messages 被调用
  74. mock_tmpl.format_messages.assert_called_once()
  75. # 链路3: model_client 使用 function_name="grammar_check"
  76. mock_invoke.assert_awaited_once()
  77. call_kwargs = mock_invoke.call_args.kwargs
  78. assert call_kwargs["trace_id"] == "trace_001"
  79. assert call_kwargs["function_name"] == "grammar_check"
  80. assert call_kwargs["messages"] == mock_tmpl.format_messages.return_value
  81. # 链路4: 返回正确的 ReviewResult
  82. assert isinstance(result, ReviewResult)
  83. assert result.success is True
  84. assert result.details["name"] == "semantic_logic_check"
  85. assert result.details["response"] == fake_response
  86. assert result.error_message is None
  87. assert result.execution_time > 0
  88. @pytest.mark.asyncio
  89. async def test_with_state_triggers_progress(self):
  90. """有 state 时触发进度推送"""
  91. reviewer = SemanticLogicReviewer()
  92. mock_tmpl = _make_mock_prompt_template()
  93. fake_response = "无明显问题"
  94. state = _make_mock_state()
  95. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke, \
  96. patch('core.construction_review.component.reviewers.semantic_logic.prompt_loader.get_prompt_template') as mock_get_prompt:
  97. mock_invoke.return_value = fake_response
  98. mock_get_prompt.return_value = mock_tmpl
  99. result = await reviewer.check_semantic_logic(
  100. trace_id="trace_002",
  101. review_content="施工方案内容...",
  102. state=state,
  103. stage_name="basic_check",
  104. )
  105. assert result.success is True
  106. # 进度推送是 fire-and-forget (asyncio.create_task),等待一下
  107. await asyncio.sleep(0.1)
  108. pm = state["progress_manager"]
  109. assert pm.update_stage_progress.called
  110. call_kwargs = pm.update_stage_progress.call_args.kwargs
  111. assert call_kwargs["callback_task_id"] == "test_callback_001"
  112. assert call_kwargs["stage_name"] == "basic_check"
  113. # issues 中包含审查结果数据
  114. assert len(call_kwargs["issues"]) == 1
  115. assert call_kwargs["issues"][0]["name"] == "semantic_logic_check"
  116. assert call_kwargs["issues"][0]["success"] is True
  117. @pytest.mark.asyncio
  118. async def test_without_state_no_progress_call(self):
  119. """无 state 时不触发进度推送,不抛异常"""
  120. reviewer = SemanticLogicReviewer()
  121. mock_tmpl = _make_mock_prompt_template()
  122. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke, \
  123. patch('core.construction_review.component.reviewers.semantic_logic.prompt_loader.get_prompt_template') as mock_get_prompt:
  124. mock_invoke.return_value = "无明显问题"
  125. mock_get_prompt.return_value = mock_tmpl
  126. result = await reviewer.check_semantic_logic(
  127. trace_id="trace_003",
  128. review_content="内容",
  129. state=None,
  130. stage_name=None,
  131. )
  132. assert result.success is True
  133. # 不应抛异常
  134. # ─── 单元测试:错误路径 ────────────────────────────────────────────────────────
  135. class TestCheckSemanticLogicError:
  136. """检查语义逻辑 — 错误路径"""
  137. @pytest.mark.asyncio
  138. async def test_model_call_failure(self):
  139. """模型调用抛异常 → 返回 success=False 的 ReviewResult"""
  140. reviewer = SemanticLogicReviewer()
  141. mock_tmpl = _make_mock_prompt_template()
  142. state = _make_mock_state()
  143. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke, \
  144. patch('core.construction_review.component.reviewers.semantic_logic.prompt_loader.get_prompt_template') as mock_get_prompt:
  145. mock_invoke.side_effect = Exception("模型服务连接超时")
  146. mock_get_prompt.return_value = mock_tmpl
  147. result = await reviewer.check_semantic_logic(
  148. trace_id="trace_err_001",
  149. review_content="内容",
  150. state=state,
  151. stage_name="basic_check",
  152. )
  153. assert isinstance(result, ReviewResult)
  154. assert result.success is False
  155. assert result.details["name"] == "semantic_logic_check"
  156. assert "模型服务连接超时" in result.error_message
  157. assert result.execution_time > 0
  158. # 失败也应推送进度
  159. await asyncio.sleep(0.1)
  160. assert state["progress_manager"].update_stage_progress.called
  161. @pytest.mark.asyncio
  162. async def test_prompt_loader_failure(self):
  163. """prompt_loader 抛异常 → 应被捕获"""
  164. reviewer = SemanticLogicReviewer()
  165. with patch('core.construction_review.component.reviewers.semantic_logic.prompt_loader.get_prompt_template') as mock_get_prompt:
  166. mock_get_prompt.side_effect = RuntimeError("YAML 解析失败")
  167. result = await reviewer.check_semantic_logic(
  168. trace_id="trace_err_002",
  169. review_content="内容",
  170. )
  171. assert result.success is False
  172. assert "YAML 解析失败" in result.error_message
  173. @pytest.mark.asyncio
  174. async def test_error_without_state(self):
  175. """错误时无 state 也不应抛异常"""
  176. reviewer = SemanticLogicReviewer()
  177. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke, \
  178. patch('core.construction_review.component.reviewers.semantic_logic.prompt_loader.get_prompt_template') as mock_get_prompt:
  179. mock_invoke.side_effect = Exception("boom")
  180. mock_get_prompt.return_value = _make_mock_prompt_template()
  181. result = await reviewer.check_semantic_logic(
  182. trace_id="trace_err_003",
  183. review_content="内容",
  184. state=None,
  185. )
  186. assert result.success is False
  187. assert "boom" in result.error_message
  188. # ─── 链路集成测试:真实 prompt_loader + mock AI 调用 ────────────────────────────
  189. class TestChainIntegration:
  190. """集成链路测试:使用真实 prompt_loader 验证完整链路(仅 mock AI 调用)"""
  191. @pytest.mark.asyncio
  192. async def test_full_chain_with_real_prompt_loader(self):
  193. """
  194. 使用真实 prompt_loader 加载 basic/semantic_logic_check 模板,
  195. 仅 mock 底层 AI 调用,验证完整链路畅通。
  196. """
  197. reviewer = SemanticLogicReviewer()
  198. fake_ai_response = "无明显问题"
  199. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke:
  200. mock_invoke.return_value = fake_ai_response
  201. result = await reviewer.check_semantic_logic(
  202. trace_id="chain_001",
  203. review_content="1. 工程概况\n本工程位于四川省,全长120公里。\n2. 施工安排\n先进行基础施工,再进行上部结构施工。",
  204. )
  205. assert result.success is True
  206. assert result.details["name"] == "semantic_logic_check"
  207. assert result.details["response"] == fake_ai_response
  208. # 验证 AI 调用确实收到了正确格式的消息
  209. call_kwargs = mock_invoke.call_args.kwargs
  210. assert call_kwargs["function_name"] == "grammar_check"
  211. messages = call_kwargs["messages"]
  212. assert len(messages) >= 2 # system + user
  213. # system message 应包含角色定义
  214. system_msg = messages[0]
  215. assert "语义逻辑审查" in system_msg.content or "role" in system_msg.content.lower()
  216. # user message 应包含待审查内容
  217. user_msg = messages[-1]
  218. assert "工程概况" in user_msg.content or "120公里" in user_msg.content
  219. @pytest.mark.asyncio
  220. async def test_chain_with_state_progress(self):
  221. """集成链路 + 进度推送"""
  222. reviewer = SemanticLogicReviewer()
  223. state = _make_mock_state()
  224. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke:
  225. mock_invoke.return_value = '{"issue_point": "逻辑矛盾", "location": "第2条", "suggestion": "调整", "reason": "前后矛盾", "risk_level": "中风险"}'
  226. result = await reviewer.check_semantic_logic(
  227. trace_id="chain_002",
  228. review_content="前文采用A方法。后文说不能采用A方法。",
  229. state=state,
  230. stage_name="semantic_stage",
  231. )
  232. assert result.success is True
  233. await asyncio.sleep(0.1)
  234. assert state["progress_manager"].update_stage_progress.called
  235. # ─── 边界情况测试 ──────────────────────────────────────────────────────────────
  236. class TestEdgeCases:
  237. """边界情况测试"""
  238. @pytest.mark.asyncio
  239. async def test_empty_content(self):
  240. """空内容 — 链路正常完成"""
  241. reviewer = SemanticLogicReviewer()
  242. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke, \
  243. patch('core.construction_review.component.reviewers.semantic_logic.prompt_loader.get_prompt_template') as mock_get_prompt:
  244. mock_invoke.return_value = "内容为空,无法审查"
  245. mock_get_prompt.return_value = _make_mock_prompt_template()
  246. result = await reviewer.check_semantic_logic(
  247. trace_id="edge_001",
  248. review_content="",
  249. )
  250. assert result.success is True
  251. assert result.details["name"] == "semantic_logic_check"
  252. @pytest.mark.asyncio
  253. async def test_long_content(self):
  254. """长内容 — 链路正常完成"""
  255. reviewer = SemanticLogicReviewer()
  256. long_text = "第{}条 施工技术要求详细说明...\n".format
  257. content = "\n".join(long_text(i) for i in range(500))
  258. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke, \
  259. patch('core.construction_review.component.reviewers.semantic_logic.prompt_loader.get_prompt_template') as mock_get_prompt:
  260. mock_invoke.return_value = "无明显问题"
  261. mock_get_prompt.return_value = _make_mock_prompt_template()
  262. result = await reviewer.check_semantic_logic(
  263. trace_id="edge_002",
  264. review_content=content,
  265. )
  266. assert result.success is True
  267. @pytest.mark.asyncio
  268. async def test_special_characters(self):
  269. """特殊字符内容"""
  270. reviewer = SemanticLogicReviewer()
  271. content = "特殊字符:@#$%^&*(){}[]|\\:;\"'<>,.?/~` ±×÷≈≠≤≥∞"
  272. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke, \
  273. patch('core.construction_review.component.reviewers.semantic_logic.prompt_loader.get_prompt_template') as mock_get_prompt:
  274. mock_invoke.return_value = "无明显问题"
  275. mock_get_prompt.return_value = _make_mock_prompt_template()
  276. result = await reviewer.check_semantic_logic(
  277. trace_id="edge_003",
  278. review_content=content,
  279. )
  280. assert result.success is True
  281. @pytest.mark.asyncio
  282. async def test_unicode_multilang(self):
  283. """多语言 Unicode 内容"""
  284. reviewer = SemanticLogicReviewer()
  285. content = "中文 / English / 日本語 / 한국어 / Русский / العربية / 🚧🏗️"
  286. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke, \
  287. patch('core.construction_review.component.reviewers.semantic_logic.prompt_loader.get_prompt_template') as mock_get_prompt:
  288. mock_invoke.return_value = "无明显问题"
  289. mock_get_prompt.return_value = _make_mock_prompt_template()
  290. result = await reviewer.check_semantic_logic(
  291. trace_id="edge_004",
  292. review_content=content,
  293. )
  294. assert result.success is True
  295. @pytest.mark.asyncio
  296. async def test_execution_time_tracking(self):
  297. """验证执行时间被正确记录"""
  298. reviewer = SemanticLogicReviewer()
  299. async def slow_response(*args, **kwargs):
  300. await asyncio.sleep(0.15)
  301. return "响应"
  302. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke, \
  303. patch('core.construction_review.component.reviewers.semantic_logic.prompt_loader.get_prompt_template') as mock_get_prompt:
  304. mock_invoke.side_effect = slow_response
  305. mock_get_prompt.return_value = _make_mock_prompt_template()
  306. result = await reviewer.check_semantic_logic(
  307. trace_id="edge_005",
  308. review_content="测试",
  309. )
  310. assert result.execution_time >= 0.15
  311. # ─── 实际 API 集成测试(需手动开启)─────────────────────────────────────────────
  312. class TestLiveAPI:
  313. """实际 API 调用测试(标记为 integration,默认跳过)"""
  314. @pytest.mark.asyncio
  315. @pytest.mark.integration
  316. async def test_live_api_call(self):
  317. """真实调用 AI 接口(需服务可用)"""
  318. pytest.skip("需要实际 API 服务,手动运行")
  319. reviewer = SemanticLogicReviewer()
  320. result = await reviewer.check_semantic_logic(
  321. trace_id="live_001",
  322. review_content="1. 工程概况\n本工程为高速公路桥梁项目。\n2. 施工顺序\n先施工上部结构,再进行基础施工。",
  323. )
  324. assert isinstance(result, ReviewResult)
  325. # 不强制断言 success,依赖实际服务状态
  326. assert result.execution_time is not None
  327. if __name__ == "__main__":
  328. pytest.main([__file__, "-v", "-s", "--tb=short"])