test_semantic_logic.py 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426
  1. """
  2. 语义逻辑审查模块 — 链路测试
  3. 测试 semantic_logic.py 中的 SemanticLogicReviewer 完整调用链路
  4. 链路: prompt_loader → ChatPromptTemplate.format_messages() → generate_model_client.get_model_generate_invoke() → ReviewResult
  5. """
  6. import pytest
  7. import asyncio
  8. import sys
  9. import os
  10. from unittest.mock import Mock, patch, AsyncMock, MagicMock, PropertyMock
  11. sys.path.insert(0, os.path.abspath(os.path.join(os.path.dirname(__file__), '..', '..')))
  12. from core.construction_review.component.reviewers.semantic_logic import (
  13. SemanticLogicReviewer,
  14. semantic_logic_reviewer,
  15. )
  16. from core.construction_review.component.reviewers.base_reviewer import ReviewResult
  17. # ─── helpers ───────────────────────────────────────────────────────────────────
  18. def _make_mock_prompt_template(messages=None):
  19. """构造一个模拟的 ChatPromptTemplate,format_messages() 返回指定消息列表"""
  20. from langchain_core.messages import SystemMessage, HumanMessage
  21. if messages is None:
  22. messages = [
  23. SystemMessage(content="你是语义逻辑审查专家"),
  24. HumanMessage(content="请审查:测试施工方案内容"),
  25. ]
  26. tmpl = MagicMock()
  27. tmpl.format_messages.return_value = messages
  28. return tmpl
  29. def _make_mock_state():
  30. """构造模拟的 state 字典(含 progress_manager)"""
  31. pm = AsyncMock()
  32. pm.update_stage_progress = AsyncMock()
  33. return {
  34. "progress_manager": pm,
  35. "callback_task_id": "test_callback_001",
  36. }
  37. # ─── 单元测试:初始化 ──────────────────────────────────────────────────────────
  38. class TestInit:
  39. """审查器初始化测试"""
  40. def test_init_model_client_set(self):
  41. """初始化后 model_client 应为 GenerateModelClient 实例"""
  42. r = SemanticLogicReviewer()
  43. from foundation.ai.agent.generate.model_generate import GenerateModelClient
  44. assert isinstance(r.model_client, GenerateModelClient)
  45. def test_global_singleton(self):
  46. """全局单例实例"""
  47. assert isinstance(semantic_logic_reviewer, SemanticLogicReviewer)
  48. # ─── 单元测试:成功路径 ────────────────────────────────────────────────────────
  49. class TestCheckSemanticLogicSuccess:
  50. """检查语义逻辑 — 成功路径"""
  51. @pytest.mark.asyncio
  52. async def test_success_path(self):
  53. """
  54. 验证完整成功链路:
  55. prompt_loader.get_prompt_template → format_messages → model_client.get_model_generate_invoke → ReviewResult
  56. """
  57. reviewer = SemanticLogicReviewer()
  58. mock_tmpl = _make_mock_prompt_template()
  59. fake_response = '{"issue_point": "无", "location": "", "suggestion": "", "reason": "", "risk_level": ""}'
  60. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke, \
  61. patch('core.construction_review.component.reviewers.semantic_logic.prompt_loader.get_prompt_template') as mock_get_prompt:
  62. mock_invoke.return_value = fake_response
  63. mock_get_prompt.return_value = mock_tmpl
  64. result = await reviewer.check_semantic_logic(
  65. trace_id="trace_001",
  66. review_content="测试施工方案内容",
  67. )
  68. # 链路1: prompt_loader 被正确调用
  69. mock_get_prompt.assert_called_once_with(
  70. "basic", "semantic_logic_check",
  71. review_content="测试施工方案内容",
  72. review_references="",
  73. )
  74. # 链路2: format_messages 被调用
  75. mock_tmpl.format_messages.assert_called_once()
  76. # 链路3: model_client 使用 function_name="grammar_check"
  77. mock_invoke.assert_awaited_once()
  78. call_kwargs = mock_invoke.call_args.kwargs
  79. assert call_kwargs["trace_id"] == "trace_001"
  80. assert call_kwargs["function_name"] == "grammar_check"
  81. assert call_kwargs["messages"] == mock_tmpl.format_messages.return_value
  82. # 链路4: 返回正确的 ReviewResult
  83. assert isinstance(result, ReviewResult)
  84. assert result.success is True
  85. assert result.details["name"] == "semantic_logic_check"
  86. assert result.details["response"] == fake_response
  87. assert result.error_message is None
  88. assert result.execution_time > 0
  89. @pytest.mark.asyncio
  90. async def test_with_state_triggers_progress(self):
  91. """有 state 时触发进度推送"""
  92. reviewer = SemanticLogicReviewer()
  93. mock_tmpl = _make_mock_prompt_template()
  94. fake_response = "无明显问题"
  95. state = _make_mock_state()
  96. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke, \
  97. patch('core.construction_review.component.reviewers.semantic_logic.prompt_loader.get_prompt_template') as mock_get_prompt:
  98. mock_invoke.return_value = fake_response
  99. mock_get_prompt.return_value = mock_tmpl
  100. result = await reviewer.check_semantic_logic(
  101. trace_id="trace_002",
  102. review_content="施工方案内容...",
  103. state=state,
  104. stage_name="basic_check",
  105. )
  106. assert result.success is True
  107. # 进度推送是 fire-and-forget (asyncio.create_task),等待一下
  108. await asyncio.sleep(0.1)
  109. pm = state["progress_manager"]
  110. assert pm.update_stage_progress.called
  111. call_kwargs = pm.update_stage_progress.call_args.kwargs
  112. assert call_kwargs["callback_task_id"] == "test_callback_001"
  113. assert call_kwargs["stage_name"] == "basic_check"
  114. # issues 中包含审查结果数据
  115. assert len(call_kwargs["issues"]) == 1
  116. assert call_kwargs["issues"][0]["name"] == "semantic_logic_check"
  117. assert call_kwargs["issues"][0]["success"] is True
  118. @pytest.mark.asyncio
  119. async def test_without_state_no_progress_call(self):
  120. """无 state 时不触发进度推送,不抛异常"""
  121. reviewer = SemanticLogicReviewer()
  122. mock_tmpl = _make_mock_prompt_template()
  123. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke, \
  124. patch('core.construction_review.component.reviewers.semantic_logic.prompt_loader.get_prompt_template') as mock_get_prompt:
  125. mock_invoke.return_value = "无明显问题"
  126. mock_get_prompt.return_value = mock_tmpl
  127. result = await reviewer.check_semantic_logic(
  128. trace_id="trace_003",
  129. review_content="内容",
  130. state=None,
  131. stage_name=None,
  132. )
  133. assert result.success is True
  134. # 不应抛异常
  135. # ─── 单元测试:错误路径 ────────────────────────────────────────────────────────
  136. class TestCheckSemanticLogicError:
  137. """检查语义逻辑 — 错误路径"""
  138. @pytest.mark.asyncio
  139. async def test_model_call_failure(self):
  140. """模型调用抛异常 → 返回 success=False 的 ReviewResult"""
  141. reviewer = SemanticLogicReviewer()
  142. mock_tmpl = _make_mock_prompt_template()
  143. state = _make_mock_state()
  144. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke, \
  145. patch('core.construction_review.component.reviewers.semantic_logic.prompt_loader.get_prompt_template') as mock_get_prompt:
  146. mock_invoke.side_effect = Exception("模型服务连接超时")
  147. mock_get_prompt.return_value = mock_tmpl
  148. result = await reviewer.check_semantic_logic(
  149. trace_id="trace_err_001",
  150. review_content="内容",
  151. state=state,
  152. stage_name="basic_check",
  153. )
  154. assert isinstance(result, ReviewResult)
  155. assert result.success is False
  156. assert result.details["name"] == "semantic_logic_check"
  157. assert "模型服务连接超时" in result.error_message
  158. assert result.execution_time > 0
  159. # 失败也应推送进度
  160. await asyncio.sleep(0.1)
  161. assert state["progress_manager"].update_stage_progress.called
  162. @pytest.mark.asyncio
  163. async def test_prompt_loader_failure(self):
  164. """prompt_loader 抛异常 → 应被捕获"""
  165. reviewer = SemanticLogicReviewer()
  166. with patch('core.construction_review.component.reviewers.semantic_logic.prompt_loader.get_prompt_template') as mock_get_prompt:
  167. mock_get_prompt.side_effect = RuntimeError("YAML 解析失败")
  168. result = await reviewer.check_semantic_logic(
  169. trace_id="trace_err_002",
  170. review_content="内容",
  171. )
  172. assert result.success is False
  173. assert "YAML 解析失败" in result.error_message
  174. @pytest.mark.asyncio
  175. async def test_error_without_state(self):
  176. """错误时无 state 也不应抛异常"""
  177. reviewer = SemanticLogicReviewer()
  178. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke, \
  179. patch('core.construction_review.component.reviewers.semantic_logic.prompt_loader.get_prompt_template') as mock_get_prompt:
  180. mock_invoke.side_effect = Exception("boom")
  181. mock_get_prompt.return_value = _make_mock_prompt_template()
  182. result = await reviewer.check_semantic_logic(
  183. trace_id="trace_err_003",
  184. review_content="内容",
  185. state=None,
  186. )
  187. assert result.success is False
  188. assert "boom" in result.error_message
  189. # ─── 链路集成测试:真实 prompt_loader + mock AI 调用 ────────────────────────────
  190. class TestChainIntegration:
  191. """集成链路测试:使用真实 prompt_loader 验证完整链路(仅 mock AI 调用)"""
  192. @pytest.mark.asyncio
  193. async def test_full_chain_with_real_prompt_loader(self):
  194. """
  195. 使用真实 prompt_loader 加载 basic/semantic_logic_check 模板,
  196. 仅 mock 底层 AI 调用,验证完整链路畅通。
  197. """
  198. reviewer = SemanticLogicReviewer()
  199. fake_ai_response = "无明显问题"
  200. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke:
  201. mock_invoke.return_value = fake_ai_response
  202. result = await reviewer.check_semantic_logic(
  203. trace_id="chain_001",
  204. review_content="1. 工程概况\n本工程位于四川省,全长120公里。\n2. 施工安排\n先进行基础施工,再进行上部结构施工。",
  205. )
  206. assert result.success is True
  207. assert result.details["name"] == "semantic_logic_check"
  208. assert result.details["response"] == fake_ai_response
  209. # 验证 AI 调用确实收到了正确格式的消息
  210. call_kwargs = mock_invoke.call_args.kwargs
  211. assert call_kwargs["function_name"] == "grammar_check"
  212. messages = call_kwargs["messages"]
  213. assert len(messages) >= 2 # system + user
  214. # system message 应包含角色定义
  215. system_msg = messages[0]
  216. assert "语义逻辑审查" in system_msg.content or "role" in system_msg.content.lower()
  217. # user message 应包含待审查内容
  218. user_msg = messages[-1]
  219. assert "工程概况" in user_msg.content or "120公里" in user_msg.content
  220. @pytest.mark.asyncio
  221. async def test_chain_with_state_progress(self):
  222. """集成链路 + 进度推送"""
  223. reviewer = SemanticLogicReviewer()
  224. state = _make_mock_state()
  225. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke:
  226. mock_invoke.return_value = '{"issue_point": "逻辑矛盾", "location": "第2条", "suggestion": "调整", "reason": "前后矛盾", "risk_level": "中风险"}'
  227. result = await reviewer.check_semantic_logic(
  228. trace_id="chain_002",
  229. review_content="前文采用A方法。后文说不能采用A方法。",
  230. state=state,
  231. stage_name="semantic_stage",
  232. )
  233. assert result.success is True
  234. await asyncio.sleep(0.1)
  235. assert state["progress_manager"].update_stage_progress.called
  236. # ─── 边界情况测试 ──────────────────────────────────────────────────────────────
  237. class TestEdgeCases:
  238. """边界情况测试"""
  239. @pytest.mark.asyncio
  240. async def test_empty_content(self):
  241. """空内容 — 链路正常完成"""
  242. reviewer = SemanticLogicReviewer()
  243. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke, \
  244. patch('core.construction_review.component.reviewers.semantic_logic.prompt_loader.get_prompt_template') as mock_get_prompt:
  245. mock_invoke.return_value = "内容为空,无法审查"
  246. mock_get_prompt.return_value = _make_mock_prompt_template()
  247. result = await reviewer.check_semantic_logic(
  248. trace_id="edge_001",
  249. review_content="",
  250. )
  251. assert result.success is True
  252. assert result.details["name"] == "semantic_logic_check"
  253. @pytest.mark.asyncio
  254. async def test_long_content(self):
  255. """长内容 — 链路正常完成"""
  256. reviewer = SemanticLogicReviewer()
  257. long_text = "第{}条 施工技术要求详细说明...\n".format
  258. content = "\n".join(long_text(i) for i in range(500))
  259. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke, \
  260. patch('core.construction_review.component.reviewers.semantic_logic.prompt_loader.get_prompt_template') as mock_get_prompt:
  261. mock_invoke.return_value = "无明显问题"
  262. mock_get_prompt.return_value = _make_mock_prompt_template()
  263. result = await reviewer.check_semantic_logic(
  264. trace_id="edge_002",
  265. review_content=content,
  266. )
  267. assert result.success is True
  268. @pytest.mark.asyncio
  269. async def test_special_characters(self):
  270. """特殊字符内容"""
  271. reviewer = SemanticLogicReviewer()
  272. content = "特殊字符:@#$%^&*(){}[]|\\:;\"'<>,.?/~` ±×÷≈≠≤≥∞"
  273. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke, \
  274. patch('core.construction_review.component.reviewers.semantic_logic.prompt_loader.get_prompt_template') as mock_get_prompt:
  275. mock_invoke.return_value = "无明显问题"
  276. mock_get_prompt.return_value = _make_mock_prompt_template()
  277. result = await reviewer.check_semantic_logic(
  278. trace_id="edge_003",
  279. review_content=content,
  280. )
  281. assert result.success is True
  282. @pytest.mark.asyncio
  283. async def test_unicode_multilang(self):
  284. """多语言 Unicode 内容"""
  285. reviewer = SemanticLogicReviewer()
  286. content = "中文 / English / 日本語 / 한국어 / Русский / العربية / 🚧🏗️"
  287. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke, \
  288. patch('core.construction_review.component.reviewers.semantic_logic.prompt_loader.get_prompt_template') as mock_get_prompt:
  289. mock_invoke.return_value = "无明显问题"
  290. mock_get_prompt.return_value = _make_mock_prompt_template()
  291. result = await reviewer.check_semantic_logic(
  292. trace_id="edge_004",
  293. review_content=content,
  294. )
  295. assert result.success is True
  296. @pytest.mark.asyncio
  297. async def test_execution_time_tracking(self):
  298. """验证执行时间被正确记录"""
  299. reviewer = SemanticLogicReviewer()
  300. async def slow_response(*args, **kwargs):
  301. await asyncio.sleep(0.15)
  302. return "响应"
  303. with patch.object(reviewer.model_client, 'get_model_generate_invoke', new_callable=AsyncMock) as mock_invoke, \
  304. patch('core.construction_review.component.reviewers.semantic_logic.prompt_loader.get_prompt_template') as mock_get_prompt:
  305. mock_invoke.side_effect = slow_response
  306. mock_get_prompt.return_value = _make_mock_prompt_template()
  307. result = await reviewer.check_semantic_logic(
  308. trace_id="edge_005",
  309. review_content="测试",
  310. )
  311. assert result.execution_time >= 0.15
  312. # ─── 实际 API 集成测试(需手动开启)─────────────────────────────────────────────
  313. class TestLiveAPI:
  314. """实际 API 调用测试(标记为 integration,默认跳过)"""
  315. @pytest.mark.asyncio
  316. @pytest.mark.integration
  317. async def test_live_api_call(self):
  318. """真实调用 AI 接口(需服务可用)"""
  319. pytest.skip("需要实际 API 服务,手动运行")
  320. reviewer = SemanticLogicReviewer()
  321. result = await reviewer.check_semantic_logic(
  322. trace_id="live_001",
  323. review_content="1. 工程概况\n本工程为高速公路桥梁项目。\n2. 施工顺序\n先施工上部结构,再进行基础施工。",
  324. )
  325. assert isinstance(result, ReviewResult)
  326. # 不强制断言 success,依赖实际服务状态
  327. assert result.execution_time is not None
  328. if __name__ == "__main__":
  329. pytest.main([__file__, "-v", "-s", "--tb=short"])