Преглед изворни кода

feat(sgsc-审查模块-xth): 新增目录一二级缺失统计功能

xgo пре 1 недеља
родитељ
комит
6e223b0ef8

+ 141 - 6
core/construction_review/component/ai_review_engine.py

@@ -854,14 +854,149 @@ class AIReviewEngine(BaseReviewer):
             }
             return error_result, trace_id_idx
 
-    async def outline_Check(self, trace_id_idx: str, review_content: Dict[str, Any],
-                            state: str, stage_name: str) -> Dict[str, Any]:
-            if state and isinstance(state, dict):
-                structured = state.get('structured_content', {})
+    async def check_outline_catalogue(
+        self,
+        trace_id_idx: str,
+        outline_data: Dict[str, Any],
+        state: Dict[str, Any],
+        stage_name: str
+    ) -> Dict[str, Any]:
+        """
+        Check for missing first- and second-level catalogue categories
+        based on the document outline.
+
+        Uses a fuzzy-matching algorithm (name-similarity based) to match
+        outline chapters against the bundled standard category table.
+
+        Args:
+            trace_id_idx: Trace ID index (used for logging/telemetry).
+            outline_data: Dict containing the outline (usually taken from
+                structured_content).
+            state: State dict; used as a fallback source for
+                structured_content.outline when outline_data yields no
+                chapters.
+            stage_name: Name of the current review stage.
+
+        Returns:
+            Dict[str, Any]: Result payload with statistics of missing
+            first/second-level catalogue entries (see "details" key).
+        """
+        # Local import keeps the matcher (and its pandas dependency) off
+        # the module import path until this check actually runs.
+        from .outline_catalogue_matcher import OutlineCatalogueMatcher
+
+        start_time = time.time()
+        name = "outline_catalogue_check"
+
+        try:
+            logger.info(f"[{name}] 开始目录一二级缺失检查")
+
+            # Paths to the bundled standard-category CSV files.
+            csv_path = str(
+                Path(__file__).parent / 'doc_worker' / 'config' /
+                'StandardCategoryTable.csv'
+            )
+            raw_content_csv = str(
+                Path(__file__).parent / 'doc_worker' / 'config' /
+                'construction_plan_standards.csv'
+            )
+
+            # Obtain the chapters list from outline_data; accepts either a
+            # {'outline': {...}} wrapper, a bare outline dict with
+            # 'chapters', or a plain list of chapters.
+            outline_chapters = []
+            if outline_data and isinstance(outline_data, dict):
+                outline_raw = outline_data.get('outline') or outline_data
+                if isinstance(outline_raw, dict):
+                    outline_chapters = outline_raw.get('chapters', [])
+                elif isinstance(outline_raw, list):
+                    outline_chapters = outline_raw

+            # Fallback: pull the outline out of state.structured_content
+            # when outline_data produced nothing.
+            if not outline_chapters and state and isinstance(state, dict):
+                structured = state.get('structured_content', {})
+                outline_raw = structured.get('outline', {})
+                if isinstance(outline_raw, dict):
+                    outline_chapters = outline_raw.get('chapters', [])
+                elif isinstance(outline_raw, list):
+                    outline_chapters = outline_raw
+
+            # Extract the first-level codes and the
+            # (first_code, second_code) -> title mapping from the chapters.
+            outline_first = set()
+            outline_secondary = {}
+            
+            for chapter in outline_chapters:
+                if not isinstance(chapter, dict):
+                    continue
                 
-                outline = structured.get('outline')
-                all_chunks = structured.get('chunks', [])
+                first_code = chapter.get('chapter_classification', '')
+                if first_code:
+                    outline_first.add(first_code)
+                
+                # Collect second-level chapters from 'subsections'; a
+                # second-level entry is only recorded when its parent
+                # first-level code is present.
+                for sub in chapter.get('subsections', []):
+                    if not isinstance(sub, dict):
+                        continue
+                    second_code = sub.get('secondary_category_code', '')
+                    if first_code and second_code:
+                        outline_secondary[(first_code, second_code)] = sub.get('title', '')
+            
+            logger.info(f"[{name}] 获取到 {len(outline_first)} 个一级, {len(outline_secondary)} 个二级")
+
+            # Fuzzy-match the extracted outline against the standard table.
+            matcher = OutlineCatalogueMatcher(csv_path, raw_content_csv)
+            match_result = matcher.match_catalogue(
+                outline_first=outline_first,
+                outline_secondary=outline_secondary,
+                threshold=0.6
+            )
+            
+            # Structured summary of the match, kept alongside the flat
+            # counters in "details" for downstream consumers.
+            catalogue_result = {
+                "level": "primary_and_secondary",
+                "is_complete": match_result['missing_first_count'] == 0 and match_result['missing_second_count'] == 0,
+                "first_level": {
+                    "total_required": len(matcher.first_names),
+                    "actual_present": len(match_result['matched_first']),
+                    "missing_count": match_result['missing_first_count'],
+                    "missing": match_result['missing_first']
+                },
+                "second_level": {
+                    "total_required": len(matcher.second_names),
+                    "actual_present": len(match_result['matched_second']),
+                    "missing_count": match_result['missing_second_count'],
+                    "missing": match_result['missing_second']
+                },
+                "match_details": match_result['match_details']
+            }
+
+            execution_time = time.time() - start_time
+            logger.info(
+                f"[{name}] 检查完成,耗时: {execution_time:.2f}s, "
+                f"缺失一级: {match_result['missing_first_count']} 个, "
+                f"缺失二级: {match_result['missing_second_count']} 个"
+            )
+
+            return {
+                "success": True,
+                "execution_time": execution_time,
+                "details": {
+                    "name": name,
+                    "missing_first_count": match_result['missing_first_count'],
+                    "missing_second_count": match_result['missing_second_count'],
+                    "missing_first": match_result['missing_first'],
+                    "missing_second": match_result['missing_second'],
+                    "catalogue_check": catalogue_result
+                }
+            }
+
+        except Exception as e:
+            # Broad catch is deliberate: this check is best-effort and must
+            # never break the review pipeline. The failure is logged with a
+            # traceback and surfaced in the result payload instead.
+            execution_time = time.time() - start_time
+            error_msg = f"[{name}] 检查失败: {str(e)}"
+            logger.error(error_msg, exc_info=True)
+
+            # Zeroed counters on failure so consumers can still read the
+            # same schema without key checks.
+            return {
+                "success": False,
+                "execution_time": execution_time,
+                "error": str(e),
+                "details": {
+                    "name": name,
+                    "missing_first_count": 0,
+                    "missing_second_count": 0,
+                    "missing_first": [],
+                    "missing_second": [],
+                    "catalogue_check": {}
+                }
+            }
+
+
     async def check_sensitive(self, trace_id_idx: str, review_content: str,
                             state: str, stage_name: str) -> Dict[str, Any]:
         """

+ 388 - 0
core/construction_review/component/outline_catalogue_matcher.py

@@ -0,0 +1,388 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+"""
+目录缺失检查 - 模糊匹配模块
+
+独立模块,用于 AIReviewEngine.check_outline_catalogue 方法
+提供基于模糊匹配的目录缺失统计功能
+"""
+
+import difflib
+import re
+from typing import Dict, List, Optional, Set, Tuple, Any
+from collections import defaultdict
+from pathlib import Path
+
+import pandas as pd
+
+
+class OutlineCatalogueMatcher:
+    """
+    Fuzzy matcher for document catalogues.
+    
+    Stand-alone matching facility (independent of
+    LightweightCompletenessChecker) that matches outline entries against a
+    standard category table by name similarity.
+    """
+    
+    def __init__(self, standard_csv_path: str, raw_content_csv_path: str = None):
+        """
+        Initialize the matcher and eagerly load the CSV tables.
+        
+        Args:
+            standard_csv_path: Path to StandardCategoryTable.csv.
+            raw_content_csv_path: Path to construction_plan_standards.csv
+                (optional; enables definition-text based bonus scoring).
+        """
+        self.standard_csv_path = standard_csv_path
+        self.raw_content_csv_path = raw_content_csv_path
+        
+        # Standard-table lookups populated by _load_standard_csv().
+        self.first_names: Dict[str, str] = {}  # code -> name
+        self.second_names: Dict[Tuple[str, str], str] = {}  # (first_code, second_code) -> name
+        self.first_seq: Dict[str, int] = {}  # code -> seq
+        self.second_seq: Dict[Tuple[str, str], int] = {}  # (first_code, second_code) -> seq
+        
+        # Detailed definition text per category (optional table).
+        self.second_raw_content: Dict[Tuple[str, str], str] = {}  # (first_name, second_name) -> content
+        
+        self._load_standard_csv()
+        if raw_content_csv_path:
+            self._load_raw_content_csv()
+    
+    def _load_standard_csv(self) -> None:
+        """Load the standard category table, trying several encodings.
+
+        Raises:
+            ValueError: if the file cannot be decoded with any candidate
+                encoding.
+        """
+        encodings = ['utf-8-sig', 'utf-16', 'gbk', 'utf-8']
+        df = None
+        
+        for encoding in encodings:
+            try:
+                # sep=None with the python engine lets pandas sniff the
+                # delimiter (the table may be comma- or tab-separated).
+                df = pd.read_csv(self.standard_csv_path, encoding=encoding, sep=None, engine='python')
+                break
+            except UnicodeDecodeError:
+                continue
+        
+        if df is None:
+            raise ValueError(f"无法读取CSV文件: {self.standard_csv_path}")
+        
+        # Normalize header names so lookups below are case/space tolerant.
+        df.columns = [c.strip().lower().replace(' ', '_') for c in df.columns]
+        
+        # Extract first- and second-level entries (first occurrence wins).
+        for _, row in df.iterrows():
+            first_code = str(row.get('first_code', '')).strip()
+            second_code = str(row.get('second_code', '')).strip()
+            first_name = str(row.get('first_name', '')).strip()
+            second_name = str(row.get('second_name', '')).strip()
+            
+            # Skip rows missing any of the four key fields.
+            if not all([first_code, second_code, first_name, second_name]):
+                continue
+            
+            try:
+                first_seq = int(row.get('first_seq', 0) or 0)
+                second_seq = int(row.get('second_seq', 0) or 0)
+            except:  # NOTE(review): bare except — prefer (TypeError, ValueError)
+                first_seq = 0
+                second_seq = 0
+            
+            # Store first-level info (deduplicated by code).
+            if first_code not in self.first_names:
+                self.first_names[first_code] = first_name
+                self.first_seq[first_code] = first_seq
+            
+            # Store second-level info (deduplicated by code pair).
+            sec_key = (first_code, second_code)
+            if sec_key not in self.second_names:
+                self.second_names[sec_key] = second_name
+                self.second_seq[sec_key] = second_seq
+    
+    def _load_raw_content_csv(self) -> None:
+        """Load the detailed-definition table (best-effort; optional)."""
+        try:
+            encodings = ['utf-8-sig', 'utf-16', 'gbk', 'utf-8']
+            df = None
+            
+            for encoding in encodings:
+                try:
+                    df = pd.read_csv(self.raw_content_csv_path, encoding=encoding, sep=None, engine='python')
+                    break
+                except UnicodeDecodeError:
+                    continue
+            
+            # Silently give up if the file could not be decoded at all.
+            if df is None:
+                return
+            
+            df.columns = [c.strip().lower().replace(' ', '_') for c in df.columns]
+            
+            # Table without the definition column is useless here.
+            if 'second_raw_content' not in df.columns:
+                return
+            
+            for _, row in df.iterrows():
+                first_name = str(row.get('first_name', '')).strip()
+                second_name = str(row.get('second_name', '')).strip()
+                raw_content = str(row.get('second_raw_content', '')).strip()
+                
+                # 'nan' filters out pandas NaN cells after str() conversion.
+                if first_name and second_name and raw_content and raw_content != 'nan':
+                    self.second_raw_content[(first_name, second_name)] = raw_content
+                    
+        except Exception:
+            pass  # Best-effort load; failure must not break matching.
+    
+    def _normalize_text(self, text: str) -> str:
+        """Normalize text: strip whitespace/punctuation and lowercase."""
+        if not text:
+            return ""
+        text = re.sub(r'[\s\n\r\t.,;:!?,。;:!?、""''()()【】\[\]《》<>]', '', text)
+        return text.lower().strip()
+    
+    def _calculate_similarity(self, text1: str, text2: str) -> float:
+        """Return the SequenceMatcher ratio of the two normalized texts."""
+        if not text1 or not text2:
+            return 0.0
+        
+        norm1 = self._normalize_text(text1)
+        norm2 = self._normalize_text(text2)
+        
+        if not norm1 or not norm2:
+            return 0.0
+        
+        return difflib.SequenceMatcher(None, norm1, norm2).ratio()
+    
+    def _extract_keywords(self, text: str) -> List[str]:
+        """Extract keyword characters from text, dropping stopwords.
+
+        NOTE(review): this iterates per *character*, so the multi-character
+        stopwords in the set (e.g. '编制', '施工') can never match a single
+        character and are effectively dead entries; only the one-character
+        stopwords are actually filtered — confirm whether word-level
+        segmentation was intended.
+        """
+        stopwords = {'的', '及', '与', '或', '和', '等', '之', '第', '章', '节', '条',
+                     '编制', '施工', '措施', '要求', '管理', '保证', '质量', '安全',
+                     '技术', '计划', '人员', '组织', '体系', '条件', '概述', '概况'}
+        
+        words = []
+        for word in text:
+            if word not in stopwords and len(word.strip()) > 0:
+                words.append(word)
+        
+        # Fallback: if everything was filtered, use all characters.
+        if not words and text:
+            return list(text)
+        
+        return words
+    
+    def _calculate_enhanced_similarity(
+        self,
+        standard_name: str,
+        actual_title: str,
+        standard_raw_content: str = None
+    ) -> float:
+        """
+        Enhanced similarity score, dominated by the base similarity.
+        
+        Strategy:
+        1. Base similarity (SequenceMatcher) — core; must be >= 0.3 before
+           any bonus is applied.
+        2. Keyword-overlap bonus (up to +0.2).
+        3. Containment bonus (+0.1).
+        4. Detailed-definition bonus (up to +0.2).
+        
+        Rule: if base similarity < 0.3, return the base score as-is so that
+        completely unrelated titles cannot be matched via bonuses. The
+        final score is capped at 1.0.
+        """
+        if not standard_name or not actual_title:
+            return 0.0
+        
+        # 1. Base similarity (core signal).
+        base_similarity = self._calculate_similarity(standard_name, actual_title)
+        
+        # Too dissimilar: skip the bonus stage entirely.
+        if base_similarity < 0.3:
+            return base_similarity
+        
+        # Base similarity qualifies — accumulate bonuses.
+        scores = [base_similarity]
+        
+        norm_standard = self._normalize_text(standard_name)
+        norm_actual = self._normalize_text(actual_title)
+        
+        # 2. Keyword overlap (weight 0.2; lowered from an earlier 0.3 so
+        #    keywords cannot dominate the score).
+        keyword_bonus = 0.0
+        standard_keywords = self._extract_keywords(norm_standard)
+        actual_keywords = self._extract_keywords(norm_actual)
+        
+        if standard_keywords and actual_keywords:
+            # Jaccard overlap of the keyword sets.
+            matched = len(set(standard_keywords) & set(actual_keywords))
+            total = len(set(standard_keywords) | set(actual_keywords))
+            if total > 0:
+                keyword_bonus = (matched / total) * 0.2
+        
+        scores.append(keyword_bonus)
+        
+        # 3. Substring containment (weight 0.1; lowered from earlier).
+        contain_bonus = 0.0
+        if norm_standard in norm_actual or norm_actual in norm_standard:
+            contain_bonus = 0.1
+        scores.append(contain_bonus)
+        
+        # 4. Detailed-definition similarity (weight 0.2; only counted when
+        #    the definition text is clearly related, threshold 0.6).
+        if standard_raw_content and standard_raw_content != 'nan':
+            raw_content_score = self._calculate_similarity(
+                self._normalize_text(standard_raw_content),
+                norm_actual
+            )
+            if raw_content_score > 0.6:
+                scores.append(raw_content_score * 0.2)
+        
+        return min(sum(scores), 1.0)
+    
+    def match_catalogue(
+        self,
+        outline_first: Set[str],
+        outline_secondary: Dict[Tuple[str, str], str],
+        threshold: float = 0.6
+    ) -> Dict[str, Any]:
+        """
+        Run the catalogue match against the loaded standard table.
+        
+        First-level matching is exact (set intersection on codes only);
+        second-level matching tries exact code-pair matches first, then
+        fuzzy title matching on the remainder.
+        
+        Args:
+            outline_first: First-level codes extracted from the outline.
+            outline_secondary: {(first_code, second_code): title} extracted
+                from the outline.
+            threshold: Fuzzy-match acceptance threshold (default 0.6).
+            
+        Returns:
+            Match result dict containing:
+            - matched_first: set of matched first-level codes
+            - matched_second: set of matched second-level key pairs
+            - missing_first: list of missing first-level detail dicts
+            - missing_second: list of missing second-level detail dicts
+            - missing_first_count / missing_second_count: counters
+            - match_details: per-entry match diagnostics
+        """
+        required_first = set(self.first_names.keys())
+        required_second = set(self.second_names.keys())
+        
+        # First level: exact code intersection only (no fuzzy matching).
+        matched_first = outline_first & required_first
+        missing_first = required_first - matched_first
+        
+        # Second level: exact first, fuzzy on what remains.
+        matched_second = set()
+        missing_second = set()
+        match_details = []
+        
+        # Exact (first_code, second_code) matches.
+        outline_second_keys = set(outline_secondary.keys())
+        exact_matches = outline_second_keys & required_second
+        matched_second.update(exact_matches)
+        
+        for key in exact_matches:
+            first_code, second_code = key
+            match_details.append({
+                'level': 'second',
+                'required_first_code': first_code,
+                'required_second_code': second_code,
+                'required_second_name': self.second_names.get(key, ''),
+                'matched': True,
+                'match_type': 'exact',
+                'similarity': 1.0
+            })
+        
+        # Fuzzy matching for entries not matched exactly.
+        required_remaining = required_second - exact_matches
+        outline_remaining = outline_second_keys - exact_matches
+        
+        if required_remaining and outline_remaining:
+            # Flatten the remaining outline entries for scoring.
+            outline_list = []
+            for key in outline_remaining:
+                first_code, second_code = key
+                title = outline_secondary.get(key, "")
+                outline_list.append({
+                    'key': key,
+                    'first_code': first_code,
+                    'second_code': second_code,
+                    'title': title
+                })
+            
+            # Score every remaining required entry against every remaining
+            # outline title and keep the best candidate.
+            for req_key in required_remaining:
+                first_code, second_code = req_key
+                second_name = self.second_names.get(req_key, '')
+                first_name = self.first_names.get(first_code, '')
+                
+                # Optional detailed definition text for bonus scoring.
+                raw_content = self.second_raw_content.get((first_name, second_name))
+                
+                best_match = None
+                best_score = 0.0
+                
+                for item in outline_list:
+                    # Score against the bare name and against the combined
+                    # "first + second" name; take the better of the two.
+                    score1 = self._calculate_enhanced_similarity(second_name, item['title'])
+                    score2 = self._calculate_enhanced_similarity(
+                        f"{first_name}{second_name}",
+                        item['title']
+                    )
+                    score = max(score1, score2)
+                    
+                    # Also try with the detailed definition, if available.
+                    if raw_content:
+                        score3 = self._calculate_enhanced_similarity(
+                            second_name,
+                            item['title'],
+                            raw_content
+                        )
+                        score = max(score, score3)
+                    
+                    if score > best_score:
+                        best_score = score
+                        best_match = item
+                
+                if best_score >= threshold:
+                    matched_second.add(req_key)
+                    match_details.append({
+                        'level': 'second',
+                        'required_first_code': first_code,
+                        'required_second_code': second_code,
+                        'required_second_name': second_name,
+                        'matched': True,
+                        'match_type': 'fuzzy',
+                        'similarity': best_score,
+                        'matched_title': best_match['title'] if best_match else None,
+                        'used_raw_content': raw_content is not None
+                    })
+                else:
+                    missing_second.add(req_key)
+                    match_details.append({
+                        'level': 'second',
+                        'required_first_code': first_code,
+                        'required_second_code': second_code,
+                        'required_second_name': second_name,
+                        'matched': False,
+                        'match_type': 'none',
+                        'similarity': best_score
+                    })
+        else:
+            # Either side empty: every remaining required entry is missing.
+            # NOTE(review): no match_details records are emitted on this
+            # path, unlike the fuzzy branch — confirm that is acceptable.
+            missing_second = required_remaining
+        
+        # Build missing-entry detail lists, ordered by table sequence.
+        missing_first_details = []
+        for code in sorted(missing_first, key=lambda x: self.first_seq.get(x, 0)):
+            missing_first_details.append({
+                'first_code': code,
+                'first_name': self.first_names.get(code, code),
+                'first_seq': self.first_seq.get(code, 0)
+            })
+        
+        missing_second_details = []
+        for key in sorted(missing_second, key=lambda x: (self.first_seq.get(x[0], 0), self.second_seq.get(x, 0))):
+            first_code, second_code = key
+            missing_second_details.append({
+                'first_code': first_code,
+                'first_name': self.first_names.get(first_code, first_code),
+                'first_seq': self.first_seq.get(first_code, 0),
+                'secondary_code': second_code,
+                'secondary_name': self.second_names.get(key, ''),
+                'second_seq': self.second_seq.get(key, 0)
+            })
+        
+        return {
+            'matched_first': matched_first,
+            'matched_second': matched_second,
+            'missing_first': missing_first_details,
+            'missing_second': missing_second_details,
+            'missing_first_count': len(missing_first),
+            'missing_second_count': len(missing_second),
+            'match_details': match_details
+        }

+ 14 - 5
core/construction_review/component/reviewers/completeness_reviewer.py

@@ -355,7 +355,9 @@ JSON输出:"""
         second_name: str = None,
         tertiary_items: List[TertiaryItem] = None,
         outline_title: str = None,
-        timeout: int = 30
+        timeout: int = 30,
+        first_seq: int = 0,
+        second_seq: int = 0
     ) -> Dict[str, str]:
         """
         使用大模型生成建议
@@ -905,7 +907,8 @@ JSON输出:"""
                     level="一级",
                     first_code=first_code,
                     first_name=first_name,
-                    first_seq=first_seq
+                    first_seq=first_seq,
+                    second_seq=0
                 )
 
                 if llm_result and llm_result.get("suggestion"):
@@ -945,7 +948,9 @@ JSON输出:"""
                         first_code=cat1,
                         first_name=first_name,
                         second_code=cat2,
-                        second_name=second_name
+                        second_name=second_name,
+                        first_seq=first_seq,
+                        second_seq=second_seq
                     )
 
                     if llm_result and llm_result.get("suggestion"):
@@ -988,7 +993,9 @@ JSON输出:"""
                     first_name=first_name,
                     second_code=cat2,
                     second_name=second_name,
-                    tertiary_items=missing_t_items
+                    tertiary_items=missing_t_items,
+                    first_seq=first_seq,
+                    second_seq=second_seq
                 )
 
                 if llm_result and llm_result.get("suggestion"):
@@ -1029,7 +1036,9 @@ JSON输出:"""
                     first_code="",
                     first_name=f_name,
                     second_name=sec_title,
-                    outline_title=sec_title
+                    outline_title=sec_title,
+                    first_seq=0,
+                    second_seq=0
                 )
 
                 if llm_result and llm_result.get("suggestion"):

+ 104 - 0
core/construction_review/component/reviewers/utils/inter_tool.py

@@ -344,6 +344,110 @@ class InterTool:
                 logger.info(f"🔍 内容时效性审查结果处理完成,添加 {len(batch_results)} 个问题项")
                 continue
 
+            # 🔧 特殊处理:outline_catalogue_check 的返回格式(目录一二级缺失统计)
+            if check_key == 'outline_catalogue_check' and isinstance(check_result, dict):
+                details = check_result.get('details', {})
+                missing_first = details.get('missing_first', [])
+                missing_second = details.get('missing_second', [])
+                missing_first_count = details.get('missing_first_count', 0)
+                missing_second_count = details.get('missing_second_count', 0)
+                
+                logger.debug(f"🔍 [DEBUG] 处理目录缺失统计结果,缺失一级: {missing_first_count}, 缺失二级: {missing_second_count}")
+                
+                # 如果没有缺失目录,添加一个通过记录
+                if not missing_first and not missing_second:
+                    review_lists.append({
+                        "check_item": "outline_catalogue_check",
+                        "chapter_code": chapter_code,
+                        "check_item_code": f"{chapter_code}_outline_catalogue_check",
+                        "check_result": {
+                            "issue_point": "目录结构完整",
+                            "location": "整篇文档",
+                            "suggestion": "无",
+                            "reason": "一二级目录结构符合标准规范要求",
+                            "risk_level": "low"
+                        },
+                        "exist_issue": False,
+                        "risk_info": {"risk_level": "low"}
+                    })
+                else:
+                    # 有缺失目录时,先生成汇总统计
+                    total_missing = missing_first_count + missing_second_count
+                    
+                    # 构建缺失目录名称列表
+                    missing_first_names = [item.get('first_name', '未知') for item in missing_first if isinstance(item, dict)]
+                    missing_second_names = [f"{item.get('first_name', '')}.{item.get('secondary_name', '未知')}" for item in missing_second if isinstance(item, dict)]
+                    
+                    # 构建建议文本
+                    suggestion_parts = []
+                    if missing_first_names:
+                        suggestion_parts.append(f"一级目录({missing_first_count}个):{', '.join(missing_first_names)}")
+                    if missing_second_names:
+                        suggestion_parts.append(f"二级目录({missing_second_count}个):{', '.join(missing_second_names)}")
+                    suggestion_text = "建议补充以下缺失目录:\n" + "\n".join(suggestion_parts) if suggestion_parts else "无"
+                    
+                    # 添加汇总统计问题(放在最前面)
+                    review_lists.append({
+                        "check_item": "outline_catalogue_check",
+                        "chapter_code": chapter_code,
+                        "check_item_code": f"{chapter_code}_outline_catalogue_check",
+                        "check_result": {
+                            "issue_point": f"目录缺失汇总统计(共缺失 {total_missing} 个目录)",
+                            "location": "整篇文档",
+                            "suggestion": suggestion_text,
+                            "reason": f"根据标准分类表对比,共发现 {total_missing} 个缺失目录:缺失一级 {missing_first_count} 个,缺失二级 {missing_second_count} 个",
+                            "risk_level": "medium",
+                            "summary": {
+                                "missing_first_count": missing_first_count,
+                                "missing_second_count": missing_second_count,
+                                "missing_total": total_missing,
+                                "missing_first_names": missing_first_names,
+                                "missing_second_names": missing_second_names
+                            }
+                        },
+                        "exist_issue": True,
+                        "risk_info": {"risk_level": "medium"}
+                    })
+                    
+                    # 然后逐个添加详细的缺失目录问题
+                    for item in missing_first:
+                        if isinstance(item, dict):
+                            review_lists.append({
+                                "check_item": "outline_catalogue_check",
+                                "chapter_code": chapter_code,
+                                "check_item_code": f"{chapter_code}_outline_catalogue_check",
+                                "check_result": {
+                                    "issue_point": f"缺失一级目录:{item.get('first_name', '未知')}",
+                                    "location": f"{item.get('first_seq', '')}. {item.get('first_name', '')}",
+                                    "suggestion": f"补充一级目录:{item.get('first_name', '')}(编码:{item.get('first_code', '')})",
+                                    "reason": "根据标准分类表,该一级目录应当出现但未找到",
+                                    "risk_level": "medium"
+                                },
+                                "exist_issue": True,
+                                "risk_info": {"risk_level": "medium"}
+                            })
+                    
+                    for item in missing_second:
+                        if isinstance(item, dict):
+                            review_lists.append({
+                                "check_item": "outline_catalogue_check",
+                                "chapter_code": chapter_code,
+                                "check_item_code": f"{chapter_code}_outline_catalogue_check",
+                                "check_result": {
+                                    "issue_point": f"缺失二级目录:{item.get('secondary_name', '未知')}",
+                                    "location": f"{item.get('first_seq', '')}.{item.get('second_seq', '')} {item.get('first_name', '')} > {item.get('secondary_name', '')}",
+                                    "suggestion": f"补充二级目录:{item.get('secondary_name', '')}(编码:{item.get('secondary_code', '')})",
+                                    "reason": f"在'{item.get('first_name', '未知')}'章节下,该二级目录应当出现但未找到",
+                                    "risk_level": "medium"
+                                },
+                                "exist_issue": True,
+                                "risk_info": {"risk_level": "medium"}
+                            })
+                
+                total_missing = missing_first_count + missing_second_count
+                logger.info(f"🔍 目录缺失统计处理完成,缺失一级: {missing_first_count}, 缺失二级: {missing_second_count}, 共生成 {len(review_lists)} 个问题项(含汇总)")
+                continue
+
             # 🔧 类型安全检查:支持字典和 base_reviewer.ReviewResult 对象
             is_dict = isinstance(check_result, dict)
             is_review_result = hasattr(check_result, 'details') and hasattr(check_result, 'success')

+ 11 - 2
core/construction_review/workflows/ai_review_workflow.py

@@ -298,7 +298,8 @@ class AIReviewWorkflow:
                 'reference_check': 'reference_basis_reviewer',
                 'sensitive_check': 'check_sensitive',
                 'non_parameter_compliance_check': 'check_non_parameter_compliance',
-                'parameter_compliance_check': 'check_parameter_compliance'
+                'parameter_compliance_check': 'check_parameter_compliance',
+                'outline_catalogue_check': 'check_outline_catalogue'  # 目录一二级缺失检查(模糊匹配)
             }
 
             # 获取审查项配置
@@ -457,10 +458,18 @@ class AIReviewWorkflow:
             # 主流程完成后,串行处理 catalogue(目录审查)
             # 注意:catalogue 是系统强制添加的审查单元,已计入 total_chunks
             logger.info("开始处理目录审查(catalogue)")
+            # 从配置中获取 catalogue 章节的方法列表,默认包含 check_completeness 和 outline_catalogue_check
+            catalogue_funcs = review_item_dict_sorted.get("catalogue", ["check_completeness", "outline_catalogue_check"])
+            # 确保 check_completeness 在列表中(向后兼容)
+            if "check_completeness" not in catalogue_funcs:
+                catalogue_funcs = ["check_completeness"] + catalogue_funcs
+            # 确保 outline_catalogue_check 在列表中(新增目录缺失统计)
+            if "outline_catalogue_check" not in catalogue_funcs:
+                catalogue_funcs.append("outline_catalogue_check")
             chunks_completed, all_issues = await self.core_fun._process_chapter_item(
                 "catalogue",                 # chapter_code
                 catalogue,                   # chapter_content
-                ["check_completeness"],      # func_names
+                catalogue_funcs,             # func_names(从配置获取)
                 state,
                 all_issues,
                 completed_chunks,

+ 47 - 4
core/construction_review/workflows/core_functions/ai_review_core_fun.py

@@ -354,7 +354,18 @@ class AIReviewCoreFun:
         """
       
         # 从ai_review_engine获取对应的方法
-        if not hasattr(self.ai_review_engine, func_name):
+        # 方法名映射:配置名 -> 实际方法名
+        # 用于处理配置标识名与AIReviewEngine方法名不一致的情况
+        method_name_mapping = {
+            'outline_catalogue_check': 'check_outline_catalogue',
+        }
+
+        # 转换方法名(如果存在映射)
+        actual_method_name = method_name_mapping.get(func_name, func_name)
+        original_func_name = func_name
+
+        # 从ai_review_engine获取对应的方法
+        if not hasattr(self.ai_review_engine, actual_method_name):
             logger.warning(f"AIReviewEngine中未找到方法: {func_name}")
             # 返回错误结果的 UnitReviewResult
             return UnitReviewResult(
@@ -367,16 +378,16 @@ class AIReviewCoreFun:
                 is_sse_push=True
             )
 
-        method = getattr(self.ai_review_engine, func_name)
+        method = getattr(self.ai_review_engine, actual_method_name)
 
         # 基础参数
         trace_id = f"{state['callback_task_id']}_{chapter_code}_chunk{chunk_index}"
-        stage_name = f"{chapter_code}_{func_name}"
+        stage_name = f"{chapter_code}_{original_func_name}"
 
         # 获取块内容
         review_content = chunk.get("content", "")
         is_complete_field = chunk.get("is_complete_field", False)
-        logger.debug(f"执行审查: {trace_id} -> {func_name}")
+        logger.debug(f"执行审查: {trace_id} -> {original_func_name}")
 
         # 根据func_name构建对应的参数并调用
         if func_name == "sensitive_word_check" and not is_complete_field:
@@ -571,6 +582,38 @@ class AIReviewCoreFun:
                 is_sse_push=True
             )
 
+        elif original_func_name == "outline_catalogue_check":
+            # 目录一二级缺失检查(模糊匹配)- 针对整个文档的 outline 进行检查
+            outline_data = state.get("structured_content", {})
+            outline_result = await self.ai_review_engine.check_outline_catalogue(
+                trace_id_idx=trace_id,
+                outline_data=outline_data,
+                state=state,
+                stage_name=stage_name
+            )
+            
+            # 计算风险等级:如果有缺失目录则标记为 medium
+            overall_risk = "low"
+            if outline_result.get("success"):
+                missing_count = (
+                    outline_result.get("details", {}).get("missing_first_count", 0) +
+                    outline_result.get("details", {}).get("missing_second_count", 0)
+                )
+                if missing_count > 0:
+                    overall_risk = "medium"
+            else:
+                overall_risk = "error"
+            
+            return UnitReviewResult(
+                unit_index=chunk_index,
+                unit_content=chunk,
+                basic_compliance={"outline_catalogue_check": outline_result},
+                technical_compliance={},
+                rag_enhanced={},
+                overall_risk=overall_risk,
+                is_sse_push=True
+            )
+
         else:
             # 处理 check_completeness 但 is_complete_field=False 的情况
             if func_name == "check_completeness" and not is_complete_field:

+ 2 - 2
views/construction_review/launch_review.py

@@ -190,8 +190,8 @@ def validate_review_item_config(review_item_config: List[str]) -> None:
             invalid_chapter.append(chapter_code)
             continue  # 章节不支持时不继续检查审查项
 
-        # 5. 特殊规则:目录章节只能使用完整性审查
-        if chapter_code == "catalogue" and review_dim != "completeness_check":
+        # 5. 特殊规则:目录章节只能使用完整性审查或目录缺失统计
+        if chapter_code == "catalogue" and review_dim not in ["completeness_check", "outline_catalogue_check"]:
             catalogue_invalid.append(item)
             continue  # 目录章节违反规则时不继续检查