chenkun 1 месяц назад
Родитель
Commit
93f9312efe
3 измененных файлов с 755 добавлено и 184 удалено
  1. 680 154
      full_server.py
  2. 3 1
      scripts/fix_db_indexes.py
  3. 72 29
      scripts/miner_u.py

+ 680 - 154
full_server.py

@@ -15,13 +15,53 @@ sys.path.insert(0, os.path.join(os.path.dirname(__file__), 'src'))
 from dotenv import load_dotenv
 from dotenv import load_dotenv
 load_dotenv()
 load_dotenv()
 
 
-from fastapi import FastAPI, HTTPException, Depends, Request, Response
+from fastapi import FastAPI, HTTPException, Depends, Request, Response, BackgroundTasks
+from fastapi.responses import HTMLResponse, JSONResponse
 from fastapi.middleware.cors import CORSMiddleware
 from fastapi.middleware.cors import CORSMiddleware
 from fastapi.security import HTTPBearer, HTTPAuthorizationCredentials
 from fastapi.security import HTTPBearer, HTTPAuthorizationCredentials
 from pydantic import BaseModel
 from pydantic import BaseModel
 from typing import Optional, Any, Union
 from typing import Optional, Any, Union
 import hashlib
 import hashlib
 import secrets
 import secrets
+import requests
+from urllib.parse import urlparse
+
# Map of MIME types to file extensions; used as a fallback when the URL
# path itself does not reveal a usable extension.
MIME_MAP = {
    'application/pdf': '.pdf',
    'application/vnd.openxmlformats-officedocument.wordprocessingml.document': '.docx',
    'application/msword': '.doc',
    'application/vnd.openxmlformats-officedocument.spreadsheetml.sheet': '.xlsx',
    'application/vnd.ms-excel': '.xls',
    'application/vnd.openxmlformats-officedocument.presentationml.presentation': '.pptx',
    'application/vnd.ms-powerpoint': '.ppt',
    'text/markdown': '.md',
    'text/plain': '.txt',
    'text/html': '.html',
    'image/jpeg': '.jpg',
    'image/png': '.png',
    'application/zip': '.zip',
}

def detect_file_extension(url: str) -> str:
    """Detect a file's extension from its URL.

    Tries to read the extension straight from the URL path first; if that
    fails, issues a HEAD request and maps the Content-Type header through
    MIME_MAP.

    Args:
        url: File URL to inspect; may be empty or None-ish (falsy).

    Returns:
        The extension including the leading dot (e.g. ".pdf"), or ""
        when it cannot be determined.
    """
    if not url:
        return ""

    # 1. Try to parse the extension from the URL path (query string is
    #    already stripped by urlparse).
    path = urlparse(url).path
    ext = os.path.splitext(path)[1].lower()
    # Reject implausibly long "extensions" (dots inside ordinary tokens).
    if ext and len(ext) <= 6:
        return ext

    # 2. Fall back to a HEAD request and inspect Content-Type.
    try:
        response = requests.head(url, allow_redirects=True, timeout=5)
        # Fix: MIME types are case-insensitive (RFC 2045) — normalize to
        # lowercase so e.g. "Application/PDF" still maps to ".pdf".
        content_type = response.headers.get('Content-Type', '').split(';')[0].strip().lower()
        return MIME_MAP.get(content_type, "")
    except Exception as e:
        # Best-effort: any network failure just means "extension unknown".
        print(f"检测文件后缀失败: {e}")
        return ""
 # 修复JWT导入 - 确保使用正确的JWT库
 # 修复JWT导入 - 确保使用正确的JWT库
 try:
 try:
     # 首先尝试使用PyJWT
     # 首先尝试使用PyJWT
@@ -95,6 +135,75 @@ TABLE_MAP = {
     "job": "t_job_of_preparation"      # 办公制度
     "job": "t_job_of_preparation"      # 办公制度
 }
 }
 
 
def get_db_connection():
    """Open a MySQL connection configured from the DATABASE_URL env var.

    Returns:
        A pymysql connection, or None when DATABASE_URL is unset/empty or
        the connection attempt fails (errors are printed, never raised).
    """
    try:
        database_url = os.getenv('DATABASE_URL', '')
        if not database_url:
            return None

        parsed = urlparse(database_url)
        config = {
            'host': parsed.hostname or 'localhost',
            'port': parsed.port or 3306,
            'user': parsed.username or 'root',
            'password': parsed.password or '',
            # parsed.path includes the leading '/', hence the slice.
            'database': parsed.path[1:] if parsed.path else 'sso_db',
            'charset': 'utf8mb4'
        }

        return pymysql.connect(**config)
    except Exception as e:
        print(f"数据库连接失败: {e}")
        return None

# --- Master-table bootstrap ---
def init_master_table():
    """Create the t_document_main master table if it does not exist.

    Best-effort bootstrap executed at import time: when no database is
    reachable it returns silently, and any DDL failure is printed and
    swallowed so the server can still start.
    """
    conn = get_db_connection()
    if not conn:
        return
    cursor = None
    try:
        cursor = conn.cursor()
        # Create the master table (no-op when it already exists).
        cursor.execute("""
            CREATE TABLE IF NOT EXISTS t_document_main (
                id CHAR(36) PRIMARY KEY,
                title VARCHAR(255) NOT NULL,
                standard_no VARCHAR(100),
                issuing_authority VARCHAR(255),
                release_date DATE,
                document_type VARCHAR(100),
                professional_field VARCHAR(100),
                validity VARCHAR(50) DEFAULT '现行',
                created_by VARCHAR(100),
                created_time DATETIME DEFAULT CURRENT_TIMESTAMP,
                updated_time DATETIME DEFAULT CURRENT_TIMESTAMP ON UPDATE CURRENT_TIMESTAMP,
                conversion_status TINYINT DEFAULT 0, -- 0:待转化, 1:转化中, 2:已完成, 3:失败
                conversion_progress INT DEFAULT 0,
                converted_file_name VARCHAR(255),
                conversion_error TEXT,
                whether_to_enter TINYINT DEFAULT 0, -- 0:未入库, 1:已入库
                source_type ENUM('basis', 'work', 'job') NOT NULL,
                source_id CHAR(36) NOT NULL,
                file_url TEXT,
                file_extension VARCHAR(10),
                content TEXT,
                primary_category_id INT,
                secondary_category_id INT,
                year INT
            ) ENGINE=InnoDB DEFAULT CHARSET=utf8mb4;
        """)
        conn.commit()
        print("✅ 主表 t_document_main 初始化成功")
    except Exception as e:
        print(f"❌ 初始化主表失败: {e}")
    finally:
        # Fix: close the cursor as well as the connection (it previously
        # leaked when the connection outlived this call).
        if cursor:
            cursor.close()
        conn.close()

# Run the bootstrap at import time.
init_master_table()
+
 def get_table_name(table_type: Optional[str]) -> str:
 def get_table_name(table_type: Optional[str]) -> str:
     """根据类型获取对应的数据库表名,默认为编制依据"""
     """根据类型获取对应的数据库表名,默认为编制依据"""
     return TABLE_MAP.get(table_type, "t_basis_of_preparation")
     return TABLE_MAP.get(table_type, "t_basis_of_preparation")
@@ -105,14 +214,29 @@ class DocumentAdd(BaseModel):
     primary_category_id: Optional[Any] = None
     primary_category_id: Optional[Any] = None
     secondary_category_id: Optional[Any] = None
     secondary_category_id: Optional[Any] = None
     year: Optional[int] = None
     year: Optional[int] = None
-    table_type: Optional[str] = "basis" # 增加表类型参数
+    table_type: Optional[str] = "basis"
+    # 新增编辑需要的字段
+    id: Optional[str] = None
+    source_id: Optional[str] = None
+    # 扩展字段 (子表特有属性)
+    standard_no: Optional[str] = None
+    issuing_authority: Optional[str] = None
+    release_date: Optional[str] = None
+    document_type: Optional[str] = None
+    professional_field: Optional[str] = None
+    validity: Optional[str] = None
+    project_name: Optional[str] = None
+    project_section: Optional[str] = None
+    # 文件相关字段
+    file_url: Optional[str] = None
+    file_extension: Optional[str] = None
 
 
 class DocumentListRequest(BaseModel):
 class DocumentListRequest(BaseModel):
-    primaryCategoryId: Optional[int] = None
-    secondaryCategoryId: Optional[int] = None
     page: int = 1
     page: int = 1
     size: int = 50
     size: int = 50
-    sort_by: str = "created_at"  # created_at or updated_at
+    keyword: Optional[str] = None
+    table_type: Optional[str] = None
+    whether_to_enter: Optional[int] = None
 
 
 # 配置
 # 配置
 JWT_SECRET_KEY = os.getenv("JWT_SECRET_KEY", "dev-jwt-secret-key-12345")
 JWT_SECRET_KEY = os.getenv("JWT_SECRET_KEY", "dev-jwt-secret-key-12345")
@@ -134,28 +258,6 @@ def find_available_port(start_port=8000, max_port=8010):
             return port
             return port
     return None
     return None
 
 
-def get_db_connection():
-    """获取数据库连接"""
-    try:
-        database_url = os.getenv('DATABASE_URL', '')
-        if not database_url:
-            return None
-            
-        parsed = urlparse(database_url)
-        config = {
-            'host': parsed.hostname or 'localhost',
-            'port': parsed.port or 3306,
-            'user': parsed.username or 'root',
-            'password': parsed.password or '',
-            'database': parsed.path[1:] if parsed.path else 'sso_db',
-            'charset': 'utf8mb4'
-        }
-        
-        return pymysql.connect(**config)
-    except Exception as e:
-        print(f"数据库连接失败: {e}")
-        return None
-
 def verify_password_simple(password: str, stored_hash: str) -> bool:
 def verify_password_simple(password: str, stored_hash: str) -> bool:
     """验证密码(简化版)"""
     """验证密码(简化版)"""
     if stored_hash.startswith("sha256$"):
     if stored_hash.startswith("sha256$"):
@@ -3553,16 +3655,16 @@ import httpx
 from fastapi.responses import HTMLResponse
 from fastapi.responses import HTMLResponse
 
 
 class BatchEnterRequest(BaseModel):
 class BatchEnterRequest(BaseModel):
-    ids: list[int]
-    table_type: Optional[str] = "basis"
+    ids: list[Union[int, str]]
+    table_type: Optional[str] = None
 
 
 class BatchDeleteRequest(BaseModel):
 class BatchDeleteRequest(BaseModel):
     ids: list[Union[int, str]]
     ids: list[Union[int, str]]
-    table_type: Optional[str] = "basis"
+    table_type: Optional[str] = None
 
 
 class ConvertRequest(BaseModel):
 class ConvertRequest(BaseModel):
     id: Union[int, str]
     id: Union[int, str]
-    table_type: Optional[str] = "basis"
+    table_type: Optional[str] = None
 
 
 # --- 文档管理中心 API ---
 # --- 文档管理中心 API ---
 
 
@@ -3640,24 +3742,53 @@ async def batch_enter_knowledge_base(req: BatchEnterRequest, credentials: HTTPAu
             return ApiResponse(code=500, message="数据库连接失败", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
             return ApiResponse(code=500, message="数据库连接失败", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
         
         
         cursor = conn.cursor()
         cursor = conn.cursor()
-        table_name = get_table_name(req.table_type)
-        # 批量更新 whether_to_enter 为 1
-        # 只更新尚未入库的数据 (whether_to_enter = 0)
+        
+        # 1. 批量更新主表 t_document_main
+        # 只更新尚未入库的数据 (whether_to_enter = 0),同时更新修改时间和修改人(如果需要)
         placeholders = ', '.join(['%s'] * len(req.ids))
         placeholders = ', '.join(['%s'] * len(req.ids))
-        sql = f"UPDATE {table_name} SET whether_to_enter = 1, updated_at = NOW() WHERE id IN ({placeholders}) AND whether_to_enter = 0"
-        cursor.execute(sql, req.ids)
-        conn.commit()
+        username = payload.get("username", "admin")
         
         
+        # 首先更新主表
+        sql_main = f"""
+            UPDATE t_document_main 
+            SET whether_to_enter = 1, updated_time = NOW() 
+            WHERE id IN ({placeholders}) AND whether_to_enter = 0
+        """
+        cursor.execute(sql_main, req.ids)
         affected_rows = cursor.rowcount
         affected_rows = cursor.rowcount
+        
+        # 2. 尝试更新对应的子表以保持同步
+        try:
+            # 查询这些 ID 对应的 source_type 和 source_id
+            cursor.execute(f"SELECT id, source_type, source_id FROM t_document_main WHERE id IN ({placeholders})", req.ids)
+            docs = cursor.fetchall()
+            
+            for doc_row in docs:
+                d_id, s_type, s_id = doc_row
+                if s_type and s_id:
+                    sub_table = get_table_name(s_type)
+                    if sub_table:
+                        # 更新子表中的 whether_to_enter 字段(如果存在)
+                        # 注意:子表中的主键可能是 id 且值为 s_id
+                        sub_sql = f"UPDATE {sub_table} SET whether_to_enter = 1, updated_at = NOW(), updated_by = %s WHERE id = %s"
+                        try:
+                            cursor.execute(sub_sql, (username, s_id))
+                        except Exception as sub_e:
+                            print(f"更新子表 {sub_table} 失败 (可能字段不存在): {sub_e}")
+        except Exception as sync_e:
+            print(f"同步更新子表失败: {sync_e}")
+
+        conn.commit()
         cursor.close()
         cursor.close()
         conn.close()
         conn.close()
         
         
         message = f"成功将 {affected_rows} 条数据加入知识库"
         message = f"成功将 {affected_rows} 条数据加入知识库"
         if affected_rows < len(req.ids):
         if affected_rows < len(req.ids):
-            message += f"(跳过了 {len(req.ids) - affected_rows} 条已入库数据)"
+            message += f"(跳过了 {len(req.ids) - affected_rows} 条已入库数据或未找到数据)"
             
             
         return ApiResponse(code=0, message=message, timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
         return ApiResponse(code=0, message=message, timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
     except Exception as e:
     except Exception as e:
+        print(f"批量操作失败: {e}")
         return ApiResponse(code=500, message=f"批量操作失败: {str(e)}", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
         return ApiResponse(code=500, message=f"批量操作失败: {str(e)}", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
 
 
 @app.post("/api/v1/documents/batch-delete")
 @app.post("/api/v1/documents/batch-delete")
@@ -3675,18 +3806,39 @@ async def batch_delete_documents(req: BatchDeleteRequest, credentials: HTTPAutho
             return ApiResponse(code=500, message="数据库连接失败", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
             return ApiResponse(code=500, message="数据库连接失败", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
         
         
         cursor = conn.cursor()
         cursor = conn.cursor()
-        table_name = get_table_name(req.table_type)
         
         
         if not req.ids:
         if not req.ids:
             return ApiResponse(code=400, message="未指定要删除的文档 ID", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
             return ApiResponse(code=400, message="未指定要删除的文档 ID", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
             
             
         placeholders = ', '.join(['%s'] * len(req.ids))
         placeholders = ', '.join(['%s'] * len(req.ids))
-        sql = f"DELETE FROM {table_name} WHERE id IN ({placeholders})"
-        cursor.execute(sql, req.ids)
-        conn.commit()
         
         
+        # 1. 尝试同步删除子表中的数据
+        try:
+            # 查询这些 ID 对应的 source_type 和 source_id
+            cursor.execute(f"SELECT source_type, source_id FROM t_document_main WHERE id IN ({placeholders})", req.ids)
+            docs = cursor.fetchall()
+            
+            for doc_row in docs:
+                s_type, s_id = doc_row
+                if s_type and s_id:
+                    sub_table = get_table_name(s_type)
+                    if sub_table:
+                        # 删除子表数据
+                        sub_sql = f"DELETE FROM {sub_table} WHERE id = %s"
+                        try:
+                            cursor.execute(sub_sql, (s_id,))
+                        except Exception as sub_e:
+                            print(f"删除子表 {sub_table} 数据失败: {sub_e}")
+        except Exception as sync_e:
+            print(f"同步删除子表数据失败: {sync_e}")
+
+        # 2. 删除主表 t_document_main 中的数据
+        sql_main = f"DELETE FROM t_document_main WHERE id IN ({placeholders})"
+        cursor.execute(sql_main, req.ids)
         affected_rows = cursor.rowcount
         affected_rows = cursor.rowcount
         
         
+        conn.commit()
+        
         return ApiResponse(
         return ApiResponse(
             code=0, 
             code=0, 
             message=f"成功删除 {affected_rows} 条文档数据", 
             message=f"成功删除 {affected_rows} 条文档数据", 
@@ -3701,30 +3853,90 @@ async def batch_delete_documents(req: BatchDeleteRequest, credentials: HTTPAutho
         if conn:
         if conn:
             conn.close()
             conn.close()
 
 
async def simulate_conversion(doc_id: str):
    """Simulate a document conversion by stepping conversion_progress.

    Walks t_document_main through 10% -> 40% -> 75% -> done (status 2,
    progress 100, converted_file_name set), pausing between steps. On any
    error the row is marked status 3 with the error message recorded.

    Args:
        doc_id: Primary key of the t_document_main row to update.
    """
    import asyncio
    conn = None
    try:
        conn = get_db_connection()
        cursor = conn.cursor()

        # 1. Start (10%)
        cursor.execute("UPDATE t_document_main SET conversion_status = 1, conversion_progress = 10 WHERE id = %s", (doc_id,))
        conn.commit()
        # Fix: this coroutine runs as a FastAPI background task on the
        # event loop — time.sleep() would block the whole server, so use
        # the non-blocking asyncio.sleep() instead.
        await asyncio.sleep(2)

        # 2. In progress (40%)
        cursor.execute("UPDATE t_document_main SET conversion_progress = 40 WHERE id = %s", (doc_id,))
        conn.commit()
        await asyncio.sleep(3)

        # 3. In progress (75%)
        cursor.execute("UPDATE t_document_main SET conversion_progress = 75 WHERE id = %s", (doc_id,))
        conn.commit()
        await asyncio.sleep(2)

        # 4. Done (100%)
        cursor.execute("""
            UPDATE t_document_main 
            SET conversion_status = 2, conversion_progress = 100, 
                converted_file_name = CONCAT(title, '_已转换.pdf') 
            WHERE id = %s
        """, (doc_id,))
        conn.commit()

    except Exception as e:
        print(f"模拟转换出错: {e}")
        # Best-effort: record the failure on the row (status 3 = failed).
        if conn:
            cursor = conn.cursor()
            cursor.execute("UPDATE t_document_main SET conversion_status = 3, conversion_error = %s WHERE id = %s", (str(e), doc_id))
            conn.commit()
    finally:
        if conn:
            conn.close()
+
 @app.post("/api/v1/documents/convert")
 @app.post("/api/v1/documents/convert")
-async def convert_document(req: ConvertRequest, credentials: HTTPAuthorizationCredentials = Depends(security)):
-    """异步启动文档转换"""
-    import subprocess
+async def convert_document(req: ConvertRequest, background_tasks: BackgroundTasks, credentials: HTTPAuthorizationCredentials = Depends(security)):
+    """启动文档转换 (支持真实脚本与模拟逻辑)"""
     try:
     try:
         payload = verify_token(credentials.credentials)
         payload = verify_token(credentials.credentials)
         if not payload or not payload.get("is_superuser"):
         if not payload or not payload.get("is_superuser"):
             return ApiResponse(code=403, message="权限不足", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
             return ApiResponse(code=403, message="权限不足", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
         
         
-        # 启动后台进程执行转换
-        # 脚本位于 d:\UGit\LQAdminPlatform\scripts\miner_u.py
+        table_type = req.table_type
+        # 如果没有提供 table_type,从主表查询
+        if not table_type:
+            try:
+                conn = get_db_connection()
+                if conn:
+                    cursor = conn.cursor()
+                    cursor.execute("SELECT source_type FROM t_document_main WHERE id = %s", (req.id,))
+                    res = cursor.fetchone()
+                    if res:
+                        table_type = res[0]
+                    cursor.close()
+                    conn.close()
+            except Exception as e:
+                print(f"从主表获取 source_type 失败: {e}")
+
+        # 1. 优先尝试启动真实转换脚本
         script_path = os.path.abspath(os.path.join(os.path.dirname(__file__), "scripts", "miner_u.py"))
         script_path = os.path.abspath(os.path.join(os.path.dirname(__file__), "scripts", "miner_u.py"))
-        # 使用当前 python 解释器
-        python_exe = sys.executable
-        
-        # 异步启动,不等待结束
-        subprocess.Popen([python_exe, script_path, str(req.table_type), str(req.id)], 
-                         stdout=subprocess.DEVNULL, 
-                         stderr=subprocess.DEVNULL,
-                         creationflags=subprocess.CREATE_NO_WINDOW if os.name == 'nt' else 0)
+        if os.path.exists(script_path):
+            import subprocess
+            python_exe = sys.executable
+            # 传递 table_type 和 id 给脚本
+            subprocess.Popen([python_exe, script_path, str(table_type or "basis"), str(req.id)], 
+                             stdout=subprocess.DEVNULL, 
+                             stderr=subprocess.DEVNULL,
+                             creationflags=subprocess.CREATE_NO_WINDOW if os.name == 'nt' else 0)
+            return ApiResponse(code=0, message="转换任务已在后台启动", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
+        
+        # 2. 如果脚本不存在,则启动模拟转换逻辑
+        background_tasks.add_task(simulate_conversion, str(req.id))
         
         
         return ApiResponse(
         return ApiResponse(
             code=0, 
             code=0, 
-            message="转换任务已启动", 
+            message="转换任务已启动 (模拟模式)", 
             timestamp=datetime.now(timezone.utc).isoformat()
             timestamp=datetime.now(timezone.utc).isoformat()
         ).model_dump()
         ).model_dump()
     except Exception as e:
     except Exception as e:
@@ -3733,155 +3945,469 @@ async def convert_document(req: ConvertRequest, credentials: HTTPAuthorizationCr
 
 
 @app.post("/api/v1/documents/add")
 @app.post("/api/v1/documents/add")
 async def add_document(doc: DocumentAdd, credentials: HTTPAuthorizationCredentials = Depends(security)):
 async def add_document(doc: DocumentAdd, credentials: HTTPAuthorizationCredentials = Depends(security)):
-    """添加新文档"""
+    """添加新文档 (同步主表和子表)"""
     try:
     try:
         payload = verify_token(credentials.credentials)
         payload = verify_token(credentials.credentials)
-        if not payload or not payload.get("is_superuser"):
-            return ApiResponse(code=403, message="权限不足", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
+        if not payload:
+            return ApiResponse(code=401, message="无效的访问令牌", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
             
             
+        user_id = payload.get("username", "admin")
         conn = get_db_connection()
         conn = get_db_connection()
         if not conn:
         if not conn:
             return ApiResponse(code=500, message="数据库连接失败", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
             return ApiResponse(code=500, message="数据库连接失败", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
-        
+            
         cursor = conn.cursor()
         cursor = conn.cursor()
-        table_name = get_table_name(doc.table_type)
-        # 修正列名:reference_basis -> reference_basis_list
-        sql = f"""
-            INSERT INTO {table_name} 
-            (chinese_name, reference_basis_list, document_type, professional_field, release_date, created_at, updated_at)
-            VALUES (%s, %s, %s, %s, %s, NOW(), NOW())
-        """
-        # 构造日期:如果是年份,转为 YYYY-01-01
-        release_date = f"{doc.year}-01-01" if doc.year else None
-        
-        cursor.execute(sql, (doc.title, doc.content, str(doc.primary_category_id) if doc.primary_category_id else None, 
-                             str(doc.secondary_category_id) if doc.secondary_category_id else None, release_date))
-        conn.commit()
-        cursor.close()
-        conn.close()
+        doc_id = str(uuid.uuid4())
+        source_id = str(uuid.uuid4())
+        table_name = TABLE_MAP.get(doc.table_type, "t_basis_of_preparation")
         
         
-        return ApiResponse(code=0, message="文档添加成功", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
+        try:
+            # 1. 插入子表
+            if doc.table_type == 'basis':
+                cursor.execute(
+                    f"INSERT INTO {table_name} (id, chinese_name, created_by) VALUES (%s, %s, %s)",
+                    (source_id, doc.title, user_id)
+                )
+            elif doc.table_type == 'work':
+                cursor.execute(
+                    f"INSERT INTO {table_name} (id, plan_name, created_by) VALUES (%s, %s, %s)",
+                    (source_id, doc.title, user_id)
+                )
+            elif doc.table_type == 'job':
+                cursor.execute(
+                    f"INSERT INTO {table_name} (id, file_name, created_by) VALUES (%s, %s, %s)",
+                    (source_id, doc.title, user_id)
+                )
+                
+            # 2. 插入主表
+            cursor.execute("""
+                INSERT INTO t_document_main 
+                (id, title, content, created_by, source_type, source_id, whether_to_enter, primary_category_id, secondary_category_id, year, file_url, file_extension) 
+                VALUES (%s, %s, %s, %s, %s, %s, %s, %s, %s, %s, %s, %s)
+            """, (doc_id, doc.title, doc.content, user_id, doc.table_type, source_id, 0, doc.primary_category_id, doc.secondary_category_id, doc.year, doc.file_url, doc.file_extension))
+            
+            conn.commit()
+            return ApiResponse(code=0, message="文档添加成功", data={"id": doc_id}, timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
+        except Exception as e:
+            conn.rollback()
+            raise e
+        finally:
+            cursor.close()
+            conn.close()
     except Exception as e:
     except Exception as e:
-        print(f"添加文档错误: {e}")
-        return ApiResponse(code=500, message=f"服务器内部错误: {str(e)}", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
+        print(f"添加文档失败: {e}")
+        return ApiResponse(code=500, message=str(e), timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
+
@app.get("/api/v1/documents/detail/{doc_id}")
async def get_document_detail(doc_id: str, credentials: HTTPAuthorizationCredentials = Depends(security)):
    """Fetch one document's detail from t_document_main, merged with its sub-table row.

    Reads the master row by ``doc_id``, then follows its ``source_type`` /
    ``source_id`` to the type-specific table (via TABLE_MAP) and copies
    selected sub-table columns onto the response under generic field names
    so the frontend can render every document type uniformly.

    Returns an ApiResponse dict: code 0 with the document data on success,
    401 for a bad token, 404 for an unknown id, 500 on DB errors.
    """
    print(f"🔍 正在获取文档详情: {doc_id}")
    try:
        payload = verify_token(credentials.credentials)
        if not payload:
            return ApiResponse(code=401, message="无效的访问令牌", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
            
        conn = get_db_connection()
        if not conn:
            return ApiResponse(code=500, message="数据库连接失败", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
            
        cursor = conn.cursor()
        try:
            # 1. Read the master row.
            cursor.execute("SELECT * FROM t_document_main WHERE id = %s", (doc_id,))
            main_row = cursor.fetchone()
            if not main_row:
                print(f"❌ 文档不存在: {doc_id}")
                return ApiResponse(code=404, message="文档不存在", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
                
            columns = [desc[0] for desc in cursor.description]
            doc = dict(zip(columns, main_row))
            print(f"✅ 找到主表数据: {doc.get('title')}")
            
            # 2. Read the sub-table row referenced by source_type/source_id.
            source_type = doc.get('source_type')
            source_id = doc.get('source_id')
            table_name = TABLE_MAP.get(source_type)
            
            if table_name and source_id:
                cursor.execute(f"SELECT * FROM {table_name} WHERE id = %s", (source_id,))
                sub_row = cursor.fetchone()
                if sub_row:
                    sub_columns = [desc[0] for desc in cursor.description]
                    sub_data = dict(zip(sub_columns, sub_row))
                    
                    # Map sub-table columns onto generic field names; each
                    # source type stores equivalent data under different
                    # column names (e.g. compiling_unit vs issuing_department).
                    if source_type == 'basis':
                        doc['standard_no'] = sub_data.get('standard_number')
                        doc['issuing_authority'] = sub_data.get('issuing_authority')
                        doc['release_date'] = str(sub_data.get('release_date')) if sub_data.get('release_date') else None
                        doc['document_type'] = sub_data.get('document_type')
                        doc['professional_field'] = sub_data.get('professional_field')
                        doc['validity'] = sub_data.get('validity')
                    elif source_type == 'work':
                        doc['project_name'] = sub_data.get('project_name')
                        doc['project_section'] = sub_data.get('project_section')
                        doc['issuing_authority'] = sub_data.get('compiling_unit')
                        doc['release_date'] = str(sub_data.get('compiling_date')) if sub_data.get('compiling_date') else None
                    elif source_type == 'job':
                        doc['issuing_authority'] = sub_data.get('issuing_department')
                        doc['document_type'] = sub_data.get('document_type')
                        doc['release_date'] = str(sub_data.get('publish_date')) if sub_data.get('publish_date') else None
            
            # Serialize datetime/date values so the response is JSON-safe.
            if doc.get('created_time'):
                doc['created_time'] = doc['created_time'].isoformat()
            if doc.get('updated_time'):
                doc['updated_time'] = doc['updated_time'].isoformat()
            if doc.get('release_date') and not isinstance(doc['release_date'], str):
                doc['release_date'] = doc['release_date'].isoformat()

            return ApiResponse(code=0, message="获取详情成功", data=doc, timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
        finally:
            cursor.close()
            conn.close()
    except Exception as e:
        print(f"获取文档详情失败: {e}")
        return ApiResponse(code=500, message=str(e), timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
 
 
 @app.get("/api/v1/documents/list")
 @app.get("/api/v1/documents/list")
 async def get_document_list(
 async def get_document_list(
-    primaryCategoryId: Optional[str] = None,
-    secondaryCategoryId: Optional[str] = None,
-    year: Optional[int] = None,
     whether_to_enter: Optional[int] = None,
     whether_to_enter: Optional[int] = None,
     keyword: Optional[str] = None,
     keyword: Optional[str] = None,
-    table_type: Optional[str] = "basis",
+    table_type: Optional[str] = None,
     page: int = 1, 
     page: int = 1, 
     size: int = 50,
     size: int = 50,
-    sort_by: str = "created_at",
     credentials: HTTPAuthorizationCredentials = Depends(security)
     credentials: HTTPAuthorizationCredentials = Depends(security)
 ):
 ):
-    """获取文档列表(支持过滤与搜索)"""
-    conn = None
-    cursor = None
+    """获取文档列表 (从主表查询)"""
     try:
     try:
         payload = verify_token(credentials.credentials)
         payload = verify_token(credentials.credentials)
-        if not payload or not payload.get("is_superuser"):
-            return ApiResponse(code=403, message="权限不足", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
+        if not payload:
+            return ApiResponse(code=401, message="无效的访问令牌", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
             
             
         conn = get_db_connection()
         conn = get_db_connection()
         if not conn:
         if not conn:
             return ApiResponse(code=500, message="数据库连接失败", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
             return ApiResponse(code=500, message="数据库连接失败", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
-        
+            
         cursor = conn.cursor()
         cursor = conn.cursor()
-        table_name = get_table_name(table_type)
-        
         where_clauses = []
         where_clauses = []
         params = []
         params = []
         
         
-        if primaryCategoryId:
-            where_clauses.append("document_type = %s")
-            params.append(primaryCategoryId)
-        if secondaryCategoryId:
-            where_clauses.append("professional_field = %s")
-            params.append(secondaryCategoryId)
-        if year:
-            where_clauses.append("YEAR(release_date) = %s")
-            params.append(year)
+        if table_type:
+            where_clauses.append("source_type = %s")
+            params.append(table_type)
         if whether_to_enter is not None:
         if whether_to_enter is not None:
-            where_clauses.append("CAST(whether_to_enter AS UNSIGNED) = %s")
+            where_clauses.append("whether_to_enter = %s")
             params.append(whether_to_enter)
             params.append(whether_to_enter)
         if keyword:
         if keyword:
-            where_clauses.append("(chinese_name LIKE %s OR reference_basis_list LIKE %s OR standard_no LIKE %s)")
-            like_keyword = f"%{keyword}%"
-            params.extend([like_keyword, like_keyword, like_keyword])
+            where_clauses.append("(title LIKE %s OR content LIKE %s)")
+            params.extend([f"%{keyword}%", f"%{keyword}%"])
             
             
-        where_stmt = " WHERE " + " AND ".join(where_clauses) if where_clauses else ""
-        
-        # 排序逻辑:按创建时间倒序
-        sort_field = "created_at" if sort_by == "created_at" else "updated_at"
-        order_by = f"ORDER BY {sort_field} DESC"
-        
-        # 分页
+        where_sql = " WHERE " + " AND ".join(where_clauses) if where_clauses else ""
         offset = (page - 1) * size
         offset = (page - 1) * size
         
         
-        # 返回更多字段
-        sql = f"""
-            SELECT id, chinese_name as title, reference_basis_list as content, 
-            document_type, professional_field, 
-            YEAR(release_date) as year, release_date, standard_no, status, 
-            CAST(whether_to_enter AS UNSIGNED) as whether_to_enter, file_url,
-            conversion_status, conversion_progress, conversion_error,
-            created_at, updated_at 
-            FROM {table_name} {where_stmt} 
-            {order_by} LIMIT %s OFFSET %s
-        """
+        sql = f"SELECT * FROM t_document_main {where_sql} ORDER BY created_time DESC LIMIT %s OFFSET %s"
         params.extend([size, offset])
         params.extend([size, offset])
         
         
-        cursor.execute(sql, params)
-        columns = [col[0] for col in cursor.description]
-        items = [dict(zip(columns, row)) for row in cursor.fetchall()]
-        
-        # 格式化时间
-        for item in items:
-            for key, value in item.items():
-                if isinstance(value, (datetime, date)):
-                    item[key] = value.isoformat()
-        
-        # 获取总数
-        count_sql = f"SELECT COUNT(*) FROM {table_name} {where_stmt}"
-        cursor.execute(count_sql, params[:-2])
+        cursor.execute(sql, tuple(params))
+        columns = [desc[0] for desc in cursor.description]
+        items = []
+        for row in cursor.fetchall():
+            item = dict(zip(columns, row))
+            # 格式化时间
+            for key in ['created_time', 'updated_time', 'release_date']:
+                if item.get(key) and hasattr(item[key], 'isoformat'):
+                    item[key] = item[key].isoformat()
+            items.append(item)
+            
+        # 总数
+        count_sql = f"SELECT COUNT(*) FROM t_document_main {where_sql}"
+        cursor.execute(count_sql, tuple(params[:-2]))
         total = cursor.fetchone()[0]
         total = cursor.fetchone()[0]
         
         
-        # 优化统计查询:合并全局总数和已入库总数的查询,减少数据库交互
-        stats_sql = f"SELECT COUNT(*), SUM(CASE WHEN CAST(whether_to_enter AS UNSIGNED) = 1 THEN 1 ELSE 0 END) FROM {table_name}"
-        cursor.execute(stats_sql)
-        stats_result = cursor.fetchone()
+        # 统计数据
+        cursor.execute("SELECT COUNT(*) FROM t_document_main")
+        all_total = cursor.fetchone()[0]
+        cursor.execute("SELECT COUNT(*) FROM t_document_main WHERE whether_to_enter = 1")
+        total_entered = cursor.fetchone()[0]
         
         
-        all_total = 0
-        total_entered = 0
-        if stats_result:
-            all_total = stats_result[0] or 0
-            total_entered = int(stats_result[1] or 0)
+        cursor.close()
+        conn.close()
         
         
         return ApiResponse(
         return ApiResponse(
-            code=0,
-            message="获取成功",
+            code=0, 
+            message="查询成功", 
             data={
             data={
                 "items": items, 
                 "items": items, 
                 "total": total, 
                 "total": total, 
-                "all_total": all_total,
-                "total_entered": total_entered,
                 "page": page, 
                 "page": page, 
-                "size": size
+                "size": size,
+                "all_total": all_total,
+                "total_entered": total_entered
             },
             },
             timestamp=datetime.now(timezone.utc).isoformat()
             timestamp=datetime.now(timezone.utc).isoformat()
         ).model_dump()
         ).model_dump()
     except Exception as e:
     except Exception as e:
-        print(f"获取文档列表错误: {e}")
-        return ApiResponse(code=500, message=f"服务器内部错误: {str(e)}", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
-    finally:
-        if cursor:
+        print(f"获取文档列表失败: {e}")
+        return ApiResponse(code=500, message=str(e), timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
+
+@app.post("/api/v1/documents/edit")
+async def edit_document(doc: DocumentAdd, credentials: HTTPAuthorizationCredentials = Depends(security)):
+    """编辑文档 (同步主表和子表)"""
+    try:
+        payload = verify_token(credentials.credentials)
+        if not payload:
+            return ApiResponse(code=401, message="无效的访问令牌", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
+            
+        if not doc.id or not doc.source_id:
+            return ApiResponse(code=400, message="缺少ID参数", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
+            
+        conn = get_db_connection()
+        if not conn:
+            return ApiResponse(code=500, message="数据库连接失败", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
+            
+        cursor = conn.cursor()
+        table_name = TABLE_MAP.get(doc.table_type, "t_basis_of_preparation")
+        
+        try:
+            # 1. 更新子表内容
+            if doc.table_type == 'basis':
+                cursor.execute(f"""
+                    UPDATE {table_name} 
+                    SET chinese_name = %s, standard_number = %s, issuing_authority = %s, 
+                        release_date = %s, document_type = %s, professional_field = %s, validity = %s
+                    WHERE id = %s
+                """, (doc.title, doc.standard_no, doc.issuing_authority, doc.release_date, 
+                      doc.document_type, doc.professional_field, doc.validity, doc.source_id))
+            elif doc.table_type == 'work':
+                cursor.execute(f"""
+                    UPDATE {table_name} 
+                    SET plan_name = %s, project_name = %s, project_section = %s, 
+                        compiling_unit = %s, compiling_date = %s
+                    WHERE id = %s
+                """, (doc.title, doc.project_name, doc.project_section, doc.issuing_authority, 
+                      doc.release_date, doc.source_id))
+            elif doc.table_type == 'job':
+                cursor.execute(f"""
+                    UPDATE {table_name} 
+                    SET file_name = %s, issuing_department = %s, document_type = %s, publish_date = %s
+                    WHERE id = %s
+                """, (doc.title, doc.issuing_authority, doc.document_type, doc.release_date, doc.source_id))
+                
+            # 2. 更新主表内容
+            cursor.execute("""
+                UPDATE t_document_main 
+                SET title = %s, content = %s, updated_time = NOW(),
+                    primary_category_id = %s, secondary_category_id = %s, year = %s,
+                    file_url = %s, file_extension = %s
+                WHERE id = %s
+            """, (doc.title, doc.content, doc.primary_category_id, doc.secondary_category_id, doc.year, 
+                  doc.file_url, doc.file_extension, doc.id))
+            
+            conn.commit()
+            return ApiResponse(code=0, message="文档更新成功", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
+        except Exception as e:
+            conn.rollback()
+            raise e
+        finally:
             cursor.close()
             cursor.close()
-        if conn:
             conn.close()
             conn.close()
+    except Exception as e:
+        print(f"编辑文档失败: {e}")
+        return ApiResponse(code=500, message=str(e), timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
+
+@app.post("/api/v1/documents/enter")
+async def enter_document(data: dict, credentials: HTTPAuthorizationCredentials = Depends(security)):
+    """文档入库"""
+    try:
+        doc_id = data.get("id")
+        if not doc_id:
+            return ApiResponse(code=400, message="缺少ID", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
+            
+        payload = verify_token(credentials.credentials)
+        username = payload.get("username", "admin") if payload else "admin"
+        
+        conn = get_db_connection()
+        if not conn:
+            return ApiResponse(code=500, message="数据库连接失败", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
+            
+        cursor = conn.cursor()
+        
+        # 1. 更新主表
+        cursor.execute("UPDATE t_document_main SET whether_to_enter = 1, updated_time = NOW() WHERE id = %s", (doc_id,))
+        
+        # 2. 尝试同步更新子表
+        try:
+            cursor.execute("SELECT source_type, source_id FROM t_document_main WHERE id = %s", (doc_id,))
+            res = cursor.fetchone()
+            if res and res[0] and res[1]:
+                s_type, s_id = res
+                sub_table = get_table_name(s_type)
+                if sub_table:
+                    sub_sql = f"UPDATE {sub_table} SET whether_to_enter = 1, updated_at = NOW(), updated_by = %s WHERE id = %s"
+                    try:
+                        cursor.execute(sub_sql, (username, s_id))
+                    except Exception as sub_e:
+                        print(f"入库同步子表 {sub_table} 失败: {sub_e}")
+        except Exception as sync_e:
+            print(f"入库同步子表异常: {sync_e}")
+            
+        conn.commit()
+        cursor.close()
+        conn.close()
+        return ApiResponse(code=0, message="入库成功", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
+    except Exception as e:
+        print(f"入库失败: {e}")
+        return ApiResponse(code=500, message=str(e), timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
+
+@app.get("/api/v1/basic-info/list")
+async def get_basic_info_list(
+    type: str,
+    page: int = 1,
+    size: int = 50,
+    keyword: Optional[str] = None,
+    title: Optional[str] = None,
+    standard_no: Optional[str] = None,
+    document_type: Optional[str] = None,
+    professional_field: Optional[str] = None,
+    validity: Optional[str] = None,
+    issuing_authority: Optional[str] = None,
+    release_date_start: Optional[str] = None,
+    release_date_end: Optional[str] = None,
+    credentials: HTTPAuthorizationCredentials = Depends(security)
+):
+    """获取基本信息列表 (支持多条件检索)"""
+    try:
+        payload = verify_token(credentials.credentials)
+        if not payload:
+            return ApiResponse(code=401, message="无效的访问令牌", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
+            
+        conn = get_db_connection()
+        if not conn:
+            return ApiResponse(code=500, message="数据库连接失败", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
+        
+        cursor = conn.cursor()
+        
+        # 根据类型选择表名和字段映射
+        if type == 'basis':
+            table_name = "t_basis_of_preparation"
+            fields = "id, chinese_name as title, standard_number as standard_no, issuing_authority, release_date, document_type, professional_field, validity, created_by, created_time as created_at"
+            # 字段名映射供过滤使用
+            field_map = {
+                'title': 'chinese_name',
+                'standard_no': 'standard_number',
+                'issuing_authority': 'issuing_authority',
+                'release_date': 'release_date',
+                'document_type': 'document_type',
+                'professional_field': 'professional_field',
+                'validity': 'validity'
+            }
+        elif type == 'work':
+            table_name = "t_work_of_preparation"
+            fields = "id, plan_name as title, NULL as standard_no, compiling_unit as issuing_authority, compiling_date as release_date, NULL as document_type, NULL as professional_field, NULL as validity, created_by, created_time as created_at"
+            field_map = {
+                'title': 'plan_name',
+                'issuing_authority': 'compiling_unit',
+                'release_date': 'compiling_date'
+            }
+        elif type == 'job':
+            table_name = "t_job_of_preparation"
+            fields = "id, file_name as title, NULL as standard_no, issuing_department as issuing_authority, publish_date as release_date, document_type, NULL as professional_field, NULL as validity, created_by, created_time as created_at"
+            field_map = {
+                'title': 'file_name',
+                'issuing_authority': 'issuing_department',
+                'release_date': 'publish_date',
+                'document_type': 'document_type'
+            }
+        else:
+            return ApiResponse(code=400, message="无效的类型", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
+            
+        where_clauses = []
+        params = []
+        
+        # 1. 统一关键字搜索 (保持兼容)
+        if keyword:
+            if type == 'basis':
+                where_clauses.append("(chinese_name LIKE %s OR standard_number LIKE %s)")
+                params.extend([f"%{keyword}%", f"%{keyword}%"])
+            elif type == 'work':
+                where_clauses.append("plan_name LIKE %s")
+                params.append(f"%{keyword}%")
+            elif type == 'job':
+                where_clauses.append("file_name LIKE %s")
+                params.append(f"%{keyword}%")
+
+        # 2. 精细化检索
+        if title and 'title' in field_map:
+            where_clauses.append(f"{field_map['title']} LIKE %s")
+            params.append(f"%{title}%")
+        
+        if standard_no and 'standard_no' in field_map:
+            where_clauses.append(f"{field_map['standard_no']} LIKE %s")
+            params.append(f"%{standard_no}%")
+            
+        if document_type and 'document_type' in field_map:
+            where_clauses.append(f"{field_map['document_type']} = %s")
+            params.append(document_type)
+            
+        if professional_field and 'professional_field' in field_map:
+            where_clauses.append(f"{field_map['professional_field']} = %s")
+            params.append(professional_field)
+            
+        if validity and 'validity' in field_map:
+            where_clauses.append(f"{field_map['validity']} = %s")
+            params.append(validity)
+            
+        if issuing_authority and 'issuing_authority' in field_map:
+            where_clauses.append(f"{field_map['issuing_authority']} LIKE %s")
+            params.append(f"%{issuing_authority}%")
+            
+        if release_date_start and 'release_date' in field_map:
+            where_clauses.append(f"{field_map['release_date']} >= %s")
+            params.append(release_date_start)
+            
+        if release_date_end and 'release_date' in field_map:
+            where_clauses.append(f"{field_map['release_date']} <= %s")
+            params.append(release_date_end)
+                
+        where_sql = " WHERE " + " AND ".join(where_clauses) if where_clauses else ""
+        
+        # 分页查询
+        offset = (page - 1) * size
+        sql = f"SELECT {fields} FROM {table_name}{where_sql} ORDER BY created_at DESC LIMIT %s OFFSET %s"
+        params.extend([size, offset])
+        
+        cursor.execute(sql, tuple(params))
+        columns = [desc[0] for desc in cursor.description]
+        items = []
+        for row in cursor.fetchall():
+            item = dict(zip(columns, row))
+            # 格式化日期
+            for key in ['release_date', 'created_at']:
+                if item.get(key) and hasattr(item[key], 'isoformat'):
+                    item[key] = item[key].isoformat()
+                elif item.get(key):
+                    item[key] = str(item[key])
+            items.append(item)
+            
+        # 总数查询
+        count_sql = f"SELECT COUNT(*) FROM {table_name}{where_sql}"
+        cursor.execute(count_sql, tuple(params[:-2]))
+        total = cursor.fetchone()[0]
+        
+        cursor.close()
+        conn.close()
+        
+        return ApiResponse(
+            code=0,
+            message="查询成功",
+            data={"items": items, "total": total, "page": page, "size": size},
+            timestamp=datetime.now(timezone.utc).isoformat()
+        ).model_dump()
+        
+    except Exception as e:
+        print(f"查询基本信息失败: {e}")
+        return ApiResponse(code=500, message=f"服务器内部错误: {str(e)}", timestamp=datetime.now(timezone.utc).isoformat()).model_dump()
 
 
 @app.get("/api/v1/documents/categories/primary")
 @app.get("/api/v1/documents/categories/primary")
 async def get_primary_categories(credentials: HTTPAuthorizationCredentials = Depends(security)):
 async def get_primary_categories(credentials: HTTPAuthorizationCredentials = Depends(security)):

+ 3 - 1
fix_db_indexes.py → scripts/fix_db_indexes.py

@@ -3,7 +3,9 @@ import pymysql
 from urllib.parse import urlparse
 from urllib.parse import urlparse
 from dotenv import load_dotenv
 from dotenv import load_dotenv
 
 
-load_dotenv()
+# 加载环境变量 - 配置文件在脚本所在目录的上一级
+env_path = os.path.join(os.path.dirname(__file__), "..", ".env")
+load_dotenv(dotenv_path=env_path)
 
 
 def fix_indexes():
 def fix_indexes():
     """执行索引添加 SQL"""
     """执行索引添加 SQL"""

+ 72 - 29
scripts/miner_u.py

@@ -44,7 +44,7 @@ def get_db_connection():
         print(f"Database connection error: {e}")
         print(f"Database connection error: {e}")
         return None
         return None
 
 
-def update_db_status(table_name, doc_id, status=None, progress=None, error=None):
+def update_db_status(doc_id, status=None, progress=None, error=None, converted_file_name=None):
     conn = get_db_connection()
     conn = get_db_connection()
     if not conn:
     if not conn:
         return
         return
@@ -61,11 +61,17 @@ def update_db_status(table_name, doc_id, status=None, progress=None, error=None)
             if error is not None:
             if error is not None:
                 updates.append("conversion_error = %s")
                 updates.append("conversion_error = %s")
                 params.append(error)
                 params.append(error)
+            if converted_file_name is not None:
+                updates.append("converted_file_name = %s")
+                params.append(converted_file_name)
             
             
             if not updates:
             if not updates:
                 return
                 return
+            
+            # 同时更新修改时间
+            updates.append("updated_time = NOW()")
                 
                 
-            sql = f"UPDATE {table_name} SET {', '.join(updates)} WHERE id = %s"
+            sql = f"UPDATE t_document_main SET {', '.join(updates)} WHERE id = %s"
             params.append(doc_id)
             params.append(doc_id)
             cursor.execute(sql, params)
             cursor.execute(sql, params)
     except Exception as e:
     except Exception as e:
@@ -109,10 +115,10 @@ def poll_batch(batch_id, interval_sec=5, timeout_sec=1800):
             raise TimeoutError(f"poll timeout for batch_id={batch_id}")
             raise TimeoutError(f"poll timeout for batch_id={batch_id}")
         time.sleep(interval_sec)
         time.sleep(interval_sec)
 
 
-def process_document(table_name, doc_id, chinese_name, file_url, out_dir):
+def process_document(doc_id, chinese_name, file_url, out_dir):
     try:
     try:
         # 1. 更新状态:开始转换
         # 1. 更新状态:开始转换
-        update_db_status(table_name, doc_id, status=1, progress=10)
+        update_db_status(doc_id, status=1, progress=10)
         
         
         # 2. 下载原始文件
         # 2. 下载原始文件
         print(f"Downloading {file_url}...")
         print(f"Downloading {file_url}...")
@@ -120,19 +126,24 @@ def process_document(table_name, doc_id, chinese_name, file_url, out_dir):
         resp.raise_for_status()
         resp.raise_for_status()
         file_content = resp.content
         file_content = resp.content
         
         
+        # 检查文件类型
+        content_type = resp.headers.get("Content-Type", "").lower()
+        if "text/html" in content_type:
+            raise RuntimeError("不支持对网页链接进行转换,请直接查看原链接。")
+        
         file_ext = Path(urlparse(file_url).path).suffix.lower()
         file_ext = Path(urlparse(file_url).path).suffix.lower()
         if not file_ext:
         if not file_ext:
             file_ext = ".pdf" # Default
             file_ext = ".pdf" # Default
             
             
         file_name = f"{chinese_name}{file_ext}"
         file_name = f"{chinese_name}{file_ext}"
-        update_db_status(table_name, doc_id, progress=30)
+        update_db_status(doc_id, progress=30)
         
         
         # 3. 提交到 MinerU
         # 3. 提交到 MinerU
         files_meta = [{"name": file_name, "data_id": doc_id}]
         files_meta = [{"name": file_name, "data_id": doc_id}]
         batch_id, upload_urls = apply_upload_urls(files_meta)
         batch_id, upload_urls = apply_upload_urls(files_meta)
         upload_files([file_content], upload_urls)
         upload_files([file_content], upload_urls)
         
         
-        update_db_status(table_name, doc_id, progress=50)
+        update_db_status(doc_id, progress=50)
         
         
         # 4. 轮询结果
         # 4. 轮询结果
         results = poll_batch(batch_id)
         results = poll_batch(batch_id)
@@ -142,23 +153,24 @@ def process_document(table_name, doc_id, chinese_name, file_url, out_dir):
             zip_url = result.get("full_zip_url")
             zip_url = result.get("full_zip_url")
             if zip_url:
             if zip_url:
                 # 5. 下载并处理结果
                 # 5. 下载并处理结果
-                update_db_status(table_name, doc_id, progress=80)
+                update_db_status(doc_id, progress=80)
                 zip_resp = requests.get(zip_url, timeout=300)
                 zip_resp = requests.get(zip_url, timeout=300)
                 zip_resp.raise_for_status()
                 zip_resp.raise_for_status()
                 
                 
                 # 解压并保存 Markdown
                 # 解压并保存 Markdown
+                converted_file_name = f"{chinese_name}.md"
                 with zipfile.ZipFile(io.BytesIO(zip_resp.content)) as z:
                 with zipfile.ZipFile(io.BytesIO(zip_resp.content)) as z:
                     # 查找 .md 文件
                     # 查找 .md 文件
                     md_files = [f for f in z.namelist() if f.endswith(".md")]
                     md_files = [f for f in z.namelist() if f.endswith(".md")]
                     if md_files:
                     if md_files:
                         md_content = z.read(md_files[0])
                         md_content = z.read(md_files[0])
-                        save_path = Path(out_dir) / f"{chinese_name}.md"
+                        save_path = Path(out_dir) / converted_file_name
                         save_path.parent.mkdir(parents=True, exist_ok=True)
                         save_path.parent.mkdir(parents=True, exist_ok=True)
                         with open(save_path, "wb") as f:
                         with open(save_path, "wb") as f:
                             f.write(md_content)
                             f.write(md_content)
                         print(f"Saved Markdown to {save_path}")
                         print(f"Saved Markdown to {save_path}")
                 
                 
-                update_db_status(table_name, doc_id, status=2, progress=100)
+                update_db_status(doc_id, status=2, progress=100, converted_file_name=converted_file_name)
                 return True
                 return True
             else:
             else:
                 raise RuntimeError("No zip URL in result")
                 raise RuntimeError("No zip URL in result")
@@ -168,19 +180,11 @@ def process_document(table_name, doc_id, chinese_name, file_url, out_dir):
             
             
     except Exception as e:
     except Exception as e:
         print(f"Process failed: {e}")
         print(f"Process failed: {e}")
-        update_db_status(table_name, doc_id, status=3, error=str(e))
+        update_db_status(doc_id, status=3, error=str(e))
         return False
         return False
 
 
-def main_cli(table_type, doc_id, out_dir=r"d:\UGit\MinerU"):
-    # 获取表名
-    TABLE_MAP = {
-        "basis": "t_basis_of_preparation",
-        "work": "t_work_of_preparation",
-        "job": "t_job_of_preparation"
-    }
-    table_name = TABLE_MAP.get(table_type, "t_basis_of_preparation")
-    
-    # 从数据库获取详细信息
+def main_cli(doc_id, out_dir=r"d:\UGit\MinerU"):
+    # 从数据库获取详细信息 - 直接从 t_document_main 获取
     conn = get_db_connection()
     conn = get_db_connection()
     if not conn:
     if not conn:
         print("Database connection failed")
         print("Database connection failed")
@@ -188,21 +192,60 @@ def main_cli(table_type, doc_id, out_dir=r"d:\UGit\MinerU"):
         
         
     try:
     try:
         with conn.cursor() as cursor:
         with conn.cursor() as cursor:
-            cursor.execute(f"SELECT chinese_name, file_url FROM {table_name} WHERE id = %s", (doc_id,))
+            # 优先从 t_document_main 获取 title 和 file_url
+            cursor.execute("SELECT title, file_url FROM t_document_main WHERE id = %s", (doc_id,))
             row = cursor.fetchone()
             row = cursor.fetchone()
-            if not row:
-                print(f"Document not found: {doc_id} in {table_name}")
+            if not row or not row[1]: # 如果主表没有 file_url,尝试从子表获取
+                if not row:
+                    print(f"Document not found: {doc_id}")
+                    return
+                
+                title = row[0]
+                # 尝试从子表获取 (兼容旧数据)
+                cursor.execute("SELECT source_type, source_id FROM t_document_main WHERE id = %s", (doc_id,))
+                st_row = cursor.fetchone()
+                if st_row:
+                    source_type, source_id = st_row
+                    TABLE_MAP = {
+                        "basis": "t_basis_of_preparation",
+                        "work": "t_work_of_preparation",
+                        "job": "t_job_of_preparation"
+                    }
+                    table_name = TABLE_MAP.get(source_type)
+                    if table_name:
+                        # 尝试不同的 url 字段名
+                        url_fields = ['file_url', 'source_url', 'url']
+                        for field in url_fields:
+                            try:
+                                cursor.execute(f"SELECT {field} FROM {table_name} WHERE id = %s", (source_id,))
+                                url_row = cursor.fetchone()
+                                if url_row and url_row[0]:
+                                    file_url = url_row[0]
+                                    process_document(doc_id, title, file_url, out_dir)
+                                    return
+                            except:
+                                continue
+                
+                print(f"No file_url found for document: {doc_id}")
+                update_db_status(doc_id, status=3, error="未找到文件链接(file_url)")
                 return
                 return
-            chinese_name, file_url = row
             
             
-        process_document(table_name, doc_id, chinese_name, file_url, out_dir)
+            title, file_url = row
+            process_document(doc_id, title, file_url, out_dir)
     finally:
     finally:
         conn.close()
         conn.close()
 
 
 if __name__ == "__main__":
 if __name__ == "__main__":
-    # 示例用法:python miner_u.py basis <doc_id>
+    # 示例用法:python miner_u.py <doc_id>
     import sys
     import sys
-    if len(sys.argv) > 2:
-        main_cli(sys.argv[1], sys.argv[2])
+    if len(sys.argv) > 1:
+        # 这里的参数处理需要微调,因为以前是 python miner_u.py <table_type> <doc_id>
+        # 现在我们只需要 <doc_id>,但为了兼容性,我们可以检查参数个数
+        if len(sys.argv) == 3:
+            # 旧格式: python miner_u.py basis <doc_id>
+            main_cli(sys.argv[2])
+        else:
+            # 新格式: python miner_u.py <doc_id>
+            main_cli(sys.argv[1])
     else:
     else:
-        print("Usage: python miner_u.py <table_type> <doc_id>")
+        print("Usage: python miner_u.py <doc_id>")