# chat.py
  1. from fastapi import APIRouter, Depends, Request
  2. from fastapi.responses import StreamingResponse, JSONResponse
  3. from sqlalchemy.orm import Session
  4. from pydantic import BaseModel
  5. from typing import Optional
  6. from database import get_db, SessionLocal
  7. from models.chat import AIConversation, AIMessage
  8. from models.total import RecommendQuestion
  9. from utils.config import settings
  10. from utils.logger import logger
  11. from services.qwen_service import qwen_service
  12. from services.deepseek_service import deepseek_service
  13. from utils.prompt_loader import load_prompt
  14. from utils.thinking_summary import split_thinking_and_answer, summarize_thinking_content
  15. import time
  16. import json
  17. import httpx
  18. import re
# Router on which the endpoints defined in this module are registered.
router = APIRouter()
  20. def _build_conversation_preview(content: str, limit: int = 50) -> str:
  21. content = (content or "").strip()
  22. if len(content) <= limit:
  23. return content
  24. return content[:limit] + "..."
  25. def _to_frontend_timestamp(timestamp: Optional[int]) -> Optional[int]:
  26. if not timestamp:
  27. return None
  28. return timestamp if timestamp >= 10**12 else timestamp * 1000
  29. def _build_conversation_title(conversation: AIConversation) -> str:
  30. if conversation.business_type == 3 and (conversation.exam_name or "").strip():
  31. return conversation.exam_name.strip()
  32. return _build_conversation_preview(conversation.content or "", limit=30)
  33. def _normalize_related_question(question: str) -> str:
  34. if not isinstance(question, str):
  35. return ""
  36. text = question.strip().strip('"').strip("'")
  37. text = re.sub(r"^[0-9]+[\.\)\]、]\s*", "", text)
  38. text = re.sub(r"^[-*]\s*", "", text)
  39. return text.strip()
  40. def _is_placeholder_related_question(question: str) -> bool:
  41. normalized = _normalize_related_question(question).lower()
  42. if not normalized:
  43. return True
  44. placeholder_patterns = (
  45. r"^q\s*\d+$",
  46. r"^question\s*\d+$",
  47. r"^questions?\s*\d+$",
  48. r"^问题\s*\d+$",
  49. r"^相关问题\s*\d+$",
  50. r"^推荐问题\s*\d+$",
  51. r"^更多相关问题$",
  52. r"^更多问题$",
  53. )
  54. return any(re.fullmatch(pattern, normalized) for pattern in placeholder_patterns)
  55. def _contains_chinese(text: str) -> bool:
  56. return any("\u4e00" <= char <= "\u9fff" for char in text or "")
  57. def _is_invalid_related_question(question: str) -> bool:
  58. normalized = _normalize_related_question(question)
  59. if (
  60. not normalized
  61. or len(normalized) < 4
  62. or _is_placeholder_related_question(normalized)
  63. or not _contains_chinese(normalized)
  64. ):
  65. return True
  66. lowered = normalized.lower()
  67. blocked_keywords = (
  68. "thinking process",
  69. "analyze the request",
  70. "role:",
  71. "**role",
  72. "professional question recommendation",
  73. "infrastructure construction technology",
  74. "output format",
  75. "json",
  76. "prompt",
  77. "system",
  78. "assistant",
  79. "角色定义",
  80. "任务目标",
  81. "输入内容",
  82. "生成要求",
  83. "输出格式",
  84. "开始生成",
  85. )
  86. return any(keyword in lowered for keyword in blocked_keywords)
  87. def _extract_related_question_topic(content: str) -> str:
  88. if not content:
  89. return "当前话题"
  90. text = re.sub(r"<[^>]+>", " ", str(content))
  91. text = re.sub(r"\s+", " ", text).strip()
  92. text = re.sub(
  93. r"^(好的[!!,, ]*|我理解您提出的问题[,, ]*|这个问题[,, ]*|总的来说[::,, ]*)+",
  94. "",
  95. text,
  96. )
  97. pattern = re.search(
  98. r"(?:主要围绕|围绕|关于|针对|聚焦)([^。!?\n,,;;]{4,32})",
  99. text,
  100. )
  101. if pattern:
  102. topic = pattern.group(1).strip("“”\"' ::,,")
  103. if topic:
  104. return topic
  105. sentence = re.split(r"[。!?\n]", text, maxsplit=1)[0].strip("“”\"' ::,,")
  106. if sentence:
  107. return sentence[:24]
  108. return "当前话题"
  109. def _build_related_question_fallbacks(content: str) -> list[str]:
  110. topic = _extract_related_question_topic(content)
  111. return [
  112. f"{topic}在现场实施时需要重点关注哪些风险点?",
  113. f"{topic}相关的方案编制、审批和验收要求有哪些?",
  114. f"针对{topic},日常检查和监测应抓住哪些关键指标?",
  115. ]
  116. def _finalize_related_questions(questions: list, content: str, limit: int = 3) -> list[str]:
  117. cleaned_questions = []
  118. seen = set()
  119. for question in questions or []:
  120. normalized = _normalize_related_question(question)
  121. lowered = normalized.lower()
  122. if (
  123. _is_invalid_related_question(normalized)
  124. or lowered in seen
  125. ):
  126. continue
  127. cleaned_questions.append(normalized)
  128. seen.add(lowered)
  129. if len(cleaned_questions) == limit:
  130. return cleaned_questions
  131. for fallback in _build_related_question_fallbacks(content):
  132. lowered = fallback.lower()
  133. if lowered in seen:
  134. continue
  135. cleaned_questions.append(fallback)
  136. seen.add(lowered)
  137. if len(cleaned_questions) == limit:
  138. break
  139. return cleaned_questions[:limit]
  140. def _refresh_conversation_snapshot(db: Session, conversation_id: int, user_id: int) -> None:
  141. latest_message = (
  142. db.query(AIMessage)
  143. .filter(
  144. AIMessage.ai_conversation_id == conversation_id,
  145. AIMessage.user_id == user_id,
  146. AIMessage.is_deleted == 0,
  147. )
  148. .order_by(AIMessage.id.desc())
  149. .first()
  150. )
  151. if not latest_message:
  152. db.query(AIConversation).filter(
  153. AIConversation.id == conversation_id,
  154. AIConversation.user_id == user_id,
  155. ).update({"is_deleted": 1, "updated_at": int(time.time())})
  156. return
  157. latest_user_message = (
  158. db.query(AIMessage)
  159. .filter(
  160. AIMessage.ai_conversation_id == conversation_id,
  161. AIMessage.user_id == user_id,
  162. AIMessage.type == "user",
  163. AIMessage.is_deleted == 0,
  164. )
  165. .order_by(AIMessage.id.desc())
  166. .first()
  167. )
  168. preview_source = (
  169. latest_user_message.content
  170. if latest_user_message and latest_user_message.content
  171. else latest_message.content
  172. )
  173. preview_content = _build_conversation_preview(
  174. preview_source or "", limit=100)
  175. db.query(AIConversation).filter(
  176. AIConversation.id == conversation_id,
  177. AIConversation.user_id == user_id,
  178. ).update(
  179. {
  180. "content": preview_content or " ",
  181. "updated_at": int(time.time()),
  182. }
  183. )
# ─────────────────────────────────────────────────────────────────────────
# Helper functions
# ─────────────────────────────────────────────────────────────────────────
  187. async def _rag_search(message: str, top_k: int = 5) -> str:
  188. """调用 search API 做 RAG 检索,返回上下文文本"""
  189. try:
  190. search_cfg = getattr(settings, 'search', None)
  191. if not search_cfg or not hasattr(search_cfg, 'api_url'):
  192. return ""
  193. search_url = search_cfg.api_url
  194. if not search_url:
  195. return ""
  196. async with httpx.AsyncClient(timeout=10.0) as client:
  197. resp = await client.post(
  198. search_url,
  199. json={"query": message, "n_results": top_k},
  200. )
  201. if resp.status_code == 200:
  202. data = resp.json()
  203. docs = data.get("results") or data.get("documents") or []
  204. return "\n\n".join(
  205. d.get("content") or d.get("text") or str(d)
  206. for d in docs[:top_k]
  207. if d.get("content") or d.get("text")
  208. )
  209. except Exception as e:
  210. logger.warning(f"[RAG] 检索失败(可忽略): {e}")
  211. return ""
# System prompt sent to the model by _infer_safety_training_plan. It asks for
# a single JSON object describing a safety-training PPT outline request; the
# reply is parsed by _parse_json_object and merged over fallback values by
# _normalize_safety_training_plan.
SAFETY_TRAINING_PLAN_SYSTEM_PROMPT = """
你是安全培训需求整理助手。请把用户的自然语言输入整理成安全培训PPT大纲生成任务。
规则:
1. 只输出一个 JSON 对象,不要输出 Markdown、解释或额外文字。
2. 即使用户说“通知”“材料”“文档”,也必须理解为安全培训模块中的 PPT 大纲需求,不要切换到其他文档生成任务。
3. 如果字段缺失,请根据安全培训场景合理补全,但不要编造具体制度编号、人员姓名或不存在的事实。
4. template 字段用于选择大纲模板,默认填“标准安全培训PPT大纲”。
5. content_focus 至少给出 3 个要点。
JSON 字段:
{
"topic": "培训主题",
"template": "模板名称",
"content_focus": ["内容要点1", "内容要点2", "内容要点3"],
"audience": "参训对象",
"time": "培训时间",
"location": "培训地点",
"goal": "培训目标",
"notes": "其他要求",
"normalized_request": "归一化后的安全培训PPT大纲生成需求"
}
"""
  233. def _extract_tag_value(message: str, tag: str) -> str:
  234. match = re.search(fr"<{tag}>(.*?)</{tag}>", message or "", re.DOTALL)
  235. return match.group(1).strip() if match else ""
  236. def _strip_document_tags(message: str) -> str:
  237. text = message or ""
  238. for tag in ("word", "filename", "filesize"):
  239. text = re.sub(fr"<{tag}>.*?</{tag}>", " ", text, flags=re.DOTALL)
  240. return re.sub(r"\s+", " ", text).strip()
  241. def _extract_safety_training_request_payload(message: str) -> dict:
  242. return {
  243. "document_content": _extract_tag_value(message, "word"),
  244. "filename": _extract_tag_value(message, "filename"),
  245. "filesize": _extract_tag_value(message, "filesize"),
  246. "request": _strip_document_tags(message),
  247. }
  248. def _clean_safety_training_topic(message: str) -> str:
  249. request_text = _extract_safety_training_request_payload(message)["request"]
  250. first_clause = re.split(r"[,。;;,\n]", request_text, maxsplit=1)[0].strip()
  251. topic = first_clause or request_text or "安全培训"
  252. for token in ("请", "帮我", "帮忙", "生成", "制作", "输出", "一份", "一个", "一下", "PPT大纲", "ppt大纲", "大纲", "通知", "文档", "材料"):
  253. topic = topic.replace(token, "")
  254. topic = re.sub(r"\s+", "", topic).strip(" ::,,。;;")
  255. if not topic:
  256. topic = "安全培训"
  257. if "培训" not in topic:
  258. topic = f"{topic}安全培训"
  259. return topic
  260. def _parse_json_object(text: str) -> dict:
  261. if not text:
  262. return {}
  263. cleaned = re.sub(r"```(?:json)?\s*", "", str(text)).replace("```", "").strip()
  264. match = re.search(r"\{.*\}", cleaned, re.DOTALL)
  265. if not match:
  266. return {}
  267. try:
  268. parsed = json.loads(match.group(0))
  269. return parsed if isinstance(parsed, dict) else {}
  270. except json.JSONDecodeError:
  271. return {}
  272. def _build_fallback_safety_training_plan(message: str) -> dict:
  273. topic = _clean_safety_training_topic(message)
  274. payload = _extract_safety_training_request_payload(message)
  275. return {
  276. "topic": topic,
  277. "template": "标准安全培训PPT大纲",
  278. "content_focus": ["安全生产责任", "现场风险识别", "安全意识提升", "培训纪律与行为规范"],
  279. "audience": "参训员工",
  280. "time": "",
  281. "location": "",
  282. "goal": "提升参训人员安全意识和施工现场风险防控能力",
  283. "notes": payload["request"],
  284. "normalized_request": f"围绕{topic}生成安全培训PPT大纲",
  285. }
  286. def _normalize_safety_training_plan(message: str, raw_plan: dict) -> dict:
  287. plan = _build_fallback_safety_training_plan(message)
  288. if not isinstance(raw_plan, dict):
  289. return plan
  290. for key in ("topic", "template", "audience", "time", "location", "goal", "notes", "normalized_request"):
  291. value = raw_plan.get(key)
  292. if isinstance(value, str) and value.strip():
  293. plan[key] = value.strip()
  294. focus = raw_plan.get("content_focus")
  295. if isinstance(focus, list):
  296. normalized_focus = [str(item).strip() for item in focus if str(item).strip()]
  297. if normalized_focus:
  298. plan["content_focus"] = normalized_focus
  299. elif isinstance(focus, str) and focus.strip():
  300. plan["content_focus"] = [item.strip() for item in re.split(r"[、,,;\n]", focus) if item.strip()]
  301. if "培训" not in plan["topic"]:
  302. plan["topic"] = f"{plan['topic']}安全培训"
  303. if "PPT大纲" not in plan["template"]:
  304. plan["template"] = f"{plan['template']}PPT大纲"
  305. return plan
  306. def _build_safety_training_generation_message(message: str, plan: dict) -> str:
  307. payload = _extract_safety_training_request_payload(message)
  308. focus_text = "、".join(plan.get("content_focus") or [])
  309. lines = [
  310. "输出类型:安全培训PPT大纲",
  311. "请基于以下结构化需求生成安全培训PPT大纲,不要生成通知正文,不要切换到其他文档生成任务。",
  312. f"主题:{plan.get('topic') or '安全培训'}",
  313. f"模板:{plan.get('template') or '标准安全培训PPT大纲'}",
  314. f"内容要点:{focus_text or '安全生产责任、风险识别、应急处置、安全意识提升'}",
  315. f"参训对象:{plan.get('audience') or '参训员工'}",
  316. f"培训时间:{plan.get('time') or '未指定'}",
  317. f"培训地点:{plan.get('location') or '未指定'}",
  318. f"培训目标:{plan.get('goal') or '提升参训人员安全意识和风险防控能力'}",
  319. f"其他要求:{plan.get('notes') or '无'}",
  320. f"归一化需求:{plan.get('normalized_request') or ''}",
  321. f"原始需求:{payload['request'] or message}",
  322. ]
  323. if payload["filename"] or payload["document_content"]:
  324. lines.extend([
  325. f"上传文档名称:{payload['filename'] or '未命名文档'}",
  326. f"上传文档大小:{payload['filesize'] or '未知'}",
  327. "上传文档内容:",
  328. payload["document_content"] or "无",
  329. ])
  330. return "\n".join(lines)
  331. async def _infer_safety_training_plan(message: str) -> dict:
  332. payload = _extract_safety_training_request_payload(message)
  333. planning_input = payload["request"] or message
  334. if payload["document_content"]:
  335. planning_input = (
  336. f"{planning_input}\n\n"
  337. f"上传文档名称:{payload['filename'] or '未命名文档'}\n"
  338. f"上传文档内容摘要:{payload['document_content'][:3000]}"
  339. )
  340. try:
  341. response = await qwen_service.chat([
  342. {"role": "system", "content": SAFETY_TRAINING_PLAN_SYSTEM_PROMPT},
  343. {"role": "user", "content": planning_input},
  344. ])
  345. return _normalize_safety_training_plan(message, _parse_json_object(response))
  346. except Exception as e:
  347. logger.warning(f"[safety_training] 需求整理失败,使用兜底结构: {type(e).__name__}: {e}")
  348. return _build_fallback_safety_training_plan(message)
  349. def _clean_ai_writing_response(content: str) -> str:
  350. text = str(content or "").strip()
  351. if not text:
  352. return ""
  353. text = re.sub(r"```(?:html)?\s*", "", text, flags=re.IGNORECASE).replace("```", "").strip()
  354. body_match = re.search(r"<body[^>]*>(.*?)</body>", text, re.IGNORECASE | re.DOTALL)
  355. if body_match:
  356. text = body_match.group(1).strip()
  357. first_content_tag = re.search(
  358. r"<(?:article|section|main|div|h[1-6]|p|table|ul|ol)\b",
  359. text,
  360. re.IGNORECASE,
  361. )
  362. if first_content_tag and text[:first_content_tag.start()].strip():
  363. text = text[first_content_tag.start():]
  364. cleanup_patterns = (
  365. r"<!DOCTYPE[^>]*>",
  366. r"<html[^>]*>",
  367. r"</html>",
  368. r"<head[^>]*>.*?</head>",
  369. r"<body[^>]*>",
  370. r"</body>",
  371. r"<style[^>]*>.*?</style>",
  372. r"<script[^>]*>.*?</script>",
  373. r"<meta[^>]*>",
  374. r"<title[^>]*>.*?</title>",
  375. )
  376. for pattern in cleanup_patterns:
  377. text = re.sub(pattern, "", text, flags=re.IGNORECASE | re.DOTALL)
  378. return text.strip()
  379. async def _generate_ai_writing_response(message: str) -> str:
  380. rag_context = await _rag_search(message, top_k=10)
  381. system_content = load_prompt(
  382. "document_writing",
  383. userMessage=message,
  384. contextJSON=rag_context if rag_context else "暂无相关知识库内容",
  385. )
  386. messages = [
  387. {"role": "system", "content": system_content},
  388. {
  389. "role": "user",
  390. "content": (
  391. "请根据上面的写作规范和我的原始需求,直接生成可放入富文本编辑器的公文正文 HTML 片段。"
  392. "不要输出道歉、解释、DOCTYPE、html、head、body、style 或 script 标签。\n\n"
  393. f"原始需求:\n{message}"
  394. ),
  395. },
  396. ]
  397. raw_response = await deepseek_service.chat(messages)
  398. raw_thinking, raw_answer = split_thinking_and_answer(raw_response)
  399. answer_text = _clean_ai_writing_response(raw_answer or raw_response)
  400. if raw_thinking:
  401. thinking_summary = await summarize_thinking_content(
  402. user_question=message,
  403. raw_thinking=raw_thinking,
  404. final_answer=answer_text,
  405. chat_service=deepseek_service,
  406. context="document_writing",
  407. )
  408. return (
  409. f"思考过程:\n{thinking_summary}\n\n回答:\n{answer_text}"
  410. if thinking_summary
  411. else answer_text
  412. )
  413. return answer_text
  414. async def _generate_ppt_outline_response(message: str) -> str:
  415. training_plan = await _infer_safety_training_plan(message)
  416. generation_message = _build_safety_training_generation_message(message, training_plan)
  417. rag_context = await _rag_search(generation_message, top_k=10)
  418. system_content = load_prompt(
  419. "ppt_outline",
  420. userMessage=generation_message,
  421. contextJSON=rag_context if rag_context else "暂无相关知识库内容",
  422. )
  423. messages = [
  424. {"role": "system", "content": system_content},
  425. {"role": "user", "content": "请直接输出安全培训PPT大纲正文,从标题开始,不要解释提示词或安全规则。"},
  426. ]
  427. raw_response = await qwen_service.chat(messages)
  428. raw_thinking, raw_answer = split_thinking_and_answer(raw_response)
  429. answer_text = raw_answer or raw_response
  430. if raw_thinking:
  431. thinking_summary = await summarize_thinking_content(
  432. user_question=message,
  433. raw_thinking=raw_thinking,
  434. final_answer=answer_text,
  435. chat_service=qwen_service,
  436. context="ppt_outline",
  437. )
  438. return (
  439. f"思考过程:\n{thinking_summary}\n\n回答:\n{answer_text}"
  440. if thinking_summary
  441. else answer_text
  442. )
  443. return answer_text
  444. def _persist_message_pair(db: Session, conv_id: int, user, user_content: str, ai_content: str):
  445. now_ts = int(time.time())
  446. user_message = AIMessage(
  447. ai_conversation_id=conv_id,
  448. user_id=user.user_id,
  449. type="user",
  450. content=user_content,
  451. created_at=now_ts,
  452. updated_at=now_ts,
  453. is_deleted=0,
  454. )
  455. db.add(user_message)
  456. db.commit()
  457. db.refresh(user_message)
  458. ai_message = AIMessage(
  459. ai_conversation_id=conv_id,
  460. user_id=user.user_id,
  461. type="ai",
  462. content=ai_content,
  463. prev_user_id=user_message.id,
  464. created_at=now_ts,
  465. updated_at=now_ts,
  466. is_deleted=0,
  467. )
  468. db.add(ai_message)
  469. db.commit()
  470. db.refresh(ai_message)
  471. return user_message, ai_message
  472. def _build_history_messages(conv_id: int, limit: int = 10) -> list:
  473. """从数据库读取最近对话历史,构建 messages 列表"""
  474. db = SessionLocal()
  475. try:
  476. msgs = (
  477. db.query(AIMessage)
  478. .filter(AIMessage.ai_conversation_id == conv_id, AIMessage.is_deleted == 0)
  479. .order_by(AIMessage.id.desc())
  480. .limit(limit)
  481. .all()
  482. )
  483. msgs.reverse()
  484. result = []
  485. for m in msgs:
  486. role = "user" if m.type == "user" else "assistant"
  487. if m.content:
  488. result.append({"role": role, "content": m.content})
  489. return result
  490. finally:
  491. db.close()
# ─────────────────────────────────────────────────────────────────────────
# Non-streaming endpoints
# ─────────────────────────────────────────────────────────────────────────
class SendMessageRequest(BaseModel):
    # Request body of POST /send_deepseek_message.
    # Text of the user's message; the handler strips it and rejects blanks.
    message: str
    # Id of an existing conversation. The handler uses conversation_id when
    # it is truthy and falls back to ai_conversation_id; when both are empty
    # a new conversation is created.
    conversation_id: Optional[int] = None
    ai_conversation_id: Optional[int] = None
    business_type: int = 0  # 0=AI Q&A, 1=PPT outline, 2=AI writing, 3=exam workshop
    # Stored on the conversation only when business_type is 3.
    exam_name: str = ""
    # NOTE(review): not read by send_deepseek_message in the visible code.
    ai_message_id: int = 0
  502. @router.post("/send_deepseek_message")
  503. async def send_deepseek_message(
  504. request: Request,
  505. data: SendMessageRequest,
  506. db: Session = Depends(get_db),
  507. ):
  508. """
  509. 发送消息(非流式)
  510. 支持多种业务类型:
  511. - 0: AI问答(意图识别 + RAG)
  512. - 1: PPT大纲生成
  513. - 2: AI写作
  514. - 3: 考试工坊
  515. """
  516. user = request.state.user
  517. if not user:
  518. return {"statusCode": 401, "msg": "未授权"}
  519. try:
  520. message = data.message.strip()
  521. if not message:
  522. return {"statusCode": 400, "msg": "消息不能为空"}
  523. conversation_id = data.conversation_id or data.ai_conversation_id
  524. # 创建或获取对话
  525. if not conversation_id:
  526. conversation = AIConversation(
  527. user_id=user.user_id,
  528. content=message[:100],
  529. business_type=data.business_type,
  530. exam_name=data.exam_name if data.business_type == 3 else "",
  531. created_at=int(time.time()),
  532. updated_at=int(time.time()),
  533. is_deleted=0,
  534. )
  535. db.add(conversation)
  536. db.commit()
  537. db.refresh(conversation)
  538. conv_id = conversation.id
  539. else:
  540. conv_id = conversation_id
  541. db.query(AIConversation).filter(
  542. AIConversation.id == conv_id,
  543. AIConversation.user_id == user.user_id,
  544. AIConversation.is_deleted == 0,
  545. ).update({
  546. "content": message[:100],
  547. "business_type": data.business_type,
  548. "exam_name": data.exam_name if data.business_type == 3 else "",
  549. "updated_at": int(time.time()),
  550. })
  551. db.commit()
  552. response_text = ""
  553. ai_message_id = 0
  554. if data.business_type == 0:
  555. # AI问答:意图识别 + RAG
  556. try:
  557. intent_result = await qwen_service.intent_recognition(message)
  558. intent_type = ""
  559. if isinstance(intent_result, dict):
  560. intent_type = (
  561. intent_result.get("intent_type") or intent_result.get(
  562. "intent") or ""
  563. ).lower()
  564. rag_context = ""
  565. if intent_type in ("query_knowledge_base", "知识库查询", "技术咨询"):
  566. rag_context = await _rag_search(message, top_k=10)
  567. # 使用prompt加载器加载最终回答prompt
  568. system_content = load_prompt(
  569. "final_answer",
  570. userMessage=message,
  571. contextJSON=rag_context if rag_context else "暂无相关知识库内容"
  572. )
  573. messages = [
  574. {"role": "user", "content": system_content},
  575. ]
  576. qwen_response = await qwen_service.chat(messages)
  577. raw_thinking, raw_answer = split_thinking_and_answer(qwen_response)
  578. answer_source = raw_answer or qwen_response
  579. # 兼容模型直接返回 JSON 的场景
  580. answer_text = answer_source
  581. try:
  582. if isinstance(answer_source, str) and answer_source.strip().startswith("{"):
  583. response_json = json.loads(answer_source)
  584. answer_text = response_json.get(
  585. "natural_language_answer", answer_source
  586. )
  587. except Exception:
  588. answer_text = answer_source
  589. if raw_thinking:
  590. thinking_summary = await summarize_thinking_content(
  591. user_question=message,
  592. raw_thinking=raw_thinking,
  593. final_answer=answer_text,
  594. chat_service=qwen_service,
  595. context="send_message",
  596. )
  597. response_text = (
  598. f"思考过程:\n{thinking_summary}\n\n回答:\n{answer_text}"
  599. if thinking_summary
  600. else answer_text
  601. )
  602. else:
  603. response_text = answer_text
  604. except Exception as e:
  605. error_detail = str(e).strip() if str(e).strip() else f"未知错误({type(e).__name__})"
  606. logger.error(f"[send_deepseek_message] AI问答异常: {type(e).__name__}: {error_detail}")
  607. response_text = f"处理失败: {error_detail}"
  608. elif data.business_type == 1:
  609. # PPT大纲生成
  610. try:
  611. response_text = await _generate_ppt_outline_response(message)
  612. _, ai_message = _persist_message_pair(
  613. db=db,
  614. conv_id=conv_id,
  615. user=user,
  616. user_content=message,
  617. ai_content=response_text,
  618. )
  619. ai_message_id = ai_message.id
  620. _refresh_conversation_snapshot(db, conv_id, user.user_id)
  621. db.commit()
  622. return {
  623. "statusCode": 200,
  624. "msg": "success",
  625. "data": {
  626. "conversation_id": conv_id,
  627. "ai_conversation_id": conv_id,
  628. "response": response_text,
  629. "reply": response_text,
  630. "content": response_text,
  631. "message": response_text,
  632. "ai_message_id": ai_message_id,
  633. "user_id": user.user_id,
  634. "business_type": data.business_type,
  635. },
  636. }
  637. except Exception as e:
  638. error_detail = str(e).strip() if str(e).strip() else f"未知错误({type(e).__name__})"
  639. logger.error(f"[send_deepseek_message] PPT大纲生成异常: {type(e).__name__}: {error_detail}")
  640. response_text = f"处理失败: {error_detail}"
  641. elif data.business_type == 2:
  642. # AI写作
  643. try:
  644. response_text = await _generate_ai_writing_response(message)
  645. _, ai_message = _persist_message_pair(
  646. db=db,
  647. conv_id=conv_id,
  648. user=user,
  649. user_content=message,
  650. ai_content=response_text,
  651. )
  652. ai_message_id = ai_message.id
  653. _refresh_conversation_snapshot(db, conv_id, user.user_id)
  654. db.commit()
  655. return {
  656. "statusCode": 200,
  657. "msg": "success",
  658. "data": {
  659. "conversation_id": conv_id,
  660. "ai_conversation_id": conv_id,
  661. "response": response_text,
  662. "reply": response_text,
  663. "content": response_text,
  664. "message": response_text,
  665. "ai_message_id": ai_message_id,
  666. "user_id": user.user_id,
  667. "business_type": data.business_type,
  668. },
  669. }
  670. except Exception as e:
  671. error_detail = str(e).strip() if str(e).strip() else f"未知错误({type(e).__name__})"
  672. logger.error(f"[send_deepseek_message] AI写作异常: {type(e).__name__}: {error_detail}")
  673. response_text = f"处理失败: {error_detail}"
  674. elif data.business_type == 3:
  675. # 考试工坊:生成题目
  676. try:
  677. system_content = (
  678. "你是一个专业的考试题目生成助手,专注于路桥隧轨施工安全领域。\n"
  679. "请根据用户需求生成专业的考试题目,包括单选题、多选题、判断题、简答题等。\n"
  680. "用户消息中已经包含考试标题、题型要求和出题依据内容,必须以其中的出题依据内容为核心生成题目,不能脱离依据内容自由发挥。\n"
  681. "题干、选项、答案和解析都要与出题依据内容中的知识点、专业术语、操作流程、规范要求或培训主题直接相关。\n"
  682. "输出必须是可直接 JSON.parse 的纯 JSON,不要包含 markdown 代码块、解释文字或额外前后缀。\n"
  683. "JSON 顶层结构必须包含 singleChoice、judge、multiple、short 四个字段。\n"
  684. "singleChoice.questions 和 multiple.questions 中每道题必须包含 text、options、answer、analysis。\n"
  685. "options 必须是数组,元素格式为 {\"key\":\"A\",\"text\":\"具体选项内容\"},禁止输出“选项A”这类占位文本。\n"
  686. "judge.questions 中每道题必须包含 text、answer、analysis。\n"
  687. "short.questions 中每道题必须包含 text、outline,其中 outline 至少包含 keyFactors。\n"
  688. "所有题目内容、选项内容、答案和解析都要结合用户给出的工程类型、题型数量、分值和课件内容具体生成。"
  689. )
  690. messages = [
  691. {"role": "system", "content": system_content},
  692. {"role": "user", "content": message},
  693. ]
  694. response_text = await qwen_service.chat(messages)
  695. now_ts = int(time.time())
  696. user_message = AIMessage(
  697. ai_conversation_id=conv_id,
  698. user_id=user.user_id,
  699. type="user",
  700. content=message,
  701. created_at=now_ts,
  702. updated_at=now_ts,
  703. is_deleted=0,
  704. )
  705. db.add(user_message)
  706. db.commit()
  707. db.refresh(user_message)
  708. ai_message = AIMessage(
  709. ai_conversation_id=conv_id,
  710. user_id=user.user_id,
  711. type="ai",
  712. content=response_text,
  713. prev_user_id=user_message.id,
  714. created_at=now_ts,
  715. updated_at=now_ts,
  716. is_deleted=0,
  717. )
  718. db.add(ai_message)
  719. db.commit()
  720. _refresh_conversation_snapshot(db, conv_id, user.user_id)
  721. db.commit()
  722. if data.exam_name:
  723. db.query(AIConversation).filter(AIConversation.id == conv_id).update(
  724. {"exam_name": data.exam_name,
  725. "updated_at": int(time.time())}
  726. )
  727. db.commit()
  728. except Exception as e:
  729. error_detail = str(e).strip() if str(e).strip() else f"未知错误({type(e).__name__})"
  730. logger.error(f"[send_deepseek_message] 考试工坊异常: {type(e).__name__}: {error_detail}")
  731. response_text = f"处理失败: {error_detail}"
  732. else:
  733. return {"statusCode": 400, "msg": f"不支持的业务类型: {data.business_type}"}
  734. return {
  735. "statusCode": 200,
  736. "msg": "success",
  737. "data": {
  738. "conversation_id": conv_id,
  739. "ai_conversation_id": conv_id,
  740. "response": response_text,
  741. "reply": response_text,
  742. "content": response_text,
  743. "message": response_text,
  744. "user_id": user.user_id,
  745. "business_type": data.business_type,
  746. },
  747. }
  748. except Exception as e:
  749. logger.error(f"[send_deepseek_message] 异常: {e}")
  750. return {"statusCode": 500, "msg": f"处理失败: {str(e)}"}
  751. @router.get("/get_history_record")
  752. async def get_history_record(
  753. request: Request,
  754. ai_conversation_id: int = 0,
  755. business_type: Optional[int] = None,
  756. db: Session = Depends(get_db),
  757. ):
  758. """兼容前端的历史记录查询:ai_conversation_id=0 返回对话列表,否则返回消息详情。"""
  759. user = request.state.user
  760. if not user:
  761. return {"statusCode": 401, "msg": "未授权"}
  762. if ai_conversation_id > 0:
  763. messages = (
  764. db.query(AIMessage)
  765. .filter(
  766. AIMessage.ai_conversation_id == ai_conversation_id,
  767. AIMessage.user_id == user.user_id,
  768. AIMessage.is_deleted == 0,
  769. )
  770. .order_by(AIMessage.id.asc())
  771. .all()
  772. )
  773. return {
  774. "statusCode": 200,
  775. "msg": "success",
  776. "total": len(messages),
  777. "data": [
  778. {
  779. "id": message.id,
  780. "ai_conversation_id": message.ai_conversation_id,
  781. "user_id": message.user_id,
  782. "type": message.type,
  783. "content": message.content,
  784. "user_feedback": message.user_feedback,
  785. "prev_user_id": message.prev_user_id,
  786. "search_source": message.search_source or "",
  787. "guess_you_want": message.guess_you_want or "",
  788. "created_at": _to_frontend_timestamp(message.created_at),
  789. "updated_at": _to_frontend_timestamp(message.updated_at),
  790. }
  791. for message in messages
  792. ],
  793. }
  794. conversations_query = db.query(AIConversation).filter(
  795. AIConversation.user_id == user.user_id,
  796. AIConversation.is_deleted == 0,
  797. )
  798. if business_type is not None:
  799. conversations_query = conversations_query.filter(
  800. AIConversation.business_type == business_type
  801. )
  802. total = conversations_query.count()
  803. conversations = (
  804. conversations_query
  805. .order_by(AIConversation.updated_at.desc(), AIConversation.id.desc())
  806. .limit(50)
  807. .all()
  808. )
  809. return {
  810. "statusCode": 200,
  811. "msg": "success",
  812. "total": total,
  813. "data": [
  814. {
  815. "id": conv.id,
  816. "title": _build_conversation_title(conv),
  817. "content": conv.content or "",
  818. "business_type": conv.business_type,
  819. "exam_name": conv.exam_name or "",
  820. "created_at": _to_frontend_timestamp(conv.created_at),
  821. "updated_at": _to_frontend_timestamp(conv.updated_at),
  822. }
  823. for conv in conversations
  824. ],
  825. }
class DeleteConversationRequest(BaseModel):
    """Request body for ``/delete_conversation``.

    A non-zero ``ai_message_id`` selects single-message deletion; otherwise
    ``ai_conversation_id`` selects the conversation to delete.
    """

    # Conversation to soft-delete; 0 means "not supplied".
    ai_conversation_id: int = 0
    # AI message to soft-delete; 0 means "not supplied". Takes precedence
    # over ai_conversation_id in the handler.
    ai_message_id: int = 0
  829. @router.post("/delete_conversation")
  830. async def delete_conversation(
  831. request: Request, data: DeleteConversationRequest, db: Session = Depends(get_db)
  832. ):
  833. """
  834. 删除对话(软删除)
  835. 同时软删除对话记录和所有关联的消息
  836. """
  837. user = request.state.user
  838. if not user:
  839. return {"statusCode": 401, "msg": "未授权"}
  840. now_ts = int(time.time())
  841. if data.ai_message_id:
  842. ai_message = (
  843. db.query(AIMessage)
  844. .filter(
  845. AIMessage.id == data.ai_message_id,
  846. AIMessage.user_id == user.user_id,
  847. AIMessage.type == "ai",
  848. AIMessage.is_deleted == 0,
  849. )
  850. .first()
  851. )
  852. if not ai_message:
  853. return {"statusCode": 404, "msg": "消息不存在"}
  854. db.query(AIMessage).filter(
  855. AIMessage.id == ai_message.id,
  856. AIMessage.user_id == user.user_id,
  857. ).update({"is_deleted": 1, "updated_at": now_ts})
  858. if ai_message.prev_user_id:
  859. db.query(AIMessage).filter(
  860. AIMessage.id == ai_message.prev_user_id,
  861. AIMessage.user_id == user.user_id,
  862. AIMessage.ai_conversation_id == ai_message.ai_conversation_id,
  863. ).update({"is_deleted": 1, "updated_at": now_ts})
  864. _refresh_conversation_snapshot(
  865. db, ai_message.ai_conversation_id, user.user_id)
  866. db.commit()
  867. return {"statusCode": 200, "msg": "删除成功"}
  868. if not data.ai_conversation_id:
  869. return {"statusCode": 400, "msg": "缺少删除参数"}
  870. db.query(AIConversation).filter(
  871. AIConversation.id == data.ai_conversation_id,
  872. AIConversation.user_id == user.user_id,
  873. ).update({"is_deleted": 1, "updated_at": now_ts})
  874. db.query(AIMessage).filter(
  875. AIMessage.ai_conversation_id == data.ai_conversation_id,
  876. AIMessage.user_id == user.user_id,
  877. ).update({"is_deleted": 1, "updated_at": now_ts})
  878. db.commit()
  879. return {"statusCode": 200, "msg": "删除成功"}
class DeleteHistoryRequest(BaseModel):
    """Request body for ``/delete_history_record``."""

    # Conversation whose history record should be soft-deleted (required).
    ai_conversation_id: int
  882. @router.post("/delete_history_record")
  883. async def delete_history_record(
  884. request: Request, data: DeleteHistoryRequest, db: Session = Depends(get_db)
  885. ):
  886. """删除历史记录(软删除)"""
  887. user = request.state.user
  888. if not user:
  889. return {"statusCode": 401, "msg": "未授权"}
  890. db.query(AIConversation).filter(
  891. AIConversation.id == data.ai_conversation_id,
  892. AIConversation.user_id == user.user_id,
  893. ).update({"is_deleted": 1, "updated_at": int(time.time())})
  894. db.commit()
  895. return {"statusCode": 200, "msg": "删除成功"}
  896. # ─────────────────────────────────────────────────────────────────────────
  897. # 流式接口 /stream/chat(无 DB,意图识别 + RAG)
  898. # ─────────────────────────────────────────────────────────────────────────
class StreamChatRequest(BaseModel):
    """Request body for the DB-less ``/stream/chat`` endpoint."""

    # User message; the handler strips it and rejects an empty result.
    message: str
    # Model name hint. NOTE(review): the /stream/chat handler does not read
    # this field — confirm whether it is still needed.
    model: str = ""
  902. @router.post("/stream/chat")
  903. async def stream_chat(request: Request, data: StreamChatRequest):
  904. """流式聊天(SSE,不写 DB)"""
  905. message = data.message.strip()
  906. if not message:
  907. return JSONResponse(content={"statusCode": 400, "msg": "消息不能为空"})
  908. async def event_generator():
  909. intent_type = ""
  910. try:
  911. intent_result = await qwen_service.intent_recognition(message)
  912. if isinstance(intent_result, dict):
  913. intent_type = (
  914. intent_result.get("intent_type") or intent_result.get(
  915. "intent") or ""
  916. ).lower()
  917. except Exception as ie:
  918. logger.warning(f"[stream/chat] 意图识别异常: {ie}")
  919. rag_context = ""
  920. if intent_type in ("query_knowledge_base", "知识库查询", "技术咨询"):
  921. rag_context = await _rag_search(message)
  922. # 使用prompt加载器加载最终回答prompt
  923. system_content = load_prompt(
  924. "final_answer",
  925. userMessage=message,
  926. contextJSON=rag_context if rag_context else "暂无相关知识库内容"
  927. )
  928. messages = [
  929. {"role": "user", "content": system_content},
  930. ]
  931. try:
  932. buffer = ""
  933. pre_answer = ""
  934. thinking_buf = ""
  935. in_think = False
  936. thinking_done = False
  937. max_input_chars = getattr(settings.thinking_summary, "max_input_chars", 1500)
  938. async for chunk in qwen_service.stream_chat(messages):
  939. buffer += chunk
  940. while buffer:
  941. lower = buffer.lower()
  942. if not thinking_done:
  943. if not in_think:
  944. start_idx = lower.find("<think>")
  945. if start_idx == -1:
  946. yield f"data: {json.dumps({'content': buffer}, ensure_ascii=False)}\n\n"
  947. buffer = ""
  948. break
  949. pre_answer += buffer[:start_idx]
  950. buffer = buffer[start_idx + len("<think>"):]
  951. in_think = True
  952. continue
  953. end_idx = lower.find("</think>")
  954. if end_idx == -1:
  955. if max_input_chars and len(thinking_buf) < max_input_chars:
  956. thinking_buf += buffer[: max_input_chars - len(thinking_buf)]
  957. buffer = ""
  958. break
  959. if max_input_chars and len(thinking_buf) < max_input_chars:
  960. thinking_part = buffer[:end_idx]
  961. thinking_buf += thinking_part[: max_input_chars - len(thinking_buf)]
  962. buffer = buffer[end_idx + len("</think>"):]
  963. in_think = False
  964. thinking_done = True
  965. thinking_summary = await summarize_thinking_content(
  966. user_question=message,
  967. raw_thinking=thinking_buf,
  968. final_answer="",
  969. chat_service=qwen_service,
  970. context="stream_chat",
  971. )
  972. if thinking_summary:
  973. prefix = f"思考过程:\n{thinking_summary}\n\n回答:\n"
  974. yield f"data: {json.dumps({'content': prefix}, ensure_ascii=False)}\n\n"
  975. answer_chunk = (pre_answer + buffer).lstrip()
  976. if answer_chunk:
  977. yield f"data: {json.dumps({'content': answer_chunk}, ensure_ascii=False)}\n\n"
  978. pre_answer = ""
  979. buffer = ""
  980. break
  981. yield f"data: {json.dumps({'content': buffer}, ensure_ascii=False)}\n\n"
  982. buffer = ""
  983. # 流结束但未遇到 </think>:仅尝试生成要点(不回退输出 raw thinking)
  984. if in_think and not thinking_done and thinking_buf:
  985. thinking_summary = await summarize_thinking_content(
  986. user_question=message,
  987. raw_thinking=thinking_buf,
  988. final_answer="",
  989. chat_service=qwen_service,
  990. context="stream_chat_eof",
  991. )
  992. if thinking_summary:
  993. prefix = f"思考过程:\n{thinking_summary}\n\n回答:\n"
  994. yield f"data: {json.dumps({'content': prefix}, ensure_ascii=False)}\n\n"
  995. if pre_answer:
  996. yield f"data: {json.dumps({'content': pre_answer}, ensure_ascii=False)}\n\n"
  997. except Exception as e:
  998. logger.error(f"[stream/chat] 流式输出异常: {e}")
  999. yield f"data: {json.dumps({'error': str(e)}, ensure_ascii=False)}\n\n"
  1000. finally:
  1001. yield "data: [DONE]\n\n"
  1002. return StreamingResponse(event_generator(), media_type="text/event-stream")
  1003. # ─────────────────────────────────────────────────────────────────────────
  1004. # 流式接口 /stream/chat-with-db(前端主聊天接口)
  1005. # ─────────────────────────────────────────────────────────────────────────
class StreamChatWithDBRequest(BaseModel):
    """Request body for ``/stream/chat-with-db``."""

    # User message; the handler strips it and rejects an empty result.
    message: str
    # Existing conversation to continue; 0 creates a new conversation.
    ai_conversation_id: int = 0
    # Business type; the handler uses dedicated prompts for 1 and 2 and
    # stores exam_name only when this is 3.
    business_type: int = 0
    # Exam title stored on the conversation when business_type == 3.
    exam_name: str = ""
    # NOTE(review): not read by the /stream/chat-with-db handler — confirm
    # whether it is still needed.
    ai_message_id: int = 0
    # Optional online-search text appended to the prompt context.
    online_search_content: str = ""
  1013. @router.post("/stream/chat-with-db")
  1014. async def stream_chat_with_db(request: Request, data: StreamChatWithDBRequest):
  1015. """
  1016. 带 DB 操作的流式聊天(SSE)
  1017. 流程:
  1018. 1. 创建/获取对话
  1019. 2. 插入用户消息和 AI 占位消息
  1020. 3. 发送 initial 事件
  1021. 4. RAG 检索
  1022. 5. 构建历史上下文
  1023. 6. 流式输出
  1024. 7. 更新 AI 消息内容
  1025. """
  1026. user = request.state.user
  1027. if not user:
  1028. return JSONResponse(content={"statusCode": 401, "msg": "未授权"})
  1029. message = data.message.strip()
  1030. if not message:
  1031. return JSONResponse(content={"statusCode": 400, "msg": "消息不能为空"})
  1032. async def event_generator():
  1033. db = SessionLocal()
  1034. try:
  1035. # 1. 创建或获取对话
  1036. if data.ai_conversation_id == 0:
  1037. conversation = AIConversation(
  1038. user_id=user.user_id,
  1039. content=_build_conversation_preview(message, limit=100),
  1040. business_type=data.business_type,
  1041. exam_name=data.exam_name,
  1042. created_at=int(time.time()),
  1043. updated_at=int(time.time()),
  1044. is_deleted=0,
  1045. )
  1046. db.add(conversation)
  1047. db.commit()
  1048. db.refresh(conversation)
  1049. conv_id = conversation.id
  1050. else:
  1051. existing_conversation = (
  1052. db.query(AIConversation)
  1053. .filter(
  1054. AIConversation.id == data.ai_conversation_id,
  1055. AIConversation.user_id == user.user_id,
  1056. AIConversation.is_deleted == 0,
  1057. )
  1058. .first()
  1059. )
  1060. if existing_conversation:
  1061. conv_id = existing_conversation.id
  1062. db.query(AIConversation).filter(
  1063. AIConversation.id == conv_id,
  1064. AIConversation.user_id == user.user_id,
  1065. ).update(
  1066. {
  1067. "content": _build_conversation_preview(message, limit=100),
  1068. "business_type": data.business_type,
  1069. "exam_name": data.exam_name if data.business_type == 3 else "",
  1070. "updated_at": int(time.time()),
  1071. }
  1072. )
  1073. db.commit()
  1074. else:
  1075. conversation = AIConversation(
  1076. user_id=user.user_id,
  1077. content=_build_conversation_preview(
  1078. message, limit=100),
  1079. business_type=data.business_type,
  1080. exam_name=data.exam_name if data.business_type == 3 else "",
  1081. created_at=int(time.time()),
  1082. updated_at=int(time.time()),
  1083. is_deleted=0,
  1084. )
  1085. db.add(conversation)
  1086. db.commit()
  1087. db.refresh(conversation)
  1088. conv_id = conversation.id
  1089. # 2. 插入用户消息
  1090. user_msg = AIMessage(
  1091. ai_conversation_id=conv_id,
  1092. user_id=user.user_id,
  1093. type="user",
  1094. content=message,
  1095. created_at=int(time.time()),
  1096. updated_at=int(time.time()),
  1097. is_deleted=0,
  1098. )
  1099. db.add(user_msg)
  1100. db.commit()
  1101. db.refresh(user_msg)
  1102. # 3. 插入 AI 占位消息
  1103. ai_msg = AIMessage(
  1104. ai_conversation_id=conv_id,
  1105. user_id=user.user_id,
  1106. type="ai",
  1107. content="",
  1108. prev_user_id=user_msg.id,
  1109. created_at=int(time.time()),
  1110. updated_at=int(time.time()),
  1111. is_deleted=0,
  1112. )
  1113. db.add(ai_msg)
  1114. db.commit()
  1115. db.refresh(ai_msg)
  1116. # 4. 发送 initial 事件
  1117. yield f"data: {json.dumps({'type': 'initial', 'ai_conversation_id': conv_id, 'ai_message_id': ai_msg.id}, ensure_ascii=False)}\n\n"
  1118. # 5. RAG search
  1119. rag_context = await _rag_search(message, top_k=10)
  1120. if data.business_type in (1, 2):
  1121. # PPT outline / AI writing: use dedicated prompt
  1122. prompt_name = "ppt_outline" if data.business_type == 1 else "document_writing"
  1123. system_content = load_prompt(
  1124. prompt_name,
  1125. userMessage=message,
  1126. contextJSON=rag_context if rag_context else "?????????"
  1127. )
  1128. messages = [
  1129. {"role": "user", "content": system_content},
  1130. ]
  1131. else:
  1132. # 6. History context (last 4 items, 2 turns)
  1133. history_msgs = (
  1134. db.query(AIMessage)
  1135. .filter(
  1136. AIMessage.ai_conversation_id == conv_id,
  1137. AIMessage.id < ai_msg.id,
  1138. AIMessage.is_deleted == 0,
  1139. )
  1140. .order_by(AIMessage.updated_at.desc())
  1141. .limit(4)
  1142. .all()
  1143. )
  1144. history_msgs.reverse()
  1145. history_context = ""
  1146. for msg in history_msgs:
  1147. role = "??" if msg.type == "user" else "??"
  1148. history_context += f"{role}: {msg.content}\n\n"
  1149. # 7. Build final prompt
  1150. context_parts = []
  1151. if rag_context:
  1152. context_parts.append(f"??????\n{rag_context}")
  1153. if data.online_search_content:
  1154. context_parts.append(f"???????\n{data.online_search_content}")
  1155. context_json = "\n\n".join(
  1156. context_parts) if context_parts else "?????????"
  1157. system_content = load_prompt(
  1158. "final_answer",
  1159. userMessage=message,
  1160. contextJSON=context_json,
  1161. historyContext=history_context if history_context else ""
  1162. )
  1163. messages = [
  1164. {"role": "user", "content": system_content},
  1165. ]
  1166. # 8. 流式输出并收集完整回复
  1167. full_response = ""
  1168. try:
  1169. summary_enabled = getattr(settings.thinking_summary, "enabled", True)
  1170. max_input_chars = getattr(settings.thinking_summary, "max_input_chars", 1500)
  1171. buffer = ""
  1172. pre_answer = ""
  1173. thinking_buf = ""
  1174. in_think = False
  1175. thinking_done = False
  1176. async for chunk in qwen_service.stream_chat(messages):
  1177. if not summary_enabled:
  1178. escaped_chunk = chunk.replace("\n", "\\n")
  1179. full_response += chunk
  1180. yield f"data: {escaped_chunk}\n\n"
  1181. continue
  1182. buffer += chunk
  1183. while buffer:
  1184. lower = buffer.lower()
  1185. if not thinking_done:
  1186. if not in_think:
  1187. start_idx = lower.find("<think>")
  1188. if start_idx == -1:
  1189. escaped_text = buffer.replace("\n", "\\n")
  1190. full_response += buffer
  1191. yield f"data: {escaped_text}\n\n"
  1192. buffer = ""
  1193. break
  1194. pre_answer += buffer[:start_idx]
  1195. buffer = buffer[start_idx + len("<think>") :]
  1196. in_think = True
  1197. continue
  1198. end_idx = lower.find("</think>")
  1199. if end_idx == -1:
  1200. if max_input_chars and len(thinking_buf) < max_input_chars:
  1201. thinking_buf += buffer[: max_input_chars - len(thinking_buf)]
  1202. buffer = ""
  1203. break
  1204. if max_input_chars and len(thinking_buf) < max_input_chars:
  1205. thinking_part = buffer[:end_idx]
  1206. thinking_buf += thinking_part[: max_input_chars - len(thinking_buf)]
  1207. buffer = buffer[end_idx + len("</think>") :]
  1208. in_think = False
  1209. thinking_done = True
  1210. thinking_summary = await summarize_thinking_content(
  1211. user_question=message,
  1212. raw_thinking=thinking_buf,
  1213. final_answer="",
  1214. chat_service=qwen_service,
  1215. context="stream_chat_with_db",
  1216. )
  1217. if thinking_summary:
  1218. prefix = f"思考过程:\n{thinking_summary}\n\n回答:\n"
  1219. full_response += prefix
  1220. escaped_prefix = prefix.replace('\n', '\\n')
  1221. yield f"data: {escaped_prefix}\n\n"
  1222. answer_chunk = (pre_answer + buffer).lstrip()
  1223. if answer_chunk:
  1224. full_response += answer_chunk
  1225. escaped_answer = answer_chunk.replace('\n', '\\n')
  1226. yield f"data: {escaped_answer}\n\n"
  1227. pre_answer = ""
  1228. buffer = ""
  1229. break
  1230. escaped_text = buffer.replace("\n", "\\n")
  1231. full_response += buffer
  1232. yield f"data: {escaped_text}\n\n"
  1233. buffer = ""
  1234. except Exception as e:
  1235. logger.error(f"[stream/chat-with-db] 流式输出异常: {e}")
  1236. yield f"data: {json.dumps({'error': str(e)}, ensure_ascii=False)}\n\n"
  1237. # 流结束但未遇到 </think>:仅尝试生成要点(不回退输出 raw thinking)
  1238. if summary_enabled and in_think and not thinking_done and thinking_buf:
  1239. thinking_summary = await summarize_thinking_content(
  1240. user_question=message,
  1241. raw_thinking=thinking_buf,
  1242. final_answer="",
  1243. chat_service=qwen_service,
  1244. context="stream_chat_with_db_eof",
  1245. )
  1246. if thinking_summary:
  1247. prefix = f"思考过程:\n{thinking_summary}\n\n回答:\n"
  1248. full_response += prefix
  1249. escaped_prefix = prefix.replace('\n', '\\n')
  1250. yield f"data: {escaped_prefix}\n\n"
  1251. if pre_answer:
  1252. full_response += pre_answer
  1253. escaped_pre_answer = pre_answer.replace('\n', '\\n')
  1254. yield f"data: {escaped_pre_answer}\n\n"
  1255. # 9. 更新 AI 消息内容
  1256. if full_response:
  1257. now_ts = int(time.time())
  1258. db.query(AIMessage).filter(AIMessage.id == ai_msg.id).update(
  1259. {"content": full_response, "updated_at": now_ts}
  1260. )
  1261. db.query(AIConversation).filter(
  1262. AIConversation.id == conv_id,
  1263. AIConversation.user_id == user.user_id,
  1264. ).update(
  1265. {
  1266. "content": _build_conversation_preview(message, limit=100),
  1267. "business_type": data.business_type,
  1268. "exam_name": data.exam_name if data.business_type == 3 else "",
  1269. "updated_at": now_ts,
  1270. }
  1271. )
  1272. db.commit()
  1273. # 10. 结束标记
  1274. yield "data: [DONE]\n\n"
  1275. except Exception as e:
  1276. logger.error(f"[stream/chat-with-db] 处理异常: {e}")
  1277. yield f"data: {json.dumps({'error': str(e)}, ensure_ascii=False)}\n\n"
  1278. finally:
  1279. db.close()
  1280. return StreamingResponse(event_generator(), media_type="text/event-stream")
  1281. # ─────────────────────────────────────────────────────────────────────────
  1282. # 猜你想问
  1283. # ─────────────────────────────────────────────────────────────────────────
class GuessYouWantRequest(BaseModel):
    """Request body for ``/guess_you_want``."""

    # Message whose content seeds the follow-up question suggestions.
    ai_message_id: int
  1286. @router.post("/guess_you_want")
  1287. async def guess_you_want(
  1288. request: Request,
  1289. data: GuessYouWantRequest,
  1290. db: Session = Depends(get_db),
  1291. ):
  1292. """生成"猜你想问"的3个关联问题,保存到 AIMessage.guess_you_want"""
  1293. user = request.state.user
  1294. if not user:
  1295. return {"statusCode": 401, "msg": "未授权"}
  1296. try:
  1297. ai_msg = (
  1298. db.query(AIMessage)
  1299. .filter(AIMessage.id == data.ai_message_id, AIMessage.is_deleted == 0)
  1300. .first()
  1301. )
  1302. if not ai_msg:
  1303. return {"statusCode": 404, "msg": "消息不存在"}
  1304. # 使用prompt加载器加载猜你想问prompt
  1305. system_content = load_prompt(
  1306. "guess_questions",
  1307. currentContent=ai_msg.content[:500]
  1308. )
  1309. messages = [
  1310. {"role": "user", "content": system_content},
  1311. ]
  1312. response = await qwen_service.chat(messages)
  1313. try:
  1314. # 尝试从响应中提取 JSON
  1315. json_match = re.search(
  1316. r'\{[^{}]*"questions"[^{}]*\}', response, re.DOTALL)
  1317. if json_match:
  1318. response_json = json.loads(json_match.group())
  1319. else:
  1320. response_json = json.loads(response)
  1321. questions = response_json.get("questions", [])
  1322. except Exception:
  1323. lines = [l.strip() for l in response.split("\n") if l.strip()]
  1324. questions = []
  1325. for line in lines:
  1326. clean = line.lstrip("0123456789.-、 ").strip()
  1327. if clean and len(clean) > 5:
  1328. questions.append(clean)
  1329. if not questions:
  1330. questions = ["该话题的具体应用场景?", "有哪些注意事项?", "相关案例分析?"]
  1331. questions = _finalize_related_questions(questions, ai_msg.content, limit=3)
  1332. guess_json = json.dumps({"questions": questions}, ensure_ascii=False)
  1333. db.query(AIMessage).filter(AIMessage.id == data.ai_message_id).update(
  1334. {"guess_you_want": guess_json, "updated_at": int(time.time())}
  1335. )
  1336. db.commit()
  1337. return {
  1338. "statusCode": 200,
  1339. "msg": "success",
  1340. "data": {"ai_message_id": data.ai_message_id, "questions": questions},
  1341. }
  1342. except Exception as e:
  1343. logger.error(f"[guess_you_want] 处理异常: {e}")
  1344. return {"statusCode": 500, "msg": f"处理失败: {str(e)}"}
  1345. # ─────────────────────────────────────────────────────────────────────────
  1346. # 在线搜索(Dify 工作流集成)
  1347. # ─────────────────────────────────────────────────────────────────────────
  1348. @router.get("/online_search")
  1349. async def online_search(question: str, request: Request, db: Session = Depends(get_db)):
  1350. """
  1351. 在线搜索
  1352. 流程:Qwen 提炼关键词 → Dify 工作流 → 返回摘要
  1353. """
  1354. user = request.state.user
  1355. if not user:
  1356. return {"statusCode": 401, "msg": "未授权"}
  1357. try:
  1358. keywords = await qwen_service.extract_keywords(question)
  1359. dify_config = getattr(settings, "dify", None)
  1360. if not dify_config or not getattr(dify_config, "workflow_url", None):
  1361. return {"statusCode": 500, "msg": "Dify 配置未设置"}
  1362. headers = {
  1363. "Authorization": f"Bearer {dify_config.auth_token}",
  1364. "Content-Type": "application/json",
  1365. }
  1366. payload = {
  1367. "workflow_id": dify_config.workflow_id,
  1368. "inputs": {
  1369. "keywords": keywords,
  1370. "num": 5, # 搜索结果数量
  1371. "max_text_len": 4000 # 最大文本长度
  1372. },
  1373. "response_mode": "blocking",
  1374. "user": getattr(user, "account", str(user.user_id)),
  1375. }
  1376. async with httpx.AsyncClient(timeout=30.0) as client:
  1377. resp = await client.post(dify_config.workflow_url, headers=headers, json=payload)
  1378. if resp.status_code != 200:
  1379. logger.error(
  1380. f"[online_search] Dify 调用失败: {resp.status_code}, 响应: {resp.text}")
  1381. return {"statusCode": 500, "msg": f"搜索服务异常: {resp.status_code}"}
  1382. result = resp.json()
  1383. search_text = result.get("data", {}).get(
  1384. "outputs", {}).get("text", "")
  1385. return {
  1386. "statusCode": 200,
  1387. "msg": "success",
  1388. "data": {"keywords": keywords, "result": search_text},
  1389. }
  1390. except Exception as e:
  1391. logger.error(f"[online_search] 处理异常: {e}")
  1392. return {"statusCode": 500, "msg": f"搜索失败: {str(e)}"}
class SaveOnlineSearchResultRequest(BaseModel):
    """Request body for ``/save_online_search_result``."""

    # Message that receives the search result.
    ai_message_id: int
    # Text stored verbatim in AIMessage.search_source.
    search_result: str
  1396. @router.post("/save_online_search_result")
  1397. async def save_online_search_result(
  1398. request: Request,
  1399. data: SaveOnlineSearchResultRequest,
  1400. db: Session = Depends(get_db),
  1401. ):
  1402. """保存联网搜索结果到 AIMessage.search_source"""
  1403. user = request.state.user
  1404. if not user:
  1405. return {"statusCode": 401, "msg": "未授权"}
  1406. try:
  1407. db.query(AIMessage).filter(AIMessage.id == data.ai_message_id).update(
  1408. {"search_source": data.search_result,
  1409. "updated_at": int(time.time())}
  1410. )
  1411. db.commit()
  1412. return {"statusCode": 200, "msg": "保存成功"}
  1413. except Exception as e:
  1414. logger.error(f"[save_online_search_result] 处理异常: {e}")
  1415. return {"statusCode": 500, "msg": f"保存失败: {str(e)}"}
  1416. # ─────────────────────────────────────────────────────────────────────────
  1417. # 意图识别独立接口
  1418. # ─────────────────────────────────────────────────────────────────────────
class IntentRecognitionRequest(BaseModel):
    """Request body for ``/intent_recognition``."""

    # Text whose intent should be classified.
    message: str
    # When True, greeting/FAQ exchanges are written to the database.
    save_to_db: bool = False
    # Conversation to append to when saving; 0 creates a new conversation.
    ai_conversation_id: int = 0
  1423. @router.post("/intent_recognition")
  1424. async def intent_recognition(
  1425. request: Request,
  1426. data: IntentRecognitionRequest,
  1427. db: Session = Depends(get_db),
  1428. ):
  1429. """独立意图识别接口;若为 greeting/faq 且 save_to_db=True 则直接存 DB"""
  1430. user = request.state.user
  1431. if not user:
  1432. return {"statusCode": 401, "msg": "未授权"}
  1433. try:
  1434. intent_result = await qwen_service.intent_recognition(data.message)
  1435. intent_type = ""
  1436. response_text = ""
  1437. if isinstance(intent_result, dict):
  1438. intent_type = (
  1439. intent_result.get("intent_type") or intent_result.get(
  1440. "intent") or ""
  1441. ).lower()
  1442. response_text = intent_result.get("response", "")
  1443. if data.save_to_db and intent_type in ("greeting", "问候", "faq", "常见问题"):
  1444. if data.ai_conversation_id == 0:
  1445. conversation = AIConversation(
  1446. user_id=user.user_id,
  1447. content=data.message[:100],
  1448. business_type=0,
  1449. created_at=int(time.time()),
  1450. updated_at=int(time.time()),
  1451. is_deleted=0,
  1452. )
  1453. db.add(conversation)
  1454. db.commit()
  1455. db.refresh(conversation)
  1456. conv_id = conversation.id
  1457. else:
  1458. conv_id = data.ai_conversation_id
  1459. user_msg = AIMessage(
  1460. ai_conversation_id=conv_id,
  1461. user_id=user.user_id,
  1462. type="user",
  1463. content=data.message,
  1464. created_at=int(time.time()),
  1465. updated_at=int(time.time()),
  1466. is_deleted=0,
  1467. )
  1468. db.add(user_msg)
  1469. db.commit()
  1470. ai_msg = AIMessage(
  1471. ai_conversation_id=conv_id,
  1472. user_id=user.user_id,
  1473. type="ai",
  1474. content=response_text,
  1475. prev_user_id=user_msg.id,
  1476. created_at=int(time.time()),
  1477. updated_at=int(time.time()),
  1478. is_deleted=0,
  1479. )
  1480. db.add(ai_msg)
  1481. db.commit()
  1482. db.refresh(ai_msg)
  1483. return {
  1484. "statusCode": 200,
  1485. "msg": "success",
  1486. "data": {
  1487. "intent_type": intent_type,
  1488. "response": response_text,
  1489. "ai_conversation_id": conv_id,
  1490. "ai_message_id": ai_msg.id,
  1491. "saved_to_db": True,
  1492. },
  1493. }
  1494. return {
  1495. "statusCode": 200,
  1496. "msg": "success",
  1497. "data": {
  1498. "intent_type": intent_type,
  1499. "response": response_text,
  1500. "saved_to_db": False,
  1501. },
  1502. }
  1503. except Exception as e:
  1504. logger.error(f"[intent_recognition] 处理异常: {e}")
  1505. return {"statusCode": 500, "msg": f"处理失败: {str(e)}"}
  1506. # ─────────────────────────────────────────────────────────────────────────
  1507. # 获取用户推荐问题(模糊查询 QA / RecommendQuestion 表)
  1508. # ─────────────────────────────────────────────────────────────────────────
  1509. @router.get("/get_user_recommend_question")
  1510. async def get_user_recommend_question(
  1511. keyword: str = "",
  1512. limit: int = 10,
  1513. db: Session = Depends(get_db),
  1514. ):
  1515. """获取推荐问题(支持模糊查询)"""
  1516. try:
  1517. query = db.query(RecommendQuestion).filter(
  1518. RecommendQuestion.is_deleted == 0)
  1519. if keyword:
  1520. query = query.filter(
  1521. RecommendQuestion.question.like(f"%{keyword}%"))
  1522. questions = query.order_by(
  1523. RecommendQuestion.id.desc()).limit(limit).all()
  1524. return {
  1525. "statusCode": 200,
  1526. "msg": "success",
  1527. "data": [
  1528. {"id": q.id, "question": q.question, "created_at": q.created_at}
  1529. for q in questions
  1530. ],
  1531. }
  1532. except Exception as e:
  1533. logger.error(f"[get_user_recommend_question] 处理异常: {e}")
  1534. return {"statusCode": 500, "msg": f"查询失败: {str(e)}"}
  1535. # ─────────────────────────────────────────────────────────────────────────
  1536. # PPT 大纲 / 文档编辑保存
  1537. # ─────────────────────────────────────────────────────────────────────────
class SavePPTOutlineRequest(BaseModel):
    """Request body for ``/save_ppt_outline``."""

    # Message whose content is replaced.
    ai_message_id: int
    # New content stored verbatim in AIMessage.content.
    content: str
  1541. @router.post("/save_ppt_outline")
  1542. async def save_ppt_outline(
  1543. request: Request,
  1544. data: SavePPTOutlineRequest,
  1545. db: Session = Depends(get_db),
  1546. ):
  1547. """更新 AIMessage.content 保存 PPT 大纲内容"""
  1548. user = request.state.user
  1549. if not user:
  1550. return {"statusCode": 401, "msg": "未授权"}
  1551. try:
  1552. db.query(AIMessage).filter(AIMessage.id == data.ai_message_id).update(
  1553. {"content": data.content, "updated_at": int(time.time())}
  1554. )
  1555. db.commit()
  1556. return {"statusCode": 200, "msg": "保存成功"}
  1557. except Exception as e:
  1558. logger.error(f"[save_ppt_outline] 处理异常: {e}")
  1559. return {"statusCode": 500, "msg": f"保存失败: {str(e)}"}
class SaveEditDocumentRequest(BaseModel):
    """Request body for ``/save_edit_document``."""

    # AI message whose content is replaced.
    ai_message_id: int
    # New content stored verbatim in AIMessage.content.
    content: str
  1563. @router.post("/save_edit_document")
  1564. async def save_edit_document(
  1565. request: Request,
  1566. data: SaveEditDocumentRequest,
  1567. db: Session = Depends(get_db),
  1568. ):
  1569. """更新 ai 类型 AIMessage.content(AI写作编辑保存)"""
  1570. user = request.state.user
  1571. if not user:
  1572. return {"statusCode": 401, "msg": "未授权"}
  1573. try:
  1574. db.query(AIMessage).filter(
  1575. AIMessage.id == data.ai_message_id,
  1576. AIMessage.type == "ai",
  1577. ).update({"content": data.content, "updated_at": int(time.time())})
  1578. db.commit()
  1579. return {"statusCode": 200, "msg": "保存成功"}
  1580. except Exception as e:
  1581. logger.error(f"[save_edit_document] 处理异常: {e}")
  1582. return {"statusCode": 500, "msg": f"保存失败: {str(e)}"}