# model_setting.yaml 3.9 KB

  # Model feature configuration.
  # Selects the model and parameters used by each functional module.
  #
  # List of available models. Every name here must match a model type name
  # in model_handler.py.
  # Reference: foundation/ai/models/model_handler.py
  available_models:
    # DashScope family
    # NOTE(review): the first entry is labelled as the default fallback model;
    # the fallback logic itself is not visible in this file - confirm.
    - qwen3_5_35b_a3b  # DashScope Qwen3.5-35B-A3B (default fallback model)
    - qwen3_5_27b  # DashScope Qwen3.5-27B
    - qwen3_5_122b_a10b  # DashScope Qwen3.5-122B-A10B

    # Doubao family
    - doubao  # Doubao model
    - doubao-1.5-pro-256k  # Doubao 1.5 Pro
    - doubao-1.5-lite-32k  # Doubao 1.5 Lite

    # DeepSeek family
    - deepseek  # DeepSeek model
    - deepseek-v3  # DeepSeek V3

    # Locally hosted models
    - lq_qwen3_8b  # local Qwen3-8B
    - lq_qwen3_8b_lq_lora  # local Qwen3-8B-lq-lora
    - lq_qwen3_4b  # local Qwen3-4B
    - qwen_local_14b  # local Qwen3-14B

    # Shutian compute family
    - shutian_qwen3_5_122b  # Shutian Qwen3.5-122B
    - shutian_qwen3_8b  # Shutian Qwen3-8B
    - shutian_qwen3_5_35b  # Shutian Qwen3.5-35B

    # Embedding models
    - lq_qwen3_8b_emd  # local Qwen3-Embedding-8B
    - siliconflow_embed  # SiliconFlow embedding
    - shutian_qwen3_embed  # Shutian embedding

    # Reranker models
    - lq_bge_reranker_v2_m3  # BGE-reranker-v2-m3
    - shutian_qwen3_reranker  # Shutian reranker
  # Per-feature model configuration.
  # Each entry maps a feature name to the model it uses, whether thinking mode
  # is enabled, and a human-readable description.
  model_settings:
    # Document classification - level 1 (classifies on the full section title)
    doc_classification_primary:
      model: shutian_qwen3_5_35b
      enable_thinking: false
      description: "文档一级分类,使用章节标题,蜀天35B"

    # Document classification - level 2 (needs fast responses)
    # NOTE(review): the description previously said "蜀天35B" while the
    # configured model is the 122B one; the description now matches the
    # model. Given the fast-response requirement, confirm that 122B (and not
    # shutian_qwen3_5_35b) is really the intended model here.
    doc_classification_secondary:
      model: shutian_qwen3_5_122b
      enable_thinking: false
      description: "文档二级分类,蜀天122B"

    # Document classification - level 3 (high-precision, line-level)
    doc_classification_tertiary:
      model: shutian_qwen3_5_122b
      enable_thinking: false
      description: "文档三级分类,蜀天122B"

    # Document classification - level 3, complex paragraphs
    # (a stronger model may be chosen here)
    doc_classification_tertiary_complex:
      model: shutian_qwen3_5_122b
      enable_thinking: false
      description: "文档三级分类-复杂段落,蜀天122B"

    # Completeness review - content generation
    completeness_review_generate:
      model: shutian_qwen3_5_122b
      enable_thinking: false
      description: "完整性审查内容生成,蜀天122B"

    # Completeness review - classification
    completeness_review_classify:
      model: shutian_qwen3_5_35b
      enable_thinking: false
      description: "完整性审查快速分类,蜀天35B"

    # RAG retrieval - query understanding
    rag_query_understand:
      model: shutian_qwen3_5_35b
      enable_thinking: false
      description: "RAG查询理解,蜀天35B"

    # RAG retrieval - answer generation
    rag_answer_generate:
      model: shutian_qwen3_5_122b
      enable_thinking: false
      description: "RAG答案生成,蜀天122B"

    # Sensitive-information check
    sensitive_check:
      model: shutian_qwen3_5_35b
      enable_thinking: false
      description: "敏感信息快速检查,蜀天35B"

    # Grammar check
    grammar_check:
      model: shutian_qwen3_5_35b
      enable_thinking: false
      description: "语法快速检查,蜀天35B"

    # Timeliness review
    timeliness_review:
      model: shutian_qwen3_5_35b
      enable_thinking: false
      description: "时效性审查,蜀天35B"

    # Normative review (reference matching)
    reference_review:
      model: shutian_qwen3_5_35b
      enable_thinking: false
      description: "规范性审查(引用匹配),蜀天35B"

    # Extraction for timeliness/normative review (table-of-contents extraction)
    directory_extraction:
      model: shutian_qwen3_5_35b
      enable_thinking: false
      description: "时效规范审查抽取(目录提取),蜀天35B"

    # Embedding model (used for similarity computation)
    embedding:
      model: lq_qwen3_8b_emd
      description: "文本Embedding向量生成"

    # Default configuration (used when a feature has no entry of its own)
    # NOTE(review): nesting `default` under model_settings is reconstructed
    # from context; confirm against the loader in case it expects a
    # top-level `default` key.
    default:
      model: shutian_qwen3_5_35b
      enable_thinking: false