test_thinking_mode_simple.py 2.9 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192
  1. #!/usr/bin/env python
  2. # -*- coding: utf-8 -*-
  3. """
  4. 简化版思考模式测试 - 快速验证
  5. 运行方式:
  6. cd D:/wx_work/sichuan_luqiao/LQAgentPlatform
  7. python utils_test/Model_Test/test_thinking_mode_simple.py
  8. """
  9. import asyncio
  10. import time
  11. import sys
  12. from pathlib import Path
  13. project_root = Path(__file__).parent.parent.parent
  14. sys.path.insert(0, str(project_root))
  15. from foundation.ai.agent.generate.model_generate import generate_model_client
  16. async def quick_test():
  17. """快速测试思考模式开关"""
  18. print("\n" + "=" * 60)
  19. print("快速测试: Qwen3.5 思考模式开关")
  20. print("=" * 60)
  21. # 测试 1: 默认禁用思考模式
  22. print("\n[Test 1] 默认禁用思考模式 (enable_thinking=False)")
  23. start = time.time()
  24. try:
  25. resp = await generate_model_client.get_model_generate_invoke(
  26. trace_id="test_quick_disabled",
  27. system_prompt="简洁回答",
  28. user_prompt="2+2=?",
  29. model_name="qwen3_5_35b_a3b",
  30. enable_thinking=False,
  31. timeout=60
  32. )
  33. elapsed = time.time() - start
  34. print(f" ✅ 成功 ({elapsed:.2f}s): {resp[:50]}...")
  35. assert elapsed < 60, f"响应时间过长: {elapsed:.2f}s,思考模式可能未禁用"
  36. except Exception as e:
  37. print(f" ❌ 失败: {e}")
  38. return False
  39. # 测试 2: 显式启用思考模式(可选,耗时较长)
  40. print("\n[Test 2] 显式启用思考模式 (enable_thinking=True) - 可选")
  41. print(" [跳过] 取消注释以下代码以运行")
  42. # start = time.time()
  43. # try:
  44. # resp = await generate_model_client.get_model_generate_invoke(
  45. # trace_id="test_quick_enabled",
  46. # system_prompt="详细推理后回答",
  47. # user_prompt="请解释勾股定理",
  48. # model_name="qwen3_5_35b_a3b",
  49. # enable_thinking=True,
  50. # timeout=180
  51. # )
  52. # elapsed = time.time() - start
  53. # print(f" ✅ 成功 ({elapsed:.2f}s): {resp[:100]}...")
  54. # except Exception as e:
  55. # print(f" ❌ 失败: {e}")
  56. # return False
  57. # 测试 3: 非 Qwen3.5 模型
  58. print("\n[Test 3] 非 Qwen3.5 模型")
  59. start = time.time()
  60. try:
  61. resp = await generate_model_client.get_model_generate_invoke(
  62. trace_id="test_quick_doubao",
  63. system_prompt="简洁回答",
  64. user_prompt="3+3=?",
  65. model_name="doubao-1.5-pro-256k",
  66. enable_thinking=False, # 应被忽略
  67. timeout=30
  68. )
  69. elapsed = time.time() - start
  70. print(f" ✅ 成功 ({elapsed:.2f}s): {resp[:50]}...")
  71. except Exception as e:
  72. print(f" ❌ 失败: {e}")
  73. return False
  74. print("\n" + "=" * 60)
  75. print("🎉 所有快速测试通过!")
  76. print("=" * 60 + "\n")
  77. return True
  78. if __name__ == "__main__":
  79. success = asyncio.run(quick_test())
  80. sys.exit(0 if success else 1)