qwen-plus.json 3.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990
  1. {
  2. "model_code": "qwen-plus",
  3. "model_intro": "Qwen3系列Plus模型,实现思考模式和非思考模式的有效融合,可在对话中切换模式。推理能力显著超过QwQ,通用能力显著超过Qwen2.5-Plus,达到同规模业界SOTA水平。",
  4. "model_tags": ["Qwen3", "深度思考", "文本生成"],
  5. "model_capabilities": {
  6. "input_modalities": ["text"],
  7. "output_modalities": ["text"],
  8. "features": {
  9. "model_experience": true,
  10. "function_calling": true,
  11. "structured_output": true,
  12. "web_search": true,
  13. "prefix_continuation": true,
  14. "cache": true,
  15. "batch_inference": true,
  16. "model_tuning": false
  17. }
  18. },
  19. "model_pricing": [
  20. {
  21. "input_range": "输入<=128K",
  22. "unit": "元/千tokens",
  23. "input": 0.0008,
  24. "input_thinking": 0.0008,
  25. "input_cache_hit": 0.00016,
  26. "input_cache_hit_thinking": 0.00016,
  27. "input_batch": 0.0004,
  28. "input_batch_thinking": 0.0004,
  29. "explicit_cache_create": 0.001,
  30. "explicit_cache_hit": 0.00008,
  31. "explicit_cache_create_thinking": 0.001,
  32. "explicit_cache_hit_thinking": 0.00008,
  33. "output": 0.002,
  34. "output_thinking": 0.008,
  35. "output_batch": 0.001,
  36. "output_thinking_batch": 0.004
  37. },
  38. {
  39. "input_range": "128K<输入<=256K",
  40. "unit": "元/千tokens",
  41. "input": 0.0024,
  42. "input_thinking": 0.0024,
  43. "input_cache_hit": 0.00048,
  44. "input_cache_hit_thinking": 0.00048,
  45. "input_batch": 0.0012,
  46. "input_batch_thinking": 0.0012,
  47. "explicit_cache_create": 0.003,
  48. "explicit_cache_hit": 0.00024,
  49. "explicit_cache_create_thinking": 0.003,
  50. "explicit_cache_hit_thinking": 0.00024,
  51. "output": 0.02,
  52. "output_thinking": 0.024,
  53. "output_batch": 0.01,
  54. "output_thinking_batch": 0.012
  55. },
  56. {
  57. "input_range": "256K<输入<=1M",
  58. "unit": "元/千tokens",
  59. "input": 0.0048,
  60. "input_thinking": 0.0048,
  61. "input_cache_hit": 0.00096,
  62. "input_cache_hit_thinking": 0.00096,
  63. "input_batch": 0.0024,
  64. "input_batch_thinking": 0.0024,
  65. "explicit_cache_create": 0.006,
  66. "explicit_cache_hit": 0.00048,
  67. "explicit_cache_create_thinking": 0.006,
  68. "explicit_cache_hit_thinking": 0.00048,
  69. "output": 0.048,
  70. "output_thinking": 0.064,
  71. "output_batch": 0.024,
  72. "output_thinking_batch": 0.032
  73. }
  74. ],
  75. "model_limits": {
  76. "max_input_length": "997K",
  77. "max_input_length_thinking": "995K",
  78. "max_output_length": "32K",
  79. "max_output_length_thinking": "32K",
  80. "max_thinking_length": "80K",
  81. "rpm": 15000,
  82. "tpm": 5000000,
  83. "context_length": "1M"
  84. },
  85. "api_examples": {
  86. "curl": [
  87. "curl -X POST https://dashscope.aliyuncs.com/compatible-mode/v1/chat/completions \\\n-H \"Authorization: Bearer $DASHSCOPE_API_KEY\" \\\n-H \"Content-Type: application/json\" \\\n-d '{\n \"model\": \"qwen-plus\",\n \"messages\": [\n {\n \"role\": \"user\", \n \"content\": \"你是谁\"\n }\n ],\n \"stream\": true,\n \"enable_thinking\": true\n}'"
  88. ]
  89. }
  90. }