qwen3-max.json 2.4 KB

{
  "model_code": "qwen3-max",
  "model_intro": "通义千问3系列 Max 模型,相较 preview 版本在智能体编程与工具调用方面进行了专项升级。本次发布的正式版模型达到领域 SOTA 水平,适配场景更加复杂的智能体需求。",
  "model_tags": ["Qwen3", "文本生成"],
  "model_capabilities": {
    "input_modalities": ["text"],
    "output_modalities": ["text"],
    "features": {
      "model_experience": true,
      "function_calling": true,
      "structured_output": true,
      "web_search": true,
      "prefix_continuation": true,
      "cache": true,
      "batch_inference": true,
      "model_tuning": false
    }
  },
  "model_pricing": [
    {
      "input_range": "输入<=32K",
      "unit": "元/千tokens",
      "input": 0.0025,
      "input_cache_hit": 0.0005,
      "input_batch": 0.00125,
      "output": 0.01,
      "output_batch": 0.005,
      "explicit_cache_create": 0.003125,
      "explicit_cache_hit": 0.00025
    },
    {
      "input_range": "32K<输入<=128K",
      "unit": "元/千tokens",
      "input": 0.004,
      "input_cache_hit": 0.0008,
      "input_batch": 0.002,
      "output": 0.016,
      "output_batch": 0.008,
      "explicit_cache_create": 0.005,
      "explicit_cache_hit": 0.0004
    },
    {
      "input_range": "128K<输入<=256K",
      "unit": "元/千tokens",
      "input": 0.007,
      "input_cache_hit": 0.0014,
      "input_batch": 0.0035,
      "output": 0.028,
      "output_batch": 0.014,
      "explicit_cache_create": 0.00875,
      "explicit_cache_hit": 0.0007
    }
  ],
  "tool_call_pricing": [
    {
      "tool": "search_strategy:agent",
      "unit": "元/千次调用",
      "price": 4
    }
  ],
  "model_limits": {
    "max_input_length": "252K",
    "max_output_length": "64K",
    "rpm": 600,
    "tpm": 1000000,
    "context_length": "256K"
  },
  "api_examples": {
    "curl": [
      "curl -X POST https://dashscope.aliyuncs.com/compatible-mode/v1/chat/completions \\\n-H \"Authorization: Bearer $DASHSCOPE_API_KEY\" \\\n-H \"Content-Type: application/json\" \\\n-d '{\n \"model\": \"qwen3-max\",\n \"messages\": [\n {\n \"role\": \"system\",\n \"content\": \"You are a helpful assistant.\"\n },\n {\n \"role\": \"user\",\n \"content\": \"你是谁?\"\n }\n ],\n \"stream\": true\n}'"
    ]
  }
}