Maas2-group
/
Maas-Model-platform


			
				
					
						
						
{
  "model_code": "qwen-plus",
  "model_intro": "Qwen3系列Plus模型，实现思考模式和非思考模式的有效融合，可在对话中切换模式。推理能力显著超过QwQ，通用能力显著超过Qwen2.5-Plus，达到同规模业界SOTA水平。",
  "model_tags": ["Qwen3", "深度思考", "文本生成"],
  "model_capabilities": {
    "input_modalities": ["text"],
    "output_modalities": ["text"],
    "features": {
      "model_experience": true,
      "function_calling": true,
      "structured_output": true,
      "web_search": true,
      "prefix_continuation": true,
      "cache": true,
      "batch_inference": true,
      "model_tuning": false
    }
  },
  "model_pricing": [
    {
      "input_range": "输入<=128K",
      "unit": "元/千tokens",
      "input": 0.0008,
      "input_thinking": 0.0008,
      "input_cache_hit": 0.00016,
      "input_cache_hit_thinking": 0.00016,
      "input_batch": 0.0004,
      "input_batch_thinking": 0.0004,
      "explicit_cache_create": 0.001,
      "explicit_cache_hit": 0.00008,
      "explicit_cache_create_thinking": 0.001,
      "explicit_cache_hit_thinking": 0.00008,
      "output": 0.002,
      "output_thinking": 0.008,
      "output_batch": 0.001,
      "output_thinking_batch": 0.004
    },
    {
      "input_range": "128K<输入<=256K",
      "unit": "元/千tokens",
      "input": 0.0024,
      "input_thinking": 0.0024,
      "input_cache_hit": 0.00048,
      "input_cache_hit_thinking": 0.00048,
      "input_batch": 0.0012,
      "input_batch_thinking": 0.0012,
      "explicit_cache_create": 0.003,
      "explicit_cache_hit": 0.00024,
      "explicit_cache_create_thinking": 0.003,
      "explicit_cache_hit_thinking": 0.00024,
      "output": 0.02,
      "output_thinking": 0.024,
      "output_batch": 0.01,
      "output_thinking_batch": 0.012
    },
    {
      "input_range": "256K<输入<=1M",
      "unit": "元/千tokens",
      "input": 0.0048,
      "input_thinking": 0.0048,
      "input_cache_hit": 0.00096,
      "input_cache_hit_thinking": 0.00096,
      "input_batch": 0.0024,
      "input_batch_thinking": 0.0024,
      "explicit_cache_create": 0.006,
      "explicit_cache_hit": 0.00048,
      "explicit_cache_create_thinking": 0.006,
      "explicit_cache_hit_thinking": 0.00048,
      "output": 0.048,
      "output_thinking": 0.064,
      "output_batch": 0.024,
      "output_thinking_batch": 0.032
    }
  ],
  "model_limits": {
    "max_input_length": "997K",
    "max_input_length_thinking": "995K",
    "max_output_length": "32K",
    "max_output_length_thinking": "32K",
    "max_thinking_length": "80K",
    "rpm": 15000,
    "tpm": 5000000,
    "context_length": "1M"
  },
  "api_examples": {
    "curl": [
      "curl -X POST https://dashscope.aliyuncs.com/compatible-mode/v1/chat/completions \\\n-H \"Authorization: Bearer $DASHSCOPE_API_KEY\" \\\n-H \"Content-Type: application/json\" \\\n-d '{\n    \"model\": \"qwen-plus\",\n    \"messages\": [\n        {\n            \"role\": \"user\", \n            \"content\": \"你是谁\"\n        }\n    ],\n    \"stream\": true,\n    \"enable_thinking\": true\n}'"
    ]
  }
}