| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566 |
- {
- "model_code": "qwen-flash",
- "model_intro": "Qwen3系列Flash模型,实现思考模式和非思考模式的有效融合,可在对话中切换模式。复杂推理类任务性能优秀,指令遵循、文本理解等能力显著提高。支持1M上下文长度,按照上下文长度进行阶梯计费。",
- "model_tags": ["Qwen3", "深度思考", "文本生成"],
- "model_capabilities": {
- "input_modalities": ["text"],
- "output_modalities": ["text"],
- "features": {
- "model_experience": true,
- "function_calling": true,
- "structured_output": true,
- "web_search": true,
- "prefix_continuation": true,
- "cache": true,
- "batch_inference": true,
- "model_tuning": false
- }
- },
- "model_pricing": [
- {
- "input_range": "输入<=128K",
- "unit": "元/千tokens",
- "input": 0.00015,
- "input_cache_hit": 0.00003,
- "input_batch": 0.000075,
- "output": 0.0015,
- "output_batch": 0.00075,
- "explicit_cache_create": 0.0001875,
- "explicit_cache_hit": 0.000015
- },
- {
- "input_range": "128K<输入<=256K",
- "unit": "元/千tokens",
- "input": 0.0006,
- "input_cache_hit": 0.00012,
- "input_batch": 0.0003,
- "output": 0.006,
- "output_batch": 0.003,
- "explicit_cache_create": 0.00075,
- "explicit_cache_hit": 0.00006
- },
- {
- "input_range": "256K<输入<=1M",
- "unit": "元/千tokens",
- "input": 0.0012,
- "input_cache_hit": 0.00024,
- "input_batch": 0.0006,
- "output": 0.012,
- "output_batch": 0.006,
- "explicit_cache_create": 0.0015,
- "explicit_cache_hit": 0.00012
- }
- ],
- "model_limits": {
- "max_input_length": "997K",
- "max_output_length": "32K",
- "rpm": 15000,
- "tpm": 10000000,
- "context_length": "1M"
- },
- "api_examples": {
- "curl": [
- "curl -X POST https://dashscope.aliyuncs.com/compatible-mode/v1/chat/completions \\\n-H \"Authorization: Bearer $DASHSCOPE_API_KEY\" \\\n-H \"Content-Type: application/json\" \\\n-d '{\n \"model\": \"qwen-flash\",\n \"messages\": [\n {\n \"role\": \"user\", \n \"content\": \"你是谁\"\n }\n ],\n \"stream\": true,\n \"enable_thinking\": true\n}'"
- ]
- }
- }
|