qwen-vl-max.json 1.7 KB

{
  "model_code": "qwen-vl-max",
  "model_intro": "通义千问 VL-Max(qwen-vl-max),即通义千问超大规模视觉语言模型。相比增强版,再次提升视觉推理能力和指令遵循能力,提供更高的视觉感知和认知水平。在更多复杂任务上提供最佳的性能。",
  "model_tags": ["视觉理解"],
  "model_capabilities": {
    "input_modalities": ["text", "image", "video"],
    "output_modalities": ["text"],
    "features": {
      "model_experience": true,
      "function_calling": false,
      "structured_output": true,
      "web_search": false,
      "prefix_continuation": true,
      "cache": true,
      "batch_inference": true,
      "model_tuning": false
    }
  },
  "model_pricing": {
    "unit": "元/千tokens",
    "input": 0.0016,
    "input_cache_hit": 0.00032,
    "input_batch": 0.0008,
    "output": 0.004,
    "output_batch": 0.002,
    "tuning": 0.15
  },
  "model_limits": {
    "max_input_length": "126K",
    "max_output_length": "8K",
    "rpm": 1200,
    "tpm": 1000000,
    "context_length": "128K"
  },
  "api_examples": {
    "curl": [
      "curl --location 'https://dashscope.aliyuncs.com/compatible-mode/v1/chat/completions' \\\n--header \"Authorization: Bearer $DASHSCOPE_API_KEY\" \\\n--header 'Content-Type: application/json' \\\n--data '{\n \"model\": \"qwen-vl-max\",\n \"messages\": [\n {\n \"role\": \"user\",\n \"content\": [\n {\"type\": \"image_url\", \"image_url\": {\"url\": \"https://help-static-aliyun-doc.aliyuncs.com/file-manage-files/zh-CN/20241108/ctdzex/biaozhun.jpg\"}},\n {\"type\": \"text\", \"text\": \"请仅输出图像中的文本内容。\"}\n ]\n }]\n}'"
    ]
  }
}