@lobehub/chat

Version:

Lobe Chat - an open-source, high-performance chatbot framework that supports speech synthesis, multimodal input, and an extensible Function Call plugin system. It supports one-click free deployment of your private ChatGPT/LLM web application.

github.com/lobehub/lobe-chat

lobehub/lobe-chat

1,850 lines (1,848 loc) • 72.5 kB

text/typescript

import { AIChatModelCard, AIImageModelCard } from '../types/aiModel'; // https://help.aliyun.com/zh/model-studio/models?spm=a2c4g.11186623 const qwenChatModels: AIChatModelCard[] = [ { abilities: { reasoning: true, vision: true, }, config: { deploymentName: 'qwen3-vl-plus', }, contextWindowTokens: 262_144, description: '通义千问VL是具有视觉（图像）理解能力的文本生成模型，不仅能进行OCR（图片文字识别），还能进一步总结和推理，例如从商品照片中提取属性，根据习题图进行解题等。', displayName: 'Qwen3 VL Plus', id: 'qwen3-vl-plus', maxOutput: 32_768, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { lookup: { prices: { '[0, 0.032]': 1, '[0.032, 0.128]': 1.5, '[0.128, infinity]': 3, }, pricingParams: ['textInputRange'], }, name: 'textInput', strategy: 'lookup', unit: 'millionTokens', }, { lookup: { prices: { '[0, 0.032]': 10, '[0.032, 0.128]': 15, '[0.128, infinity]': 30, }, pricingParams: ['textInputRange'], }, name: 'textOutput', strategy: 'lookup', unit: 'millionTokens', }, ], }, releasedAt: '2025-09-23', settings: { extendParams: ['enableReasoning', 'reasoningBudgetToken'], }, type: 'chat', }, { abilities: { reasoning: true, vision: true, }, config: { deploymentName: 'qwen3-vl-flash-2025-10-15', }, contextWindowTokens: 262_144, description: 'Qwen3 VL Flash：轻量化高速推理版本，适合对延迟敏感或大批量请求场景。', displayName: 'Qwen3 VL Flash', id: 'qwen3-vl-flash', maxOutput: 32_768, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { lookup: { prices: { '[0, 0.032]': 0.15, '[0.032, 0.128]': 0.3, '[0.128, 0.256]': 0.6, }, pricingParams: ['textInputRange'], }, name: 'textInput', strategy: 'lookup', unit: 'millionTokens', }, { lookup: { prices: { '[0, 0.032]': 1.5, '[0.032, 0.128]': 3, '[0.128, 0.256]': 6, }, pricingParams: ['textInputRange'], }, name: 'textOutput', strategy: 'lookup', unit: 'millionTokens', }, ], }, releasedAt: '2025-10-15', settings: { extendParams: ['enableReasoning', 'reasoningBudgetToken'], }, type: 'chat', }, { abilities: { reasoning: true, }, contextWindowTokens: 131_072, description: 'deepseek-v3.2-exp 
引入稀疏注意力机制，旨在提升处理长文本时的训练与推理效率，价格低于 deepseek-v3.1。', displayName: 'DeepSeek V3.2 Exp', id: 'deepseek-v3.2-exp', maxOutput: 65_536, pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' }, ], }, settings: { extendParams: ['enableReasoning', 'reasoningBudgetToken'], }, type: 'chat', }, { abilities: { reasoning: true, }, contextWindowTokens: 131_072, description: 'DeepSeek V3.1 模型为混合推理架构模型，同时支持思考模式与非思考模式。', displayName: 'DeepSeek V3.1', id: 'deepseek-v3.1', maxOutput: 65_536, pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 4, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 12, strategy: 'fixed', unit: 'millionTokens' }, ], }, settings: { extendParams: ['enableReasoning', 'reasoningBudgetToken'], }, type: 'chat', }, { abilities: { search: true, }, contextWindowTokens: 131_072, description: '总参数 1T，激活参数 32B。非思维模型中，在前沿知识、数学和编码方面达到了顶尖水平，更擅长通用 Agent 任务。针对代理任务进行了精心优化，不仅能回答问题，还能采取行动。最适用于即兴、通用聊天和代理体验，是一款无需长时间思考的反射级模型。', displayName: 'Kimi K2 Instruct', id: 'Moonshot-Kimi-K2-Instruct', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 4, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 16, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-07-17', settings: { searchImpl: 'params', }, type: 'chat', }, { abilities: { reasoning: true, }, contextWindowTokens: 131_072, description: 'GLM-4.5系列模型是智谱AI专为智能体设计的混合推理模型，提供思考与非思考两种模式。', displayName: 'GLM-4.5', id: 'glm-4.5', maxOutput: 16_384, pricing: { currency: 'CNY', units: [ { lookup: { prices: { '[0, 0.032]': 3, '[0.032, infinity]': 4, }, pricingParams: ['textInputRange'], }, name: 'textInput', strategy: 'lookup', unit: 'millionTokens', }, { lookup: { prices: { '[0, 0.032]': 14, '[0.032, infinity]': 16, }, pricingParams: ['textInputRange'], }, name: 'textOutput', strategy: 
'lookup', unit: 'millionTokens', }, ], }, settings: { extendParams: ['enableReasoning', 'reasoningBudgetToken'], }, type: 'chat', }, { abilities: { reasoning: true, }, contextWindowTokens: 131_072, description: 'GLM-4.5系列模型是智谱AI专为智能体设计的混合推理模型，提供思考与非思考两种模式。', displayName: 'GLM-4.5-Air', id: 'glm-4.5-air', maxOutput: 16_384, pricing: { currency: 'CNY', units: [ { lookup: { prices: { '[0, 0.032]': 0.8, '[0.032, infinity]': 1.2, }, pricingParams: ['textInputRange'], }, name: 'textInput', strategy: 'lookup', unit: 'millionTokens', }, { lookup: { prices: { '[0, 0.032]': 6, '[0.032, infinity]': 8, }, pricingParams: ['textInputRange'], }, name: 'textOutput', strategy: 'lookup', unit: 'millionTokens', }, ], }, settings: { extendParams: ['enableReasoning', 'reasoningBudgetToken'], }, type: 'chat', }, { abilities: { functionCall: true, }, config: { deploymentName: 'qwen3-coder-plus', // 支持上下文缓存 }, contextWindowTokens: 1_000_000, description: '通义千问代码模型。最新的 Qwen3-Coder 系列模型是基于 Qwen3 的代码生成模型，具有强大的Coding Agent能力，擅长工具调用和环境交互，能够实现自主编程，代码能力卓越的同时兼具通用能力。', displayName: 'Qwen3 Coder Plus', id: 'qwen3-coder-plus', maxOutput: 65_536, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { lookup: { prices: { '[0, 0.032]': 4 * 0.2, '[0.032, 0.128]': 6 * 0.2, '[0.128, 0.256]': 10 * 0.2, '[0.256, infinity]': 20 * 0.2, }, pricingParams: ['textInputRange'], }, name: 'textInput_cacheRead', strategy: 'lookup', unit: 'millionTokens', }, { lookup: { prices: { '[0, 0.032]': 4, '[0.032, 0.128]': 6, '[0.128, 0.256]': 10, '[0.256, infinity]': 20, }, pricingParams: ['textInputRange'], }, name: 'textInput', strategy: 'lookup', unit: 'millionTokens', }, { lookup: { prices: { '[0, 0.032]': 16, '[0.032, 0.128]': 24, '[0.128, 0.256]': 40, '[0.256, infinity]': 200, }, pricingParams: ['textInputRange'], }, name: 'textOutput', strategy: 'lookup', unit: 'millionTokens', }, ], }, type: 'chat', }, { abilities: { functionCall: true, }, config: { deploymentName: 'qwen3-coder-flash', // 支持上下文缓存 }, 
contextWindowTokens: 1_000_000, description: '通义千问代码模型。最新的 Qwen3-Coder 系列模型是基于 Qwen3 的代码生成模型，具有强大的Coding Agent能力，擅长工具调用和环境交互，能够实现自主编程，代码能力卓越的同时兼具通用能力。', displayName: 'Qwen3 Coder Flash', id: 'qwen3-coder-flash', maxOutput: 65_536, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { lookup: { prices: { '[0, 0.032]': 0.2, '[0.032, 0.128]': 0.3, '[0.128, 0.256]': 0.5, '[0.256, 1]': 1, }, pricingParams: ['textInputRange'], }, name: 'textInput_cacheRead', strategy: 'lookup', unit: 'millionTokens', }, { lookup: { prices: { '[0, 0.032]': 1, '[0.032, 0.128]': 1.5, '[0.128, 0.256]': 2.5, '[0.256, 1]': 5, }, pricingParams: ['textInputRange'], }, name: 'textInput', strategy: 'lookup', unit: 'millionTokens', }, { lookup: { prices: { '[0, 0.032]': 4, '[0.032, 0.128]': 6, '[0.128, 0.256]': 10, '[0.256, 1]': 25, }, pricingParams: ['textInputRange'], }, name: 'textOutput', strategy: 'lookup', unit: 'millionTokens', }, ], }, type: 'chat', }, { abilities: { functionCall: true, }, contextWindowTokens: 262_144, description: '通义千问代码模型开源版。最新的 qwen3-coder-480b-a35b-instruct 是基于 Qwen3 的代码生成模型，具有强大的Coding Agent能力，擅长工具调用和环境交互，能够实现自主编程、代码能力卓越的同时兼具通用能力。', displayName: 'Qwen3 Coder 480B A35B', id: 'qwen3-coder-480b-a35b-instruct', maxOutput: 65_536, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { lookup: { prices: { '[0, 0.032]': 6, '[0.032, 0.128]': 9, '[0.128, 0.2]': 15, }, pricingParams: ['textInputRange'], }, name: 'textInput', strategy: 'lookup', unit: 'millionTokens', }, { lookup: { prices: { '[0, 0.032]': 24, '[0.032, 0.128]': 36, '[0.128, 0.2]': 60, }, pricingParams: ['textInputRange'], }, name: 'textOutput', strategy: 'lookup', unit: 'millionTokens', }, ], }, type: 'chat', }, { abilities: { functionCall: true, }, contextWindowTokens: 262_144, description: '通义千问代码模型开源版。最新的 qwen3-coder-30b-a3b-instruct 是基于 Qwen3 的代码生成模型，具有强大的Coding Agent能力，擅长工具调用和环境交互，能够实现自主编程、代码能力卓越的同时兼具通用能力。', displayName: 'Qwen3 Coder 30B A3B', id: 'qwen3-coder-30b-a3b-instruct', maxOutput: 
65_536, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { lookup: { prices: { '[0, 0.032]': 1.5, '[0.032, 0.128]': 2.25, '[0.128, 0.2]': 3.75, }, pricingParams: ['textInputRange'], }, name: 'textInput', strategy: 'lookup', unit: 'millionTokens', }, { lookup: { prices: { '[0, 0.032]': 6, '[0.032, 0.128]': 9, '[0.128, 0.2]': 15, }, pricingParams: ['textInputRange'], }, name: 'textOutput', strategy: 'lookup', unit: 'millionTokens', }, ], }, type: 'chat', }, { abilities: { functionCall: true, reasoning: true, }, contextWindowTokens: 131_072, description: '基于Qwen3的思考模式开源模型，相较上一版本（通义千问3-235B-A22B）逻辑能力、通用能力、知识增强及创作能力均有大幅提升，适用于高难度强推理场景。', displayName: 'Qwen3 235B A22B Thinking 2507', enabled: true, id: 'qwen3-235b-a22b-thinking-2507', maxOutput: 32_768, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 20, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-07-25', settings: { extendParams: ['reasoningBudgetToken'], }, type: 'chat', }, { abilities: { functionCall: true, }, contextWindowTokens: 131_072, description: '基于Qwen3的非思考模式开源模型，相较上一版本（通义千问3-235B-A22B）主观创作能力与模型安全性均有小幅度提升。', displayName: 'Qwen3 235B A22B Instruct 2507', enabled: true, id: 'qwen3-235b-a22b-instruct-2507', maxOutput: 32_768, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 8, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-07-22', type: 'chat', }, { abilities: { functionCall: true, reasoning: true, }, contextWindowTokens: 131_072, description: '基于Qwen3的思考模式开源模型，相较上一版本（通义千问3-30B-A3B）逻辑能力、通用能力、知识增强及创作能力均有大幅提升，适用于高难度强推理场景。', displayName: 'Qwen3 30B A3B Thinking 2507', id: 'qwen3-30b-a3b-thinking-2507', maxOutput: 32_768, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 0.75, strategy: 'fixed', unit: 
'millionTokens' }, { name: 'textOutput', rate: 7.5, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-07-30', settings: { extendParams: ['reasoningBudgetToken'], }, type: 'chat', }, { abilities: { functionCall: true, }, contextWindowTokens: 131_072, description: '相较上一版本（Qwen3-30B-A3B）中英文和多语言整体通用能力有大幅提升。主观开放类任务专项优化，显著更加符合用户偏好，能够提供更有帮助性的回复。', displayName: 'Qwen3 30B A3B Instruct 2507', id: 'qwen3-30b-a3b-instruct-2507', maxOutput: 32_768, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 0.75, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-07-29', type: 'chat', }, { abilities: { functionCall: true, reasoning: true, }, contextWindowTokens: 131_072, description: '基于 Qwen3 的新一代思考模式开源模型，相较上一版本（通义千问3-235B-A22B-Thinking-2507）指令遵循能力有提升、模型总结回复更加精简。', displayName: 'Qwen3 Next 80B A3B Thinking', id: 'qwen3-next-80b-a3b-thinking', maxOutput: 32_768, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 1, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 10, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-09-12', settings: { extendParams: ['reasoningBudgetToken'], }, type: 'chat', }, { abilities: { functionCall: true, }, contextWindowTokens: 131_072, description: '基于 Qwen3 的新一代非思考模式开源模型，相较上一版本（通义千问3-235B-A22B-Instruct-2507）中文文本理解能力更佳、逻辑推理能力有增强、文本生成类任务表现更好。', displayName: 'Qwen3 Next 80B A3B Instruct', id: 'qwen3-next-80b-a3b-instruct', maxOutput: 32_768, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 1, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 4, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-09-12', type: 'chat', }, { abilities: { functionCall: true, reasoning: true, }, contextWindowTokens: 131_072, description: 
'Qwen3是一款能力大幅提升的新一代通义千问大模型，在推理、通用、Agent和多语言等多个核心能力上均达到业界领先水平，并支持思考模式切换。', displayName: 'Qwen3 235B A22B', id: 'qwen3-235b-a22b', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 20, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-04-28', settings: { extendParams: ['enableReasoning', 'reasoningBudgetToken'], }, type: 'chat', }, { abilities: { functionCall: true, reasoning: true, }, contextWindowTokens: 131_072, description: 'Qwen3是一款能力大幅提升的新一代通义千问大模型，在推理、通用、Agent和多语言等多个核心能力上均达到业界领先水平，并支持思考模式切换。', displayName: 'Qwen3 32B', id: 'qwen3-32b', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 20, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-04-28', settings: { extendParams: ['enableReasoning', 'reasoningBudgetToken'], }, type: 'chat', }, { abilities: { functionCall: true, reasoning: true, }, contextWindowTokens: 131_072, description: 'Qwen3是一款能力大幅提升的新一代通义千问大模型，在推理、通用、Agent和多语言等多个核心能力上均达到业界领先水平，并支持思考模式切换。', displayName: 'Qwen3 30B A3B', id: 'qwen3-30b-a3b', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 0.75, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 7.5, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-04-28', settings: { extendParams: ['enableReasoning', 'reasoningBudgetToken'], }, type: 'chat', }, { abilities: { functionCall: true, reasoning: true, }, contextWindowTokens: 131_072, description: 'Qwen3是一款能力大幅提升的新一代通义千问大模型，在推理、通用、Agent和多语言等多个核心能力上均达到业界领先水平，并支持思考模式切换。', displayName: 'Qwen3 14B', id: 'qwen3-14b', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 1, strategy: 'fixed', unit: 'millionTokens' }, { name: 
'textOutput', rate: 10, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-04-28', settings: { extendParams: ['enableReasoning', 'reasoningBudgetToken'], }, type: 'chat', }, { abilities: { functionCall: true, reasoning: true, }, contextWindowTokens: 131_072, description: 'Qwen3是一款能力大幅提升的新一代通义千问大模型，在推理、通用、Agent和多语言等多个核心能力上均达到业界领先水平，并支持思考模式切换。', displayName: 'Qwen3 8B', id: 'qwen3-8b', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 0.5, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 5, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-04-28', settings: { extendParams: ['enableReasoning', 'reasoningBudgetToken'], }, type: 'chat', }, { abilities: { functionCall: true, reasoning: true, }, contextWindowTokens: 131_072, description: 'Qwen3是一款能力大幅提升的新一代通义千问大模型，在推理、通用、Agent和多语言等多个核心能力上均达到业界领先水平，并支持思考模式切换。', displayName: 'Qwen3 4B', id: 'qwen3-4b', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 0.3, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-04-28', settings: { extendParams: ['enableReasoning', 'reasoningBudgetToken'], }, type: 'chat', }, { abilities: { functionCall: true, reasoning: true, }, contextWindowTokens: 32_768, description: 'Qwen3是一款能力大幅提升的新一代通义千问大模型，在推理、通用、Agent和多语言等多个核心能力上均达到业界领先水平，并支持思考模式切换。', displayName: 'Qwen3 1.7B', id: 'qwen3-1.7b', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 0.3, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-04-28', settings: { extendParams: ['enableReasoning', 'reasoningBudgetToken'], }, type: 'chat', }, { abilities: { functionCall: true, reasoning: true, }, contextWindowTokens: 32_768, description: 
'Qwen3是一款能力大幅提升的新一代通义千问大模型，在推理、通用、Agent和多语言等多个核心能力上均达到业界领先水平，并支持思考模式切换。', displayName: 'Qwen3 0.6B', id: 'qwen3-0.6b', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 0.3, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-04-28', settings: { extendParams: ['enableReasoning', 'reasoningBudgetToken'], }, type: 'chat', }, { abilities: { functionCall: true, reasoning: true, search: true, }, config: { deploymentName: 'qwq-plus-2025-03-05', }, contextWindowTokens: 131_072, description: '基于 Qwen2.5 模型训练的 QwQ 推理模型，通过强化学习大幅度提升了模型推理能力。模型数学代码等核心指标（AIME 24/25、LiveCodeBench）以及部分通用指标（IFEval、LiveBench等）达到DeepSeek-R1 满血版水平。', displayName: 'QwQ Plus', id: 'qwq-plus', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 1.6, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 4, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-03-05', settings: { searchImpl: 'params', }, type: 'chat', }, { abilities: { functionCall: true, reasoning: true, search: true, }, config: { deploymentName: 'qwen-flash', }, contextWindowTokens: 1_000_000, description: '通义千问系列速度最快、成本极低的模型，适合简单任务。', displayName: 'Qwen Flash', enabled: true, id: 'qwen-flash', maxOutput: 32_768, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', strategy: 'tiered', tiers: [ { rate: 0.15, upTo: 0.128 }, { rate: 0.6, upTo: 0.256 }, { rate: 1.2, upTo: 'infinity' }, ], unit: 'millionTokens', }, { name: 'textOutput', strategy: 'tiered', tiers: [ { rate: 1.5, upTo: 0.128 }, { rate: 6, upTo: 0.256 }, { rate: 12, upTo: 'infinity' }, ], unit: 'millionTokens', }, { name: 'textInput_cacheRead', strategy: 'tiered', tiers: [ { rate: 0.15 * 0.2, upTo: 0.128 }, { rate: 0.6 * 0.2, upTo: 0.256 }, { rate: 1.2 * 0.2, upTo: 'infinity' }, ], unit: 'millionTokens', }, ], }, releasedAt: 
'2025-07-28', settings: { extendParams: ['enableReasoning', 'reasoningBudgetToken'], searchImpl: 'params', }, type: 'chat', }, { abilities: { functionCall: true, reasoning: true, search: true, }, config: { deploymentName: 'qwen-turbo-2025-07-15', }, contextWindowTokens: 1_000_000, // Non-thinking mode description: '通义千问 Turbo 后续不再更新，建议替换为通义千问 Flash 。通义千问超大规模语言模型，支持中文、英文等不同语言输入。', displayName: 'Qwen Turbo', id: 'qwen-turbo', maxOutput: 16_384, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput_cacheRead', rate: 0.3 * 0.2, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textInput', rate: 0.3, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-07-15', settings: { extendParams: ['enableReasoning', 'reasoningBudgetToken'], searchImpl: 'params', }, type: 'chat', }, { abilities: { functionCall: true, reasoning: true, search: true, }, config: { deploymentName: 'qwen-plus-2025-09-11', }, contextWindowTokens: 1_000_000, description: '通义千问超大规模语言模型增强版，支持中文、英文等不同语言输入。', displayName: 'Qwen Plus', enabled: true, id: 'qwen-plus', maxOutput: 32_768, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { lookup: { prices: { '[0, 0.128]': 0.8 * 0.2, '[0.128, 0.256]': 2.4 * 0.2, '[0.256, infinity]': 4.8 * 0.2, }, pricingParams: ['textInputRange'], }, name: 'textInput_cacheRead', strategy: 'lookup', unit: 'millionTokens', }, { lookup: { prices: { '[0, 0.128]': 0.8, '[0.128, 0.256]': 2.4, '[0.256, infinity]': 4.8, }, pricingParams: ['textInputRange'], }, name: 'textInput', strategy: 'lookup', unit: 'millionTokens', }, { lookup: { prices: { '[0, 0.128]_[false]': 2, '[0, 0.128]_[true]': 8, '[0.128, 0.256]_[false]': 20, '[0.128, 0.256]_[true]': 24, '[0.256, infinity]_[false]': 48, '[0.256, infinity]_[true]': 64, }, pricingParams: ['textInputRange', 'thinkingMode'], }, name: 'textOutput', strategy: 'lookup', unit: 'millionTokens', }, ], }, settings: { 
extendParams: ['enableReasoning', 'reasoningBudgetToken'], searchImpl: 'params', }, type: 'chat', }, { abilities: { functionCall: true, search: true, }, config: { deploymentName: 'qwen3-max', // 其支持上下文缓存 }, contextWindowTokens: 262_144, description: '通义千问3系列Max模型，相较2.5系列整体通用能力有大幅度提升，中英文通用文本理解能力、复杂指令遵循能力、主观开放任务能力、多语言能力、工具调用能力均显著增强；模型知识幻觉更少。最新的qwen3-max模型：相较qwen3-max-preview版本，在智能体编程与工具调用方向进行了专项升级。本次发布的正式版模型达到领域SOTA水平，适配场景更加复杂的智能体需求。', displayName: 'Qwen3 Max', enabled: true, id: 'qwen3-max', maxOutput: 65_536, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { lookup: { prices: { '[0, 0.032]': 6 * 0.2, '[0.032, 0.128]': 10 * 0.2, '[0.128, infinity]': 15 * 0.2, }, pricingParams: ['textInputRange'], }, name: 'textInput_cacheRead', strategy: 'lookup', unit: 'millionTokens', }, { lookup: { prices: { '[0, 0.032]': 6, '[0.032, 0.128]': 10, '[0.128, infinity]': 15, }, pricingParams: ['textInputRange'], }, name: 'textInput', strategy: 'lookup', unit: 'millionTokens', }, { lookup: { prices: { '[0, 0.032]': 24, '[0.032, 0.128]': 40, '[0.128, infinity]': 60, }, pricingParams: ['textInputRange'], }, name: 'textOutput', strategy: 'lookup', unit: 'millionTokens', }, ], }, releasedAt: '2025-09-23', settings: { searchImpl: 'params', }, type: 'chat', }, { abilities: { functionCall: true, search: true, }, config: { deploymentName: 'qwen-max-2025-01-25', }, contextWindowTokens: 131_072, description: '通义千问千亿级别超大规模语言模型，支持中文、英文等不同语言输入，当前通义千问2.5产品版本背后的API模型。', displayName: 'Qwen Max', id: 'qwen-max', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput_cacheRead', rate: 2.4 * 0.2, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textInput', rate: 2.4, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 9.6, strategy: 'fixed', unit: 'millionTokens' }, ], }, settings: { searchImpl: 'params', }, type: 'chat', }, { abilities: { functionCall: true, }, config: { deploymentName: 'qwen-long-latest', }, 
contextWindowTokens: 10_000_000, description: '通义千问超大规模语言模型，支持长文本上下文，以及基于长文档、多文档等多个场景的对话功能。', displayName: 'Qwen Long', id: 'qwen-long', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 0.5, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 2, strategy: 'fixed', unit: 'millionTokens' }, ], }, type: 'chat', }, { abilities: { vision: true, }, config: { deploymentName: 'qwen3-omni-flash-2025-09-15', }, contextWindowTokens: 65_536, description: 'Qwen-Omni 模型能够接收文本、图片、音频、视频等多种模态的组合输入，并生成文本或语音形式的回复，提供多种拟人音色，支持多语言和方言的语音输出，可应用于文本创作、视觉识别、语音助手等场景。', displayName: 'Qwen Omni Turbo', id: 'qwen3-omni-flash', maxOutput: 16_384, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 1.8, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 6.9, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-09-15', settings: { extendParams: ['enableReasoning', 'reasoningBudgetToken'], }, type: 'chat', }, { abilities: { vision: true, }, config: { deploymentName: 'qwen-omni-turbo-2025-03-26', }, contextWindowTokens: 32_768, description: 'Qwen-Omni 系列模型支持输入多种模态的数据，包括视频、音频、图片、文本，并输出音频与文本。', displayName: 'Qwen Omni Turbo', id: 'qwen-omni-turbo', maxOutput: 2048, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 1.5, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 4.5, strategy: 'fixed', unit: 'millionTokens' }, ], }, type: 'chat', }, { abilities: { vision: true, }, contextWindowTokens: 32_768, description: 'Qwen-Omni 系列模型支持输入多种模态的数据，包括视频、音频、图片、文本，并输出音频与文本。', displayName: 'Qwen2.5 Omni 7B', id: 'qwen2.5-omni-7b', maxOutput: 2048, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 6, strategy: 'fixed', unit: 'millionTokens' }, ], }, type: 'chat', }, { abilities: { vision: true, }, config: { 
deploymentName: 'qwen-vl-plus-2025-08-15', }, contextWindowTokens: 131_072, description: '通义千问大规模视觉语言模型增强版。大幅提升细节识别能力和文字识别能力，支持超百万像素分辨率和任意长宽比规格的图像。', displayName: 'Qwen VL Plus', id: 'qwen-vl-plus', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput_cacheRead', rate: 0.8 * 0.2, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textInput', rate: 0.8, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 2, strategy: 'fixed', unit: 'millionTokens' }, ], }, type: 'chat', }, { abilities: { vision: true, }, config: { deploymentName: 'qwen-vl-max-2025-08-13', }, contextWindowTokens: 131_072, description: '通义千问超大规模视觉语言模型。相比增强版，再次提升视觉推理能力和指令遵循能力，提供更高的视觉感知和认知水平。', displayName: 'Qwen VL Max', id: 'qwen-vl-max', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput_cacheRead', rate: 1.6 * 0.2, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textInput', rate: 1.6, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 4, strategy: 'fixed', unit: 'millionTokens' }, ], }, type: 'chat', }, { abilities: { vision: true, }, config: { deploymentName: 'qwen-vl-ocr-2025-04-13', }, contextWindowTokens: 34_096, description: '通义千问OCR是文字提取专有模型，专注于文档、表格、试题、手写体文字等类型图像的文字提取能力。它能够识别多种文字，目前支持的语言有：汉语、英语、法语、日语、韩语、德语、俄语、意大利语、越南语、阿拉伯语。', displayName: 'Qwen VL OCR', id: 'qwen-vl-ocr', maxOutput: 4096, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 5, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 5, strategy: 'fixed', unit: 'millionTokens' }, ], }, type: 'chat', }, { abilities: { vision: true, reasoning: true, }, contextWindowTokens: 131_072, description: 'Qwen-VL（开源版）提供视觉理解与文本生成能力，支持智能体交互、视觉编码、空间感知、长视频理解与深度思考，并在复杂场景下具备更强的文字识别与多语言支持。', displayName: 'Qwen3 VL 30B A3B Thinking', id: 'qwen3-vl-30b-a3b-thinking', maxOutput: 32_768, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', 
rate: 0.75, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 7.5, strategy: 'fixed', unit: 'millionTokens' }, ], }, settings: { extendParams: ['reasoningBudgetToken'], }, type: 'chat', }, { abilities: { vision: true, }, contextWindowTokens: 131_072, description: 'Qwen3 VL 30B 非思考模式（Instruct），面向普通指令跟随场景，保持较高的多模态理解与生成能力。', displayName: 'Qwen3 VL 30B A3B Instruct', id: 'qwen3-vl-30b-a3b-instruct', maxOutput: 32_768, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 0.75, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' }, ], }, type: 'chat', }, { abilities: { vision: true, reasoning: true, }, contextWindowTokens: 131_072, description: 'Qwen3 VL 8B 思考模式，面向轻量级多模态推理与交互场景，保留长上下文理解能力。', displayName: 'Qwen3 VL 8B Thinking', id: 'qwen3-vl-8b-thinking', maxOutput: 32_768, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 0.5, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 5, strategy: 'fixed', unit: 'millionTokens' }, ], }, type: 'chat', }, { abilities: { vision: true, }, contextWindowTokens: 131_072, description: 'Qwen3 VL 8B 非思考模式（Instruct），适合常规多模态生成与识别任务。', displayName: 'Qwen3 VL 8B Instruct', id: 'qwen3-vl-8b-instruct', maxOutput: 32_768, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 0.5, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 2, strategy: 'fixed', unit: 'millionTokens' }, ], }, type: 'chat', }, { abilities: { vision: true, reasoning: true, }, contextWindowTokens: 131_072, description: 'Qwen3 VL 235B A22B 思考模式（开源版），针对高难度强推理与长视频理解场景，提供顶尖的视觉+文本推理能力。', displayName: 'Qwen3 VL 235B A22B Thinking', id: 'qwen3-vl-235b-a22b-thinking', maxOutput: 32_768, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 20, strategy: 
'fixed', unit: 'millionTokens' }, ], }, settings: { extendParams: ['enableReasoning', 'reasoningBudgetToken'], }, type: 'chat', }, { abilities: { vision: true, }, contextWindowTokens: 131_072, description: 'Qwen3 VL 235B A22B 非思考模式（Instruct），适用于非思考指令场景，保持强大的视觉理解能力。', displayName: 'Qwen3 VL 235B A22B Instruct', id: 'qwen3-vl-235b-a22b-instruct', maxOutput: 32_768, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 8, strategy: 'fixed', unit: 'millionTokens' }, ], }, type: 'chat', }, { config: { deploymentName: 'qwen-math-turbo-latest', }, contextWindowTokens: 4096, description: '通义千问数学模型是专门用于数学解题的语言模型。', displayName: 'Qwen Math Turbo', id: 'qwen-math-turbo', maxOutput: 3072, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 6, strategy: 'fixed', unit: 'millionTokens' }, ], }, type: 'chat', }, { config: { deploymentName: 'qwen-math-plus-latest', }, contextWindowTokens: 4096, description: '通义千问数学模型是专门用于数学解题的语言模型。', displayName: 'Qwen Math Plus', id: 'qwen-math-plus', maxOutput: 3072, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 4, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 12, strategy: 'fixed', unit: 'millionTokens' }, ], }, type: 'chat', }, { config: { deploymentName: 'qwen-coder-turbo-latest', }, contextWindowTokens: 131_072, description: '通义千问代码模型。', displayName: 'Qwen Coder Turbo', id: 'qwen-coder-turbo', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 6, strategy: 'fixed', unit: 'millionTokens' }, ], }, type: 'chat', }, { config: { deploymentName: 'qwen-coder-plus-latest', }, contextWindowTokens: 131_072, description: '通义千问代码模型。', displayName: 'Qwen 
Coder Plus', id: 'qwen-coder-plus', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 3.5, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 7, strategy: 'fixed', unit: 'millionTokens' }, ], }, type: 'chat', }, { abilities: { reasoning: true, search: true, }, contextWindowTokens: 131_072, description: '基于 Qwen2.5-32B 模型训练的 QwQ 推理模型，通过强化学习大幅度提升了模型推理能力。模型数学代码等核心指标（AIME 24/25、LiveCodeBench）以及部分通用指标（IFEval、LiveBench等）达到DeepSeek-R1 满血版水平，各指标均显著超过同样基于 Qwen2.5-32B 的 DeepSeek-R1-Distill-Qwen-32B。', displayName: 'QwQ 32B', id: 'qwq-32b', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 6, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-03-06', settings: { searchImpl: 'params', }, type: 'chat', }, { abilities: { reasoning: true, }, contextWindowTokens: 32_768, description: 'QwQ模型是由 Qwen 团队开发的实验性研究模型，专注于增强 AI 推理能力。', displayName: 'QwQ 32B Preview', id: 'qwq-32b-preview', maxOutput: 16_384, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 6, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2024-11-28', type: 'chat', }, { abilities: { reasoning: true, vision: true, }, config: { deploymentName: 'qvq-max-2025-05-15', }, contextWindowTokens: 131_072, description: '通义千问QVQ视觉推理模型，支持视觉输入及思维链输出，在数学、编程、视觉分析、创作以及通用任务上都表现了更强的能力。', displayName: 'QVQ Max', id: 'qvq-max', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 8, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 32, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-05-15', type: 'chat', }, { abilities: { reasoning: true, vision: true, }, config: { deploymentName: 'qvq-plus-2025-05-15', }, 
contextWindowTokens: 131_072, description: '视觉推理模型。支持视觉输入及思维链输出，继qvq-max模型后推出的plus版本，相较于qvq-max模型，qvq-plus系列模型推理速度更快，效果和成本更均衡。', displayName: 'QVQ Plus', id: 'qvq-plus', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 5, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-05-15', type: 'chat', }, { abilities: { reasoning: true, vision: true, }, contextWindowTokens: 32_768, description: 'QVQ模型是由 Qwen 团队开发的实验性研究模型，专注于提升视觉推理能力，尤其在数学推理领域。', displayName: 'QVQ 72B Preview', id: 'qvq-72b-preview', maxOutput: 16_384, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 12, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 36, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2024-12-25', type: 'chat', }, { abilities: { functionCall: true, }, contextWindowTokens: 131_072, description: '通义千问2.5对外开源的7B规模的模型。', displayName: 'Qwen2.5 7B', id: 'qwen2.5-7b-instruct', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 0.5, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 1, strategy: 'fixed', unit: 'millionTokens' }, ], }, type: 'chat', }, { abilities: { functionCall: true, }, contextWindowTokens: 131_072, description: '通义千问2.5对外开源的14B规模的模型。', displayName: 'Qwen2.5 14B', id: 'qwen2.5-14b-instruct', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 1, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' }, ], }, type: 'chat', }, { abilities: { functionCall: true, }, contextWindowTokens: 131_072, description: '通义千问2.5对外开源的32B规模的模型。', displayName: 'Qwen2.5 32B', id: 'qwen2.5-32b-instruct', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', 
rate: 2, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 6, strategy: 'fixed', unit: 'millionTokens' }, ], }, type: 'chat', }, { abilities: { functionCall: true, }, contextWindowTokens: 131_072, description: '通义千问2.5对外开源的72B规模的模型。', displayName: 'Qwen2.5 72B', id: 'qwen2.5-72b-instruct', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 4, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 12, strategy: 'fixed', unit: 'millionTokens' }, ], }, type: 'chat', }, { abilities: { functionCall: true, }, contextWindowTokens: 1_000_000, description: '通义千问2.5对外开源的72B规模的模型。', displayName: 'Qwen2.5 14B 1M', id: 'qwen2.5-14b-instruct-1m', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 1, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-01-27', type: 'chat', }, { contextWindowTokens: 4096, description: 'Qwen-Math 模型具有强大的数学解题能力。', displayName: 'Qwen2.5 Math 7B', id: 'qwen2.5-math-7b-instruct', maxOutput: 3072, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 1, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 2, strategy: 'fixed', unit: 'millionTokens' }, ], }, type: 'chat', }, { contextWindowTokens: 4096, description: 'Qwen-Math 模型具有强大的数学解题能力。', displayName: 'Qwen2.5 Math 72B', id: 'qwen2.5-math-72b-instruct', maxOutput: 3072, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 4, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 12, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-07-23', type: 'chat', }, { contextWindowTokens: 131_072, description: '通义千问代码模型开源版。', displayName: 'Qwen2.5 Coder 7B', id: 'qwen2.5-coder-7b-instruct', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: 
[ { name: 'textInput', rate: 1, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 2, strategy: 'fixed', unit: 'millionTokens' }, ], }, type: 'chat', }, { contextWindowTokens: 131_072, description: '通义千问代码模型开源版。', displayName: 'Qwen2.5 Coder 14B', id: 'qwen2.5-coder-14b-instruct', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 6, strategy: 'fixed', unit: 'millionTokens' }, ], }, type: 'chat', }, { contextWindowTokens: 131_072, description: '通义千问代码模型开源版。', displayName: 'Qwen2.5 Coder 32B', id: 'qwen2.5-coder-32b-instruct', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 6, strategy: 'fixed', unit: 'millionTokens' }, ], }, type: 'chat', }, { abilities: { vision: true, }, contextWindowTokens: 131_072, description: '指令跟随、数学、解题、代码整体提升，万物识别能力提升，支持多样格式直接精准定位视觉元素，支持对长视频文件（最长10分钟）进行理解和秒级别的事件时刻定位，能理解时间先后和快慢，基于解析和定位能力支持操控OS或Mobile的Agent，关键信息抽取能力和Json格式输出能力强，此版本为72B版本，本系列能力最强的版本。', displayName: 'Qwen2.5 VL 72B', id: 'qwen2.5-vl-72b-instruct', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 16, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 48, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-01-27', type: 'chat', }, { abilities: { vision: true, }, contextWindowTokens: 131_072, description: 'Qwen2.5VL系列模型，在math和学科问题解答达到了接近Qwen2.5VL-72B的水平，回复风格面向人类偏好进行大幅调整，尤其是数学、逻辑推理、知识问答等客观类query，模型回复详实程度和格式清晰度明显改善。此版本为32B版本。', displayName: 'Qwen2.5 VL 32B', id: 'qwen2.5-vl-32b-instruct', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 8, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 24, strategy: 'fixed', unit: 'millionTokens' }, ], }, 
releasedAt: '2025-03-24', type: 'chat', }, { abilities: { vision: true, }, contextWindowTokens: 131_072, description: '指令跟随、数学、解题、代码整体提升，万物识别能力提升，支持多样格式直接精准定位视觉元素，支持对长视频文件（最长10分钟）进行理解和秒级别的事件时刻定位，能理解时间先后和快慢，基于解析和定位能力支持操控OS或Mobile的Agent，关键信息抽取能力和Json格式输出能力强，此版本为72B版本，本系列能力最强的版本。', displayName: 'Qwen2.5 VL 7B', id: 'qwen2.5-vl-7b-instruct', maxOutput: 8192, organization: 'Qwen', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 5, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-01-27', type: 'chat', }, { abilities: { reasoning: true, }, contextWindowTokens: 131_072, description: '685B 满血版模型，2025年5月28日发布。DeepSeek-R1 在后训练阶段大规模使用了强化学习技术，在仅有极少标注数据的情况下，极大提升了模型推理能力。在数学、代码、自然语言推理等任务上，性能较高，能力较强。', displayName: 'DeepSeek R1 0528', id: 'deepseek-r1-0528', maxOutput: 16_384, organization: 'DeepSeek', pricing: { currency: 'CNY', units: [ { name: 'textInput', rate: 4, strategy: 'fixed', unit: 'millionTokens' }, { name: 'textOutput', rate: 16, strategy: 'fixed', unit: 'millionTokens' }, ], }, releasedAt: '2025-05-28', type: 'chat', }, { contextWindowTokens: 65_536, description: 'DeepSeek-V3 为自研 MoE 模型，671B 参数，激活 37B，在 14.8T token 上进行了预训练，在长文本、代码、数学、百科、中文能力上表现优秀。', displayName: 'DeepSeek V3', id: 'deepseek-v3', maxOutput: 8192, organization: 'DeepSeek', pricing: { currency: 'CNY', units: [ {