/*
 * @lobehub/chat
 * Version:
 * Lobe Chat - an open-source, high-performance chatbot framework that supports speech synthesis, multimodal input, and an extensible Function Call plugin system. Supports one-click free deployment of your private ChatGPT/LLM web application.
 * 1,850 lines (1,848 loc) • 72.5 kB
 * text/typescript
 */
import { AIChatModelCard, AIImageModelCard } from '../types/aiModel';
// https://help.aliyun.com/zh/model-studio/models?spm=a2c4g.11186623
const qwenChatModels: AIChatModelCard[] = [
{
abilities: {
reasoning: true,
vision: true,
},
config: {
deploymentName: 'qwen3-vl-plus',
},
contextWindowTokens: 262_144,
description:
'通义千问VL是具有视觉(图像)理解能力的文本生成模型,不仅能进行OCR(图片文字识别),还能进一步总结和推理,例如从商品照片中提取属性,根据习题图进行解题等。',
displayName: 'Qwen3 VL Plus',
id: 'qwen3-vl-plus',
maxOutput: 32_768,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{
lookup: {
prices: {
'[0, 0.032]': 1,
'[0.032, 0.128]': 1.5,
'[0.128, infinity]': 3,
},
pricingParams: ['textInputRange'],
},
name: 'textInput',
strategy: 'lookup',
unit: 'millionTokens',
},
{
lookup: {
prices: {
'[0, 0.032]': 10,
'[0.032, 0.128]': 15,
'[0.128, infinity]': 30,
},
pricingParams: ['textInputRange'],
},
name: 'textOutput',
strategy: 'lookup',
unit: 'millionTokens',
},
],
},
releasedAt: '2025-09-23',
settings: {
extendParams: ['enableReasoning', 'reasoningBudgetToken'],
},
type: 'chat',
},
{
abilities: {
reasoning: true,
vision: true,
},
config: {
deploymentName: 'qwen3-vl-flash-2025-10-15',
},
contextWindowTokens: 262_144,
description: 'Qwen3 VL Flash:轻量化高速推理版本,适合对延迟敏感或大批量请求场景。',
displayName: 'Qwen3 VL Flash',
id: 'qwen3-vl-flash',
maxOutput: 32_768,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{
lookup: {
prices: {
'[0, 0.032]': 0.15,
'[0.032, 0.128]': 0.3,
'[0.128, 0.256]': 0.6,
},
pricingParams: ['textInputRange'],
},
name: 'textInput',
strategy: 'lookup',
unit: 'millionTokens',
},
{
lookup: {
prices: {
'[0, 0.032]': 1.5,
'[0.032, 0.128]': 3,
'[0.128, 0.256]': 6,
},
pricingParams: ['textInputRange'],
},
name: 'textOutput',
strategy: 'lookup',
unit: 'millionTokens',
},
],
},
releasedAt: '2025-10-15',
settings: {
extendParams: ['enableReasoning', 'reasoningBudgetToken'],
},
type: 'chat',
},
{
abilities: {
reasoning: true,
},
contextWindowTokens: 131_072,
description:
'deepseek-v3.2-exp 引入稀疏注意力机制,旨在提升处理长文本时的训练与推理效率,价格低于 deepseek-v3.1。',
displayName: 'DeepSeek V3.2 Exp',
id: 'deepseek-v3.2-exp',
maxOutput: 65_536,
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' },
],
},
settings: {
extendParams: ['enableReasoning', 'reasoningBudgetToken'],
},
type: 'chat',
},
{
abilities: {
reasoning: true,
},
contextWindowTokens: 131_072,
description: 'DeepSeek V3.1 模型为混合推理架构模型,同时支持思考模式与非思考模式。',
displayName: 'DeepSeek V3.1',
id: 'deepseek-v3.1',
maxOutput: 65_536,
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 4, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 12, strategy: 'fixed', unit: 'millionTokens' },
],
},
settings: {
extendParams: ['enableReasoning', 'reasoningBudgetToken'],
},
type: 'chat',
},
{
abilities: {
search: true,
},
contextWindowTokens: 131_072,
description:
'总参数 1T,激活参数 32B。 非思维模型中,在前沿知识、数学和编码方面达到了顶尖水平,更擅长通用 Agent 任务。 针对代理任务进行了精心优化,不仅能回答问题,还能采取行动。 最适用于即兴、通用聊天和代理体验,是一款无需长时间思考的反射级模型。',
displayName: 'Kimi K2 Instruct',
id: 'Moonshot-Kimi-K2-Instruct',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 4, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 16, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-07-17',
settings: {
searchImpl: 'params',
},
type: 'chat',
},
{
abilities: {
reasoning: true,
},
contextWindowTokens: 131_072,
description: 'GLM-4.5系列模型是智谱AI专为智能体设计的混合推理模型,提供思考与非思考两种模式。',
displayName: 'GLM-4.5',
id: 'glm-4.5',
maxOutput: 16_384,
pricing: {
currency: 'CNY',
units: [
{
lookup: {
prices: {
'[0, 0.032]': 3,
'[0.032, infinity]': 4,
},
pricingParams: ['textInputRange'],
},
name: 'textInput',
strategy: 'lookup',
unit: 'millionTokens',
},
{
lookup: {
prices: {
'[0, 0.032]': 14,
'[0.032, infinity]': 16,
},
pricingParams: ['textInputRange'],
},
name: 'textOutput',
strategy: 'lookup',
unit: 'millionTokens',
},
],
},
settings: {
extendParams: ['enableReasoning', 'reasoningBudgetToken'],
},
type: 'chat',
},
{
abilities: {
reasoning: true,
},
contextWindowTokens: 131_072,
description: 'GLM-4.5系列模型是智谱AI专为智能体设计的混合推理模型,提供思考与非思考两种模式。',
displayName: 'GLM-4.5-Air',
id: 'glm-4.5-air',
maxOutput: 16_384,
pricing: {
currency: 'CNY',
units: [
{
lookup: {
prices: {
'[0, 0.032]': 0.8,
'[0.032, infinity]': 1.2,
},
pricingParams: ['textInputRange'],
},
name: 'textInput',
strategy: 'lookup',
unit: 'millionTokens',
},
{
lookup: {
prices: {
'[0, 0.032]': 6,
'[0.032, infinity]': 8,
},
pricingParams: ['textInputRange'],
},
name: 'textOutput',
strategy: 'lookup',
unit: 'millionTokens',
},
],
},
settings: {
extendParams: ['enableReasoning', 'reasoningBudgetToken'],
},
type: 'chat',
},
{
abilities: {
functionCall: true,
},
config: {
deploymentName: 'qwen3-coder-plus', // 支持上下文缓存
},
contextWindowTokens: 1_000_000,
description:
'通义千问代码模型。最新的 Qwen3-Coder 系列模型是基于 Qwen3 的代码生成模型,具有强大的Coding Agent能力,擅长工具调用和环境交互,能够实现自主编程,代码能力卓越的同时兼具通用能力。',
displayName: 'Qwen3 Coder Plus',
id: 'qwen3-coder-plus',
maxOutput: 65_536,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{
lookup: {
prices: {
'[0, 0.032]': 4 * 0.2,
'[0.032, 0.128]': 6 * 0.2,
'[0.128, 0.256]': 10 * 0.2,
'[0.256, infinity]': 20 * 0.2,
},
pricingParams: ['textInputRange'],
},
name: 'textInput_cacheRead',
strategy: 'lookup',
unit: 'millionTokens',
},
{
lookup: {
prices: {
'[0, 0.032]': 4,
'[0.032, 0.128]': 6,
'[0.128, 0.256]': 10,
'[0.256, infinity]': 20,
},
pricingParams: ['textInputRange'],
},
name: 'textInput',
strategy: 'lookup',
unit: 'millionTokens',
},
{
lookup: {
prices: {
'[0, 0.032]': 16,
'[0.032, 0.128]': 24,
'[0.128, 0.256]': 40,
'[0.256, infinity]': 200,
},
pricingParams: ['textInputRange'],
},
name: 'textOutput',
strategy: 'lookup',
unit: 'millionTokens',
},
],
},
type: 'chat',
},
{
abilities: {
functionCall: true,
},
config: {
deploymentName: 'qwen3-coder-flash', // 支持上下文缓存
},
contextWindowTokens: 1_000_000,
description:
'通义千问代码模型。最新的 Qwen3-Coder 系列模型是基于 Qwen3 的代码生成模型,具有强大的Coding Agent能力,擅长工具调用和环境交互,能够实现自主编程,代码能力卓越的同时兼具通用能力。',
displayName: 'Qwen3 Coder Flash',
id: 'qwen3-coder-flash',
maxOutput: 65_536,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{
lookup: {
prices: {
'[0, 0.032]': 0.2,
'[0.032, 0.128]': 0.3,
'[0.128, 0.256]': 0.5,
'[0.256, 1]': 1,
},
pricingParams: ['textInputRange'],
},
name: 'textInput_cacheRead',
strategy: 'lookup',
unit: 'millionTokens',
},
{
lookup: {
prices: {
'[0, 0.032]': 1,
'[0.032, 0.128]': 1.5,
'[0.128, 0.256]': 2.5,
'[0.256, 1]': 5,
},
pricingParams: ['textInputRange'],
},
name: 'textInput',
strategy: 'lookup',
unit: 'millionTokens',
},
{
lookup: {
prices: {
'[0, 0.032]': 4,
'[0.032, 0.128]': 6,
'[0.128, 0.256]': 10,
'[0.256, 1]': 25,
},
pricingParams: ['textInputRange'],
},
name: 'textOutput',
strategy: 'lookup',
unit: 'millionTokens',
},
],
},
type: 'chat',
},
{
abilities: {
functionCall: true,
},
contextWindowTokens: 262_144,
description:
'通义千问代码模型开源版。最新的 qwen3-coder-480b-a35b-instruct 是基于 Qwen3 的代码生成模型,具有强大的Coding Agent能力,擅长工具调用和环境交互,能够实现自主编程、代码能力卓越的同时兼具通用能力。',
displayName: 'Qwen3 Coder 480B A35B',
id: 'qwen3-coder-480b-a35b-instruct',
maxOutput: 65_536,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{
lookup: {
prices: {
'[0, 0.032]': 6,
'[0.032, 0.128]': 9,
'[0.128, 0.2]': 15,
},
pricingParams: ['textInputRange'],
},
name: 'textInput',
strategy: 'lookup',
unit: 'millionTokens',
},
{
lookup: {
prices: {
'[0, 0.032]': 24,
'[0.032, 0.128]': 36,
'[0.128, 0.2]': 60,
},
pricingParams: ['textInputRange'],
},
name: 'textOutput',
strategy: 'lookup',
unit: 'millionTokens',
},
],
},
type: 'chat',
},
{
abilities: {
functionCall: true,
},
contextWindowTokens: 262_144,
description:
'通义千问代码模型开源版。最新的 qwen3-coder-30b-a3b-instruct 是基于 Qwen3 的代码生成模型,具有强大的Coding Agent能力,擅长工具调用和环境交互,能够实现自主编程、代码能力卓越的同时兼具通用能力。',
displayName: 'Qwen3 Coder 30B A3B',
id: 'qwen3-coder-30b-a3b-instruct',
maxOutput: 65_536,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{
lookup: {
prices: {
'[0, 0.032]': 1.5,
'[0.032, 0.128]': 2.25,
'[0.128, 0.2]': 3.75,
},
pricingParams: ['textInputRange'],
},
name: 'textInput',
strategy: 'lookup',
unit: 'millionTokens',
},
{
lookup: {
prices: {
'[0, 0.032]': 6,
'[0.032, 0.128]': 9,
'[0.128, 0.2]': 15,
},
pricingParams: ['textInputRange'],
},
name: 'textOutput',
strategy: 'lookup',
unit: 'millionTokens',
},
],
},
type: 'chat',
},
{
abilities: {
functionCall: true,
reasoning: true,
},
contextWindowTokens: 131_072,
description:
'基于Qwen3的思考模式开源模型,相较上一版本(通义千问3-235B-A22B)逻辑能力、通用能力、知识增强及创作能力均有大幅提升,适用于高难度强推理场景。',
displayName: 'Qwen3 235B A22B Thinking 2507',
enabled: true,
id: 'qwen3-235b-a22b-thinking-2507',
maxOutput: 32_768,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 20, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-07-25',
settings: {
extendParams: ['reasoningBudgetToken'],
},
type: 'chat',
},
{
abilities: {
functionCall: true,
},
contextWindowTokens: 131_072,
description:
'基于Qwen3的非思考模式开源模型,相较上一版本(通义千问3-235B-A22B)主观创作能力与模型安全性均有小幅度提升。',
displayName: 'Qwen3 235B A22B Instruct 2507',
enabled: true,
id: 'qwen3-235b-a22b-instruct-2507',
maxOutput: 32_768,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 8, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-07-22',
type: 'chat',
},
{
abilities: {
functionCall: true,
reasoning: true,
},
contextWindowTokens: 131_072,
description:
'基于Qwen3的思考模式开源模型,相较上一版本(通义千问3-30B-A3B)逻辑能力、通用能力、知识增强及创作能力均有大幅提升,适用于高难度强推理场景。',
displayName: 'Qwen3 30B A3B Thinking 2507',
id: 'qwen3-30b-a3b-thinking-2507',
maxOutput: 32_768,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 0.75, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 7.5, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-07-30',
settings: {
extendParams: ['reasoningBudgetToken'],
},
type: 'chat',
},
{
abilities: {
functionCall: true,
},
contextWindowTokens: 131_072,
description:
'相较上一版本(Qwen3-30B-A3B)中英文和多语言整体通用能力有大幅提升。主观开放类任务专项优化,显著更加符合用户偏好,能够提供更有帮助性的回复。',
displayName: 'Qwen3 30B A3B Instruct 2507',
id: 'qwen3-30b-a3b-instruct-2507',
maxOutput: 32_768,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 0.75, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-07-29',
type: 'chat',
},
{
abilities: {
functionCall: true,
reasoning: true,
},
contextWindowTokens: 131_072,
description:
'基于 Qwen3 的新一代思考模式开源模型,相较上一版本(通义千问3-235B-A22B-Thinking-2507)指令遵循能力有提升、模型总结回复更加精简。',
displayName: 'Qwen3 Next 80B A3B Thinking',
id: 'qwen3-next-80b-a3b-thinking',
maxOutput: 32_768,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 1, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 10, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-09-12',
settings: {
extendParams: ['reasoningBudgetToken'],
},
type: 'chat',
},
{
abilities: {
functionCall: true,
},
contextWindowTokens: 131_072,
description:
'基于 Qwen3 的新一代非思考模式开源模型,相较上一版本(通义千问3-235B-A22B-Instruct-2507)中文文本理解能力更佳、逻辑推理能力有增强、文本生成类任务表现更好。',
displayName: 'Qwen3 Next 80B A3B Instruct',
id: 'qwen3-next-80b-a3b-instruct',
maxOutput: 32_768,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 1, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 4, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-09-12',
type: 'chat',
},
{
abilities: {
functionCall: true,
reasoning: true,
},
contextWindowTokens: 131_072,
description:
'Qwen3是一款能力大幅提升的新一代通义千问大模型,在推理、通用、Agent和多语言等多个核心能力上均达到业界领先水平,并支持思考模式切换。',
displayName: 'Qwen3 235B A22B',
id: 'qwen3-235b-a22b',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 20, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-04-28',
settings: {
extendParams: ['enableReasoning', 'reasoningBudgetToken'],
},
type: 'chat',
},
{
abilities: {
functionCall: true,
reasoning: true,
},
contextWindowTokens: 131_072,
description:
'Qwen3是一款能力大幅提升的新一代通义千问大模型,在推理、通用、Agent和多语言等多个核心能力上均达到业界领先水平,并支持思考模式切换。',
displayName: 'Qwen3 32B',
id: 'qwen3-32b',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 20, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-04-28',
settings: {
extendParams: ['enableReasoning', 'reasoningBudgetToken'],
},
type: 'chat',
},
{
abilities: {
functionCall: true,
reasoning: true,
},
contextWindowTokens: 131_072,
description:
'Qwen3是一款能力大幅提升的新一代通义千问大模型,在推理、通用、Agent和多语言等多个核心能力上均达到业界领先水平,并支持思考模式切换。',
displayName: 'Qwen3 30B A3B',
id: 'qwen3-30b-a3b',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 0.75, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 7.5, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-04-28',
settings: {
extendParams: ['enableReasoning', 'reasoningBudgetToken'],
},
type: 'chat',
},
{
abilities: {
functionCall: true,
reasoning: true,
},
contextWindowTokens: 131_072,
description:
'Qwen3是一款能力大幅提升的新一代通义千问大模型,在推理、通用、Agent和多语言等多个核心能力上均达到业界领先水平,并支持思考模式切换。',
displayName: 'Qwen3 14B',
id: 'qwen3-14b',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 1, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 10, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-04-28',
settings: {
extendParams: ['enableReasoning', 'reasoningBudgetToken'],
},
type: 'chat',
},
{
abilities: {
functionCall: true,
reasoning: true,
},
contextWindowTokens: 131_072,
description:
'Qwen3是一款能力大幅提升的新一代通义千问大模型,在推理、通用、Agent和多语言等多个核心能力上均达到业界领先水平,并支持思考模式切换。',
displayName: 'Qwen3 8B',
id: 'qwen3-8b',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 0.5, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 5, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-04-28',
settings: {
extendParams: ['enableReasoning', 'reasoningBudgetToken'],
},
type: 'chat',
},
{
abilities: {
functionCall: true,
reasoning: true,
},
contextWindowTokens: 131_072,
description:
'Qwen3是一款能力大幅提升的新一代通义千问大模型,在推理、通用、Agent和多语言等多个核心能力上均达到业界领先水平,并支持思考模式切换。',
displayName: 'Qwen3 4B',
id: 'qwen3-4b',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 0.3, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-04-28',
settings: {
extendParams: ['enableReasoning', 'reasoningBudgetToken'],
},
type: 'chat',
},
{
abilities: {
functionCall: true,
reasoning: true,
},
contextWindowTokens: 32_768,
description:
'Qwen3是一款能力大幅提升的新一代通义千问大模型,在推理、通用、Agent和多语言等多个核心能力上均达到业界领先水平,并支持思考模式切换。',
displayName: 'Qwen3 1.7B',
id: 'qwen3-1.7b',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 0.3, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-04-28',
settings: {
extendParams: ['enableReasoning', 'reasoningBudgetToken'],
},
type: 'chat',
},
{
abilities: {
functionCall: true,
reasoning: true,
},
contextWindowTokens: 32_768,
description:
'Qwen3是一款能力大幅提升的新一代通义千问大模型,在推理、通用、Agent和多语言等多个核心能力上均达到业界领先水平,并支持思考模式切换。',
displayName: 'Qwen3 0.6B',
id: 'qwen3-0.6b',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 0.3, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-04-28',
settings: {
extendParams: ['enableReasoning', 'reasoningBudgetToken'],
},
type: 'chat',
},
{
abilities: {
functionCall: true,
reasoning: true,
search: true,
},
config: {
deploymentName: 'qwq-plus-2025-03-05',
},
contextWindowTokens: 131_072,
description:
'基于 Qwen2.5 模型训练的 QwQ 推理模型,通过强化学习大幅度提升了模型推理能力。模型数学代码等核心指标(AIME 24/25、LiveCodeBench)以及部分通用指标(IFEval、LiveBench等)达到DeepSeek-R1 满血版水平。',
displayName: 'QwQ Plus',
id: 'qwq-plus',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 1.6, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 4, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-03-05',
settings: {
searchImpl: 'params',
},
type: 'chat',
},
{
abilities: {
functionCall: true,
reasoning: true,
search: true,
},
config: {
deploymentName: 'qwen-flash',
},
contextWindowTokens: 1_000_000,
description: '通义千问系列速度最快、成本极低的模型,适合简单任务。',
displayName: 'Qwen Flash',
enabled: true,
id: 'qwen-flash',
maxOutput: 32_768,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{
name: 'textInput',
strategy: 'tiered',
tiers: [
{ rate: 0.15, upTo: 0.128 },
{ rate: 0.6, upTo: 0.256 },
{ rate: 1.2, upTo: 'infinity' },
],
unit: 'millionTokens',
},
{
name: 'textOutput',
strategy: 'tiered',
tiers: [
{ rate: 1.5, upTo: 0.128 },
{ rate: 6, upTo: 0.256 },
{ rate: 12, upTo: 'infinity' },
],
unit: 'millionTokens',
},
{
name: 'textInput_cacheRead',
strategy: 'tiered',
tiers: [
{ rate: 0.15 * 0.2, upTo: 0.128 },
{ rate: 0.6 * 0.2, upTo: 0.256 },
{ rate: 1.2 * 0.2, upTo: 'infinity' },
],
unit: 'millionTokens',
},
],
},
releasedAt: '2025-07-28',
settings: {
extendParams: ['enableReasoning', 'reasoningBudgetToken'],
searchImpl: 'params',
},
type: 'chat',
},
{
abilities: {
functionCall: true,
reasoning: true,
search: true,
},
config: {
deploymentName: 'qwen-turbo-2025-07-15',
},
contextWindowTokens: 1_000_000, // Non-thinking mode
description:
'通义千问 Turbo 后续不再更新,建议替换为通义千问 Flash 。通义千问超大规模语言模型,支持中文、英文等不同语言输入。',
displayName: 'Qwen Turbo',
id: 'qwen-turbo',
maxOutput: 16_384,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput_cacheRead', rate: 0.3 * 0.2, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textInput', rate: 0.3, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-07-15',
settings: {
extendParams: ['enableReasoning', 'reasoningBudgetToken'],
searchImpl: 'params',
},
type: 'chat',
},
{
abilities: {
functionCall: true,
reasoning: true,
search: true,
},
config: {
deploymentName: 'qwen-plus-2025-09-11',
},
contextWindowTokens: 1_000_000,
description: '通义千问超大规模语言模型增强版,支持中文、英文等不同语言输入。',
displayName: 'Qwen Plus',
enabled: true,
id: 'qwen-plus',
maxOutput: 32_768,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{
lookup: {
prices: {
'[0, 0.128]': 0.8 * 0.2,
'[0.128, 0.256]': 2.4 * 0.2,
'[0.256, infinity]': 4.8 * 0.2,
},
pricingParams: ['textInputRange'],
},
name: 'textInput_cacheRead',
strategy: 'lookup',
unit: 'millionTokens',
},
{
lookup: {
prices: {
'[0, 0.128]': 0.8,
'[0.128, 0.256]': 2.4,
'[0.256, infinity]': 4.8,
},
pricingParams: ['textInputRange'],
},
name: 'textInput',
strategy: 'lookup',
unit: 'millionTokens',
},
{
lookup: {
prices: {
'[0, 0.128]_[false]': 2,
'[0, 0.128]_[true]': 8,
'[0.128, 0.256]_[false]': 20,
'[0.128, 0.256]_[true]': 24,
'[0.256, infinity]_[false]': 48,
'[0.256, infinity]_[true]': 64,
},
pricingParams: ['textInputRange', 'thinkingMode'],
},
name: 'textOutput',
strategy: 'lookup',
unit: 'millionTokens',
},
],
},
settings: {
extendParams: ['enableReasoning', 'reasoningBudgetToken'],
searchImpl: 'params',
},
type: 'chat',
},
{
abilities: {
functionCall: true,
search: true,
},
config: {
deploymentName: 'qwen3-max', // 其支持上下文缓存
},
contextWindowTokens: 262_144,
description:
'通义千问3系列Max模型,相较2.5系列整体通用能力有大幅度提升,中英文通用文本理解能力、复杂指令遵循能力、主观开放任务能力、多语言能力、工具调用能力均显著增强;模型知识幻觉更少。最新的qwen3-max模型:相较qwen3-max-preview版本,在智能体编程与工具调用方向进行了专项升级。本次发布的正式版模型达到领域SOTA水平,适配场景更加复杂的智能体需求。',
displayName: 'Qwen3 Max',
enabled: true,
id: 'qwen3-max',
maxOutput: 65_536,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{
lookup: {
prices: {
'[0, 0.032]': 6 * 0.2,
'[0.032, 0.128]': 10 * 0.2,
'[0.128, infinity]': 15 * 0.2,
},
pricingParams: ['textInputRange'],
},
name: 'textInput_cacheRead',
strategy: 'lookup',
unit: 'millionTokens',
},
{
lookup: {
prices: {
'[0, 0.032]': 6,
'[0.032, 0.128]': 10,
'[0.128, infinity]': 15,
},
pricingParams: ['textInputRange'],
},
name: 'textInput',
strategy: 'lookup',
unit: 'millionTokens',
},
{
lookup: {
prices: {
'[0, 0.032]': 24,
'[0.032, 0.128]': 40,
'[0.128, infinity]': 60,
},
pricingParams: ['textInputRange'],
},
name: 'textOutput',
strategy: 'lookup',
unit: 'millionTokens',
},
],
},
releasedAt: '2025-09-23',
settings: {
searchImpl: 'params',
},
type: 'chat',
},
{
abilities: {
functionCall: true,
search: true,
},
config: {
deploymentName: 'qwen-max-2025-01-25',
},
contextWindowTokens: 131_072,
description:
'通义千问千亿级别超大规模语言模型,支持中文、英文等不同语言输入,当前通义千问2.5产品版本背后的API模型。',
displayName: 'Qwen Max',
id: 'qwen-max',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput_cacheRead', rate: 2.4 * 0.2, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textInput', rate: 2.4, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 9.6, strategy: 'fixed', unit: 'millionTokens' },
],
},
settings: {
searchImpl: 'params',
},
type: 'chat',
},
{
abilities: {
functionCall: true,
},
config: {
deploymentName: 'qwen-long-latest',
},
contextWindowTokens: 10_000_000,
description:
'通义千问超大规模语言模型,支持长文本上下文,以及基于长文档、多文档等多个场景的对话功能。',
displayName: 'Qwen Long',
id: 'qwen-long',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 0.5, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
],
},
type: 'chat',
},
{
abilities: {
vision: true,
},
config: {
deploymentName: 'qwen3-omni-flash-2025-09-15',
},
contextWindowTokens: 65_536,
description:
'Qwen-Omni 模型能够接收文本、图片、音频、视频等多种模态的组合输入,并生成文本或语音形式的回复, 提供多种拟人音色,支持多语言和方言的语音输出,可应用于文本创作、视觉识别、语音助手等场景。',
displayName: 'Qwen Omni Turbo',
id: 'qwen3-omni-flash',
maxOutput: 16_384,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 1.8, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 6.9, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-09-15',
settings: {
extendParams: ['enableReasoning', 'reasoningBudgetToken'],
},
type: 'chat',
},
{
abilities: {
vision: true,
},
config: {
deploymentName: 'qwen-omni-turbo-2025-03-26',
},
contextWindowTokens: 32_768,
description:
'Qwen-Omni 系列模型支持输入多种模态的数据,包括视频、音频、图片、文本,并输出音频与文本。',
displayName: 'Qwen Omni Turbo',
id: 'qwen-omni-turbo',
maxOutput: 2048,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 1.5, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 4.5, strategy: 'fixed', unit: 'millionTokens' },
],
},
type: 'chat',
},
{
abilities: {
vision: true,
},
contextWindowTokens: 32_768,
description:
'Qwen-Omni 系列模型支持输入多种模态的数据,包括视频、音频、图片、文本,并输出音频与文本。',
displayName: 'Qwen2.5 Omni 7B',
id: 'qwen2.5-omni-7b',
maxOutput: 2048,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 6, strategy: 'fixed', unit: 'millionTokens' },
],
},
type: 'chat',
},
{
abilities: {
vision: true,
},
config: {
deploymentName: 'qwen-vl-plus-2025-08-15',
},
contextWindowTokens: 131_072,
description:
'通义千问大规模视觉语言模型增强版。大幅提升细节识别能力和文字识别能力,支持超百万像素分辨率和任意长宽比规格的图像。',
displayName: 'Qwen VL Plus',
id: 'qwen-vl-plus',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput_cacheRead', rate: 0.8 * 0.2, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textInput', rate: 0.8, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
],
},
type: 'chat',
},
{
abilities: {
vision: true,
},
config: {
deploymentName: 'qwen-vl-max-2025-08-13',
},
contextWindowTokens: 131_072,
description:
'通义千问超大规模视觉语言模型。相比增强版,再次提升视觉推理能力和指令遵循能力,提供更高的视觉感知和认知水平。',
displayName: 'Qwen VL Max',
id: 'qwen-vl-max',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput_cacheRead', rate: 1.6 * 0.2, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textInput', rate: 1.6, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 4, strategy: 'fixed', unit: 'millionTokens' },
],
},
type: 'chat',
},
{
abilities: {
vision: true,
},
config: {
deploymentName: 'qwen-vl-ocr-2025-04-13',
},
contextWindowTokens: 34_096,
description:
'通义千问OCR是文字提取专有模型,专注于文档、表格、试题、手写体文字等类型图像的文字提取能力。它能够识别多种文字,目前支持的语言有:汉语、英语、法语、日语、韩语、德语、俄语、意大利语、越南语、阿拉伯语。',
displayName: 'Qwen VL OCR',
id: 'qwen-vl-ocr',
maxOutput: 4096,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 5, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 5, strategy: 'fixed', unit: 'millionTokens' },
],
},
type: 'chat',
},
{
abilities: {
vision: true,
reasoning: true,
},
contextWindowTokens: 131_072,
description:
'Qwen-VL(开源版)提供视觉理解与文本生成能力,支持智能体交互、视觉编码、空间感知、长视频理解与深度思考,并在复杂场景下具备更强的文字识别与多语言支持。',
displayName: 'Qwen3 VL 30B A3B Thinking',
id: 'qwen3-vl-30b-a3b-thinking',
maxOutput: 32_768,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 0.75, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 7.5, strategy: 'fixed', unit: 'millionTokens' },
],
},
settings: {
extendParams: ['reasoningBudgetToken'],
},
type: 'chat',
},
{
abilities: {
vision: true,
},
contextWindowTokens: 131_072,
description: 'Qwen3 VL 30B 非思考模式(Instruct),面向普通指令跟随场景,保持较高的多模态理解与生成能力。',
displayName: 'Qwen3 VL 30B A3B Instruct',
id: 'qwen3-vl-30b-a3b-instruct',
maxOutput: 32_768,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 0.75, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' },
],
},
type: 'chat',
},
{
abilities: {
vision: true,
reasoning: true,
},
contextWindowTokens: 131_072,
description: 'Qwen3 VL 8B 思考模式,面向轻量级多模态推理与交互场景,保留长上下文理解能力。',
displayName: 'Qwen3 VL 8B Thinking',
id: 'qwen3-vl-8b-thinking',
maxOutput: 32_768,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 0.5, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 5, strategy: 'fixed', unit: 'millionTokens' },
],
},
type: 'chat',
},
{
abilities: {
vision: true,
},
contextWindowTokens: 131_072,
description: 'Qwen3 VL 8B 非思考模式(Instruct),适合常规多模态生成与识别任务。',
displayName: 'Qwen3 VL 8B Instruct',
id: 'qwen3-vl-8b-instruct',
maxOutput: 32_768,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 0.5, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
],
},
type: 'chat',
},
{
abilities: {
vision: true,
reasoning: true,
},
contextWindowTokens: 131_072,
description: 'Qwen3 VL 235B A22B 思考模式(开源版),针对高难度强推理与长视频理解场景,提供顶尖的视觉+文本推理能力。',
displayName: 'Qwen3 VL 235B A22B Thinking',
id: 'qwen3-vl-235b-a22b-thinking',
maxOutput: 32_768,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 20, strategy: 'fixed', unit: 'millionTokens' },
],
},
settings: {
extendParams: ['enableReasoning', 'reasoningBudgetToken'],
},
type: 'chat',
},
{
abilities: {
vision: true,
},
contextWindowTokens: 131_072,
description: 'Qwen3 VL 235B A22B 非思考模式(Instruct),适用于非思考指令场景,保持强大的视觉理解能力。',
displayName: 'Qwen3 VL 235B A22B Instruct',
id: 'qwen3-vl-235b-a22b-instruct',
maxOutput: 32_768,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 8, strategy: 'fixed', unit: 'millionTokens' },
],
},
type: 'chat',
},
{
config: {
deploymentName: 'qwen-math-turbo-latest',
},
contextWindowTokens: 4096,
description: '通义千问数学模型是专门用于数学解题的语言模型。',
displayName: 'Qwen Math Turbo',
id: 'qwen-math-turbo',
maxOutput: 3072,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 6, strategy: 'fixed', unit: 'millionTokens' },
],
},
type: 'chat',
},
{
config: {
deploymentName: 'qwen-math-plus-latest',
},
contextWindowTokens: 4096,
description: '通义千问数学模型是专门用于数学解题的语言模型。',
displayName: 'Qwen Math Plus',
id: 'qwen-math-plus',
maxOutput: 3072,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 4, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 12, strategy: 'fixed', unit: 'millionTokens' },
],
},
type: 'chat',
},
{
config: {
deploymentName: 'qwen-coder-turbo-latest',
},
contextWindowTokens: 131_072,
description: '通义千问代码模型。',
displayName: 'Qwen Coder Turbo',
id: 'qwen-coder-turbo',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 6, strategy: 'fixed', unit: 'millionTokens' },
],
},
type: 'chat',
},
{
config: {
deploymentName: 'qwen-coder-plus-latest',
},
contextWindowTokens: 131_072,
description: '通义千问代码模型。',
displayName: 'Qwen Coder Plus',
id: 'qwen-coder-plus',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 3.5, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 7, strategy: 'fixed', unit: 'millionTokens' },
],
},
type: 'chat',
},
{
abilities: {
reasoning: true,
search: true,
},
contextWindowTokens: 131_072,
description:
'基于 Qwen2.5-32B 模型训练的 QwQ 推理模型,通过强化学习大幅度提升了模型推理能力。模型数学代码等核心指标(AIME 24/25、LiveCodeBench)以及部分通用指标(IFEval、LiveBench等)达到DeepSeek-R1 满血版水平,各指标均显著超过同样基于 Qwen2.5-32B 的 DeepSeek-R1-Distill-Qwen-32B。',
displayName: 'QwQ 32B',
id: 'qwq-32b',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 6, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-03-06',
settings: {
searchImpl: 'params',
},
type: 'chat',
},
{
abilities: {
reasoning: true,
},
contextWindowTokens: 32_768,
description: 'QwQ模型是由 Qwen 团队开发的实验性研究模型,专注于增强 AI 推理能力。',
displayName: 'QwQ 32B Preview',
id: 'qwq-32b-preview',
maxOutput: 16_384,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 6, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2024-11-28',
type: 'chat',
},
{
abilities: {
reasoning: true,
vision: true,
},
config: {
deploymentName: 'qvq-max-2025-05-15',
},
contextWindowTokens: 131_072,
description:
'通义千问QVQ视觉推理模型,支持视觉输入及思维链输出,在数学、编程、视觉分析、创作以及通用任务上都表现了更强的能力。',
displayName: 'QVQ Max',
id: 'qvq-max',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 8, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 32, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-05-15',
type: 'chat',
},
{
abilities: {
reasoning: true,
vision: true,
},
config: {
deploymentName: 'qvq-plus-2025-05-15',
},
contextWindowTokens: 131_072,
description:
'视觉推理模型。支持视觉输入及思维链输出,继qvq-max模型后推出的plus版本,相较于qvq-max模型,qvq-plus系列模型推理速度更快,效果和成本更均衡。',
displayName: 'QVQ Plus',
id: 'qvq-plus',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 5, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-05-15',
type: 'chat',
},
{
abilities: {
reasoning: true,
vision: true,
},
contextWindowTokens: 32_768,
description:
'QVQ模型是由 Qwen 团队开发的实验性研究模型,专注于提升视觉推理能力,尤其在数学推理领域。',
displayName: 'QVQ 72B Preview',
id: 'qvq-72b-preview',
maxOutput: 16_384,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 12, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 36, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2024-12-25',
type: 'chat',
},
{
abilities: {
functionCall: true,
},
contextWindowTokens: 131_072,
description: '通义千问2.5对外开源的7B规模的模型。',
displayName: 'Qwen2.5 7B',
id: 'qwen2.5-7b-instruct',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 0.5, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 1, strategy: 'fixed', unit: 'millionTokens' },
],
},
type: 'chat',
},
{
abilities: {
functionCall: true,
},
contextWindowTokens: 131_072,
description: '通义千问2.5对外开源的14B规模的模型。',
displayName: 'Qwen2.5 14B',
id: 'qwen2.5-14b-instruct',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 1, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' },
],
},
type: 'chat',
},
{
abilities: {
functionCall: true,
},
contextWindowTokens: 131_072,
description: '通义千问2.5对外开源的32B规模的模型。',
displayName: 'Qwen2.5 32B',
id: 'qwen2.5-32b-instruct',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 6, strategy: 'fixed', unit: 'millionTokens' },
],
},
type: 'chat',
},
{
abilities: {
functionCall: true,
},
contextWindowTokens: 131_072,
description: '通义千问2.5对外开源的72B规模的模型。',
displayName: 'Qwen2.5 72B',
id: 'qwen2.5-72b-instruct',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 4, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 12, strategy: 'fixed', unit: 'millionTokens' },
],
},
type: 'chat',
},
// Long-context (1M-token) variant of the open-source Qwen2.5 14B model.
{
abilities: {
functionCall: true,
},
contextWindowTokens: 1_000_000,
// Description names the 14B size so it agrees with `displayName` and `id`.
description: '通义千问2.5对外开源的14B规模的模型。',
displayName: 'Qwen2.5 14B 1M',
id: 'qwen2.5-14b-instruct-1m',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 1, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-01-27',
type: 'chat',
},
{
contextWindowTokens: 4096,
description: 'Qwen-Math 模型具有强大的数学解题能力。',
displayName: 'Qwen2.5 Math 7B',
id: 'qwen2.5-math-7b-instruct',
maxOutput: 3072,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 1, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
],
},
type: 'chat',
},
// Qwen2.5 Math 72B: math-focused chat model with a 4096-token context window
// and fixed per-million-token pricing in CNY.
{
contextWindowTokens: 4096,
description: 'Qwen-Math 模型具有强大的数学解题能力。',
displayName: 'Qwen2.5 Math 72B',
id: 'qwen2.5-math-72b-instruct',
maxOutput: 3072,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 4, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 12, strategy: 'fixed', unit: 'millionTokens' },
],
},
// NOTE(review): this date is later than every other Qwen2.5 entry nearby
// (latest is 2025-03-24), and the sibling Math 7B entry carries no
// `releasedAt` at all — looks like a stray value; confirm against the
// provider's model list or drop the field.
releasedAt: '2025-07-23',
type: 'chat',
},
{
contextWindowTokens: 131_072,
description: '通义千问代码模型开源版。',
displayName: 'Qwen2.5 Coder 7B',
id: 'qwen2.5-coder-7b-instruct',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 1, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
],
},
type: 'chat',
},
{
contextWindowTokens: 131_072,
description: '通义千问代码模型开源版。',
displayName: 'Qwen2.5 Coder 14B',
id: 'qwen2.5-coder-14b-instruct',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 6, strategy: 'fixed', unit: 'millionTokens' },
],
},
type: 'chat',
},
{
contextWindowTokens: 131_072,
description: '通义千问代码模型开源版。',
displayName: 'Qwen2.5 Coder 32B',
id: 'qwen2.5-coder-32b-instruct',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 6, strategy: 'fixed', unit: 'millionTokens' },
],
},
type: 'chat',
},
{
abilities: {
vision: true,
},
contextWindowTokens: 131_072,
description:
'指令跟随、数学、解题、代码整体提升,万物识别能力提升,支持多样格式直接精准定位视觉元素,支持对长视频文件(最长10分钟)进行理解和秒级别的事件时刻定位,能理解时间先后和快慢,基于解析和定位能力支持操控OS或Mobile的Agent,关键信息抽取能力和Json格式输出能力强,此版本为72B版本,本系列能力最强的版本。',
displayName: 'Qwen2.5 VL 72B',
id: 'qwen2.5-vl-72b-instruct',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 16, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 48, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-01-27',
type: 'chat',
},
{
abilities: {
vision: true,
},
contextWindowTokens: 131_072,
description:
'Qwen2.5VL系列模型,在math和学科问题解答达到了接近Qwen2.5VL-72B的水平,回复风格面向人类偏好进行大幅调整,尤其是数学、逻辑推理、知识问答等客观类query,模型回复详实程度和格式清晰度明显改善。此版本为32B版本。',
displayName: 'Qwen2.5 VL 32B',
id: 'qwen2.5-vl-32b-instruct',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 8, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 24, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-03-24',
type: 'chat',
},
// Qwen2.5 VL 7B: vision-capable chat model, the 7B member of the Qwen2.5 VL series.
{
abilities: {
vision: true,
},
contextWindowTokens: 131_072,
// The closing sentence identifies this card as the 7B version; it must not
// claim to be the 72B / strongest model of the series.
description:
'指令跟随、数学、解题、代码整体提升,万物识别能力提升,支持多样格式直接精准定位视觉元素,支持对长视频文件(最长10分钟)进行理解和秒级别的事件时刻定位,能理解时间先后和快慢,基于解析和定位能力支持操控OS或Mobile的Agent,关键信息抽取能力和Json格式输出能力强,此版本为7B版本。',
displayName: 'Qwen2.5 VL 7B',
id: 'qwen2.5-vl-7b-instruct',
maxOutput: 8192,
organization: 'Qwen',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 5, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-01-27',
type: 'chat',
},
{
abilities: {
reasoning: true,
},
contextWindowTokens: 131_072,
description:
'685B 满血版模型,2025年5月28日发布。DeepSeek-R1 在后训练阶段大规模使用了强化学习技术,在仅有极少标注数据的情况下,极大提升了模型推理能力。在数学、代码、自然语言推理等任务上,性能较高,能力较强。',
displayName: 'DeepSeek R1 0528',
id: 'deepseek-r1-0528',
maxOutput: 16_384,
organization: 'DeepSeek',
pricing: {
currency: 'CNY',
units: [
{ name: 'textInput', rate: 4, strategy: 'fixed', unit: 'millionTokens' },
{ name: 'textOutput', rate: 16, strategy: 'fixed', unit: 'millionTokens' },
],
},
releasedAt: '2025-05-28',
type: 'chat',
},
{
contextWindowTokens: 65_536,
description:
'DeepSeek-V3 为自研 MoE 模型,671B 参数,激活 37B,在 14.8T token 上进行了预训练,在长文本、代码、数学、百科、中文能力上表现优秀。',
displayName: 'DeepSeek V3',
id: 'deepseek-v3',
maxOutput: 8192,
organization: 'DeepSeek',
pricing: {
currency: 'CNY',
units: [
{