-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathmodels.yml
More file actions
129 lines (123 loc) · 3.01 KB
/
models.yml
File metadata and controls
129 lines (123 loc) · 3.01 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
---
# Provider/model catalog: a single provider ("Alibaba") and the seven models
# it exposes through one OpenAI-completions-style endpoint.
# NOTE(review): cost figures look like USD per 1M tokens - the display names
# quote the output price (e.g. "$15/1m" next to `output: 15`); confirm against
# the consuming tool's schema.
providers:
  Alibaba:
    baseUrl: "https://coding-intl.dashscope.aliyuncs.com/v1"
    api: openai-completions
    # Blank in this file. NOTE(review): confirm how the consumer resolves an
    # empty key, and keep the real secret out of version control.
    apiKey: ""
    auth: apiKey
    authHeader: true
    # NOTE(review): every entry below, including the non-Qwen models, sets
    # `thinkingFormat: qwen` - presumably because all are served by the same
    # endpoint; verify per model.
    models:
      - id: qwen3-max-2026-01-23
        name: "qwen3-max-2026-01-23 - smartest, $15/1m"
        reasoning: true
        input:
          - text
        cost:
          input: 3
          output: 15
          cacheRead: 3
          cacheWrite: 3.75
        contextWindow: 262144
        maxTokens: 65536
        compat:
          supportsDeveloperRole: false
          supportsReasoningEffort: true
          thinkingFormat: qwen

      - id: qwen3.5-plus
        name: "qwen3.5-plus - 1m context! vision, $3/1m"
        reasoning: true
        input:
          - text
          - image
        cost:
          input: 0.5
          output: 3
          # NOTE(review): cacheRead (0.6) is higher than the plain input
          # price (0.5) - looks like a typo; verify against provider pricing.
          cacheRead: 0.6
          cacheWrite: 0.625
        contextWindow: 1000000
        maxTokens: 65536
        compat:
          supportsDeveloperRole: false
          supportsReasoningEffort: true
          thinkingFormat: qwen

      - id: qwen3-coder-next
        name: "qwen3-coder-next - fastest $4/1m"
        reasoning: true
        input:
          - text
        cost:
          input: 0.8
          output: 4
          cacheRead: 0
          cacheWrite: 0
        contextWindow: 262144
        maxTokens: 65536
        compat:
          supportsDeveloperRole: false
          supportsReasoningEffort: true
          thinkingFormat: qwen

      - id: glm-4.7
        name: "glm-4.7"
        reasoning: true
        # NOTE(review): confirm this model really accepts image input on this
        # endpoint; the other GLM entry (glm-5) is text-only.
        input:
          - text
          - image
        cost:
          input: 0.431
          output: 3.154
          cacheRead: 0
          cacheWrite: 0
        contextWindow: 202752
        maxTokens: 16384
        compat:
          supportsDeveloperRole: false
          supportsReasoningEffort: true
          thinkingFormat: qwen

      - id: glm-5
        name: "glm-5"
        reasoning: true
        input:
          - text
        cost:
          input: 0.573
          output: 0.86
          cacheRead: 0.0573
          cacheWrite: 0.573
        contextWindow: 202752
        maxTokens: 16384
        compat:
          supportsDeveloperRole: false
          supportsReasoningEffort: true
          thinkingFormat: qwen

      - id: MiniMax-M2.5
        name: "MiniMax-M2.5"
        reasoning: true
        input:
          - text
        # NOTE(review): all four prices are 0 - confirm whether this model is
        # actually free or the values are placeholders.
        cost:
          input: 0
          output: 0
          cacheRead: 0
          cacheWrite: 0
        contextWindow: 196608
        maxTokens: 32768
        compat:
          supportsDeveloperRole: false
          supportsReasoningEffort: true
          thinkingFormat: qwen

      - id: kimi-k2.5
        name: "kimi-k2.5"
        reasoning: true
        input:
          - text
          - image
        cost:
          input: 0.574
          output: 3.011
          cacheRead: 0.0574
          cacheWrite: 0.7175
        contextWindow: 262144
        maxTokens: 32768
        compat:
          supportsDeveloperRole: false
          supportsReasoningEffort: true
          thinkingFormat: qwen