Skip to content

Files

Latest commit

b207ae4 · Feb 7, 2025

History

History
195 lines (195 loc) · 10.8 KB

elo.csv

File metadata and controls

195 lines (195 loc) · 10.8 KB
1
modeloverallhardcodingcpmilaunchendsource
2
gemini-2.0-flash-thinking-exp-01-211310138113594.0012025-01
3
gemini-2.0-pro-exp-02-051318138113715.0012025-02
4
gemini-exp-12061321131113685.0012024-11
5
gemini-2.0-flash-thinking-exp-12191308130213434.0012024-122024-12
6
chatgpt-4o-latest-2024112013181340135152024-11https://openai.com/api/pricing/
7
gemini-2.0-flash1286135013480.12025-02
8
deepseek-r11319136713620.272025-01
9
o1-2024-12-17132213701362152024-12
10
o1-preview130313511355152024-09https://openai.com/api/pricing/
11
qwen2.5-max1280134313391.62025-01
12
gemini-2.0-flash-exp1296129113512.0012024-12
13
chatgpt-4o-latest-2024090312911277134752024-082024-11https://openai.com/api/pricing/
14
o3-mini1274136813561.12025-01
15
deepseek-v31274130413160.142024-12
16
gemini-2.0-flash-lite-preview1265131713090.0752025-02
17
claude-3-5-sonnet-2024102212851303132432024-10
18
step-2-16k-exp-2024121250129412952024-12
19
gemini-exp-11141268127213255.0012024-112024-12
20
glm-4-plus-0111124912831290
21
gemini-1.5-pro-00212681295128952024-10
22
gpt-4o-2024-05-131263128412922.52024-09
23
claude-3-5-sonnet-2024062012591279129432024-06
24
o1-mini12561335135332024-09https://openai.com/api/pricing/
25
gemini-advanced-05141254125312542024-05
26
qwen2.5-plus-11271231129913022024-12
27
llama-3.1-405b-instruct-fp81252126612752.752024-07https://openrouter.ai/meta-llama/llama-3.1-405b-instruct
28
deepseek-v2.5-12101240129012960.142024-12
29
llama-3.1-405b-instruct-bf1612531268127822024-06https://openrouter.ai/models/meta-llama/llama-3.1-405b
30
gpt-4o-2024-08-061250126612732.52024-08https://openai.com/api/pricing/
31
grok-2-2024-08-1312491273128252024-09https://openrouter.ai/x-ai/grok-2
32
yi-lightning1246129913022024-10
33
gpt-4-turbo-2024-04-09124212541262102024-04https://openai.com/api/pricing/
34
gemini-1.5-pro-0011241125812623.52024-05https://ai.google.dev/pricing
35
claude-3-opus-20240229123812451250152024-02
36
yi-lightning-lite1238123512662024-10
37
claude-3-5-haiku-202410221232124612630.82024-11
38
glm-4-plus1235127312830.332024-10https://open.bigmodel.cn/pricing
39
gpt-4-1106-preview123412461252102023-11https://openai.com/api/pricing/
40
athene-v2-chat1230129212992024-12
41
gpt-4o-mini-2024-07-181235126812840.152024-07https://openai.com/api/pricing/
42
qwen-max-09191231127212792024-09
43
llama-3.3-70b-instruct1234126012580.132024-12https://openrouter.ai/meta-llama/llama-3.3-70b-instruct
44
mistral-large-240712311259126922024-07https://openrouter.ai/models/mistralai/mistral-large
45
gpt-4-0125-preview123112411243102024-01https://openai.com/api/pricing/
46
gemini-1.5-flash-0021229125812530.0752024-10
47
deepseek-v2.51226127212870.142024-08https://openrouter.ai/models/deepseek/deepseek-chat
48
grok-2-mini-2024-08-131224125812612024-08
49
qwen2.5-72b-instruct1222127012820.352024-09https://openrouter.ai/models/qwen/qwen-2.5-72b-instruct
50
athene-70b-07251223124712532024-07
51
mistral-large-241112171248126222024-11
52
amazon-nova-pro-v1.01208124012580.82024-11
53
llama-3.1-nemotron-70b-instruct1216126512700.352024-10https://openrouter.ai/nvidia/llama-3.1-nemotron-70b-instruct
54
llama-3.1-tulu-3-70b120812231231
55
llama-3.1-70b-instruct1214124312510.522024-06https://openrouter.ai/models/meta-llama/llama-3.1-70b-instruct
56
yi-large-preview1206120612452024-07
57
reka-core-202409041207121512212024-09
58
gemma-2-27b-it1207120412090.272024-06https://openrouter.ai/models/google/gemma-2-27b-it
59
qwen-plus-08281206120912452024-08
60
reka-core-202407221204118612082024-07
61
jamba-1.5-large12051219122722024-08https://openrouter.ai/models/ai21/jamba-1-5-large
62
gemini-1.5-flash-0011204122412310.0752024-08https://ai.google.dev/pricing
63
llama-3.1-nemotron-51b-instruct1203120612100.352024-10https://openrouter.ai/nvidia/llama-3.1-nemotron-70b-instruct
64
amazon-nova-lite-v1.01184122212340.062024-11
65
deepseek-v2-api-06281202121112410.142024-06
66
gpt-4-0314119911951195302024-03https://platform.openai.com/docs/deprecations/
67
gemma-2-9b-it-simpo119912031196
68
phi-41179122812402024-11
69
claude-3-sonnet-2024022911971199121232024-02
70
command-r-plus-08-20241197118811812024-08
71
deepseek-coder-v2-07241197121012660.142024-07
72
nemotron-4-340b-instruct1196120211984.22024-06https://openrouter.ai/models/nvidia/nemotron-4-340b-instruct
73
c4ai-aya-expanse-32b1185119711922024-11
74
yi-large11941185121932023-10https://openrouter.ai/models/01-ai/yi-large
75
llama-3-70b-instruct1195119711990.592024-04https://openrouter.ai/models/meta-llama/llama-3-70b-instruct
76
qwen2.5-coder-32b-instruct1189125612602024-10
77
reka-flash-202409041192118511902024-09
78
glm-4-05201188121312160.662024-05https://open.bigmodel.cn/pricing
79
gpt-4-0613118511671166302024-06https://platform.openai.com/docs/deprecations/
80
llama-3.1-tulu-3-8b1146117911782025-01
81
command-r-plus11821168116432024-01
82
deepseek-coder-v21182121112390.142024-07https://openrouter.ai/models/deepseek/deepseek-coder
83
reka-flash-202407221180116511862024-07
84
qwen2-72b-instruct1180118811860.342024-06https://openrouter.ai/qwen/qwen-2-72b-instruct
85
gemini-1.5-flash-8b-0011179121212070.03752024-10
86
amazon-nova-micro-v1.01163119712110.0352024-11
87
gemma-2-9b-it1180117311730.22024-06https://openrouter.ai/models/google/gemma-2-9b-it
88
reka-core-202405011177116811892024-05
89
claude-3-haiku-202403071177117811890.252024-03
90
command-r-08-20241175116911612024-08
91
gemini-1.5-flash-8b-exp-08271172116211892024-08
92
qwen-max-04281171116811892024-04
93
c4ai-aya-expanse-8b1150116211652024-11
94
glm-4-01161162116511902024-01
95
ministral-8b-24101159119812010.12024-10https://openrouter.ai/mistralai/ministral-8b
96
jamba-1.5-mini1160116811800.22024-08https://openrouter.ai/models/ai21/jamba-1-5-mini
97
claude-111581134113582023-03
98
mistral-large-240211571165116982023-11
99
qwen1.5-110b-chat1155116811741.622024-04https://openrouter.ai/models/qwen/qwen-110b-chat
100
hunyuan-standard-256k115212201226
101
reka-flash-preview-202406111151113611552024-08
102
granite-3.1-8b-instruct1134114811712024-11
103
reka-flash-21b-20240226-online1151114211462024-02
104
mixtral-8x22b-instruct-v0.11149114811520.72024-05
105
mistral-next114911471132
106
command-r1147111911220.52023-12
107
qwen1.5-72b-chat1148114611590.812024-01https://openrouter.ai/models/qwen/qwen-72b-chat
108
gemini-pro-dev-api1147110511020.52024-01https://ai.google.dev/pricing
109
claude-2.011451140113482023-07
110
granite-3.1-2b-instruct1103114311462024-11
111
llama-3-8b-instruct1142113711450.052024-04
112
reka-flash-21b-202402261141113311412024-02
113
mistral-medium1141114411522.72023-11
114
gpt-3.5-turbo-03141141113811140.52023-03
115
gpt-3.5-turbo-01251137111211230.52024-01
116
qwq-32b-preview1088117411462024-11
117
gpt-3.5-turbo-06131136113411341.52023-06https://openai.com/api/pricing/
118
claude-2.111341135113182023-11
119
yi-1.5-34b-chat1133116011622024-05
120
llama-3.1-8b-instruct1133118211860.062024-06https://openrouter.ai/models/meta-llama/llama-3.1-8b-instruct
121
gemini-pro1131108310910.52023-12https://ai.google.dev/pricing
122
zephyr-orpo-141b-A35b-v0.1113011161124
123
qwen1.5-32b-chat1126113511490.722023-11https://openrouter.ai/models/qwen/qwen-32b-chat
124
claude-instant-11127112311080.82023-03
125
phi-3-medium-4k-instruct111811291125https://openrouter.ai/microsoft/phi-3-medium-4k-instruct
126
internlm2_5-20b-chat111611641157
127
gemma-2-2b-it1117111811060.062024-06https://openrouter.ai/google/gemma-2-9b-it
128
mixtral-8x7b-instruct-v0.11114111411140.32024-03
129
dbrx-instruct-preview111311091117
130
granite-3.0-8b-instruct1109110910972024-11
131
gpt-3.5-turbo-11061109109010940.52023-11
132
qwen1.5-14b-chat1106111611250.272023-09https://openrouter.ai/models/qwen/qwen-14b-chat
133
wizardlm-70b110410771071
134
snowflake-arctic-instruct1102107310762.162023-12https://openrouter.ai/models/snowflake/snowflake-arctic-instruct
135
yi-34b-chat1101110211060.722023-11https://openrouter.ai/models/01-ai/yi-34b-chat
136
openchat-3.5-01061100108311010.132024-01
137
phi-3-small-8k-instruct109811071107
138
gemma-1.1-7b-it1099107610840.12024-04
139
openchat-3.51094106510530.132024-01
140
llama-3.2-3b-instruct109311021080
141
tulu-2-dpo-70b109210981093
142
starling-lm-7b-beta1091111911292024-03
143
vicuna-33b109110661067
144
deepseek-llm-67b-chat109010651079
145
openhermes-2.5-mistral-7b108910681057
146
smollm2-1.7b-instruct1051107810432025-01
147
starling-lm-7b-alpha108310721079
148
llama-2-70b-chat1081107010720.642023-07
149
granite-3.0-2b-instruct1081108910872024-11
150
pplx-70b-online10761029102812024-02
151
llama2-70b-steerlm-chat1073104510222023-07
152
nous-hermes-2-mixtral-8x7b-dpo107110521079
153
dolphin-2.2.1-mistral-7b106810501024
154
mistral-7b-instruct-v0.21067106810730.062023-12
155
phi-3-mini-4k-instruct-june-2024106810951081
156
qwen1.5-7b-chat1065106710890.182023-09https://openrouter.ai/models/qwen/qwen-7b-chat
157
solar-10.7b-instruct-v1.0106510561047
158
wizardlm-13b106310131025
159
mpt-30b-chat106010471030
160
falcon-180b-chat105810001017
161
vicuna-13b105810251032
162
qwen-14b-chat105610231056
163
phi-3-mini-4k-instruct1055107810852024-05
164
llama-2-13b-chat1054104910510.12023-07
165
zephyr-7b-beta104910261030
166
phi-3-mini-128k-instruct1048103510292024-05
167
codellama-34b-instruct104710271041
168
gemma-7b-it1048104510460.12024-04
169
zephyr-7b-alpha104610221034
170
llama-3.2-1b-instruct104510581046
171
palm-210421000990
172
pplx-7b-online1041101710140.22024-02
173
guanaco-33b10391000965
174
gemma-1.1-2b-it1040101510352024-04
175
codellama-70b-instruct103710511047
176
stripedhyena-nous-7b1033995999
177
mistral-7b-instruct1026100210070.112023-09
178
llama-2-7b-chat1024100910020.562023-07
179
vicuna-7b1021989981
180
qwen1.5-4b-chat10149779900.092023-09https://openrouter.ai/models/qwen/qwen-4b-chat
181
gemma-2b-it10089871000
182
olmo-7b-instruct9939941017
183
koala-13b979924937
184
chatglm3-6b974952953
185
gpt4all-13b-snoozy971930909
186
mpt-7b-chat967891899
187
alpaca-13b966818789
188
RWKV-4-Raven-14B948890896
189
chatglm2-6b942914892
190
oasst-pythia-12b930880873
191
fastchat-t5-3b896808759
192
chatglm-6b887893883
193
dolly-v2-12b880797746
194
llama-13b866723669
195
stablelm-tuned-alpha-7b858830858