Qwen1.5-110B
Meta-Llama-3-70B
Mixtral-8x22B-v0.1
Qwen1.5-72B
DeepSeek-V2
Qwen1.5-32B
dbrx-base
Qwen1.5-14B
deepseek-llm-67b-base
Mixtral-8x7B-v0.1
Qwen1.5-7B
gemma-7b
llama2_70B
Meta-Llama-3-8B
Qwen1.5-4B
llama_65B
Mistral-7B-v0.1
llama2_13B
Qwen1.5-1.8B
llama_33B
falcon-40b
llama2_07B
mpt-30b
Qwen1.5-0.5B
gemma-2b
deepseek-moe-16b-base
llama_13B
deepseek-llm-7b-base
llama_07B
stablelm-3b-4e1t
falcon-7b
stablelm-base-alpha-7b-v2
pythia-12b-deduped-v0
pythia-2.8b-deduped
pythia-6.9b-deduped-v0
pythia-1.4b-deduped-v0
pythia-1b-deduped
gsm8k/1035
gsm8k/823
gsm8k/652
gsm8k/368
gsm8k/1133
gsm8k/7
gsm8k/147
gsm8k/107
gsm8k/606
gsm8k/1092
gsm8k/392
gsm8k/1258
gsm8k/789
gsm8k/135
gsm8k/622
gsm8k/1235
gsm8k/534
gsm8k/1052
gsm8k/442
gsm8k/924
gsm8k/1294
gsm8k/577
gsm8k/1038
gsm8k/363
gsm8k/798
gsm8k/211
gsm8k/810
gsm8k/1164
gsm8k/411
gsm8k/78
gsm8k/1284
gsm8k/639
gsm8k/1123
gsm8k/401
gsm8k/91
gsm8k/165
gsm8k/612
gsm8k/1024
gsm8k/356
gsm8k/865
gsm8k/170
gsm8k/733
gsm8k/1230
gsm8k/719
gsm8k/1285
gsm8k/592
gsm8k/1296
gsm8k/730
gsm8k/3
gsm8k/848
gsm8k/447
gsm8k/268
gsm8k/998
gsm8k/543
gsm8k/134
gsm8k/462
gsm8k/947
gsm8k/907
0
0.2
0.4
0.6
0.8
1
pass1_ex
model
example_id
plotly-logomark