Spaces:
Running
Running
[ | |
{ | |
"Model": "Llama-3.1-8B-Instruct", | |
"CR": "42.6", | |
"S-Acc": "9.9", | |
"EM": "0.0", | |
"PM-0.5": "3.8", | |
"Tokens": "2478" | |
}, | |
{ | |
"Model": "Llama-3.1-70B-Instruct", | |
"CR": "71.8", | |
"S-Acc": "27.4", | |
"EM": "0.5", | |
"PM-0.5": "21.9", | |
"Tokens": "2090" | |
}, | |
{ | |
"Model": "Llama-3.3-70B-Instruct", | |
"CR": "92.4", | |
"S-Acc": "33.1", | |
"EM": "1.3", | |
"PM-0.5": "25.8", | |
"Tokens": "1842" | |
}, | |
{ | |
"Model": "Mistral-7B-Instruct-v0.3", | |
"CR": "85.8", | |
"S-Acc": "12.1", | |
"EM": "0.0", | |
"PM-0.5": "2.3", | |
"Tokens": "2736" | |
}, | |
{ | |
"Model": "Mistral-Small-Instruct-2409", | |
"CR": "91.0", | |
"S-Acc": "23.1", | |
"EM": "0.2", | |
"PM-0.5": "13.3", | |
"Tokens": "2273" | |
}, | |
{ | |
"Model": "Mistral-Large-Instruct-2411", | |
"CR": "96.1", | |
"S-Acc": "36.4", | |
"EM": "2.5", | |
"PM-0.5": "30.0", | |
"Tokens": "2313" | |
}, | |
{ | |
"Model": "Qwen2.5-7B-Instruct", | |
"CR": "85.1", | |
"S-Acc": "17.7", | |
"EM": "0.3", | |
"PM-0.5": "5.1", | |
"Tokens": "2086" | |
}, | |
{ | |
"Model": "Qwen2.5-32B-Instruct", | |
"CR": "96.2", | |
"S-Acc": "29.9", | |
"EM": "0.6", | |
"PM-0.5": "14.8", | |
"Tokens": "1924" | |
}, | |
{ | |
"Model": "Qwen2.5-72B-Instruct", | |
"CR": "95.0", | |
"S-Acc": "33.9", | |
"EM": "0.9", | |
"PM-0.5": "20.8", | |
"Tokens": "2359" | |
}, | |
{ | |
"Model": "QwQ-32B-Preview", | |
"CR": "65.0", | |
"S-Acc": "26.6", | |
"EM": "8.5", | |
"PM-0.5": "19.3", | |
"Tokens": "6709" | |
}, | |
{ | |
"Model": "DeepSeek-R1", | |
"CR": "100.0", | |
"S-Acc": "58.4", | |
"EM": "20.0", | |
"PM-0.5": "62.0", | |
"Tokens": "9856" | |
}, | |
{ | |
"Model": "Gemini-2.0-flash", | |
"CR": "81.1", | |
"S-Acc": "37.0", | |
"EM": "2.4", | |
"PM-0.5": "34.5", | |
"Tokens": "2637" | |
}, | |
{ | |
"Model": "Gemini-2.0-flash-thinking", | |
"CR": "88.2", | |
"S-Acc": "39.4", | |
"EM": "4.3", | |
"PM-0.5": "35.0", | |
"Tokens": "3725" | |
}, | |
{ | |
"Model": "OpenAI-gpt-4o", | |
"CR": "99.8", | |
"S-Acc": "43.7", | |
"EM": "3.2", | |
"PM-0.5": "41.7", | |
"Tokens": "1486" | |
}, | |
{ | |
"Model": "OpenAI-o1-mini", | |
"CR": "97.7", | |
"S-Acc": "41.3", | |
"EM": "9.1", | |
"PM-0.5": "32.8", | |
"Tokens": "9576" | |
}, | |
{ | |
"Model": "OpenAI-o1-preview", | |
"CR": "96.3", | |
"S-Acc": "58.7", | |
"EM": "23.6", | |
"PM-0.5": "61.7", | |
"Tokens": "11436" | |
} | |
] |