[
  {
    "Model": "Llama-3.1-8B-Instruct",
    "CR": "61.3",
    "S-Acc": "23.3",
    "EM": "0.0",
    "PM-0.5": "14.0",
    "Tokens": "2888"
  },
  {
    "Model": "Llama-3.1-70B-Instruct",
    "CR": "77.3",
    "S-Acc": "46.8",
    "EM": "0.0",
    "PM-0.5": "62.0",
    "Tokens": "3072"
  },
  {
    "Model": "Llama-3.3-70B-Instruct",
    "CR": "85.3",
    "S-Acc": "47.6",
    "EM": "0.0",
    "PM-0.5": "65.3",
    "Tokens": "2613"
  },
  {
    "Model": "Mistral-7B-Instruct-v0.3",
    "CR": "94.0",
    "S-Acc": "23.0",
    "EM": "0.0",
    "PM-0.5": "6.7",
    "Tokens": "3655"
  },
  {
    "Model": "Mistral-Small-Instruct-2409",
    "CR": "98.7",
    "S-Acc": "48.3",
    "EM": "0.0",
    "PM-0.5": "54.0",
    "Tokens": "3135"
  },
  {
    "Model": "Mistral-Large-Instruct-2411",
    "CR": "99.3",
    "S-Acc": "62.8",
    "EM": "2.0",
    "PM-0.5": "86.0",
    "Tokens": "3237"
  },
  {
    "Model": "Qwen2.5-7B-Instruct",
    "CR": "98.7",
    "S-Acc": "21.1",
    "EM": "0.0",
    "PM-0.5": "3.3",
    "Tokens": "2441"
  },
  {
    "Model": "Qwen2.5-32B-Instruct",
    "CR": "100.0",
    "S-Acc": "34.6",
    "EM": "0.0",
    "PM-0.5": "20.0",
    "Tokens": "2560"
  },
  {
    "Model": "Qwen2.5-72B-Instruct",
    "CR": "100.0",
    "S-Acc": "44.1",
    "EM": "0.0",
    "PM-0.5": "36.7",
    "Tokens": "2735"
  },
  {
    "Model": "QwQ-32B-Preview",
    "CR": "80.0",
    "S-Acc": "30.2",
    "EM": "0.0",
    "PM-0.5": "18.0",
    "Tokens": "4817"
  },
  {
    "Model": "DeepSeek-R1",
    "CR": "100.0",
    "S-Acc": "75.3",
    "EM": "16.7",
    "PM-0.5": "94.0",
    "Tokens": "9810"
  },
  {
    "Model": "Gemini-2.0-flash",
    "CR": "98.7",
    "S-Acc": "61.6",
    "EM": "0.0",
    "PM-0.5": "83.3",
    "Tokens": "2555"
  },
  {
    "Model": "Gemini-2.0-flash-thinking",
    "CR": "94.7",
    "S-Acc": "57.7",
    "EM": "1.3",
    "PM-0.5": "79.3",
    "Tokens": "2648"
  },
  {
    "Model": "OpenAI-gpt-4o",
    "CR": "100.0",
    "S-Acc": "66.0",
    "EM": "1.3",
    "PM-0.5": "86.7",
    "Tokens": "1726"
  },
  {
    "Model": "OpenAI-o1-mini",
    "CR": "95.3",
    "S-Acc": "45.5",
    "EM": "1.3",
    "PM-0.5": "54.0",
    "Tokens": "7840"
  },
  {
    "Model": "OpenAI-o1-preview",
    "CR": "98.0",
    "S-Acc": "77.7",
    "EM": "24.7",
    "PM-0.5": "89.3",
    "Tokens": "10098"
  }
]