[ { "Model": "Llama-3.1-8B-Instruct", "CR": "43.0", "S-Acc": "5.6", "EM": "0.0", "PM-0.5": "0.0", "Tokens": "3712" }, { "Model": "Llama-3.1-70B-Instruct", "CR": "84.0", "S-Acc": "35.8", "EM": "0.0", "PM-0.5": "21.0", "Tokens": "3565" }, { "Model": "Llama-3.3-70B-Instruct", "CR": "97.0", "S-Acc": "40.8", "EM": "0.0", "PM-0.5": "28.0", "Tokens": "3584" }, { "Model": "Mistral-7B-Instruct-v0.3", "CR": "75.0", "S-Acc": "7.9", "EM": "0.0", "PM-0.5": "0.0", "Tokens": "4600" }, { "Model": "Mistral-Small-Instruct-2409", "CR": "67.0", "S-Acc": "5.5", "EM": "0.0", "PM-0.5": "0.0", "Tokens": "4171" }, { "Model": "Mistral-Large-Instruct-2411", "CR": "98.0", "S-Acc": "39.4", "EM": "0.0", "PM-0.5": "20.0", "Tokens": "4279" }, { "Model": "Qwen2.5-7B-Instruct", "CR": "42.0", "S-Acc": "3.6", "EM": "0.0", "PM-0.5": "0.0", "Tokens": "4159" }, { "Model": "Qwen2.5-32B-Instruct", "CR": "100.0", "S-Acc": "31.8", "EM": "0.0", "PM-0.5": "2.0", "Tokens": "4073" }, { "Model": "Qwen2.5-72B-Instruct", "CR": "100.0", "S-Acc": "39.3", "EM": "0.0", "PM-0.5": "18.0", "Tokens": "4111" }, { "Model": "QwQ-32B-Preview", "CR": "97.0", "S-Acc": "31.6", "EM": "0.0", "PM-0.5": "6.0", "Tokens": "4964" }, { "Model": "DeepSeek-R1", "CR": "100.0", "S-Acc": "62.2", "EM": "0.0", "PM-0.5": "83.0", "Tokens": "10077" }, { "Model": "Gemini-2.0-flash", "CR": "98.0", "S-Acc": "48.0", "EM": "0.0", "PM-0.5": "48.0", "Tokens": "4020" }, { "Model": "Gemini-2.0-flash-thinking", "CR": "92.0", "S-Acc": "40.7", "EM": "0.0", "PM-0.5": "27.0", "Tokens": "4257" }, { "Model": "OpenAI-gpt-4o", "CR": "100.0", "S-Acc": "56.0", "EM": "0.0", "PM-0.5": "67.0", "Tokens": "3229" }, { "Model": "OpenAI-o1-mini", "CR": "97.0", "S-Acc": "34.7", "EM": "0.0", "PM-0.5": "12.0", "Tokens": "10952" }, { "Model": "OpenAI-o1-preview", "CR": "100.0", "S-Acc": "67.2", "EM": "0.0", "PM-0.5": "90.0", "Tokens": "14847" } ]