LR2Bench / results /Qwen2.5-7B-Instruct.json
UltraRonin's picture
add
f5894fd
{
"config": {
"model_name": "Qwen/Qwen2.5-7B-Instruct",
"link": "https://huggingface.co/Qwen/Qwen2.5-7B-Instruct",
"Params": 7
},
"results": {
"Overall": {
"CR": "85.1",
"S-Acc": "17.7",
"EM": "0.3",
"PM-0.5": "5.1",
"Tokens": "2086"
},
"Acrostic": {
"CR": "42.0",
"S-Acc": "3.6",
"EM": "0.0",
"PM-0.5": "0.0",
"Tokens": "4159"
},
"Crossword": {
"CR": "98.7",
"S-Acc": "21.1",
"EM": "0.0",
"PM-0.5": "3.3",
"Tokens": "2441"
},
"Cryptogram": {
"CR": "81.0",
"S-Acc": "3.5",
"EM": "0.0",
"PM-0.5": "0.0",
"Tokens": "1181"
},
"Logic_Puzzle": {
"CR": "96.5",
"S-Acc": "25.8",
"EM": "0.0",
"PM-0.5": "8.5",
"Tokens": "1396"
},
"Sudoku": {
"CR": "94.5",
"S-Acc": "30.2",
"EM": "1.5",
"PM-0.5": "15.0",
"Tokens": "1486"
},
"Drop_Quote": {
"CR": "98.0",
"S-Acc": "21.9",
"EM": "0.0",
"PM-0.5": "4.0",
"Tokens": "1852"
}
}
}