Spaces:
Running
Running
File size: 1,299 Bytes
b866cfe |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 |
{
"config": {
"model_name": "OpenAI-gpt-4o"
},
"results": {
"Overall": {
"CR": "99.8",
"S-Acc": "43.7",
"EM": "3.2",
"PM-0.5": "41.7",
"Tokens": "1486"
},
"Acrostic": {
"CR": "100.0",
"S-Acc": "56.0",
"EM": "0.0",
"PM-0.5": "67.0",
"Tokens": "3229"
},
"Crossword": {
"CR": "100.0",
"S-Acc": "66.0",
"EM": "1.3",
"PM-0.5": "86.7",
"Tokens": "1726"
},
"Cryptogram": {
"CR": "100.0",
"S-Acc": "20.7",
"EM": "0.0",
"PM-0.5": "5.0",
"Tokens": "740"
},
"Logic_Puzzle": {
"CR": "100.0",
"S-Acc": "39.3",
"EM": "3.5",
"PM-0.5": "29.5",
"Tokens": "953"
},
"Sudoku": {
"CR": "100.0",
"S-Acc": "52.2",
"EM": "14.5",
"PM-0.5": "48.0",
"Tokens": "1104"
},
"Drop_Quote": {
"CR": "99.0",
"S-Acc": "31.1",
"EM": "0.0",
"PM-0.5": "14.0",
"Tokens": "1165"
}
}
} |