gemma-4-E4B-it-Coder / executable_eval.json
josephmayo's picture
Upload proof executable_eval.json
396932b verified
{
"before_pass": 5,
"after_pass": 7,
"total": 8,
"rows": [
{
"phase": "before",
"task_id": "HumanEval/0",
"entry_point": "has_close_elements",
"passed": false,
"error": "Traceback (most recent call last):\n File \"C:\\Users\\USER\\AppData\\Local\\Temp\\tmp6oy5omdq.py\", line 8, in <module>\n exec(code, ns)\n ~~~~^^^^^^^^^^\n File \"<string>\", line 17\n if sorted_numbers[i+1] - sorted_numbers[i\n ^\nSyntaxError: '[' was never closed\n",
"chars": 526
},
{
"phase": "after",
"task_id": "HumanEval/0",
"entry_point": "has_close_elements",
"passed": true,
"error": null,
"chars": 495
},
{
"phase": "before",
"task_id": "HumanEval/1",
"entry_point": "separate_paren_groups",
"passed": false,
"error": "Traceback (most recent call last):\n File \"C:\\Users\\USER\\AppData\\Local\\Temp\\tmpbgx0dlv4.py\", line 10, in <module>\n ns[\"check\"](ns[entry_point])\n ~~~~~~~~~~~^^^^^^^^^^^^^^^^^\n File \"<string>\", line 10, in check\nAssertionError\n",
"chars": 745
},
{
"phase": "after",
"task_id": "HumanEval/1",
"entry_point": "separate_paren_groups",
"passed": true,
"error": null,
"chars": 455
},
{
"phase": "before",
"task_id": "HumanEval/2",
"entry_point": "truncate_number",
"passed": true,
"error": null,
"chars": 360
},
{
"phase": "after",
"task_id": "HumanEval/2",
"entry_point": "truncate_number",
"passed": true,
"error": null,
"chars": 363
},
{
"phase": "before",
"task_id": "HumanEval/3",
"entry_point": "below_zero",
"passed": true,
"error": null,
"chars": 590
},
{
"phase": "after",
"task_id": "HumanEval/3",
"entry_point": "below_zero",
"passed": true,
"error": null,
"chars": 590
},
{
"phase": "before",
"task_id": "HumanEval/4",
"entry_point": "mean_absolute_deviation",
"passed": true,
"error": null,
"chars": 632
},
{
"phase": "after",
"task_id": "HumanEval/4",
"entry_point": "mean_absolute_deviation",
"passed": true,
"error": null,
"chars": 530
},
{
"phase": "before",
"task_id": "HumanEval/5",
"entry_point": "intersperse",
"passed": true,
"error": null,
"chars": 486
},
{
"phase": "after",
"task_id": "HumanEval/5",
"entry_point": "intersperse",
"passed": true,
"error": null,
"chars": 455
},
{
"phase": "before",
"task_id": "HumanEval/6",
"entry_point": "parse_nested_parens",
"passed": false,
"error": "Traceback (most recent call last):\n File \"C:\\Users\\USER\\AppData\\Local\\Temp\\tmpx0bb66c4.py\", line 8, in <module>\n exec(code, ns)\n ~~~~^^^^^^^^^^\n File \"<string>\", line 21\n max_depth = max(max_depth\n ^\nSyntaxError: '(' was never closed\n",
"chars": 692
},
{
"phase": "after",
"task_id": "HumanEval/6",
"entry_point": "parse_nested_parens",
"passed": false,
"error": "Traceback (most recent call last):\n File \"C:\\Users\\USER\\AppData\\Local\\Temp\\tmpn7um62g2.py\", line 8, in <module>\n exec(code, ns)\n ~~~~^^^^^^^^^^\n File \"<string>\", line 20\n max_depth = max(max_depth\n ^\nSyntaxError: '(' was never closed\n",
"chars": 691
},
{
"phase": "before",
"task_id": "HumanEval/7",
"entry_point": "filter_by_substring",
"passed": true,
"error": null,
"chars": 379
},
{
"phase": "after",
"task_id": "HumanEval/7",
"entry_point": "filter_by_substring",
"passed": true,
"error": null,
"chars": 379
}
]
}