readctrl / results /qwen3-8B_subclaims_verifier_test_predictions.jsonl
shahidul034's picture
Add files using upload-large-folder tool
c29669c verified
{"index": 0, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 1, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 2, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 3, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 4, "label": "supported", "prediction": "not_supported", "correct": false, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 5, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 6, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 7, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 8, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 9, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 10, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 11, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 12, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 13, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 14, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 15, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 16, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 17, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 18, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 19, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 20, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 21, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 22, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 23, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 24, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 25, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 26, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 27, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 28, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 29, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 30, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 31, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 32, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 33, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 34, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 35, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 36, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 37, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 38, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 39, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 40, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 41, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 42, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 43, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 44, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 45, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 46, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 47, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 48, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 49, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 50, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 51, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 52, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 53, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 54, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 55, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 56, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 57, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 58, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 59, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 60, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 61, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 62, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 63, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 64, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 65, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 66, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 67, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 68, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 69, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 70, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 71, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 72, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 73, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 74, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 75, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 76, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 77, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 78, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 79, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 80, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 81, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 82, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 83, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 84, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 85, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 86, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 87, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 88, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 89, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 90, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 91, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 92, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 93, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 94, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 95, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 96, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 97, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 98, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 99, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 100, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 101, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 102, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 103, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 104, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 105, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 106, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 107, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 108, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 109, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 110, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 111, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 112, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 113, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 114, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 115, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 116, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 117, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 118, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 119, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 120, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 121, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 122, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 123, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 124, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 125, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 126, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 127, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 128, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 129, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 130, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 131, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 132, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 133, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 134, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 135, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 136, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 137, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 138, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 139, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 140, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 141, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 142, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 143, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 144, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 145, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 146, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 147, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 148, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 149, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 150, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 151, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 152, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 153, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 154, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 155, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 156, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 157, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 158, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 159, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 160, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 161, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 162, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 163, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 164, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 165, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 166, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 167, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 168, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 169, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 170, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 171, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 172, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 173, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 174, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 175, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 176, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 177, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 178, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 179, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 180, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 181, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 182, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 183, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 184, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 185, "label": "not_supported", "prediction": "supported", "correct": false, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 186, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 187, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 188, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 189, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 190, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 191, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 192, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 193, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 194, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 195, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 196, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 197, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 198, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 199, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 200, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 201, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 202, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 203, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 204, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 205, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 206, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 207, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 208, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 209, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 210, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 211, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 212, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 213, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 214, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 215, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 216, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 217, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 218, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 219, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 220, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 221, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 222, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 223, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 224, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 225, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 226, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 227, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 228, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 229, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 230, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 231, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 232, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 233, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 234, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 235, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 236, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 237, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 238, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 239, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 240, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 241, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 242, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 243, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 244, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 245, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 246, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 247, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 248, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 249, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 250, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 251, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 252, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 253, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 254, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 255, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 256, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 257, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 258, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 259, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 260, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 261, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 262, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 263, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 264, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 265, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 266, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 267, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 268, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 269, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 270, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 271, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 272, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 273, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 274, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 275, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 276, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 277, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 278, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 279, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 280, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 281, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 282, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 283, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 284, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 285, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 286, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 287, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 288, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 289, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 290, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 291, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 292, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 293, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 294, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 295, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 296, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 297, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 298, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 299, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 300, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 301, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 302, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 303, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 304, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 305, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 306, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 307, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 308, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 309, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 310, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 311, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 312, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 313, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 314, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 315, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 316, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 317, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 318, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 319, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 320, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 321, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 322, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 323, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 324, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 325, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 326, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 327, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 328, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 329, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 330, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 331, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 332, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 333, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 334, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 335, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 336, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 337, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 338, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 339, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 340, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 341, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 342, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 343, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 344, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 345, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 346, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 347, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 348, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 349, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 350, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 351, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 352, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 353, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 354, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 355, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 356, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 357, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 358, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 359, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 360, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 361, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 362, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 363, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 364, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 365, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 366, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 367, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 368, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 369, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 370, "label": "supported", "prediction": "not_supported", "correct": false, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 371, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 372, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 373, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 374, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 375, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 376, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 377, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 378, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 379, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}
{"index": 380, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 381, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 382, "label": "not_supported", "prediction": "not_supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nnot_supported"}
{"index": 383, "label": "supported", "prediction": "supported", "correct": true, "raw_output": "<think>\n\n</think>\n\nsupported"}