Upload full trainer checkpoint step=3039 (profile=llama3_2_1b_base_grpo, run_type=grpo) 105b56f verified brthor commited on 10 days ago
Upload full trainer checkpoint step=2026 (profile=llama3_2_1b_base_grpo, run_type=grpo) 664ca9a verified brthor commited on 10 days ago
Upload full trainer checkpoint step=1013 (profile=llama3_2_1b_base_grpo, run_type=grpo) 136832e verified brthor commited on 10 days ago
Upload full trainer checkpoint step=2028 (profile=llama3_2_1b_base_grpo, run_type=grpo) 9808de4 verified brthor commited on 10 days ago
Upload full trainer checkpoint step=1521 (profile=llama3_2_1b_base_grpo, run_type=grpo) 2dec6c5 verified brthor commited on 10 days ago
Upload full trainer checkpoint step=1014 (profile=llama3_2_1b_base_grpo, run_type=grpo) ef21f4b verified brthor commited on 10 days ago
Upload full trainer checkpoint step=507 (profile=llama3_2_1b_base_grpo, run_type=grpo) 2f2239b verified brthor commited on 10 days ago
Upload full trainer checkpoint step=14196 (profile=llama3_2_1b_base_grpo, run_type=grpo) 762df2e verified brthor commited on 10 days ago
Upload full trainer checkpoint step=13689 (profile=llama3_2_1b_base_grpo, run_type=grpo) e0bc1e7 verified brthor commited on 10 days ago
Upload full trainer checkpoint step=13182 (profile=llama3_2_1b_base_grpo, run_type=grpo) 61e00ef verified brthor commited on 10 days ago
Upload full trainer checkpoint step=12675 (profile=llama3_2_1b_base_grpo, run_type=grpo) 55006e3 verified brthor commited on 10 days ago
Upload full trainer checkpoint step=12168 (profile=llama3_2_1b_base_grpo, run_type=grpo) ac98d24 verified brthor commited on 10 days ago
Upload full trainer checkpoint step=11661 (profile=llama3_2_1b_base_grpo, run_type=grpo) d3f13d0 verified brthor commited on 10 days ago
Upload full trainer checkpoint step=11154 (profile=llama3_2_1b_base_grpo, run_type=grpo) d61a845 verified brthor commited on 10 days ago
Upload full trainer checkpoint step=10647 (profile=llama3_2_1b_base_grpo, run_type=grpo) b63ea5e verified brthor commited on 10 days ago
Upload full trainer checkpoint step=10140 (profile=llama3_2_1b_base_grpo, run_type=grpo) 1522fc7 verified brthor commited on 10 days ago
Upload full trainer checkpoint step=9633 (profile=llama3_2_1b_base_grpo, run_type=grpo) 8e8c079 verified brthor commited on 10 days ago
Upload full trainer checkpoint step=9126 (profile=llama3_2_1b_base_grpo, run_type=grpo) c23dee9 verified brthor commited on 10 days ago
Upload full trainer checkpoint step=8619 (profile=llama3_2_1b_base_grpo, run_type=grpo) 62c83ba verified brthor commited on 10 days ago
Upload full trainer checkpoint step=8112 (profile=llama3_2_1b_base_grpo, run_type=grpo) a3f8aeb verified brthor commited on 10 days ago
Upload full trainer checkpoint step=7605 (profile=llama3_2_1b_base_grpo, run_type=grpo) 4efd8a6 verified brthor commited on 10 days ago
Upload full trainer checkpoint step=7098 (profile=llama3_2_1b_base_grpo, run_type=grpo) 3e599a7 verified brthor commited on 11 days ago
Upload full trainer checkpoint step=6591 (profile=llama3_2_1b_base_grpo, run_type=grpo) e860ecd verified brthor commited on 11 days ago
Upload full trainer checkpoint step=6084 (profile=llama3_2_1b_base_grpo, run_type=grpo) 5024a09 verified brthor commited on 11 days ago
Upload full trainer checkpoint step=5577 (profile=llama3_2_1b_base_grpo, run_type=grpo) 817c6d4 verified brthor commited on 11 days ago
Upload full trainer checkpoint step=5070 (profile=llama3_2_1b_base_grpo, run_type=grpo) b4e0e96 verified brthor commited on 11 days ago
Upload full trainer checkpoint step=4563 (profile=llama3_2_1b_base_grpo, run_type=grpo) c65a400 verified brthor commited on 11 days ago
Upload full trainer checkpoint step=4056 (profile=llama3_2_1b_base_grpo, run_type=grpo) 62e47b3 verified brthor commited on 11 days ago
Upload full trainer checkpoint step=3549 (profile=llama3_2_1b_base_grpo, run_type=grpo) 18fe2d6 verified brthor commited on 11 days ago
Upload full trainer checkpoint step=3042 (profile=llama3_2_1b_base_grpo, run_type=grpo) b80fcc5 verified brthor commited on 11 days ago
Upload full trainer checkpoint step=2535 (profile=llama3_2_1b_base_grpo, run_type=grpo) 1d53c1b verified brthor commited on 11 days ago
Upload full trainer checkpoint step=2028 (profile=llama3_2_1b_base_grpo, run_type=grpo) 687459f verified brthor commited on 11 days ago
Upload full trainer checkpoint step=1521 (profile=llama3_2_1b_base_grpo, run_type=grpo) 824cba3 verified brthor commited on 11 days ago
Upload full trainer checkpoint step=1014 (profile=llama3_2_1b_base_grpo, run_type=grpo) a5a4a48 verified brthor commited on 11 days ago
Upload full trainer checkpoint step=507 (profile=llama3_2_1b_base_grpo, run_type=grpo) c5db3b2 verified brthor commited on 11 days ago
Upload full trainer checkpoint step=10557 (profile=llama3_2_1b_base_grpo, run_type=grpo) 8a35e6b verified brthor commited on 11 days ago
Upload full trainer checkpoint step=9384 (profile=llama3_2_1b_base_grpo, run_type=grpo) 3bc41b9 verified brthor commited on 11 days ago
Upload full trainer checkpoint step=8211 (profile=llama3_2_1b_base_grpo, run_type=grpo) 907fd7d verified brthor commited on 11 days ago
Upload full trainer checkpoint step=7038 (profile=llama3_2_1b_base_grpo, run_type=grpo) a8bc294 verified brthor commited on 11 days ago
Upload full trainer checkpoint step=5865 (profile=llama3_2_1b_base_grpo, run_type=grpo) c542162 verified brthor commited on 11 days ago
Upload full trainer checkpoint step=4692 (profile=llama3_2_1b_base_grpo, run_type=grpo) 916e607 verified brthor commited on 11 days ago
Upload full trainer checkpoint step=3519 (profile=llama3_2_1b_base_grpo, run_type=grpo) 599422f verified brthor commited on 11 days ago
Upload full trainer checkpoint step=2346 (profile=llama3_2_1b_base_grpo, run_type=grpo) 6157ab6 verified brthor commited on 11 days ago
Upload full trainer checkpoint step=1173 (profile=llama3_2_1b_base_grpo, run_type=grpo) 5329dbc verified brthor commited on 11 days ago
Upload full trainer checkpoint step=18 (profile=llama3_2_1b_base_grpo, run_type=grpo) 1216e9c verified brthor commited on 11 days ago
Upload full trainer checkpoint step=9 (profile=llama3_2_1b_base_grpo, run_type=grpo) 1281bd3 verified brthor commited on 11 days ago
Upload full trainer checkpoint step=2346 (profile=llama3_2_1b_base_grpo, run_type=grpo) 06d6c29 verified brthor commited on 11 days ago
Upload full trainer checkpoint step=1173 (profile=llama3_2_1b_base_grpo, run_type=grpo) 4d483a9 verified brthor commited on 11 days ago
Upload full trainer checkpoint step=141 (profile=llama3_2_1b_base_grpo, run_type=grpo) 6fcf12b verified brthor commited on 11 days ago
Upload full trainer checkpoint step=24 (profile=llama3_2_1b_base_grpo, run_type=grpo) 7d1fe3f verified brthor commited on 11 days ago