Upload 028-arpo_kl-3b-seed_bench_r1_6k-ckpt-376/generation_config.json with huggingface_hub 04fde4f verified CserDu123 commited on Nov 2, 2025
Upload 028-arpo_kl-3b-seed_bench_r1_6k-ckpt-376/model-00002-of-00002.safetensors with huggingface_hub 3c0ef59 verified CserDu123 commited on Nov 2, 2025
Upload 028-arpo_kl-3b-seed_bench_r1_6k-ckpt-376/config.json with huggingface_hub 4605c5b verified CserDu123 commited on Nov 2, 2025
Upload 028-arpo_kl-3b-seed_bench_r1_6k-ckpt-376/model.safetensors.index.json with huggingface_hub 327c624 verified CserDu123 commited on Nov 2, 2025
Upload 028-arpo_kl-3b-seed_bench_r1_6k-ckpt-376/tokenizer.json with huggingface_hub b9579bf verified CserDu123 commited on Nov 2, 2025
Upload 028-arpo_kl-3b-seed_bench_r1_6k-ckpt-376/chat_template.json with huggingface_hub 3fc3270 verified CserDu123 commited on Nov 2, 2025
Upload 028-arpo_kl-3b-seed_bench_r1_6k-ckpt-376/training_args.bin with huggingface_hub 4dd4ded verified CserDu123 commited on Nov 2, 2025
Upload 028-arpo_kl-3b-seed_bench_r1_6k-ckpt-376/vocab.json with huggingface_hub f21c4fe verified CserDu123 commited on Nov 2, 2025
Upload 028-arpo_kl-3b-seed_bench_r1_6k-ckpt-376/video_preprocessor_config.json with huggingface_hub 43f2ca4 verified CserDu123 commited on Nov 2, 2025
Upload 028-arpo_kl-3b-seed_bench_r1_6k-ckpt-376/trainer_state.json with huggingface_hub dabdebe verified CserDu123 commited on Nov 2, 2025
Upload 026-grpo-3b-kl_1e-2-perception_test_6k-ckpt-396/merges.txt with huggingface_hub c7412f9 verified CserDu123 commited on Nov 2, 2025
Upload 026-grpo-3b-kl_1e-2-perception_test_6k-ckpt-396/preprocessor_config.json with huggingface_hub 132fc77 verified CserDu123 commited on Nov 2, 2025
Upload 026-grpo-3b-kl_1e-2-perception_test_6k-ckpt-396/special_tokens_map.json with huggingface_hub d4cb13a verified CserDu123 commited on Nov 2, 2025
Upload 026-grpo-3b-kl_1e-2-perception_test_6k-ckpt-396/model-00001-of-00002.safetensors with huggingface_hub 0065e4c verified CserDu123 commited on Nov 2, 2025
Upload 026-grpo-3b-kl_1e-2-perception_test_6k-ckpt-396/tokenizer_config.json with huggingface_hub 619c417 verified CserDu123 commited on Nov 2, 2025
Upload 026-grpo-3b-kl_1e-2-perception_test_6k-ckpt-396/added_tokens.json with huggingface_hub 7f79727 verified CserDu123 commited on Nov 2, 2025
Upload 026-grpo-3b-kl_1e-2-perception_test_6k-ckpt-396/generation_config.json with huggingface_hub cbe6bc6 verified CserDu123 commited on Nov 2, 2025
Upload 026-grpo-3b-kl_1e-2-perception_test_6k-ckpt-396/model-00002-of-00002.safetensors with huggingface_hub 534ab04 verified CserDu123 commited on Nov 2, 2025
Upload 026-grpo-3b-kl_1e-2-perception_test_6k-ckpt-396/config.json with huggingface_hub 0532579 verified CserDu123 commited on Nov 2, 2025
Upload 026-grpo-3b-kl_1e-2-perception_test_6k-ckpt-396/model.safetensors.index.json with huggingface_hub 492bf3f verified CserDu123 commited on Nov 2, 2025
Upload 026-grpo-3b-kl_1e-2-perception_test_6k-ckpt-396/tokenizer.json with huggingface_hub 3ccb93f verified CserDu123 commited on Nov 2, 2025
Upload 026-grpo-3b-kl_1e-2-perception_test_6k-ckpt-396/chat_template.json with huggingface_hub 2aa87ee verified CserDu123 commited on Nov 2, 2025
Upload 026-grpo-3b-kl_1e-2-perception_test_6k-ckpt-396/training_args.bin with huggingface_hub eac48cb verified CserDu123 commited on Nov 2, 2025
Upload 026-grpo-3b-kl_1e-2-perception_test_6k-ckpt-396/vocab.json with huggingface_hub d62a5cc verified CserDu123 commited on Nov 2, 2025
Upload 026-grpo-3b-kl_1e-2-perception_test_6k-ckpt-396/video_preprocessor_config.json with huggingface_hub 2419abf verified CserDu123 commited on Nov 2, 2025
Upload 026-grpo-3b-kl_1e-2-perception_test_6k-ckpt-396/trainer_state.json with huggingface_hub 91bafcd verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/merges.txt with huggingface_hub 1e05495 verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/preprocessor_config.json with huggingface_hub cab91d2 verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/special_tokens_map.json with huggingface_hub 4c758ea verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/model-00001-of-00002.safetensors with huggingface_hub e99326e verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/tokenizer_config.json with huggingface_hub 269f14e verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/added_tokens.json with huggingface_hub e6bba1f verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/generation_config.json with huggingface_hub 2226cab verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/model-00002-of-00002.safetensors with huggingface_hub 1dba941 verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/config.json with huggingface_hub 4638d51 verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/model.safetensors.index.json with huggingface_hub acfe7e8 verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/tokenizer.json with huggingface_hub 0992f63 verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/chat_template.json with huggingface_hub bf8ae85 verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/training_args.bin with huggingface_hub b2965b4 verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/vocab.json with huggingface_hub a079392 verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/video_preprocessor_config.json with huggingface_hub a07e178 verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/trainer_state.json with huggingface_hub 6e0dd1d verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/merges.txt with huggingface_hub c1d42ad verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/preprocessor_config.json with huggingface_hub f6dbc7b verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/special_tokens_map.json with huggingface_hub 1ba9a7c verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/model-00001-of-00002.safetensors with huggingface_hub 9f1d22b verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/tokenizer_config.json with huggingface_hub c833565 verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/added_tokens.json with huggingface_hub 2a7ebbb verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/generation_config.json with huggingface_hub ced477e verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/model-00002-of-00002.safetensors with huggingface_hub 5c939b4 verified CserDu123 commited on Nov 2, 2025