Upload 053-tw_grpo-7b_perception_test-ckpt_396/generation_config.json with huggingface_hub 37b4532 verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/model-00004-of-00004.safetensors with huggingface_hub 815ab25 verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/config.json with huggingface_hub d49b8cd verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/model-00003-of-00004.safetensors with huggingface_hub 257cedc verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/model.safetensors.index.json with huggingface_hub 933c239 verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/tokenizer.json with huggingface_hub b18a79f verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/model-00002-of-00004.safetensors with huggingface_hub e71d1bd verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/chat_template.json with huggingface_hub 2e1593d verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/training_args.bin with huggingface_hub 406102f verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/vocab.json with huggingface_hub a0dba2c verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/video_preprocessor_config.json with huggingface_hub f8f41b4 verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/trainer_state.json with huggingface_hub 2e08823 verified CserDu123 commited on Nov 7, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/merges.txt with huggingface_hub 5bed397 verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/preprocessor_config.json with huggingface_hub 1f447f9 verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/special_tokens_map.json with huggingface_hub 7c0578c verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/model-00001-of-00004.safetensors with huggingface_hub 3335945 verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/tokenizer_config.json with huggingface_hub 6948b0b verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/added_tokens.json with huggingface_hub 7968f26 verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/generation_config.json with huggingface_hub ac2ebc2 verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/model-00004-of-00004.safetensors with huggingface_hub bd585f3 verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/config.json with huggingface_hub e298385 verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/model-00003-of-00004.safetensors with huggingface_hub d883793 verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/model.safetensors.index.json with huggingface_hub 964be6a verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/tokenizer.json with huggingface_hub cf81eff verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/model-00002-of-00004.safetensors with huggingface_hub 40dd8be verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/chat_template.json with huggingface_hub fdfd9ed verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/training_args.bin with huggingface_hub c58a3ca verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/vocab.json with huggingface_hub 58f0428 verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/video_preprocessor_config.json with huggingface_hub 20c6654 verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/trainer_state.json with huggingface_hub 68a77ac verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/merges.txt with huggingface_hub e476441 verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/preprocessor_config.json with huggingface_hub 6622ac5 verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/special_tokens_map.json with huggingface_hub 2aef09a verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/model-00001-of-00004.safetensors with huggingface_hub 84341f6 verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/tokenizer_config.json with huggingface_hub a5a56c3 verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/added_tokens.json with huggingface_hub 622007f verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/generation_config.json with huggingface_hub 77002ef verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/model-00004-of-00004.safetensors with huggingface_hub 5ed70be verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/config.json with huggingface_hub e173f51 verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/model-00003-of-00004.safetensors with huggingface_hub f5f5cd4 verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/model.safetensors.index.json with huggingface_hub 0bf5b20 verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/tokenizer.json with huggingface_hub 30ea2d1 verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/model-00002-of-00004.safetensors with huggingface_hub b32706f verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/chat_template.json with huggingface_hub 9546c0f verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/training_args.bin with huggingface_hub 2d18206 verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/vocab.json with huggingface_hub 2ed1a02 verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/video_preprocessor_config.json with huggingface_hub b5abdbc verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/trainer_state.json with huggingface_hub 027d93c verified CserDu123 commited on Nov 6, 2025
Upload 050-dapo-7b_seed_bench_r1-ckpt_376/merges.txt with huggingface_hub 527f20d verified CserDu123 commited on Nov 6, 2025
Upload 050-dapo-7b_seed_bench_r1-ckpt_376/preprocessor_config.json with huggingface_hub 9f61a7f verified CserDu123 commited on Nov 6, 2025