Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/config.json with huggingface_hub e298385 verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/model-00003-of-00004.safetensors with huggingface_hub d883793 verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/model.safetensors.index.json with huggingface_hub 964be6a verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/tokenizer.json with huggingface_hub cf81eff verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/model-00002-of-00004.safetensors with huggingface_hub 40dd8be verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/chat_template.json with huggingface_hub fdfd9ed verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/training_args.bin with huggingface_hub c58a3ca verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/vocab.json with huggingface_hub 58f0428 verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/video_preprocessor_config.json with huggingface_hub 20c6654 verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/trainer_state.json with huggingface_hub 68a77ac verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/merges.txt with huggingface_hub e476441 verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/preprocessor_config.json with huggingface_hub 6622ac5 verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/special_tokens_map.json with huggingface_hub 2aef09a verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/model-00001-of-00004.safetensors with huggingface_hub 84341f6 verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/tokenizer_config.json with huggingface_hub a5a56c3 verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/added_tokens.json with huggingface_hub 622007f verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/generation_config.json with huggingface_hub 77002ef verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/model-00004-of-00004.safetensors with huggingface_hub 5ed70be verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/config.json with huggingface_hub e173f51 verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/model-00003-of-00004.safetensors with huggingface_hub f5f5cd4 verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/model.safetensors.index.json with huggingface_hub 0bf5b20 verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/tokenizer.json with huggingface_hub 30ea2d1 verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/model-00002-of-00004.safetensors with huggingface_hub b32706f verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/chat_template.json with huggingface_hub 9546c0f verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/training_args.bin with huggingface_hub 2d18206 verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/vocab.json with huggingface_hub 2ed1a02 verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/video_preprocessor_config.json with huggingface_hub b5abdbc verified CserDu123 commited on Nov 6, 2025
Upload 051-grpo-7b_no_kl_seed_bench_r1/trainer_state.json with huggingface_hub 027d93c verified CserDu123 commited on Nov 6, 2025
Upload 050-dapo-7b_seed_bench_r1-ckpt_376/merges.txt with huggingface_hub 527f20d verified CserDu123 commited on Nov 6, 2025
Upload 050-dapo-7b_seed_bench_r1-ckpt_376/preprocessor_config.json with huggingface_hub 9f61a7f verified CserDu123 commited on Nov 6, 2025
Upload 050-dapo-7b_seed_bench_r1-ckpt_376/special_tokens_map.json with huggingface_hub 4b5d0a0 verified CserDu123 commited on Nov 6, 2025
Upload 050-dapo-7b_seed_bench_r1-ckpt_376/model-00001-of-00004.safetensors with huggingface_hub 495ea68 verified CserDu123 commited on Nov 6, 2025
Upload 050-dapo-7b_seed_bench_r1-ckpt_376/tokenizer_config.json with huggingface_hub 7ecb46f verified CserDu123 commited on Nov 6, 2025
Upload 050-dapo-7b_seed_bench_r1-ckpt_376/added_tokens.json with huggingface_hub 84c2335 verified CserDu123 commited on Nov 6, 2025
Upload 050-dapo-7b_seed_bench_r1-ckpt_376/generation_config.json with huggingface_hub c7c6585 verified CserDu123 commited on Nov 6, 2025
Upload 050-dapo-7b_seed_bench_r1-ckpt_376/model-00004-of-00004.safetensors with huggingface_hub 4c1d68e verified CserDu123 commited on Nov 6, 2025
Upload 050-dapo-7b_seed_bench_r1-ckpt_376/config.json with huggingface_hub 95e5bd4 verified CserDu123 commited on Nov 6, 2025
Upload 050-dapo-7b_seed_bench_r1-ckpt_376/model-00003-of-00004.safetensors with huggingface_hub 0628442 verified CserDu123 commited on Nov 6, 2025
Upload 050-dapo-7b_seed_bench_r1-ckpt_376/model.safetensors.index.json with huggingface_hub 16dfb19 verified CserDu123 commited on Nov 6, 2025
Upload 050-dapo-7b_seed_bench_r1-ckpt_376/tokenizer.json with huggingface_hub 36276a3 verified CserDu123 commited on Nov 6, 2025
Upload 050-dapo-7b_seed_bench_r1-ckpt_376/model-00002-of-00004.safetensors with huggingface_hub 797dbd5 verified CserDu123 commited on Nov 6, 2025
Upload 050-dapo-7b_seed_bench_r1-ckpt_376/chat_template.json with huggingface_hub 46f387d verified CserDu123 commited on Nov 6, 2025
Upload 050-dapo-7b_seed_bench_r1-ckpt_376/training_args.bin with huggingface_hub d05f019 verified CserDu123 commited on Nov 6, 2025
Upload 050-dapo-7b_seed_bench_r1-ckpt_376/vocab.json with huggingface_hub b23ee31 verified CserDu123 commited on Nov 6, 2025
Upload 050-dapo-7b_seed_bench_r1-ckpt_376/video_preprocessor_config.json with huggingface_hub a2480db verified CserDu123 commited on Nov 6, 2025
Upload 050-dapo-7b_seed_bench_r1-ckpt_376/trainer_state.json with huggingface_hub 1b4c852 verified CserDu123 commited on Nov 6, 2025
Upload 047-arpo_kl_v2-3b_seed_bench_r1/merges.txt with huggingface_hub cdf2bc4 verified CserDu123 commited on Nov 6, 2025
Upload 047-arpo_kl_v2-3b_seed_bench_r1/chat_template.jinja with huggingface_hub 302d1e5 verified CserDu123 commited on Nov 6, 2025
Upload 047-arpo_kl_v2-3b_seed_bench_r1/preprocessor_config.json with huggingface_hub a965617 verified CserDu123 commited on Nov 6, 2025
Upload 047-arpo_kl_v2-3b_seed_bench_r1/special_tokens_map.json with huggingface_hub d88fb8c verified CserDu123 commited on Nov 6, 2025