Upload 039-arpo_kl-7b_seed_bench_r1-ckpt_376/special_tokens_map.json with huggingface_hub a25974f verified CserDu123 commited on Nov 5, 2025
Upload 039-arpo_kl-7b_seed_bench_r1-ckpt_376/model-00001-of-00004.safetensors with huggingface_hub 82ccc2d verified CserDu123 commited on Nov 5, 2025
Upload 039-arpo_kl-7b_seed_bench_r1-ckpt_376/tokenizer_config.json with huggingface_hub 0a864c2 verified CserDu123 commited on Nov 5, 2025
Upload 039-arpo_kl-7b_seed_bench_r1-ckpt_376/added_tokens.json with huggingface_hub e6daac8 verified CserDu123 commited on Nov 5, 2025
Upload 039-arpo_kl-7b_seed_bench_r1-ckpt_376/generation_config.json with huggingface_hub 4bcaf28 verified CserDu123 commited on Nov 5, 2025
Upload 039-arpo_kl-7b_seed_bench_r1-ckpt_376/model-00004-of-00004.safetensors with huggingface_hub 984838e verified CserDu123 commited on Nov 5, 2025
Upload 039-arpo_kl-7b_seed_bench_r1-ckpt_376/config.json with huggingface_hub 34065ca verified CserDu123 commited on Nov 5, 2025
Upload 039-arpo_kl-7b_seed_bench_r1-ckpt_376/model-00003-of-00004.safetensors with huggingface_hub 2878de0 verified CserDu123 commited on Nov 5, 2025
Upload 039-arpo_kl-7b_seed_bench_r1-ckpt_376/model.safetensors.index.json with huggingface_hub 23823f0 verified CserDu123 commited on Nov 5, 2025
Upload 039-arpo_kl-7b_seed_bench_r1-ckpt_376/tokenizer.json with huggingface_hub 80e9fb7 verified CserDu123 commited on Nov 5, 2025
Upload 039-arpo_kl-7b_seed_bench_r1-ckpt_376/model-00002-of-00004.safetensors with huggingface_hub b74a406 verified CserDu123 commited on Nov 5, 2025
Upload 039-arpo_kl-7b_seed_bench_r1-ckpt_376/chat_template.json with huggingface_hub 48f3c28 verified CserDu123 commited on Nov 5, 2025
Upload 039-arpo_kl-7b_seed_bench_r1-ckpt_376/training_args.bin with huggingface_hub 266fe7a verified CserDu123 commited on Nov 5, 2025
Upload 039-arpo_kl-7b_seed_bench_r1-ckpt_376/vocab.json with huggingface_hub d6044c4 verified CserDu123 commited on Nov 5, 2025
Upload 039-arpo_kl-7b_seed_bench_r1-ckpt_376/video_preprocessor_config.json with huggingface_hub 8a3e5e8 verified CserDu123 commited on Nov 5, 2025
Upload 039-arpo_kl-7b_seed_bench_r1-ckpt_376/trainer_state.json with huggingface_hub bfb2752 verified CserDu123 commited on Nov 5, 2025
Upload 034-grpo-3b_kl_1e-2-nextqa-ckpt_2133/merges.txt with huggingface_hub 2909733 verified CserDu123 commited on Nov 5, 2025
Upload 034-grpo-3b_kl_1e-2-nextqa-ckpt_2133/preprocessor_config.json with huggingface_hub 3465d3b verified CserDu123 commited on Nov 5, 2025
Upload 034-grpo-3b_kl_1e-2-nextqa-ckpt_2133/special_tokens_map.json with huggingface_hub ecfe92b verified CserDu123 commited on Nov 5, 2025
Upload 034-grpo-3b_kl_1e-2-nextqa-ckpt_2133/model-00001-of-00002.safetensors with huggingface_hub 92da07d verified CserDu123 commited on Nov 5, 2025
Upload 034-grpo-3b_kl_1e-2-nextqa-ckpt_2133/tokenizer_config.json with huggingface_hub bb477f8 verified CserDu123 commited on Nov 5, 2025
Upload 034-grpo-3b_kl_1e-2-nextqa-ckpt_2133/added_tokens.json with huggingface_hub cf38959 verified CserDu123 commited on Nov 5, 2025
Upload 034-grpo-3b_kl_1e-2-nextqa-ckpt_2133/generation_config.json with huggingface_hub 3205aae verified CserDu123 commited on Nov 5, 2025
Upload 034-grpo-3b_kl_1e-2-nextqa-ckpt_2133/model-00002-of-00002.safetensors with huggingface_hub c590497 verified CserDu123 commited on Nov 5, 2025
Upload 034-grpo-3b_kl_1e-2-nextqa-ckpt_2133/config.json with huggingface_hub 7fdd642 verified CserDu123 commited on Nov 5, 2025
Upload 034-grpo-3b_kl_1e-2-nextqa-ckpt_2133/model.safetensors.index.json with huggingface_hub a06efb3 verified CserDu123 commited on Nov 5, 2025
Upload 034-grpo-3b_kl_1e-2-nextqa-ckpt_2133/tokenizer.json with huggingface_hub 984b800 verified CserDu123 commited on Nov 5, 2025
Upload 034-grpo-3b_kl_1e-2-nextqa-ckpt_2133/chat_template.json with huggingface_hub dfc5621 verified CserDu123 commited on Nov 5, 2025
Upload 034-grpo-3b_kl_1e-2-nextqa-ckpt_2133/training_args.bin with huggingface_hub 6bb7462 verified CserDu123 commited on Nov 5, 2025
Upload 034-grpo-3b_kl_1e-2-nextqa-ckpt_2133/vocab.json with huggingface_hub fb091ad verified CserDu123 commited on Nov 5, 2025
Upload 034-grpo-3b_kl_1e-2-nextqa-ckpt_2133/video_preprocessor_config.json with huggingface_hub 51b9e81 verified CserDu123 commited on Nov 5, 2025
Upload 034-grpo-3b_kl_1e-2-nextqa-ckpt_2133/trainer_state.json with huggingface_hub 21e9f61 verified CserDu123 commited on Nov 5, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/merges.txt with huggingface_hub 249d4e6 verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/preprocessor_config.json with huggingface_hub 1c8e49e verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/special_tokens_map.json with huggingface_hub 6fb1e9d verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/model-00001-of-00002.safetensors with huggingface_hub 0b71898 verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/tokenizer_config.json with huggingface_hub 23f165e verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/added_tokens.json with huggingface_hub a678253 verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/generation_config.json with huggingface_hub 44cb8ad verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/model-00002-of-00002.safetensors with huggingface_hub 6418b9a verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/config.json with huggingface_hub f13d8ef verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/model.safetensors.index.json with huggingface_hub 74dab99 verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/tokenizer.json with huggingface_hub 7ecbbb1 verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/chat_template.json with huggingface_hub be33dc1 verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/training_args.bin with huggingface_hub 5a6b935 verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/vocab.json with huggingface_hub eebc17a verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/video_preprocessor_config.json with huggingface_hub 7c2678d verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/trainer_state.json with huggingface_hub 6063c8e verified CserDu123 commited on Nov 4, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-318/merges.txt with huggingface_hub 1873930 verified CserDu123 commited on Nov 4, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-318/preprocessor_config.json with huggingface_hub 077f199 verified CserDu123 commited on Nov 4, 2025