Upload 034-grpo-3b_kl_1e-2-nextqa-ckpt_2133/chat_template.json with huggingface_hub dfc5621 verified CserDu123 commited on Nov 5, 2025
Upload 034-grpo-3b_kl_1e-2-nextqa-ckpt_2133/training_args.bin with huggingface_hub 6bb7462 verified CserDu123 commited on Nov 5, 2025
Upload 034-grpo-3b_kl_1e-2-nextqa-ckpt_2133/vocab.json with huggingface_hub fb091ad verified CserDu123 commited on Nov 5, 2025
Upload 034-grpo-3b_kl_1e-2-nextqa-ckpt_2133/video_preprocessor_config.json with huggingface_hub 51b9e81 verified CserDu123 commited on Nov 5, 2025
Upload 034-grpo-3b_kl_1e-2-nextqa-ckpt_2133/trainer_state.json with huggingface_hub 21e9f61 verified CserDu123 commited on Nov 5, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/merges.txt with huggingface_hub 249d4e6 verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/preprocessor_config.json with huggingface_hub 1c8e49e verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/special_tokens_map.json with huggingface_hub 6fb1e9d verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/model-00001-of-00002.safetensors with huggingface_hub 0b71898 verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/tokenizer_config.json with huggingface_hub 23f165e verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/added_tokens.json with huggingface_hub a678253 verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/generation_config.json with huggingface_hub 44cb8ad verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/model-00002-of-00002.safetensors with huggingface_hub 6418b9a verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/config.json with huggingface_hub f13d8ef verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/model.safetensors.index.json with huggingface_hub 74dab99 verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/tokenizer.json with huggingface_hub 7ecbbb1 verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/chat_template.json with huggingface_hub be33dc1 verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/training_args.bin with huggingface_hub 5a6b935 verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/vocab.json with huggingface_hub eebc17a verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/video_preprocessor_config.json with huggingface_hub 7c2678d verified CserDu123 commited on Nov 4, 2025
Upload 037-arpo_kl_base_grpo_kl_1e-2-3b_seed_bench_r1/trainer_state.json with huggingface_hub 6063c8e verified CserDu123 commited on Nov 4, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-318/merges.txt with huggingface_hub 1873930 verified CserDu123 commited on Nov 4, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-318/preprocessor_config.json with huggingface_hub 077f199 verified CserDu123 commited on Nov 4, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-318/special_tokens_map.json with huggingface_hub 044e3b2 verified CserDu123 commited on Nov 4, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-318/model-00001-of-00002.safetensors with huggingface_hub da4b760 verified CserDu123 commited on Nov 4, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-318/tokenizer_config.json with huggingface_hub 877c751 verified CserDu123 commited on Nov 4, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-318/added_tokens.json with huggingface_hub 703cf4f verified CserDu123 commited on Nov 4, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-318/generation_config.json with huggingface_hub 71e6187 verified CserDu123 commited on Nov 4, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-318/model-00002-of-00002.safetensors with huggingface_hub 4b13ef9 verified CserDu123 commited on Nov 4, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-318/config.json with huggingface_hub dbd709d verified CserDu123 commited on Nov 4, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-318/model.safetensors.index.json with huggingface_hub 38bfcac verified CserDu123 commited on Nov 4, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-318/tokenizer.json with huggingface_hub faf7077 verified CserDu123 commited on Nov 4, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-318/chat_template.json with huggingface_hub 10db684 verified CserDu123 commited on Nov 4, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-318/training_args.bin with huggingface_hub 5315923 verified CserDu123 commited on Nov 4, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-318/vocab.json with huggingface_hub a11f907 verified CserDu123 commited on Nov 4, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-318/video_preprocessor_config.json with huggingface_hub 9975fe6 verified CserDu123 commited on Nov 4, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-318/trainer_state.json with huggingface_hub 91e6a07 verified CserDu123 commited on Nov 4, 2025
Upload 035-arpo_kl-3b_perception_test-ckpt-396/merges.txt with huggingface_hub a99983d verified CserDu123 commited on Nov 4, 2025
Upload 035-arpo_kl-3b_perception_test-ckpt-396/preprocessor_config.json with huggingface_hub fd7d08c verified CserDu123 commited on Nov 4, 2025
Upload 035-arpo_kl-3b_perception_test-ckpt-396/special_tokens_map.json with huggingface_hub 0e9acd9 verified CserDu123 commited on Nov 4, 2025
Upload 035-arpo_kl-3b_perception_test-ckpt-396/model-00001-of-00002.safetensors with huggingface_hub 6afb53f verified CserDu123 commited on Nov 4, 2025
Upload 035-arpo_kl-3b_perception_test-ckpt-396/tokenizer_config.json with huggingface_hub 8d66bcd verified CserDu123 commited on Nov 4, 2025
Upload 035-arpo_kl-3b_perception_test-ckpt-396/added_tokens.json with huggingface_hub a99ae62 verified CserDu123 commited on Nov 4, 2025
Upload 035-arpo_kl-3b_perception_test-ckpt-396/generation_config.json with huggingface_hub fdde9a3 verified CserDu123 commited on Nov 4, 2025
Upload 035-arpo_kl-3b_perception_test-ckpt-396/model-00002-of-00002.safetensors with huggingface_hub 6c2699b verified CserDu123 commited on Nov 4, 2025
Upload 035-arpo_kl-3b_perception_test-ckpt-396/config.json with huggingface_hub 526adbd verified CserDu123 commited on Nov 4, 2025
Upload 035-arpo_kl-3b_perception_test-ckpt-396/model.safetensors.index.json with huggingface_hub b7c4b01 verified CserDu123 commited on Nov 4, 2025
Upload 035-arpo_kl-3b_perception_test-ckpt-396/tokenizer.json with huggingface_hub 776dc8a verified CserDu123 commited on Nov 4, 2025
Upload 035-arpo_kl-3b_perception_test-ckpt-396/chat_template.json with huggingface_hub a78990f verified CserDu123 commited on Nov 4, 2025
Upload 035-arpo_kl-3b_perception_test-ckpt-396/training_args.bin with huggingface_hub 0f65129 verified CserDu123 commited on Nov 4, 2025