Upload 092-arpo_kl-3b-video_r1-ckpt_2149/added_tokens.json with huggingface_hub 5195f00 verified CserDu123 commited on Nov 11, 2025
Upload 092-arpo_kl-3b-video_r1-ckpt_2149/generation_config.json with huggingface_hub 37dda80 verified CserDu123 commited on Nov 11, 2025
Upload 092-arpo_kl-3b-video_r1-ckpt_2149/model-00002-of-00002.safetensors with huggingface_hub 079d511 verified CserDu123 commited on Nov 11, 2025
Upload 092-arpo_kl-3b-video_r1-ckpt_2149/config.json with huggingface_hub 41d4cf8 verified CserDu123 commited on Nov 11, 2025
Upload 092-arpo_kl-3b-video_r1-ckpt_2149/model.safetensors.index.json with huggingface_hub c845176 verified CserDu123 commited on Nov 11, 2025
Upload 092-arpo_kl-3b-video_r1-ckpt_2149/tokenizer.json with huggingface_hub f70bf86 verified CserDu123 commited on Nov 11, 2025
Upload 092-arpo_kl-3b-video_r1-ckpt_2149/chat_template.json with huggingface_hub 4f9900d verified CserDu123 commited on Nov 11, 2025
Upload 092-arpo_kl-3b-video_r1-ckpt_2149/training_args.bin with huggingface_hub 519b6bf verified CserDu123 commited on Nov 11, 2025
Upload 092-arpo_kl-3b-video_r1-ckpt_2149/vocab.json with huggingface_hub 83ec5c0 verified CserDu123 commited on Nov 11, 2025
Upload 092-arpo_kl-3b-video_r1-ckpt_2149/video_preprocessor_config.json with huggingface_hub 79ae5c3 verified CserDu123 commited on Nov 11, 2025
Upload 092-arpo_kl-3b-video_r1-ckpt_2149/trainer_state.json with huggingface_hub 3059da7 verified CserDu123 commited on Nov 11, 2025
Upload 091-arpo_kl-7b-video_r1-ckpt_2149/merges.txt with huggingface_hub 5c87b6c verified CserDu123 commited on Nov 10, 2025
Upload 091-arpo_kl-7b-video_r1-ckpt_2149/preprocessor_config.json with huggingface_hub c7871f9 verified CserDu123 commited on Nov 10, 2025
Upload 091-arpo_kl-7b-video_r1-ckpt_2149/special_tokens_map.json with huggingface_hub bbe909e verified CserDu123 commited on Nov 10, 2025
Upload 091-arpo_kl-7b-video_r1-ckpt_2149/model-00001-of-00004.safetensors with huggingface_hub 5646d93 verified CserDu123 commited on Nov 10, 2025
Upload 091-arpo_kl-7b-video_r1-ckpt_2149/tokenizer_config.json with huggingface_hub 6a09822 verified CserDu123 commited on Nov 10, 2025
Upload 091-arpo_kl-7b-video_r1-ckpt_2149/added_tokens.json with huggingface_hub d9f6987 verified CserDu123 commited on Nov 10, 2025
Upload 091-arpo_kl-7b-video_r1-ckpt_2149/generation_config.json with huggingface_hub da9bbb8 verified CserDu123 commited on Nov 10, 2025
Upload 091-arpo_kl-7b-video_r1-ckpt_2149/model-00004-of-00004.safetensors with huggingface_hub 9a8dab4 verified CserDu123 commited on Nov 10, 2025
Upload 091-arpo_kl-7b-video_r1-ckpt_2149/config.json with huggingface_hub b07387b verified CserDu123 commited on Nov 10, 2025
Upload 091-arpo_kl-7b-video_r1-ckpt_2149/model-00003-of-00004.safetensors with huggingface_hub 29cb811 verified CserDu123 commited on Nov 10, 2025
Upload 091-arpo_kl-7b-video_r1-ckpt_2149/model.safetensors.index.json with huggingface_hub 6a21e6f verified CserDu123 commited on Nov 10, 2025
Upload 091-arpo_kl-7b-video_r1-ckpt_2149/tokenizer.json with huggingface_hub 1f89671 verified CserDu123 commited on Nov 10, 2025
Upload 091-arpo_kl-7b-video_r1-ckpt_2149/model-00002-of-00004.safetensors with huggingface_hub 7190b2a verified CserDu123 commited on Nov 10, 2025
Upload 091-arpo_kl-7b-video_r1-ckpt_2149/chat_template.json with huggingface_hub cfb6ec2 verified CserDu123 commited on Nov 10, 2025
Upload 091-arpo_kl-7b-video_r1-ckpt_2149/training_args.bin with huggingface_hub 678c691 verified CserDu123 commited on Nov 10, 2025
Upload 091-arpo_kl-7b-video_r1-ckpt_2149/vocab.json with huggingface_hub 33ee313 verified CserDu123 commited on Nov 10, 2025
Upload 091-arpo_kl-7b-video_r1-ckpt_2149/video_preprocessor_config.json with huggingface_hub d74cd50 verified CserDu123 commited on Nov 10, 2025
Upload 091-arpo_kl-7b-video_r1-ckpt_2149/trainer_state.json with huggingface_hub 621b6ee verified CserDu123 commited on Nov 10, 2025
Upload 095-arpo_kl-7b-ablation-length_reward-seed_bench_r1-ckpt_376/merges.txt with huggingface_hub cbd118c verified CserDu123 commited on Nov 10, 2025
Upload 095-arpo_kl-7b-ablation-length_reward-seed_bench_r1-ckpt_376/preprocessor_config.json with huggingface_hub 63c1069 verified CserDu123 commited on Nov 10, 2025
Upload 095-arpo_kl-7b-ablation-length_reward-seed_bench_r1-ckpt_376/special_tokens_map.json with huggingface_hub e89ca10 verified CserDu123 commited on Nov 10, 2025
Upload 095-arpo_kl-7b-ablation-length_reward-seed_bench_r1-ckpt_376/model-00001-of-00004.safetensors with huggingface_hub 0624c78 verified CserDu123 commited on Nov 10, 2025
Upload 095-arpo_kl-7b-ablation-length_reward-seed_bench_r1-ckpt_376/tokenizer_config.json with huggingface_hub 7859484 verified CserDu123 commited on Nov 10, 2025
Upload 095-arpo_kl-7b-ablation-length_reward-seed_bench_r1-ckpt_376/added_tokens.json with huggingface_hub 5c758b2 verified CserDu123 commited on Nov 10, 2025
Upload 095-arpo_kl-7b-ablation-length_reward-seed_bench_r1-ckpt_376/generation_config.json with huggingface_hub 5948f77 verified CserDu123 commited on Nov 10, 2025
Upload 095-arpo_kl-7b-ablation-length_reward-seed_bench_r1-ckpt_376/model-00004-of-00004.safetensors with huggingface_hub 092b4f9 verified CserDu123 commited on Nov 10, 2025
Upload 095-arpo_kl-7b-ablation-length_reward-seed_bench_r1-ckpt_376/config.json with huggingface_hub a059734 verified CserDu123 commited on Nov 10, 2025
Upload 095-arpo_kl-7b-ablation-length_reward-seed_bench_r1-ckpt_376/model-00003-of-00004.safetensors with huggingface_hub e0863ef verified CserDu123 commited on Nov 10, 2025
Upload 095-arpo_kl-7b-ablation-length_reward-seed_bench_r1-ckpt_376/model.safetensors.index.json with huggingface_hub ce9c96d verified CserDu123 commited on Nov 10, 2025
Upload 095-arpo_kl-7b-ablation-length_reward-seed_bench_r1-ckpt_376/tokenizer.json with huggingface_hub 000dd7c verified CserDu123 commited on Nov 10, 2025
Upload 095-arpo_kl-7b-ablation-length_reward-seed_bench_r1-ckpt_376/model-00002-of-00004.safetensors with huggingface_hub a7952ca verified CserDu123 commited on Nov 10, 2025
Upload 095-arpo_kl-7b-ablation-length_reward-seed_bench_r1-ckpt_376/chat_template.json with huggingface_hub 6cf1433 verified CserDu123 commited on Nov 10, 2025
Upload 095-arpo_kl-7b-ablation-length_reward-seed_bench_r1-ckpt_376/training_args.bin with huggingface_hub b9cddb9 verified CserDu123 commited on Nov 10, 2025
Upload 095-arpo_kl-7b-ablation-length_reward-seed_bench_r1-ckpt_376/vocab.json with huggingface_hub de21806 verified CserDu123 commited on Nov 10, 2025
Upload 095-arpo_kl-7b-ablation-length_reward-seed_bench_r1-ckpt_376/video_preprocessor_config.json with huggingface_hub ddbc008 verified CserDu123 commited on Nov 10, 2025
Upload 095-arpo_kl-7b-ablation-length_reward-seed_bench_r1-ckpt_376/trainer_state.json with huggingface_hub bb72dae verified CserDu123 commited on Nov 10, 2025
Upload 096-arpo_kl-3b-ablation-perception_test-ckpt_396/merges.txt with huggingface_hub 076c28d verified CserDu123 commited on Nov 10, 2025
Upload 096-arpo_kl-3b-ablation-perception_test-ckpt_396/preprocessor_config.json with huggingface_hub ee4d553 verified CserDu123 commited on Nov 10, 2025
Upload 096-arpo_kl-3b-ablation-perception_test-ckpt_396/special_tokens_map.json with huggingface_hub 040214e verified CserDu123 commited on Nov 10, 2025