Upload 068-new-arpo_kl-ablation-7b_nextgqa-ckpt_418/chat_template.json with huggingface_hub 38936f4 verified CserDu123 commited on Nov 9, 2025
Upload 068-new-arpo_kl-ablation-7b_nextgqa-ckpt_418/training_args.bin with huggingface_hub d9eecd6 verified CserDu123 commited on Nov 9, 2025
Upload 068-new-arpo_kl-ablation-7b_nextgqa-ckpt_418/vocab.json with huggingface_hub 702e44b verified CserDu123 commited on Nov 9, 2025
Upload 068-new-arpo_kl-ablation-7b_nextgqa-ckpt_418/video_preprocessor_config.json with huggingface_hub b8482cf verified CserDu123 commited on Nov 9, 2025
Upload 068-new-arpo_kl-ablation-7b_nextgqa-ckpt_418/trainer_state.json with huggingface_hub da8ffc5 verified CserDu123 commited on Nov 9, 2025
Upload 067-arpo_kl-ablation-3b_nextgqa-ckpt_418/merges.txt with huggingface_hub 6f2576d verified CserDu123 commited on Nov 9, 2025
Upload 067-arpo_kl-ablation-3b_nextgqa-ckpt_418/preprocessor_config.json with huggingface_hub 331aace verified CserDu123 commited on Nov 9, 2025
Upload 067-arpo_kl-ablation-3b_nextgqa-ckpt_418/special_tokens_map.json with huggingface_hub 8aaa736 verified CserDu123 commited on Nov 9, 2025
Upload 067-arpo_kl-ablation-3b_nextgqa-ckpt_418/model-00001-of-00002.safetensors with huggingface_hub 780df6c verified CserDu123 commited on Nov 9, 2025
Upload 067-arpo_kl-ablation-3b_nextgqa-ckpt_418/tokenizer_config.json with huggingface_hub 61e3186 verified CserDu123 commited on Nov 9, 2025
Upload 067-arpo_kl-ablation-3b_nextgqa-ckpt_418/added_tokens.json with huggingface_hub 1795def verified CserDu123 commited on Nov 9, 2025
Upload 067-arpo_kl-ablation-3b_nextgqa-ckpt_418/generation_config.json with huggingface_hub b946a24 verified CserDu123 commited on Nov 9, 2025
Upload 067-arpo_kl-ablation-3b_nextgqa-ckpt_418/model-00002-of-00002.safetensors with huggingface_hub bc52700 verified CserDu123 commited on Nov 9, 2025
Upload 067-arpo_kl-ablation-3b_nextgqa-ckpt_418/config.json with huggingface_hub 59c3333 verified CserDu123 commited on Nov 9, 2025
Upload 067-arpo_kl-ablation-3b_nextgqa-ckpt_418/model.safetensors.index.json with huggingface_hub 03042f7 verified CserDu123 commited on Nov 9, 2025
Upload 067-arpo_kl-ablation-3b_nextgqa-ckpt_418/tokenizer.json with huggingface_hub 2cd697e verified CserDu123 commited on Nov 9, 2025
Upload 067-arpo_kl-ablation-3b_nextgqa-ckpt_418/chat_template.json with huggingface_hub c8d3e97 verified CserDu123 commited on Nov 9, 2025
Upload 067-arpo_kl-ablation-3b_nextgqa-ckpt_418/training_args.bin with huggingface_hub 13c7f26 verified CserDu123 commited on Nov 9, 2025
Upload 067-arpo_kl-ablation-3b_nextgqa-ckpt_418/vocab.json with huggingface_hub 1c5694e verified CserDu123 commited on Nov 9, 2025
Upload 067-arpo_kl-ablation-3b_nextgqa-ckpt_418/video_preprocessor_config.json with huggingface_hub 6282e43 verified CserDu123 commited on Nov 9, 2025
Upload 067-arpo_kl-ablation-3b_nextgqa-ckpt_418/trainer_state.json with huggingface_hub 90f0d99 verified CserDu123 commited on Nov 9, 2025
Upload 075-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/merges.txt with huggingface_hub 4bcb0d4 verified CserDu123 commited on Nov 9, 2025
Upload 075-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/preprocessor_config.json with huggingface_hub 7c0b2fd verified CserDu123 commited on Nov 9, 2025
Upload 075-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/special_tokens_map.json with huggingface_hub 203f3c6 verified CserDu123 commited on Nov 9, 2025
Upload 075-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model-00001-of-00004.safetensors with huggingface_hub 469a52d verified CserDu123 commited on Nov 9, 2025
Upload 075-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/tokenizer_config.json with huggingface_hub 8c28d63 verified CserDu123 commited on Nov 9, 2025
Upload 075-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/added_tokens.json with huggingface_hub a441075 verified CserDu123 commited on Nov 9, 2025
Upload 075-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/generation_config.json with huggingface_hub 809170e verified CserDu123 commited on Nov 9, 2025
Upload 075-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model-00004-of-00004.safetensors with huggingface_hub 0abdb72 verified CserDu123 commited on Nov 9, 2025
Upload 075-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/config.json with huggingface_hub 5786292 verified CserDu123 commited on Nov 9, 2025
Upload 075-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model-00003-of-00004.safetensors with huggingface_hub 540e0ee verified CserDu123 commited on Nov 9, 2025
Upload 075-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model.safetensors.index.json with huggingface_hub 8eb1537 verified CserDu123 commited on Nov 9, 2025
Upload 075-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/tokenizer.json with huggingface_hub e0ca236 verified CserDu123 commited on Nov 9, 2025
Upload 075-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model-00002-of-00004.safetensors with huggingface_hub 3004235 verified CserDu123 commited on Nov 9, 2025
Upload 075-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/chat_template.json with huggingface_hub 1762394 verified CserDu123 commited on Nov 9, 2025
Upload 075-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/training_args.bin with huggingface_hub 80f27a8 verified CserDu123 commited on Nov 9, 2025
Upload 075-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/vocab.json with huggingface_hub 80b4efc verified CserDu123 commited on Nov 9, 2025
Upload 075-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/video_preprocessor_config.json with huggingface_hub b009ae1 verified CserDu123 commited on Nov 9, 2025
Upload 075-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/trainer_state.json with huggingface_hub 3dfe61f verified CserDu123 commited on Nov 9, 2025
Upload 073-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/merges.txt with huggingface_hub ad2fc6b verified CserDu123 commited on Nov 9, 2025
Upload 073-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/preprocessor_config.json with huggingface_hub dccae2c verified CserDu123 commited on Nov 9, 2025
Upload 073-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/special_tokens_map.json with huggingface_hub b84faa5 verified CserDu123 commited on Nov 9, 2025
Upload 073-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model-00001-of-00004.safetensors with huggingface_hub 2632adb verified CserDu123 commited on Nov 9, 2025
Upload 073-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/tokenizer_config.json with huggingface_hub 29d9252 verified CserDu123 commited on Nov 9, 2025
Upload 073-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/added_tokens.json with huggingface_hub 2fe5c71 verified CserDu123 commited on Nov 9, 2025
Upload 073-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/generation_config.json with huggingface_hub f6f8ecc verified CserDu123 commited on Nov 9, 2025
Upload 073-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model-00004-of-00004.safetensors with huggingface_hub ab929ab verified CserDu123 commited on Nov 9, 2025
Upload 073-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/config.json with huggingface_hub 6072889 verified CserDu123 commited on Nov 9, 2025
Upload 073-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model-00003-of-00004.safetensors with huggingface_hub 72b2a24 verified CserDu123 commited on Nov 9, 2025
Upload 073-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model.safetensors.index.json with huggingface_hub e1c359e verified CserDu123 commited on Nov 9, 2025