Upload 078-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/trainer_state.json with huggingface_hub 973fa6e verified CserDu123 commited on Nov 9, 2025
Upload 076-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/merges.txt with huggingface_hub f885d6f verified CserDu123 commited on Nov 9, 2025
Upload 076-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/preprocessor_config.json with huggingface_hub 363ea41 verified CserDu123 commited on Nov 9, 2025
Upload 076-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/special_tokens_map.json with huggingface_hub c3733bc verified CserDu123 commited on Nov 9, 2025
Upload 076-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model-00001-of-00004.safetensors with huggingface_hub 2a008f4 verified CserDu123 commited on Nov 9, 2025
Upload 076-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/tokenizer_config.json with huggingface_hub f0c271b verified CserDu123 commited on Nov 9, 2025
Upload 076-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/added_tokens.json with huggingface_hub b936da2 verified CserDu123 commited on Nov 9, 2025
Upload 076-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/generation_config.json with huggingface_hub 26d32b1 verified CserDu123 commited on Nov 9, 2025
Upload 076-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model-00004-of-00004.safetensors with huggingface_hub aca1bdc verified CserDu123 commited on Nov 9, 2025
Upload 076-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/config.json with huggingface_hub d366c39 verified CserDu123 commited on Nov 9, 2025
Upload 076-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model-00003-of-00004.safetensors with huggingface_hub f3b08d1 verified CserDu123 commited on Nov 9, 2025
Upload 076-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model.safetensors.index.json with huggingface_hub 7e793d7 verified CserDu123 commited on Nov 9, 2025
Upload 076-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/tokenizer.json with huggingface_hub dc8ae00 verified CserDu123 commited on Nov 9, 2025
Upload 076-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model-00002-of-00004.safetensors with huggingface_hub 84be072 verified CserDu123 commited on Nov 9, 2025
Upload 076-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/chat_template.json with huggingface_hub 2588143 verified CserDu123 commited on Nov 9, 2025
Upload 076-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/training_args.bin with huggingface_hub 4b4b231 verified CserDu123 commited on Nov 9, 2025
Upload 076-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/vocab.json with huggingface_hub 5a505ed verified CserDu123 commited on Nov 9, 2025
Upload 076-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/video_preprocessor_config.json with huggingface_hub 184d194 verified CserDu123 commited on Nov 9, 2025
Upload 076-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/trainer_state.json with huggingface_hub 4e1538a verified CserDu123 commited on Nov 9, 2025
Upload 077-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/merges.txt with huggingface_hub f55134c verified CserDu123 commited on Nov 9, 2025
Upload 077-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/preprocessor_config.json with huggingface_hub 3661211 verified CserDu123 commited on Nov 9, 2025
Upload 077-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/special_tokens_map.json with huggingface_hub 0ea2273 verified CserDu123 commited on Nov 9, 2025
Upload 077-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model-00001-of-00004.safetensors with huggingface_hub 427cfd8 verified CserDu123 commited on Nov 9, 2025
Upload 077-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/tokenizer_config.json with huggingface_hub bba73f5 verified CserDu123 commited on Nov 9, 2025
Upload 077-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/added_tokens.json with huggingface_hub 740ff16 verified CserDu123 commited on Nov 9, 2025
Upload 077-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/generation_config.json with huggingface_hub 2290cf6 verified CserDu123 commited on Nov 9, 2025
Upload 077-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model-00004-of-00004.safetensors with huggingface_hub 365f340 verified CserDu123 commited on Nov 9, 2025
Upload 077-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/config.json with huggingface_hub c4af460 verified CserDu123 commited on Nov 9, 2025
Upload 077-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model-00003-of-00004.safetensors with huggingface_hub 63fe4f7 verified CserDu123 commited on Nov 9, 2025
Upload 077-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model.safetensors.index.json with huggingface_hub 55fcd57 verified CserDu123 commited on Nov 9, 2025
Upload 077-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/tokenizer.json with huggingface_hub ef92661 verified CserDu123 commited on Nov 9, 2025
Upload 077-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model-00002-of-00004.safetensors with huggingface_hub e34e63a verified CserDu123 commited on Nov 9, 2025
Upload 077-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/chat_template.json with huggingface_hub efe33eb verified CserDu123 commited on Nov 9, 2025
Upload 077-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/training_args.bin with huggingface_hub 8a71f95 verified CserDu123 commited on Nov 9, 2025
Upload 077-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/vocab.json with huggingface_hub 95bc4eb verified CserDu123 commited on Nov 9, 2025
Upload 077-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/video_preprocessor_config.json with huggingface_hub 6dbcd6b verified CserDu123 commited on Nov 9, 2025
Upload 077-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/trainer_state.json with huggingface_hub 1b433d5 verified CserDu123 commited on Nov 9, 2025
Upload 068-new-arpo_kl-ablation-7b_nextgqa-ckpt_418/merges.txt with huggingface_hub 3bf1dca verified CserDu123 commited on Nov 9, 2025
Upload 068-new-arpo_kl-ablation-7b_nextgqa-ckpt_418/preprocessor_config.json with huggingface_hub 8bdb49c verified CserDu123 commited on Nov 9, 2025
Upload 068-new-arpo_kl-ablation-7b_nextgqa-ckpt_418/special_tokens_map.json with huggingface_hub 2f5058b verified CserDu123 commited on Nov 9, 2025
Upload 068-new-arpo_kl-ablation-7b_nextgqa-ckpt_418/model-00001-of-00004.safetensors with huggingface_hub 38174e2 verified CserDu123 commited on Nov 9, 2025
Upload 068-new-arpo_kl-ablation-7b_nextgqa-ckpt_418/tokenizer_config.json with huggingface_hub 0144b6e verified CserDu123 commited on Nov 9, 2025
Upload 068-new-arpo_kl-ablation-7b_nextgqa-ckpt_418/added_tokens.json with huggingface_hub 736b837 verified CserDu123 commited on Nov 9, 2025
Upload 068-new-arpo_kl-ablation-7b_nextgqa-ckpt_418/generation_config.json with huggingface_hub 82a6d65 verified CserDu123 commited on Nov 9, 2025
Upload 068-new-arpo_kl-ablation-7b_nextgqa-ckpt_418/model-00004-of-00004.safetensors with huggingface_hub ed7bf6d verified CserDu123 commited on Nov 9, 2025
Upload 068-new-arpo_kl-ablation-7b_nextgqa-ckpt_418/config.json with huggingface_hub 7e61f50 verified CserDu123 commited on Nov 9, 2025
Upload 068-new-arpo_kl-ablation-7b_nextgqa-ckpt_418/model-00003-of-00004.safetensors with huggingface_hub b34920a verified CserDu123 commited on Nov 9, 2025
Upload 068-new-arpo_kl-ablation-7b_nextgqa-ckpt_418/model.safetensors.index.json with huggingface_hub 37e9844 verified CserDu123 commited on Nov 9, 2025
Upload 068-new-arpo_kl-ablation-7b_nextgqa-ckpt_418/tokenizer.json with huggingface_hub 380e263 verified CserDu123 commited on Nov 9, 2025
Upload 068-new-arpo_kl-ablation-7b_nextgqa-ckpt_418/model-00002-of-00004.safetensors with huggingface_hub 752d5ad verified CserDu123 commited on Nov 9, 2025