Upload 062-arpo_kl-7b-length_reward-seed_bench_r1-ckpt_376/video_preprocessor_config.json with huggingface_hub 5ef206b verified CserDu123 commited on Nov 8, 2025
Upload 062-arpo_kl-7b-length_reward-seed_bench_r1-ckpt_376/trainer_state.json with huggingface_hub 0a10c05 verified CserDu123 commited on Nov 8, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/merges.txt with huggingface_hub a16c507 verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/preprocessor_config.json with huggingface_hub fd354f0 verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/special_tokens_map.json with huggingface_hub 11770a3 verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/model-00001-of-00004.safetensors with huggingface_hub ba02f4c verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/tokenizer_config.json with huggingface_hub d64e74e verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/added_tokens.json with huggingface_hub 5b53169 verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/generation_config.json with huggingface_hub aaf4778 verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/model-00004-of-00004.safetensors with huggingface_hub d50818c verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/config.json with huggingface_hub 30b1efb verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/model-00003-of-00004.safetensors with huggingface_hub 3234ab6 verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/model.safetensors.index.json with huggingface_hub d3f1d82 verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/tokenizer.json with huggingface_hub ad08734 verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/model-00002-of-00004.safetensors with huggingface_hub 21f9c93 verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/chat_template.json with huggingface_hub 75afb58 verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/training_args.bin with huggingface_hub 40b22db verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/vocab.json with huggingface_hub b4b9d20 verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/video_preprocessor_config.json with huggingface_hub 436b244 verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/trainer_state.json with huggingface_hub f64ecbe verified CserDu123 commited on Nov 7, 2025
Upload results/ARPO/057-grpo-7b_nextgqa/checkpoint-418/merges.txt with huggingface_hub c472f3b verified CserDu123 commited on Nov 7, 2025
Upload results/ARPO/057-grpo-7b_nextgqa/checkpoint-418/preprocessor_config.json with huggingface_hub 7728f94 verified CserDu123 commited on Nov 7, 2025
Upload results/ARPO/057-grpo-7b_nextgqa/checkpoint-418/special_tokens_map.json with huggingface_hub da02e1a verified CserDu123 commited on Nov 7, 2025
Upload results/ARPO/057-grpo-7b_nextgqa/checkpoint-418/model-00001-of-00004.safetensors with huggingface_hub 793ffee verified CserDu123 commited on Nov 7, 2025
Upload results/ARPO/057-grpo-7b_nextgqa/checkpoint-418/tokenizer_config.json with huggingface_hub eb38809 verified CserDu123 commited on Nov 7, 2025
Upload results/ARPO/057-grpo-7b_nextgqa/checkpoint-418/added_tokens.json with huggingface_hub e3c4ab9 verified CserDu123 commited on Nov 7, 2025
Upload results/ARPO/057-grpo-7b_nextgqa/checkpoint-418/generation_config.json with huggingface_hub 03f3788 verified CserDu123 commited on Nov 7, 2025
Upload results/ARPO/057-grpo-7b_nextgqa/checkpoint-418/model-00004-of-00004.safetensors with huggingface_hub f0137b1 verified CserDu123 commited on Nov 7, 2025
Upload results/ARPO/057-grpo-7b_nextgqa/checkpoint-418/config.json with huggingface_hub b87ef7a verified CserDu123 commited on Nov 7, 2025
Upload results/ARPO/057-grpo-7b_nextgqa/checkpoint-418/model-00003-of-00004.safetensors with huggingface_hub ca669a0 verified CserDu123 commited on Nov 7, 2025
Upload results/ARPO/057-grpo-7b_nextgqa/checkpoint-418/model.safetensors.index.json with huggingface_hub 92cec90 verified CserDu123 commited on Nov 7, 2025
Upload results/ARPO/057-grpo-7b_nextgqa/checkpoint-418/tokenizer.json with huggingface_hub e57479a verified CserDu123 commited on Nov 7, 2025
Upload results/ARPO/057-grpo-7b_nextgqa/checkpoint-418/model-00002-of-00004.safetensors with huggingface_hub b3be1f1 verified CserDu123 commited on Nov 7, 2025
Upload results/ARPO/057-grpo-7b_nextgqa/checkpoint-418/chat_template.json with huggingface_hub 2568547 verified CserDu123 commited on Nov 7, 2025
Upload results/ARPO/057-grpo-7b_nextgqa/checkpoint-418/training_args.bin with huggingface_hub 3d07133 verified CserDu123 commited on Nov 7, 2025
Upload results/ARPO/057-grpo-7b_nextgqa/checkpoint-418/vocab.json with huggingface_hub 2d96f38 verified CserDu123 commited on Nov 7, 2025
Upload results/ARPO/057-grpo-7b_nextgqa/checkpoint-418/video_preprocessor_config.json with huggingface_hub 041bc0e verified CserDu123 commited on Nov 7, 2025
Upload results/ARPO/057-grpo-7b_nextgqa/checkpoint-418/trainer_state.json with huggingface_hub edf6ed4 verified CserDu123 commited on Nov 7, 2025
Upload 056-arpo_kl-7b_nextgqa-ckpt_418/merges.txt with huggingface_hub 1847b95 verified CserDu123 commited on Nov 7, 2025
Upload 056-arpo_kl-7b_nextgqa-ckpt_418/preprocessor_config.json with huggingface_hub fd16cc8 verified CserDu123 commited on Nov 7, 2025
Upload 056-arpo_kl-7b_nextgqa-ckpt_418/special_tokens_map.json with huggingface_hub 864e47b verified CserDu123 commited on Nov 7, 2025
Upload 056-arpo_kl-7b_nextgqa-ckpt_418/model-00001-of-00004.safetensors with huggingface_hub 98a9763 verified CserDu123 commited on Nov 7, 2025
Upload 056-arpo_kl-7b_nextgqa-ckpt_418/tokenizer_config.json with huggingface_hub ca1d4cd verified CserDu123 commited on Nov 7, 2025
Upload 056-arpo_kl-7b_nextgqa-ckpt_418/added_tokens.json with huggingface_hub 3b07fe0 verified CserDu123 commited on Nov 7, 2025
Upload 056-arpo_kl-7b_nextgqa-ckpt_418/generation_config.json with huggingface_hub 23fd3b0 verified CserDu123 commited on Nov 7, 2025
Upload 056-arpo_kl-7b_nextgqa-ckpt_418/model-00004-of-00004.safetensors with huggingface_hub 399090c verified CserDu123 commited on Nov 7, 2025
Upload 056-arpo_kl-7b_nextgqa-ckpt_418/config.json with huggingface_hub e9fbaf1 verified CserDu123 commited on Nov 7, 2025
Upload 056-arpo_kl-7b_nextgqa-ckpt_418/model-00003-of-00004.safetensors with huggingface_hub 6ceb02e verified CserDu123 commited on Nov 7, 2025
Upload 056-arpo_kl-7b_nextgqa-ckpt_418/model.safetensors.index.json with huggingface_hub e25a992 verified CserDu123 commited on Nov 7, 2025
Upload 056-arpo_kl-7b_nextgqa-ckpt_418/tokenizer.json with huggingface_hub 9ccf11c verified CserDu123 commited on Nov 7, 2025