Upload 071-arpo_kl-new-7b-ablation_seed_bench_r1-ckpt_376/generation_config.json with huggingface_hub 0047da4 verified CserDu123 commited on Nov 8, 2025
Upload 071-arpo_kl-new-7b-ablation_seed_bench_r1-ckpt_376/model-00004-of-00004.safetensors with huggingface_hub 14f26b8 verified CserDu123 commited on Nov 8, 2025
Upload 071-arpo_kl-new-7b-ablation_seed_bench_r1-ckpt_376/config.json with huggingface_hub 2046ef0 verified CserDu123 commited on Nov 8, 2025
Upload 071-arpo_kl-new-7b-ablation_seed_bench_r1-ckpt_376/model-00003-of-00004.safetensors with huggingface_hub dbb2905 verified CserDu123 commited on Nov 8, 2025
Upload 071-arpo_kl-new-7b-ablation_seed_bench_r1-ckpt_376/model.safetensors.index.json with huggingface_hub 806c91f verified CserDu123 commited on Nov 8, 2025
Upload 071-arpo_kl-new-7b-ablation_seed_bench_r1-ckpt_376/tokenizer.json with huggingface_hub c4e7210 verified CserDu123 commited on Nov 8, 2025
Upload 071-arpo_kl-new-7b-ablation_seed_bench_r1-ckpt_376/model-00002-of-00004.safetensors with huggingface_hub fe694f9 verified CserDu123 commited on Nov 8, 2025
Upload 071-arpo_kl-new-7b-ablation_seed_bench_r1-ckpt_376/chat_template.json with huggingface_hub b3bb350 verified CserDu123 commited on Nov 8, 2025
Upload 071-arpo_kl-new-7b-ablation_seed_bench_r1-ckpt_376/training_args.bin with huggingface_hub 6eee070 verified CserDu123 commited on Nov 8, 2025
Upload 071-arpo_kl-new-7b-ablation_seed_bench_r1-ckpt_376/vocab.json with huggingface_hub 62e0774 verified CserDu123 commited on Nov 8, 2025
Upload 071-arpo_kl-new-7b-ablation_seed_bench_r1-ckpt_376/video_preprocessor_config.json with huggingface_hub 9a8a047 verified CserDu123 commited on Nov 8, 2025
Upload 071-arpo_kl-new-7b-ablation_seed_bench_r1-ckpt_376/trainer_state.json with huggingface_hub 164f955 verified CserDu123 commited on Nov 8, 2025
Upload 070-arpo_kl-new-7b_seed_bench_r1-ckpt_376/merges.txt with huggingface_hub 2b6d4d5 verified CserDu123 commited on Nov 8, 2025
Upload 070-arpo_kl-new-7b_seed_bench_r1-ckpt_376/preprocessor_config.json with huggingface_hub 3a61a4b verified CserDu123 commited on Nov 8, 2025
Upload 070-arpo_kl-new-7b_seed_bench_r1-ckpt_376/special_tokens_map.json with huggingface_hub 937eb4d verified CserDu123 commited on Nov 8, 2025
Upload 070-arpo_kl-new-7b_seed_bench_r1-ckpt_376/model-00001-of-00004.safetensors with huggingface_hub 5b94422 verified CserDu123 commited on Nov 8, 2025
Upload 070-arpo_kl-new-7b_seed_bench_r1-ckpt_376/tokenizer_config.json with huggingface_hub 783f53f verified CserDu123 commited on Nov 8, 2025
Upload 070-arpo_kl-new-7b_seed_bench_r1-ckpt_376/added_tokens.json with huggingface_hub 28fdac8 verified CserDu123 commited on Nov 8, 2025
Upload 070-arpo_kl-new-7b_seed_bench_r1-ckpt_376/generation_config.json with huggingface_hub 1b2fb68 verified CserDu123 commited on Nov 8, 2025
Upload 070-arpo_kl-new-7b_seed_bench_r1-ckpt_376/model-00004-of-00004.safetensors with huggingface_hub 22290b0 verified CserDu123 commited on Nov 8, 2025
Upload 070-arpo_kl-new-7b_seed_bench_r1-ckpt_376/config.json with huggingface_hub c7ec08b verified CserDu123 commited on Nov 8, 2025
Upload 070-arpo_kl-new-7b_seed_bench_r1-ckpt_376/model-00003-of-00004.safetensors with huggingface_hub aebbc40 verified CserDu123 commited on Nov 8, 2025
Upload 070-arpo_kl-new-7b_seed_bench_r1-ckpt_376/model.safetensors.index.json with huggingface_hub 831333f verified CserDu123 commited on Nov 8, 2025
Upload 070-arpo_kl-new-7b_seed_bench_r1-ckpt_376/tokenizer.json with huggingface_hub f3a6aa5 verified CserDu123 commited on Nov 8, 2025
Upload 070-arpo_kl-new-7b_seed_bench_r1-ckpt_376/model-00002-of-00004.safetensors with huggingface_hub 81f1228 verified CserDu123 commited on Nov 8, 2025
Upload 070-arpo_kl-new-7b_seed_bench_r1-ckpt_376/chat_template.json with huggingface_hub 4b61129 verified CserDu123 commited on Nov 8, 2025
Upload 070-arpo_kl-new-7b_seed_bench_r1-ckpt_376/training_args.bin with huggingface_hub abc4522 verified CserDu123 commited on Nov 8, 2025
Upload 070-arpo_kl-new-7b_seed_bench_r1-ckpt_376/vocab.json with huggingface_hub 6c5a688 verified CserDu123 commited on Nov 8, 2025
Upload 070-arpo_kl-new-7b_seed_bench_r1-ckpt_376/video_preprocessor_config.json with huggingface_hub 0ddcee7 verified CserDu123 commited on Nov 8, 2025
Upload 070-arpo_kl-new-7b_seed_bench_r1-ckpt_376/trainer_state.json with huggingface_hub 3dcdf68 verified CserDu123 commited on Nov 8, 2025
Upload 050-new_grpo-7b_seed_bench_r1-ckpt_376/trainer_state.json with huggingface_hub c6b1db1 verified CserDu123 commited on Nov 8, 2025
Upload 050-new_grpo-7b_seed_bench_r1-ckpt_376/merges.txt with huggingface_hub c27c870 verified CserDu123 commited on Nov 8, 2025
Upload 050-new_grpo-7b_seed_bench_r1-ckpt_376/preprocessor_config.json with huggingface_hub a4b6098 verified CserDu123 commited on Nov 8, 2025
Upload 050-new_grpo-7b_seed_bench_r1-ckpt_376/special_tokens_map.json with huggingface_hub e454cf4 verified CserDu123 commited on Nov 8, 2025
Upload 050-new_grpo-7b_seed_bench_r1-ckpt_376/model-00001-of-00004.safetensors with huggingface_hub d51688f verified CserDu123 commited on Nov 8, 2025
Upload 050-new_grpo-7b_seed_bench_r1-ckpt_376/tokenizer_config.json with huggingface_hub 003bee2 verified CserDu123 commited on Nov 8, 2025
Upload 050-new_grpo-7b_seed_bench_r1-ckpt_376/added_tokens.json with huggingface_hub 6fde0de verified CserDu123 commited on Nov 8, 2025
Upload 050-new_grpo-7b_seed_bench_r1-ckpt_376/generation_config.json with huggingface_hub 3457739 verified CserDu123 commited on Nov 8, 2025
Upload 050-new_grpo-7b_seed_bench_r1-ckpt_376/model-00004-of-00004.safetensors with huggingface_hub 3032002 verified CserDu123 commited on Nov 8, 2025
Upload 050-new_grpo-7b_seed_bench_r1-ckpt_376/config.json with huggingface_hub 09b4244 verified CserDu123 commited on Nov 8, 2025
Upload 050-new_grpo-7b_seed_bench_r1-ckpt_376/model-00003-of-00004.safetensors with huggingface_hub a59b830 verified CserDu123 commited on Nov 8, 2025
Upload 050-new_grpo-7b_seed_bench_r1-ckpt_376/model.safetensors.index.json with huggingface_hub d4a330d verified CserDu123 commited on Nov 8, 2025
Upload 050-new_grpo-7b_seed_bench_r1-ckpt_376/tokenizer.json with huggingface_hub 2db3fb1 verified CserDu123 commited on Nov 8, 2025
Upload 050-new_grpo-7b_seed_bench_r1-ckpt_376/model-00002-of-00004.safetensors with huggingface_hub d91d40c verified CserDu123 commited on Nov 8, 2025
Upload 050-new_grpo-7b_seed_bench_r1-ckpt_376/chat_template.json with huggingface_hub 7d74df2 verified CserDu123 commited on Nov 8, 2025
Upload 050-new_grpo-7b_seed_bench_r1-ckpt_376/training_args.bin with huggingface_hub 57b72c0 verified CserDu123 commited on Nov 8, 2025
Upload 050-new_grpo-7b_seed_bench_r1-ckpt_376/vocab.json with huggingface_hub 020ee63 verified CserDu123 commited on Nov 8, 2025
Upload 050-new_grpo-7b_seed_bench_r1-ckpt_376/video_preprocessor_config.json with huggingface_hub a381642 verified CserDu123 commited on Nov 8, 2025
Upload 050-new_grpo-7b_seed_bench_r1-ckpt_376/trainer_state.json with huggingface_hub fdc9a64 verified CserDu123 commited on Nov 8, 2025
Upload 044-new_grpo-7b_perception_test/merges.txt with huggingface_hub 404f845 verified CserDu123 commited on Nov 8, 2025