Upload 047-arpo_kl_v2-3b_seed_bench_r1/model.safetensors.index.json with huggingface_hub cc4121a verified CserDu123 commited on Nov 6, 2025
Upload 047-arpo_kl_v2-3b_seed_bench_r1/tokenizer.json with huggingface_hub f0a42dd verified CserDu123 commited on Nov 6, 2025
Upload 047-arpo_kl_v2-3b_seed_bench_r1/training_args.bin with huggingface_hub 3a1f8db verified CserDu123 commited on Nov 6, 2025
Upload 047-arpo_kl_v2-3b_seed_bench_r1/vocab.json with huggingface_hub 83626a9 verified CserDu123 commited on Nov 6, 2025
Upload 047-arpo_kl_v2-3b_seed_bench_r1/video_preprocessor_config.json with huggingface_hub 93da7a5 verified CserDu123 commited on Nov 6, 2025
Upload 047-arpo_kl_v2-3b_seed_bench_r1/trainer_state.json with huggingface_hub ec915be verified CserDu123 commited on Nov 6, 2025
Upload 044-grpo-7b_perception_test/merges.txt with huggingface_hub a210096 verified CserDu123 commited on Nov 6, 2025
Upload 044-grpo-7b_perception_test/preprocessor_config.json with huggingface_hub a0a74ec verified CserDu123 commited on Nov 6, 2025
Upload 044-grpo-7b_perception_test/special_tokens_map.json with huggingface_hub 9909cdb verified CserDu123 commited on Nov 6, 2025
Upload 044-grpo-7b_perception_test/model-00001-of-00004.safetensors with huggingface_hub c65d773 verified CserDu123 commited on Nov 6, 2025
Upload 044-grpo-7b_perception_test/tokenizer_config.json with huggingface_hub 14e6c68 verified CserDu123 commited on Nov 6, 2025
Upload 044-grpo-7b_perception_test/added_tokens.json with huggingface_hub 18d0db0 verified CserDu123 commited on Nov 6, 2025
Upload 044-grpo-7b_perception_test/generation_config.json with huggingface_hub 28c80ef verified CserDu123 commited on Nov 6, 2025
Upload 044-grpo-7b_perception_test/model-00004-of-00004.safetensors with huggingface_hub 560e779 verified CserDu123 commited on Nov 6, 2025
Upload 044-grpo-7b_perception_test/config.json with huggingface_hub 3e1504b verified CserDu123 commited on Nov 6, 2025
Upload 044-grpo-7b_perception_test/model-00003-of-00004.safetensors with huggingface_hub 8c82f11 verified CserDu123 commited on Nov 6, 2025
Upload 044-grpo-7b_perception_test/model.safetensors.index.json with huggingface_hub 6d8a2f8 verified CserDu123 commited on Nov 6, 2025
Upload 044-grpo-7b_perception_test/tokenizer.json with huggingface_hub de3e0fb verified CserDu123 commited on Nov 6, 2025
Upload 044-grpo-7b_perception_test/model-00002-of-00004.safetensors with huggingface_hub ebd8e09 verified CserDu123 commited on Nov 6, 2025
Upload 044-grpo-7b_perception_test/chat_template.json with huggingface_hub 9399cde verified CserDu123 commited on Nov 6, 2025
Upload 044-grpo-7b_perception_test/training_args.bin with huggingface_hub 154e48f verified CserDu123 commited on Nov 6, 2025
Upload 044-grpo-7b_perception_test/vocab.json with huggingface_hub ab8c41a verified CserDu123 commited on Nov 6, 2025
Upload 044-grpo-7b_perception_test/video_preprocessor_config.json with huggingface_hub 1ad2626 verified CserDu123 commited on Nov 6, 2025
Upload 044-grpo-7b_perception_test/trainer_state.json with huggingface_hub 04de687 verified CserDu123 commited on Nov 6, 2025
Upload 046-tw_grpo-3b_perception_test-ckpt_396/merges.txt with huggingface_hub a806529 verified CserDu123 commited on Nov 6, 2025
Upload 046-tw_grpo-3b_perception_test-ckpt_396/preprocessor_config.json with huggingface_hub 329b498 verified CserDu123 commited on Nov 6, 2025
Upload 046-tw_grpo-3b_perception_test-ckpt_396/special_tokens_map.json with huggingface_hub c6208fa verified CserDu123 commited on Nov 6, 2025
Upload 046-tw_grpo-3b_perception_test-ckpt_396/model-00001-of-00002.safetensors with huggingface_hub c229876 verified CserDu123 commited on Nov 6, 2025
Upload 046-tw_grpo-3b_perception_test-ckpt_396/tokenizer_config.json with huggingface_hub b7c3be8 verified CserDu123 commited on Nov 6, 2025
Upload 046-tw_grpo-3b_perception_test-ckpt_396/added_tokens.json with huggingface_hub cddf706 verified CserDu123 commited on Nov 6, 2025
Upload 046-tw_grpo-3b_perception_test-ckpt_396/generation_config.json with huggingface_hub 70af063 verified CserDu123 commited on Nov 6, 2025
Upload 046-tw_grpo-3b_perception_test-ckpt_396/model-00002-of-00002.safetensors with huggingface_hub 934caf0 verified CserDu123 commited on Nov 6, 2025
Upload 046-tw_grpo-3b_perception_test-ckpt_396/config.json with huggingface_hub f054f79 verified CserDu123 commited on Nov 6, 2025
Upload 046-tw_grpo-3b_perception_test-ckpt_396/model.safetensors.index.json with huggingface_hub 181201b verified CserDu123 commited on Nov 6, 2025
Upload 046-tw_grpo-3b_perception_test-ckpt_396/tokenizer.json with huggingface_hub 4bdf028 verified CserDu123 commited on Nov 6, 2025
Upload 046-tw_grpo-3b_perception_test-ckpt_396/chat_template.json with huggingface_hub 916b984 verified CserDu123 commited on Nov 6, 2025
Upload 046-tw_grpo-3b_perception_test-ckpt_396/training_args.bin with huggingface_hub e48deee verified CserDu123 commited on Nov 6, 2025
Upload 046-tw_grpo-3b_perception_test-ckpt_396/vocab.json with huggingface_hub 02d35ef verified CserDu123 commited on Nov 6, 2025
Upload 046-tw_grpo-3b_perception_test-ckpt_396/video_preprocessor_config.json with huggingface_hub a03a643 verified CserDu123 commited on Nov 6, 2025
Upload 046-tw_grpo-3b_perception_test-ckpt_396/trainer_state.json with huggingface_hub bc786b6 verified CserDu123 commited on Nov 6, 2025
Upload 045-arpo_kl-3b_ablation_perception_test-ckpt_396/merges.txt with huggingface_hub e52a479 verified CserDu123 commited on Nov 6, 2025
Upload 045-arpo_kl-3b_ablation_perception_test-ckpt_396/chat_template.jinja with huggingface_hub 0252b34 verified CserDu123 commited on Nov 6, 2025
Upload 045-arpo_kl-3b_ablation_perception_test-ckpt_396/preprocessor_config.json with huggingface_hub 59fa58c verified CserDu123 commited on Nov 6, 2025
Upload 045-arpo_kl-3b_ablation_perception_test-ckpt_396/special_tokens_map.json with huggingface_hub bc86dff verified CserDu123 commited on Nov 6, 2025
Upload 045-arpo_kl-3b_ablation_perception_test-ckpt_396/model-00001-of-00002.safetensors with huggingface_hub 464114f verified CserDu123 commited on Nov 6, 2025
Upload 045-arpo_kl-3b_ablation_perception_test-ckpt_396/tokenizer_config.json with huggingface_hub 9262e1c verified CserDu123 commited on Nov 6, 2025
Upload 045-arpo_kl-3b_ablation_perception_test-ckpt_396/added_tokens.json with huggingface_hub 666e181 verified CserDu123 commited on Nov 6, 2025
Upload 045-arpo_kl-3b_ablation_perception_test-ckpt_396/generation_config.json with huggingface_hub d909519 verified CserDu123 commited on Nov 6, 2025
Upload 045-arpo_kl-3b_ablation_perception_test-ckpt_396/model-00002-of-00002.safetensors with huggingface_hub 1ff651f verified CserDu123 commited on Nov 6, 2025
Upload 045-arpo_kl-3b_ablation_perception_test-ckpt_396/config.json with huggingface_hub 2803967 verified CserDu123 commited on Nov 6, 2025