Upload 055-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/merges.txt with huggingface_hub b2894de verified CserDu123 commited on Nov 7, 2025
Upload 055-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/preprocessor_config.json with huggingface_hub 6f88b84 verified CserDu123 commited on Nov 7, 2025
Upload 055-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/special_tokens_map.json with huggingface_hub 747edf3 verified CserDu123 commited on Nov 7, 2025
Upload 055-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model-00001-of-00004.safetensors with huggingface_hub b1c795b verified CserDu123 commited on Nov 7, 2025
Upload 055-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/tokenizer_config.json with huggingface_hub eebb2c2 verified CserDu123 commited on Nov 7, 2025
Upload 055-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/added_tokens.json with huggingface_hub 2a45d5b verified CserDu123 commited on Nov 7, 2025
Upload 055-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/generation_config.json with huggingface_hub cec407f verified CserDu123 commited on Nov 7, 2025
Upload 055-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model-00004-of-00004.safetensors with huggingface_hub 970e216 verified CserDu123 commited on Nov 7, 2025
Upload 055-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/config.json with huggingface_hub 7e38197 verified CserDu123 commited on Nov 7, 2025
Upload 055-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model-00003-of-00004.safetensors with huggingface_hub bc7b8f1 verified CserDu123 commited on Nov 7, 2025
Upload 055-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model.safetensors.index.json with huggingface_hub bbd6391 verified CserDu123 commited on Nov 7, 2025
Upload 055-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/tokenizer.json with huggingface_hub 6e45ffa verified CserDu123 commited on Nov 7, 2025
Upload 055-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/model-00002-of-00004.safetensors with huggingface_hub 2443524 verified CserDu123 commited on Nov 7, 2025
Upload 055-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/chat_template.json with huggingface_hub 2100c9b verified CserDu123 commited on Nov 7, 2025
Upload 055-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/training_args.bin with huggingface_hub 8ac6a05 verified CserDu123 commited on Nov 7, 2025
Upload 055-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/vocab.json with huggingface_hub 9b0bdd5 verified CserDu123 commited on Nov 7, 2025
Upload 055-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/video_preprocessor_config.json with huggingface_hub a8a1b0b verified CserDu123 commited on Nov 7, 2025
Upload 055-arpo_kl-7b-ablation_seed_bench_r1-ckpt_376/trainer_state.json with huggingface_hub 8988ba1 verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/merges.txt with huggingface_hub 2b7b874 verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/preprocessor_config.json with huggingface_hub 73f20e2 verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/special_tokens_map.json with huggingface_hub 9590b3a verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/model-00001-of-00004.safetensors with huggingface_hub 0096963 verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/tokenizer_config.json with huggingface_hub c830955 verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/added_tokens.json with huggingface_hub 0dcf583 verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/generation_config.json with huggingface_hub 37b4532 verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/model-00004-of-00004.safetensors with huggingface_hub 815ab25 verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/config.json with huggingface_hub d49b8cd verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/model-00003-of-00004.safetensors with huggingface_hub 257cedc verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/model.safetensors.index.json with huggingface_hub 933c239 verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/tokenizer.json with huggingface_hub b18a79f verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/model-00002-of-00004.safetensors with huggingface_hub e71d1bd verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/chat_template.json with huggingface_hub 2e1593d verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/training_args.bin with huggingface_hub 406102f verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/vocab.json with huggingface_hub a0dba2c verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/video_preprocessor_config.json with huggingface_hub f8f41b4 verified CserDu123 commited on Nov 7, 2025
Upload 053-tw_grpo-7b_perception_test-ckpt_396/trainer_state.json with huggingface_hub 2e08823 verified CserDu123 commited on Nov 7, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/merges.txt with huggingface_hub 5bed397 verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/preprocessor_config.json with huggingface_hub 1f447f9 verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/special_tokens_map.json with huggingface_hub 7c0578c verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/model-00001-of-00004.safetensors with huggingface_hub 3335945 verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/tokenizer_config.json with huggingface_hub 6948b0b verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/added_tokens.json with huggingface_hub 7968f26 verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/generation_config.json with huggingface_hub ac2ebc2 verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/model-00004-of-00004.safetensors with huggingface_hub bd585f3 verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/config.json with huggingface_hub e298385 verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/model-00003-of-00004.safetensors with huggingface_hub d883793 verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/model.safetensors.index.json with huggingface_hub 964be6a verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/tokenizer.json with huggingface_hub cf81eff verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/model-00002-of-00004.safetensors with huggingface_hub 40dd8be verified CserDu123 commited on Nov 6, 2025
Upload 052-tw_grpo-7b_seed_bench_r1-ckpt_376/chat_template.json with huggingface_hub fdfd9ed verified CserDu123 commited on Nov 6, 2025