Upload 064-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/preprocessor_config.json with huggingface_hub cb8d2d4 verified CserDu123 commited on Nov 8, 2025
Upload 064-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/special_tokens_map.json with huggingface_hub e61fed1 verified CserDu123 commited on Nov 8, 2025
Upload 064-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/model-00001-of-00004.safetensors with huggingface_hub bb7b6ee verified CserDu123 commited on Nov 8, 2025
Upload 064-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/tokenizer_config.json with huggingface_hub 542fe03 verified CserDu123 commited on Nov 8, 2025
Upload 064-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/added_tokens.json with huggingface_hub 82ad88b verified CserDu123 commited on Nov 8, 2025
Upload 064-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/generation_config.json with huggingface_hub 6b7e7cd verified CserDu123 commited on Nov 8, 2025
Upload 064-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/model-00004-of-00004.safetensors with huggingface_hub a5ce156 verified CserDu123 commited on Nov 8, 2025
Upload 064-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/config.json with huggingface_hub e551d37 verified CserDu123 commited on Nov 8, 2025
Upload 064-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/model-00003-of-00004.safetensors with huggingface_hub 2494fd4 verified CserDu123 commited on Nov 8, 2025
Upload 064-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/model.safetensors.index.json with huggingface_hub 2b41e8b verified CserDu123 commited on Nov 8, 2025
Upload 064-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/tokenizer.json with huggingface_hub 2ad6536 verified CserDu123 commited on Nov 8, 2025
Upload 064-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/model-00002-of-00004.safetensors with huggingface_hub eefce91 verified CserDu123 commited on Nov 8, 2025
Upload 064-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/chat_template.json with huggingface_hub 5c844a3 verified CserDu123 commited on Nov 8, 2025
Upload 064-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/training_args.bin with huggingface_hub e389423 verified CserDu123 commited on Nov 8, 2025
Upload 064-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/vocab.json with huggingface_hub c36e88a verified CserDu123 commited on Nov 8, 2025
Upload 064-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/video_preprocessor_config.json with huggingface_hub 1ea054b verified CserDu123 commited on Nov 8, 2025
Upload 064-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/trainer_state.json with huggingface_hub 777e066 verified CserDu123 commited on Nov 8, 2025
Upload 062-arpo_kl-7b-length_reward-seed_bench_r1-ckpt_376/merges.txt with huggingface_hub 69cf2e3 verified CserDu123 commited on Nov 8, 2025
Upload 062-arpo_kl-7b-length_reward-seed_bench_r1-ckpt_376/preprocessor_config.json with huggingface_hub 0597a8f verified CserDu123 commited on Nov 8, 2025
Upload 062-arpo_kl-7b-length_reward-seed_bench_r1-ckpt_376/special_tokens_map.json with huggingface_hub 183bd68 verified CserDu123 commited on Nov 8, 2025
Upload 062-arpo_kl-7b-length_reward-seed_bench_r1-ckpt_376/model-00001-of-00004.safetensors with huggingface_hub 4d12ea2 verified CserDu123 commited on Nov 8, 2025
Upload 062-arpo_kl-7b-length_reward-seed_bench_r1-ckpt_376/tokenizer_config.json with huggingface_hub 55d7225 verified CserDu123 commited on Nov 8, 2025
Upload 062-arpo_kl-7b-length_reward-seed_bench_r1-ckpt_376/added_tokens.json with huggingface_hub 893aa92 verified CserDu123 commited on Nov 8, 2025
Upload 062-arpo_kl-7b-length_reward-seed_bench_r1-ckpt_376/generation_config.json with huggingface_hub 314632d verified CserDu123 commited on Nov 8, 2025
Upload 062-arpo_kl-7b-length_reward-seed_bench_r1-ckpt_376/model-00004-of-00004.safetensors with huggingface_hub 49e180a verified CserDu123 commited on Nov 8, 2025
Upload 062-arpo_kl-7b-length_reward-seed_bench_r1-ckpt_376/config.json with huggingface_hub e321b75 verified CserDu123 commited on Nov 8, 2025
Upload 062-arpo_kl-7b-length_reward-seed_bench_r1-ckpt_376/model-00003-of-00004.safetensors with huggingface_hub 99c6365 verified CserDu123 commited on Nov 8, 2025
Upload 062-arpo_kl-7b-length_reward-seed_bench_r1-ckpt_376/model.safetensors.index.json with huggingface_hub 628a238 verified CserDu123 commited on Nov 8, 2025
Upload 062-arpo_kl-7b-length_reward-seed_bench_r1-ckpt_376/tokenizer.json with huggingface_hub 51caa4f verified CserDu123 commited on Nov 8, 2025
Upload 062-arpo_kl-7b-length_reward-seed_bench_r1-ckpt_376/model-00002-of-00004.safetensors with huggingface_hub de354aa verified CserDu123 commited on Nov 8, 2025
Upload 062-arpo_kl-7b-length_reward-seed_bench_r1-ckpt_376/chat_template.json with huggingface_hub f9d05c2 verified CserDu123 commited on Nov 8, 2025
Upload 062-arpo_kl-7b-length_reward-seed_bench_r1-ckpt_376/training_args.bin with huggingface_hub 2f69767 verified CserDu123 commited on Nov 8, 2025
Upload 062-arpo_kl-7b-length_reward-seed_bench_r1-ckpt_376/vocab.json with huggingface_hub b9043e1 verified CserDu123 commited on Nov 8, 2025
Upload 062-arpo_kl-7b-length_reward-seed_bench_r1-ckpt_376/video_preprocessor_config.json with huggingface_hub 5ef206b verified CserDu123 commited on Nov 8, 2025
Upload 062-arpo_kl-7b-length_reward-seed_bench_r1-ckpt_376/trainer_state.json with huggingface_hub 0a10c05 verified CserDu123 commited on Nov 8, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/merges.txt with huggingface_hub a16c507 verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/preprocessor_config.json with huggingface_hub fd354f0 verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/special_tokens_map.json with huggingface_hub 11770a3 verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/model-00001-of-00004.safetensors with huggingface_hub ba02f4c verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/tokenizer_config.json with huggingface_hub d64e74e verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/added_tokens.json with huggingface_hub 5b53169 verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/generation_config.json with huggingface_hub aaf4778 verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/model-00004-of-00004.safetensors with huggingface_hub d50818c verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/config.json with huggingface_hub 30b1efb verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/model-00003-of-00004.safetensors with huggingface_hub 3234ab6 verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/model.safetensors.index.json with huggingface_hub d3f1d82 verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/tokenizer.json with huggingface_hub ad08734 verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/model-00002-of-00004.safetensors with huggingface_hub 21f9c93 verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/chat_template.json with huggingface_hub 75afb58 verified CserDu123 commited on Nov 7, 2025
Upload 058-arpo_kl-7b-perception_test-ckpt_396/training_args.bin with huggingface_hub 40b22db verified CserDu123 commited on Nov 7, 2025