Upload 105-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/model-00003-of-00004.safetensors with huggingface_hub 77d6b2d verified CserDu123 commited on Nov 19, 2025
Upload 105-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/model.safetensors.index.json with huggingface_hub af7c137 verified CserDu123 commited on Nov 19, 2025
Upload 105-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/tokenizer.json with huggingface_hub 37b5ae6 verified CserDu123 commited on Nov 19, 2025
Upload 105-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/model-00002-of-00004.safetensors with huggingface_hub f210a16 verified CserDu123 commited on Nov 19, 2025
Upload 105-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/chat_template.json with huggingface_hub 7b21867 verified CserDu123 commited on Nov 19, 2025
Upload 105-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/training_args.bin with huggingface_hub 2bbf993 verified CserDu123 commited on Nov 19, 2025
Upload 105-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/vocab.json with huggingface_hub 2ae1b83 verified CserDu123 commited on Nov 19, 2025
Upload 105-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/video_preprocessor_config.json with huggingface_hub 684982e verified CserDu123 commited on Nov 19, 2025
Upload 105-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/trainer_state.json with huggingface_hub e2ae997 verified CserDu123 commited on Nov 19, 2025
Upload 104-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/merges.txt with huggingface_hub 6de3b51 verified CserDu123 commited on Nov 19, 2025
Upload 104-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/preprocessor_config.json with huggingface_hub bdce939 verified CserDu123 commited on Nov 19, 2025
Upload 104-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/special_tokens_map.json with huggingface_hub 285e850 verified CserDu123 commited on Nov 19, 2025
Upload 104-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/model-00001-of-00004.safetensors with huggingface_hub 91f3341 verified CserDu123 commited on Nov 19, 2025
Upload 104-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/tokenizer_config.json with huggingface_hub de95f53 verified CserDu123 commited on Nov 19, 2025
Upload 104-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/added_tokens.json with huggingface_hub 141bd19 verified CserDu123 commited on Nov 19, 2025
Upload 104-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/generation_config.json with huggingface_hub 8afa10a verified CserDu123 commited on Nov 19, 2025
Upload 104-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/model-00004-of-00004.safetensors with huggingface_hub 030e1df verified CserDu123 commited on Nov 19, 2025
Upload 104-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/config.json with huggingface_hub 7993c5f verified CserDu123 commited on Nov 19, 2025
Upload 104-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/model-00003-of-00004.safetensors with huggingface_hub f985fcc verified CserDu123 commited on Nov 19, 2025
Upload 104-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/model.safetensors.index.json with huggingface_hub 6dc372e verified CserDu123 commited on Nov 19, 2025
Upload 104-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/tokenizer.json with huggingface_hub 43ef8aa verified CserDu123 commited on Nov 19, 2025
Upload 104-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/model-00002-of-00004.safetensors with huggingface_hub 26eaa78 verified CserDu123 commited on Nov 19, 2025
Upload 104-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/chat_template.json with huggingface_hub 4a7fbee verified CserDu123 commited on Nov 19, 2025
Upload 104-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/training_args.bin with huggingface_hub 99729ff verified CserDu123 commited on Nov 19, 2025
Upload 104-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/vocab.json with huggingface_hub da42b87 verified CserDu123 commited on Nov 19, 2025
Upload 104-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/video_preprocessor_config.json with huggingface_hub 7d3a787 verified CserDu123 commited on Nov 19, 2025
Upload 104-arpo_kl-7b-ablation-seed_bench_r1-ckpt_376/trainer_state.json with huggingface_hub 7a30d36 verified CserDu123 commited on Nov 19, 2025
Upload 103-arpo_kl-3b-dynamic_sampling-seed_bench_r1-ckpt_184/merges.txt with huggingface_hub db9a4f2 verified CserDu123 commited on Nov 13, 2025
Upload 103-arpo_kl-3b-dynamic_sampling-seed_bench_r1-ckpt_184/preprocessor_config.json with huggingface_hub 5587096 verified CserDu123 commited on Nov 13, 2025
Upload 103-arpo_kl-3b-dynamic_sampling-seed_bench_r1-ckpt_184/special_tokens_map.json with huggingface_hub 79651a4 verified CserDu123 commited on Nov 13, 2025
Upload 103-arpo_kl-3b-dynamic_sampling-seed_bench_r1-ckpt_184/model-00001-of-00002.safetensors with huggingface_hub 925116a verified CserDu123 commited on Nov 13, 2025
Upload 103-arpo_kl-3b-dynamic_sampling-seed_bench_r1-ckpt_184/tokenizer_config.json with huggingface_hub 564e1d8 verified CserDu123 commited on Nov 13, 2025
Upload 103-arpo_kl-3b-dynamic_sampling-seed_bench_r1-ckpt_184/added_tokens.json with huggingface_hub 5b10e58 verified CserDu123 commited on Nov 13, 2025
Upload 103-arpo_kl-3b-dynamic_sampling-seed_bench_r1-ckpt_184/generation_config.json with huggingface_hub c324637 verified CserDu123 commited on Nov 13, 2025
Upload 103-arpo_kl-3b-dynamic_sampling-seed_bench_r1-ckpt_184/model-00002-of-00002.safetensors with huggingface_hub dba11a8 verified CserDu123 commited on Nov 13, 2025
Upload 103-arpo_kl-3b-dynamic_sampling-seed_bench_r1-ckpt_184/config.json with huggingface_hub 5c02aa1 verified CserDu123 commited on Nov 13, 2025
Upload 103-arpo_kl-3b-dynamic_sampling-seed_bench_r1-ckpt_184/model.safetensors.index.json with huggingface_hub 40701c3 verified CserDu123 commited on Nov 13, 2025
Upload 103-arpo_kl-3b-dynamic_sampling-seed_bench_r1-ckpt_184/tokenizer.json with huggingface_hub 00dbcd1 verified CserDu123 commited on Nov 13, 2025
Upload 103-arpo_kl-3b-dynamic_sampling-seed_bench_r1-ckpt_184/chat_template.json with huggingface_hub 875aa38 verified CserDu123 commited on Nov 13, 2025
Upload 103-arpo_kl-3b-dynamic_sampling-seed_bench_r1-ckpt_184/training_args.bin with huggingface_hub 1839ab2 verified CserDu123 commited on Nov 13, 2025
Upload 103-arpo_kl-3b-dynamic_sampling-seed_bench_r1-ckpt_184/vocab.json with huggingface_hub c4356ac verified CserDu123 commited on Nov 13, 2025
Upload 103-arpo_kl-3b-dynamic_sampling-seed_bench_r1-ckpt_184/video_preprocessor_config.json with huggingface_hub 5e6e57c verified CserDu123 commited on Nov 13, 2025
Upload 103-arpo_kl-3b-dynamic_sampling-seed_bench_r1-ckpt_184/trainer_state.json with huggingface_hub afdd37d verified CserDu123 commited on Nov 13, 2025
Upload 102-arpo_kl-7b-dynamic_sampling-seed_bench_r1-ckpt_182/merges.txt with huggingface_hub 8ffc5ce verified CserDu123 commited on Nov 13, 2025
Upload 102-arpo_kl-7b-dynamic_sampling-seed_bench_r1-ckpt_182/preprocessor_config.json with huggingface_hub bafc983 verified CserDu123 commited on Nov 13, 2025
Upload 102-arpo_kl-7b-dynamic_sampling-seed_bench_r1-ckpt_182/special_tokens_map.json with huggingface_hub 6ee35d3 verified CserDu123 commited on Nov 13, 2025
Upload 102-arpo_kl-7b-dynamic_sampling-seed_bench_r1-ckpt_182/model-00001-of-00004.safetensors with huggingface_hub a9ea695 verified CserDu123 commited on Nov 13, 2025
Upload 102-arpo_kl-7b-dynamic_sampling-seed_bench_r1-ckpt_182/tokenizer_config.json with huggingface_hub f00db46 verified CserDu123 commited on Nov 13, 2025
Upload 102-arpo_kl-7b-dynamic_sampling-seed_bench_r1-ckpt_182/added_tokens.json with huggingface_hub 2957d3e verified CserDu123 commited on Nov 13, 2025
Upload 102-arpo_kl-7b-dynamic_sampling-seed_bench_r1-ckpt_182/generation_config.json with huggingface_hub 3940508 verified CserDu123 commited on Nov 13, 2025