Upload 026-grpo-3b-kl_1e-2-perception_test_6k-ckpt-396/chat_template.json with huggingface_hub 2aa87ee verified CserDu123 commited on Nov 2, 2025
Upload 026-grpo-3b-kl_1e-2-perception_test_6k-ckpt-396/training_args.bin with huggingface_hub eac48cb verified CserDu123 commited on Nov 2, 2025
Upload 026-grpo-3b-kl_1e-2-perception_test_6k-ckpt-396/vocab.json with huggingface_hub d62a5cc verified CserDu123 commited on Nov 2, 2025
Upload 026-grpo-3b-kl_1e-2-perception_test_6k-ckpt-396/video_preprocessor_config.json with huggingface_hub 2419abf verified CserDu123 commited on Nov 2, 2025
Upload 026-grpo-3b-kl_1e-2-perception_test_6k-ckpt-396/trainer_state.json with huggingface_hub 91bafcd verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/merges.txt with huggingface_hub 1e05495 verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/preprocessor_config.json with huggingface_hub cab91d2 verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/special_tokens_map.json with huggingface_hub 4c758ea verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/model-00001-of-00002.safetensors with huggingface_hub e99326e verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/tokenizer_config.json with huggingface_hub 269f14e verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/added_tokens.json with huggingface_hub e6bba1f verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/generation_config.json with huggingface_hub 2226cab verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/model-00002-of-00002.safetensors with huggingface_hub 1dba941 verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/config.json with huggingface_hub 4638d51 verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/model.safetensors.index.json with huggingface_hub acfe7e8 verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/tokenizer.json with huggingface_hub 0992f63 verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/chat_template.json with huggingface_hub bf8ae85 verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/training_args.bin with huggingface_hub b2965b4 verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/vocab.json with huggingface_hub a079392 verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/video_preprocessor_config.json with huggingface_hub a07e178 verified CserDu123 commited on Nov 2, 2025
Upload 023-dapo-3b-perception_test_6k-ckpt-396/trainer_state.json with huggingface_hub 6e0dd1d verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/merges.txt with huggingface_hub c1d42ad verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/preprocessor_config.json with huggingface_hub f6dbc7b verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/special_tokens_map.json with huggingface_hub 1ba9a7c verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/model-00001-of-00002.safetensors with huggingface_hub 9f1d22b verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/tokenizer_config.json with huggingface_hub c833565 verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/added_tokens.json with huggingface_hub 2a7ebbb verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/generation_config.json with huggingface_hub ced477e verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/model-00002-of-00002.safetensors with huggingface_hub 5c939b4 verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/config.json with huggingface_hub cd2194b verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/model.safetensors.index.json with huggingface_hub 00e67e0 verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/tokenizer.json with huggingface_hub 2efd320 verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/chat_template.json with huggingface_hub a3e17b8 verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/training_args.bin with huggingface_hub fe5093a verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/vocab.json with huggingface_hub 5b6c77a verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/video_preprocessor_config.json with huggingface_hub 9de2e63 verified CserDu123 commited on Nov 2, 2025
Upload 027-tw_grpo-3b-seed_bench_r1_6k-ckpt-376/trainer_state.json with huggingface_hub 86f7c97 verified CserDu123 commited on Nov 2, 2025
Upload 025-arpo_attn_base_grpo-kl_1e-2-3b-seed_bench_r1_6k-ckpt-376/merges.txt with huggingface_hub 1b3fbcd verified CserDu123 commited on Nov 2, 2025
Upload 025-arpo_attn_base_grpo-kl_1e-2-3b-seed_bench_r1_6k-ckpt-376/preprocessor_config.json with huggingface_hub fa77c99 verified CserDu123 commited on Nov 2, 2025
Upload 025-arpo_attn_base_grpo-kl_1e-2-3b-seed_bench_r1_6k-ckpt-376/special_tokens_map.json with huggingface_hub 365f1bf verified CserDu123 commited on Nov 2, 2025
Upload 025-arpo_attn_base_grpo-kl_1e-2-3b-seed_bench_r1_6k-ckpt-376/model-00001-of-00002.safetensors with huggingface_hub 6042c85 verified CserDu123 commited on Nov 2, 2025
Upload 025-arpo_attn_base_grpo-kl_1e-2-3b-seed_bench_r1_6k-ckpt-376/tokenizer_config.json with huggingface_hub b7f68d0 verified CserDu123 commited on Nov 2, 2025
Upload 025-arpo_attn_base_grpo-kl_1e-2-3b-seed_bench_r1_6k-ckpt-376/added_tokens.json with huggingface_hub fa7c4dc verified CserDu123 commited on Nov 2, 2025
Upload 025-arpo_attn_base_grpo-kl_1e-2-3b-seed_bench_r1_6k-ckpt-376/generation_config.json with huggingface_hub 5649d5d verified CserDu123 commited on Nov 2, 2025
Upload 025-arpo_attn_base_grpo-kl_1e-2-3b-seed_bench_r1_6k-ckpt-376/model-00002-of-00002.safetensors with huggingface_hub 1f94920 verified CserDu123 commited on Nov 2, 2025
Upload 025-arpo_attn_base_grpo-kl_1e-2-3b-seed_bench_r1_6k-ckpt-376/config.json with huggingface_hub bb9b65a verified CserDu123 commited on Nov 2, 2025
Upload 025-arpo_attn_base_grpo-kl_1e-2-3b-seed_bench_r1_6k-ckpt-376/model.safetensors.index.json with huggingface_hub 02cb8d2 verified CserDu123 commited on Nov 2, 2025
Upload 025-arpo_attn_base_grpo-kl_1e-2-3b-seed_bench_r1_6k-ckpt-376/tokenizer.json with huggingface_hub a438c6e verified CserDu123 commited on Nov 2, 2025
Upload 025-arpo_attn_base_grpo-kl_1e-2-3b-seed_bench_r1_6k-ckpt-376/chat_template.json with huggingface_hub 1d6dc84 verified CserDu123 commited on Nov 2, 2025
Upload 025-arpo_attn_base_grpo-kl_1e-2-3b-seed_bench_r1_6k-ckpt-376/training_args.bin with huggingface_hub eae7814 verified CserDu123 commited on Nov 2, 2025