Ctrl+K
- grpo_is-qwen3-4b-base-beh-qwen3-8b-seqlen-16384-bs-128-lr-1e-5-ds-synthetic-2-qwen-dm--0.08-dm-0.3-g-0.99_seqlen_8192_bs_128_micro_bs_1_lr_1e-5_dapo-math-17k-dedup
- grpo_is-qwen3-4b-base-beh-qwen3-8b-seqlen-16384-bs-128-lr-1e-5-ds-synthetic__eff-1.0-nmode-flip-chunksize-1_seqlen_16384_epochs_2_bs_128_micro_bs_1_lr_1e-6_dapo-math-17k-dedup
- grpo_is-qwen3-4b-base-beh-qwen3-8b-seqlen-16384-bs-128-lr-3e-5-ds-synthetic-2-sft-verified-merged-json-dm_seqlen_8192_bs_128_lr_1e-5_data_dapo-math-17k-small-processed-parquet
- grpo_is-qwen3-8b-base-beh-qwen3-8b-seqlen-16384-bs-128-lr-3e-5-ds-synthetic-2-qwen3-8b-8192-sft-dm--0.08-_seqlen_8192_bs_128_micro_bs_1_lr_1e-5_data_dapo-math-17k-small-processed-parquet
- grpo_sft-qwen3-4b-base-seqlen-16384-bs-128-lr-1e-5-wd-0.01-ds-synthetic-2-qwen_seqlen_8192_bs_128_micro_bs_1_lr_1e-5_dapo-math-17k-dedup
- grpo_sft-qwen3-8b-base-seqlen-16384-bs-128-lr-1e-5-wd-0.01-ds-synthetic-2-qwen_seqlen_8192_bs_128_micro_bs_1_lr_1e-5_dapo-math-17k-dedup
- grpo_sft_qwen3-4b-base_seqlen_16384_bs_128_lr_3e-5_wd_0.01_ds_synthetic-2_qwen3-8b_8192_sft-global-step-7_seqlen_8192_bs_128_lr_1e-5_data_dapo-math-17k-small-processed-parquet
- grpo_sft_qwen3-8b-base_seqlen_16384_bs_128_lr_3e-5_wd_0.01_ds_synthetic-2_qwen3-8b_8192_sft-global-step-7_seqlen_8192_bs_128_lr_1e-5_data_dapo-math-17k-small-processed-parquet
- is_qwen3-8b-base_beh_qwen3-8b_seqlen_16384_bs_128_lr_1e-5_ds_synthetic-2-qwen_dm_-0.08_dM_0.3_g_0.999_ncoeff_1.0_nmode_flip_chunksize_1
- is_qwen3-8b-base_beh_qwen3-8b_seqlen_16384_bs_1_lr_3e-5_ds_synthetic-2-qwen_dm_-0.08_func_importance-sampling-weight-logspace_dM_0.3_g_0.999_ncoeff_1.0_nmode_flip_chunksize_1
- sft_qwen3-8b-base_seqlen_16384_bs_128_lr_1e-5_wd_0.01_ds_synthetic-2-qwen
- sft_qwen3-8b-base_seqlen_16384_bs_128_lr_3e-5_wd_0.01_ds_synthetic-2_qwen3-8b_8192_sft
- 3.81 kB