Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- .gitattributes +22 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/global_step576/mp_rank_00_model_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/global_step64/mp_rank_00_model_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/global_step704/mp_rank_00_model_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/global_step768/mp_rank_00_model_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/global_step832/mp_rank_00_model_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/global_step896/mp_rank_00_model_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/global_step1024/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/global_step128/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/global_step256/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/global_step256/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/global_step256/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/global_step320/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/global_step320/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/global_step320/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/global_step384/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/global_step448/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/global_step448/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/global_step448/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/global_step576/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/global_step64/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/global_step640/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/global_step640/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/global_step640/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/global_step640/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/global_step768/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/global_step768/mp_rank_00_model_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/global_step832/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/global_step832/mp_rank_00_model_states.pt +3 -0
- dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
.gitattributes
CHANGED
|
@@ -248,3 +248,25 @@ dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-704/tokenizer.json filter=lfs
|
|
| 248 |
dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-640/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 249 |
dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-768/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 250 |
dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-832/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 248 |
dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-640/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 249 |
dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-768/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 250 |
dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-832/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 251 |
+
dapo_miss_openmath_20251129_124147/checkpoint-64/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 252 |
+
dapo_miss_openmath_20251129_124147/checkpoint-640/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 253 |
+
dapo_miss_openmath_20251129_124147/checkpoint-704/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 254 |
+
dapo_vera_qwen2_5_1_5b_20251126_190555/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 255 |
+
dapo_vera_qwen2_5_1_5b_20251126_190555/checkpoint-128/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 256 |
+
dapo_vera_qwen2_5_1_5b_20251126_190555/checkpoint-512/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 257 |
+
dapo_vera_qwen2_5_1_5b_20251126_190555/checkpoint-64/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 258 |
+
dapo_vera_qwen2_5_1_5b_20251126_190555/checkpoint-576/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 259 |
+
dapo_vera_qwen2_5_1_5b_20251126_190555/checkpoint-640/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 260 |
+
dapo_vera_qwen2_5_1_5b_20251126_190555/checkpoint-704/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 261 |
+
dapo_vera_qwen2_5_1_5b_20251126_190555/checkpoint-896/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 262 |
+
dapo_miss_openmath_20251129_124147/checkpoint-320/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 263 |
+
dapo_miss_openmath_20251129_124147/checkpoint-384/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 264 |
+
dapo_miss_openmath_20251129_124147/checkpoint-512/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 265 |
+
dapo_miss_openmath_20251129_124147/checkpoint-576/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 266 |
+
dapo_miss_openmath_20251129_124147/checkpoint-448/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 267 |
+
grpo_full_qwen2_5_3b_20251121_111716/checkpoint-320/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 268 |
+
grpo_full_qwen2_5_3b_20251121_111716/checkpoint-448/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 269 |
+
grpo_full_qwen2_5_3b_20251121_111716/checkpoint-256/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 270 |
+
grpo_full_qwen2_5_3b_20251121_111716/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 271 |
+
dr_grpo_lora_20251129_132413/checkpoint-832/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 272 |
+
dr_grpo_lora_20251129_132413/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/global_step576/mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:32090f502f89c5ce439a705bde1785a7dae55f1a600979241ecc78ca9957b1e7
|
| 3 |
+
size 503979621
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/global_step64/mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fa611488de911e1ba5306a5a8d17904e70da19cd595c4c3e09b5383ffaa33c4b
|
| 3 |
+
size 503979621
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/global_step704/mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:823c8514ebc363ea1d8d4bfec8d78188c6f72fda3a644c1e858d4a045880fbb9
|
| 3 |
+
size 503979621
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/global_step768/mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c59c16a883c6c4fc8bc7ae48aba3a672e6c0d6e694721f330f16d91f1f886eea
|
| 3 |
+
size 503979621
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/global_step832/mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:36343337d0322ed9fb30c20d107efeafc32cfd5dd766a972a30e8b8ce114190b
|
| 3 |
+
size 503979621
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/global_step896/mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:809e151150c1183179f3d0784f821e958b9e7324228bb5550d26221b5dd38a01
|
| 3 |
+
size 503979621
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/global_step1024/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eb9a1368496a2bed392b95369f79fec35a57b3c62b3bd80197810b42bd9389a2
|
| 3 |
+
size 74329221
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/global_step128/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:70d07ec86689e3c779b769ccbbc337fd3ddd250258b11dadaaf583bfe81c8020
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/global_step256/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:47954bde48542a6ba04bb52e47b513658cc225c1e699adf9bbc1c824fb2d461c
|
| 3 |
+
size 74329221
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/global_step256/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2ba3f0d95896f8ed1d0188db9322ddb48faf417e1de55034c0060719780cd5a2
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/global_step256/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:880bb29973459cf2cff32253d869dfd3ef8d564c25ccc633ec5cf948b7c39d95
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/global_step320/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6e12d040379345577f4704eb334bd32c689b2247f0493178a3b1dfe0fa8523e5
|
| 3 |
+
size 74329221
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/global_step320/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:36d23da84b7c47a684f37f8d814600cdb651a8bc764994a1c048b0086fba9403
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/global_step320/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:16a471c03553ded5b3a3930aecf2f173ad913d755cf28242094567a48a94ddc5
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/global_step384/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e4beefa2d2c5cf4dc397ac5c5fee02c758f8369f51dc85a1ff0a3437d439700c
|
| 3 |
+
size 74329221
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/global_step448/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:79da1c05cd29c7de4d6bcb7732bf2e63df6e157e33140a6d8f129bb55fa50707
|
| 3 |
+
size 74329221
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/global_step448/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:72ff2de492369f2339a036e0d1014831b4085ed7e51eefb7e07fba9bc39e8f59
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/global_step448/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a29cee684cd619bcca3d26b88582535c285ff405fb0541e9a50c6c2cd780e285
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a6fa0fcb72d2c9bf445ce3a5cc4e358dd947a263fb0543befa849ab3f23ab43b
|
| 3 |
+
size 74329221
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5397bc580c67f923f28da4469b59d572c1d35390ffa348b6c5a6c85ae6b09ef8
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e1c91f95dbcb3cac073f1b69eba13e216b27ce3c8938a67cf28448f85e76150b
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9c726624dc7b014566288304716dc118c328c1fda90d812c7606032fd48a918c
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6d51b5543e195f5303bf9684fbf29946087ee091ccdb0f439c27389e0f73485e
|
| 3 |
+
size 74329221
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d01327fc9600c278c2d2fe42980af40d5c0a86fa85d2b8602deb37d35e577126
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/global_step576/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:95f1d81d4b9d225aed9e75118301478e5ab5c8e18f7262dffe44ebfecc667267
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aa20027452bf3a45967e71636ade26e5439af1bff4a7025e72190eed1029419a
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:82c49228a77e0c006391edf8fb96d2a537a2f5d86cfa9f78bebc9e13be7dc7e5
|
| 3 |
+
size 74329221
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0e47169e54d2d117bdb8f756548415769af4bc208906812c1c3ecff01fe55e0b
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:61f1f2049264ef85634ea60cf95e790e17d167f91e746152731e8a713cff550e
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/global_step64/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d2c491480d6cf17b52bb62b53e23f7cde17676b2b0e67f9fd96de53e62561a3d
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/global_step640/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1410c38eb02cc7af2f5ac8c87c206b053e492a2fbf4a628a684b05120a2c5346
|
| 3 |
+
size 74329221
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/global_step640/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:95cdb5ae0f99e9af12739c0ca47ad55473aa16b05f3008384825f93933654ff0
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/global_step640/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8d3dc0f542996d4c53711beaeec8d8cb995f6c5b0c441d7d2f94cda2a95397c1
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/global_step640/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1590e6adf6a4a5040f829218649834cf58c3a18394aca277c1c7c3c0a7b0da3a
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:27c566b90d796c77d54604be49873c04b3407863fbb1c0cd43a814f15d3c15da
|
| 3 |
+
size 74329221
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:caceb0f7f03acf4a84fc15df3e8ea1aebbf20e5dee5e87ad0822ffb7048d27ab
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c8b9de7fc8ffd80abeb36d0fc9b2f41b51beabe8d70fcb1c36a960ea64a8a9d5
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cd4f48a5acc5b9219f5089a1fee3daa3cef19aeca87d9aed283a3f79518940ed
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:abedb71854ec2f9d68ab8f997ab83b3db32ede8fbbee0b07b3eb638d5c935d69
|
| 3 |
+
size 74329221
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bb845a1583232c8a958ac155ec63fe607eec3b0eed2945b21687115ef89d3e91
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1a54b5d552927a509bccf584bbae14adfbca058fa70a4529843e454629669874
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/global_step768/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c054068cd7e9c875a7e6036a9ae9df854d7e0e24e9341ec4ec8cc9323510037b
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/global_step768/mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ba224e5db0b74895b0fa7f2e7b40cc98b645b1be5dd8eab75526e11f4e5efe46
|
| 3 |
+
size 49768921
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/global_step832/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0856d5a3c028b7904a68e826c310f92d058a0b909e12534b88ffd7b0eb46ccb0
|
| 3 |
+
size 74329221
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f9630adb5c76f67a729d045957e61ea35dc5d84119f720dc1b5d485bb2e874c0
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:450cca4b307af59a79381f663a72ef0c898798df72d5daa67ebe8134010ff30d
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8a63733088a000cb0f4db84ac38a65a90eb404fe6caacb4ff1b2755377d53723
|
| 3 |
+
size 74329285
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/global_step832/mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8d12aa1ab5163139fb0115229f08899e321d73f1698c2aa7c0f773565b0ae1f5
|
| 3 |
+
size 49768921
|
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dfeca6115b229b02549c658101c32e10a1e81492c9209ab40a8d286d91d507dd
|
| 3 |
+
size 74329221
|