Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- .gitattributes +1 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-5442/global_step5442/zero_pp_rank_10_mp_rank_00_model_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-9070/global_step9070/zero_pp_rank_8_mp_rank_00_model_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-9070/global_step9070/zero_pp_rank_9_mp_rank_00_model_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt +3 -0
.gitattributes
CHANGED
|
@@ -38,3 +38,4 @@ MuCodec/test_wav/test.wav filter=lfs diff=lfs merge=lfs -text
|
|
| 38 |
checkpoints/Qwen3-0.6B/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 39 |
wandb/run-20260316_191457-oo5exfjc/run-oo5exfjc.wandb filter=lfs diff=lfs merge=lfs -text
|
| 40 |
output_qwen3_plain_ar/final/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
| 38 |
checkpoints/Qwen3-0.6B/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 39 |
wandb/run-20260316_191457-oo5exfjc/run-oo5exfjc.wandb filter=lfs diff=lfs merge=lfs -text
|
| 40 |
output_qwen3_plain_ar/final/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
wandb/run-20260401_163956-9mmp0brk/run-9mmp0brk.wandb filter=lfs diff=lfs merge=lfs -text
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7265f156b5836f7ef2c207d43aab126a2210e64a54dc91baa579e72cfafc6fcd
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f3c0e31c2ec2629220973424becdc56f3a19cbb237cd089a408aa8b990076d6a
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:271c0b6215f17e8dca7f05c8df635818f149cd797c2d548ed8602df0e3dead80
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:59322967b000662e81adff8ebcb84fc1889cb5f90882a179a59dd0b7bb34b9c0
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:517db67c9cd4e00d525c61a22fe38455da2f960a2c5713ceb07915dfda1394e1
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:962741cda94d69bc660637e3bd1be218ffa00b6990c173b74c8b5e7632b7b95c
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a970071461bd67aff9ad6f08535f00d6d99728831403ca83e22ae76cefe70657
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7e505c4adebea32332feb830591bd4d573777bb96ee8f1c3867a1c730f2c3182
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:32af47a248cf9610691d01d215db31668bc7bb97a16e1d17a0b0714954ba7d7a
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4146073d88df85648238a9b9b1d0219220b7746f1541afd2e1b803103e9b570b
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:efa057c509d32d96eb9f553d18d9facc6741713dfb940b35842199b411021e4b
|
| 3 |
+
size 229713797
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:27c018d2a0ab6b5d0c3d91befa7bd85813664d9956930645cf9ed261be2a8df0
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e3e0d87e3f7955ca662b2046de9a18e09292eac747901458c647d23fc99c40a5
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a95a27ff3f2cc0f16079a009c12a44d0bd7320fbf7ac749a81d67210549af909
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:61f56db4c99a3055165effa009c97564df0245ddf0df288fdb5952e0fb744ec1
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9368c2c79903198bf6f1ce7253700ba344de2ddb3c710a4252d7a174bf9720af
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:56f9f04c67492111a0da503a30df27b27803c67620623d8c4c71e876a9ee299b
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:62751048615aae38e8d1b6d1e95fe77d1ebc372bb19725ea7b1b2ee46e4287b8
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1dd9a42445ced4fa2002a396f097bec59f8230be16658cafde6c16276df5fb92
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:09a049b24bc38ec03cd6a4171d4b7458cdca339ff384a7c82f292b921740c03f
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0dc77ab573663bb86c5d35085cf5cc45549c2ed549379a7d50f17fff250a5ca9
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9ed8843084952f816e188761d9f9140cc243d186a9eab66d750f08ad6d1d0aca
|
| 3 |
+
size 229713797
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:64e95ae51755eab07908535bf8cbd7dd189668fd9b1f9c17caf82987347c23f9
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1699ac99270a202a614f6210f1c9ad94febd6aedffc18f3fc4bc2e697c67bcec
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a5f9f233a95e4eee4ede6c5841f6b6464fbe03bc86143c503de787eb10d2f079
|
| 3 |
+
size 229713797
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d9c2004487dcb1735230353f6436f3c533b754dd9fcbccac0f7c9a4c32b4d5c9
|
| 3 |
+
size 229713797
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c5369bcc4b129fb4baa0628de34b5a0d20122640481c98c406de2e8b2bcccedb
|
| 3 |
+
size 229713797
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c936c3f81c58825206b84df480c2a897e988e9e6e0f3068fa190b3d602f76f6f
|
| 3 |
+
size 229713797
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:70260936db5c513e70188850e0421db1795933fd9647067ff17b568071aeff46
|
| 3 |
+
size 229713797
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f4727ea737106b284861c375b119c6277ab8eff94810296f3eaab3f1459f0612
|
| 3 |
+
size 229713797
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cbe180b104dabe979d41aeb47cc9e4e61dd110d07cb8730e39d1c7945327bd7c
|
| 3 |
+
size 229713797
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0b865728d3c529d4c078a1d81896a49a3d815a91561b21099ccc3411fa4cf9f3
|
| 3 |
+
size 158167
|
output_qwen3_plain_ar/checkpoint-5442/global_step5442/zero_pp_rank_10_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b1b037300183b0b43b2dd7d0ab50dcac57bbb32afe381b0d45e27730743ca05b
|
| 3 |
+
size 158419
|
output_qwen3_plain_ar/checkpoint-9070/global_step9070/zero_pp_rank_8_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9704ccfc7c293de7d8b7c7eb75f4fca3eb8a30b131b6d7c6803b0dd96183dc82
|
| 3 |
+
size 158103
|
output_qwen3_plain_ar/checkpoint-9070/global_step9070/zero_pp_rank_9_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b718496cc673161da335b958fc560af7d1950ef7451ddd8cd13801cce6f988df
|
| 3 |
+
size 158103
|
output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:030dc55543d596b5504ce068647d95104ff1f84de13af639d0bb50bc1c3f89a5
|
| 3 |
+
size 229713797
|
output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:760d31106fb934eee2f7714152b2ebb59336e99cdec6adbbfb8d4887d7a5867a
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:046770aede095eb24c8662a110740f85ff45854bf8b49d00950beaa65e144ce1
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:455955b98871f599284a98ac420e8d5b813f992dd87746e6966b321373a528fe
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5014ed546880ee701dfce8fe31a172f267f78e92b414fe8b5560c276fb626938
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7331c673b3c5719a6215a7f61506223010f21f49d5fb4801dd679c9f5d9b6a44
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:51820c9dd37e4d50df433374db9c5885109d8affba6a7d1c7cdd01313c5a1cce
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:943d57e2fa6f2816bc98045cd1f9af33e7b8a457ad7d4b52f1a006859600edc6
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1ac073d33f854abc08dd1c3d8ebf56caf2edf9c90b6269bef51bc570914e2b9b
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7e3e6a0eca36484be0c1e06af50455acbf23b09fe98a4f844bc48185adee1679
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5e5ba3352a08d04bcee34e0a816ee2f19d6dc2f96cc412ace4bffd78927dc81f
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3dab6a97c5620b734af9ada7fc0c54cad649e1063900b2fea18cf61cf51061e6
|
| 3 |
+
size 229713797
|
output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6540ad47d39dde6387776858c20c8b8b8b3a95635b16b5ba7546ec2603e9ea36
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-9977/global_step9977/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:569b3c2dfad62dd06a2a62bdc116bec931a74b98d97ffc29e10334c39e82aad9
|
| 3 |
+
size 229713809
|