Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- .gitattributes +23 -0
- ICL/DAPO/verl-recipe/flowrl/figures/flowrl.png +3 -0
- ICL/DAPO/verl-recipe/qat/img/image1.png +3 -0
- ICL/DAPO/verl-recipe/qat/img/image2.png +3 -0
- ICL/DAPO/verl-recipe/qat/img/image3.png +3 -0
- ICL/DAPO/verl-recipe/qat/img/image4.png +3 -0
- ICL/LV/dataset_inspect.schemas.json +3 -0
- ICL/RL/plots/completion_terminated_length.png +3 -0
- ICL/RL/plots/kl_divergence.png +3 -0
- ICL/RL/plots/loss.png +3 -0
- ICL/RL/plots/overview.png +3 -0
- ICL/RL/plots/reward.png +3 -0
- ICL/RL/plots/reward_detail.png +3 -0
- ICL/RL/plots/step_time.png +3 -0
- ICL/RL/trl_source/assets/logo-light.png +3 -0
- ICL/RL/trl_source/trl/trainer/__pycache__/grpo_trainer.cpython-313.pyc +3 -0
- ICL/SFT_new/eval_results/eval_val_20260403_161423.json +3 -0
- ICL/SFT_new/eval_results/eval_val_20260403_163019.json +3 -0
- ICL/SFT_new/eval_results/eval_val_20260403_164141.json +3 -0
- ICL/SFT_new/eval_results/eval_val_20260404_135535.json +3 -0
- ICL/SFT_new/eval_results/eval_val_20260406_040033.json +3 -0
- ICL/SFT_new/eval_results/eval_val_20260407_053929.json +3 -0
- ICL/SFT_new/eval_results/eval_val_latest.json +3 -0
- ICL/dataset_inspect.schemas.json +3 -0
- ICL/sft_model/epoch3_step1406_fp32/model-00001-of-00008.safetensors +3 -0
- ICL/sft_model/epoch3_step1406_fp32/model-00002-of-00008.safetensors +3 -0
- ICL/sft_model/epoch3_step1406_fp32/model-00003-of-00008.safetensors +3 -0
- ICL/sft_model/epoch3_step1406_fp32/model-00004-of-00008.safetensors +3 -0
- ICL/sft_model/epoch3_step1406_fp32/model-00005-of-00008.safetensors +3 -0
- ICL/sft_model/epoch3_step1406_fp32/model-00006-of-00008.safetensors +3 -0
- ICL/sft_model/epoch3_step1406_fp32/model-00007-of-00008.safetensors +3 -0
- ICL/sft_model/epoch3_step1406_fp32/model-00008-of-00008.safetensors +3 -0
- ICL/sft_model/final/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- ICL/sft_model/final/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
- ICL/sft_model/final/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
- ICL/sft_model/final/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
- ICL/sft_model/final/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
- ICL/sft_model/final/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
- ICL/sft_model/final/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
- ICL/sft_model/final/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- ICL/sft_model/final/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- ICL/sft_model/final/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- ICL/sft_model/final/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +3 -0
- ICL/sft_model/final/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt +3 -0
- ICL/sft_model/final/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt +3 -0
- ICL/sft_model/final/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt +3 -0
- ICL/sft_model/final/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt +3 -0
- ICL/sft_model/final/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt +3 -0
- ICL/sft_model/final/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- ICL/sft_model/final/zero_pp_rank_10_mp_rank_00_model_states.pt +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,26 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
ICL/RL/trl_source/trl/trainer/__pycache__/grpo_trainer.cpython-313.pyc filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
ICL/RL/plots/overview.png filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
ICL/RL/trl_source/assets/logo-light.png filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
ICL/SFT_new/eval_results/eval_val_20260403_161423.json filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
ICL/DAPO/verl-recipe/qat/img/image2.png filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
ICL/DAPO/verl-recipe/qat/img/image4.png filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
ICL/DAPO/verl-recipe/qat/img/image3.png filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
ICL/LV/dataset_inspect.schemas.json filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
ICL/dataset_inspect.schemas.json filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
ICL/DAPO/verl-recipe/qat/img/image1.png filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
ICL/DAPO/verl-recipe/flowrl/figures/flowrl.png filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
ICL/SFT_new/eval_results/eval_val_20260407_053929.json filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
ICL/SFT_new/eval_results/eval_val_20260406_040033.json filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
ICL/SFT_new/eval_results/eval_val_latest.json filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
ICL/SFT_new/eval_results/eval_val_20260404_135535.json filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
ICL/SFT_new/eval_results/eval_val_20260403_164141.json filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
ICL/RL/plots/reward.png filter=lfs diff=lfs merge=lfs -text
|
| 53 |
+
ICL/RL/plots/reward_detail.png filter=lfs diff=lfs merge=lfs -text
|
| 54 |
+
ICL/RL/plots/step_time.png filter=lfs diff=lfs merge=lfs -text
|
| 55 |
+
ICL/RL/plots/kl_divergence.png filter=lfs diff=lfs merge=lfs -text
|
| 56 |
+
ICL/RL/plots/completion_terminated_length.png filter=lfs diff=lfs merge=lfs -text
|
| 57 |
+
ICL/RL/plots/loss.png filter=lfs diff=lfs merge=lfs -text
|
| 58 |
+
ICL/SFT_new/eval_results/eval_val_20260403_163019.json filter=lfs diff=lfs merge=lfs -text
|
ICL/DAPO/verl-recipe/flowrl/figures/flowrl.png
ADDED
|
Git LFS Details
|
ICL/DAPO/verl-recipe/qat/img/image1.png
ADDED
|
Git LFS Details
|
ICL/DAPO/verl-recipe/qat/img/image2.png
ADDED
|
Git LFS Details
|
ICL/DAPO/verl-recipe/qat/img/image3.png
ADDED
|
Git LFS Details
|
ICL/DAPO/verl-recipe/qat/img/image4.png
ADDED
|
Git LFS Details
|
ICL/LV/dataset_inspect.schemas.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a66fb74f3220136d8910a7287bd70b7d3dfe9a9038c0e94e1f078598215eae22
|
| 3 |
+
size 131773150
|
ICL/RL/plots/completion_terminated_length.png
ADDED
|
Git LFS Details
|
ICL/RL/plots/kl_divergence.png
ADDED
|
Git LFS Details
|
ICL/RL/plots/loss.png
ADDED
|
Git LFS Details
|
ICL/RL/plots/overview.png
ADDED
|
Git LFS Details
|
ICL/RL/plots/reward.png
ADDED
|
Git LFS Details
|
ICL/RL/plots/reward_detail.png
ADDED
|
Git LFS Details
|
ICL/RL/plots/step_time.png
ADDED
|
Git LFS Details
|
ICL/RL/trl_source/assets/logo-light.png
ADDED
|
Git LFS Details
|
ICL/RL/trl_source/trl/trainer/__pycache__/grpo_trainer.cpython-313.pyc
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bf8a45c462259c95e85b528d08312f573e2f8f2b49ccba4520c19a922a6f86e3
|
| 3 |
+
size 111750
|
ICL/SFT_new/eval_results/eval_val_20260403_161423.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9115add0560bcaf24bfe4a86376a058fdd1062ea39dc98a0f89dc4070f735cf6
|
| 3 |
+
size 73357999
|
ICL/SFT_new/eval_results/eval_val_20260403_163019.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7b2ede88ea04913c716f490c0bc603ed762c15944db68d3018cdf4d76a258a6d
|
| 3 |
+
size 73357999
|
ICL/SFT_new/eval_results/eval_val_20260403_164141.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ed8e56f90fc398311661760bf9804ede3919e045d7930eec385cc8a9f03a577a
|
| 3 |
+
size 13380826
|
ICL/SFT_new/eval_results/eval_val_20260404_135535.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ee5f475959dea8d2b6054008c000278e8adbc56b73299bd04bf053fb25d6038
|
| 3 |
+
size 13614172
|
ICL/SFT_new/eval_results/eval_val_20260406_040033.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:58442e061f013c65083f37f1b81f732c45917e858ba7d0de800fd9b003d47852
|
| 3 |
+
size 13614171
|
ICL/SFT_new/eval_results/eval_val_20260407_053929.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0278b419a1cda69240f2ead4c5c9c20e4f3f5c55cdf2e43abf4a9781a5f1407c
|
| 3 |
+
size 13614173
|
ICL/SFT_new/eval_results/eval_val_latest.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0278b419a1cda69240f2ead4c5c9c20e4f3f5c55cdf2e43abf4a9781a5f1407c
|
| 3 |
+
size 13614173
|
ICL/dataset_inspect.schemas.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a66fb74f3220136d8910a7287bd70b7d3dfe9a9038c0e94e1f078598215eae22
|
| 3 |
+
size 131773150
|
ICL/sft_model/epoch3_step1406_fp32/model-00001-of-00008.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:956273bc71e29c89b14d3511a2ea82457990091518795159ee2b31d07d910c72
|
| 3 |
+
size 4958393960
|
ICL/sft_model/epoch3_step1406_fp32/model-00002-of-00008.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23dad69d99e176a0441a6c7159575864507eb283138be2985bb031ac745b2aea
|
| 3 |
+
size 4832049608
|
ICL/sft_model/epoch3_step1406_fp32/model-00003-of-00008.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1bfbcd41c343359ca4d5a311ecbbcbf46a47eb013bdc9b2298bd025405962400
|
| 3 |
+
size 4832049624
|
ICL/sft_model/epoch3_step1406_fp32/model-00004-of-00008.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:68f4c63b799b37e8ec837866fe491342bcbc6357bd7a240a49a12cb944a136ab
|
| 3 |
+
size 4999856656
|
ICL/sft_model/epoch3_step1406_fp32/model-00005-of-00008.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ee6c01232f7cc496d9f9c39498b3a2db1d69befad2088a699cfd5cc4857aa5c8
|
| 3 |
+
size 4832049680
|
ICL/sft_model/epoch3_step1406_fp32/model-00006-of-00008.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:95e0648042f88d033039e7fe4f604f61d531a6ac596428e3a7f38f4fd6016930
|
| 3 |
+
size 4832049672
|
ICL/sft_model/epoch3_step1406_fp32/model-00007-of-00008.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b5f0756c34ce46f9130b6cab182e04fba2bc3e0d0579b2b64b3cf41bc76ad8f1
|
| 3 |
+
size 3288524864
|
ICL/sft_model/epoch3_step1406_fp32/model-00008-of-00008.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e6b1cd69a615f82fda5cc5e2c3bd6c5f7cd176c434056707a9a16a5832e9377b
|
| 3 |
+
size 2485026944
|
ICL/sft_model/final/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ca4b60aa7696aa4d046c145ad402a088b9fe2ff7d4fe06af9ca7c334db04b134
|
| 3 |
+
size 6573736572
|
ICL/sft_model/final/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:61788c2c6d848850dcdd917badd0e1a6d13a7eea1c62d16ab14891607bb41cfd
|
| 3 |
+
size 6573736579
|
ICL/sft_model/final/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6224e39ac79938208d53b49d10d56f85d570e20d2fc62cc2752788fa909afdfa
|
| 3 |
+
size 6573736579
|
ICL/sft_model/final/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:265ce64eb99df5387525955544bc2014831201d56cceb71b20f60002bb075dd9
|
| 3 |
+
size 6573736579
|
ICL/sft_model/final/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:004298254e7d182c7a30c8d80529234312d5a7874f0e1e6c49b82b3d37b0bb47
|
| 3 |
+
size 6573736579
|
ICL/sft_model/final/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:757e6d7353534cd0062008b6f8532e9c4d3b970e8d83f21681fef1cd51505df8
|
| 3 |
+
size 6573736579
|
ICL/sft_model/final/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:12a98ed1389b083c9d0b354a536afab56ff0a4097ba982cc87fa156c2d6997dd
|
| 3 |
+
size 6573736579
|
ICL/sft_model/final/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:45b8f8b10bcc52e445f0d5d68fa589afa28348ee2d83be18d8dcfe36889c92f5
|
| 3 |
+
size 6573736572
|
ICL/sft_model/final/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6207e3336074d4d28c852a37edba15823f297a9e87939ddccc7e73d47c306567
|
| 3 |
+
size 6573736572
|
ICL/sft_model/final/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cd0bf955c6f9736d120b4f96a8383c9d168c2f2738297ed405ccd4423d4afb0f
|
| 3 |
+
size 6573736572
|
ICL/sft_model/final/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5af3ad76a6fed5e135c5e013f7611ad8928c7774eacfec0afdd3e22184b469c1
|
| 3 |
+
size 6573736572
|
ICL/sft_model/final/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:704d46917ad406649380aaca206b4bd5e337c2b3e736c0c1c4d4d0fe6f47107a
|
| 3 |
+
size 6573736572
|
ICL/sft_model/final/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:098c371bc81b3d0cdb79f56f5b1330c4c33554c9a52693dab5e2affee9b1aad2
|
| 3 |
+
size 6573736572
|
ICL/sft_model/final/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3589040bc46bf07a80cffebf0ee6a3ecd127c5b4227fb0e9a54d842117c2ae30
|
| 3 |
+
size 6573736572
|
ICL/sft_model/final/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b419b4a97d3dd62f8508bb125e7bcc3d104d737b93cdddce4ff51d3bd0b50c14
|
| 3 |
+
size 6573736572
|
ICL/sft_model/final/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bccc66d0614cd2c73a1af98180f5aff38830b26f40f1c64a7d6860024ed90503
|
| 3 |
+
size 6573736572
|
ICL/sft_model/final/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e101c44d1ed036f0afac833bd62ed7b0d87e6757cca52a73bcefc0b6b85be2cb
|
| 3 |
+
size 389860
|
ICL/sft_model/final/zero_pp_rank_10_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:010906bc4d4fde5cc7316901226854dae856722033634412cb9d4e3834d136bf
|
| 3 |
+
size 390614
|