diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..ec471175d83a8f2aab251ab2712aa03a9cc4dc12 100644 --- a/.gitattributes +++ b/.gitattributes @@ -27,6 +27,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.tar.* filter=lfs diff=lfs merge=lfs -text *.tar filter=lfs diff=lfs merge=lfs -text *.tflite filter=lfs diff=lfs merge=lfs -text +*.txt filter=lfs diff=lfs merge=lfs -text *.tgz filter=lfs diff=lfs merge=lfs -text *.wasm filter=lfs diff=lfs merge=lfs -text *.xz filter=lfs diff=lfs merge=lfs -text diff --git a/checkpoints/ckpt_0.pt b/checkpoints/ckpt_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..921f670b96f469753fef815d15292d85b7008089 --- /dev/null +++ b/checkpoints/ckpt_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9320c3d520211866da7625c142148bc60b0b1fdfc4baa83936f220a036ad0c42 +size 1493013690 diff --git a/checkpoints/ckpt_1.pt b/checkpoints/ckpt_1.pt new file mode 100644 index 0000000000000000000000000000000000000000..863372e90137c7a011c299220e805aa4cd938171 --- /dev/null +++ b/checkpoints/ckpt_1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70119048fd58b2bec766632d47f8cd3d260b387c8310ba207e31d8a4e654844b +size 1496781612 diff --git a/checkpoints/ckpt_10.pt b/checkpoints/ckpt_10.pt new file mode 100644 index 0000000000000000000000000000000000000000..52ddb80bedac8e30dc2d0469c5bc67eccfab60dd --- /dev/null +++ b/checkpoints/ckpt_10.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57aa2a94442d0b2b3059255fe8e8b8a5c3260a2088a99ba9ecaa25cc6aa5d667 +size 1517754865 diff --git a/checkpoints/ckpt_11.pt b/checkpoints/ckpt_11.pt new file mode 100644 index 0000000000000000000000000000000000000000..a88b583d242703596d300d72ddbeb0d694a5ab81 --- /dev/null +++ b/checkpoints/ckpt_11.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab0d231d83ae55a4e0e1935250cefc31845eb8029d65ef9a41c4d283d2bb5b1d +size 1517754865 diff --git a/checkpoints/ckpt_12.pt b/checkpoints/ckpt_12.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ad15428a7879e092e07145f4e49029b33283429 --- /dev/null +++ b/checkpoints/ckpt_12.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa8923e40da8e82cab8d3caa70a6a08b85c5f148975f2a5f22e710d3b40c6c40 +size 1493013114 diff --git a/checkpoints/ckpt_13.pt b/checkpoints/ckpt_13.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dabc3d81c8866d18aa614fa15ebd872cc3f78b6 --- /dev/null +++ b/checkpoints/ckpt_13.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4987627000111003e4511b6528b8d368e8f418d7466e0bf27abff1d80aed39ed +size 1493014095 diff --git a/checkpoints/ckpt_14.pt b/checkpoints/ckpt_14.pt new file mode 100644 index 0000000000000000000000000000000000000000..888edbe76918bb1a8d0cf1e7d63aef8aefad76d4 --- /dev/null +++ b/checkpoints/ckpt_14.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:befc1599dc9a1345feaaca68d2616c5b6071c03355d634dd563b9e0f16231f07 +size 1517754554 diff --git a/checkpoints/ckpt_15.pt b/checkpoints/ckpt_15.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2d03a707a8af47c7f828f583e84e72351951df3 --- /dev/null +++ b/checkpoints/ckpt_15.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93e276bfe9728e3de4cddfcc417eec44913d8f07c24584b2c2ea68a13a819a2c +size 1517754865 diff --git a/checkpoints/ckpt_16.pt b/checkpoints/ckpt_16.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fcd7122a4acaec346eed9b37f3c859370a68cb8 --- /dev/null +++ b/checkpoints/ckpt_16.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:951e6fc37a8e0ad7c06634e3a8ead40fabdbe53609f894447508462339ed2ff8 +size 1517754865 diff --git a/checkpoints/ckpt_17.pt b/checkpoints/ckpt_17.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef9dde87d706b308157d28645d49acd87af86f0a --- /dev/null +++ b/checkpoints/ckpt_17.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86c1e7f28e7ef8fe25ab7677ba9a225bfc7eb3ff8181d005e1dccebb4f560994 +size 1517754865 diff --git a/checkpoints/ckpt_18.pt b/checkpoints/ckpt_18.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e017e9c92c15b8c80b27362eeb26c9bc8d07f5a --- /dev/null +++ b/checkpoints/ckpt_18.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dbd22bc12ad8610e786959cb5c99f028f1005650b45f49b287b87b2c27438a7 +size 1517754865 diff --git a/checkpoints/ckpt_19.pt b/checkpoints/ckpt_19.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c32bada79c64aeb38243bac49d6fcff0d987bea --- /dev/null +++ b/checkpoints/ckpt_19.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67bc6b96a8fbd315ee2d547cc079b9a6568332ba8fd9038a051410f76e926086 +size 1517754865 diff --git a/checkpoints/ckpt_2.pt b/checkpoints/ckpt_2.pt new file mode 100644 index 0000000000000000000000000000000000000000..83c601567de4e6bc9e25269ec032d06605fbdf90 --- /dev/null +++ b/checkpoints/ckpt_2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de25c4f369a3759c1914e60469f9310639fb8e31c5d0c1459da4c8a3c4b97fa8 +size 1492586682 diff --git a/checkpoints/ckpt_20.pt b/checkpoints/ckpt_20.pt new file mode 100644 index 0000000000000000000000000000000000000000..f179baf665c1084ee08e435b04ab48e1a8cf6ae4 --- /dev/null +++ b/checkpoints/ckpt_20.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a7b74242b765a7a401bdb77a7a6c0c9dabb942abbe1f9af70fa1fc0d9c0c1bc +size 1517754865 diff --git a/checkpoints/ckpt_21.pt b/checkpoints/ckpt_21.pt new file mode 100644 index 0000000000000000000000000000000000000000..428f012f4970e2d502f091dc6a64cf08d7aecad0 --- /dev/null +++ b/checkpoints/ckpt_21.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c267c09917840db29a48c7f83df511b73b90f6aa6a8225760f9b6656ac64058 +size 1517754865 diff --git a/checkpoints/ckpt_22.pt b/checkpoints/ckpt_22.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c0f17ecbcfc70e77fcebde55244f4d68fe99a6b --- /dev/null +++ b/checkpoints/ckpt_22.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c4dcb7952f689b0b6ed150532ed51c18aad7e37835802ce103de8a9ecd65fe5 +size 1517754865 diff --git a/checkpoints/ckpt_23.pt b/checkpoints/ckpt_23.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c3b538d3a652eaad577b814c2142361f082b9c5 --- /dev/null +++ b/checkpoints/ckpt_23.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:051206d8d21b281c173e2bb3c19c2bc3ec126aa9337b9a4c18498b554381259c +size 1517754865 diff --git a/checkpoints/ckpt_24.pt b/checkpoints/ckpt_24.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e0789e6c628084ca72a927233b86ac56ace1ac4 --- /dev/null +++ b/checkpoints/ckpt_24.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9fe06efebcd5abe7548a36bb7b0edab8fcee239a8a99f242b6b98016dec9484 +size 1517754865 diff --git a/checkpoints/ckpt_25.pt b/checkpoints/ckpt_25.pt new file mode 100644 index 0000000000000000000000000000000000000000..43589cf924dd77485418a9e8c3ff9f9cb7e2719a --- /dev/null +++ b/checkpoints/ckpt_25.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8071125abb22689e883eee7eff885f1cd1ad874f67bee1f132e0b22d29381bb2 +size 1517754865 diff --git a/checkpoints/ckpt_26.pt b/checkpoints/ckpt_26.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8ddb8933108c4f6848683d6c4e67ae7604d3a58 --- /dev/null +++ b/checkpoints/ckpt_26.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cefc267ce7ad487e2f10202d62c0852be375e7e87315838e8d37c246cfbeb7eb +size 1517754865 diff --git a/checkpoints/ckpt_27.pt b/checkpoints/ckpt_27.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b4efe5595d852489df072b789420aa4d5d87dbe --- /dev/null +++ b/checkpoints/ckpt_27.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdcfa59daa005ddd40a17521507a21415e1a47274e8384a24f4a0e34235820e5 +size 1517754865 diff --git a/checkpoints/ckpt_28.pt b/checkpoints/ckpt_28.pt new file mode 100644 index 0000000000000000000000000000000000000000..33847d2faa097be5958a427cd9aeff397d577868 --- /dev/null +++ b/checkpoints/ckpt_28.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e06e459f7cd84ff689502d785a023277f914b5e081542c7c197b4edc9fa5269e +size 1517754865 diff --git a/checkpoints/ckpt_29.pt b/checkpoints/ckpt_29.pt new file mode 100644 index 0000000000000000000000000000000000000000..4679de45003cb6b244ea352902dddfc9f57dbf3d --- /dev/null +++ b/checkpoints/ckpt_29.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ecb72659b613b4c4836698780a5c206a4b7a05b372820f4b3819cbe3ec97b50 +size 1517754865 diff --git a/checkpoints/ckpt_3.pt b/checkpoints/ckpt_3.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e6cc73df42cd182f866a67df019f213470975b1 --- /dev/null +++ b/checkpoints/ckpt_3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fbe0a86cd506048f2e324b5a03d305c022f4d414b946686a098181b4f685619 +size 1493000203 diff --git a/checkpoints/ckpt_30.pt b/checkpoints/ckpt_30.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef3cab3d1efa70d3a423e9c1ef7b03b0ffa91168 --- /dev/null +++ b/checkpoints/ckpt_30.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:263f2374da43976831bbf5ff4e1ff2b171d096330131b61192a0facc8b485fc8 +size 1517754865 diff --git a/checkpoints/ckpt_31.pt b/checkpoints/ckpt_31.pt new file mode 100644 index 0000000000000000000000000000000000000000..1961b0a38410ba880ae6097d099697301c811d19 --- /dev/null +++ b/checkpoints/ckpt_31.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a898b5c19ae487a824ee63b28194cf267ba63a68a00c02f651c52806bb06879d +size 1517754865 diff --git a/checkpoints/ckpt_32.pt b/checkpoints/ckpt_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..88c8234875d63ca9e70a330ec1eb232338081cf4 --- /dev/null +++ b/checkpoints/ckpt_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c7b7c4e4271e23ae1fec54d21e41fc956ea6ea3669d6ffaf9eef8bb2ed8b8de +size 1517754865 diff --git a/checkpoints/ckpt_33.pt b/checkpoints/ckpt_33.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2ae131ab84cfed65d42a7ae6f95074590a100f3 --- /dev/null +++ b/checkpoints/ckpt_33.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f34a61b9b9900c54fa7434fee33244be38d68829ada7b521f26f6eb577d078e +size 1517754865 diff --git a/checkpoints/ckpt_34.pt b/checkpoints/ckpt_34.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef43a5cbf35dfe91d727c626869facec1328765f --- /dev/null +++ b/checkpoints/ckpt_34.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b6ce380723d2e3f3046fedda9239946b6cceec5ee435114d0f9a4bda44a2eaf +size 1517754865 diff --git a/checkpoints/ckpt_35.pt b/checkpoints/ckpt_35.pt new file mode 100644 index 0000000000000000000000000000000000000000..d03a6108094086521ee73432169d6e2f990a2809 --- /dev/null +++ b/checkpoints/ckpt_35.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08ab90eccfcbbec2dc04f540869d2c9869beaa8eb3a0e51c6b81c7682725de65 +size 1517754865 diff --git a/checkpoints/ckpt_36.pt b/checkpoints/ckpt_36.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c99549c9bb735ac8affe33bc0d5d47cd353236e --- /dev/null +++ b/checkpoints/ckpt_36.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ef6c0af472b0f5e6fd33cd80cb41fa204e37a8dd474df19032df09af64c60cf +size 1517754865 diff --git a/checkpoints/ckpt_37.pt b/checkpoints/ckpt_37.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d6f9625f842c2d9202e9199bf585103b20defba --- /dev/null +++ b/checkpoints/ckpt_37.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39af43a079c343e7c7475f8b31fade19cac1c8e14d489a2033c8c88c072e9a54 +size 1517754865 diff --git a/checkpoints/ckpt_38.pt b/checkpoints/ckpt_38.pt new file mode 100644 index 0000000000000000000000000000000000000000..313217ad893a487d62a8bf4b419ee24f5c2b9abb --- /dev/null +++ b/checkpoints/ckpt_38.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7e678080ee0afc703020981b1fa3ab0fad4dc1397a8fd3fd0727354735d322d +size 1517754865 diff --git a/checkpoints/ckpt_39.pt b/checkpoints/ckpt_39.pt new file mode 100644 index 0000000000000000000000000000000000000000..02fe384f24dd2fbc407726e1fe3ccced77f4d9db --- /dev/null +++ b/checkpoints/ckpt_39.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:192b41275c3143f4994ba1dbea72f1138b1dc5f9744459fa6e0dee16684bdb08 +size 1517754865 diff --git a/checkpoints/ckpt_4.pt b/checkpoints/ckpt_4.pt new file mode 100644 index 0000000000000000000000000000000000000000..f03bf0fc377604e734f8bae7c4d02a6d30e279b9 --- /dev/null +++ b/checkpoints/ckpt_4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb56792cea2e6fc9544a31809a21ef8bab8eeb0cf729f8f443fa1f46856c5d1f +size 1493000139 diff --git a/checkpoints/ckpt_40.pt b/checkpoints/ckpt_40.pt new file mode 100644 index 0000000000000000000000000000000000000000..001ffe4e1fa02fd8767fa7bba7a6ccf23c1547e4 --- /dev/null +++ b/checkpoints/ckpt_40.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42cffccaa0eec34cc74bfabc32b008b8ce6fc57f5e1400183f85ab4b204d8afc +size 1517754865 diff --git a/checkpoints/ckpt_41.pt b/checkpoints/ckpt_41.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb59751950ad62669bf743990fada045fbaac4a6 --- /dev/null +++ b/checkpoints/ckpt_41.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64d996c8f20431f0596ca3eacbba598019e2fd426baba958e4c2a6f6c694883b +size 1517754865 diff --git a/checkpoints/ckpt_42.pt b/checkpoints/ckpt_42.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a5e8642fd126abde0435d4e8e76c382b1445af4 --- /dev/null +++ b/checkpoints/ckpt_42.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:711822b99873c17715c275bf525e40dd51eda77048854630902379a57af8a19b +size 1517754865 diff --git a/checkpoints/ckpt_43.pt b/checkpoints/ckpt_43.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba9f976850d22fd6a6668373606ed3e4cc2d5f82 --- /dev/null +++ b/checkpoints/ckpt_43.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07dd2d0dab01525bc1c03f69147b7aeda44bc80b57d6e71fa89f7367e348aa94 +size 1517754865 diff --git a/checkpoints/ckpt_44.pt b/checkpoints/ckpt_44.pt new file mode 100644 index 0000000000000000000000000000000000000000..45e9404b342f982d3e3a7e1f01e4f4c466b2ced0 --- /dev/null +++ b/checkpoints/ckpt_44.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b10ab6d9b0da098620922554a20cc0fc5a3e9c3a4120f3ffb94b0dcfeb9d7a0e +size 1517754865 diff --git a/checkpoints/ckpt_45.pt b/checkpoints/ckpt_45.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f5b47bfd2cb05d7585915ff9f3868af9743797a --- /dev/null +++ b/checkpoints/ckpt_45.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9037dc1ffc9bbd0538b9cea0f64e66d38a97a772a8ffc06d5d5ad39c81736ead +size 1517754554 diff --git a/checkpoints/ckpt_5.pt b/checkpoints/ckpt_5.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c5c32ee542542cc89399608049ed7b3b99bb325 --- /dev/null +++ b/checkpoints/ckpt_5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e80d50e0580f7e31afe110c59bf95d6372813e7ea4f95ee57e2322163451fb9 +size 1493000203 diff --git a/checkpoints/ckpt_6.pt b/checkpoints/ckpt_6.pt new file mode 100644 index 0000000000000000000000000000000000000000..338ec7711074a1eb9d5565ea66e4295d56d26ab5 --- /dev/null +++ b/checkpoints/ckpt_6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c2f6b97493b3493ad2d3d7e697943d9d165ec9daa322b28c6d09db27cefb17f +size 1492586618 diff --git a/checkpoints/ckpt_7.pt b/checkpoints/ckpt_7.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e677f6d132d859336f61b7ba6c4560f7a49dc29 --- /dev/null +++ b/checkpoints/ckpt_7.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2042189b39fcd117e412004da333d552e1e6af4e103a490cfce5988d88256652 +size 1492586987 diff --git a/checkpoints/ckpt_8.pt b/checkpoints/ckpt_8.pt new file mode 100644 index 0000000000000000000000000000000000000000..e69201153c9782b8ab302edb3c7a1da2adc8bc9f --- /dev/null +++ b/checkpoints/ckpt_8.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff3a0d24cd4cd6ff986672d8066530831cc9eb32a07a21e514e7a1efae328f01 +size 1492586987 diff --git a/checkpoints/ckpt_9.pt b/checkpoints/ckpt_9.pt new file mode 100644 index 0000000000000000000000000000000000000000..a892b279022d89ff17b0439300c578d67a2d5ad2 --- /dev/null +++ b/checkpoints/ckpt_9.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2c8f3361a2f7bd76fd38891f4bd5319559e480abb6a4f8bfe0c587bbcd1ab99 +size 1496781612 diff --git a/indices/ckpt_0_indices.txt b/indices/ckpt_0_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..f0f1030a95771ccdf74ea1667bca9712e1ecbeea --- /dev/null +++ b/indices/ckpt_0_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0c536682cb1e933f59e18914b035baaed10a8c8b90e0cd5254526a88f6ce4bb +size 11143445 diff --git a/indices/ckpt_10_indices.txt b/indices/ckpt_10_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..0623fe697cb048c96836680896580c2a87652db9 --- /dev/null +++ b/indices/ckpt_10_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b0e8075e193b31fbecd403ad30ba0e7a40ff1d621971d391bcd140899ea215d +size 11143686 diff --git a/indices/ckpt_11_indices.txt b/indices/ckpt_11_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..0b5f08b29f096dc8a8140db57b6cae206f647cdf --- /dev/null +++ b/indices/ckpt_11_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d191a2c4a654779d61a25a51ce969f6c0886b1ab3757d1b8882c7ebc218d828 +size 11143264 diff --git a/indices/ckpt_12_indices.txt b/indices/ckpt_12_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..3a4a14ae93b410d43addfd2a43b8f385a3c5fd3d --- /dev/null +++ b/indices/ckpt_12_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18061ff62cac8e7ae0c1fb06d388ef6ddc13552eb79b91c69ed80cb61a760a15 +size 11142605 diff --git a/indices/ckpt_13_indices.txt b/indices/ckpt_13_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..0408d0b4a038d55ddf7f5da7d03679e872abcb9e --- /dev/null +++ b/indices/ckpt_13_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0b1754a0a19bd224d8e37d72694dbd78d408fe5ef9c20c2dde653f6640ea65e +size 11143490 diff --git a/indices/ckpt_14_indices.txt b/indices/ckpt_14_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..4deef4601c419e328ad8d206b07a2595276ce90c --- /dev/null +++ b/indices/ckpt_14_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f53a3a23f956dd2e6c871fad791cb50b2608036256824f761151dd74daca10fe +size 11143305 diff --git a/indices/ckpt_15_indices.txt b/indices/ckpt_15_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..a91e4f71c04ee9a88756f47085941637d2d1467e --- /dev/null +++ b/indices/ckpt_15_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11f715dc97b621f47acf09ff4dfc00c2b9089b65feddb17cacf72a2cec00cd0a +size 11143923 diff --git a/indices/ckpt_16_indices.txt b/indices/ckpt_16_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..4c782dde265736b223dd3c9be6ab311ef1111c1a --- /dev/null +++ b/indices/ckpt_16_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95816c6078a9adfc2c9ddf435fb6d9169f2cd6d17eec5aac3965c65c62c20d1e +size 11143815 diff --git a/indices/ckpt_17_indices.txt b/indices/ckpt_17_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..e25030f301c50222253a676b5692e3f992174fe8 --- /dev/null +++ b/indices/ckpt_17_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a3ea21087e10bc37164c12f9bcbf386912ff07457e2f054258dd5b8aaa2d0cf +size 11143783 diff --git a/indices/ckpt_18_indices.txt b/indices/ckpt_18_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..0cbb45588a736e9c0a122534cf60067f37f5b960 --- /dev/null +++ b/indices/ckpt_18_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b52a51939e2ee745198ac72d17c29826e5039e5d7f32b599ce4bd0a9ddd07a9 +size 11143367 diff --git a/indices/ckpt_19_indices.txt b/indices/ckpt_19_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..b3e0a60f7343155f225c7b57e72565421c5462b9 --- /dev/null +++ b/indices/ckpt_19_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7f45ef443d343552fb814c5b9e95e9d13c15ee11b4dd69386c0764d96803ba3 +size 11143565 diff --git a/indices/ckpt_1_indices.txt b/indices/ckpt_1_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..56a89319a43e7ca7eb5c7166acb705fe7a0b03c8 --- /dev/null +++ b/indices/ckpt_1_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39e6e003b112912fd97ad82fc74a25b956737371f9fe75b3e5c6005e9c251a3a +size 11144247 diff --git a/indices/ckpt_20_indices.txt b/indices/ckpt_20_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..8af2104ddbd7bd246a2f44e941e0fe5e1bb44d08 --- /dev/null +++ b/indices/ckpt_20_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae4eb0759216aebc43a9c0a1e50acab8f0faa9984701391e7cfc19e43ce84a0e +size 11143425 diff --git a/indices/ckpt_21_indices.txt b/indices/ckpt_21_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..630823c1125d5354f9f9db3c9137e701a47b042e --- /dev/null +++ b/indices/ckpt_21_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0238db741dbd8008cb3323e3aa19bfdf5c54d18879844bb8b9bd5b5c4015a634 +size 11143522 diff --git a/indices/ckpt_22_indices.txt b/indices/ckpt_22_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..803dd1f2df7e1d7ede3c8075eb545bbffde8e96b --- /dev/null +++ b/indices/ckpt_22_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db7a3bddbd1834caf5aeb3719462e997921556be490dbc4170cc7bd7156e5e6a +size 11143194 diff --git a/indices/ckpt_23_indices.txt b/indices/ckpt_23_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..15f8db467e9dda00b87555db239c4511f70b534a --- /dev/null +++ b/indices/ckpt_23_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a46465a636075d7256dad6f81f56ab95307c526f26f9d794aa802ac8b80b9920 +size 11143289 diff --git a/indices/ckpt_24_indices.txt b/indices/ckpt_24_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..2a2d754b0208a5c9d005563aa353bdacf1db38b7 --- /dev/null +++ b/indices/ckpt_24_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2783ecc9c7e6e6e20820e62c74625353e9015b147f3030a3126a304ac1f06230 +size 11143748 diff --git a/indices/ckpt_25_indices.txt b/indices/ckpt_25_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..52c5b5d303380202c992a22351a9348758b3a595 --- /dev/null +++ b/indices/ckpt_25_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bc8a839fed138a84cea9438ca53449301974df0dba899ff2bac4d5964709157 +size 11144081 diff --git a/indices/ckpt_26_indices.txt b/indices/ckpt_26_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..48cc0957fb40166937e4b9e7d28f3226cb3902a9 --- /dev/null +++ b/indices/ckpt_26_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dcba7563f2bae4eecead0aa87b7b16a25df45acd9e22afbc454bc4bdb6ae550 +size 11143842 diff --git a/indices/ckpt_27_indices.txt b/indices/ckpt_27_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..37a09575548048b94be110a83e52aba09329a435 --- /dev/null +++ b/indices/ckpt_27_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5b6a1747eb379356e4419561d2a8c6c732a33db8d4507ce25adf3703ddfb379 +size 11143582 diff --git a/indices/ckpt_28_indices.txt b/indices/ckpt_28_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..cf0c36e53c9cb3fcfa4d722a51e82f7a1195e1c3 --- /dev/null +++ b/indices/ckpt_28_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04a45fe1402d2f601776637e3d4ca856ccca5e4ec9bcebd6bc7f65247ce9f9d9 +size 11142688 diff --git a/indices/ckpt_29_indices.txt b/indices/ckpt_29_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..0d1d1b6b95535fb4289941de243162288cbfcc53 --- /dev/null +++ b/indices/ckpt_29_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d60e46f36454efde31050ce0a1f542cd04258ea789d6d7ede5687daa23c31764 +size 11143707 diff --git a/indices/ckpt_2_indices.txt b/indices/ckpt_2_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..b0a753d63e65df32843ee3f95c5bf8c54f00ea10 --- /dev/null +++ b/indices/ckpt_2_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fc60ee833c6cc1629c9128c4e2fd0c0b9f500ad2193ba508d824de23af4b2c6 +size 11143658 diff --git a/indices/ckpt_30_indices.txt b/indices/ckpt_30_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..a496cb34d8411b0a06c0976dd081ab523f272d0d --- /dev/null +++ b/indices/ckpt_30_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a9b1c3bd5cfa9d3f529729b0d93420b80838730ecadd4b1fcc4c31eb2cc98a5 +size 11143745 diff --git a/indices/ckpt_31_indices.txt b/indices/ckpt_31_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..c98a67165699ea712b6303f8e1e3fcbbe8595445 --- /dev/null +++ b/indices/ckpt_31_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9887e760fc8fa7c338b943b0bdb5972e0cbba3a268b9c7a0844e0fed03cf62e7 +size 11143905 diff --git a/indices/ckpt_32_indices.txt b/indices/ckpt_32_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..ff98cfe32752b42f28691d7c9cc24ef862129c5d --- /dev/null +++ b/indices/ckpt_32_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcdc664ea117c980e093d08912fe9a0a22f39b6a59135a3f70710a76aabde19f +size 11144170 diff --git a/indices/ckpt_33_indices.txt b/indices/ckpt_33_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..caa55f989b31c3bd12d5d1789ef7cc0fd3b558d7 --- /dev/null +++ b/indices/ckpt_33_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:823c569c12c9688ba672769723c16c8af33763db9a23de7b2f9b6c69b8123da5 +size 11143522 diff --git a/indices/ckpt_34_indices.txt b/indices/ckpt_34_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..3858b85004ed6538ba6d321b752ea896a3586cb6 --- /dev/null +++ b/indices/ckpt_34_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:360ea03a033062f2f8cf98ec30a91a16c1a8be7ec184d172ceb7c2066a6d2745 +size 11143612 diff --git a/indices/ckpt_35_indices.txt b/indices/ckpt_35_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..429dc3be90d5eae017d50ed7824fb46b9355cfa5 --- /dev/null +++ b/indices/ckpt_35_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8ba0eb59e226a5b46aeb8a6544d5cbe68fb2a0e446cf5fa6b8c17cdd856cbd3 +size 11144048 diff --git a/indices/ckpt_36_indices.txt b/indices/ckpt_36_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..eb750670d26240cd3e1afe8b4c50b5c49b315acb --- /dev/null +++ b/indices/ckpt_36_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7d6c5f9c5d11bf5a3a5b821ea785fb39b1ad97b2b206efa5f2788bef022ef79 +size 11143437 diff --git a/indices/ckpt_37_indices.txt b/indices/ckpt_37_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..b319dfc1b109d84e605f249576fc0c2363c0caee --- /dev/null +++ b/indices/ckpt_37_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9cc5cfa88128a18c982d2e9145fe2213ead7d154a975a8da5fbc741ba594c63 +size 11143696 diff --git a/indices/ckpt_38_indices.txt b/indices/ckpt_38_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..124a3afc834ac6c5684b7c935aeb15fdc9ccad99 --- /dev/null +++ b/indices/ckpt_38_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab0a9d282c841372cb806bf0a680a3d69bcdaa85d8477cf028584285c4aba874 +size 11143635 diff --git a/indices/ckpt_39_indices.txt b/indices/ckpt_39_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..5b9dfe94404c20190fbbc8c90b9572dc49151348 --- /dev/null +++ b/indices/ckpt_39_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87d242ab2d04d0cbbce674e2fa147b5302614175208725fa9a3a541463119afd +size 11143282 diff --git a/indices/ckpt_3_indices.txt b/indices/ckpt_3_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..b1f7f112a314a1073a7f946528b52ec73c5a7af6 --- /dev/null +++ b/indices/ckpt_3_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:229f52978c3215c33789b6a419cfb8e26f9b53e95c06f2848a3cb425d7fb46e6 +size 11143435 diff --git a/indices/ckpt_40_indices.txt b/indices/ckpt_40_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..c03472a9cd09b26bcc78d37c5f621b0e6bd479b5 --- /dev/null +++ b/indices/ckpt_40_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcd24c4469b8a776ea72c96e74a843d5b83d275c5e6c6f3f6f1da3479497dc21 +size 11143790 diff --git a/indices/ckpt_41_indices.txt b/indices/ckpt_41_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..1d977589828699cae6bcec93784dfa12a665c48c --- /dev/null +++ b/indices/ckpt_41_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c70f1a3ae9126ed0025fdc9fbb55bac94cb5cca72fbbb4bb6fc024a7bdb2b94a +size 11143590 diff --git a/indices/ckpt_42_indices.txt b/indices/ckpt_42_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..71d130f7136a59d95320c9262404a943816bc863 --- /dev/null +++ b/indices/ckpt_42_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0661c72e8c80f2dc3766d7d9e3b7093d2f467823f4a28a9e3bdaa3952046a21 +size 11143688 diff --git a/indices/ckpt_43_indices.txt b/indices/ckpt_43_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..5d4188c8cb3f035820413452c78653ad1dfede55 --- /dev/null +++ b/indices/ckpt_43_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ed0a530fbf468dcdfc7389e94eee1e79d6cf4a3374d3a2cda7358e9aca4b167 +size 11142894 diff --git a/indices/ckpt_44_indices.txt b/indices/ckpt_44_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..fc00fd0c832fc13857bfe4dc57a489c99ce8a68c --- /dev/null +++ b/indices/ckpt_44_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b5e12502b3a2874ff561e426c61e8f0b40ea7ce08dd5d84245d9b7780979a36 +size 11143659 diff --git a/indices/ckpt_45_indices.txt b/indices/ckpt_45_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..4deef4601c419e328ad8d206b07a2595276ce90c --- /dev/null +++ b/indices/ckpt_45_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f53a3a23f956dd2e6c871fad791cb50b2608036256824f761151dd74daca10fe +size 11143305 diff --git a/indices/ckpt_4_indices.txt b/indices/ckpt_4_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..c0599dc138a8d5e578b6cee5fa25f999c2320e85 --- /dev/null +++ b/indices/ckpt_4_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b77431b54dbf1da484dc0c67521aad482753f4e5ad0a6daa2ec821c198f7828 +size 11143795 diff --git a/indices/ckpt_5_indices.txt b/indices/ckpt_5_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..537d3d2374f39d2ea97f351b25eca8ecf1210b45 --- /dev/null +++ b/indices/ckpt_5_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4f4dc44ec2b3d1656db46a06405770cf68b1802793215c7c2fdafdb8a7f6c90 +size 11143707 diff --git a/indices/ckpt_6_indices.txt b/indices/ckpt_6_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..a3fd9c2eb1c9dcbc0cc69e68c27722faeddbd866 --- /dev/null +++ b/indices/ckpt_6_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4be1655c48a57b9b953f19f73d5cf44051e695bc1c4465d36d2f639d577f64b6 +size 11144053 diff --git a/indices/ckpt_7_indices.txt b/indices/ckpt_7_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..ef7040b0ae9b4d9f98e6f7c75add5108fb3dc7ff --- /dev/null +++ b/indices/ckpt_7_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b27588c820fb2e433cdfaf78a87e4bedf480cc244d062e0cd188c4daadaf3894 +size 11143434 diff --git a/indices/ckpt_8_indices.txt b/indices/ckpt_8_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..5f0ad781e197e0f643309a5e755dcaae0cc48461 --- /dev/null +++ b/indices/ckpt_8_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2f260dde33e229d28ad5bd0991026d26383684a997c0200a1840f4cd8b3d1e7 +size 11144065 diff --git a/indices/ckpt_9_indices.txt b/indices/ckpt_9_indices.txt new file mode 100644 index 0000000000000000000000000000000000000000..e06992fa17e26a7ce7706b69249455225a46e558 --- /dev/null +++ b/indices/ckpt_9_indices.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dc458a87230f2dd052c9c6d45a853f950cf4d826b1a5fef7b83ef34bc76c7de +size 11143275 diff --git a/metadata/ckpt_0.json b/metadata/ckpt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..bf3f19f2ee3d42e161d8c553a912e9a2f03fc4b9 --- /dev/null +++ b/metadata/ckpt_0.json @@ -0,0 +1,10 @@ +{ + "checkpoint": "ckpt_0.pt", + "model": "GPT2-S", + "training_step": 6000, + "instability_type": "Slow divergence", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "2000", + "data_type": "FP8_with_FP8_head" +} \ No newline at end of file diff --git a/metadata/ckpt_1.json b/metadata/ckpt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..9b0c0265e69cb578a2c56d30e2c16e888119fc78 --- /dev/null +++ b/metadata/ckpt_1.json @@ -0,0 +1,10 @@ +{ + "checkpoint": "ckpt_1.pt", + "model": "GPT2-S", + "training_step": 38000, + "instability_type": "Slow divergence", + "learning_rate": "3e-3", + "decay": "0.1", + "warm": "2000", + "data_type": "BF16" +} \ No newline at end of file diff --git a/metadata/ckpt_10.json b/metadata/ckpt_10.json new file mode 100644 index 0000000000000000000000000000000000000000..62d33541ad41ae854778143020d4a838d753b366 --- /dev/null +++ b/metadata/ckpt_10.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_10.pt", + "model": "GPT2-S", + "training_step": 42000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-2", + "decay": "0.1", + "warm": "2000", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_11.json b/metadata/ckpt_11.json new file mode 100644 index 0000000000000000000000000000000000000000..7fc6637b4a7ebbf28dbfbf901c48ca0878ce0423 --- /dev/null +++ b/metadata/ckpt_11.json @@ -0,0 +1,10 @@ +{ + "checkpoint": "ckpt_11.pt", + "model": "GPT2-S", + "training_step": 54000, + "instability_type": "Divergent loss spikes", + "learning_rate": "3e-4", + "decay": "0.0", + "warm": "2000", + "data_type": "BF16" +} \ No newline at end of file diff --git a/metadata/ckpt_12.json b/metadata/ckpt_12.json new file mode 100644 index 0000000000000000000000000000000000000000..8a2a28f23070c31fe804132656fa2c3cd18ed32b --- /dev/null +++ b/metadata/ckpt_12.json @@ -0,0 +1,10 @@ +{ + "checkpoint": "ckpt_12.pt", + "model": "GPT2-S", + "training_step": 4000, + "instability_type": "complete non-convergence", + "learning_rate": "3e-3", + "decay": "0.1", + "warm": "2000", + "data_type": "FP8_with_FP8_head" +} \ No newline at end of file diff --git a/metadata/ckpt_13.json b/metadata/ckpt_13.json new file mode 100644 index 0000000000000000000000000000000000000000..a779f5f4e4f73d429f1a6a028ddd3c48033e4cb9 --- /dev/null +++ b/metadata/ckpt_13.json @@ -0,0 +1,10 @@ +{ + "checkpoint": "ckpt_13.pt", + "model": "GPT2-S", + "training_step": 10000, + "instability_type": "Slow divergence", + "learning_rate": "6e-4", + "decay": "0.1", + "warm": "2000", + "data_type": "FP8_with_FP8_head" +} \ No newline at end of file diff --git a/metadata/ckpt_14.json b/metadata/ckpt_14.json new file mode 100644 index 0000000000000000000000000000000000000000..274caaa49e0a245b18424950c70ee304b0ba9661 --- /dev/null +++ b/metadata/ckpt_14.json @@ -0,0 +1,10 @@ +{ + "checkpoint": "ckpt_14.pt", + "model": "GPT2-S", + "training_step": 4000, + "instability_type": "complete non-convergence", + "learning_rate": "1e-2", + "decay": "0.1", + "warm": "0", + "data_type": "BF16" +} \ No newline at end of file diff --git a/metadata/ckpt_15.json b/metadata/ckpt_15.json new file mode 100644 index 0000000000000000000000000000000000000000..13dcafb7a280f929a905d3005944a6db7e04e94e --- /dev/null +++ b/metadata/ckpt_15.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_15.pt", + "model": "GPT2-S", + "training_step": 10000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_16.json b/metadata/ckpt_16.json new file mode 100644 index 0000000000000000000000000000000000000000..e5c255bd72a1450681f3d16a35e974c9877c5798 --- /dev/null +++ b/metadata/ckpt_16.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_16.pt", + "model": "GPT2-S", + "training_step": 12000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_17.json b/metadata/ckpt_17.json new file mode 100644 index 0000000000000000000000000000000000000000..27a48dfd00a97b23f1f107a666976db7dd026cfd --- /dev/null +++ b/metadata/ckpt_17.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_17.pt", + "model": "GPT2-S", + "training_step": 14000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_18.json b/metadata/ckpt_18.json new file mode 100644 index 0000000000000000000000000000000000000000..f256d2fc21080d668b95cdb19c76cccc856dd645 --- /dev/null +++ b/metadata/ckpt_18.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_18.pt", + "model": "GPT2-S", + "training_step": 18000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_19.json b/metadata/ckpt_19.json new file mode 100644 index 0000000000000000000000000000000000000000..130d0fb8206b0778e4c2582b444303a42db2f729 --- /dev/null +++ b/metadata/ckpt_19.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_19.pt", + "model": "GPT2-S", + "training_step": 24000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_2.json b/metadata/ckpt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..6a9c3ec84313fc2df6f0a7c717965f082d01cc73 --- /dev/null +++ b/metadata/ckpt_2.json @@ -0,0 +1,10 @@ +{ + "checkpoint": "ckpt_2.pt", + "model": "GPT2-S", + "training_step": 4000, + "instability_type": "complete non-convergence", + "learning_rate": "3e-2", + "decay": "0.1", + "warm": "2000", + "data_type": "BF16" +} \ No newline at end of file diff --git a/metadata/ckpt_20.json b/metadata/ckpt_20.json new file mode 100644 index 0000000000000000000000000000000000000000..b750d4cc15c8e4cd591e64fe7400e8e01aa6f5b5 --- /dev/null +++ b/metadata/ckpt_20.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_20.pt", + "model": "GPT2-S", + "training_step": 34000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_21.json b/metadata/ckpt_21.json new file mode 100644 index 0000000000000000000000000000000000000000..d6b2b7195cc14db3eacae91912e6f4d029d4f2c1 --- /dev/null +++ b/metadata/ckpt_21.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_21.pt", + "model": "GPT2-S", + "training_step": 36000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_22.json b/metadata/ckpt_22.json new file mode 100644 index 0000000000000000000000000000000000000000..6e63fc26caf793c183c9b0cdb87ad4272c2a7a6c --- /dev/null +++ b/metadata/ckpt_22.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_22.pt", + "model": "GPT2-S", + "training_step": 38000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_23.json b/metadata/ckpt_23.json new file mode 100644 index 0000000000000000000000000000000000000000..11cbeabe705de5bad8b4f32c0bdb4f4d335423fd --- /dev/null +++ b/metadata/ckpt_23.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_23.pt", + "model": "GPT2-S", + "training_step": 40000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_24.json b/metadata/ckpt_24.json new file mode 100644 index 0000000000000000000000000000000000000000..73934a230a1906ce1385ea0c6d00deb4e38a87ba --- /dev/null +++ b/metadata/ckpt_24.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_24.pt", + "model": "GPT2-S", + "training_step": 42000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_25.json b/metadata/ckpt_25.json new file mode 100644 index 0000000000000000000000000000000000000000..106110e518442b342564899d60e46ee2bb882d5e --- /dev/null +++ b/metadata/ckpt_25.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_25.pt", + "model": "GPT2-S", + "training_step": 44000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_26.json b/metadata/ckpt_26.json new file mode 100644 index 0000000000000000000000000000000000000000..c025ce4d062542f151caf40bbcecd74e7833dd2f --- /dev/null +++ b/metadata/ckpt_26.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_26.pt", + "model": "GPT2-S", + "training_step": 46000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_27.json b/metadata/ckpt_27.json new file mode 100644 index 0000000000000000000000000000000000000000..d9faaad00fccd9279b7498388e3dd0bb086d1bb6 --- /dev/null +++ b/metadata/ckpt_27.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_27.pt", + "model": "GPT2-S", + "training_step": 48000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_28.json b/metadata/ckpt_28.json new file mode 100644 index 0000000000000000000000000000000000000000..a2d0fe42cbf6b034469d903e23771189cf56cbb9 --- /dev/null +++ b/metadata/ckpt_28.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_28.pt", + "model": "GPT2-S", + "training_step": 50000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_29.json b/metadata/ckpt_29.json new file mode 100644 index 0000000000000000000000000000000000000000..f37303ed4c1758c1963238848949448966155b08 --- /dev/null +++ b/metadata/ckpt_29.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_29.pt", + "model": "GPT2-S", + "training_step": 52000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_3.json b/metadata/ckpt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..d376d1b4d71d97e320ab1bcaf1aa8906a959a92a --- /dev/null +++ b/metadata/ckpt_3.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_3.pt", + "model": "GPT2-S", + "training_step": 18000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-2", + "decay": "0.1", + "warm": "2000", + "data_type": "FP8_with_BF16_head", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_30.json b/metadata/ckpt_30.json new file mode 100644 index 0000000000000000000000000000000000000000..a77510132be417ed8e004d35198740ea88bd61cc --- /dev/null +++ b/metadata/ckpt_30.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_30.pt", + "model": "GPT2-S", + "training_step": 56000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_31.json b/metadata/ckpt_31.json new file mode 100644 index 0000000000000000000000000000000000000000..b4c1309e46e42233e1880c2d3fe1df0cb7dc156b --- /dev/null +++ b/metadata/ckpt_31.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_31.pt", + "model": "GPT2-S", + "training_step": 58000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_32.json b/metadata/ckpt_32.json new file mode 100644 index 0000000000000000000000000000000000000000..b76715cd4793a3fc21a3b5f4b5b7bd9536e39e50 --- /dev/null +++ b/metadata/ckpt_32.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_32.pt", + "model": "GPT2-S", + "training_step": 60000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_33.json b/metadata/ckpt_33.json new file mode 100644 index 0000000000000000000000000000000000000000..90a4217373bd4c1161d084feb2c7118a6ef04a62 --- /dev/null +++ b/metadata/ckpt_33.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_33.pt", + "model": "GPT2-S", + "training_step": 62000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_34.json b/metadata/ckpt_34.json new file mode 100644 index 0000000000000000000000000000000000000000..de629b5bdc528856824455cf2bc9544311c2f6eb --- /dev/null +++ b/metadata/ckpt_34.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_34.pt", + "model": "GPT2-S", + "training_step": 64000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_35.json b/metadata/ckpt_35.json new file mode 100644 index 0000000000000000000000000000000000000000..c1f0752587bbd2135d800d123559214088f9cb18 --- /dev/null +++ b/metadata/ckpt_35.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_35.pt", + "model": "GPT2-S", + "training_step": 66000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_36.json b/metadata/ckpt_36.json new file mode 100644 index 0000000000000000000000000000000000000000..4da59868fcbf13b4ee1881ceef83671ee7f9aacb --- /dev/null +++ b/metadata/ckpt_36.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_36.pt", + "model": "GPT2-S", + "training_step": 68000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_37.json b/metadata/ckpt_37.json new file mode 100644 index 0000000000000000000000000000000000000000..920f4cc1c288cfaaf00ed912b04ecad8d32c5017 --- /dev/null +++ b/metadata/ckpt_37.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_37.pt", + "model": "GPT2-S", + "training_step": 70000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_38.json b/metadata/ckpt_38.json new file mode 100644 index 0000000000000000000000000000000000000000..2f239f1ea81bd03d554ecef349659ba608762711 --- /dev/null +++ b/metadata/ckpt_38.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_38.pt", + "model": "GPT2-S", + "training_step": 72000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_39.json b/metadata/ckpt_39.json new file mode 100644 index 0000000000000000000000000000000000000000..8c228fb7f18baf471a363dbf98fc643ddd1b2d0a --- /dev/null +++ b/metadata/ckpt_39.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_39.pt", + "model": "GPT2-S", + "training_step": 74000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_4.json b/metadata/ckpt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..586cb2afd8d812195acf379e7d94f4cfed16d7b1 --- /dev/null +++ b/metadata/ckpt_4.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_4.pt", + "model": "GPT2-S", + "training_step": 68000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-2", + "decay": "0.1", + "warm": "2000", + "data_type": "FP8_with_BF16_head", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_40.json b/metadata/ckpt_40.json new file mode 100644 index 0000000000000000000000000000000000000000..90be05a3d44261ba8b6d307b87bbde41cda0eded --- /dev/null +++ b/metadata/ckpt_40.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_40.pt", + "model": "GPT2-S", + "training_step": 76000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_41.json b/metadata/ckpt_41.json new file mode 100644 index 0000000000000000000000000000000000000000..55f13c9c4446520aab59ae04a0cfe4ec80a9ed14 --- /dev/null +++ b/metadata/ckpt_41.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_41.pt", + "model": "GPT2-S", + "training_step": 84000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_42.json b/metadata/ckpt_42.json new file mode 100644 index 0000000000000000000000000000000000000000..7f64faeabbe113088ca136a4fd89f6a9f2585d3a --- /dev/null +++ b/metadata/ckpt_42.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_42.pt", + "model": "GPT2-S", + "training_step": 94000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_43.json b/metadata/ckpt_43.json new file mode 100644 index 0000000000000000000000000000000000000000..4c59ebc8d3c6648de81919a66eeac77b4a1eee73 --- /dev/null +++ b/metadata/ckpt_43.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_43.pt", + "model": "GPT2-S", + "training_step": 96000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_44.json b/metadata/ckpt_44.json new file mode 100644 index 0000000000000000000000000000000000000000..823052152ae0e7c9b12b5904da31d93f31fff9d2 --- /dev/null +++ b/metadata/ckpt_44.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_44.pt", + "model": "GPT2-S", + "training_step": 98000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_45.json b/metadata/ckpt_45.json new file mode 100644 index 0000000000000000000000000000000000000000..97311011180ef6754a6ed327b49daaa9a80b686e --- /dev/null +++ b/metadata/ckpt_45.json @@ -0,0 +1,10 @@ +{ + "checkpoint": "ckpt_45.pt", + "model": "GPT2-S", + "training_step": 4000, + "instability_type": "complete non-convergence", + "learning_rate": "3e-3", + "decay": "0.1", + "warm": "0", + "data_type": "BF16" +} \ No newline at end of file diff --git a/metadata/ckpt_5.json b/metadata/ckpt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..9f179c87c40934b7f6b365c7bb88874e6f441e8d --- /dev/null +++ b/metadata/ckpt_5.json @@ -0,0 +1,11 @@ +{ + "checkpoint": "ckpt_5.pt", + "model": "GPT2-S", + "training_step": 80000, + "instability_type": "Recoverable loss spikes", + "learning_rate": "1e-2", + "decay": "0.1", + "warm": "2000", + "data_type": "FP8_with_BF16_head", + "reproducibility": false +} \ No newline at end of file diff --git a/metadata/ckpt_6.json b/metadata/ckpt_6.json new file mode 100644 index 0000000000000000000000000000000000000000..b085b8bb33140401d5a98419e26351b08ca5207b --- /dev/null +++ b/metadata/ckpt_6.json @@ -0,0 +1,10 @@ +{ + "checkpoint": "ckpt_6.pt", + "model": "GPT2-S", + "training_step": 6000, + "instability_type": "Slow divergence", + "learning_rate": "1e-3", + "decay": "0.0", + "warm": "2000", + "data_type": "BF16" +} \ No newline at end of file diff --git a/metadata/ckpt_7.json b/metadata/ckpt_7.json new file mode 100644 index 0000000000000000000000000000000000000000..957910da26f066ab6dec5ff8117c2d1aeb9fc566 --- /dev/null +++ b/metadata/ckpt_7.json @@ -0,0 +1,10 @@ +{ + "checkpoint": "ckpt_7.pt", + "model": "GPT2-S", + "training_step": 16000, + "instability_type": "Slow divergence", + "learning_rate": "1e-3", + "decay": "0.1", + "warm": "2000", + "data_type": "BF16" +} \ No newline at end of file diff --git a/metadata/ckpt_8.json b/metadata/ckpt_8.json new file mode 100644 index 0000000000000000000000000000000000000000..0cf2a922e4bda0f585547943e2f9433974c0cbc2 --- /dev/null +++ b/metadata/ckpt_8.json @@ -0,0 +1,10 @@ +{ + "checkpoint": "ckpt_8.pt", + "model": "GPT2-S", + "training_step": 18000, + "instability_type": "Slow divergence", + "learning_rate": "3e-3", + "decay": "0.0", + "warm": "2000", + "data_type": "BF16" +} \ No newline at end of file diff --git a/metadata/ckpt_9.json b/metadata/ckpt_9.json new file mode 100644 index 0000000000000000000000000000000000000000..a049bf3f3506b152e12a1004557c32e3889fa75d --- /dev/null +++ b/metadata/ckpt_9.json @@ -0,0 +1,10 @@ +{ + "checkpoint": "ckpt_9.pt", + "model": "GPT2-S", + "training_step": 10000, + "instability_type": "Slow divergence", + "learning_rate": "1e-2", + "decay": "0.0", + "warm": "2000", + "data_type": "BF16" +} \ No newline at end of file