indus-script-models / models /nanogpt_history.json
hellosindh's picture
Upload 3 files
e5f6f99 verified
[
{
"epoch": 1,
"train": 3.1541355614151274,
"val": 2.6805355599586,
"ppl": 14.592906579896784
},
{
"epoch": 2,
"train": 2.661188569185989,
"val": 2.6236555132460087,
"ppl": 13.786026590221859
},
{
"epoch": 3,
"train": 2.6222057228109668,
"val": 2.6189262702109968,
"ppl": 13.72098304458602
},
{
"epoch": 4,
"train": 2.6041080951690674,
"val": 2.623061422337877,
"ppl": 13.777838869531374
},
{
"epoch": 5,
"train": 2.593652198623334,
"val": 2.612872798392113,
"ppl": 13.638174353311316
},
{
"epoch": 6,
"train": 2.5864927619695663,
"val": 2.6153726057803377,
"ppl": 13.672309810579614
},
{
"epoch": 7,
"train": 2.5816431431365863,
"val": 2.617009090616348,
"ppl": 13.694702656036387
},
{
"epoch": 8,
"train": 2.578338403786932,
"val": 2.600845827701244,
"ppl": 13.475130855096179
},
{
"epoch": 9,
"train": 2.574481935905559,
"val": 2.5990774035453796,
"ppl": 13.451322166323555
},
{
"epoch": 10,
"train": 2.573306300810405,
"val": 2.6109495010781796,
"ppl": 13.611969297345375
},
{
"epoch": 11,
"train": 2.5699439996055196,
"val": 2.6043824705671756,
"ppl": 13.522871952346348
},
{
"epoch": 12,
"train": 2.5692843917225088,
"val": 2.6044237677087176,
"ppl": 13.523430419834895
},
{
"epoch": 13,
"train": 2.567502531622137,
"val": 2.6015377919724645,
"ppl": 13.484458390986532
},
{
"epoch": 14,
"train": 2.5648566955434426,
"val": 2.6039607372689755,
"ppl": 13.51717010936978
},
{
"epoch": 15,
"train": 2.564982747925179,
"val": 2.606540412344831,
"ppl": 13.552085031411677
},
{
"epoch": 16,
"train": 2.565142649891121,
"val": 2.6077234592843563,
"ppl": 13.568127271622808
},
{
"epoch": 17,
"train": 2.561980778484472,
"val": 2.5994231764306415,
"ppl": 13.45597407300484
},
{
"epoch": 18,
"train": 2.563110330541219,
"val": 2.6023097253860312,
"ppl": 13.49487151358394
},
{
"epoch": 19,
"train": 2.561759041356189,
"val": 2.5976937146897012,
"ppl": 13.43272259272678
},
{
"epoch": 20,
"train": 2.560820518593703,
"val": 2.5989098967389856,
"ppl": 13.449069167007325
},
{
"epoch": 21,
"train": 2.5614392177334855,
"val": 2.5982438769746334,
"ppl": 13.440114803352545
},
{
"epoch": 22,
"train": 2.558592631348542,
"val": 2.6015114023330366,
"ppl": 13.48410254568705
},
{
"epoch": 23,
"train": 2.5598560087382793,
"val": 2.594668352857549,
"ppl": 13.392145158153562
},
{
"epoch": 24,
"train": 2.5588360891810487,
"val": 2.5956707951870372,
"ppl": 13.405576742412281
},
{
"epoch": 25,
"train": 2.5575959836798057,
"val": 2.6016628754899855,
"ppl": 13.486145179966494
},
{
"epoch": 26,
"train": 2.5573083627969027,
"val": 2.6081511226106198,
"ppl": 13.573931103017417
},
{
"epoch": 27,
"train": 2.5575086841625825,
"val": 2.6015568743360804,
"ppl": 13.48471570877982
},
{
"epoch": 28,
"train": 2.557002873026899,
"val": 2.602048819369458,
"ppl": 13.491351079684325
},
{
"epoch": 29,
"train": 2.5560219013797387,
"val": 2.610209694568147,
"ppl": 13.601902797934866
},
{
"epoch": 30,
"train": 2.554686253624303,
"val": 2.6000392982300293,
"ppl": 13.46426714647255
},
{
"epoch": 31,
"train": 2.5538660226655856,
"val": 2.5992509849528047,
"ppl": 13.453657268416205
},
{
"epoch": 32,
"train": 2.5537610626114264,
"val": 2.5968120820978853,
"ppl": 13.420885085624993
},
{
"epoch": 33,
"train": 2.555091032758355,
"val": 2.6032118112482925,
"ppl": 13.50705053882672
},
{
"epoch": 34,
"train": 2.5560004072529927,
"val": 2.5948864348391267,
"ppl": 13.395066062193925
},
{
"epoch": 35,
"train": 2.552427670785359,
"val": 2.593587578611171,
"ppl": 13.37767909124727
},
{
"epoch": 36,
"train": 2.552689385733434,
"val": 2.603117510359338,
"ppl": 13.505776872008656
},
{
"epoch": 37,
"train": 2.5538388692906926,
"val": 2.596836513661324,
"ppl": 13.42121298283587
},
{
"epoch": 38,
"train": 2.5519965682178736,
"val": 2.591266675198332,
"ppl": 13.34666679238455
},
{
"epoch": 39,
"train": 2.5516749138810804,
"val": 2.592155272656299,
"ppl": 13.358531877430071
},
{
"epoch": 40,
"train": 2.5518498348870446,
"val": 2.603394275015973,
"ppl": 13.509515311017257
},
{
"epoch": 41,
"train": 2.550012855125325,
"val": 2.596443589697493,
"ppl": 13.415940502540996
},
{
"epoch": 42,
"train": 2.5510117949119637,
"val": 2.5943850392990924,
"ppl": 13.38835151927348
},
{
"epoch": 43,
"train": 2.55065877762224,
"val": 2.6017530053219895,
"ppl": 13.487360738744176
},
{
"epoch": 44,
"train": 2.550856338414763,
"val": 2.5932302386202712,
"ppl": 13.372899565531243
},
{
"epoch": 45,
"train": 2.5491439992828027,
"val": 2.5965981445413955,
"ppl": 13.418014161374055
},
{
"epoch": 46,
"train": 2.549261734155672,
"val": 2.6010512138934847,
"ppl": 13.47789874514592
},
{
"epoch": 47,
"train": 2.548883476427623,
"val": 2.5964993251130934,
"ppl": 13.41668826639885
},
{
"epoch": 48,
"train": 2.5490686427801847,
"val": 2.601477122053187,
"ppl": 13.483640314801011
},
{
"epoch": 49,
"train": 2.5496274632002627,
"val": 2.596776560265967,
"ppl": 13.42040835966793
},
{
"epoch": 50,
"train": 2.549438276993377,
"val": 2.60137410747244,
"ppl": 13.482251374788804
},
{
"epoch": 51,
"train": 2.547333244766508,
"val": 2.5961117275217744,
"ppl": 13.411488998020356
},
{
"epoch": 52,
"train": 2.547550984259163,
"val": 2.603273559123912,
"ppl": 13.507884596253747
},
{
"epoch": 53,
"train": 2.5475961520735706,
"val": 2.606535277468093,
"ppl": 13.55201544330416
},
{
"epoch": 54,
"train": 2.5470066059912955,
"val": 2.6017496788755374,
"ppl": 13.48731587383552
},
{
"epoch": 55,
"train": 2.544834245528494,
"val": 2.5987642572281207,
"ppl": 13.447110593778538
},
{
"epoch": 56,
"train": 2.5448448940047195,
"val": 2.608545351535716,
"ppl": 13.579283394230176
},
{
"epoch": 57,
"train": 2.5467686969786882,
"val": 2.597899075518263,
"ppl": 13.43548143103723
},
{
"epoch": 58,
"train": 2.5460665178086077,
"val": 2.597285856591894,
"ppl": 13.427245065144662
},
{
"epoch": 59,
"train": 2.5445679192032133,
"val": 2.5995786671942853,
"ppl": 13.458066515362539
},
{
"epoch": 60,
"train": 2.544777887208121,
"val": 2.603335055899113,
"ppl": 13.508715313139149
},
{
"epoch": 61,
"train": 2.544875491144402,
"val": 2.6060757269250585,
"ppl": 13.545789038031518
},
{
"epoch": 62,
"train": 2.5440730787813663,
"val": 2.603364035170129,
"ppl": 13.50910679153364
},
{
"epoch": 63,
"train": 2.5455543795334443,
"val": 2.5958931395348084,
"ppl": 13.408557728019938
}
]