hshankar113 committed on
Commit
a7c7d05
·
verified ·
1 Parent(s): 249eb8e

hshankar113/multilingual-chat-slm

Browse files
Files changed (2) hide show
  1. model.safetensors +1 -1
  2. trainer_state.json +10 -10
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2ede9e7cf02cf9741732c58b51becd5670e199835b1af9b3efac89447877c2bc
3
  size 1080120048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a065c3cf5b9387779c0a98f69b547877fac0b0987c23d932a2def224670d216
3
  size 1080120048
trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 1.0,
6
  "eval_steps": 500,
7
- "global_step": 30000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -2110,13 +2110,13 @@
2110
  "step": 30000
2111
  },
2112
  {
2113
- "epoch": 1.0,
2114
- "step": 30000,
2115
- "total_flos": 4.0980178796544e+17,
2116
- "train_loss": 4.49529921875,
2117
- "train_runtime": 18816.3377,
2118
- "train_samples_per_second": 25.51,
2119
- "train_steps_per_second": 1.594
2120
  }
2121
  ],
2122
  "logging_steps": 100,
@@ -2136,7 +2136,7 @@
2136
  "attributes": {}
2137
  }
2138
  },
2139
- "total_flos": 4.0980178796544e+17,
2140
  "train_batch_size": 4,
2141
  "trial_name": null,
2142
  "trial_params": null
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 1.0000333333333333,
6
  "eval_steps": 500,
7
+ "global_step": 30001,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
2110
  "step": 30000
2111
  },
2112
  {
2113
+ "epoch": 1.0000333333333333,
2114
+ "step": 30001,
2115
+ "total_flos": 4.0981544802503885e+17,
2116
+ "train_loss": 0.00044824120156077804,
2117
+ "train_runtime": 24.4073,
2118
+ "train_samples_per_second": 19666.274,
2119
+ "train_steps_per_second": 1229.142
2120
  }
2121
  ],
2122
  "logging_steps": 100,
 
2136
  "attributes": {}
2137
  }
2138
  },
2139
+ "total_flos": 4.0981544802503885e+17,
2140
  "train_batch_size": 4,
2141
  "trial_name": null,
2142
  "trial_params": null