hshankar113/multilingual-chat-slm
Browse files
- tokenizer.json +10 -1
- trainer_state.json +3 -3
tokenizer.json
CHANGED
|
@@ -6,7 +6,16 @@
|
|
| 6 |
"strategy": "LongestFirst",
|
| 7 |
"stride": 0
|
| 8 |
},
|
| 9 |
-
"padding": null,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10 |
"added_tokens": [
|
| 11 |
{
|
| 12 |
"id": 0,
|
|
|
|
| 6 |
"strategy": "LongestFirst",
|
| 7 |
"stride": 0
|
| 8 |
},
|
| 9 |
+
"padding": {
|
| 10 |
+
"strategy": {
|
| 11 |
+
"Fixed": 1024
|
| 12 |
+
},
|
| 13 |
+
"direction": "Right",
|
| 14 |
+
"pad_to_multiple_of": null,
|
| 15 |
+
"pad_id": 0,
|
| 16 |
+
"pad_type_id": 0,
|
| 17 |
+
"pad_token": "<pad>"
|
| 18 |
+
},
|
| 19 |
"added_tokens": [
|
| 20 |
{
|
| 21 |
"id": 0,
|
trainer_state.json
CHANGED
|
@@ -714,9 +714,9 @@
|
|
| 714 |
"step": 10000,
|
| 715 |
"total_flos": 1.2490998615421747e+17,
|
| 716 |
"train_loss": 0.0,
|
| 717 |
-
"train_runtime":
|
| 718 |
-
"train_samples_per_second":
|
| 719 |
-
"train_steps_per_second":
|
| 720 |
}
|
| 721 |
],
|
| 722 |
"logging_steps": 100,
|
|
|
|
| 714 |
"step": 10000,
|
| 715 |
"total_flos": 1.2490998615421747e+17,
|
| 716 |
"train_loss": 0.0,
|
| 717 |
+
"train_runtime": 2.0682,
|
| 718 |
+
"train_samples_per_second": 77360.196,
|
| 719 |
+
"train_steps_per_second": 4835.012
|
| 720 |
}
|
| 721 |
],
|
| 722 |
"logging_steps": 100,
|