Upload folder using huggingface_hub
Browse files
adapter_config.json
CHANGED
|
@@ -30,12 +30,12 @@
|
|
| 30 |
"rank_pattern": {},
|
| 31 |
"revision": null,
|
| 32 |
"target_modules": [
|
| 33 |
-
"v_proj",
|
| 34 |
"o_proj",
|
| 35 |
"up_proj",
|
|
|
|
|
|
|
| 36 |
"q_proj",
|
| 37 |
"gate_proj",
|
| 38 |
-
"down_proj",
|
| 39 |
"k_proj"
|
| 40 |
],
|
| 41 |
"target_parameters": null,
|
|
|
|
| 30 |
"rank_pattern": {},
|
| 31 |
"revision": null,
|
| 32 |
"target_modules": [
|
|
|
|
| 33 |
"o_proj",
|
| 34 |
"up_proj",
|
| 35 |
+
"v_proj",
|
| 36 |
+
"down_proj",
|
| 37 |
"q_proj",
|
| 38 |
"gate_proj",
|
|
|
|
| 39 |
"k_proj"
|
| 40 |
],
|
| 41 |
"target_parameters": null,
|
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 80792880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:828f20aa28d6fde2f54ec3cef68c52c86b74ba89af6430c280bfddcf66de93d0
|
| 3 |
size 80792880
|
checkpoint-77/adapter_config.json
CHANGED
|
@@ -30,12 +30,12 @@
|
|
| 30 |
"rank_pattern": {},
|
| 31 |
"revision": null,
|
| 32 |
"target_modules": [
|
| 33 |
-
"v_proj",
|
| 34 |
"o_proj",
|
| 35 |
"up_proj",
|
|
|
|
|
|
|
| 36 |
"q_proj",
|
| 37 |
"gate_proj",
|
| 38 |
-
"down_proj",
|
| 39 |
"k_proj"
|
| 40 |
],
|
| 41 |
"target_parameters": null,
|
|
|
|
| 30 |
"rank_pattern": {},
|
| 31 |
"revision": null,
|
| 32 |
"target_modules": [
|
|
|
|
| 33 |
"o_proj",
|
| 34 |
"up_proj",
|
| 35 |
+
"v_proj",
|
| 36 |
+
"down_proj",
|
| 37 |
"q_proj",
|
| 38 |
"gate_proj",
|
|
|
|
| 39 |
"k_proj"
|
| 40 |
],
|
| 41 |
"target_parameters": null,
|
checkpoint-77/adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 80792880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:828f20aa28d6fde2f54ec3cef68c52c86b74ba89af6430c280bfddcf66de93d0
|
| 3 |
size 80792880
|
checkpoint-77/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 161810747
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2cb711327043f058babaf737266d6285bc02546ee7853279764ac08b99c80b26
|
| 3 |
size 161810747
|
checkpoint-77/trainer_state.json
CHANGED
|
@@ -10,32 +10,32 @@
|
|
| 10 |
"is_world_process_zero": true,
|
| 11 |
"log_history": [
|
| 12 |
{
|
| 13 |
-
"entropy": 1.
|
| 14 |
"epoch": 0.32786885245901637,
|
| 15 |
-
"grad_norm": 0.
|
| 16 |
"learning_rate": 0.00016282199972956425,
|
| 17 |
-
"loss": 1.
|
| 18 |
-
"mean_token_accuracy": 0.
|
| 19 |
"num_tokens": 150039.0,
|
| 20 |
"step": 25
|
| 21 |
},
|
| 22 |
{
|
| 23 |
-
"entropy": 0.
|
| 24 |
"epoch": 0.6557377049180327,
|
| 25 |
-
"grad_norm": 0.
|
| 26 |
"learning_rate": 6.271435222196916e-05,
|
| 27 |
-
"loss": 0.
|
| 28 |
-
"mean_token_accuracy": 0.
|
| 29 |
"num_tokens": 292991.0,
|
| 30 |
"step": 50
|
| 31 |
},
|
| 32 |
{
|
| 33 |
-
"entropy": 0.
|
| 34 |
"epoch": 0.9836065573770492,
|
| 35 |
-
"grad_norm": 0.
|
| 36 |
"learning_rate": 8.099564741123166e-07,
|
| 37 |
-
"loss": 0.
|
| 38 |
-
"mean_token_accuracy": 0.
|
| 39 |
"num_tokens": 440288.0,
|
| 40 |
"step": 75
|
| 41 |
}
|
|
|
|
| 10 |
"is_world_process_zero": true,
|
| 11 |
"log_history": [
|
| 12 |
{
|
| 13 |
+
"entropy": 1.2594475726783276,
|
| 14 |
"epoch": 0.32786885245901637,
|
| 15 |
+
"grad_norm": 0.05419921875,
|
| 16 |
"learning_rate": 0.00016282199972956425,
|
| 17 |
+
"loss": 1.2619928741455078,
|
| 18 |
+
"mean_token_accuracy": 0.7029473577439785,
|
| 19 |
"num_tokens": 150039.0,
|
| 20 |
"step": 25
|
| 21 |
},
|
| 22 |
{
|
| 23 |
+
"entropy": 0.923663822337985,
|
| 24 |
"epoch": 0.6557377049180327,
|
| 25 |
+
"grad_norm": 0.19140625,
|
| 26 |
"learning_rate": 6.271435222196916e-05,
|
| 27 |
+
"loss": 0.82879150390625,
|
| 28 |
+
"mean_token_accuracy": 0.776209542453289,
|
| 29 |
"num_tokens": 292991.0,
|
| 30 |
"step": 50
|
| 31 |
},
|
| 32 |
{
|
| 33 |
+
"entropy": 0.6226911177486181,
|
| 34 |
"epoch": 0.9836065573770492,
|
| 35 |
+
"grad_norm": 0.103515625,
|
| 36 |
"learning_rate": 8.099564741123166e-07,
|
| 37 |
+
"loss": 0.5372924423217773,
|
| 38 |
+
"mean_token_accuracy": 0.8512885943055153,
|
| 39 |
"num_tokens": 440288.0,
|
| 40 |
"step": 75
|
| 41 |
}
|