Training in progress, step 16
Browse files- adapter_config.json +34 -0
- adapter_model.safetensors +3 -0
- added_tokens.json +3 -0
- runs/May03_13-42-18_2efa04e46d11/events.out.tfevents.1714743739.2efa04e46d11 +3 -0
- runs/May03_13-56-34_2efa04e46d11/events.out.tfevents.1714744595.2efa04e46d11 +3 -0
- runs/May03_14-46-12_2efa04e46d11/events.out.tfevents.1714747572.2efa04e46d11 +3 -0
- runs/May03_14-52-52_2efa04e46d11/events.out.tfevents.1714747973.2efa04e46d11 +3 -0
- runs/May03_15-04-06_2efa04e46d11/events.out.tfevents.1714748646.2efa04e46d11 +3 -0
- runs/May03_15-27-23_2efa04e46d11/events.out.tfevents.1714750044.2efa04e46d11 +3 -0
- runs/May03_15-34-15_2efa04e46d11/events.out.tfevents.1714750456.2efa04e46d11 +3 -0
- runs/May03_15-45-33_2efa04e46d11/events.out.tfevents.1714751134.2efa04e46d11 +3 -0
- runs/May03_15-53-41_2efa04e46d11/events.out.tfevents.1714751622.2efa04e46d11 +3 -0
- runs/May03_16-21-34_2efa04e46d11/events.out.tfevents.1714753294.2efa04e46d11 +3 -0
- runs/May03_16-28-58_2efa04e46d11/events.out.tfevents.1714753739.2efa04e46d11 +3 -0
- runs/May03_16-38-55_2efa04e46d11/events.out.tfevents.1714754335.2efa04e46d11 +3 -0
- runs/May03_16-51-30_2efa04e46d11/events.out.tfevents.1714755091.2efa04e46d11 +3 -0
- runs/May03_18-12-58_2efa04e46d11/events.out.tfevents.1714759980.2efa04e46d11 +3 -0
- runs/May03_18-18-37_2efa04e46d11/events.out.tfevents.1714760317.2efa04e46d11 +3 -0
- runs/May03_18-24-39_2efa04e46d11/events.out.tfevents.1714760682.2efa04e46d11 +3 -0
- runs/May03_18-30-59_2efa04e46d11/events.out.tfevents.1714761060.2efa04e46d11 +3 -0
- special_tokens_map.json +30 -0
- tokenizer.json +0 -0
- tokenizer.model +3 -0
- tokenizer_config.json +52 -0
- training_args.bin +3 -0
adapter_config.json
ADDED
|
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"alpha_pattern": {},
|
| 3 |
+
"auto_mapping": null,
|
| 4 |
+
"base_model_name_or_path": "mistralai/Mistral-7B-Instruct-v0.2",
|
| 5 |
+
"bias": "none",
|
| 6 |
+
"fan_in_fan_out": false,
|
| 7 |
+
"inference_mode": true,
|
| 8 |
+
"init_lora_weights": true,
|
| 9 |
+
"layer_replication": null,
|
| 10 |
+
"layers_pattern": null,
|
| 11 |
+
"layers_to_transform": null,
|
| 12 |
+
"loftq_config": {},
|
| 13 |
+
"lora_alpha": 64,
|
| 14 |
+
"lora_dropout": 0,
|
| 15 |
+
"megatron_config": null,
|
| 16 |
+
"megatron_core": "megatron.core",
|
| 17 |
+
"modules_to_save": null,
|
| 18 |
+
"peft_type": "LORA",
|
| 19 |
+
"r": 16,
|
| 20 |
+
"rank_pattern": {},
|
| 21 |
+
"revision": null,
|
| 22 |
+
"target_modules": [
|
| 23 |
+
"down_proj",
|
| 24 |
+
"k_proj",
|
| 25 |
+
"o_proj",
|
| 26 |
+
"v_proj",
|
| 27 |
+
"up_proj",
|
| 28 |
+
"gate_proj",
|
| 29 |
+
"q_proj"
|
| 30 |
+
],
|
| 31 |
+
"task_type": "CAUSAL_LM",
|
| 32 |
+
"use_dora": false,
|
| 33 |
+
"use_rslora": false
|
| 34 |
+
}
|
adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe7c35d3f185f2db4b749d9872b0c3a63ae1ec60e65181a376d28337e5c00efe
|
| 3 |
+
size 167832240
|
added_tokens.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"[PAD]": 32000
|
| 3 |
+
}
|
runs/May03_13-42-18_2efa04e46d11/events.out.tfevents.1714743739.2efa04e46d11
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:601b9841bd65b4121a6a94630ccca2e7d6c952fd35c01c153f52bddd437b2835
|
| 3 |
+
size 5318
|
runs/May03_13-56-34_2efa04e46d11/events.out.tfevents.1714744595.2efa04e46d11
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1f3bb908c657898b4c1ce3e83e48d7dea88b30d973fa70c10f6706ef4aa89268
|
| 3 |
+
size 32906
|
runs/May03_14-46-12_2efa04e46d11/events.out.tfevents.1714747572.2efa04e46d11
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3b489582dd9ce23c6bc6e4eb368a0b580c70c112fd60e5757b6291006a71f720
|
| 3 |
+
size 7826
|
runs/May03_14-52-52_2efa04e46d11/events.out.tfevents.1714747973.2efa04e46d11
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e22179ff5d3c21b0826c817faaae83598c5d0165ca6cab366771d19b6bb33ec4
|
| 3 |
+
size 11588
|
runs/May03_15-04-06_2efa04e46d11/events.out.tfevents.1714748646.2efa04e46d11
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a1e2029f51e24d886ea564f40e8bdd7a8cb2ec9d47946e894f62af67c19fdc51
|
| 3 |
+
size 19112
|
runs/May03_15-27-23_2efa04e46d11/events.out.tfevents.1714750044.2efa04e46d11
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2c5a210ea06515bb5707468790b3f914b000bcf2d4691ccc357b5ddfbe4d15d1
|
| 3 |
+
size 5318
|
runs/May03_15-34-15_2efa04e46d11/events.out.tfevents.1714750456.2efa04e46d11
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f79151b26b6830a9a892cfdd96d93549fa6735d622159f905852d4a18339212c
|
| 3 |
+
size 10334
|
runs/May03_15-45-33_2efa04e46d11/events.out.tfevents.1714751134.2efa04e46d11
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b7aa472a99651c2b8e75a102b0cc7609fd667fd7258674107aac45a3a9c738d4
|
| 3 |
+
size 7829
|
runs/May03_15-53-41_2efa04e46d11/events.out.tfevents.1714751622.2efa04e46d11
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:397f65cd253320486d24f75c0d03d4cf5918dc220a0873e921067c81e8b8faf0
|
| 3 |
+
size 22869
|
runs/May03_16-21-34_2efa04e46d11/events.out.tfevents.1714753294.2efa04e46d11
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4d2a1ec969f2a68b6447f6faf9c0a2f4cef333146d0ac1bbc13254d5897d2a70
|
| 3 |
+
size 5313
|
runs/May03_16-28-58_2efa04e46d11/events.out.tfevents.1714753739.2efa04e46d11
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1b7a1811a1002af2d282d86eac60199c2f0d4d9e2af73dcf5a2207f01aa8124c
|
| 3 |
+
size 9075
|
runs/May03_16-38-55_2efa04e46d11/events.out.tfevents.1714754335.2efa04e46d11
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:50ee32ee4ed47572d929167c6690b20c4dc67f1eac75c364e4298af2696e0bc6
|
| 3 |
+
size 11583
|
runs/May03_16-51-30_2efa04e46d11/events.out.tfevents.1714755091.2efa04e46d11
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ec3885e741eaed8488da1725b542cdf82486ca704e317b055d563acb0b767658
|
| 3 |
+
size 16742
|
runs/May03_18-12-58_2efa04e46d11/events.out.tfevents.1714759980.2efa04e46d11
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:28f51b44dec2a9e2e9e7476b0f8eee2f402fefcc52632d2c9677c105bdcb31f8
|
| 3 |
+
size 5426
|
runs/May03_18-18-37_2efa04e46d11/events.out.tfevents.1714760317.2efa04e46d11
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:171d948501d5ba7d2751e59f4f23c8944a27e1238efe4ddf9279de7bb2190611
|
| 3 |
+
size 5426
|
runs/May03_18-24-39_2efa04e46d11/events.out.tfevents.1714760682.2efa04e46d11
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6881055184a448ad37556ba5b04a47a08de9ef825923496e212382bf8cb3ad12
|
| 3 |
+
size 5426
|
runs/May03_18-30-59_2efa04e46d11/events.out.tfevents.1714761060.2efa04e46d11
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:636457cb9d5feb1f5e3354d6f4e67347464985968194bd3c6daf93f49bf53bff
|
| 3 |
+
size 24892
|
special_tokens_map.json
ADDED
|
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token": {
|
| 3 |
+
"content": "<s>",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": false,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"eos_token": {
|
| 10 |
+
"content": "</s>",
|
| 11 |
+
"lstrip": false,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
+
"pad_token": {
|
| 17 |
+
"content": "[PAD]",
|
| 18 |
+
"lstrip": false,
|
| 19 |
+
"normalized": false,
|
| 20 |
+
"rstrip": false,
|
| 21 |
+
"single_word": false
|
| 22 |
+
},
|
| 23 |
+
"unk_token": {
|
| 24 |
+
"content": "<unk>",
|
| 25 |
+
"lstrip": false,
|
| 26 |
+
"normalized": false,
|
| 27 |
+
"rstrip": false,
|
| 28 |
+
"single_word": false
|
| 29 |
+
}
|
| 30 |
+
}
|
tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tokenizer.model
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dadfd56d766715c61d2ef780a525ab43b8e6da4de6865bda3d95fdef5e134055
|
| 3 |
+
size 493443
|
tokenizer_config.json
ADDED
|
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"add_bos_token": true,
|
| 3 |
+
"add_eos_token": false,
|
| 4 |
+
"added_tokens_decoder": {
|
| 5 |
+
"0": {
|
| 6 |
+
"content": "<unk>",
|
| 7 |
+
"lstrip": false,
|
| 8 |
+
"normalized": false,
|
| 9 |
+
"rstrip": false,
|
| 10 |
+
"single_word": false,
|
| 11 |
+
"special": true
|
| 12 |
+
},
|
| 13 |
+
"1": {
|
| 14 |
+
"content": "<s>",
|
| 15 |
+
"lstrip": false,
|
| 16 |
+
"normalized": false,
|
| 17 |
+
"rstrip": false,
|
| 18 |
+
"single_word": false,
|
| 19 |
+
"special": true
|
| 20 |
+
},
|
| 21 |
+
"2": {
|
| 22 |
+
"content": "</s>",
|
| 23 |
+
"lstrip": false,
|
| 24 |
+
"normalized": false,
|
| 25 |
+
"rstrip": false,
|
| 26 |
+
"single_word": false,
|
| 27 |
+
"special": true
|
| 28 |
+
},
|
| 29 |
+
"32000": {
|
| 30 |
+
"content": "[PAD]",
|
| 31 |
+
"lstrip": false,
|
| 32 |
+
"normalized": false,
|
| 33 |
+
"rstrip": false,
|
| 34 |
+
"single_word": false,
|
| 35 |
+
"special": true
|
| 36 |
+
}
|
| 37 |
+
},
|
| 38 |
+
"additional_special_tokens": [],
|
| 39 |
+
"bos_token": "<s>",
|
| 40 |
+
"chat_template": "{{ bos_token }}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if message['role'] == 'user' %}{{ '[INST] ' + message['content'] + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ message['content'] + eos_token}}{% else %}{{ raise_exception('Only user and assistant roles are supported!') }}{% endif %}{% endfor %}",
|
| 41 |
+
"clean_up_tokenization_spaces": false,
|
| 42 |
+
"eos_token": "</s>",
|
| 43 |
+
"legacy": true,
|
| 44 |
+
"model_max_length": 1000000000000000019884624838656,
|
| 45 |
+
"pad_token": "[PAD]",
|
| 46 |
+
"padding_side": "left",
|
| 47 |
+
"sp_model_kwargs": {},
|
| 48 |
+
"spaces_between_special_tokens": false,
|
| 49 |
+
"tokenizer_class": "LlamaTokenizer",
|
| 50 |
+
"unk_token": "<unk>",
|
| 51 |
+
"use_default_system_prompt": false
|
| 52 |
+
}
|
training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6dee1690a11bb3358d66a6ba11dd88327a96654a51c9007c2a9830994ea29f7c
|
| 3 |
+
size 5240
|