Add files using upload-large-folder tool
Browse files
- chat_template.jinja +1 -1
- config.json +19 -14
- model-1-of-40.safetensors +1 -1
- model-10-of-40.safetensors +2 -2
- model-11-of-40.safetensors +2 -2
- model-12-of-40.safetensors +2 -2
- model-13-of-40.safetensors +2 -2
- model-14-of-40.safetensors +2 -2
- model-15-of-40.safetensors +2 -2
- model-16-of-40.safetensors +2 -2
- model-17-of-40.safetensors +2 -2
- model-18-of-40.safetensors +2 -2
- model-19-of-40.safetensors +2 -2
- model-2-of-40.safetensors +2 -2
- model-20-of-40.safetensors +2 -2
- model-21-of-40.safetensors +2 -2
- model-22-of-40.safetensors +2 -2
- model-23-of-40.safetensors +2 -2
- model-24-of-40.safetensors +2 -2
- model-25-of-40.safetensors +2 -2
- model-26-of-40.safetensors +2 -2
- model-27-of-40.safetensors +2 -2
- model-28-of-40.safetensors +2 -2
- model-29-of-40.safetensors +2 -2
- model-3-of-40.safetensors +2 -2
- model-30-of-40.safetensors +2 -2
- model-31-of-40.safetensors +2 -2
- model-32-of-40.safetensors +2 -2
- model-33-of-40.safetensors +2 -2
- model-34-of-40.safetensors +2 -2
- model-35-of-40.safetensors +2 -2
- model-36-of-40.safetensors +2 -2
- model-37-of-40.safetensors +2 -2
- model-38-of-40.safetensors +2 -2
- model-39-of-40.safetensors +2 -2
- model-4-of-40.safetensors +2 -2
- model-40-of-40.safetensors +2 -2
- model-5-of-40.safetensors +2 -2
- model-6-of-40.safetensors +2 -2
- model-7-of-40.safetensors +2 -2
- model-8-of-40.safetensors +2 -2
- model-9-of-40.safetensors +2 -2
- model-non-layer.safetensors +1 -1
- model.safetensors.index.json +2 -5
- mtp-1-of-1.safetensors +1 -1
chat_template.jinja
CHANGED
|
@@ -100,4 +100,4 @@
|
|
| 100 |
|
| 101 |
{%- if add_generation_prompt -%}
|
| 102 |
{{ '<|Assistant|>' }}{{ '<|end_of_thought|>' }}
|
| 103 |
-
{%- endif -%}
|
|
|
|
| 100 |
|
| 101 |
{%- if add_generation_prompt -%}
|
| 102 |
{{ '<|Assistant|>' }}{{ '<|end_of_thought|>' }}
|
| 103 |
+
{%- endif -%}
|
config.json
CHANGED
|
@@ -10,9 +10,11 @@
|
|
| 10 |
"AutoModelForCausalLM": "modeling_deepseek.DeepseekV3ForCausalLM"
|
| 11 |
},
|
| 12 |
"bos_token_id": 0,
|
|
|
|
| 13 |
"eos_token_id": 1,
|
| 14 |
"ep_size": 1,
|
| 15 |
"first_k_dense_replace": 1,
|
|
|
|
| 16 |
"hidden_act": "silu",
|
| 17 |
"hidden_size": 2048,
|
| 18 |
"initializer_range": 0.02,
|
|
@@ -31,21 +33,11 @@
|
|
| 31 |
"num_hidden_layers": 40,
|
| 32 |
"num_key_value_heads": 32,
|
| 33 |
"num_nextn_predict_layers": 1,
|
|
|
|
| 34 |
"q_lora_rank": 1536,
|
|
|
|
| 35 |
"qk_nope_head_dim": 128,
|
| 36 |
"qk_rope_head_dim": 64,
|
| 37 |
-
"rms_norm_eps": 1e-06,
|
| 38 |
-
"rope_theta": 32000000,
|
| 39 |
-
"routed_scaling_factor": 2.5,
|
| 40 |
-
"scoring_func": "sigmoid",
|
| 41 |
-
"tie_word_embeddings": false,
|
| 42 |
-
"topk_group": 1,
|
| 43 |
-
"topk_method": "noaux_tc",
|
| 44 |
-
"torch_dtype": "bfloat16",
|
| 45 |
-
"transformers_version": "4.44.2",
|
| 46 |
-
"use_cache": true,
|
| 47 |
-
"v_head_dim": 128,
|
| 48 |
-
"vocab_size": 129280,
|
| 49 |
"quantization_config": {
|
| 50 |
"config_groups": {
|
| 51 |
"group_0": {
|
|
@@ -58,7 +50,7 @@
|
|
| 58 |
"actorder": null,
|
| 59 |
"block_structure": null,
|
| 60 |
"dynamic": false,
|
| 61 |
-
"group_size":
|
| 62 |
"num_bits": 4,
|
| 63 |
"observer": "minmax",
|
| 64 |
"observer_kwargs": {},
|
|
@@ -78,5 +70,18 @@
|
|
| 78 |
"kv_cache_scheme": null,
|
| 79 |
"quant_method": "compressed-tensors",
|
| 80 |
"quantization_status": "compressed"
|
| 81 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 82 |
}
|
|
|
|
| 10 |
"AutoModelForCausalLM": "modeling_deepseek.DeepseekV3ForCausalLM"
|
| 11 |
},
|
| 12 |
"bos_token_id": 0,
|
| 13 |
+
"dtype": "bfloat16",
|
| 14 |
"eos_token_id": 1,
|
| 15 |
"ep_size": 1,
|
| 16 |
"first_k_dense_replace": 1,
|
| 17 |
+
"head_dim": 64,
|
| 18 |
"hidden_act": "silu",
|
| 19 |
"hidden_size": 2048,
|
| 20 |
"initializer_range": 0.02,
|
|
|
|
| 33 |
"num_hidden_layers": 40,
|
| 34 |
"num_key_value_heads": 32,
|
| 35 |
"num_nextn_predict_layers": 1,
|
| 36 |
+
"pretraining_tp": 1,
|
| 37 |
"q_lora_rank": 1536,
|
| 38 |
+
"qk_head_dim": 192,
|
| 39 |
"qk_nope_head_dim": 128,
|
| 40 |
"qk_rope_head_dim": 64,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 41 |
"quantization_config": {
|
| 42 |
"config_groups": {
|
| 43 |
"group_0": {
|
|
|
|
| 50 |
"actorder": null,
|
| 51 |
"block_structure": null,
|
| 52 |
"dynamic": false,
|
| 53 |
+
"group_size": 64,
|
| 54 |
"num_bits": 4,
|
| 55 |
"observer": "minmax",
|
| 56 |
"observer_kwargs": {},
|
|
|
|
| 70 |
"kv_cache_scheme": null,
|
| 71 |
"quant_method": "compressed-tensors",
|
| 72 |
"quantization_status": "compressed"
|
| 73 |
+
},
|
| 74 |
+
"rms_norm_eps": 1e-06,
|
| 75 |
+
"rope_interleave": true,
|
| 76 |
+
"rope_scaling": null,
|
| 77 |
+
"rope_theta": 32000000,
|
| 78 |
+
"routed_scaling_factor": 2.5,
|
| 79 |
+
"scoring_func": "sigmoid",
|
| 80 |
+
"tie_word_embeddings": false,
|
| 81 |
+
"topk_group": 1,
|
| 82 |
+
"topk_method": "noaux_tc",
|
| 83 |
+
"transformers_version": "4.57.3",
|
| 84 |
+
"use_cache": true,
|
| 85 |
+
"v_head_dim": 128,
|
| 86 |
+
"vocab_size": 129280
|
| 87 |
}
|
model-1-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 140785016
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d4ff3a9595c500b44c308dcb352de70289268867c1cb95398c991b6bda655288
|
| 3 |
size 140785016
|
model-10-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:726a23a975f03162a5fbefa721fb5f06489aaf7a3a6932b7e0ef91e3a1aa7a89
|
| 3 |
+
size 742957112
|
model-11-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bd640c160281bd25ee639d7827d8ef1973b88ebdb0bd6e2b4707c57111235329
|
| 3 |
+
size 742959432
|
model-12-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a52a909c7291bacc83be6583a74fa636bc1f80428bd99a4cdd5d9e04b1fab9db
|
| 3 |
+
size 742959432
|
model-13-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:acc59d9a7e9c461521d0cfe97a17be25f9964139437c877d2ee9b06eadfe0635
|
| 3 |
+
size 742959432
|
model-14-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2ba42417e9ed554dc63689c800b5ac05e0022cd82577e9eccb39336733915e96
|
| 3 |
+
size 742959432
|
model-15-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:547cf7c15e82f400a52d008133236b614f619db00c7ab747ba6457294a36da24
|
| 3 |
+
size 742959432
|
model-16-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e0d7632f46d804d3f8fed17525ad22a79b4304366c0e27ba0c943dad384c9e45
|
| 3 |
+
size 742959432
|
model-17-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5f18a1c3ef7485c1d949a4766d8dcec32ac043df1c8bf911758718156fccbc5b
|
| 3 |
+
size 742959432
|
model-18-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cfbe35220cb9898a22a4fdf2be7402f031e1dbac742a65b317d26509c5764b34
|
| 3 |
+
size 742959432
|
model-19-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0a10861e1ffc82ac0f4461fd581b6b401ee5eecbc655c5a8c82b985f5c5fdd97
|
| 3 |
+
size 742959432
|
model-2-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:350f55333a55f367cc9c8dac8d08def69eeeb2b87fb7e883095a242a16ca6485
|
| 3 |
+
size 742957112
|
model-20-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:59c28ace24b7d7f918eb6d0b1aee178da684e9e0e87007f90682ca6c227fa7cd
|
| 3 |
+
size 742959432
|
model-21-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f4b94080b3a18841a127d565dae1be4e555f3a6108ff4c8cbcd67cbe550739d1
|
| 3 |
+
size 742959432
|
model-22-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:19ddcdcafae2e4f809db86a353e600944e33e9979be9f3c7b0a8d2f010f427f1
|
| 3 |
+
size 742959432
|
model-23-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:41f14a2707f5d5f2f9c9c66dcae3e3804ead083fa941776e3f897d7e16252987
|
| 3 |
+
size 742959432
|
model-24-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:53938e077028c98ec68950310513de8fb6fb7123d6d92b6cc7581f728eef323e
|
| 3 |
+
size 742959432
|
model-25-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f5410eb0f47bddba92dc7f167d649aaf1110674679ca48e07fe64e7eeb6f6197
|
| 3 |
+
size 742959432
|
model-26-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:21bc943a8428b23d0054fd1e10b7506d5d84ec137b3aedae7a7a4589522c9b51
|
| 3 |
+
size 742959432
|
model-27-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:554e73d388f048d7619a13d0f79c1a80ca6e9279a8073ff8dae186df526e311f
|
| 3 |
+
size 742959432
|
model-28-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3fc9b275e1d16621ba95656c4c5dd1a47ab822aef33ec78d398613851bb43efc
|
| 3 |
+
size 742959432
|
model-29-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7c8c41d732ca08ee9a2efa0ff166eb7e8b3537e371be3974e26e3ea1fc7d088a
|
| 3 |
+
size 742959432
|
model-3-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:10b9f33a96d3967e5036ee3904585c6c598f636c30868782a088d8357c647993
|
| 3 |
+
size 742957112
|
model-30-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9fb82b7519ecf2dd6899f3aa6a9c1b270c0b45c11c2739766fcebf4a520f908a
|
| 3 |
+
size 742959432
|
model-31-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a783a6038833bda2b6f781d414daebc6e87b341079ebf402d70e408cbbb7e152
|
| 3 |
+
size 742959432
|
model-32-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:772c68a4ce2a49aba2a37fef2dc832f93f63456f85eafc260d03ae2cf9b5ed08
|
| 3 |
+
size 742959432
|
model-33-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5ed2633aaa725ad82583ebecb9f24c00c67a80a5669c309a9c460cbddc4948c2
|
| 3 |
+
size 742959432
|
model-34-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7b2eea6d07916ef281c8f0dae32d8d26c7e4d093f6a77a065daf5f97a668de4a
|
| 3 |
+
size 742959432
|
model-35-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7dadaa7799c2217fe60ffcf866a0bdb8cbf80514fa8651cd55d6b27bd6e3533e
|
| 3 |
+
size 742959432
|
model-36-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b66da6210a4112ebd30d1d27bac0e03534b14a3452fc3fe2f21ad00fc1c121e0
|
| 3 |
+
size 742959432
|
model-37-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c33f20ea2a6cdcc1a6b7ac03019528ba56721b6c521448297744bd4f327731a6
|
| 3 |
+
size 742959432
|
model-38-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b6970a9ac0d9c47ffedd401ce63deff887ac40ee7c2bc67f297ca11384e00d62
|
| 3 |
+
size 742959432
|
model-39-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:21fa2b399986e7f990426980a475e2633d68db49611718bd23a36190a8da2b08
|
| 3 |
+
size 742959432
|
model-4-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4298c221ca35e3c9607b0d7ff0411d7abd95a1fa543b961d3696d3850b50ed3e
|
| 3 |
+
size 742957112
|
model-40-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:61742d29c756dd672d4822e0c735649e9e31ab7e25254f99262a76785f30802f
|
| 3 |
+
size 742959432
|
model-5-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a5e7a76aa67b9201962fdcb23048229fa07809fc988a278527691ef18125ab1d
|
| 3 |
+
size 742957112
|
model-6-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:89cb41236f515d0290b0314995ff844244edff51adddb15250d9cd0a0620b376
|
| 3 |
+
size 742957112
|
model-7-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fd2753a823e2efaf7d072d2bd79df61b71276107e4f6222e7fb0e0f8e27e6cc8
|
| 3 |
+
size 742957112
|
model-8-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1f6d5145ecd921a7d7d861daf849cb777bf7b8e7567cf5969e353e4e759709f8
|
| 3 |
+
size 742957112
|
model-9-of-40.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9795060b455ea238e1cdb64df5aee4e51d62bae3e51d4c31e579718aedd0d43a
|
| 3 |
+
size 742957112
|
model-non-layer.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1059066184
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9b992b0a3e3ab06a9490d364bf942df3bcf69874dcb9f940e935f674672f09cd
|
| 3 |
size 1059066184
|
model.safetensors.index.json
CHANGED
|
@@ -1,7 +1,4 @@
|
|
| 1 |
{
|
| 2 |
-
"metadata": {
|
| 3 |
-
"total_size": 0
|
| 4 |
-
},
|
| 5 |
"weight_map": {
|
| 6 |
"lm_head.weight": "model-non-layer.safetensors",
|
| 7 |
"model.embed_tokens.weight": "model-non-layer.safetensors",
|
|
@@ -90435,7 +90432,7 @@
|
|
| 90435 |
"model.layers.40.self_attn.q_a_layernorm.weight": "mtp-1-of-1.safetensors",
|
| 90436 |
"model.layers.40.self_attn.q_a_proj.weight": "mtp-1-of-1.safetensors",
|
| 90437 |
"model.layers.40.self_attn.q_b_proj.weight": "mtp-1-of-1.safetensors",
|
| 90438 |
-
"model.layers.40.shared_head.
|
| 90439 |
-
"model.layers.40.shared_head.
|
| 90440 |
}
|
| 90441 |
}
|
|
|
|
| 1 |
{
|
|
|
|
|
|
|
|
|
|
| 2 |
"weight_map": {
|
| 3 |
"lm_head.weight": "model-non-layer.safetensors",
|
| 4 |
"model.embed_tokens.weight": "model-non-layer.safetensors",
|
|
|
|
| 90432 |
"model.layers.40.self_attn.q_a_layernorm.weight": "mtp-1-of-1.safetensors",
|
| 90433 |
"model.layers.40.self_attn.q_a_proj.weight": "mtp-1-of-1.safetensors",
|
| 90434 |
"model.layers.40.self_attn.q_b_proj.weight": "mtp-1-of-1.safetensors",
|
| 90435 |
+
"model.layers.40.shared_head.head.weight": "mtp-1-of-1.safetensors",
|
| 90436 |
+
"model.layers.40.shared_head.norm.weight": "mtp-1-of-1.safetensors"
|
| 90437 |
}
|
| 90438 |
}
|
mtp-1-of-1.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 687105960
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:74cb5a9b60987b70d854406b19ed713e781774bada163d3097f808f09c08d7bf
|
| 3 |
size 687105960
|