Add files using upload-large-folder tool
Browse files- config.json +41 -0
- generate_config.json +7 -0
- model-00000-of-00099.safetensors +3 -0
- model-00003-of-00099.safetensors +3 -0
- model-00010-of-00099.safetensors +3 -0
- model-00011-of-00099.safetensors +3 -0
- model-00013-of-00099.safetensors +3 -0
- model-00015-of-00099.safetensors +3 -0
- model-00017-of-00099.safetensors +3 -0
- model-00023-of-00099.safetensors +3 -0
- model-00024-of-00099.safetensors +3 -0
- model-00025-of-00099.safetensors +3 -0
- model-00026-of-00099.safetensors +3 -0
- model-00028-of-00099.safetensors +3 -0
- model-00032-of-00099.safetensors +3 -0
- model-00033-of-00099.safetensors +3 -0
- model-00034-of-00099.safetensors +3 -0
- model-00035-of-00099.safetensors +3 -0
- model-00038-of-00099.safetensors +3 -0
- model-00039-of-00099.safetensors +3 -0
- model-00045-of-00099.safetensors +3 -0
- model-00046-of-00099.safetensors +3 -0
- model-00047-of-00099.safetensors +3 -0
- model-00050-of-00099.safetensors +3 -0
- model-00053-of-00099.safetensors +3 -0
- model-00055-of-00099.safetensors +3 -0
- model-00056-of-00099.safetensors +3 -0
- model-00057-of-00099.safetensors +3 -0
- model-00058-of-00099.safetensors +3 -0
- model-00059-of-00099.safetensors +3 -0
- model-00061-of-00099.safetensors +3 -0
- model-00063-of-00099.safetensors +3 -0
- model-00064-of-00099.safetensors +3 -0
- model-00065-of-00099.safetensors +3 -0
- model-00067-of-00099.safetensors +3 -0
- model-00068-of-00099.safetensors +3 -0
- model-00070-of-00099.safetensors +3 -0
- model-00074-of-00099.safetensors +3 -0
- model-00077-of-00099.safetensors +3 -0
- model-00078-of-00099.safetensors +3 -0
- model-00079-of-00099.safetensors +3 -0
- model-00081-of-00099.safetensors +3 -0
- model-00084-of-00099.safetensors +3 -0
- model-00088-of-00099.safetensors +3 -0
- model-00095-of-00099.safetensors +3 -0
- model-00096-of-00099.safetensors +3 -0
- model-00098-of-00099.safetensors +3 -0
- model.safetensors.index.json +0 -0
- tokenizer.json +0 -0
- tokenizer_config.json +0 -0
config.json
ADDED
|
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"HYV3ForCausalLM"
|
| 4 |
+
],
|
| 5 |
+
"enable_attention_fp32_softmax": false,
|
| 6 |
+
"enable_lm_head_fp32": true,
|
| 7 |
+
"enable_moe_fp32_combine": false,
|
| 8 |
+
"expert_hidden_dim": 1536,
|
| 9 |
+
"moe_intermediate_size": 1536,
|
| 10 |
+
"first_k_dense_replace": 1,
|
| 11 |
+
"head_dim": 128,
|
| 12 |
+
"hidden_act": "silu",
|
| 13 |
+
"hidden_size": 4096,
|
| 14 |
+
"initializer_range": 0.006,
|
| 15 |
+
"intermediate_size": 13312,
|
| 16 |
+
"max_position_embeddings": 262144,
|
| 17 |
+
"model_type": "hy_v3",
|
| 18 |
+
"moe_router_enable_expert_bias": true,
|
| 19 |
+
"moe_router_use_sigmoid": true,
|
| 20 |
+
"num_attention_heads": 64,
|
| 21 |
+
"num_experts": 192,
|
| 22 |
+
"num_experts_per_tok": 8,
|
| 23 |
+
"num_hidden_layers": 80,
|
| 24 |
+
"num_key_value_heads": 8,
|
| 25 |
+
"num_shared_experts": 1,
|
| 26 |
+
"output_router_logits": true,
|
| 27 |
+
"qk_norm": true,
|
| 28 |
+
"rms_norm_eps": 1e-05,
|
| 29 |
+
"rope_parameters": {
|
| 30 |
+
"rope_theta": 11158840.0,
|
| 31 |
+
"rope_type": "default"
|
| 32 |
+
},
|
| 33 |
+
"route_norm": true,
|
| 34 |
+
"router_scaling_factor": 2.826,
|
| 35 |
+
"tie_word_embeddings": false,
|
| 36 |
+
"transformers_version": "5.6.0",
|
| 37 |
+
"use_cache": true,
|
| 38 |
+
"use_grouped_mm": false,
|
| 39 |
+
"vocab_size": 120832,
|
| 40 |
+
"num_nextn_predict_layers": 1
|
| 41 |
+
}
|
generate_config.json
ADDED
|
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token_id": 120000,
|
| 3 |
+
"do_sample": false,
|
| 4 |
+
"eos_token_id": 120020,
|
| 5 |
+
"max_new_tokens": 2048,
|
| 6 |
+
"transformers_version": "5.6.0"
|
| 7 |
+
}
|
model-00000-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:649a67670108461567758f6280e089d0eb75a28176532b6cfcfd3a6fee18259b
|
| 3 |
+
size 7247829040
|
model-00003-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aff398d6dd970b28b277c07eda15e0586f160a8d91aa7d70762c9da75fbe074c
|
| 3 |
+
size 7247829616
|
model-00010-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:905779aa781a6e1bcf4d0622c2b896ba207a44bc1e34ecf25b6181e512f3919b
|
| 3 |
+
size 1073743720
|
model-00011-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4abae02bef67e29f1a4280c0ad419628acd93bc39e73786e7f99d75cc7930cf2
|
| 3 |
+
size 1006637160
|
model-00013-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2aaf5c5333076df4b161c383cb3811d07d35c9ef1479ebf1ccdd0147d0c5cfb3
|
| 3 |
+
size 7247829616
|
model-00015-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0f985037a76b2e3bac969fb091cff97587fb044706c6bd1e2bdd6dde26dfb3de
|
| 3 |
+
size 7247829616
|
model-00017-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b551b941e58ee6f7e5481b97d106eadc8b7cb09c39e19ee02ed13d5e0c0301b0
|
| 3 |
+
size 7247829616
|
model-00023-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d29551e053f88145df17fcf53a7c662de8a9b76e953d93a30783e974c558826a
|
| 3 |
+
size 1006637160
|
model-00024-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:689e9c7759c7d4bdef9db5084c6d24ac59b1dccd848544725b4dd1296f765bf9
|
| 3 |
+
size 7247829040
|
model-00025-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b93d9ac4182eb16c13f831a23ea411ea1599e7e51ed8f3959d061857598b02f5
|
| 3 |
+
size 7247829616
|
model-00026-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:148c2ee768afc48db9378f2836257a61ec04e827c73533e97607435987424336
|
| 3 |
+
size 7247829616
|
model-00028-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1c75c788fec6a8c3016c9a84836a7a8b7366e100b9b469ddcc48aac38e91218c
|
| 3 |
+
size 7247829616
|
model-00032-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:554cf656731d8f1af2254b86666e29707f4ac78fbfd74ee57651972c2186cafa
|
| 3 |
+
size 7247829616
|
model-00033-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7c0bba2ecbbc54f662b7061be6d90dafc164e90a232194e44af9f7e520100648
|
| 3 |
+
size 7247829616
|
model-00034-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:593fccfe422c1c9398b0dd801b1cd0e97104f3a5811e341453a11e9b6470d3c6
|
| 3 |
+
size 1073742304
|
model-00035-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6f9081dbda6a3af23fbe83df70768586009c067b72077ef246fad50c5c5903e2
|
| 3 |
+
size 998247496
|
model-00038-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3957f156b9b482ee929caa9c7e5fe5bda2a88172c573341b95c1e5c3caccec1c
|
| 3 |
+
size 7247829616
|
model-00039-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:51a103023248dacbabee740df0303d9b844352994adfd391eba1dbc5bf8dbbbb
|
| 3 |
+
size 7247829616
|
model-00045-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:54d8608cd224db1950873450427df87854178b581e14c183b68492054fb4e04b
|
| 3 |
+
size 7247829616
|
model-00046-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f91c867d41408907da3a4b3004ce9b2d86315284f9c68dcc6bb12870b72e88e3
|
| 3 |
+
size 1073746944
|
model-00047-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dac651fa44ddf9751dede24847e89ae6b1fb062105a50726845c4a9384526140
|
| 3 |
+
size 989855880
|
model-00050-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:75aa972e44faf1be28ecfc168e14065a74a42df75b6eff7bce9d5ffc937971f5
|
| 3 |
+
size 7247829616
|
model-00053-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6c8fd98ec16bd29ac34024aa440fa3222f8c9819edb24ff343c36b09f9c331bd
|
| 3 |
+
size 7247829616
|
model-00055-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:162c709e336f2aa8313091a33a7147ab51be7c90c7f5d09eb4c425acb98aa46e
|
| 3 |
+
size 7247829616
|
model-00056-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a9900d98d3bf9fb23ba73510ebe07c23d08a0c44b91425dd8c892775cac34805
|
| 3 |
+
size 7247829616
|
model-00057-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:52f204978cf4ac771d80f5c481bcb82deddb509f504eb636f67f77a626036bd0
|
| 3 |
+
size 7247829616
|
model-00058-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b1c5ce814ad1d9b7e93729f299fa397482741d5b775d7a9ba783c70f5e6ce6c0
|
| 3 |
+
size 1067580992
|
model-00059-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:54f5f74c7a2c2edeb99d73e5b97cc8c54cd4d77a3410b535dc120da73a6f297f
|
| 3 |
+
size 1006637152
|
model-00061-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bab6a301b97e4760423275bd3da4a66d9262888afd974a390d7ad0d313a5e4c1
|
| 3 |
+
size 7247829616
|
model-00063-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:86315e6ec9dd0ddf945c5876a71aae7b983e7e9d25e65628be78fd18b3e39ee5
|
| 3 |
+
size 7247829616
|
model-00064-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:48062ee9feb503e7c68ec0f1d8ea6b2f13efe85578437f51cb925225b460856f
|
| 3 |
+
size 7247829616
|
model-00065-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe85fe3b29195bab1d7da0a34b3025e1bdb534b13165abd7c0c73a4b6f3188ca
|
| 3 |
+
size 7247829616
|
model-00067-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a6824cc3337fef86e7bbf817246c1be032955b5f587ea4bee2455548713459b3
|
| 3 |
+
size 7247829616
|
model-00068-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:73190ae1d37122fb84357de49f2ad491a082009c9dbe710bbfa92af584d6454b
|
| 3 |
+
size 7247829616
|
model-00070-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2dad38b16ec57ba0a98014531dab76a3d03b3b818f6e44565dcd4afbf1f64960
|
| 3 |
+
size 1056968696
|
model-00074-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:85e558187484c72451c5fba0f0da1be52c25f45bf7858f9dc9137c83cc645ae6
|
| 3 |
+
size 7247829616
|
model-00077-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4baebab026300e2382e88a79e9aff33fad3b69dfac989280c06de6a31b5950ab
|
| 3 |
+
size 7247829616
|
model-00078-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:26a9441a2e352219691de0941d957976b4971790b7e629152fd3d29926ecd1d0
|
| 3 |
+
size 7247829616
|
model-00079-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0dba4828f8c22a051b41124afbcf55d9cc90f51839214ad9c364349f7b503914
|
| 3 |
+
size 7247829616
|
model-00081-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:16e7d1512e4d19c69cb64b24a20f9505f4c44d5855f735d308d7254b4bbbcdd2
|
| 3 |
+
size 7247829616
|
model-00084-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a5352299469b87eca33076001b00268d313265cd1673dd6270b5babfb1f7efa1
|
| 3 |
+
size 305501064
|
model-00088-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1f6a84acd4e0b44a46702789cda84efbb7d18f86a295b8fd306a5fba1356802d
|
| 3 |
+
size 7247829616
|
model-00095-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cfc79f113cc099e3e6f79abb32253a659e51c64fa40cd40bf73c3b0a8b833b08
|
| 3 |
+
size 2415943240
|
model-00096-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8df37ca6f641290a5a117e62a7fcf1a79cbf1975bb8897035f69e77b100bad30
|
| 3 |
+
size 1027472968
|
model-00098-of-00099.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3a74b4293adeb1a2c0c4eb18aa078a9b611f2c1c02caa425fad015ccef8cf0f7
|
| 3 |
+
size 893255032
|
model.safetensors.index.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tokenizer_config.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|