yiqichen01 committed on
Commit
f71230b
·
verified ·
1 Parent(s): b7d1d83

Add files using upload-large-folder tool

Browse files
Files changed (50) hide show
  1. config.json +41 -0
  2. generate_config.json +7 -0
  3. model-00000-of-00099.safetensors +3 -0
  4. model-00003-of-00099.safetensors +3 -0
  5. model-00010-of-00099.safetensors +3 -0
  6. model-00011-of-00099.safetensors +3 -0
  7. model-00013-of-00099.safetensors +3 -0
  8. model-00015-of-00099.safetensors +3 -0
  9. model-00017-of-00099.safetensors +3 -0
  10. model-00023-of-00099.safetensors +3 -0
  11. model-00024-of-00099.safetensors +3 -0
  12. model-00025-of-00099.safetensors +3 -0
  13. model-00026-of-00099.safetensors +3 -0
  14. model-00028-of-00099.safetensors +3 -0
  15. model-00032-of-00099.safetensors +3 -0
  16. model-00033-of-00099.safetensors +3 -0
  17. model-00034-of-00099.safetensors +3 -0
  18. model-00035-of-00099.safetensors +3 -0
  19. model-00038-of-00099.safetensors +3 -0
  20. model-00039-of-00099.safetensors +3 -0
  21. model-00045-of-00099.safetensors +3 -0
  22. model-00046-of-00099.safetensors +3 -0
  23. model-00047-of-00099.safetensors +3 -0
  24. model-00050-of-00099.safetensors +3 -0
  25. model-00053-of-00099.safetensors +3 -0
  26. model-00055-of-00099.safetensors +3 -0
  27. model-00056-of-00099.safetensors +3 -0
  28. model-00057-of-00099.safetensors +3 -0
  29. model-00058-of-00099.safetensors +3 -0
  30. model-00059-of-00099.safetensors +3 -0
  31. model-00061-of-00099.safetensors +3 -0
  32. model-00063-of-00099.safetensors +3 -0
  33. model-00064-of-00099.safetensors +3 -0
  34. model-00065-of-00099.safetensors +3 -0
  35. model-00067-of-00099.safetensors +3 -0
  36. model-00068-of-00099.safetensors +3 -0
  37. model-00070-of-00099.safetensors +3 -0
  38. model-00074-of-00099.safetensors +3 -0
  39. model-00077-of-00099.safetensors +3 -0
  40. model-00078-of-00099.safetensors +3 -0
  41. model-00079-of-00099.safetensors +3 -0
  42. model-00081-of-00099.safetensors +3 -0
  43. model-00084-of-00099.safetensors +3 -0
  44. model-00088-of-00099.safetensors +3 -0
  45. model-00095-of-00099.safetensors +3 -0
  46. model-00096-of-00099.safetensors +3 -0
  47. model-00098-of-00099.safetensors +3 -0
  48. model.safetensors.index.json +0 -0
  49. tokenizer.json +0 -0
  50. tokenizer_config.json +0 -0
config.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "HYV3ForCausalLM"
4
+ ],
5
+ "enable_attention_fp32_softmax": false,
6
+ "enable_lm_head_fp32": true,
7
+ "enable_moe_fp32_combine": false,
8
+ "expert_hidden_dim": 1536,
9
+ "moe_intermediate_size": 1536,
10
+ "first_k_dense_replace": 1,
11
+ "head_dim": 128,
12
+ "hidden_act": "silu",
13
+ "hidden_size": 4096,
14
+ "initializer_range": 0.006,
15
+ "intermediate_size": 13312,
16
+ "max_position_embeddings": 262144,
17
+ "model_type": "hy_v3",
18
+ "moe_router_enable_expert_bias": true,
19
+ "moe_router_use_sigmoid": true,
20
+ "num_attention_heads": 64,
21
+ "num_experts": 192,
22
+ "num_experts_per_tok": 8,
23
+ "num_hidden_layers": 80,
24
+ "num_key_value_heads": 8,
25
+ "num_shared_experts": 1,
26
+ "output_router_logits": true,
27
+ "qk_norm": true,
28
+ "rms_norm_eps": 1e-05,
29
+ "rope_parameters": {
30
+ "rope_theta": 11158840.0,
31
+ "rope_type": "default"
32
+ },
33
+ "route_norm": true,
34
+ "router_scaling_factor": 2.826,
35
+ "tie_word_embeddings": false,
36
+ "transformers_version": "5.6.0",
37
+ "use_cache": true,
38
+ "use_grouped_mm": false,
39
+ "vocab_size": 120832,
40
+ "num_nextn_predict_layers": 1
41
+ }
generate_config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 120000,
3
+ "do_sample": false,
4
+ "eos_token_id": 120020,
5
+ "max_new_tokens": 2048,
6
+ "transformers_version": "5.6.0"
7
+ }
model-00000-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:649a67670108461567758f6280e089d0eb75a28176532b6cfcfd3a6fee18259b
3
+ size 7247829040
model-00003-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aff398d6dd970b28b277c07eda15e0586f160a8d91aa7d70762c9da75fbe074c
3
+ size 7247829616
model-00010-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:905779aa781a6e1bcf4d0622c2b896ba207a44bc1e34ecf25b6181e512f3919b
3
+ size 1073743720
model-00011-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4abae02bef67e29f1a4280c0ad419628acd93bc39e73786e7f99d75cc7930cf2
3
+ size 1006637160
model-00013-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2aaf5c5333076df4b161c383cb3811d07d35c9ef1479ebf1ccdd0147d0c5cfb3
3
+ size 7247829616
model-00015-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f985037a76b2e3bac969fb091cff97587fb044706c6bd1e2bdd6dde26dfb3de
3
+ size 7247829616
model-00017-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b551b941e58ee6f7e5481b97d106eadc8b7cb09c39e19ee02ed13d5e0c0301b0
3
+ size 7247829616
model-00023-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d29551e053f88145df17fcf53a7c662de8a9b76e953d93a30783e974c558826a
3
+ size 1006637160
model-00024-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:689e9c7759c7d4bdef9db5084c6d24ac59b1dccd848544725b4dd1296f765bf9
3
+ size 7247829040
model-00025-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b93d9ac4182eb16c13f831a23ea411ea1599e7e51ed8f3959d061857598b02f5
3
+ size 7247829616
model-00026-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:148c2ee768afc48db9378f2836257a61ec04e827c73533e97607435987424336
3
+ size 7247829616
model-00028-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c75c788fec6a8c3016c9a84836a7a8b7366e100b9b469ddcc48aac38e91218c
3
+ size 7247829616
model-00032-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:554cf656731d8f1af2254b86666e29707f4ac78fbfd74ee57651972c2186cafa
3
+ size 7247829616
model-00033-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c0bba2ecbbc54f662b7061be6d90dafc164e90a232194e44af9f7e520100648
3
+ size 7247829616
model-00034-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:593fccfe422c1c9398b0dd801b1cd0e97104f3a5811e341453a11e9b6470d3c6
3
+ size 1073742304
model-00035-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f9081dbda6a3af23fbe83df70768586009c067b72077ef246fad50c5c5903e2
3
+ size 998247496
model-00038-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3957f156b9b482ee929caa9c7e5fe5bda2a88172c573341b95c1e5c3caccec1c
3
+ size 7247829616
model-00039-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51a103023248dacbabee740df0303d9b844352994adfd391eba1dbc5bf8dbbbb
3
+ size 7247829616
model-00045-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54d8608cd224db1950873450427df87854178b581e14c183b68492054fb4e04b
3
+ size 7247829616
model-00046-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f91c867d41408907da3a4b3004ce9b2d86315284f9c68dcc6bb12870b72e88e3
3
+ size 1073746944
model-00047-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dac651fa44ddf9751dede24847e89ae6b1fb062105a50726845c4a9384526140
3
+ size 989855880
model-00050-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75aa972e44faf1be28ecfc168e14065a74a42df75b6eff7bce9d5ffc937971f5
3
+ size 7247829616
model-00053-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c8fd98ec16bd29ac34024aa440fa3222f8c9819edb24ff343c36b09f9c331bd
3
+ size 7247829616
model-00055-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:162c709e336f2aa8313091a33a7147ab51be7c90c7f5d09eb4c425acb98aa46e
3
+ size 7247829616
model-00056-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9900d98d3bf9fb23ba73510ebe07c23d08a0c44b91425dd8c892775cac34805
3
+ size 7247829616
model-00057-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52f204978cf4ac771d80f5c481bcb82deddb509f504eb636f67f77a626036bd0
3
+ size 7247829616
model-00058-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1c5ce814ad1d9b7e93729f299fa397482741d5b775d7a9ba783c70f5e6ce6c0
3
+ size 1067580992
model-00059-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54f5f74c7a2c2edeb99d73e5b97cc8c54cd4d77a3410b535dc120da73a6f297f
3
+ size 1006637152
model-00061-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bab6a301b97e4760423275bd3da4a66d9262888afd974a390d7ad0d313a5e4c1
3
+ size 7247829616
model-00063-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86315e6ec9dd0ddf945c5876a71aae7b983e7e9d25e65628be78fd18b3e39ee5
3
+ size 7247829616
model-00064-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48062ee9feb503e7c68ec0f1d8ea6b2f13efe85578437f51cb925225b460856f
3
+ size 7247829616
model-00065-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe85fe3b29195bab1d7da0a34b3025e1bdb534b13165abd7c0c73a4b6f3188ca
3
+ size 7247829616
model-00067-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6824cc3337fef86e7bbf817246c1be032955b5f587ea4bee2455548713459b3
3
+ size 7247829616
model-00068-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73190ae1d37122fb84357de49f2ad491a082009c9dbe710bbfa92af584d6454b
3
+ size 7247829616
model-00070-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2dad38b16ec57ba0a98014531dab76a3d03b3b818f6e44565dcd4afbf1f64960
3
+ size 1056968696
model-00074-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85e558187484c72451c5fba0f0da1be52c25f45bf7858f9dc9137c83cc645ae6
3
+ size 7247829616
model-00077-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4baebab026300e2382e88a79e9aff33fad3b69dfac989280c06de6a31b5950ab
3
+ size 7247829616
model-00078-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26a9441a2e352219691de0941d957976b4971790b7e629152fd3d29926ecd1d0
3
+ size 7247829616
model-00079-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0dba4828f8c22a051b41124afbcf55d9cc90f51839214ad9c364349f7b503914
3
+ size 7247829616
model-00081-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16e7d1512e4d19c69cb64b24a20f9505f4c44d5855f735d308d7254b4bbbcdd2
3
+ size 7247829616
model-00084-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5352299469b87eca33076001b00268d313265cd1673dd6270b5babfb1f7efa1
3
+ size 305501064
model-00088-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f6a84acd4e0b44a46702789cda84efbb7d18f86a295b8fd306a5fba1356802d
3
+ size 7247829616
model-00095-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfc79f113cc099e3e6f79abb32253a659e51c64fa40cd40bf73c3b0a8b833b08
3
+ size 2415943240
model-00096-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8df37ca6f641290a5a117e62a7fcf1a79cbf1975bb8897035f69e77b100bad30
3
+ size 1027472968
model-00098-of-00099.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a74b4293adeb1a2c0c4eb18aa078a9b611f2c1c02caa425fad015ccef8cf0f7
3
+ size 893255032
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
The diff for this file is too large to render. See raw diff