dylanlanigan committed on
Commit
0ce5305
·
verified ·
1 Parent(s): 676f9de

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
mlc-chat-config.json ADDED
@@ -0,0 +1,91 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "qwen3_moe",
4
+ "quantization": "q4f16_1",
5
+ "model_config": {
6
+ "hidden_act": "silu",
7
+ "hidden_size": 2048,
8
+ "intermediate_size": 6144,
9
+ "attention_bias": false,
10
+ "num_attention_heads": 32,
11
+ "num_hidden_layers": 48,
12
+ "num_key_value_heads": 4,
13
+ "rms_norm_eps": 1e-06,
14
+ "rope_theta": 1000000.0,
15
+ "vocab_size": 151936,
16
+ "tie_word_embeddings": false,
17
+ "context_window_size": 40960,
18
+ "prefill_chunk_size": 2048,
19
+ "tensor_parallel_shards": 1,
20
+ "head_dim": 128,
21
+ "dtype": "float32",
22
+ "max_batch_size": 128,
23
+ "weight_block_size": null,
24
+ "moe_intermediate_size": 768,
25
+ "num_experts_per_tok": 8,
26
+ "num_experts": 128,
27
+ "decoder_sparse_step": 1,
28
+ "norm_topk_prob": true
29
+ },
30
+ "vocab_size": 151936,
31
+ "context_window_size": 40960,
32
+ "sliding_window_size": -1,
33
+ "prefill_chunk_size": 2048,
34
+ "attention_sink_size": -1,
35
+ "tensor_parallel_shards": 1,
36
+ "pipeline_parallel_stages": 1,
37
+ "temperature": 0.6,
38
+ "presence_penalty": 0.0,
39
+ "frequency_penalty": 0.0,
40
+ "repetition_penalty": 1.0,
41
+ "top_p": 0.95,
42
+ "tokenizer_files": [
43
+ "tokenizer.json",
44
+ "vocab.json",
45
+ "merges.txt",
46
+ "tokenizer_config.json"
47
+ ],
48
+ "tokenizer_info": {
49
+ "token_postproc_method": "byte_level",
50
+ "prepend_space_in_encode": false,
51
+ "strip_space_in_decode": false
52
+ },
53
+ "conv_template": {
54
+ "name": "qwen2",
55
+ "system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
56
+ "system_message": "You are a helpful assistant.",
57
+ "system_prefix_token_ids": null,
58
+ "add_role_after_system_message": true,
59
+ "roles": {
60
+ "user": "<|im_start|>user",
61
+ "assistant": "<|im_start|>assistant"
62
+ },
63
+ "role_templates": {
64
+ "user": "{user_message}",
65
+ "assistant": "{assistant_message}",
66
+ "tool": "{tool_message}"
67
+ },
68
+ "messages": [],
69
+ "seps": [
70
+ "<|im_end|>\n"
71
+ ],
72
+ "role_content_sep": "\n",
73
+ "role_empty_sep": "\n",
74
+ "stop_str": [
75
+ "<|endoftext|>",
76
+ "<|im_end|>"
77
+ ],
78
+ "stop_token_ids": [
79
+ 151643,
80
+ 151645
81
+ ],
82
+ "function_string": "",
83
+ "use_function_calling": false
84
+ },
85
+ "pad_token_id": 151643,
86
+ "bos_token_id": 151643,
87
+ "eos_token_id": [
88
+ 151645,
89
+ 151643
90
+ ]
91
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37775d56f6e3e7688878d037239fcc701f79baf2ae39f83457e62fdff8268da4
3
+ size 100663296
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b24c3521b26944e2c605d45fd651d6b8c32336f7b6b984467d6da6a06fc9a58d
3
+ size 100663296
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d03a27a64522fc45df855596f901ce760c7c180ed118fb1b53b28c817d939b9
3
+ size 25165824
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5def2a88f2329e8e0781d423f9526b1bfeb630b69e2bb3abe0c57949165f60b7
3
+ size 23355904
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae50a1d0ffb4ebb3a9a64341fa42ee55a5abeff5fdb0d4cc361518356eaead41
3
+ size 201326592
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c84d9133fdf40d000b2c38dd3a58e28c52bb8236b370df5073e778e48d947983
3
+ size 25165824
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a86cb1f74ad9cd4fcd246165d73aa1f94da166fe53ebcda1c5216d707291e53e
3
+ size 100663296
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb53418d726e519e42f29fe9fdeed4bd44c4fa37b68faabbd8bc92d384f56090
3
+ size 23351808
params_shard_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99e5465e3ac437bdde9d7dccd816bb6e4b67313dcb382cf5ff6401b63c0c1864
3
+ size 25165824
params_shard_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e46116574e00a4814c1faccc3eeb4a611962bcb6fb91be9c0f7ade4752cb3c08
3
+ size 100663296
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ccbd2110358d25372fb61b6a1ba0bd440891d8785bf5c18619d57158601020f
3
+ size 23355904
params_shard_110.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2479eb1e4f7e879e48078f8301228423defede3d7fed5a60cbc945ad82bb246c
3
+ size 23360000
params_shard_111.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7893d352c9ff1ea848ba4f32a38b94319b076dda71b658e0fb0d3310889b8a8b
3
+ size 201326592
params_shard_112.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:896f406d63cd686fb3a58cad360ce1cd1cc72945a3419e72cdb21d94e98eb157
3
+ size 25165824
params_shard_113.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b119dc91a60a53ece792209d6191ac904fa5328637f254aa876f796cd9ed819f
3
+ size 100663296
params_shard_114.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b5fee541b0de73bc078c21e9e76a2df3637f2d450af6ae4beed38cda1daa2de
3
+ size 23355904
params_shard_115.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:acdfb45048978efc714b7b0cb2417d806da30619aad14c32a9236e6f2aaf0a94
3
+ size 201326592
params_shard_116.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c7c389ec8cfd2ad010bea2515630986917e61956f4e345b4e6c52d2d2d7ac45
3
+ size 25165824
params_shard_118.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea78dabe914c9a6fbaea0c9695d012136846e316e4e26157e8588178a768fa0e
3
+ size 23351808
params_shard_120.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1e370e63f84aa37291f2c2a3e969dfd7f08092af4c561a5789064bd0c6f2a38
3
+ size 25165824
params_shard_122.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5bdf648d0a139a20959c15db44a51bcfd7726512af31dfe7f83af220b81a1b7f
3
+ size 23360000
params_shard_123.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fe04bfc970b20e28efd64db80df46ca4268de3a233e75cde431d30045fbd26c
3
+ size 201326592
params_shard_124.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76d694ea8dd203f0d7973ce584cb4bf9d7f54cee35c45e2d7e45ad3d23125e62
3
+ size 25165824
params_shard_125.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b5331653229f94ce1b964feeca8ad56cc48d72d17e85c81b7f7aef3eb74b311
3
+ size 100663296
params_shard_126.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e755692662b1135626213cf90747db33ed05663b4c8d294bb3bb2f69ec945423
3
+ size 23355904
params_shard_128.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b71d198747ab17f18b00e90b3093dc8e20346e51b8e774bdf2d4e4a533fb49c
3
+ size 25165824
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfdc6e41b03ce1c3e306df2c256735e63f01d09ffd2b1dce12ab86ff0d615d97
3
+ size 25165824
params_shard_130.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7b700f83313a66cea2dc677c690504c49b59186fd9f1590f70cd6f70a1c9f42
3
+ size 23351808
params_shard_132.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:495d6a50a62ca464550d8765513725eea5b14d2e0e0fd1d62b261574699d2058
3
+ size 25165824
params_shard_134.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c626bffdb6fc427b324ae1fdf218b3b63d1a042b74c2c42eec1ddd592553bb28
3
+ size 23360000
params_shard_136.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ee42f64ae29d0eb5a77a2495d95eb3c463f8996a10c5a7f601e6ef7502ae9c8
3
+ size 25165824
params_shard_138.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d331e215a57caea2196bf80e31371c8984f8f1ccc579462bab40d96fa20e7526
3
+ size 23355904
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc189d1c51c7aa4580dce275bd5dc6cc2f6b71e6a6807073ed790d09c3d2ff07
3
+ size 100663296
params_shard_140.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f9858f95af7185f927c7a26a0f905e9272e366bf2598df148572a2c8f8eeb37
3
+ size 25165824
params_shard_142.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08e672d1271eb319ec3877f1b1e5c593ea4e0d1e8b49e2472be39516edd6c161
3
+ size 23355904
params_shard_143.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a12e03f2cfe8461fb96f5424a5cfc0329bfe17f68d6a67f2e6ced8aed64e9bef
3
+ size 201326592
params_shard_144.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3baf5d4564294f8f693610443709c37bb8158414859a7b13a8b3560bccfea864
3
+ size 25165824
params_shard_145.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fcb32cdc6b3a7e436fbe1c5d090fa5d8fa339a1707867bf58d89692054a5852f
3
+ size 100663296
params_shard_146.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f14b19b7687cee01dcd75f1bcd40ddf6ca4d068055c8d8a025ea271be85f70a7
3
+ size 23355904
params_shard_148.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:752f8fd67a61621e339ae1400de160cf747d392df6b39c220019864fef03d946
3
+ size 25165824
params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ce5d859b00a739e03c0e16cd3169c9dd756e7573462f6e566d2e579a8be4097
3
+ size 23351808
params_shard_150.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c96a925ccefa17769081cb6f13911c64a01a3d4aba91bcd787fd9f29d180c3fc
3
+ size 23355904
params_shard_152.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28d178dd8d70f625d3c5d975ba62edef483645eb20a10972198ae4355de3a7c3
3
+ size 25165824
params_shard_153.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98ba5f6dda5fa1192b05dd5ef2a99423ec4b16833f2e4babc6894179fe47acda
3
+ size 100663296
params_shard_154.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65e77021e7e6a8e1152d567ea29841f3dbd8e133e2cd42ff1e9f6b35a1faf2a2
3
+ size 23355904
params_shard_156.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8f7d07d512d61fb9c0a1706351073445118f643e63af6a7ecb6a00a04ee6740
3
+ size 25165824