splats commited on
Commit
11ea343
·
verified ·
1 Parent(s): b59b3ec

Upload Qwen3.6-27B-oQ4e via oMLX

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: mlx
3
+ tags:
4
+ - mlx
5
+ - oq
6
+ - quantized
7
+ ---
8
+
9
+ # Qwen3.6-27B-oQ4e
10
+
11
+ This model was quantized using [oQ](https://github.com/jundot/omlx) (oMLX v0.3.5) mixed-precision quantization.
12
+
13
+ ## Quantization details
14
+
15
+ - **Model type**: qwen3_5
16
+ - **Bits**: 4
17
+ - **Group size**: 64
18
+ - **Format**: MLX safetensors
chat_template.jinja ADDED
@@ -0,0 +1,154 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {%- set image_count = namespace(value=0) %}
2
+ {%- set video_count = namespace(value=0) %}
3
+ {%- macro render_content(content, do_vision_count, is_system_content=false) %}
4
+ {%- if content is string %}
5
+ {{- content }}
6
+ {%- elif content is iterable and content is not mapping %}
7
+ {%- for item in content %}
8
+ {%- if 'image' in item or 'image_url' in item or item.type == 'image' %}
9
+ {%- if is_system_content %}
10
+ {{- raise_exception('System message cannot contain images.') }}
11
+ {%- endif %}
12
+ {%- if do_vision_count %}
13
+ {%- set image_count.value = image_count.value + 1 %}
14
+ {%- endif %}
15
+ {%- if add_vision_id %}
16
+ {{- 'Picture ' ~ image_count.value ~ ': ' }}
17
+ {%- endif %}
18
+ {{- '<|vision_start|><|image_pad|><|vision_end|>' }}
19
+ {%- elif 'video' in item or item.type == 'video' %}
20
+ {%- if is_system_content %}
21
+ {{- raise_exception('System message cannot contain videos.') }}
22
+ {%- endif %}
23
+ {%- if do_vision_count %}
24
+ {%- set video_count.value = video_count.value + 1 %}
25
+ {%- endif %}
26
+ {%- if add_vision_id %}
27
+ {{- 'Video ' ~ video_count.value ~ ': ' }}
28
+ {%- endif %}
29
+ {{- '<|vision_start|><|video_pad|><|vision_end|>' }}
30
+ {%- elif 'text' in item %}
31
+ {{- item.text }}
32
+ {%- else %}
33
+ {{- raise_exception('Unexpected item type in content.') }}
34
+ {%- endif %}
35
+ {%- endfor %}
36
+ {%- elif content is none or content is undefined %}
37
+ {{- '' }}
38
+ {%- else %}
39
+ {{- raise_exception('Unexpected content type.') }}
40
+ {%- endif %}
41
+ {%- endmacro %}
42
+ {%- if not messages %}
43
+ {{- raise_exception('No messages provided.') }}
44
+ {%- endif %}
45
+ {%- if tools and tools is iterable and tools is not mapping %}
46
+ {{- '<|im_start|>system\n' }}
47
+ {{- "# Tools\n\nYou have access to the following functions:\n\n<tools>" }}
48
+ {%- for tool in tools %}
49
+ {{- "\n" }}
50
+ {{- tool | tojson }}
51
+ {%- endfor %}
52
+ {{- "\n</tools>" }}
53
+ {{- '\n\nIf you choose to call a function ONLY reply in the following format with NO suffix:\n\n<tool_call>\n<function=example_function_name>\n<parameter=example_parameter_1>\nvalue_1\n</parameter>\n<parameter=example_parameter_2>\nThis is the value for the second parameter\nthat can span\nmultiple lines\n</parameter>\n</function>\n</tool_call>\n\n<IMPORTANT>\nReminder:\n- Function calls MUST follow the specified format: an inner <function=...></function> block must be nested within <tool_call></tool_call> XML tags\n- Required parameters MUST be specified\n- You may provide optional reasoning for your function call in natural language BEFORE the function call, but NOT after\n- If there is no function call available, answer the question like normal with your current knowledge and do not tell the user about function calls\n</IMPORTANT>' }}
54
+ {%- if messages[0].role == 'system' %}
55
+ {%- set content = render_content(messages[0].content, false, true)|trim %}
56
+ {%- if content %}
57
+ {{- '\n\n' + content }}
58
+ {%- endif %}
59
+ {%- endif %}
60
+ {{- '<|im_end|>\n' }}
61
+ {%- else %}
62
+ {%- if messages[0].role == 'system' %}
63
+ {%- set content = render_content(messages[0].content, false, true)|trim %}
64
+ {{- '<|im_start|>system\n' + content + '<|im_end|>\n' }}
65
+ {%- endif %}
66
+ {%- endif %}
67
+ {%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %}
68
+ {%- for message in messages[::-1] %}
69
+ {%- set index = (messages|length - 1) - loop.index0 %}
70
+ {%- if ns.multi_step_tool and message.role == "user" %}
71
+ {%- set content = render_content(message.content, false)|trim %}
72
+ {%- if not(content.startswith('<tool_response>') and content.endswith('</tool_response>')) %}
73
+ {%- set ns.multi_step_tool = false %}
74
+ {%- set ns.last_query_index = index %}
75
+ {%- endif %}
76
+ {%- endif %}
77
+ {%- endfor %}
78
+ {%- if ns.multi_step_tool %}
79
+ {{- raise_exception('No user query found in messages.') }}
80
+ {%- endif %}
81
+ {%- for message in messages %}
82
+ {%- set content = render_content(message.content, true)|trim %}
83
+ {%- if message.role == "system" %}
84
+ {%- if not loop.first %}
85
+ {{- raise_exception('System message must be at the beginning.') }}
86
+ {%- endif %}
87
+ {%- elif message.role == "user" %}
88
+ {{- '<|im_start|>' + message.role + '\n' + content + '<|im_end|>' + '\n' }}
89
+ {%- elif message.role == "assistant" %}
90
+ {%- set reasoning_content = '' %}
91
+ {%- if message.reasoning_content is string %}
92
+ {%- set reasoning_content = message.reasoning_content %}
93
+ {%- else %}
94
+ {%- if '</think>' in content %}
95
+ {%- set reasoning_content = content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %}
96
+ {%- set content = content.split('</think>')[-1].lstrip('\n') %}
97
+ {%- endif %}
98
+ {%- endif %}
99
+ {%- set reasoning_content = reasoning_content|trim %}
100
+ {%- if (preserve_thinking is defined and preserve_thinking is true) or (loop.index0 > ns.last_query_index) %}
101
+ {{- '<|im_start|>' + message.role + '\n<think>\n' + reasoning_content + '\n</think>\n\n' + content }}
102
+ {%- else %}
103
+ {{- '<|im_start|>' + message.role + '\n' + content }}
104
+ {%- endif %}
105
+ {%- if message.tool_calls and message.tool_calls is iterable and message.tool_calls is not mapping %}
106
+ {%- for tool_call in message.tool_calls %}
107
+ {%- if tool_call.function is defined %}
108
+ {%- set tool_call = tool_call.function %}
109
+ {%- endif %}
110
+ {%- if loop.first %}
111
+ {%- if content|trim %}
112
+ {{- '\n\n<tool_call>\n<function=' + tool_call.name + '>\n' }}
113
+ {%- else %}
114
+ {{- '<tool_call>\n<function=' + tool_call.name + '>\n' }}
115
+ {%- endif %}
116
+ {%- else %}
117
+ {{- '\n<tool_call>\n<function=' + tool_call.name + '>\n' }}
118
+ {%- endif %}
119
+ {%- if tool_call.arguments is defined %}
120
+ {%- for args_name, args_value in tool_call.arguments|items %}
121
+ {{- '<parameter=' + args_name + '>\n' }}
122
+ {%- set args_value = args_value | string if args_value is string else args_value | tojson | safe %}
123
+ {{- args_value }}
124
+ {{- '\n</parameter>\n' }}
125
+ {%- endfor %}
126
+ {%- endif %}
127
+ {{- '</function>\n</tool_call>' }}
128
+ {%- endfor %}
129
+ {%- endif %}
130
+ {{- '<|im_end|>\n' }}
131
+ {%- elif message.role == "tool" %}
132
+ {%- if loop.previtem and loop.previtem.role != "tool" %}
133
+ {{- '<|im_start|>user' }}
134
+ {%- endif %}
135
+ {{- '\n<tool_response>\n' }}
136
+ {{- content }}
137
+ {{- '\n</tool_response>' }}
138
+ {%- if not loop.last and loop.nextitem.role != "tool" %}
139
+ {{- '<|im_end|>\n' }}
140
+ {%- elif loop.last %}
141
+ {{- '<|im_end|>\n' }}
142
+ {%- endif %}
143
+ {%- else %}
144
+ {{- raise_exception('Unexpected message role.') }}
145
+ {%- endif %}
146
+ {%- endfor %}
147
+ {%- if add_generation_prompt %}
148
+ {{- '<|im_start|>assistant\n' }}
149
+ {%- if enable_thinking is defined and enable_thinking is false %}
150
+ {{- '<think>\n\n</think>\n\n' }}
151
+ {%- else %}
152
+ {{- '<think>\n' }}
153
+ {%- endif %}
154
+ {%- endif %}
config.json ADDED
@@ -0,0 +1,614 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Qwen3_5ForConditionalGeneration"
4
+ ],
5
+ "image_token_id": 248056,
6
+ "language_model_only": false,
7
+ "model_type": "qwen3_5",
8
+ "text_config": {
9
+ "attention_bias": false,
10
+ "attention_dropout": 0.0,
11
+ "attn_output_gate": true,
12
+ "bos_token_id": 248044,
13
+ "dtype": "bfloat16",
14
+ "eos_token_id": 248044,
15
+ "full_attention_interval": 4,
16
+ "head_dim": 256,
17
+ "hidden_act": "silu",
18
+ "hidden_size": 5120,
19
+ "initializer_range": 0.02,
20
+ "intermediate_size": 17408,
21
+ "layer_types": [
22
+ "linear_attention",
23
+ "linear_attention",
24
+ "linear_attention",
25
+ "full_attention",
26
+ "linear_attention",
27
+ "linear_attention",
28
+ "linear_attention",
29
+ "full_attention",
30
+ "linear_attention",
31
+ "linear_attention",
32
+ "linear_attention",
33
+ "full_attention",
34
+ "linear_attention",
35
+ "linear_attention",
36
+ "linear_attention",
37
+ "full_attention",
38
+ "linear_attention",
39
+ "linear_attention",
40
+ "linear_attention",
41
+ "full_attention",
42
+ "linear_attention",
43
+ "linear_attention",
44
+ "linear_attention",
45
+ "full_attention",
46
+ "linear_attention",
47
+ "linear_attention",
48
+ "linear_attention",
49
+ "full_attention",
50
+ "linear_attention",
51
+ "linear_attention",
52
+ "linear_attention",
53
+ "full_attention",
54
+ "linear_attention",
55
+ "linear_attention",
56
+ "linear_attention",
57
+ "full_attention",
58
+ "linear_attention",
59
+ "linear_attention",
60
+ "linear_attention",
61
+ "full_attention",
62
+ "linear_attention",
63
+ "linear_attention",
64
+ "linear_attention",
65
+ "full_attention",
66
+ "linear_attention",
67
+ "linear_attention",
68
+ "linear_attention",
69
+ "full_attention",
70
+ "linear_attention",
71
+ "linear_attention",
72
+ "linear_attention",
73
+ "full_attention",
74
+ "linear_attention",
75
+ "linear_attention",
76
+ "linear_attention",
77
+ "full_attention",
78
+ "linear_attention",
79
+ "linear_attention",
80
+ "linear_attention",
81
+ "full_attention",
82
+ "linear_attention",
83
+ "linear_attention",
84
+ "linear_attention",
85
+ "full_attention"
86
+ ],
87
+ "linear_conv_kernel_dim": 4,
88
+ "linear_key_head_dim": 128,
89
+ "linear_num_key_heads": 16,
90
+ "linear_num_value_heads": 48,
91
+ "linear_value_head_dim": 128,
92
+ "mamba_ssm_dtype": "float32",
93
+ "max_position_embeddings": 262144,
94
+ "model_type": "qwen3_5_text",
95
+ "mtp_num_hidden_layers": 1,
96
+ "mtp_use_dedicated_embeddings": false,
97
+ "num_attention_heads": 24,
98
+ "num_hidden_layers": 64,
99
+ "num_key_value_heads": 4,
100
+ "output_gate_type": "swish",
101
+ "pad_token_id": null,
102
+ "partial_rotary_factor": 0.25,
103
+ "rms_norm_eps": 1e-06,
104
+ "rope_parameters": {
105
+ "mrope_interleaved": true,
106
+ "mrope_section": [
107
+ 11,
108
+ 11,
109
+ 10
110
+ ],
111
+ "partial_rotary_factor": 0.25,
112
+ "rope_theta": 10000000,
113
+ "type": "default"
114
+ },
115
+ "tie_word_embeddings": false,
116
+ "use_cache": true,
117
+ "vocab_size": 248320
118
+ },
119
+ "tie_word_embeddings": false,
120
+ "transformers_version": "4.57.1",
121
+ "video_token_id": 248057,
122
+ "vision_config": {
123
+ "deepstack_visual_indexes": [],
124
+ "depth": 27,
125
+ "hidden_act": "gelu_pytorch_tanh",
126
+ "hidden_size": 1152,
127
+ "in_channels": 3,
128
+ "initializer_range": 0.02,
129
+ "intermediate_size": 4304,
130
+ "model_type": "qwen3_5",
131
+ "num_heads": 16,
132
+ "num_position_embeddings": 2304,
133
+ "out_hidden_size": 5120,
134
+ "patch_size": 16,
135
+ "spatial_merge_size": 2,
136
+ "temporal_patch_size": 2
137
+ },
138
+ "vision_end_token_id": 248054,
139
+ "vision_start_token_id": 248053,
140
+ "eos_token_id": [
141
+ 248046,
142
+ 248044
143
+ ],
144
+ "quantization": {
145
+ "group_size": 64,
146
+ "bits": 4,
147
+ "mode": "affine",
148
+ "language_model.model.layers.1.mlp.down_proj": {
149
+ "bits": 6,
150
+ "group_size": 64,
151
+ "mode": "affine"
152
+ },
153
+ "language_model.model.layers.0.mlp.down_proj": {
154
+ "bits": 6,
155
+ "group_size": 64,
156
+ "mode": "affine"
157
+ },
158
+ "language_model.model.layers.17.mlp.down_proj": {
159
+ "bits": 6,
160
+ "group_size": 64,
161
+ "mode": "affine"
162
+ },
163
+ "language_model.model.layers.16.mlp.down_proj": {
164
+ "bits": 6,
165
+ "group_size": 64,
166
+ "mode": "affine"
167
+ },
168
+ "language_model.model.layers.15.mlp.down_proj": {
169
+ "bits": 6,
170
+ "group_size": 64,
171
+ "mode": "affine"
172
+ },
173
+ "language_model.model.layers.11.mlp.down_proj": {
174
+ "bits": 6,
175
+ "group_size": 64,
176
+ "mode": "affine"
177
+ },
178
+ "language_model.model.layers.13.mlp.down_proj": {
179
+ "bits": 6,
180
+ "group_size": 64,
181
+ "mode": "affine"
182
+ },
183
+ "language_model.model.layers.12.mlp.down_proj": {
184
+ "bits": 6,
185
+ "group_size": 64,
186
+ "mode": "affine"
187
+ },
188
+ "language_model.model.layers.14.mlp.down_proj": {
189
+ "bits": 6,
190
+ "group_size": 64,
191
+ "mode": "affine"
192
+ },
193
+ "language_model.model.layers.10.mlp.down_proj": {
194
+ "bits": 6,
195
+ "group_size": 64,
196
+ "mode": "affine"
197
+ },
198
+ "language_model.model.layers.22.mlp.down_proj": {
199
+ "bits": 6,
200
+ "group_size": 64,
201
+ "mode": "affine"
202
+ },
203
+ "language_model.model.layers.21.mlp.down_proj": {
204
+ "bits": 6,
205
+ "group_size": 64,
206
+ "mode": "affine"
207
+ },
208
+ "language_model.model.layers.23.mlp.down_proj": {
209
+ "bits": 6,
210
+ "group_size": 64,
211
+ "mode": "affine"
212
+ },
213
+ "language_model.model.layers.20.mlp.down_proj": {
214
+ "bits": 6,
215
+ "group_size": 64,
216
+ "mode": "affine"
217
+ },
218
+ "language_model.model.layers.2.mlp.down_proj": {
219
+ "bits": 6,
220
+ "group_size": 64,
221
+ "mode": "affine"
222
+ },
223
+ "language_model.model.layers.18.mlp.down_proj": {
224
+ "bits": 6,
225
+ "group_size": 64,
226
+ "mode": "affine"
227
+ },
228
+ "language_model.model.layers.19.mlp.down_proj": {
229
+ "bits": 6,
230
+ "group_size": 64,
231
+ "mode": "affine"
232
+ },
233
+ "language_model.model.layers.3.mlp.down_proj": {
234
+ "bits": 6,
235
+ "group_size": 64,
236
+ "mode": "affine"
237
+ },
238
+ "language_model.model.layers.29.mlp.down_proj": {
239
+ "bits": 6,
240
+ "group_size": 64,
241
+ "mode": "affine"
242
+ },
243
+ "language_model.model.layers.28.mlp.down_proj": {
244
+ "bits": 6,
245
+ "group_size": 64,
246
+ "mode": "affine"
247
+ },
248
+ "language_model.model.layers.26.mlp.down_proj": {
249
+ "bits": 6,
250
+ "group_size": 64,
251
+ "mode": "affine"
252
+ },
253
+ "language_model.model.layers.7.self_attn.v_proj": {
254
+ "bits": 6,
255
+ "group_size": 64,
256
+ "mode": "affine"
257
+ },
258
+ "language_model.model.layers.7.self_attn.k_proj": {
259
+ "bits": 5,
260
+ "group_size": 64,
261
+ "mode": "affine"
262
+ },
263
+ "language_model.model.layers.31.self_attn.v_proj": {
264
+ "bits": 6,
265
+ "group_size": 64,
266
+ "mode": "affine"
267
+ },
268
+ "language_model.model.layers.31.self_attn.q_proj": {
269
+ "bits": 5,
270
+ "group_size": 64,
271
+ "mode": "affine"
272
+ },
273
+ "language_model.model.layers.3.self_attn.k_proj": {
274
+ "bits": 5,
275
+ "group_size": 64,
276
+ "mode": "affine"
277
+ },
278
+ "language_model.model.layers.27.self_attn.v_proj": {
279
+ "bits": 6,
280
+ "group_size": 64,
281
+ "mode": "affine"
282
+ },
283
+ "language_model.model.layers.27.self_attn.k_proj": {
284
+ "bits": 5,
285
+ "group_size": 64,
286
+ "mode": "affine"
287
+ },
288
+ "language_model.model.layers.23.self_attn.v_proj": {
289
+ "bits": 6,
290
+ "group_size": 64,
291
+ "mode": "affine"
292
+ },
293
+ "language_model.model.layers.3.self_attn.v_proj": {
294
+ "bits": 6,
295
+ "group_size": 64,
296
+ "mode": "affine"
297
+ },
298
+ "language_model.model.layers.19.self_attn.k_proj": {
299
+ "bits": 5,
300
+ "group_size": 64,
301
+ "mode": "affine"
302
+ },
303
+ "language_model.model.layers.15.self_attn.k_proj": {
304
+ "bits": 5,
305
+ "group_size": 64,
306
+ "mode": "affine"
307
+ },
308
+ "language_model.model.layers.26.linear_attn.in_proj_a": {
309
+ "bits": 5,
310
+ "group_size": 64,
311
+ "mode": "affine"
312
+ },
313
+ "language_model.model.layers.5.linear_attn.in_proj_a": {
314
+ "bits": 5,
315
+ "group_size": 64,
316
+ "mode": "affine"
317
+ },
318
+ "language_model.model.layers.9.linear_attn.in_proj_a": {
319
+ "bits": 5,
320
+ "group_size": 64,
321
+ "mode": "affine"
322
+ },
323
+ "language_model.model.layers.8.linear_attn.in_proj_a": {
324
+ "bits": 5,
325
+ "group_size": 64,
326
+ "mode": "affine"
327
+ },
328
+ "language_model.model.layers.30.linear_attn.in_proj_a": {
329
+ "bits": 5,
330
+ "group_size": 64,
331
+ "mode": "affine"
332
+ },
333
+ "language_model.model.layers.6.linear_attn.in_proj_b": {
334
+ "bits": 5,
335
+ "group_size": 64,
336
+ "mode": "affine"
337
+ },
338
+ "language_model.model.layers.6.linear_attn.in_proj_a": {
339
+ "bits": 5,
340
+ "group_size": 64,
341
+ "mode": "affine"
342
+ },
343
+ "language_model.model.layers.26.linear_attn.in_proj_b": {
344
+ "bits": 5,
345
+ "group_size": 64,
346
+ "mode": "affine"
347
+ },
348
+ "language_model.model.layers.5.linear_attn.in_proj_b": {
349
+ "bits": 5,
350
+ "group_size": 64,
351
+ "mode": "affine"
352
+ },
353
+ "language_model.model.layers.22.linear_attn.in_proj_a": {
354
+ "bits": 5,
355
+ "group_size": 64,
356
+ "mode": "affine"
357
+ },
358
+ "language_model.model.layers.30.linear_attn.in_proj_b": {
359
+ "bits": 5,
360
+ "group_size": 64,
361
+ "mode": "affine"
362
+ },
363
+ "language_model.model.layers.29.linear_attn.in_proj_b": {
364
+ "bits": 5,
365
+ "group_size": 64,
366
+ "mode": "affine"
367
+ },
368
+ "language_model.model.layers.28.linear_attn.in_proj_b": {
369
+ "bits": 5,
370
+ "group_size": 64,
371
+ "mode": "affine"
372
+ },
373
+ "language_model.model.layers.8.linear_attn.in_proj_b": {
374
+ "bits": 5,
375
+ "group_size": 64,
376
+ "mode": "affine"
377
+ }
378
+ },
379
+ "quantization_config": {
380
+ "group_size": 64,
381
+ "bits": 4,
382
+ "mode": "affine",
383
+ "language_model.model.layers.1.mlp.down_proj": {
384
+ "bits": 6,
385
+ "group_size": 64,
386
+ "mode": "affine"
387
+ },
388
+ "language_model.model.layers.0.mlp.down_proj": {
389
+ "bits": 6,
390
+ "group_size": 64,
391
+ "mode": "affine"
392
+ },
393
+ "language_model.model.layers.17.mlp.down_proj": {
394
+ "bits": 6,
395
+ "group_size": 64,
396
+ "mode": "affine"
397
+ },
398
+ "language_model.model.layers.16.mlp.down_proj": {
399
+ "bits": 6,
400
+ "group_size": 64,
401
+ "mode": "affine"
402
+ },
403
+ "language_model.model.layers.15.mlp.down_proj": {
404
+ "bits": 6,
405
+ "group_size": 64,
406
+ "mode": "affine"
407
+ },
408
+ "language_model.model.layers.11.mlp.down_proj": {
409
+ "bits": 6,
410
+ "group_size": 64,
411
+ "mode": "affine"
412
+ },
413
+ "language_model.model.layers.13.mlp.down_proj": {
414
+ "bits": 6,
415
+ "group_size": 64,
416
+ "mode": "affine"
417
+ },
418
+ "language_model.model.layers.12.mlp.down_proj": {
419
+ "bits": 6,
420
+ "group_size": 64,
421
+ "mode": "affine"
422
+ },
423
+ "language_model.model.layers.14.mlp.down_proj": {
424
+ "bits": 6,
425
+ "group_size": 64,
426
+ "mode": "affine"
427
+ },
428
+ "language_model.model.layers.10.mlp.down_proj": {
429
+ "bits": 6,
430
+ "group_size": 64,
431
+ "mode": "affine"
432
+ },
433
+ "language_model.model.layers.22.mlp.down_proj": {
434
+ "bits": 6,
435
+ "group_size": 64,
436
+ "mode": "affine"
437
+ },
438
+ "language_model.model.layers.21.mlp.down_proj": {
439
+ "bits": 6,
440
+ "group_size": 64,
441
+ "mode": "affine"
442
+ },
443
+ "language_model.model.layers.23.mlp.down_proj": {
444
+ "bits": 6,
445
+ "group_size": 64,
446
+ "mode": "affine"
447
+ },
448
+ "language_model.model.layers.20.mlp.down_proj": {
449
+ "bits": 6,
450
+ "group_size": 64,
451
+ "mode": "affine"
452
+ },
453
+ "language_model.model.layers.2.mlp.down_proj": {
454
+ "bits": 6,
455
+ "group_size": 64,
456
+ "mode": "affine"
457
+ },
458
+ "language_model.model.layers.18.mlp.down_proj": {
459
+ "bits": 6,
460
+ "group_size": 64,
461
+ "mode": "affine"
462
+ },
463
+ "language_model.model.layers.19.mlp.down_proj": {
464
+ "bits": 6,
465
+ "group_size": 64,
466
+ "mode": "affine"
467
+ },
468
+ "language_model.model.layers.3.mlp.down_proj": {
469
+ "bits": 6,
470
+ "group_size": 64,
471
+ "mode": "affine"
472
+ },
473
+ "language_model.model.layers.29.mlp.down_proj": {
474
+ "bits": 6,
475
+ "group_size": 64,
476
+ "mode": "affine"
477
+ },
478
+ "language_model.model.layers.28.mlp.down_proj": {
479
+ "bits": 6,
480
+ "group_size": 64,
481
+ "mode": "affine"
482
+ },
483
+ "language_model.model.layers.26.mlp.down_proj": {
484
+ "bits": 6,
485
+ "group_size": 64,
486
+ "mode": "affine"
487
+ },
488
+ "language_model.model.layers.7.self_attn.v_proj": {
489
+ "bits": 6,
490
+ "group_size": 64,
491
+ "mode": "affine"
492
+ },
493
+ "language_model.model.layers.7.self_attn.k_proj": {
494
+ "bits": 5,
495
+ "group_size": 64,
496
+ "mode": "affine"
497
+ },
498
+ "language_model.model.layers.31.self_attn.v_proj": {
499
+ "bits": 6,
500
+ "group_size": 64,
501
+ "mode": "affine"
502
+ },
503
+ "language_model.model.layers.31.self_attn.q_proj": {
504
+ "bits": 5,
505
+ "group_size": 64,
506
+ "mode": "affine"
507
+ },
508
+ "language_model.model.layers.3.self_attn.k_proj": {
509
+ "bits": 5,
510
+ "group_size": 64,
511
+ "mode": "affine"
512
+ },
513
+ "language_model.model.layers.27.self_attn.v_proj": {
514
+ "bits": 6,
515
+ "group_size": 64,
516
+ "mode": "affine"
517
+ },
518
+ "language_model.model.layers.27.self_attn.k_proj": {
519
+ "bits": 5,
520
+ "group_size": 64,
521
+ "mode": "affine"
522
+ },
523
+ "language_model.model.layers.23.self_attn.v_proj": {
524
+ "bits": 6,
525
+ "group_size": 64,
526
+ "mode": "affine"
527
+ },
528
+ "language_model.model.layers.3.self_attn.v_proj": {
529
+ "bits": 6,
530
+ "group_size": 64,
531
+ "mode": "affine"
532
+ },
533
+ "language_model.model.layers.19.self_attn.k_proj": {
534
+ "bits": 5,
535
+ "group_size": 64,
536
+ "mode": "affine"
537
+ },
538
+ "language_model.model.layers.15.self_attn.k_proj": {
539
+ "bits": 5,
540
+ "group_size": 64,
541
+ "mode": "affine"
542
+ },
543
+ "language_model.model.layers.26.linear_attn.in_proj_a": {
544
+ "bits": 5,
545
+ "group_size": 64,
546
+ "mode": "affine"
547
+ },
548
+ "language_model.model.layers.5.linear_attn.in_proj_a": {
549
+ "bits": 5,
550
+ "group_size": 64,
551
+ "mode": "affine"
552
+ },
553
+ "language_model.model.layers.9.linear_attn.in_proj_a": {
554
+ "bits": 5,
555
+ "group_size": 64,
556
+ "mode": "affine"
557
+ },
558
+ "language_model.model.layers.8.linear_attn.in_proj_a": {
559
+ "bits": 5,
560
+ "group_size": 64,
561
+ "mode": "affine"
562
+ },
563
+ "language_model.model.layers.30.linear_attn.in_proj_a": {
564
+ "bits": 5,
565
+ "group_size": 64,
566
+ "mode": "affine"
567
+ },
568
+ "language_model.model.layers.6.linear_attn.in_proj_b": {
569
+ "bits": 5,
570
+ "group_size": 64,
571
+ "mode": "affine"
572
+ },
573
+ "language_model.model.layers.6.linear_attn.in_proj_a": {
574
+ "bits": 5,
575
+ "group_size": 64,
576
+ "mode": "affine"
577
+ },
578
+ "language_model.model.layers.26.linear_attn.in_proj_b": {
579
+ "bits": 5,
580
+ "group_size": 64,
581
+ "mode": "affine"
582
+ },
583
+ "language_model.model.layers.5.linear_attn.in_proj_b": {
584
+ "bits": 5,
585
+ "group_size": 64,
586
+ "mode": "affine"
587
+ },
588
+ "language_model.model.layers.22.linear_attn.in_proj_a": {
589
+ "bits": 5,
590
+ "group_size": 64,
591
+ "mode": "affine"
592
+ },
593
+ "language_model.model.layers.30.linear_attn.in_proj_b": {
594
+ "bits": 5,
595
+ "group_size": 64,
596
+ "mode": "affine"
597
+ },
598
+ "language_model.model.layers.29.linear_attn.in_proj_b": {
599
+ "bits": 5,
600
+ "group_size": 64,
601
+ "mode": "affine"
602
+ },
603
+ "language_model.model.layers.28.linear_attn.in_proj_b": {
604
+ "bits": 5,
605
+ "group_size": 64,
606
+ "mode": "affine"
607
+ },
608
+ "language_model.model.layers.8.linear_attn.in_proj_b": {
609
+ "bits": 5,
610
+ "group_size": 64,
611
+ "mode": "affine"
612
+ }
613
+ }
614
+ }
generation_config.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 248044,
3
+ "do_sample": true,
4
+ "eos_token_id": [
5
+ 248046,
6
+ 248044
7
+ ],
8
+ "pad_token_id": 248044,
9
+ "temperature": 1.0,
10
+ "top_k": 20,
11
+ "top_p": 0.95
12
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model-00001-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dab0d54c0442b530462a6dc5528ce383e71f240561917fa7fb9543750b1af71e
3
+ size 5043516561
model-00002-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ef565426223e9cd8716284ae8aee1464c51a2b73c4b75f84418460f88678fd8
3
+ size 5046794376
model-00003-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f5ce7eae50fe53cb692639f4264e70d587af87030c99718bb276dddc45aba9b
3
+ size 5019451056
model-00004-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d72db1601bd7451fe960fbfd1f06d07770ce12a043fed1a179c1d455c0facc69
3
+ size 1430829616
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
preprocessor_config.json ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "size": {
3
+ "longest_edge": 16777216,
4
+ "shortest_edge": 65536
5
+ },
6
+ "patch_size": 16,
7
+ "temporal_patch_size": 2,
8
+ "merge_size": 2,
9
+ "image_mean": [
10
+ 0.5,
11
+ 0.5,
12
+ 0.5
13
+ ],
14
+ "image_std": [
15
+ 0.5,
16
+ 0.5,
17
+ 0.5
18
+ ],
19
+ "processor_class": "Qwen3VLProcessor",
20
+ "image_processor_type": "Qwen2VLImageProcessorFast"
21
+ }
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f9e4d4901a92b997e463c1f46055088b6cca5ca61a6522d1b9f64c4bb81cb42
3
+ size 12807982
tokenizer_config.json ADDED
@@ -0,0 +1,305 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "248044": {
5
+ "content": "<|endoftext|>",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "248045": {
13
+ "content": "<|im_start|>",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "248046": {
21
+ "content": "<|im_end|>",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ },
28
+ "248047": {
29
+ "content": "<|object_ref_start|>",
30
+ "lstrip": false,
31
+ "normalized": false,
32
+ "rstrip": false,
33
+ "single_word": false,
34
+ "special": true
35
+ },
36
+ "248048": {
37
+ "content": "<|object_ref_end|>",
38
+ "lstrip": false,
39
+ "normalized": false,
40
+ "rstrip": false,
41
+ "single_word": false,
42
+ "special": true
43
+ },
44
+ "248049": {
45
+ "content": "<|box_start|>",
46
+ "lstrip": false,
47
+ "normalized": false,
48
+ "rstrip": false,
49
+ "single_word": false,
50
+ "special": true
51
+ },
52
+ "248050": {
53
+ "content": "<|box_end|>",
54
+ "lstrip": false,
55
+ "normalized": false,
56
+ "rstrip": false,
57
+ "single_word": false,
58
+ "special": true
59
+ },
60
+ "248051": {
61
+ "content": "<|quad_start|>",
62
+ "lstrip": false,
63
+ "normalized": false,
64
+ "rstrip": false,
65
+ "single_word": false,
66
+ "special": true
67
+ },
68
+ "248052": {
69
+ "content": "<|quad_end|>",
70
+ "lstrip": false,
71
+ "normalized": false,
72
+ "rstrip": false,
73
+ "single_word": false,
74
+ "special": true
75
+ },
76
+ "248053": {
77
+ "content": "<|vision_start|>",
78
+ "lstrip": false,
79
+ "normalized": false,
80
+ "rstrip": false,
81
+ "single_word": false,
82
+ "special": true
83
+ },
84
+ "248054": {
85
+ "content": "<|vision_end|>",
86
+ "lstrip": false,
87
+ "normalized": false,
88
+ "rstrip": false,
89
+ "single_word": false,
90
+ "special": true
91
+ },
92
+ "248055": {
93
+ "content": "<|vision_pad|>",
94
+ "lstrip": false,
95
+ "normalized": false,
96
+ "rstrip": false,
97
+ "single_word": false,
98
+ "special": true
99
+ },
100
+ "248056": {
101
+ "content": "<|image_pad|>",
102
+ "lstrip": false,
103
+ "normalized": false,
104
+ "rstrip": false,
105
+ "single_word": false,
106
+ "special": true
107
+ },
108
+ "248057": {
109
+ "content": "<|video_pad|>",
110
+ "lstrip": false,
111
+ "normalized": false,
112
+ "rstrip": false,
113
+ "single_word": false,
114
+ "special": true
115
+ },
116
+ "248058": {
117
+ "content": "<tool_call>",
118
+ "lstrip": false,
119
+ "normalized": false,
120
+ "rstrip": false,
121
+ "single_word": false,
122
+ "special": false
123
+ },
124
+ "248059": {
125
+ "content": "</tool_call>",
126
+ "lstrip": false,
127
+ "normalized": false,
128
+ "rstrip": false,
129
+ "single_word": false,
130
+ "special": false
131
+ },
132
+ "248060": {
133
+ "content": "<|fim_prefix|>",
134
+ "lstrip": false,
135
+ "normalized": false,
136
+ "rstrip": false,
137
+ "single_word": false,
138
+ "special": false
139
+ },
140
+ "248061": {
141
+ "content": "<|fim_middle|>",
142
+ "lstrip": false,
143
+ "normalized": false,
144
+ "rstrip": false,
145
+ "single_word": false,
146
+ "special": false
147
+ },
148
+ "248062": {
149
+ "content": "<|fim_suffix|>",
150
+ "lstrip": false,
151
+ "normalized": false,
152
+ "rstrip": false,
153
+ "single_word": false,
154
+ "special": false
155
+ },
156
+ "248063": {
157
+ "content": "<|fim_pad|>",
158
+ "lstrip": false,
159
+ "normalized": false,
160
+ "rstrip": false,
161
+ "single_word": false,
162
+ "special": false
163
+ },
164
+ "248064": {
165
+ "content": "<|repo_name|>",
166
+ "lstrip": false,
167
+ "normalized": false,
168
+ "rstrip": false,
169
+ "single_word": false,
170
+ "special": false
171
+ },
172
+ "248065": {
173
+ "content": "<|file_sep|>",
174
+ "lstrip": false,
175
+ "normalized": false,
176
+ "rstrip": false,
177
+ "single_word": false,
178
+ "special": false
179
+ },
180
+ "248066": {
181
+ "content": "<tool_response>",
182
+ "lstrip": false,
183
+ "normalized": false,
184
+ "rstrip": false,
185
+ "single_word": false,
186
+ "special": false
187
+ },
188
+ "248067": {
189
+ "content": "</tool_response>",
190
+ "lstrip": false,
191
+ "normalized": false,
192
+ "rstrip": false,
193
+ "single_word": false,
194
+ "special": false
195
+ },
196
+ "248068": {
197
+ "content": "<think>",
198
+ "lstrip": false,
199
+ "normalized": false,
200
+ "rstrip": false,
201
+ "single_word": false,
202
+ "special": false
203
+ },
204
+ "248069": {
205
+ "content": "</think>",
206
+ "lstrip": false,
207
+ "normalized": false,
208
+ "rstrip": false,
209
+ "single_word": false,
210
+ "special": false
211
+ },
212
+ "248070": {
213
+ "content": "<|audio_start|>",
214
+ "lstrip": false,
215
+ "normalized": false,
216
+ "rstrip": false,
217
+ "single_word": false,
218
+ "special": true
219
+ },
220
+ "248071": {
221
+ "content": "<|audio_end|>",
222
+ "lstrip": false,
223
+ "normalized": false,
224
+ "rstrip": false,
225
+ "single_word": false,
226
+ "special": true
227
+ },
228
+ "248072": {
229
+ "content": "<tts_pad>",
230
+ "lstrip": false,
231
+ "normalized": false,
232
+ "rstrip": false,
233
+ "single_word": false,
234
+ "special": true
235
+ },
236
+ "248073": {
237
+ "content": "<tts_text_bos>",
238
+ "lstrip": false,
239
+ "normalized": false,
240
+ "rstrip": false,
241
+ "single_word": false,
242
+ "special": true
243
+ },
244
+ "248074": {
245
+ "content": "<tts_text_eod>",
246
+ "lstrip": false,
247
+ "normalized": false,
248
+ "rstrip": false,
249
+ "single_word": false,
250
+ "special": true
251
+ },
252
+ "248075": {
253
+ "content": "<tts_text_bos_single>",
254
+ "lstrip": false,
255
+ "normalized": false,
256
+ "rstrip": false,
257
+ "single_word": false,
258
+ "special": true
259
+ },
260
+ "248076": {
261
+ "content": "<|audio_pad|>",
262
+ "lstrip": false,
263
+ "normalized": false,
264
+ "rstrip": false,
265
+ "single_word": false,
266
+ "special": true
267
+ }
268
+ },
269
+ "additional_special_tokens": [
270
+ "<|im_start|>",
271
+ "<|im_end|>",
272
+ "<|object_ref_start|>",
273
+ "<|object_ref_end|>",
274
+ "<|box_start|>",
275
+ "<|box_end|>",
276
+ "<|quad_start|>",
277
+ "<|quad_end|>",
278
+ "<|vision_start|>",
279
+ "<|vision_end|>",
280
+ "<|vision_pad|>",
281
+ "<|image_pad|>",
282
+ "<|video_pad|>"
283
+ ],
284
+ "bos_token": null,
285
+ "chat_template": "{%- set image_count = namespace(value=0) %}\n{%- set video_count = namespace(value=0) %}\n{%- macro render_content(content, do_vision_count, is_system_content=false) %}\n {%- if content is string %}\n {{- content }}\n {%- elif content is iterable and content is not mapping %}\n {%- for item in content %}\n {%- if 'image' in item or 'image_url' in item or item.type == 'image' %}\n {%- if is_system_content %}\n {{- raise_exception('System message cannot contain images.') }}\n {%- endif %}\n {%- if do_vision_count %}\n {%- set image_count.value = image_count.value + 1 %}\n {%- endif %}\n {%- if add_vision_id %}\n {{- 'Picture ' ~ image_count.value ~ ': ' }}\n {%- endif %}\n {{- '<|vision_start|><|image_pad|><|vision_end|>' }}\n {%- elif 'video' in item or item.type == 'video' %}\n {%- if is_system_content %}\n {{- raise_exception('System message cannot contain videos.') }}\n {%- endif %}\n {%- if do_vision_count %}\n {%- set video_count.value = video_count.value + 1 %}\n {%- endif %}\n {%- if add_vision_id %}\n {{- 'Video ' ~ video_count.value ~ ': ' }}\n {%- endif %}\n {{- '<|vision_start|><|video_pad|><|vision_end|>' }}\n {%- elif 'text' in item %}\n {{- item.text }}\n {%- else %}\n {{- raise_exception('Unexpected item type in content.') }}\n {%- endif %}\n {%- endfor %}\n {%- elif content is none or content is undefined %}\n {{- '' }}\n {%- else %}\n {{- raise_exception('Unexpected content type.') }}\n {%- endif %}\n{%- endmacro %}\n{%- if not messages %}\n {{- raise_exception('No messages provided.') }}\n{%- endif %}\n{%- if tools and tools is iterable and tools is not mapping %}\n {{- '<|im_start|>system\\n' }}\n {{- \"# Tools\\n\\nYou have access to the following functions:\\n\\n<tools>\" }}\n {%- for tool in tools %}\n {{- \"\\n\" }}\n {{- tool | tojson }}\n {%- endfor %}\n {{- \"\\n</tools>\" }}\n {{- '\\n\\nIf you choose to call a function ONLY reply in the following format with NO suffix:\\n\\n<tool_call>\\n<function=example_function_name>\\n<parameter=example_parameter_1>\\nvalue_1\\n</parameter>\\n<parameter=example_parameter_2>\\nThis is the value for the second parameter\\nthat can span\\nmultiple lines\\n</parameter>\\n</function>\\n</tool_call>\\n\\n<IMPORTANT>\\nReminder:\\n- Function calls MUST follow the specified format: an inner <function=...></function> block must be nested within <tool_call></tool_call> XML tags\\n- Required parameters MUST be specified\\n- You may provide optional reasoning for your function call in natural language BEFORE the function call, but NOT after\\n- If there is no function call available, answer the question like normal with your current knowledge and do not tell the user about function calls\\n</IMPORTANT>' }}\n {%- if messages[0].role == 'system' %}\n {%- set content = render_content(messages[0].content, false, true)|trim %}\n {%- if content %}\n {{- '\\n\\n' + content }}\n {%- endif %}\n {%- endif %}\n {{- '<|im_end|>\\n' }}\n{%- else %}\n {%- if messages[0].role == 'system' %}\n {%- set content = render_content(messages[0].content, false, true)|trim %}\n {{- '<|im_start|>system\\n' + content + '<|im_end|>\\n' }}\n {%- endif %}\n{%- endif %}\n{%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %}\n{%- for message in messages[::-1] %}\n {%- set index = (messages|length - 1) - loop.index0 %}\n {%- if ns.multi_step_tool and message.role == \"user\" %}\n {%- set content = render_content(message.content, false)|trim %}\n {%- if not(content.startswith('<tool_response>') and content.endswith('</tool_response>')) %}\n {%- set ns.multi_step_tool = false %}\n {%- set ns.last_query_index = index %}\n {%- endif %}\n {%- endif %}\n{%- endfor %}\n{%- if ns.multi_step_tool %}\n {{- raise_exception('No user query found in messages.') }}\n{%- endif %}\n{%- for message in messages %}\n {%- set content = render_content(message.content, true)|trim %}\n {%- if message.role == \"system\" %}\n {%- if not loop.first %}\n {{- raise_exception('System message must be at the beginning.') }}\n {%- endif %}\n {%- elif message.role == \"user\" %}\n {{- '<|im_start|>' + message.role + '\\n' + content + '<|im_end|>' + '\\n' }}\n {%- elif message.role == \"assistant\" %}\n {%- set reasoning_content = '' %}\n {%- if message.reasoning_content is string %}\n {%- set reasoning_content = message.reasoning_content %}\n {%- else %}\n {%- if '</think>' in content %}\n {%- set reasoning_content = content.split('</think>')[0].rstrip('\\n').split('<think>')[-1].lstrip('\\n') %}\n {%- set content = content.split('</think>')[-1].lstrip('\\n') %}\n {%- endif %}\n {%- endif %}\n {%- set reasoning_content = reasoning_content|trim %}\n {%- if (preserve_thinking is defined and preserve_thinking is true) or (loop.index0 > ns.last_query_index) %}\n {{- '<|im_start|>' + message.role + '\\n<think>\\n' + reasoning_content + '\\n</think>\\n\\n' + content }}\n {%- else %}\n {{- '<|im_start|>' + message.role + '\\n' + content }}\n {%- endif %}\n {%- if message.tool_calls and message.tool_calls is iterable and message.tool_calls is not mapping %}\n {%- for tool_call in message.tool_calls %}\n {%- if tool_call.function is defined %}\n {%- set tool_call = tool_call.function %}\n {%- endif %}\n {%- if loop.first %}\n {%- if content|trim %}\n {{- '\\n\\n<tool_call>\\n<function=' + tool_call.name + '>\\n' }}\n {%- else %}\n {{- '<tool_call>\\n<function=' + tool_call.name + '>\\n' }}\n {%- endif %}\n {%- else %}\n {{- '\\n<tool_call>\\n<function=' + tool_call.name + '>\\n' }}\n {%- endif %}\n {%- if tool_call.arguments is defined %}\n {%- for args_name, args_value in tool_call.arguments|items %}\n {{- '<parameter=' + args_name + '>\\n' }}\n {%- set args_value = args_value | string if args_value is string else args_value | tojson | safe %}\n {{- args_value }}\n {{- '\\n</parameter>\\n' }}\n {%- endfor %}\n {%- endif %}\n {{- '</function>\\n</tool_call>' }}\n {%- endfor %}\n {%- endif %}\n {{- '<|im_end|>\\n' }}\n {%- elif message.role == \"tool\" %}\n {%- if loop.previtem and loop.previtem.role != \"tool\" %}\n {{- '<|im_start|>user' }}\n {%- endif %}\n {{- '\\n<tool_response>\\n' }}\n {{- content }}\n {{- '\\n</tool_response>' }}\n {%- if not loop.last and loop.nextitem.role != \"tool\" %}\n {{- '<|im_end|>\\n' }}\n {%- elif loop.last %}\n {{- '<|im_end|>\\n' }}\n {%- endif %}\n {%- else %}\n {{- raise_exception('Unexpected message role.') }}\n {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n {{- '<|im_start|>assistant\\n' }}\n {%- if enable_thinking is defined and enable_thinking is false %}\n {{- '<think>\\n\\n</think>\\n\\n' }}\n {%- else %}\n {{- '<think>\\n' }}\n {%- endif %}\n{%- endif %}",
286
+ "clean_up_tokenization_spaces": false,
287
+ "eos_token": "<|im_end|>",
288
+ "errors": "replace",
289
+ "model_max_length": 262144,
290
+ "pad_token": "<|endoftext|>",
291
+ "split_special_tokens": false,
292
+ "tokenizer_class": "Qwen2Tokenizer",
293
+ "unk_token": null,
294
+ "add_bos_token": false,
295
+ "pretokenize_regex": "(?i:'s|'t|'re|'ve|'m|'ll|'d)|[^\\r\\n\\p{L}\\p{N}]?[\\p{L}\\p{M}]+|\\p{N}| ?[^\\s\\p{L}\\p{M}\\p{N}]+[\\r\\n]*|\\s*[\\r\\n]+|\\s+(?!\\S)|\\s+",
296
+ "extra_special_tokens": {
297
+ "audio_bos_token": "<|audio_start|>",
298
+ "audio_eos_token": "<|audio_end|>",
299
+ "audio_token": "<|audio_pad|>",
300
+ "image_token": "<|image_pad|>",
301
+ "video_token": "<|video_pad|>",
302
+ "vision_bos_token": "<|vision_start|>",
303
+ "vision_eos_token": "<|vision_end|>"
304
+ }
305
+ }
vocab.json ADDED
The diff for this file is too large to render. See raw diff