Upload Hy3-preview-oQ6 via oMLX
Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
- .gitattributes +1 -0
- README.md +18 -0
- chat_template.jinja +195 -0
- config.json +76 -0
- generation_config.json +10 -0
- model-00001-of-00049.safetensors +3 -0
- model-00002-of-00049.safetensors +3 -0
- model-00003-of-00049.safetensors +3 -0
- model-00004-of-00049.safetensors +3 -0
- model-00005-of-00049.safetensors +3 -0
- model-00006-of-00049.safetensors +3 -0
- model-00007-of-00049.safetensors +3 -0
- model-00008-of-00049.safetensors +3 -0
- model-00009-of-00049.safetensors +3 -0
- model-00010-of-00049.safetensors +3 -0
- model-00011-of-00049.safetensors +3 -0
- model-00012-of-00049.safetensors +3 -0
- model-00013-of-00049.safetensors +3 -0
- model-00014-of-00049.safetensors +3 -0
- model-00015-of-00049.safetensors +3 -0
- model-00016-of-00049.safetensors +3 -0
- model-00017-of-00049.safetensors +3 -0
- model-00018-of-00049.safetensors +3 -0
- model-00019-of-00049.safetensors +3 -0
- model-00020-of-00049.safetensors +3 -0
- model-00021-of-00049.safetensors +3 -0
- model-00022-of-00049.safetensors +3 -0
- model-00023-of-00049.safetensors +3 -0
- model-00024-of-00049.safetensors +3 -0
- model-00025-of-00049.safetensors +3 -0
- model-00026-of-00049.safetensors +3 -0
- model-00027-of-00049.safetensors +3 -0
- model-00028-of-00049.safetensors +3 -0
- model-00029-of-00049.safetensors +3 -0
- model-00030-of-00049.safetensors +3 -0
- model-00031-of-00049.safetensors +3 -0
- model-00032-of-00049.safetensors +3 -0
- model-00033-of-00049.safetensors +3 -0
- model-00034-of-00049.safetensors +3 -0
- model-00035-of-00049.safetensors +3 -0
- model-00036-of-00049.safetensors +3 -0
- model-00037-of-00049.safetensors +3 -0
- model-00038-of-00049.safetensors +3 -0
- model-00039-of-00049.safetensors +3 -0
- model-00040-of-00049.safetensors +3 -0
- model-00041-of-00049.safetensors +3 -0
- model-00042-of-00049.safetensors +3 -0
- model-00043-of-00049.safetensors +3 -0
- model-00044-of-00049.safetensors +3 -0
- model-00045-of-00049.safetensors +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
model.safetensors.index.json filter=lfs diff=lfs merge=lfs -text
|
README.md
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
library_name: mlx
|
| 3 |
+
tags:
|
| 4 |
+
- mlx
|
| 5 |
+
- oq
|
| 6 |
+
- quantized
|
| 7 |
+
---
|
| 8 |
+
|
| 9 |
+
# Hy3-preview-oQ6
|
| 10 |
+
|
| 11 |
+
This model was quantized using [oQ](https://github.com/jundot/omlx) (oMLX v0.3.6) mixed-precision quantization.
|
| 12 |
+
|
| 13 |
+
## Quantization details
|
| 14 |
+
|
| 15 |
+
- **Model type**: hy_v3
|
| 16 |
+
- **Bits**: 6
|
| 17 |
+
- **Group size**: 64
|
| 18 |
+
- **Format**: MLX safetensors
|
chat_template.jinja
ADDED
|
@@ -0,0 +1,195 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{#- ----------‑‑‑ special token variables ‑‑‑---------- -#}
|
| 2 |
+
{%- set bos_token = '<|hy_begin▁of▁sentence|>' %}
|
| 3 |
+
{%- set pad_token = '<|hy_▁pad▁|>' %}
|
| 4 |
+
{%- set user_token = '<|hy_User|>' %}
|
| 5 |
+
{%- set assistant_token = '<|hy_Assistant|>' %}
|
| 6 |
+
{%- set eos_token = '<|hy_eos|>' %}
|
| 7 |
+
{%- set think_begin_token = '<think>' %}
|
| 8 |
+
{%- set think_end_token = '</think>' %}
|
| 9 |
+
{%- set toolcalls_begin_token = '<tool_calls>' %}
|
| 10 |
+
{%- set toolcalls_end_token = '</tool_calls>' %}
|
| 11 |
+
{%- set toolcall_begin_token = '<tool_call>' %}
|
| 12 |
+
{%- set toolcall_end_token = '</tool_call>' %}
|
| 13 |
+
{%- set toolsep_token = '<tool_sep>' %}
|
| 14 |
+
{%- set argkey_begin_token = '<arg_key>' %}
|
| 15 |
+
{%- set argkey_end_token = '</arg_key>' %}
|
| 16 |
+
{%- set argvalue_begin_token = '<arg_value>' %}
|
| 17 |
+
{%- set argvalue_end_token = '</arg_value>' %}
|
| 18 |
+
{%- set toolresponses_begin_token = '<tool_responses>' %}
|
| 19 |
+
{%- set toolresponses_end_token = '</tool_responses>' %}
|
| 20 |
+
{%- set toolresponse_begin_token = '<tool_response>' %}
|
| 21 |
+
{%- set toolresponse_end_token = '</tool_response>' %}
|
| 22 |
+
{%- set reasoning_mode_token = '<|reasoning_mode|>' %}
|
| 23 |
+
{#- ----------‑‑‑ hyperparameters variables ‑‑‑---------- -#}
|
| 24 |
+
{%- if not add_generation_prompt is defined %}
|
| 25 |
+
{%- set add_generation_prompt = false %}
|
| 26 |
+
{%- endif %}
|
| 27 |
+
{%- if not interleaved_thinking is defined %}
|
| 28 |
+
{%- set interleaved_thinking = false %}
|
| 29 |
+
{%- endif %}
|
| 30 |
+
{%- if not tools %}
|
| 31 |
+
{%- set interleaved_thinking = false %}
|
| 32 |
+
{%- endif %}
|
| 33 |
+
{%- if not is_training is defined %}
|
| 34 |
+
{%- set is_training = false %}
|
| 35 |
+
{%- endif %}
|
| 36 |
+
{%- if not reasoning_effort is defined or reasoning_effort not in ['high', 'low', 'no_think'] %}
|
| 37 |
+
{%- set reasoning_effort = 'no_think' %}
|
| 38 |
+
{%- endif %}
|
| 39 |
+
|
| 40 |
+
{%- macro visible_text(content) -%}
|
| 41 |
+
{%- if content is string -%}
|
| 42 |
+
{{- content }}
|
| 43 |
+
{%- elif content is iterable and content is not mapping -%}
|
| 44 |
+
{%- for item in content -%}
|
| 45 |
+
{%- if item is mapping and item.type == 'text' -%}
|
| 46 |
+
{{- item.text }}
|
| 47 |
+
{%- elif item is string -%}
|
| 48 |
+
{{- item }}
|
| 49 |
+
{%- endif -%}
|
| 50 |
+
{%- endfor -%}
|
| 51 |
+
{%- elif content is none -%}
|
| 52 |
+
{{- '' }}
|
| 53 |
+
{%- else -%}
|
| 54 |
+
{{- content }}
|
| 55 |
+
{%- endif -%}
|
| 56 |
+
{%- endmacro -%}
|
| 57 |
+
|
| 58 |
+
{%- set ns = namespace(last_user_index=-1) %}
|
| 59 |
+
{%- set sp_ns = namespace(system_prompt='', is_first_sp=true) %}
|
| 60 |
+
{%- for message in messages %}
|
| 61 |
+
{%- if message['role'] == 'system' %}
|
| 62 |
+
{%- set sp_ns.system_prompt = sp_ns.system_prompt + visible_text(message['content']) %}
|
| 63 |
+
{%- endif %}
|
| 64 |
+
{%- if message['role'] == 'user' %}
|
| 65 |
+
{%- set ns.last_user_index = loop.index0 %}
|
| 66 |
+
{%- endif %}
|
| 67 |
+
{%- endfor %}
|
| 68 |
+
{%- if reasoning_effort is defined and reasoning_effort is string and reasoning_effort != '' and not tools %}
|
| 69 |
+
{%- set sp_ns.system_prompt = sp_ns.system_prompt + reasoning_mode_token + 'reasoning_effort:' + reasoning_effort %}
|
| 70 |
+
{%- endif %}
|
| 71 |
+
{{- bos_token }}
|
| 72 |
+
{{- sp_ns.system_prompt }}
|
| 73 |
+
{%- if tools %}
|
| 74 |
+
{%- if sp_ns.system_prompt != '' %}
|
| 75 |
+
{{- '\n\n# Tools\n\nYou may call one or more functions to assist with the user query.' }}
|
| 76 |
+
{%- else %}
|
| 77 |
+
{{- '# Tools\n\nYou may call one or more functions to assist with the user query.' }}
|
| 78 |
+
{%- endif %}
|
| 79 |
+
{{- '\n\nYou are provided with function signatures within <tools></tools> XML tags:' }}
|
| 80 |
+
{{- '\n<tools>\n' }}
|
| 81 |
+
{%- for tool in tools %}
|
| 82 |
+
{%- if loop.index0 > 0 %}
|
| 83 |
+
{{- '\n' }}
|
| 84 |
+
{%- endif %}
|
| 85 |
+
{{- tool | tojson }}
|
| 86 |
+
{%- endfor %}
|
| 87 |
+
{{- '\n</tools>\n\n' }}
|
| 88 |
+
{{- 'For function call returns, you should first print ' + toolcalls_begin_token + '\n' }}
|
| 89 |
+
{{- 'For each function call, you should return object like:\n' }}
|
| 90 |
+
{{- toolcall_begin_token + '{function-name}' + toolsep_token + '\n' }}
|
| 91 |
+
{{- argkey_begin_token + '{arg-key-1}' + argkey_end_token + '\n' }}
|
| 92 |
+
{{- argvalue_begin_token + '{arg-value-1}' + argvalue_end_token + '\n' }}
|
| 93 |
+
{{- argkey_begin_token + '{arg-key-2}' + argkey_end_token + '\n' }}
|
| 94 |
+
{{- argvalue_begin_token + '{arg-value-2}' + argvalue_end_token + '\n' }}
|
| 95 |
+
{{- '...\n' }}
|
| 96 |
+
{{- toolcall_end_token + '\n' }}
|
| 97 |
+
{%- if reasoning_effort is defined and reasoning_effort is string and reasoning_effort != '' %}
|
| 98 |
+
{{- 'At the end of function call returns, you should print ' + toolcalls_end_token + reasoning_mode_token + 'reasoning_effort:' + reasoning_effort }}
|
| 99 |
+
{%- else %}
|
| 100 |
+
{{- 'At the end of function call returns, you should print ' + toolcalls_end_token }}
|
| 101 |
+
{%- endif %}
|
| 102 |
+
{%- endif %}
|
| 103 |
+
|
| 104 |
+
{%- set prev_ns = namespace(is_tool=false, is_tool_first=true) %}
|
| 105 |
+
{%- set last_ns = namespace(last_is_assistant=false) %}
|
| 106 |
+
{%- for message in messages %}
|
| 107 |
+
{%- if message['role'] == 'user' %}
|
| 108 |
+
{%- if prev_ns.is_tool %}
|
| 109 |
+
{{- toolresponses_end_token }}
|
| 110 |
+
{%- endif %}
|
| 111 |
+
{{- user_token + visible_text(message['content']) }}
|
| 112 |
+
{%- set prev_ns.is_tool = false %}
|
| 113 |
+
{%- endif %}
|
| 114 |
+
{%- if message['role'] == 'assistant' %}
|
| 115 |
+
{%- if 'reasoning_content' in message and message['reasoning_content'] is string %}
|
| 116 |
+
{%- set rc = message['reasoning_content'] %}
|
| 117 |
+
{%- elif 'reasoning' in message and message['reasoning'] is string %}
|
| 118 |
+
{%- set rc = message['reasoning'] %}
|
| 119 |
+
{%- else %}
|
| 120 |
+
{%- set rc = none %}
|
| 121 |
+
{%- endif %}
|
| 122 |
+
{%- if is_training %}
|
| 123 |
+
{%- if rc is not none %}
|
| 124 |
+
{%- set content = think_begin_token + rc + think_end_token + visible_text(message['content']) %}
|
| 125 |
+
{%- else %}
|
| 126 |
+
{%- set content = think_begin_token + think_end_token + visible_text(message['content']) %}
|
| 127 |
+
{%- endif %}
|
| 128 |
+
{%- else %}
|
| 129 |
+
{%- if interleaved_thinking %}
|
| 130 |
+
{%- if loop.index0 > ns.last_user_index and rc is not none %}
|
| 131 |
+
{%- set content = think_begin_token + rc + think_end_token + visible_text(message['content']) %}
|
| 132 |
+
{%- else %}
|
| 133 |
+
{%- set content = think_begin_token + think_end_token + visible_text(message['content']) %}
|
| 134 |
+
{%- endif %}
|
| 135 |
+
{%- else %}
|
| 136 |
+
{%- set content = think_begin_token + think_end_token + visible_text(message['content']) %}
|
| 137 |
+
{%- endif %}
|
| 138 |
+
{%- endif %}
|
| 139 |
+
{%- if prev_ns.is_tool %}
|
| 140 |
+
{{- toolresponses_end_token }}
|
| 141 |
+
{%- endif %}
|
| 142 |
+
{{- assistant_token }}
|
| 143 |
+
{%- if message['tool_calls'] is defined and message['tool_calls'] %}
|
| 144 |
+
{%- set prev_ns.is_tool_first = true %}
|
| 145 |
+
{{- content }}
|
| 146 |
+
{{- toolcalls_begin_token + '\n' }}
|
| 147 |
+
{%- for tool in message['tool_calls'] %}
|
| 148 |
+
{%- set arguments = tool['function']['arguments'] %}
|
| 149 |
+
{{- toolcall_begin_token + tool['function']['name'] + toolsep_token + '\n' }}
|
| 150 |
+
{%- for key, value in arguments.items() %}
|
| 151 |
+
{{- argkey_begin_token + key + argkey_end_token + '\n' }}
|
| 152 |
+
{%- if value is not string %}
|
| 153 |
+
{%- set value = value | tojson(ensure_ascii=False) %}
|
| 154 |
+
{%- endif %}
|
| 155 |
+
{{- argvalue_begin_token + value + argvalue_end_token + '\n' }}
|
| 156 |
+
{%- endfor %}
|
| 157 |
+
{{- toolcall_end_token + '\n' }}
|
| 158 |
+
{%- endfor %}
|
| 159 |
+
{{- toolcalls_end_token + eos_token }}
|
| 160 |
+
{%- else %}
|
| 161 |
+
{%- if not loop.last or is_training %}
|
| 162 |
+
{{- content + eos_token }}
|
| 163 |
+
{%- else %}
|
| 164 |
+
{{- content }}
|
| 165 |
+
{%- endif %}
|
| 166 |
+
{%- endif %}
|
| 167 |
+
{%- set prev_ns.is_tool = false %}
|
| 168 |
+
{%- endif %}
|
| 169 |
+
{%- if message['role'] == 'tool' %}
|
| 170 |
+
{%- set prev_ns.is_tool = true %}
|
| 171 |
+
{%- if prev_ns.is_tool_first %}
|
| 172 |
+
{{- toolresponses_begin_token + '\n' }}
|
| 173 |
+
{%- set prev_ns.is_tool_first = false %}
|
| 174 |
+
{%- endif %}
|
| 175 |
+
{{- toolresponse_begin_token + '\n' + visible_text(message['content']) + '\n' + toolresponse_end_token + '\n' }}
|
| 176 |
+
{%- endif %}
|
| 177 |
+
{%- if loop.last and message['role'] == 'assistant' %}
|
| 178 |
+
{%- set last_ns.last_is_assistant = true %}
|
| 179 |
+
{%- endif %}
|
| 180 |
+
|
| 181 |
+
{%- endfor %}
|
| 182 |
+
{%- if prev_ns.is_tool %}
|
| 183 |
+
{{- toolresponses_end_token }}
|
| 184 |
+
{%- endif %}
|
| 185 |
+
{%- if add_generation_prompt %}
|
| 186 |
+
{%- if not last_ns.last_is_assistant %}
|
| 187 |
+
{%- if reasoning_effort is defined and reasoning_effort in ['low', 'high'] %}
|
| 188 |
+
{{- assistant_token + think_begin_token }}
|
| 189 |
+
{%- elif reasoning_effort is defined and reasoning_effort == 'no_think' %}
|
| 190 |
+
{{- assistant_token + think_begin_token + think_end_token }}
|
| 191 |
+
{%- else %}
|
| 192 |
+
{{- assistant_token }}
|
| 193 |
+
{%- endif %}
|
| 194 |
+
{%- endif %}
|
| 195 |
+
{%- endif %}
|
config.json
ADDED
|
@@ -0,0 +1,76 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"HYV3ForCausalLM"
|
| 4 |
+
],
|
| 5 |
+
"bos_token_id": 120000,
|
| 6 |
+
"enable_attention_fp32_softmax": false,
|
| 7 |
+
"enable_lm_head_fp32": true,
|
| 8 |
+
"enable_moe_fp32_combine": false,
|
| 9 |
+
"eod_token_id": 120026,
|
| 10 |
+
"eos_token_id": 120025,
|
| 11 |
+
"expert_hidden_dim": 1536,
|
| 12 |
+
"moe_intermediate_size": 1536,
|
| 13 |
+
"first_k_dense_replace": 1,
|
| 14 |
+
"head_dim": 128,
|
| 15 |
+
"hidden_act": "silu",
|
| 16 |
+
"hidden_size": 4096,
|
| 17 |
+
"initializer_range": 0.006,
|
| 18 |
+
"intermediate_size": 13312,
|
| 19 |
+
"max_position_embeddings": 262144,
|
| 20 |
+
"model_type": "hy_v3",
|
| 21 |
+
"moe_router_enable_expert_bias": true,
|
| 22 |
+
"moe_router_use_sigmoid": true,
|
| 23 |
+
"num_attention_heads": 64,
|
| 24 |
+
"num_experts": 192,
|
| 25 |
+
"num_experts_per_tok": 8,
|
| 26 |
+
"num_hidden_layers": 80,
|
| 27 |
+
"num_key_value_heads": 8,
|
| 28 |
+
"num_shared_experts": 1,
|
| 29 |
+
"output_router_logits": true,
|
| 30 |
+
"pad_token_id": 120002,
|
| 31 |
+
"qk_norm": true,
|
| 32 |
+
"rms_norm_eps": 1e-05,
|
| 33 |
+
"rope_parameters": {
|
| 34 |
+
"rope_theta": 11158840.0,
|
| 35 |
+
"rope_type": "default"
|
| 36 |
+
},
|
| 37 |
+
"route_norm": true,
|
| 38 |
+
"router_scaling_factor": 2.826,
|
| 39 |
+
"sep_token_id": 120007,
|
| 40 |
+
"tie_word_embeddings": false,
|
| 41 |
+
"transformers_version": "5.6.0",
|
| 42 |
+
"use_cache": true,
|
| 43 |
+
"use_grouped_mm": false,
|
| 44 |
+
"vocab_size": 120832,
|
| 45 |
+
"num_nextn_predict_layers": 1,
|
| 46 |
+
"quantization": {
|
| 47 |
+
"group_size": 64,
|
| 48 |
+
"bits": 6,
|
| 49 |
+
"mode": "affine",
|
| 50 |
+
"lm_head": {
|
| 51 |
+
"bits": 8,
|
| 52 |
+
"group_size": 64,
|
| 53 |
+
"mode": "affine"
|
| 54 |
+
},
|
| 55 |
+
"model.embed_tokens": {
|
| 56 |
+
"bits": 8,
|
| 57 |
+
"group_size": 64,
|
| 58 |
+
"mode": "affine"
|
| 59 |
+
}
|
| 60 |
+
},
|
| 61 |
+
"quantization_config": {
|
| 62 |
+
"group_size": 64,
|
| 63 |
+
"bits": 6,
|
| 64 |
+
"mode": "affine",
|
| 65 |
+
"lm_head": {
|
| 66 |
+
"bits": 8,
|
| 67 |
+
"group_size": 64,
|
| 68 |
+
"mode": "affine"
|
| 69 |
+
},
|
| 70 |
+
"model.embed_tokens": {
|
| 71 |
+
"bits": 8,
|
| 72 |
+
"group_size": 64,
|
| 73 |
+
"mode": "affine"
|
| 74 |
+
}
|
| 75 |
+
}
|
| 76 |
+
}
|
generation_config.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token_id": 120000,
|
| 3 |
+
"do_sample": true,
|
| 4 |
+
"eos_token_id": 120025,
|
| 5 |
+
"pad_token_id": 120002,
|
| 6 |
+
"temperature": 0.9,
|
| 7 |
+
"top_k": -1,
|
| 8 |
+
"top_p": 1,
|
| 9 |
+
"transformers_version": "5.6.0"
|
| 10 |
+
}
|
model-00001-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:760d28c1eda5ddfbf8bba6b0481acd795f1b5b24afc552d43082e87a177d9c14
|
| 3 |
+
size 5004818860
|
model-00002-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6fff0edbd18b51ab7b85a0aefc99519e1f2af0e49766baf07a7748ae3fb33255
|
| 3 |
+
size 5004822229
|
model-00003-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4ffbe9956387ff8c01c80c4b362f105ba84e1d57605457c3b86485d7c04c9b72
|
| 3 |
+
size 5004822013
|
model-00004-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:490ae864e74e01cbbd2d2dd1fc4e75c30254fbd90599674bae4ed5567165588b
|
| 3 |
+
size 5004822102
|
model-00005-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7994f6c25542f9144b8890af4f566bb4822f60015c63b4829836733f005c7447
|
| 3 |
+
size 5004822344
|
model-00006-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1b309b6a58bd074c9a8c6c08b6ff54704a2460870ec8bdc472b320b27157ae44
|
| 3 |
+
size 5005153050
|
model-00007-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:350b897574d301e7ad12eb6a01c17a05f40b3b7696f17d56d6b48d3abfa5085d
|
| 3 |
+
size 5004829352
|
model-00008-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2bd19911a0a6eba73cfae64280527295043addb4163bcdafdb4fb32937e0d336
|
| 3 |
+
size 5004822681
|
model-00009-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:019034a895e38dca3458caeac7935d6ea573585c60b384a3e17c0fbffe306bb0
|
| 3 |
+
size 5004822255
|
model-00010-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:37ab986bba571faddfe6fed29afba9ee573b87d9b650fb553d24bfb05e4759af
|
| 3 |
+
size 5004821834
|
model-00011-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e936438f3bc3ea23234a15d27ba4f34b4dfd4fc2b744a0ed1bfe37fbbb91e757
|
| 3 |
+
size 5004822421
|
model-00012-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3124034fcd7c64f4e7b261c7b494f684e0372692fd82eefc475a9a5dfeee6156
|
| 3 |
+
size 5004787586
|
model-00013-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e1052ff478482b2b590a73e9e7d2d9f48ec2fcf3e4ce85399d9cd41d1f63b236
|
| 3 |
+
size 5003113584
|
model-00014-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3eea466c1e8b04b6fa86e7e42b5ec63c1b49efb8e78ddde358f0be124f6113c2
|
| 3 |
+
size 5004822565
|
model-00015-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:009c938d0c3aaded913b64f7b78979af8c66cd5146688a3ed8e49915fbfed8ab
|
| 3 |
+
size 5004822337
|
model-00016-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:18abc3d15d3ed297815b8dbdd1578d296fe47e834ec8d4d55db79254b6c9934a
|
| 3 |
+
size 5004822112
|
model-00017-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:360ba44004e81d8236cd3dbc20aa45b5cfde6c4bcb8ed52c1cbd3fa66b1a6167
|
| 3 |
+
size 5004822023
|
model-00018-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2f498f34872b33a55d9d843a3859e05899427ed303ea885c00d580a548654f82
|
| 3 |
+
size 5001392577
|
model-00019-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4ee984b97b32a615c8c161c1a77f62760c91a331135190f4a60726fe7d0f6de7
|
| 3 |
+
size 5004803977
|
model-00020-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b96c462eecae038473243f8332cb4d8279377432f0483b63454c875b01019093
|
| 3 |
+
size 5004822145
|
model-00021-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1c88b76d68ccddcbcbf0e7893a6e552f8f774764f3a7caec9438632a84231e4d
|
| 3 |
+
size 5004822327
|
model-00022-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a716da6f9ab60679af633bd659db4eaaa1b7fd94a6ad02e81050ba8855247437
|
| 3 |
+
size 5004822310
|
model-00023-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:56b36064055bb736cd6f4336bfedffffdf408ee539874583ad731bc51d916e21
|
| 3 |
+
size 5004821937
|
model-00024-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dc50b78fd2802e85cffa60d707df9cbbf444f63f3e10134833f03ea9d06982de
|
| 3 |
+
size 5018437895
|
model-00025-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0ab4b755c42fe3f1b3df1cd3be6b32365ffa377bef50165398fbf62983f1b005
|
| 3 |
+
size 5003090597
|
model-00026-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e1d846c4fda3e679a2a785d06d14fb7f63735b59277280fb0a1710c1058918f4
|
| 3 |
+
size 5004822128
|
model-00027-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3a55c7225fe0b73930826c3c6d2c166bb7919907141c49af326ed56c6a2f3352
|
| 3 |
+
size 5004822047
|
model-00028-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b41f176c1c9c80d3092b885e7e02dcad3f125a6de5cf0bfab3f6771b7d45940b
|
| 3 |
+
size 5004822506
|
model-00029-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:49ae74b4a1a4123e71664ee48b41e83c9ea7f2276b8637eafaecb81dc41aca56
|
| 3 |
+
size 5004822178
|
model-00030-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7567f55eb289a4b7f2580010f8a1150c435a78fba236e82a32d461705363c47a
|
| 3 |
+
size 5004822153
|
model-00031-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6a8a918e107d456c34c61b52db72815e586d4ff0c2d8205cdfa2cf071e42f4e5
|
| 3 |
+
size 5002404624
|
model-00032-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7a9083ef7550006606d28d307dca7460e2522c20c7baa6f7d4a1b4e8d4a31798
|
| 3 |
+
size 5004822334
|
model-00033-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7bfbb471ec2ab1b40ca5b94bf95b73b58b70dea3a116aeeab6ac5375842afc71
|
| 3 |
+
size 5004822158
|
model-00034-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ec336161fc99763fa8cbb4caf773113ee6e8c374d629e45f7bb57755b90aabc2
|
| 3 |
+
size 5004822152
|
model-00035-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b8d77fde7e4d388ad785f3efe91c2afb141b615ff6242aa854b669e29223da77
|
| 3 |
+
size 5004822573
|
model-00036-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:24688974d54ba8425015907d293337b1e6f753700f412234fbf301d34c0c8056
|
| 3 |
+
size 5004822274
|
model-00037-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:50550919fa45e5eb37c822a1e9924d8f1d0d3b516b0e8dca5ec2bd6c2f97b2c1
|
| 3 |
+
size 5003316083
|
model-00038-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aaa3783b41b1b2db1b911389a012313a1473948ff918b0a6e39460fa200658ca
|
| 3 |
+
size 5004822297
|
model-00039-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d913c8af1989adbb18eef4fa4fc3e83645f5721144853a6718621162847e8a58
|
| 3 |
+
size 5004822304
|
model-00040-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:65289464230321bf7847657da5bf9b4be58ee5b943121be1c2dbb22694790bd4
|
| 3 |
+
size 5004822116
|
model-00041-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ba5593b98316f204ff3e024b109227c68cbc4ac71e8d8e8fdb66f1120ff444d0
|
| 3 |
+
size 5004822312
|
model-00042-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ded5186b7f373a68c27707ed0d825c6971ace2b839d295160753d12dc22f3ff8
|
| 3 |
+
size 5004822360
|
model-00043-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bfe2d24114f88ec0120995462d9976cf4d11304210e1e4a332fafaa47850dbc5
|
| 3 |
+
size 5003095784
|
model-00044-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fbf55f92d47dc024db25d4a21b0c0e679465e0f6d7f2f77f7ca27002397f8327
|
| 3 |
+
size 5004821720
|
model-00045-of-00049.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9b0afd15c8dcef18a9dc83950068891658e2e6968e126c3f5da7b41b3492f747
|
| 3 |
+
size 5004822553
|