wwwtttjjj committed on
Commit ·
078d7d9
1
Parent(s): fa287b5
pure
Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
- .gitattributes +1 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/extra_state_world_size_8_rank_0.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/extra_state_world_size_8_rank_1.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/extra_state_world_size_8_rank_2.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/extra_state_world_size_8_rank_3.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/extra_state_world_size_8_rank_4.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/extra_state_world_size_8_rank_5.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/extra_state_world_size_8_rank_6.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/extra_state_world_size_8_rank_7.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/huggingface/added_tokens.json +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/huggingface/chat_template.jinja +54 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/huggingface/config.json +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/huggingface/merges.txt +0 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/huggingface/special_tokens_map.json +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/huggingface/tokenizer.json +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/huggingface/tokenizer_config.json +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/huggingface/vocab.json +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/model_world_size_8_rank_0.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/model_world_size_8_rank_1.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/model_world_size_8_rank_2.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/model_world_size_8_rank_3.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/model_world_size_8_rank_4.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/model_world_size_8_rank_5.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/model_world_size_8_rank_6.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/model_world_size_8_rank_7.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/optim_world_size_8_rank_0.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/optim_world_size_8_rank_1.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/optim_world_size_8_rank_2.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/optim_world_size_8_rank_3.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/optim_world_size_8_rank_4.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/optim_world_size_8_rank_5.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/optim_world_size_8_rank_6.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/actor/optim_world_size_8_rank_7.pt +3 -0
- qwen-1.5B-skywork-1.5B/global_step_250/data.pt +3 -0
- qwen-7B-skywork-7B/global_step_190/actor/extra_state_world_size_8_rank_0.pt +3 -0
- qwen-7B-skywork-7B/global_step_190/actor/extra_state_world_size_8_rank_1.pt +3 -0
- qwen-7B-skywork-7B/global_step_190/actor/extra_state_world_size_8_rank_2.pt +3 -0
- qwen-7B-skywork-7B/global_step_190/actor/extra_state_world_size_8_rank_3.pt +3 -0
- qwen-7B-skywork-7B/global_step_190/actor/extra_state_world_size_8_rank_4.pt +3 -0
- qwen-7B-skywork-7B/global_step_190/actor/extra_state_world_size_8_rank_5.pt +3 -0
- qwen-7B-skywork-7B/global_step_190/actor/extra_state_world_size_8_rank_6.pt +3 -0
- qwen-7B-skywork-7B/global_step_190/actor/extra_state_world_size_8_rank_7.pt +3 -0
- qwen-7B-skywork-7B/global_step_190/actor/hf_model/added_tokens.json +3 -0
- qwen-7B-skywork-7B/global_step_190/actor/hf_model/config.json +3 -0
- qwen-7B-skywork-7B/global_step_190/actor/hf_model/generation_config.json +3 -0
- qwen-7B-skywork-7B/global_step_190/actor/hf_model/merges.txt +0 -0
- qwen-7B-skywork-7B/global_step_190/actor/hf_model/model-00001-of-00004.safetensors +3 -0
- qwen-7B-skywork-7B/global_step_190/actor/hf_model/model-00002-of-00004.safetensors +3 -0
- qwen-7B-skywork-7B/global_step_190/actor/hf_model/model-00003-of-00004.safetensors +3 -0
- qwen-7B-skywork-7B/global_step_190/actor/hf_model/model-00004-of-00004.safetensors +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
*.json filter=lfs diff=lfs merge=lfs -text
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/extra_state_world_size_8_rank_0.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7c56eca5155ffcb4e688bd056a7d1006dcef69a6f432224118cdf9d442bc4d97
|
| 3 |
+
size 14632
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/extra_state_world_size_8_rank_1.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ba87237fcb4caea12ef21d5a6e1a7e564fdf9764054fb0b0b19f14b8b839cefd
|
| 3 |
+
size 14632
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/extra_state_world_size_8_rank_2.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2c2c8c5908c6c2877940f3fbc43b51cafd38287173a3b20abf3d4a793fe000ce
|
| 3 |
+
size 14632
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/extra_state_world_size_8_rank_3.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1c1ccd26fefc6ba7cc6eead04b7fecc5e4a9ab80e8fc01ae14d31fc8c6ed9638
|
| 3 |
+
size 14632
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/extra_state_world_size_8_rank_4.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:78a338d6da41fde705987fc7d9e81c0d66a9a47dc98abd0611a67bb60792abae
|
| 3 |
+
size 14632
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/extra_state_world_size_8_rank_5.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:70f07ee320260c830ff4479a97c094a28cc8055d62c868ac611dcd9d6da9918f
|
| 3 |
+
size 14632
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/extra_state_world_size_8_rank_6.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d29417545ae20e4d1fe42828b790db38082bdc3616ab8c7d7f3ee5860f5af795
|
| 3 |
+
size 14632
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/extra_state_world_size_8_rank_7.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:774833e7fbf8a7cda3eec8f638f5ccef80141b202e5f6020f8ee8d5b141308f6
|
| 3 |
+
size 14632
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/huggingface/added_tokens.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b
|
| 3 |
+
size 605
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/huggingface/chat_template.jinja
ADDED
|
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{%- if tools %}
|
| 2 |
+
{{- '<|im_start|>system\n' }}
|
| 3 |
+
{%- if messages[0]['role'] == 'system' %}
|
| 4 |
+
{{- messages[0]['content'] }}
|
| 5 |
+
{%- else %}
|
| 6 |
+
{{- 'Please reason step by step, and put your final answer within \\boxed{}.' }}
|
| 7 |
+
{%- endif %}
|
| 8 |
+
{{- "\n\n# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>" }}
|
| 9 |
+
{%- for tool in tools %}
|
| 10 |
+
{{- "\n" }}
|
| 11 |
+
{{- tool | tojson }}
|
| 12 |
+
{%- endfor %}
|
| 13 |
+
{{- "\n</tools>\n\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\n<tool_call>\n{\"name\": <function-name>, \"arguments\": <args-json-object>}\n</tool_call><|im_end|>\n" }}
|
| 14 |
+
{%- else %}
|
| 15 |
+
{%- if messages[0]['role'] == 'system' %}
|
| 16 |
+
{{- '<|im_start|>system\n' + messages[0]['content'] + '<|im_end|>\n' }}
|
| 17 |
+
{%- else %}
|
| 18 |
+
{{- '<|im_start|>system\nPlease reason step by step, and put your final answer within \\boxed{}.<|im_end|>\n' }}
|
| 19 |
+
{%- endif %}
|
| 20 |
+
{%- endif %}
|
| 21 |
+
{%- for message in messages %}
|
| 22 |
+
{%- if (message.role == "user") or (message.role == "system" and not loop.first) or (message.role == "assistant" and not message.tool_calls) %}
|
| 23 |
+
{{- '<|im_start|>' + message.role + '\n' + message.content + '<|im_end|>' + '\n' }}
|
| 24 |
+
{%- elif message.role == "assistant" %}
|
| 25 |
+
{{- '<|im_start|>' + message.role }}
|
| 26 |
+
{%- if message.content %}
|
| 27 |
+
{{- '\n' + message.content }}
|
| 28 |
+
{%- endif %}
|
| 29 |
+
{%- for tool_call in message.tool_calls %}
|
| 30 |
+
{%- if tool_call.function is defined %}
|
| 31 |
+
{%- set tool_call = tool_call.function %}
|
| 32 |
+
{%- endif %}
|
| 33 |
+
{{- '\n<tool_call>\n{"name": "' }}
|
| 34 |
+
{{- tool_call.name }}
|
| 35 |
+
{{- '", "arguments": ' }}
|
| 36 |
+
{{- tool_call.arguments | tojson }}
|
| 37 |
+
{{- '}\n</tool_call>' }}
|
| 38 |
+
{%- endfor %}
|
| 39 |
+
{{- '<|im_end|>\n' }}
|
| 40 |
+
{%- elif message.role == "tool" %}
|
| 41 |
+
{%- if (loop.index0 == 0) or (messages[loop.index0 - 1].role != "tool") %}
|
| 42 |
+
{{- '<|im_start|>user' }}
|
| 43 |
+
{%- endif %}
|
| 44 |
+
{{- '\n<tool_response>\n' }}
|
| 45 |
+
{{- message.content }}
|
| 46 |
+
{{- '\n</tool_response>' }}
|
| 47 |
+
{%- if loop.last or (messages[loop.index0 + 1].role != "tool") %}
|
| 48 |
+
{{- '<|im_end|>\n' }}
|
| 49 |
+
{%- endif %}
|
| 50 |
+
{%- endif %}
|
| 51 |
+
{%- endfor %}
|
| 52 |
+
{%- if add_generation_prompt %}
|
| 53 |
+
{{- '<|im_start|>assistant\n' }}
|
| 54 |
+
{%- endif %}
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/huggingface/config.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9e321f017c3bc28c8ea90b9256fcd367ae319c1f3c8205de54e28bd4638a57b1
|
| 3 |
+
size 1338
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/huggingface/merges.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/huggingface/special_tokens_map.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6676f091c8bc4d1b50146427cfde92073402866b87b6e39223227931b70083e9
|
| 3 |
+
size 616
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/huggingface/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa
|
| 3 |
+
size 11421896
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/huggingface/tokenizer_config.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:60f6e7bc948cedd377a20f01d022ef664d026fbc93d72e0a9bdac233f8632181
|
| 3 |
+
size 4689
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/huggingface/vocab.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910
|
| 3 |
+
size 2776833
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/model_world_size_8_rank_0.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a8324747f5a4bf39a9f780cfea9bdd0e21fcefbd3440af1b20a4562f52bb7960
|
| 3 |
+
size 888732218
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/model_world_size_8_rank_1.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f624a74d887351fdd969c7ca083e212941769bbcf97b01b82b29d4f26cfcdf58
|
| 3 |
+
size 888732218
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/model_world_size_8_rank_2.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:de48bda292149a42eba20f7e33a4c6ac46f6afda68eae424a2defa01e9771a0d
|
| 3 |
+
size 888732218
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/model_world_size_8_rank_3.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:905712736ac83c3fb8012fdb22d17c8dccfacc5ebd1f70cd509d024fc20a9663
|
| 3 |
+
size 888732218
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/model_world_size_8_rank_4.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d59fedc3a47af84f7b0d30782191b9b335f6bbfbd668d95a442549463f02be0a
|
| 3 |
+
size 888732218
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/model_world_size_8_rank_5.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c4ef1e13df5d7ab60abb9cd74abc988e326fb81be7ef53e842e96340132d8fed
|
| 3 |
+
size 888732218
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/model_world_size_8_rank_6.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3e9fd643388b7af722f94c7947e543711811638f665de34684c1b15c5009e9dc
|
| 3 |
+
size 888732218
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/model_world_size_8_rank_7.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6f93027254e732311d9dda4275682356f2bf7e8bb66ba8fefaf113d265639177
|
| 3 |
+
size 888732218
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/optim_world_size_8_rank_0.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:513e3b3a6e85ae6321593d9c37d72aa014d10b0a9ce3519ab4101f6a83c280e9
|
| 3 |
+
size 1543740471
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/optim_world_size_8_rank_1.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cff0d1d63929dc8f20aafe1f14c0410f20b9ef98ef4841806380e91312d2796e
|
| 3 |
+
size 1543740471
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/optim_world_size_8_rank_2.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7ce51f2acb5908e187cb9342fb7612e54d996cf11cbbd94937b6545d0aeeb16e
|
| 3 |
+
size 1543740471
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/optim_world_size_8_rank_3.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:02df2752412802ead3fa2eeb9436b02fe8b32b9d100066eb61a8a00a32fd44de
|
| 3 |
+
size 1543740471
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/optim_world_size_8_rank_4.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:33f2d045efff8c528491845ce3c40a21afb4f37c8bd9bae332d6e5316de6aef7
|
| 3 |
+
size 1543740471
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/optim_world_size_8_rank_5.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4760044625a2fa864d90722547c510ec1c8f0a47e2800e685170ce5215c8efb6
|
| 3 |
+
size 1543740471
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/optim_world_size_8_rank_6.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:150bb7688404b1d023b2d9f6df34fdf2c9f6e34d60264ab27a8aeccbe985ccf9
|
| 3 |
+
size 1543740471
|
qwen-1.5B-skywork-1.5B/global_step_250/actor/optim_world_size_8_rank_7.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:282cfac72cb0fe0a2f0fc5dc376f4e0b9e082cc9b060147f659033621e18d7ba
|
| 3 |
+
size 1543740471
|
qwen-1.5B-skywork-1.5B/global_step_250/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ee1ede7d9a5c1ec80a624389640464fbaf09b5ff3e1fe0ccae18de3106cd7d34
|
| 3 |
+
size 1108
|
qwen-7B-skywork-7B/global_step_190/actor/extra_state_world_size_8_rank_0.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d5532ae8bcf60338fa48809bde2b25f5e097c8930b56a5df0a92b9b362ee5361
|
| 3 |
+
size 14632
|
qwen-7B-skywork-7B/global_step_190/actor/extra_state_world_size_8_rank_1.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:28839eb8bbb96daf1b0ef61478b6556ba5b95f6f9bedc1df509b2dcb4128b7ce
|
| 3 |
+
size 14632
|
qwen-7B-skywork-7B/global_step_190/actor/extra_state_world_size_8_rank_2.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9d71ac2bdaa621d71921e6922b8c6007383a48c7179088908c53c29295ec7cfb
|
| 3 |
+
size 14632
|
qwen-7B-skywork-7B/global_step_190/actor/extra_state_world_size_8_rank_3.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1bd4c57d929cc83366242648afa1e8961612d94e381d77b9661221d473d78dad
|
| 3 |
+
size 14632
|
qwen-7B-skywork-7B/global_step_190/actor/extra_state_world_size_8_rank_4.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:321d26d90106ed2c604a1e8a517bad3f389f4f86ace1120aebb7efed2b866e3b
|
| 3 |
+
size 14632
|
qwen-7B-skywork-7B/global_step_190/actor/extra_state_world_size_8_rank_5.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a0ce77fbccf93c741639bed6b70001641a1a428da738a607a12b91246dcf3dbb
|
| 3 |
+
size 14632
|
qwen-7B-skywork-7B/global_step_190/actor/extra_state_world_size_8_rank_6.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e05e5c826c3a1bfb5fa2d17bfbc45dad146e01b2d2cc2b729f668a1eb31d1eed
|
| 3 |
+
size 14632
|
qwen-7B-skywork-7B/global_step_190/actor/extra_state_world_size_8_rank_7.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:535aa8f389d3512238110c2bd7e6d13a48653f9423fd16a4c18300999ffc5969
|
| 3 |
+
size 14632
|
qwen-7B-skywork-7B/global_step_190/actor/hf_model/added_tokens.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b
|
| 3 |
+
size 605
|
qwen-7B-skywork-7B/global_step_190/actor/hf_model/config.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f153de7ab125306c10522b8f0470d8ed2c918c6ebaffe1cd06014a4be7cc9da9
|
| 3 |
+
size 1387
|
qwen-7B-skywork-7B/global_step_190/actor/hf_model/generation_config.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d7402413987500866d32be7f6136c9db6e85080e3b4de4e5eccc83dc4df2548d
|
| 3 |
+
size 121
|
qwen-7B-skywork-7B/global_step_190/actor/hf_model/merges.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
qwen-7B-skywork-7B/global_step_190/actor/hf_model/model-00001-of-00004.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e9d0b4ed3eb79e4c2012d7d6e1bc3da15c6ac970218893da731cac352c49299d
|
| 3 |
+
size 4888731480
|
qwen-7B-skywork-7B/global_step_190/actor/hf_model/model-00002-of-00004.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:19e954dac8058c183983208d24a4dcb2d8c9f23bf682e3669bdadfced1952f3f
|
| 3 |
+
size 4176767696
|
qwen-7B-skywork-7B/global_step_190/actor/hf_model/model-00003-of-00004.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b920a0e5d306f5c8be516ea1fd73503e10f5648ef38ff5c327510e3ab5b3d777
|
| 3 |
+
size 4877540192
|
qwen-7B-skywork-7B/global_step_190/actor/hf_model/model-00004-of-00004.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:20f3595cab4bfa3c0697ea48a5edd28d74894e49a6fc3e13008c074b58cf6fe5
|
| 3 |
+
size 1288232448
|