Training in progress, step 50
Browse files
- README.md +4 -4
- adapter_config.json +1 -1
- adapter_model.safetensors +1 -1
- processor_config.json +1 -4
- training_args.bin +1 -1
README.md
CHANGED
|
@@ -4,8 +4,8 @@ library_name: transformers
|
|
| 4 |
model_name: number
|
| 5 |
tags:
|
| 6 |
- generated_from_trainer
|
| 7 |
-
- sft
|
| 8 |
- trl
|
|
|
|
| 9 |
licence: license
|
| 10 |
---
|
| 11 |
|
|
@@ -27,7 +27,7 @@ print(output["generated_text"])
|
|
| 27 |
|
| 28 |
## Training procedure
|
| 29 |
|
| 30 |
-
|
| 31 |
|
| 32 |
|
| 33 |
|
|
@@ -35,8 +35,8 @@ This model was trained with SFT.
|
|
| 35 |
|
| 36 |
### Framework versions
|
| 37 |
|
| 38 |
-
- TRL: 0.29.
|
| 39 |
-
- Transformers: 5.
|
| 40 |
- Pytorch: 2.10.0+cu128
|
| 41 |
- Datasets: 4.0.0
|
| 42 |
- Tokenizers: 0.22.2
|
|
|
|
| 4 |
model_name: number
|
| 5 |
tags:
|
| 6 |
- generated_from_trainer
|
|
|
|
| 7 |
- trl
|
| 8 |
+
- sft
|
| 9 |
licence: license
|
| 10 |
---
|
| 11 |
|
|
|
|
| 27 |
|
| 28 |
## Training procedure
|
| 29 |
|
| 30 |
+
|
| 31 |
|
| 32 |
|
| 33 |
|
|
|
|
| 35 |
|
| 36 |
### Framework versions
|
| 37 |
|
| 38 |
+
- TRL: 0.29.1
|
| 39 |
+
- Transformers: 5.4.0
|
| 40 |
- Pytorch: 2.10.0+cu128
|
| 41 |
- Datasets: 4.0.0
|
| 42 |
- Tokenizers: 0.22.2
|
adapter_config.json
CHANGED
|
@@ -29,8 +29,8 @@
|
|
| 29 |
"rank_pattern": {},
|
| 30 |
"revision": null,
|
| 31 |
"target_modules": [
|
| 32 |
-
"q_proj",
|
| 33 |
"v_proj",
|
|
|
|
| 34 |
"o_proj"
|
| 35 |
],
|
| 36 |
"target_parameters": null,
|
|
|
|
| 29 |
"rank_pattern": {},
|
| 30 |
"revision": null,
|
| 31 |
"target_modules": [
|
|
|
|
| 32 |
"v_proj",
|
| 33 |
+
"q_proj",
|
| 34 |
"o_proj"
|
| 35 |
],
|
| 36 |
"target_parameters": null,
|
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5071040
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5aa82cf9717696a08251b642e581761d9bb0c73b0d3db1320b88a4fe30ee4f7a
|
| 3 |
size 5071040
|
processor_config.json
CHANGED
|
@@ -1,6 +1,5 @@
|
|
| 1 |
{
|
| 2 |
"image_processor": {
|
| 3 |
-
"data_format": "channels_first",
|
| 4 |
"do_convert_rgb": true,
|
| 5 |
"do_normalize": true,
|
| 6 |
"do_rescale": true,
|
|
@@ -10,7 +9,7 @@
|
|
| 10 |
0.5,
|
| 11 |
0.5
|
| 12 |
],
|
| 13 |
-
"image_processor_type": "
|
| 14 |
"image_std": [
|
| 15 |
0.5,
|
| 16 |
0.5,
|
|
@@ -28,8 +27,6 @@
|
|
| 28 |
},
|
| 29 |
"processor_class": "Qwen3VLProcessor",
|
| 30 |
"video_processor": {
|
| 31 |
-
"data_format": "channels_first",
|
| 32 |
-
"default_to_square": true,
|
| 33 |
"do_convert_rgb": true,
|
| 34 |
"do_normalize": true,
|
| 35 |
"do_rescale": true,
|
|
|
|
| 1 |
{
|
| 2 |
"image_processor": {
|
|
|
|
| 3 |
"do_convert_rgb": true,
|
| 4 |
"do_normalize": true,
|
| 5 |
"do_rescale": true,
|
|
|
|
| 9 |
0.5,
|
| 10 |
0.5
|
| 11 |
],
|
| 12 |
+
"image_processor_type": "Qwen2VLImageProcessor",
|
| 13 |
"image_std": [
|
| 14 |
0.5,
|
| 15 |
0.5,
|
|
|
|
| 27 |
},
|
| 28 |
"processor_class": "Qwen3VLProcessor",
|
| 29 |
"video_processor": {
|
|
|
|
|
|
|
| 30 |
"do_convert_rgb": true,
|
| 31 |
"do_normalize": true,
|
| 32 |
"do_rescale": true,
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5649
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1f9255623a6f7f550f0efc0716d29ab04e883c72e25f798bc07edaff9eb82b8a
|
| 3 |
size 5649
|