Jerry999 committed on
Commit
0346146
·
verified ·
1 Parent(s): 8b68ee6

Upload checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309

Browse files
Files changed (18) hide show
  1. .gitattributes +1 -0
  2. checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/chat_template.jinja +4 -0
  3. checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/config.json +71 -0
  4. checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/generation_config.json +12 -0
  5. checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/model.safetensors +3 -0
  6. checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/optimizer.pt +3 -0
  7. checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/rng_state.pth +3 -0
  8. checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/scheduler.pt +3 -0
  9. checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/tokenizer.json +3 -0
  10. checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/tokenizer_config.json +29 -0
  11. checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/tokens_state. +1 -0
  12. checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/trainer_state.json +0 -0
  13. checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/training_args.bin +3 -0
  14. checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/debug.log +0 -0
  15. checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/eval_results_easy_ops/balanced_test_alpaca_converted.jsonl +0 -0
  16. checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/eval_results_easy_ops/balanced_test_alpaca_results.jsonl +0 -0
  17. checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/eval_results_easy_ops/eval_results.csv +2 -0
  18. checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/eval_results_easy_ops/eval_summary.json +133 -0
.gitattributes CHANGED
@@ -72,3 +72,4 @@ checkpoints/math_operations/lora_sft_primitive_atomic_50k_t20260305/checkpoint-4
72
  checkpoints/math_operations/lora_sft_primitive_atomic_50k_t20260305/checkpoint-5150/tokenizer.json filter=lfs diff=lfs merge=lfs -text
73
  checkpoints/math_operations/primitive_atomic_full_sft_50k_lr1e4_t20260308/checkpoint-2082/tokenizer.json filter=lfs diff=lfs merge=lfs -text
74
  checkpoints/math_operations/primitive_atomic_full_sft_50k_lr1e4_t20260308/checkpoint-3123/tokenizer.json filter=lfs diff=lfs merge=lfs -text
 
 
72
  checkpoints/math_operations/lora_sft_primitive_atomic_50k_t20260305/checkpoint-5150/tokenizer.json filter=lfs diff=lfs merge=lfs -text
73
  checkpoints/math_operations/primitive_atomic_full_sft_50k_lr1e4_t20260308/checkpoint-2082/tokenizer.json filter=lfs diff=lfs merge=lfs -text
74
  checkpoints/math_operations/primitive_atomic_full_sft_50k_lr1e4_t20260308/checkpoint-3123/tokenizer.json filter=lfs diff=lfs merge=lfs -text
75
+ checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/tokenizer.json filter=lfs diff=lfs merge=lfs -text
checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/chat_template.jinja ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% for message in messages %}{{'<|im_start|>' + message['role'] + '
2
+ ' + message['content'] + '<|im_end|>' + '
3
+ '}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant
4
+ ' }}{% endif %}
checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/config.json ADDED
@@ -0,0 +1,71 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Qwen3ForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": null,
8
+ "dtype": "bfloat16",
9
+ "eos_token_id": 151645,
10
+ "head_dim": 128,
11
+ "hidden_act": "silu",
12
+ "hidden_size": 2560,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 9728,
15
+ "layer_types": [
16
+ "full_attention",
17
+ "full_attention",
18
+ "full_attention",
19
+ "full_attention",
20
+ "full_attention",
21
+ "full_attention",
22
+ "full_attention",
23
+ "full_attention",
24
+ "full_attention",
25
+ "full_attention",
26
+ "full_attention",
27
+ "full_attention",
28
+ "full_attention",
29
+ "full_attention",
30
+ "full_attention",
31
+ "full_attention",
32
+ "full_attention",
33
+ "full_attention",
34
+ "full_attention",
35
+ "full_attention",
36
+ "full_attention",
37
+ "full_attention",
38
+ "full_attention",
39
+ "full_attention",
40
+ "full_attention",
41
+ "full_attention",
42
+ "full_attention",
43
+ "full_attention",
44
+ "full_attention",
45
+ "full_attention",
46
+ "full_attention",
47
+ "full_attention",
48
+ "full_attention",
49
+ "full_attention",
50
+ "full_attention",
51
+ "full_attention"
52
+ ],
53
+ "max_position_embeddings": 262144,
54
+ "max_window_layers": 36,
55
+ "model_type": "qwen3",
56
+ "num_attention_heads": 32,
57
+ "num_hidden_layers": 36,
58
+ "num_key_value_heads": 8,
59
+ "pad_token_id": 151643,
60
+ "rms_norm_eps": 1e-06,
61
+ "rope_parameters": {
62
+ "rope_theta": 5000000,
63
+ "rope_type": "default"
64
+ },
65
+ "sliding_window": null,
66
+ "tie_word_embeddings": true,
67
+ "transformers_version": "5.0.0",
68
+ "use_cache": false,
69
+ "use_sliding_window": false,
70
+ "vocab_size": 151936
71
+ }
checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/generation_config.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_sample": true,
3
+ "eos_token_id": [
4
+ 151645,
5
+ 151643
6
+ ],
7
+ "pad_token_id": 151643,
8
+ "temperature": 0.7,
9
+ "top_k": 20,
10
+ "top_p": 0.8,
11
+ "transformers_version": "5.0.0"
12
+ }
checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:292d00bb09b3870f13e4d6c952cbf2bfa6917fe472738124a6ebb8df0796836c
3
+ size 8822894520
checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8780501c2f783665a77b85208cd3e759fe4f06e87bab00e2b7ca226cda4b40d1
3
+ size 16090225449
checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed3753ab7977739b8eda494dd72defae5750f7283141b11a8f562160ba4c1a23
3
+ size 14645
checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd5cdc84d2b4d9a932721799f114ebfcc55a4d590aebab27d5998a9f127ea471
3
+ size 1465
checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be75606093db2094d7cd20f3c2f385c212750648bd6ea4fb2bf507a6a4c55506
3
+ size 11422650
checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/tokenizer_config.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "backend": "tokenizers",
4
+ "bos_token": null,
5
+ "clean_up_tokenization_spaces": false,
6
+ "eos_token": "<|im_end|>",
7
+ "errors": "replace",
8
+ "extra_special_tokens": [
9
+ "<|im_start|>",
10
+ "<|im_end|>",
11
+ "<|object_ref_start|>",
12
+ "<|object_ref_end|>",
13
+ "<|box_start|>",
14
+ "<|box_end|>",
15
+ "<|quad_start|>",
16
+ "<|quad_end|>",
17
+ "<|vision_start|>",
18
+ "<|vision_end|>",
19
+ "<|vision_pad|>",
20
+ "<|image_pad|>",
21
+ "<|video_pad|>"
22
+ ],
23
+ "is_local": true,
24
+ "model_max_length": 1010000,
25
+ "pad_token": "<|endoftext|>",
26
+ "split_special_tokens": false,
27
+ "tokenizer_class": "Qwen2Tokenizer",
28
+ "unk_token": null
29
+ }
checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/tokens_state. ADDED
@@ -0,0 +1 @@
 
 
1
+ {"total": 51200000, "trainable": 5590610}
checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/trainer_state.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/checkpoint-3125/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f19357fe7faa7293775d9e7faee6aabb3fe0214ae428e3c5d4fa8ace13d4ef3
3
+ size 7185
checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/debug.log ADDED
The diff for this file is too large to render. See raw diff
 
checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/eval_results_easy_ops/balanced_test_alpaca_converted.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/eval_results_easy_ops/balanced_test_alpaca_results.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/eval_results_easy_ops/eval_results.csv ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ category,filename,total,correct,accuracy,format_found,format_accuracy,errors_count
2
+ math_operations,balanced_test_alpaca_results,500,4,0.80,500,100.00,496
checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/eval_results_easy_ops/eval_summary.json ADDED
@@ -0,0 +1,133 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "overall": {
3
+ "total": 500,
4
+ "correct": 4,
5
+ "accuracy": 0.8,
6
+ "format_found": 500,
7
+ "format_accuracy": 100.0
8
+ },
9
+ "per_operation": {
10
+ "a": {
11
+ "total": 25,
12
+ "correct": 0,
13
+ "accuracy": 0.0,
14
+ "format_found": 25
15
+ },
16
+ "b": {
17
+ "total": 25,
18
+ "correct": 0,
19
+ "accuracy": 0.0,
20
+ "format_found": 25
21
+ },
22
+ "c": {
23
+ "total": 25,
24
+ "correct": 1,
25
+ "accuracy": 4.0,
26
+ "format_found": 25
27
+ },
28
+ "d": {
29
+ "total": 25,
30
+ "correct": 0,
31
+ "accuracy": 0.0,
32
+ "format_found": 25
33
+ },
34
+ "e": {
35
+ "total": 25,
36
+ "correct": 0,
37
+ "accuracy": 0.0,
38
+ "format_found": 25
39
+ },
40
+ "f": {
41
+ "total": 25,
42
+ "correct": 0,
43
+ "accuracy": 0.0,
44
+ "format_found": 25
45
+ },
46
+ "g": {
47
+ "total": 25,
48
+ "correct": 0,
49
+ "accuracy": 0.0,
50
+ "format_found": 25
51
+ },
52
+ "h": {
53
+ "total": 25,
54
+ "correct": 0,
55
+ "accuracy": 0.0,
56
+ "format_found": 25
57
+ },
58
+ "i": {
59
+ "total": 25,
60
+ "correct": 0,
61
+ "accuracy": 0.0,
62
+ "format_found": 25
63
+ },
64
+ "j": {
65
+ "total": 25,
66
+ "correct": 0,
67
+ "accuracy": 0.0,
68
+ "format_found": 25
69
+ },
70
+ "k": {
71
+ "total": 25,
72
+ "correct": 0,
73
+ "accuracy": 0.0,
74
+ "format_found": 25
75
+ },
76
+ "l": {
77
+ "total": 25,
78
+ "correct": 0,
79
+ "accuracy": 0.0,
80
+ "format_found": 25
81
+ },
82
+ "m": {
83
+ "total": 25,
84
+ "correct": 0,
85
+ "accuracy": 0.0,
86
+ "format_found": 25
87
+ },
88
+ "n": {
89
+ "total": 25,
90
+ "correct": 1,
91
+ "accuracy": 4.0,
92
+ "format_found": 25
93
+ },
94
+ "o": {
95
+ "total": 25,
96
+ "correct": 0,
97
+ "accuracy": 0.0,
98
+ "format_found": 25
99
+ },
100
+ "p": {
101
+ "total": 25,
102
+ "correct": 0,
103
+ "accuracy": 0.0,
104
+ "format_found": 25
105
+ },
106
+ "q": {
107
+ "total": 25,
108
+ "correct": 0,
109
+ "accuracy": 0.0,
110
+ "format_found": 25
111
+ },
112
+ "r": {
113
+ "total": 25,
114
+ "correct": 0,
115
+ "accuracy": 0.0,
116
+ "format_found": 25
117
+ },
118
+ "s": {
119
+ "total": 25,
120
+ "correct": 0,
121
+ "accuracy": 0.0,
122
+ "format_found": 25
123
+ },
124
+ "t": {
125
+ "total": 25,
126
+ "correct": 2,
127
+ "accuracy": 8.0,
128
+ "format_found": 25
129
+ }
130
+ },
131
+ "n_errors": 496,
132
+ "results_file": "/home/jiaruil5/math_rl/mix_teachers/r3lit_rl/mix_teachers/checkpoints/math_operations/primitive_atomic_full_sft_then_2step_compositional_full_sft_t20260309/eval_results_easy_ops/balanced_test_alpaca_results.jsonl"
133
+ }