sreenathsree1578 committed on
Commit
c3351cc
·
verified ·
1 Parent(s): 3400653

Delete checkpoint-420

Browse files
checkpoint-420/config.json DELETED
@@ -1,38 +0,0 @@
1
- {
2
- "architectures": [
3
- "RobertaForSequenceClassification"
4
- ],
5
- "attention_probs_dropout_prob": 0.1,
6
- "bos_token_id": 0,
7
- "classifier_dropout": null,
8
- "dtype": "float32",
9
- "eos_token_id": 2,
10
- "gradient_checkpointing": false,
11
- "hidden_act": "gelu",
12
- "hidden_dropout_prob": 0.1,
13
- "hidden_size": 768,
14
- "id2label": {
15
- "0": "negative",
16
- "1": "neutral",
17
- "2": "positive"
18
- },
19
- "initializer_range": 0.02,
20
- "intermediate_size": 3072,
21
- "label2id": {
22
- "negative": 0,
23
- "neutral": 1,
24
- "positive": 2
25
- },
26
- "layer_norm_eps": 1e-05,
27
- "max_position_embeddings": 514,
28
- "model_type": "roberta",
29
- "num_attention_heads": 12,
30
- "num_hidden_layers": 12,
31
- "pad_token_id": 1,
32
- "position_embedding_type": "absolute",
33
- "problem_type": "single_label_classification",
34
- "transformers_version": "4.57.3",
35
- "type_vocab_size": 1,
36
- "use_cache": true,
37
- "vocab_size": 50265
38
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-420/merges.txt DELETED
The diff for this file is too large to render. See raw diff
 
checkpoint-420/model.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:e6da9ce0bfcb6094cfd8ba360092741512ab034ae071d2f38acb8a05033b03b8
3
- size 498615900
 
 
 
 
checkpoint-420/optimizer.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:f3bfb7bbc7ada6aead86c4e9fd749d152867a3bea6e4d1009626b5c162871ee3
3
- size 997354891
 
 
 
 
checkpoint-420/rng_state.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:a88f713e170b605de3f07d6335a7aebf0563448c4205da1f174ad7488145d5f6
3
- size 14645
 
 
 
 
checkpoint-420/scaler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:a0d081670a3595ef1d8bda2d0593865c2e4f927204e0ce17c8a124e63314dd6d
3
- size 1383
 
 
 
 
checkpoint-420/scheduler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:779cf509249b6a7144c85ba8b6511ff2eac89a925012de054cb032c63e161910
3
- size 1465
 
 
 
 
checkpoint-420/special_tokens_map.json DELETED
@@ -1,51 +0,0 @@
1
- {
2
- "bos_token": {
3
- "content": "<s>",
4
- "lstrip": false,
5
- "normalized": true,
6
- "rstrip": false,
7
- "single_word": false
8
- },
9
- "cls_token": {
10
- "content": "<s>",
11
- "lstrip": false,
12
- "normalized": true,
13
- "rstrip": false,
14
- "single_word": false
15
- },
16
- "eos_token": {
17
- "content": "</s>",
18
- "lstrip": false,
19
- "normalized": true,
20
- "rstrip": false,
21
- "single_word": false
22
- },
23
- "mask_token": {
24
- "content": "<mask>",
25
- "lstrip": true,
26
- "normalized": false,
27
- "rstrip": false,
28
- "single_word": false
29
- },
30
- "pad_token": {
31
- "content": "<pad>",
32
- "lstrip": false,
33
- "normalized": true,
34
- "rstrip": false,
35
- "single_word": false
36
- },
37
- "sep_token": {
38
- "content": "</s>",
39
- "lstrip": false,
40
- "normalized": true,
41
- "rstrip": false,
42
- "single_word": false
43
- },
44
- "unk_token": {
45
- "content": "<unk>",
46
- "lstrip": false,
47
- "normalized": true,
48
- "rstrip": false,
49
- "single_word": false
50
- }
51
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-420/tokenizer.json DELETED
The diff for this file is too large to render. See raw diff
 
checkpoint-420/tokenizer_config.json DELETED
@@ -1,58 +0,0 @@
1
- {
2
- "add_prefix_space": false,
3
- "added_tokens_decoder": {
4
- "0": {
5
- "content": "<s>",
6
- "lstrip": false,
7
- "normalized": true,
8
- "rstrip": false,
9
- "single_word": false,
10
- "special": true
11
- },
12
- "1": {
13
- "content": "<pad>",
14
- "lstrip": false,
15
- "normalized": true,
16
- "rstrip": false,
17
- "single_word": false,
18
- "special": true
19
- },
20
- "2": {
21
- "content": "</s>",
22
- "lstrip": false,
23
- "normalized": true,
24
- "rstrip": false,
25
- "single_word": false,
26
- "special": true
27
- },
28
- "3": {
29
- "content": "<unk>",
30
- "lstrip": false,
31
- "normalized": true,
32
- "rstrip": false,
33
- "single_word": false,
34
- "special": true
35
- },
36
- "50264": {
37
- "content": "<mask>",
38
- "lstrip": true,
39
- "normalized": false,
40
- "rstrip": false,
41
- "single_word": false,
42
- "special": true
43
- }
44
- },
45
- "bos_token": "<s>",
46
- "clean_up_tokenization_spaces": false,
47
- "cls_token": "<s>",
48
- "eos_token": "</s>",
49
- "errors": "replace",
50
- "extra_special_tokens": {},
51
- "mask_token": "<mask>",
52
- "model_max_length": 1000000000000000019884624838656,
53
- "pad_token": "<pad>",
54
- "sep_token": "</s>",
55
- "tokenizer_class": "RobertaTokenizer",
56
- "trim_offsets": true,
57
- "unk_token": "<unk>"
58
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-420/trainer_state.json DELETED
@@ -1,117 +0,0 @@
1
- {
2
- "best_global_step": 420,
3
- "best_metric": 0.9964285714285714,
4
- "best_model_checkpoint": "/content/fine_tuned_eq_model/checkpoint-420",
5
- "epoch": 3.0,
6
- "eval_steps": 500,
7
- "global_step": 420,
8
- "is_hyper_param_search": false,
9
- "is_local_process_zero": true,
10
- "is_world_process_zero": true,
11
- "log_history": [
12
- {
13
- "epoch": 0.35714285714285715,
14
- "grad_norm": 0.0005774371675215662,
15
- "learning_rate": 1.7666666666666668e-05,
16
- "loss": 0.0003,
17
- "step": 50
18
- },
19
- {
20
- "epoch": 0.7142857142857143,
21
- "grad_norm": 0.003052965272217989,
22
- "learning_rate": 1.5285714285714286e-05,
23
- "loss": 0.0429,
24
- "step": 100
25
- },
26
- {
27
- "epoch": 1.0,
28
- "eval_accuracy": 0.9946428571428572,
29
- "eval_loss": 0.05661650374531746,
30
- "eval_runtime": 1.1506,
31
- "eval_samples_per_second": 486.685,
32
- "eval_steps_per_second": 30.418,
33
- "step": 140
34
- },
35
- {
36
- "epoch": 1.0714285714285714,
37
- "grad_norm": 0.0009856473188847303,
38
- "learning_rate": 1.2904761904761907e-05,
39
- "loss": 0.0182,
40
- "step": 150
41
- },
42
- {
43
- "epoch": 1.4285714285714286,
44
- "grad_norm": 0.0010016919113695621,
45
- "learning_rate": 1.0523809523809525e-05,
46
- "loss": 0.0045,
47
- "step": 200
48
- },
49
- {
50
- "epoch": 1.7857142857142856,
51
- "grad_norm": 0.0010772283421829343,
52
- "learning_rate": 8.142857142857143e-06,
53
- "loss": 0.0002,
54
- "step": 250
55
- },
56
- {
57
- "epoch": 2.0,
58
- "eval_accuracy": 0.9946428571428572,
59
- "eval_loss": 0.057632118463516235,
60
- "eval_runtime": 1.1024,
61
- "eval_samples_per_second": 507.962,
62
- "eval_steps_per_second": 31.748,
63
- "step": 280
64
- },
65
- {
66
- "epoch": 2.142857142857143,
67
- "grad_norm": 0.016079673543572426,
68
- "learning_rate": 5.761904761904762e-06,
69
- "loss": 0.0032,
70
- "step": 300
71
- },
72
- {
73
- "epoch": 2.5,
74
- "grad_norm": 0.0009342965204268694,
75
- "learning_rate": 3.3809523809523814e-06,
76
- "loss": 0.0001,
77
- "step": 350
78
- },
79
- {
80
- "epoch": 2.857142857142857,
81
- "grad_norm": 0.0011493319179862738,
82
- "learning_rate": 1.0000000000000002e-06,
83
- "loss": 0.0016,
84
- "step": 400
85
- },
86
- {
87
- "epoch": 3.0,
88
- "eval_accuracy": 0.9964285714285714,
89
- "eval_loss": 0.040300153195858,
90
- "eval_runtime": 1.1154,
91
- "eval_samples_per_second": 502.056,
92
- "eval_steps_per_second": 31.379,
93
- "step": 420
94
- }
95
- ],
96
- "logging_steps": 50,
97
- "max_steps": 420,
98
- "num_input_tokens_seen": 0,
99
- "num_train_epochs": 3,
100
- "save_steps": 500,
101
- "stateful_callbacks": {
102
- "TrainerControl": {
103
- "args": {
104
- "should_epoch_stop": false,
105
- "should_evaluate": false,
106
- "should_log": false,
107
- "should_save": true,
108
- "should_training_stop": true
109
- },
110
- "attributes": {}
111
- }
112
- },
113
- "total_flos": 441241201529856.0,
114
- "train_batch_size": 16,
115
- "trial_name": null,
116
- "trial_params": null
117
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-420/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:51571e96933e76889f48a34720768090b72cb2a7ccc8b89aa2c33188cb83f712
3
- size 5841
 
 
 
 
checkpoint-420/vocab.json DELETED
The diff for this file is too large to render. See raw diff