ferxalb committed on
Commit
f59a9ee
·
verified ·
1 Parent(s): 1f09741

Upload matex-privacy-sentinel-v0.1 trained on Modal L40S

Browse files
Files changed (2) hide show
  1. finetune_summary.json +88 -88
  2. model.safetensors +1 -1
finetune_summary.json CHANGED
@@ -6,131 +6,131 @@
6
  },
7
  "base_checkpoint": "/root/.opf/privacy_filter",
8
  "batch_size": 4,
9
- "best_epoch": 3,
10
- "best_metric": 0.341848680201349,
11
  "best_metric_name": "validation_loss",
12
  "checkpoint_category_version": "v2",
13
  "device": "cuda",
14
- "elapsed_s": 1202.3356187059999,
15
  "encoding": "o200k_base",
16
  "epoch_metrics": [
17
  {
18
- "elapsed_s": 156.62828432,
19
  "epoch": 1,
20
- "optimizer_steps": 2250,
21
- "train_batches": 2250,
22
- "train_loss": 0.7579528993816216,
23
- "train_token_accuracy": 0.8079268596096835,
24
- "train_tokens": 904343,
25
- "validation_batches": 125,
26
- "validation_loss": 0.5067812929464072,
27
- "validation_token_accuracy": 0.867818841446398,
28
- "validation_tokens": 50166
29
  },
30
  {
31
- "elapsed_s": 152.96221749900002,
32
  "epoch": 2,
33
- "optimizer_steps": 2250,
34
- "train_batches": 2250,
35
- "train_loss": 0.38092665674540604,
36
- "train_token_accuracy": 0.9006980758406932,
37
- "train_tokens": 904343,
38
- "validation_batches": 125,
39
- "validation_loss": 0.38360365174622296,
40
- "validation_token_accuracy": 0.9019056731650918,
41
- "validation_tokens": 50166
42
  },
43
  {
44
- "elapsed_s": 151.324623019,
45
  "epoch": 3,
46
- "optimizer_steps": 2250,
47
- "train_batches": 2250,
48
- "train_loss": 0.2702202035309268,
49
- "train_token_accuracy": 0.9303217916210995,
50
- "train_tokens": 904343,
51
- "validation_batches": 125,
52
- "validation_loss": 0.341848680201349,
53
- "validation_token_accuracy": 0.9153610014751027,
54
- "validation_tokens": 50166
55
  },
56
  {
57
- "elapsed_s": 146.090914769,
58
  "epoch": 4,
59
- "optimizer_steps": 2250,
60
- "train_batches": 2250,
61
- "train_loss": 0.20918852428017598,
62
- "train_token_accuracy": 0.9461697608097812,
63
- "train_tokens": 904343,
64
- "validation_batches": 125,
65
- "validation_loss": 0.34960059886833394,
66
- "validation_token_accuracy": 0.9198660447314915,
67
- "validation_tokens": 50166
68
  },
69
  {
70
- "elapsed_s": 147.21897273000002,
71
  "epoch": 5,
72
- "optimizer_steps": 2250,
73
- "train_batches": 2250,
74
- "train_loss": 0.17146903831328053,
75
- "train_token_accuracy": 0.9572429929794337,
76
- "train_tokens": 904343,
77
- "validation_batches": 125,
78
- "validation_loss": 0.3568825089484372,
79
- "validation_token_accuracy": 0.9235737351991389,
80
- "validation_tokens": 50166
81
  },
82
  {
83
- "elapsed_s": 147.21631511600003,
84
  "epoch": 6,
85
- "optimizer_steps": 2250,
86
- "train_batches": 2250,
87
- "train_loss": 0.1385621205590411,
88
- "train_token_accuracy": 0.96554294111858,
89
- "train_tokens": 904343,
90
- "validation_batches": 125,
91
- "validation_loss": 0.3496786308457096,
92
- "validation_token_accuracy": 0.9281385799146833,
93
- "validation_tokens": 50166
94
  },
95
  {
96
- "elapsed_s": 147.04402772600008,
97
  "epoch": 7,
98
- "optimizer_steps": 2250,
99
- "train_batches": 2250,
100
- "train_loss": 0.1159271389398995,
101
- "train_token_accuracy": 0.9721267262532026,
102
- "train_tokens": 904343,
103
- "validation_batches": 125,
104
- "validation_loss": 0.39336468872144575,
105
- "validation_token_accuracy": 0.9263844037794522,
106
- "validation_tokens": 50166
107
  },
108
  {
109
- "elapsed_s": 147.08385474300007,
110
  "epoch": 8,
111
- "optimizer_steps": 2250,
112
- "train_batches": 2250,
113
- "train_loss": 0.094867783832476,
114
- "train_token_accuracy": 0.9776732943142149,
115
- "train_tokens": 904343,
116
- "validation_batches": 125,
117
- "validation_loss": 0.41877376376543324,
118
- "validation_token_accuracy": 0.9266236096160746,
119
- "validation_tokens": 50166
120
  }
121
  ],
122
  "epochs": 8,
123
- "generated_at_unix": 1777714940.5670223,
124
  "grad_accum_steps": 1,
125
  "label_space_json_path": "/__modal/volumes/vo-1GyZvIAPD7wnYD3s0C2QXS/dataset/configs/custom_label_space.json",
126
  "label_space_source": "label-space-json",
127
  "learning_rate": 1e-05,
128
  "max_grad_norm": 1.0,
129
  "num_output_labels": 97,
130
- "num_train_examples": 9000,
131
- "num_train_windows": 9000,
132
- "num_validation_examples": 500,
133
- "num_validation_windows": 500,
134
  "output_checkpoint_dir": "/__modal/volumes/vo-XIgHS4JYPE8ddRlAcjQTwm/matex-privacy-sentinel-v0.1",
135
  "output_head_reinitialized": true,
136
  "output_head_rows_copied": 97,
 
6
  },
7
  "base_checkpoint": "/root/.opf/privacy_filter",
8
  "batch_size": 4,
9
+ "best_epoch": 4,
10
+ "best_metric": 0.22034703597205768,
11
  "best_metric_name": "validation_loss",
12
  "checkpoint_category_version": "v2",
13
  "device": "cuda",
14
+ "elapsed_s": 1707.967649188,
15
  "encoding": "o200k_base",
16
  "epoch_metrics": [
17
  {
18
+ "elapsed_s": 217.39479903,
19
  "epoch": 1,
20
+ "optimizer_steps": 3038,
21
+ "train_batches": 3038,
22
+ "train_loss": 0.6062319690959177,
23
+ "train_token_accuracy": 0.8512172545619088,
24
+ "train_tokens": 1453065,
25
+ "validation_batches": 169,
26
+ "validation_loss": 0.2926192293667525,
27
+ "validation_token_accuracy": 0.9352956475523843,
28
+ "validation_tokens": 88433
29
  },
30
  {
31
+ "elapsed_s": 213.544190871,
32
  "epoch": 2,
33
+ "optimizer_steps": 3038,
34
+ "train_batches": 3038,
35
+ "train_loss": 0.2367756585074477,
36
+ "train_token_accuracy": 0.9442185999938062,
37
+ "train_tokens": 1453065,
38
+ "validation_batches": 169,
39
+ "validation_loss": 0.23744411616401195,
40
+ "validation_token_accuracy": 0.9441950403130053,
41
+ "validation_tokens": 88433
42
  },
43
  {
44
+ "elapsed_s": 213.38700962000001,
45
  "epoch": 3,
46
+ "optimizer_steps": 3038,
47
+ "train_batches": 3038,
48
+ "train_loss": 0.17531355934431897,
49
+ "train_token_accuracy": 0.9586143771957896,
50
+ "train_tokens": 1453065,
51
+ "validation_batches": 169,
52
+ "validation_loss": 0.2293024442145412,
53
+ "validation_token_accuracy": 0.9511494577815973,
54
+ "validation_tokens": 88433
55
  },
56
  {
57
+ "elapsed_s": 213.449483773,
58
  "epoch": 4,
59
+ "optimizer_steps": 3038,
60
+ "train_batches": 3038,
61
+ "train_loss": 0.13766411499792147,
62
+ "train_token_accuracy": 0.9675279495411423,
63
+ "train_tokens": 1453065,
64
+ "validation_batches": 169,
65
+ "validation_loss": 0.22034703597205768,
66
+ "validation_token_accuracy": 0.9541008447072925,
67
+ "validation_tokens": 88433
68
  },
69
  {
70
+ "elapsed_s": 211.39228578199993,
71
  "epoch": 5,
72
+ "optimizer_steps": 3038,
73
+ "train_batches": 3038,
74
+ "train_loss": 0.10729076129519516,
75
+ "train_token_accuracy": 0.9746652765017394,
76
+ "train_tokens": 1453065,
77
+ "validation_batches": 169,
78
+ "validation_loss": 0.23614277132286401,
79
+ "validation_token_accuracy": 0.9555256521886626,
80
+ "validation_tokens": 88433
81
  },
82
  {
83
+ "elapsed_s": 211.30701109300003,
84
  "epoch": 6,
85
+ "optimizer_steps": 3038,
86
+ "train_batches": 3038,
87
+ "train_loss": 0.08785577328875824,
88
+ "train_token_accuracy": 0.9804427193552938,
89
+ "train_tokens": 1453065,
90
+ "validation_batches": 169,
91
+ "validation_loss": 0.27111270338299504,
92
+ "validation_token_accuracy": 0.9552881842751009,
93
+ "validation_tokens": 88433
94
  },
95
  {
96
+ "elapsed_s": 211.223892794,
97
  "epoch": 7,
98
+ "optimizer_steps": 3038,
99
+ "train_batches": 3038,
100
+ "train_loss": 0.07146611258642582,
101
+ "train_token_accuracy": 0.9836793261141105,
102
+ "train_tokens": 1453065,
103
+ "validation_batches": 169,
104
+ "validation_loss": 0.27473266072740865,
105
+ "validation_token_accuracy": 0.9579116393201633,
106
+ "validation_tokens": 88433
107
  },
108
  {
109
+ "elapsed_s": 209.94307118100005,
110
  "epoch": 8,
111
+ "optimizer_steps": 3038,
112
+ "train_batches": 3038,
113
+ "train_loss": 0.05768033069594669,
114
+ "train_token_accuracy": 0.9867569585668914,
115
+ "train_tokens": 1453065,
116
+ "validation_batches": 169,
117
+ "validation_loss": 0.30543249755483665,
118
+ "validation_token_accuracy": 0.9566903757647032,
119
+ "validation_tokens": 88433
120
  }
121
  ],
122
  "epochs": 8,
123
+ "generated_at_unix": 1777747058.003828,
124
  "grad_accum_steps": 1,
125
  "label_space_json_path": "/__modal/volumes/vo-1GyZvIAPD7wnYD3s0C2QXS/dataset/configs/custom_label_space.json",
126
  "label_space_source": "label-space-json",
127
  "learning_rate": 1e-05,
128
  "max_grad_norm": 1.0,
129
  "num_output_labels": 97,
130
+ "num_train_examples": 12150,
131
+ "num_train_windows": 12150,
132
+ "num_validation_examples": 675,
133
+ "num_validation_windows": 675,
134
  "output_checkpoint_dir": "/__modal/volumes/vo-XIgHS4JYPE8ddRlAcjQTwm/matex-privacy-sentinel-v0.1",
135
  "output_head_reinitialized": true,
136
  "output_head_rows_copied": 97,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fa888ac79911de3b1b25a09a157d5f9b642a1b7cbb730c1e45dca413f302361c
3
  size 2799065896
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8005133a9d82548fced788b3716a41284eedde86fb701a767be52c41e5453013
3
  size 2799065896