Ian-Khalzov commited on
Commit
328c7b9
·
verified ·
1 Parent(s): ad0d092

Upload final model artifacts

Browse files
README.md ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ language:
3
+ - en
4
+ library_name: transformers
5
+ license: mit
6
+ pipeline_tag: text-classification
7
+ tags:
8
+ - arxiv
9
+ - scientific-text-classification
10
+ - scibert
11
+ - streamlit-demo
12
+ datasets:
13
+ - librarian-bots/arxiv-metadata-snapshot
14
+ metrics:
15
+ - accuracy
16
+ - f1
17
+ ---
18
+
19
+ # Article Topic Service SciBERT
20
+
21
+ SciBERT text classifier for scientific article topic prediction from article title and abstract.
22
+
23
+ ## Labels
24
+
25
+ - Artificial Intelligence
26
+ - Natural Language Processing
27
+ - Computer Vision
28
+ - Machine Learning
29
+ - Computer Science Theory and Algorithms
30
+ - Mathematics
31
+ - Statistics
32
+ - Electrical Engineering
33
+ - Astrophysics
34
+ - Condensed Matter Physics
35
+ - Quantum Physics
36
+ - Quantitative Biology
37
+
38
+ ## Dataset
39
+
40
+ Balanced 12-class subset built from `librarian-bots/arxiv-metadata-snapshot`.
41
+
42
+ - Train: 30,000 examples
43
+ - Validation: 3,600 examples
44
+ - Test: 3,600 examples
45
+
46
+ ## Metrics
47
+
48
+ - Validation accuracy: 0.8350
49
+ - Validation macro F1: 0.8351
50
+ - Test accuracy: 0.8356
51
+ - Test macro F1: 0.8351
52
+ - Title-only test accuracy: 0.7522
53
+ - Title-only test macro F1: 0.7495
54
+
55
+ ## Usage
56
+
57
+ ```python
58
+ from transformers import AutoModelForSequenceClassification, AutoTokenizer
59
+ import torch
60
+
61
+ model_id = "Ian-Khalzov/article-topic-service-scibert"
62
+ tokenizer = AutoTokenizer.from_pretrained(model_id)
63
+ model = AutoModelForSequenceClassification.from_pretrained(model_id)
64
+
65
+ text = "Title: Large language models for scientific document classification\n\nAbstract: We study..."
66
+ inputs = tokenizer(text, return_tensors="pt", truncation=True, max_length=256)
67
+ with torch.inference_mode():
68
+ probs = torch.softmax(model(**inputs).logits[0], dim=-1)
69
+
70
+ predicted_label = model.config.id2label[int(probs.argmax())]
71
+ print(predicted_label)
72
+ ```
73
+
74
+ ## Notes
75
+
76
+ The current baseline is strongest on physics-heavy classes and weakest on the broad `Machine Learning` category, where topical overlap with AI, NLP, CV, and Statistics remains high.
config.json ADDED
@@ -0,0 +1,56 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_cross_attention": false,
3
+ "architectures": [
4
+ "BertForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": null,
8
+ "classifier_dropout": null,
9
+ "dtype": "float32",
10
+ "eos_token_id": null,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "Artificial Intelligence",
16
+ "1": "Natural Language Processing",
17
+ "2": "Computer Vision",
18
+ "3": "Machine Learning",
19
+ "4": "Computer Science Theory and Algorithms",
20
+ "5": "Mathematics",
21
+ "6": "Statistics",
22
+ "7": "Electrical Engineering",
23
+ "8": "Astrophysics",
24
+ "9": "Condensed Matter Physics",
25
+ "10": "Quantum Physics",
26
+ "11": "Quantitative Biology"
27
+ },
28
+ "initializer_range": 0.02,
29
+ "intermediate_size": 3072,
30
+ "is_decoder": false,
31
+ "label2id": {
32
+ "Artificial Intelligence": 0,
33
+ "Astrophysics": 8,
34
+ "Computer Science Theory and Algorithms": 4,
35
+ "Computer Vision": 2,
36
+ "Condensed Matter Physics": 9,
37
+ "Electrical Engineering": 7,
38
+ "Machine Learning": 3,
39
+ "Mathematics": 5,
40
+ "Natural Language Processing": 1,
41
+ "Quantitative Biology": 11,
42
+ "Quantum Physics": 10,
43
+ "Statistics": 6
44
+ },
45
+ "layer_norm_eps": 1e-12,
46
+ "max_position_embeddings": 512,
47
+ "model_type": "bert",
48
+ "num_attention_heads": 12,
49
+ "num_hidden_layers": 12,
50
+ "pad_token_id": 0,
51
+ "tie_word_embeddings": true,
52
+ "transformers_version": "5.5.0",
53
+ "type_vocab_size": 2,
54
+ "use_cache": false,
55
+ "vocab_size": 31090
56
+ }
eval_run_config.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "prepared_at_utc": "2026-04-06T15:01:43.444774+00:00",
3
+ "model_name": "/home/yakh/ML/ML2/article_topic_service/artifacts/scibert_topics12_run1",
4
+ "max_length": 256,
5
+ "per_device_train_batch_size": 4,
6
+ "per_device_eval_batch_size": 8,
7
+ "gradient_accumulation_steps": 8,
8
+ "num_train_epochs": 12,
9
+ "learning_rate": 2e-05,
10
+ "weight_decay": 0.01,
11
+ "warmup_ratio": 0.1,
12
+ "label_smoothing_factor": 0.05,
13
+ "title_only_prob": 0.2,
14
+ "early_stopping_patience": 3,
15
+ "seed": 42,
16
+ "resume_from_checkpoint": null,
17
+ "use_bf16": true,
18
+ "use_fp16": false,
19
+ "taxonomy_profile": "topics12",
20
+ "num_labels": 12,
21
+ "label_order": [
22
+ "artificial_intelligence",
23
+ "natural_language_processing",
24
+ "computer_vision",
25
+ "machine_learning",
26
+ "computer_science_theory",
27
+ "mathematics",
28
+ "statistics",
29
+ "electrical_engineering",
30
+ "astrophysics",
31
+ "condensed_matter_physics",
32
+ "quantum_physics",
33
+ "quantitative_biology"
34
+ ]
35
+ }
metrics_summary.json ADDED
@@ -0,0 +1,561 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "train_runtime": {
3
+ "skipped_train": true
4
+ },
5
+ "eval_metrics": {
6
+ "train": {
7
+ "train_loss": 0.5018106698989868,
8
+ "train_model_preparation_time": 0.0013,
9
+ "train_accuracy": 0.9251333333333334,
10
+ "train_macro_f1": 0.9246237953755961,
11
+ "train_runtime": 90.3107,
12
+ "train_samples_per_second": 332.186,
13
+ "train_steps_per_second": 41.523,
14
+ "epoch": 0
15
+ },
16
+ "validation": {
17
+ "validation_loss": 0.709372878074646,
18
+ "validation_model_preparation_time": 0.0013,
19
+ "validation_accuracy": 0.835,
20
+ "validation_macro_f1": 0.8351179604209936,
21
+ "validation_runtime": 11.0597,
22
+ "validation_samples_per_second": 325.505,
23
+ "validation_steps_per_second": 40.688,
24
+ "epoch": 0
25
+ },
26
+ "test_full": {
27
+ "test_full_loss": 0.7299672365188599,
28
+ "test_full_model_preparation_time": 0.0013,
29
+ "test_full_accuracy": 0.8355555555555556,
30
+ "test_full_macro_f1": 0.835052453623228,
31
+ "test_full_runtime": 10.953,
32
+ "test_full_samples_per_second": 328.676,
33
+ "test_full_steps_per_second": 41.084,
34
+ "epoch": 0
35
+ },
36
+ "test_title_only": {
37
+ "test_title_only_loss": 1.0085811614990234,
38
+ "test_title_only_model_preparation_time": 0.0013,
39
+ "test_title_only_accuracy": 0.7522222222222222,
40
+ "test_title_only_macro_f1": 0.7495277786217475,
41
+ "test_title_only_runtime": 6.6335,
42
+ "test_title_only_samples_per_second": 542.697,
43
+ "test_title_only_steps_per_second": 67.837,
44
+ "epoch": 0
45
+ }
46
+ },
47
+ "test_full_classification_report": {
48
+ "Artificial Intelligence": {
49
+ "precision": 0.7289719626168224,
50
+ "recall": 0.78,
51
+ "f1-score": 0.7536231884057971,
52
+ "support": 300.0
53
+ },
54
+ "Natural Language Processing": {
55
+ "precision": 0.852760736196319,
56
+ "recall": 0.9266666666666666,
57
+ "f1-score": 0.8881789137380192,
58
+ "support": 300.0
59
+ },
60
+ "Computer Vision": {
61
+ "precision": 0.8379310344827586,
62
+ "recall": 0.81,
63
+ "f1-score": 0.823728813559322,
64
+ "support": 300.0
65
+ },
66
+ "Machine Learning": {
67
+ "precision": 0.6564885496183206,
68
+ "recall": 0.5733333333333334,
69
+ "f1-score": 0.6120996441281139,
70
+ "support": 300.0
71
+ },
72
+ "CS Theory and Algorithms": {
73
+ "precision": 0.8657718120805369,
74
+ "recall": 0.86,
75
+ "f1-score": 0.862876254180602,
76
+ "support": 300.0
77
+ },
78
+ "Mathematics": {
79
+ "precision": 0.9622641509433962,
80
+ "recall": 0.85,
81
+ "f1-score": 0.9026548672566371,
82
+ "support": 300.0
83
+ },
84
+ "Statistics": {
85
+ "precision": 0.7125748502994012,
86
+ "recall": 0.7933333333333333,
87
+ "f1-score": 0.750788643533123,
88
+ "support": 300.0
89
+ },
90
+ "Electrical Engineering": {
91
+ "precision": 0.7736486486486487,
92
+ "recall": 0.7633333333333333,
93
+ "f1-score": 0.7684563758389261,
94
+ "support": 300.0
95
+ },
96
+ "Astrophysics": {
97
+ "precision": 0.9966329966329966,
98
+ "recall": 0.9866666666666667,
99
+ "f1-score": 0.9916247906197655,
100
+ "support": 300.0
101
+ },
102
+ "Condensed Matter Physics": {
103
+ "precision": 0.916083916083916,
104
+ "recall": 0.8733333333333333,
105
+ "f1-score": 0.89419795221843,
106
+ "support": 300.0
107
+ },
108
+ "Quantum Physics": {
109
+ "precision": 0.8676923076923077,
110
+ "recall": 0.94,
111
+ "f1-score": 0.9024,
112
+ "support": 300.0
113
+ },
114
+ "Quantitative Biology": {
115
+ "precision": 0.87,
116
+ "recall": 0.87,
117
+ "f1-score": 0.87,
118
+ "support": 300.0
119
+ },
120
+ "accuracy": 0.8355555555555556,
121
+ "macro avg": {
122
+ "precision": 0.8367350804412852,
123
+ "recall": 0.8355555555555555,
124
+ "f1-score": 0.835052453623228,
125
+ "support": 3600.0
126
+ },
127
+ "weighted avg": {
128
+ "precision": 0.8367350804412854,
129
+ "recall": 0.8355555555555556,
130
+ "f1-score": 0.835052453623228,
131
+ "support": 3600.0
132
+ }
133
+ },
134
+ "test_full_confusion_matrix": [
135
+ [
136
+ 234,
137
+ 15,
138
+ 4,
139
+ 22,
140
+ 11,
141
+ 0,
142
+ 10,
143
+ 0,
144
+ 0,
145
+ 0,
146
+ 2,
147
+ 2
148
+ ],
149
+ [
150
+ 9,
151
+ 278,
152
+ 5,
153
+ 4,
154
+ 0,
155
+ 0,
156
+ 1,
157
+ 1,
158
+ 0,
159
+ 0,
160
+ 0,
161
+ 2
162
+ ],
163
+ [
164
+ 3,
165
+ 5,
166
+ 243,
167
+ 15,
168
+ 0,
169
+ 0,
170
+ 1,
171
+ 31,
172
+ 0,
173
+ 0,
174
+ 0,
175
+ 2
176
+ ],
177
+ [
178
+ 32,
179
+ 14,
180
+ 19,
181
+ 172,
182
+ 8,
183
+ 1,
184
+ 40,
185
+ 9,
186
+ 0,
187
+ 0,
188
+ 0,
189
+ 5
190
+ ],
191
+ [
192
+ 25,
193
+ 1,
194
+ 0,
195
+ 1,
196
+ 258,
197
+ 2,
198
+ 3,
199
+ 2,
200
+ 0,
201
+ 2,
202
+ 5,
203
+ 1
204
+ ],
205
+ [
206
+ 1,
207
+ 0,
208
+ 0,
209
+ 3,
210
+ 12,
211
+ 255,
212
+ 13,
213
+ 6,
214
+ 0,
215
+ 3,
216
+ 3,
217
+ 4
218
+ ],
219
+ [
220
+ 4,
221
+ 3,
222
+ 0,
223
+ 31,
224
+ 2,
225
+ 0,
226
+ 238,
227
+ 8,
228
+ 0,
229
+ 0,
230
+ 1,
231
+ 13
232
+ ],
233
+ [
234
+ 6,
235
+ 7,
236
+ 18,
237
+ 8,
238
+ 5,
239
+ 5,
240
+ 15,
241
+ 229,
242
+ 0,
243
+ 1,
244
+ 0,
245
+ 6
246
+ ],
247
+ [
248
+ 1,
249
+ 0,
250
+ 1,
251
+ 0,
252
+ 0,
253
+ 0,
254
+ 0,
255
+ 1,
256
+ 296,
257
+ 0,
258
+ 1,
259
+ 0
260
+ ],
261
+ [
262
+ 0,
263
+ 0,
264
+ 0,
265
+ 1,
266
+ 1,
267
+ 0,
268
+ 1,
269
+ 0,
270
+ 1,
271
+ 262,
272
+ 30,
273
+ 4
274
+ ],
275
+ [
276
+ 0,
277
+ 0,
278
+ 0,
279
+ 2,
280
+ 0,
281
+ 0,
282
+ 0,
283
+ 1,
284
+ 0,
285
+ 15,
286
+ 282,
287
+ 0
288
+ ],
289
+ [
290
+ 6,
291
+ 3,
292
+ 0,
293
+ 3,
294
+ 1,
295
+ 2,
296
+ 12,
297
+ 8,
298
+ 0,
299
+ 3,
300
+ 1,
301
+ 261
302
+ ]
303
+ ],
304
+ "test_title_only_classification_report": {
305
+ "Artificial Intelligence": {
306
+ "precision": 0.6678321678321678,
307
+ "recall": 0.6366666666666667,
308
+ "f1-score": 0.6518771331058021,
309
+ "support": 300.0
310
+ },
311
+ "Natural Language Processing": {
312
+ "precision": 0.7485207100591716,
313
+ "recall": 0.8433333333333334,
314
+ "f1-score": 0.7931034482758621,
315
+ "support": 300.0
316
+ },
317
+ "Computer Vision": {
318
+ "precision": 0.7210884353741497,
319
+ "recall": 0.7066666666666667,
320
+ "f1-score": 0.7138047138047138,
321
+ "support": 300.0
322
+ },
323
+ "Machine Learning": {
324
+ "precision": 0.5879828326180258,
325
+ "recall": 0.45666666666666667,
326
+ "f1-score": 0.5140712945590994,
327
+ "support": 300.0
328
+ },
329
+ "CS Theory and Algorithms": {
330
+ "precision": 0.7033639143730887,
331
+ "recall": 0.7666666666666667,
332
+ "f1-score": 0.733652312599681,
333
+ "support": 300.0
334
+ },
335
+ "Mathematics": {
336
+ "precision": 0.837037037037037,
337
+ "recall": 0.7533333333333333,
338
+ "f1-score": 0.7929824561403509,
339
+ "support": 300.0
340
+ },
341
+ "Statistics": {
342
+ "precision": 0.6128048780487805,
343
+ "recall": 0.67,
344
+ "f1-score": 0.6401273885350318,
345
+ "support": 300.0
346
+ },
347
+ "Electrical Engineering": {
348
+ "precision": 0.7295373665480427,
349
+ "recall": 0.6833333333333333,
350
+ "f1-score": 0.7056798623063684,
351
+ "support": 300.0
352
+ },
353
+ "Astrophysics": {
354
+ "precision": 0.9534883720930233,
355
+ "recall": 0.9566666666666667,
356
+ "f1-score": 0.9550748752079867,
357
+ "support": 300.0
358
+ },
359
+ "Condensed Matter Physics": {
360
+ "precision": 0.8430034129692833,
361
+ "recall": 0.8233333333333334,
362
+ "f1-score": 0.8330522765598651,
363
+ "support": 300.0
364
+ },
365
+ "Quantum Physics": {
366
+ "precision": 0.7834757834757835,
367
+ "recall": 0.9166666666666666,
368
+ "f1-score": 0.8448540706605223,
369
+ "support": 300.0
370
+ },
371
+ "Quantitative Biology": {
372
+ "precision": 0.8187919463087249,
373
+ "recall": 0.8133333333333334,
374
+ "f1-score": 0.8160535117056856,
375
+ "support": 300.0
376
+ },
377
+ "accuracy": 0.7522222222222222,
378
+ "macro avg": {
379
+ "precision": 0.7505772380614398,
380
+ "recall": 0.7522222222222222,
381
+ "f1-score": 0.7495277786217475,
382
+ "support": 3600.0
383
+ },
384
+ "weighted avg": {
385
+ "precision": 0.7505772380614398,
386
+ "recall": 0.7522222222222222,
387
+ "f1-score": 0.7495277786217475,
388
+ "support": 3600.0
389
+ }
390
+ },
391
+ "test_title_only_confusion_matrix": [
392
+ [
393
+ 191,
394
+ 30,
395
+ 10,
396
+ 19,
397
+ 18,
398
+ 2,
399
+ 17,
400
+ 3,
401
+ 1,
402
+ 1,
403
+ 5,
404
+ 3
405
+ ],
406
+ [
407
+ 12,
408
+ 253,
409
+ 11,
410
+ 13,
411
+ 0,
412
+ 0,
413
+ 5,
414
+ 1,
415
+ 0,
416
+ 1,
417
+ 1,
418
+ 3
419
+ ],
420
+ [
421
+ 6,
422
+ 11,
423
+ 212,
424
+ 19,
425
+ 5,
426
+ 2,
427
+ 3,
428
+ 37,
429
+ 2,
430
+ 0,
431
+ 1,
432
+ 2
433
+ ],
434
+ [
435
+ 21,
436
+ 22,
437
+ 28,
438
+ 137,
439
+ 21,
440
+ 1,
441
+ 48,
442
+ 9,
443
+ 1,
444
+ 2,
445
+ 1,
446
+ 9
447
+ ],
448
+ [
449
+ 24,
450
+ 4,
451
+ 0,
452
+ 6,
453
+ 230,
454
+ 10,
455
+ 12,
456
+ 4,
457
+ 0,
458
+ 1,
459
+ 7,
460
+ 2
461
+ ],
462
+ [
463
+ 4,
464
+ 0,
465
+ 2,
466
+ 3,
467
+ 25,
468
+ 226,
469
+ 11,
470
+ 7,
471
+ 1,
472
+ 11,
473
+ 5,
474
+ 5
475
+ ],
476
+ [
477
+ 11,
478
+ 4,
479
+ 2,
480
+ 28,
481
+ 11,
482
+ 9,
483
+ 201,
484
+ 10,
485
+ 1,
486
+ 5,
487
+ 2,
488
+ 16
489
+ ],
490
+ [
491
+ 3,
492
+ 8,
493
+ 24,
494
+ 4,
495
+ 9,
496
+ 8,
497
+ 16,
498
+ 205,
499
+ 3,
500
+ 3,
501
+ 4,
502
+ 13
503
+ ],
504
+ [
505
+ 2,
506
+ 0,
507
+ 3,
508
+ 0,
509
+ 0,
510
+ 3,
511
+ 0,
512
+ 0,
513
+ 287,
514
+ 3,
515
+ 2,
516
+ 0
517
+ ],
518
+ [
519
+ 1,
520
+ 0,
521
+ 0,
522
+ 0,
523
+ 0,
524
+ 5,
525
+ 1,
526
+ 0,
527
+ 2,
528
+ 247,
529
+ 43,
530
+ 1
531
+ ],
532
+ [
533
+ 1,
534
+ 1,
535
+ 0,
536
+ 1,
537
+ 5,
538
+ 2,
539
+ 2,
540
+ 0,
541
+ 2,
542
+ 11,
543
+ 275,
544
+ 0
545
+ ],
546
+ [
547
+ 10,
548
+ 5,
549
+ 2,
550
+ 3,
551
+ 3,
552
+ 2,
553
+ 12,
554
+ 5,
555
+ 1,
556
+ 8,
557
+ 5,
558
+ 244
559
+ ]
560
+ ]
561
+ }
metrics_summary.txt ADDED
@@ -0,0 +1,561 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "train_runtime": {
3
+ "skipped_train": true
4
+ },
5
+ "eval_metrics": {
6
+ "train": {
7
+ "train_loss": 0.5018106698989868,
8
+ "train_model_preparation_time": 0.0013,
9
+ "train_accuracy": 0.9251333333333334,
10
+ "train_macro_f1": 0.9246237953755961,
11
+ "train_runtime": 90.3107,
12
+ "train_samples_per_second": 332.186,
13
+ "train_steps_per_second": 41.523,
14
+ "epoch": 0
15
+ },
16
+ "validation": {
17
+ "validation_loss": 0.709372878074646,
18
+ "validation_model_preparation_time": 0.0013,
19
+ "validation_accuracy": 0.835,
20
+ "validation_macro_f1": 0.8351179604209936,
21
+ "validation_runtime": 11.0597,
22
+ "validation_samples_per_second": 325.505,
23
+ "validation_steps_per_second": 40.688,
24
+ "epoch": 0
25
+ },
26
+ "test_full": {
27
+ "test_full_loss": 0.7299672365188599,
28
+ "test_full_model_preparation_time": 0.0013,
29
+ "test_full_accuracy": 0.8355555555555556,
30
+ "test_full_macro_f1": 0.835052453623228,
31
+ "test_full_runtime": 10.953,
32
+ "test_full_samples_per_second": 328.676,
33
+ "test_full_steps_per_second": 41.084,
34
+ "epoch": 0
35
+ },
36
+ "test_title_only": {
37
+ "test_title_only_loss": 1.0085811614990234,
38
+ "test_title_only_model_preparation_time": 0.0013,
39
+ "test_title_only_accuracy": 0.7522222222222222,
40
+ "test_title_only_macro_f1": 0.7495277786217475,
41
+ "test_title_only_runtime": 6.6335,
42
+ "test_title_only_samples_per_second": 542.697,
43
+ "test_title_only_steps_per_second": 67.837,
44
+ "epoch": 0
45
+ }
46
+ },
47
+ "test_full_classification_report": {
48
+ "Artificial Intelligence": {
49
+ "precision": 0.7289719626168224,
50
+ "recall": 0.78,
51
+ "f1-score": 0.7536231884057971,
52
+ "support": 300.0
53
+ },
54
+ "Natural Language Processing": {
55
+ "precision": 0.852760736196319,
56
+ "recall": 0.9266666666666666,
57
+ "f1-score": 0.8881789137380192,
58
+ "support": 300.0
59
+ },
60
+ "Computer Vision": {
61
+ "precision": 0.8379310344827586,
62
+ "recall": 0.81,
63
+ "f1-score": 0.823728813559322,
64
+ "support": 300.0
65
+ },
66
+ "Machine Learning": {
67
+ "precision": 0.6564885496183206,
68
+ "recall": 0.5733333333333334,
69
+ "f1-score": 0.6120996441281139,
70
+ "support": 300.0
71
+ },
72
+ "CS Theory and Algorithms": {
73
+ "precision": 0.8657718120805369,
74
+ "recall": 0.86,
75
+ "f1-score": 0.862876254180602,
76
+ "support": 300.0
77
+ },
78
+ "Mathematics": {
79
+ "precision": 0.9622641509433962,
80
+ "recall": 0.85,
81
+ "f1-score": 0.9026548672566371,
82
+ "support": 300.0
83
+ },
84
+ "Statistics": {
85
+ "precision": 0.7125748502994012,
86
+ "recall": 0.7933333333333333,
87
+ "f1-score": 0.750788643533123,
88
+ "support": 300.0
89
+ },
90
+ "Electrical Engineering": {
91
+ "precision": 0.7736486486486487,
92
+ "recall": 0.7633333333333333,
93
+ "f1-score": 0.7684563758389261,
94
+ "support": 300.0
95
+ },
96
+ "Astrophysics": {
97
+ "precision": 0.9966329966329966,
98
+ "recall": 0.9866666666666667,
99
+ "f1-score": 0.9916247906197655,
100
+ "support": 300.0
101
+ },
102
+ "Condensed Matter Physics": {
103
+ "precision": 0.916083916083916,
104
+ "recall": 0.8733333333333333,
105
+ "f1-score": 0.89419795221843,
106
+ "support": 300.0
107
+ },
108
+ "Quantum Physics": {
109
+ "precision": 0.8676923076923077,
110
+ "recall": 0.94,
111
+ "f1-score": 0.9024,
112
+ "support": 300.0
113
+ },
114
+ "Quantitative Biology": {
115
+ "precision": 0.87,
116
+ "recall": 0.87,
117
+ "f1-score": 0.87,
118
+ "support": 300.0
119
+ },
120
+ "accuracy": 0.8355555555555556,
121
+ "macro avg": {
122
+ "precision": 0.8367350804412852,
123
+ "recall": 0.8355555555555555,
124
+ "f1-score": 0.835052453623228,
125
+ "support": 3600.0
126
+ },
127
+ "weighted avg": {
128
+ "precision": 0.8367350804412854,
129
+ "recall": 0.8355555555555556,
130
+ "f1-score": 0.835052453623228,
131
+ "support": 3600.0
132
+ }
133
+ },
134
+ "test_full_confusion_matrix": [
135
+ [
136
+ 234,
137
+ 15,
138
+ 4,
139
+ 22,
140
+ 11,
141
+ 0,
142
+ 10,
143
+ 0,
144
+ 0,
145
+ 0,
146
+ 2,
147
+ 2
148
+ ],
149
+ [
150
+ 9,
151
+ 278,
152
+ 5,
153
+ 4,
154
+ 0,
155
+ 0,
156
+ 1,
157
+ 1,
158
+ 0,
159
+ 0,
160
+ 0,
161
+ 2
162
+ ],
163
+ [
164
+ 3,
165
+ 5,
166
+ 243,
167
+ 15,
168
+ 0,
169
+ 0,
170
+ 1,
171
+ 31,
172
+ 0,
173
+ 0,
174
+ 0,
175
+ 2
176
+ ],
177
+ [
178
+ 32,
179
+ 14,
180
+ 19,
181
+ 172,
182
+ 8,
183
+ 1,
184
+ 40,
185
+ 9,
186
+ 0,
187
+ 0,
188
+ 0,
189
+ 5
190
+ ],
191
+ [
192
+ 25,
193
+ 1,
194
+ 0,
195
+ 1,
196
+ 258,
197
+ 2,
198
+ 3,
199
+ 2,
200
+ 0,
201
+ 2,
202
+ 5,
203
+ 1
204
+ ],
205
+ [
206
+ 1,
207
+ 0,
208
+ 0,
209
+ 3,
210
+ 12,
211
+ 255,
212
+ 13,
213
+ 6,
214
+ 0,
215
+ 3,
216
+ 3,
217
+ 4
218
+ ],
219
+ [
220
+ 4,
221
+ 3,
222
+ 0,
223
+ 31,
224
+ 2,
225
+ 0,
226
+ 238,
227
+ 8,
228
+ 0,
229
+ 0,
230
+ 1,
231
+ 13
232
+ ],
233
+ [
234
+ 6,
235
+ 7,
236
+ 18,
237
+ 8,
238
+ 5,
239
+ 5,
240
+ 15,
241
+ 229,
242
+ 0,
243
+ 1,
244
+ 0,
245
+ 6
246
+ ],
247
+ [
248
+ 1,
249
+ 0,
250
+ 1,
251
+ 0,
252
+ 0,
253
+ 0,
254
+ 0,
255
+ 1,
256
+ 296,
257
+ 0,
258
+ 1,
259
+ 0
260
+ ],
261
+ [
262
+ 0,
263
+ 0,
264
+ 0,
265
+ 1,
266
+ 1,
267
+ 0,
268
+ 1,
269
+ 0,
270
+ 1,
271
+ 262,
272
+ 30,
273
+ 4
274
+ ],
275
+ [
276
+ 0,
277
+ 0,
278
+ 0,
279
+ 2,
280
+ 0,
281
+ 0,
282
+ 0,
283
+ 1,
284
+ 0,
285
+ 15,
286
+ 282,
287
+ 0
288
+ ],
289
+ [
290
+ 6,
291
+ 3,
292
+ 0,
293
+ 3,
294
+ 1,
295
+ 2,
296
+ 12,
297
+ 8,
298
+ 0,
299
+ 3,
300
+ 1,
301
+ 261
302
+ ]
303
+ ],
304
+ "test_title_only_classification_report": {
305
+ "Artificial Intelligence": {
306
+ "precision": 0.6678321678321678,
307
+ "recall": 0.6366666666666667,
308
+ "f1-score": 0.6518771331058021,
309
+ "support": 300.0
310
+ },
311
+ "Natural Language Processing": {
312
+ "precision": 0.7485207100591716,
313
+ "recall": 0.8433333333333334,
314
+ "f1-score": 0.7931034482758621,
315
+ "support": 300.0
316
+ },
317
+ "Computer Vision": {
318
+ "precision": 0.7210884353741497,
319
+ "recall": 0.7066666666666667,
320
+ "f1-score": 0.7138047138047138,
321
+ "support": 300.0
322
+ },
323
+ "Machine Learning": {
324
+ "precision": 0.5879828326180258,
325
+ "recall": 0.45666666666666667,
326
+ "f1-score": 0.5140712945590994,
327
+ "support": 300.0
328
+ },
329
+ "CS Theory and Algorithms": {
330
+ "precision": 0.7033639143730887,
331
+ "recall": 0.7666666666666667,
332
+ "f1-score": 0.733652312599681,
333
+ "support": 300.0
334
+ },
335
+ "Mathematics": {
336
+ "precision": 0.837037037037037,
337
+ "recall": 0.7533333333333333,
338
+ "f1-score": 0.7929824561403509,
339
+ "support": 300.0
340
+ },
341
+ "Statistics": {
342
+ "precision": 0.6128048780487805,
343
+ "recall": 0.67,
344
+ "f1-score": 0.6401273885350318,
345
+ "support": 300.0
346
+ },
347
+ "Electrical Engineering": {
348
+ "precision": 0.7295373665480427,
349
+ "recall": 0.6833333333333333,
350
+ "f1-score": 0.7056798623063684,
351
+ "support": 300.0
352
+ },
353
+ "Astrophysics": {
354
+ "precision": 0.9534883720930233,
355
+ "recall": 0.9566666666666667,
356
+ "f1-score": 0.9550748752079867,
357
+ "support": 300.0
358
+ },
359
+ "Condensed Matter Physics": {
360
+ "precision": 0.8430034129692833,
361
+ "recall": 0.8233333333333334,
362
+ "f1-score": 0.8330522765598651,
363
+ "support": 300.0
364
+ },
365
+ "Quantum Physics": {
366
+ "precision": 0.7834757834757835,
367
+ "recall": 0.9166666666666666,
368
+ "f1-score": 0.8448540706605223,
369
+ "support": 300.0
370
+ },
371
+ "Quantitative Biology": {
372
+ "precision": 0.8187919463087249,
373
+ "recall": 0.8133333333333334,
374
+ "f1-score": 0.8160535117056856,
375
+ "support": 300.0
376
+ },
377
+ "accuracy": 0.7522222222222222,
378
+ "macro avg": {
379
+ "precision": 0.7505772380614398,
380
+ "recall": 0.7522222222222222,
381
+ "f1-score": 0.7495277786217475,
382
+ "support": 3600.0
383
+ },
384
+ "weighted avg": {
385
+ "precision": 0.7505772380614398,
386
+ "recall": 0.7522222222222222,
387
+ "f1-score": 0.7495277786217475,
388
+ "support": 3600.0
389
+ }
390
+ },
391
+ "test_title_only_confusion_matrix": [
392
+ [
393
+ 191,
394
+ 30,
395
+ 10,
396
+ 19,
397
+ 18,
398
+ 2,
399
+ 17,
400
+ 3,
401
+ 1,
402
+ 1,
403
+ 5,
404
+ 3
405
+ ],
406
+ [
407
+ 12,
408
+ 253,
409
+ 11,
410
+ 13,
411
+ 0,
412
+ 0,
413
+ 5,
414
+ 1,
415
+ 0,
416
+ 1,
417
+ 1,
418
+ 3
419
+ ],
420
+ [
421
+ 6,
422
+ 11,
423
+ 212,
424
+ 19,
425
+ 5,
426
+ 2,
427
+ 3,
428
+ 37,
429
+ 2,
430
+ 0,
431
+ 1,
432
+ 2
433
+ ],
434
+ [
435
+ 21,
436
+ 22,
437
+ 28,
438
+ 137,
439
+ 21,
440
+ 1,
441
+ 48,
442
+ 9,
443
+ 1,
444
+ 2,
445
+ 1,
446
+ 9
447
+ ],
448
+ [
449
+ 24,
450
+ 4,
451
+ 0,
452
+ 6,
453
+ 230,
454
+ 10,
455
+ 12,
456
+ 4,
457
+ 0,
458
+ 1,
459
+ 7,
460
+ 2
461
+ ],
462
+ [
463
+ 4,
464
+ 0,
465
+ 2,
466
+ 3,
467
+ 25,
468
+ 226,
469
+ 11,
470
+ 7,
471
+ 1,
472
+ 11,
473
+ 5,
474
+ 5
475
+ ],
476
+ [
477
+ 11,
478
+ 4,
479
+ 2,
480
+ 28,
481
+ 11,
482
+ 9,
483
+ 201,
484
+ 10,
485
+ 1,
486
+ 5,
487
+ 2,
488
+ 16
489
+ ],
490
+ [
491
+ 3,
492
+ 8,
493
+ 24,
494
+ 4,
495
+ 9,
496
+ 8,
497
+ 16,
498
+ 205,
499
+ 3,
500
+ 3,
501
+ 4,
502
+ 13
503
+ ],
504
+ [
505
+ 2,
506
+ 0,
507
+ 3,
508
+ 0,
509
+ 0,
510
+ 3,
511
+ 0,
512
+ 0,
513
+ 287,
514
+ 3,
515
+ 2,
516
+ 0
517
+ ],
518
+ [
519
+ 1,
520
+ 0,
521
+ 0,
522
+ 0,
523
+ 0,
524
+ 5,
525
+ 1,
526
+ 0,
527
+ 2,
528
+ 247,
529
+ 43,
530
+ 1
531
+ ],
532
+ [
533
+ 1,
534
+ 1,
535
+ 0,
536
+ 1,
537
+ 5,
538
+ 2,
539
+ 2,
540
+ 0,
541
+ 2,
542
+ 11,
543
+ 275,
544
+ 0
545
+ ],
546
+ [
547
+ 10,
548
+ 5,
549
+ 2,
550
+ 3,
551
+ 3,
552
+ 2,
553
+ 12,
554
+ 5,
555
+ 1,
556
+ 8,
557
+ 5,
558
+ 244
559
+ ]
560
+ ]
561
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bb43480cebf6a605d7ea6fc34268b5caac9fdc6b31296205b6b58bae8e579b5
3
+ size 439734280
run_config.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "prepared_at_utc": "2026-04-06T14:00:00+00:00",
3
+ "model_name": "allenai/scibert_scivocab_uncased",
4
+ "max_length": 256,
5
+ "per_device_train_batch_size": 4,
6
+ "per_device_eval_batch_size": 8,
7
+ "gradient_accumulation_steps": 8,
8
+ "num_train_epochs": 12,
9
+ "learning_rate": 2e-05,
10
+ "weight_decay": 0.01,
11
+ "warmup_ratio": 0.1,
12
+ "label_smoothing_factor": 0.05,
13
+ "title_only_prob": 0.2,
14
+ "early_stopping_patience": 3,
15
+ "seed": 42,
16
+ "resume_from_checkpoint": null,
17
+ "use_bf16": true,
18
+ "use_fp16": false,
19
+ "taxonomy_profile": "topics12",
20
+ "num_labels": 12,
21
+ "label_order": [
22
+ "artificial_intelligence",
23
+ "natural_language_processing",
24
+ "computer_vision",
25
+ "machine_learning",
26
+ "computer_science_theory",
27
+ "mathematics",
28
+ "statistics",
29
+ "electrical_engineering",
30
+ "astrophysics",
31
+ "condensed_matter_physics",
32
+ "quantum_physics",
33
+ "quantitative_biology"
34
+ ]
35
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "backend": "tokenizers",
3
+ "cls_token": "[CLS]",
4
+ "do_lower_case": true,
5
+ "is_local": false,
6
+ "mask_token": "[MASK]",
7
+ "model_max_length": 1000000000000000019884624838656,
8
+ "pad_token": "[PAD]",
9
+ "sep_token": "[SEP]",
10
+ "strip_accents": null,
11
+ "tokenize_chinese_chars": true,
12
+ "tokenizer_class": "BertTokenizer",
13
+ "unk_token": "[UNK]"
14
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9ea637bcad0c6445dbfe1a0110faae0f86e61c5a830e59ef2821d192ab5ae31
3
+ size 5265