idobn committed on Jan 21

Commit

75449cb

verified ·

1 Parent(s): 634615e

Upload folder using huggingface_hub

Browse files

Files changed (19) hide show

README.md +37 -0
added_tokens.json +3 -0
checkpoint-1542/config.json +73 -0
checkpoint-1542/model.safetensors +3 -0
checkpoint-1542/optimizer.pt +3 -0
checkpoint-1542/rng_state.pth +3 -0
checkpoint-1542/scheduler.pt +3 -0
checkpoint-1542/trainer_state.json +1228 -0
checkpoint-1542/training_args.bin +3 -0
config.json +73 -0
model.safetensors +3 -0
runs/Jan21_15-38-16_r-idobn-twitter-mbti-2rmya185-a2492-5fds5/events.out.tfevents.1769009898.r-idobn-twitter-mbti-2rmya185-a2492-5fds5.120.0 +2 -2
runs/Jan21_15-38-16_r-idobn-twitter-mbti-2rmya185-a2492-5fds5/events.out.tfevents.1769017304.r-idobn-twitter-mbti-2rmya185-a2492-5fds5.120.1 +3 -0
special_tokens_map.json +15 -0
spm.model +3 -0
tokenizer.json +0 -0
tokenizer_config.json +59 -0
training_args.bin +3 -0
training_params.json +30 -0

README.md ADDED Viewed

	@@ -0,0 +1,37 @@

+---
+library_name: transformers
+tags:
+- autotrain
+- text-classification
+base_model: microsoft/deberta-v3-large
+widget:
+- text: "I love AutoTrain"
+---
+# Model Trained Using AutoTrain
+- Problem type: Text Classification
+## Validation Metrics
+loss: 1.9677170515060425
+f1_macro: 0.43647747790260216
+f1_micro: 0.40711847879083374
+f1_weighted: 0.3874051890698862
+precision_macro: 0.49034231056721467
+precision_micro: 0.40711847879083374
+precision_weighted: 0.4284233711977137
+recall_macro: 0.4407702395816866
+recall_micro: 0.40711847879083374
+recall_weighted: 0.40711847879083374
+accuracy: 0.40711847879083374

added_tokens.json ADDED Viewed

	@@ -0,0 +1,3 @@

+{
+  "[MASK]": 128000
+}

checkpoint-1542/config.json ADDED Viewed

	@@ -0,0 +1,73 @@

+{
+  "_name_or_path": "microsoft/deberta-v3-large",
+  "_num_labels": 16,
+  "architectures": [
+    "DebertaV2ForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 1024,
+  "id2label": {
+    "0": "enfj",
+    "1": "enfp",
+    "2": "entj",
+    "3": "entp",
+    "4": "esfj",
+    "5": "esfp",
+    "6": "estj",
+    "7": "estp",
+    "8": "infj",
+    "9": "infp",
+    "10": "intj",
+    "11": "intp",
+    "12": "isfj",
+    "13": "isfp",
+    "14": "istj",
+    "15": "istp"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 4096,
+  "label2id": {
+    "enfj": 0,
+    "enfp": 1,
+    "entj": 2,
+    "entp": 3,
+    "esfj": 4,
+    "esfp": 5,
+    "estj": 6,
+    "estp": 7,
+    "infj": 8,
+    "infp": 9,
+    "intj": 10,
+    "intp": 11,
+    "isfj": 12,
+    "isfp": 13,
+    "istj": 14,
+    "istp": 15
+  },
+  "layer_norm_eps": 1e-07,
+  "legacy": true,
+  "max_position_embeddings": 512,
+  "max_relative_positions": -1,
+  "model_type": "deberta-v2",
+  "norm_rel_ebd": "layer_norm",
+  "num_attention_heads": 16,
+  "num_hidden_layers": 24,
+  "pad_token_id": 0,
+  "pooler_dropout": 0,
+  "pooler_hidden_act": "gelu",
+  "pooler_hidden_size": 1024,
+  "pos_att_type": [
+    "p2c",
+    "c2p"
+  ],
+  "position_biased_input": false,
+  "position_buckets": 256,
+  "relative_attention": true,
+  "share_att_key": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.48.0",
+  "type_vocab_size": 0,
+  "vocab_size": 128100
+}

checkpoint-1542/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0c9b5b9de47af2e45c14a96ab10be692e0caf5e1ae04b1a717235a34c072f012
+size 1740361848

checkpoint-1542/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8890e67ff5e7849ac67c82a5fe3088c782f25b6b8224943a94a612014a413a5f
+size 3480955056

checkpoint-1542/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d440435e7a9ceae19abce66d810fb753ca6f090ea4d3ab8404d4282570a3effa
+size 14244

checkpoint-1542/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9950f111117344b3bf990d7231eaf6b6ce2fcff45a97c769c5f23872f16f7cb5
+size 1064

checkpoint-1542/trainer_state.json ADDED Viewed

	@@ -0,0 +1,1228 @@

+{
+  "best_metric": 1.9677170515060425,
+  "best_model_checkpoint": "twitter-mbti-v2/checkpoint-1542",
+  "epoch": 6.0,
+  "eval_steps": 500,
+  "global_step": 1542,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.03900536323744515,
+      "grad_norm": 3.7978336811065674,
+      "learning_rate": 3.90625e-07,
+      "loss": 2.833,
+      "step": 10
+    },
+    {
+      "epoch": 0.0780107264748903,
+      "grad_norm": 2.6848301887512207,
+      "learning_rate": 7.8125e-07,
+      "loss": 2.8331,
+      "step": 20
+    },
+    {
+      "epoch": 0.11701608971233544,
+      "grad_norm": 2.5124902725219727,
+      "learning_rate": 1.1718750000000001e-06,
+      "loss": 2.8206,
+      "step": 30
+    },
+    {
+      "epoch": 0.1560214529497806,
+      "grad_norm": 3.32080340385437,
+      "learning_rate": 1.5625e-06,
+      "loss": 2.8144,
+      "step": 40
+    },
+    {
+      "epoch": 0.19502681618722575,
+      "grad_norm": 3.0330629348754883,
+      "learning_rate": 1.953125e-06,
+      "loss": 2.821,
+      "step": 50
+    },
+    {
+      "epoch": 0.2340321794246709,
+      "grad_norm": 2.991515874862671,
+      "learning_rate": 2.3437500000000002e-06,
+      "loss": 2.8096,
+      "step": 60
+    },
+    {
+      "epoch": 0.27303754266211605,
+      "grad_norm": 3.302293062210083,
+      "learning_rate": 2.7343750000000004e-06,
+      "loss": 2.794,
+      "step": 70
+    },
+    {
+      "epoch": 0.3120429058995612,
+      "grad_norm": 3.306318521499634,
+      "learning_rate": 3.125e-06,
+      "loss": 2.7629,
+      "step": 80
+    },
+    {
+      "epoch": 0.3510482691370063,
+      "grad_norm": 2.56471848487854,
+      "learning_rate": 3.5156250000000003e-06,
+      "loss": 2.7602,
+      "step": 90
+    },
+    {
+      "epoch": 0.3900536323744515,
+      "grad_norm": 3.474318027496338,
+      "learning_rate": 3.90625e-06,
+      "loss": 2.6947,
+      "step": 100
+    },
+    {
+      "epoch": 0.42905899561189664,
+      "grad_norm": 2.990626096725464,
+      "learning_rate": 4.296875e-06,
+      "loss": 2.7265,
+      "step": 110
+    },
+    {
+      "epoch": 0.4680643588493418,
+      "grad_norm": 4.794486999511719,
+      "learning_rate": 4.6875000000000004e-06,
+      "loss": 2.7143,
+      "step": 120
+    },
+    {
+      "epoch": 0.5070697220867869,
+      "grad_norm": 3.5165743827819824,
+      "learning_rate": 5.078125000000001e-06,
+      "loss": 2.7444,
+      "step": 130
+    },
+    {
+      "epoch": 0.5460750853242321,
+      "grad_norm": 2.8984289169311523,
+      "learning_rate": 5.468750000000001e-06,
+      "loss": 2.7384,
+      "step": 140
+    },
+    {
+      "epoch": 0.5850804485616772,
+      "grad_norm": 3.9029452800750732,
+      "learning_rate": 5.859375e-06,
+      "loss": 2.7444,
+      "step": 150
+    },
+    {
+      "epoch": 0.6240858117991224,
+      "grad_norm": 4.58915376663208,
+      "learning_rate": 6.25e-06,
+      "loss": 2.6959,
+      "step": 160
+    },
+    {
+      "epoch": 0.6630911750365676,
+      "grad_norm": 3.549612045288086,
+      "learning_rate": 6.6406250000000005e-06,
+      "loss": 2.7289,
+      "step": 170
+    },
+    {
+      "epoch": 0.7020965382740126,
+      "grad_norm": 2.6437020301818848,
+      "learning_rate": 7.031250000000001e-06,
+      "loss": 2.732,
+      "step": 180
+    },
+    {
+      "epoch": 0.7411019015114578,
+      "grad_norm": 3.5032520294189453,
+      "learning_rate": 7.421875000000001e-06,
+      "loss": 2.7296,
+      "step": 190
+    },
+    {
+      "epoch": 0.780107264748903,
+      "grad_norm": 3.1741631031036377,
+      "learning_rate": 7.8125e-06,
+      "loss": 2.7316,
+      "step": 200
+    },
+    {
+      "epoch": 0.8191126279863481,
+      "grad_norm": 2.8320600986480713,
+      "learning_rate": 8.203125000000001e-06,
+      "loss": 2.7319,
+      "step": 210
+    },
+    {
+      "epoch": 0.8581179912237933,
+      "grad_norm": 2.8625762462615967,
+      "learning_rate": 8.59375e-06,
+      "loss": 2.742,
+      "step": 220
+    },
+    {
+      "epoch": 0.8971233544612384,
+      "grad_norm": 2.858238697052002,
+      "learning_rate": 8.984375000000002e-06,
+      "loss": 2.7252,
+      "step": 230
+    },
+    {
+      "epoch": 0.9361287176986836,
+      "grad_norm": 3.340858221054077,
+      "learning_rate": 9.375000000000001e-06,
+      "loss": 2.7159,
+      "step": 240
+    },
+    {
+      "epoch": 0.9751340809361287,
+      "grad_norm": 2.8419265747070312,
+      "learning_rate": 9.765625e-06,
+      "loss": 2.7509,
+      "step": 250
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.12823013164310093,
+      "eval_f1_macro": 0.022844391014094804,
+      "eval_f1_micro": 0.12823013164310093,
+      "eval_f1_weighted": 0.04192036517091411,
+      "eval_loss": 2.7105822563171387,
+      "eval_precision_macro": 0.03190063069208076,
+      "eval_precision_micro": 0.12823013164310093,
+      "eval_precision_weighted": 0.0493667840880759,
+      "eval_recall_macro": 0.06533440208373821,
+      "eval_recall_micro": 0.12823013164310093,
+      "eval_recall_weighted": 0.12823013164310093,
+      "eval_runtime": 57.6155,
+      "eval_samples_per_second": 35.598,
+      "eval_steps_per_second": 4.461,
+      "step": 257
+    },
+    {
+      "epoch": 1.0117016089712336,
+      "grad_norm": 3.288947343826294,
+      "learning_rate": 9.98263888888889e-06,
+      "loss": 2.5368,
+      "step": 260
+    },
+    {
+      "epoch": 1.0507069722086786,
+      "grad_norm": 3.894672155380249,
+      "learning_rate": 9.939236111111112e-06,
+      "loss": 2.7183,
+      "step": 270
+    },
+    {
+      "epoch": 1.0897123354461238,
+      "grad_norm": 3.038849353790283,
+      "learning_rate": 9.895833333333334e-06,
+      "loss": 2.7326,
+      "step": 280
+    },
+    {
+      "epoch": 1.128717698683569,
+      "grad_norm": 4.149471282958984,
+      "learning_rate": 9.852430555555557e-06,
+      "loss": 2.7304,
+      "step": 290
+    },
+    {
+      "epoch": 1.1677230619210142,
+      "grad_norm": 3.3252062797546387,
+      "learning_rate": 9.80902777777778e-06,
+      "loss": 2.7161,
+      "step": 300
+    },
+    {
+      "epoch": 1.2067284251584594,
+      "grad_norm": 3.7927067279815674,
+      "learning_rate": 9.765625e-06,
+      "loss": 2.6916,
+      "step": 310
+    },
+    {
+      "epoch": 1.2457337883959045,
+      "grad_norm": 3.313178777694702,
+      "learning_rate": 9.722222222222223e-06,
+      "loss": 2.7163,
+      "step": 320
+    },
+    {
+      "epoch": 1.2847391516333495,
+      "grad_norm": 3.720956802368164,
+      "learning_rate": 9.678819444444445e-06,
+      "loss": 2.6494,
+      "step": 330
+    },
+    {
+      "epoch": 1.3237445148707947,
+      "grad_norm": 4.145543575286865,
+      "learning_rate": 9.635416666666668e-06,
+      "loss": 2.6825,
+      "step": 340
+    },
+    {
+      "epoch": 1.3627498781082399,
+      "grad_norm": 3.6850345134735107,
+      "learning_rate": 9.592013888888888e-06,
+      "loss": 2.6725,
+      "step": 350
+    },
+    {
+      "epoch": 1.401755241345685,
+      "grad_norm": 4.245800495147705,
+      "learning_rate": 9.548611111111113e-06,
+      "loss": 2.6788,
+      "step": 360
+    },
+    {
+      "epoch": 1.4407606045831303,
+      "grad_norm": 3.8264000415802,
+      "learning_rate": 9.505208333333335e-06,
+      "loss": 2.6755,
+      "step": 370
+    },
+    {
+      "epoch": 1.4797659678205752,
+      "grad_norm": 4.036210060119629,
+      "learning_rate": 9.461805555555556e-06,
+      "loss": 2.6943,
+      "step": 380
+    },
+    {
+      "epoch": 1.5187713310580204,
+      "grad_norm": 4.102363586425781,
+      "learning_rate": 9.418402777777778e-06,
+      "loss": 2.6931,
+      "step": 390
+    },
+    {
+      "epoch": 1.5577766942954656,
+      "grad_norm": 3.794200897216797,
+      "learning_rate": 9.375000000000001e-06,
+      "loss": 2.6692,
+      "step": 400
+    },
+    {
+      "epoch": 1.5967820575329108,
+      "grad_norm": 4.008747577667236,
+      "learning_rate": 9.331597222222223e-06,
+      "loss": 2.6698,
+      "step": 410
+    },
+    {
+      "epoch": 1.635787420770356,
+      "grad_norm": 4.523059844970703,
+      "learning_rate": 9.288194444444444e-06,
+      "loss": 2.6308,
+      "step": 420
+    },
+    {
+      "epoch": 1.674792784007801,
+      "grad_norm": 3.91786789894104,
+      "learning_rate": 9.244791666666667e-06,
+      "loss": 2.5987,
+      "step": 430
+    },
+    {
+      "epoch": 1.7137981472452464,
+      "grad_norm": 4.020909309387207,
+      "learning_rate": 9.201388888888889e-06,
+      "loss": 2.6354,
+      "step": 440
+    },
+    {
+      "epoch": 1.7528035104826913,
+      "grad_norm": 3.620465040206909,
+      "learning_rate": 9.157986111111112e-06,
+      "loss": 2.659,
+      "step": 450
+    },
+    {
+      "epoch": 1.7918088737201365,
+      "grad_norm": 3.509871482849121,
+      "learning_rate": 9.114583333333334e-06,
+      "loss": 2.6531,
+      "step": 460
+    },
+    {
+      "epoch": 1.8308142369575817,
+      "grad_norm": 4.906174659729004,
+      "learning_rate": 9.071180555555557e-06,
+      "loss": 2.6146,
+      "step": 470
+    },
+    {
+      "epoch": 1.8698196001950267,
+      "grad_norm": 4.495574951171875,
+      "learning_rate": 9.027777777777779e-06,
+      "loss": 2.6399,
+      "step": 480
+    },
+    {
+      "epoch": 1.908824963432472,
+      "grad_norm": 4.081535339355469,
+      "learning_rate": 8.984375000000002e-06,
+      "loss": 2.5733,
+      "step": 490
+    },
+    {
+      "epoch": 1.947830326669917,
+      "grad_norm": 4.859089374542236,
+      "learning_rate": 8.940972222222222e-06,
+      "loss": 2.6333,
+      "step": 500
+    },
+    {
+      "epoch": 1.9868356899073623,
+      "grad_norm": 4.1170830726623535,
+      "learning_rate": 8.897569444444445e-06,
+      "loss": 2.6284,
+      "step": 510
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.16626036079960996,
+      "eval_f1_macro": 0.07002851524088888,
+      "eval_f1_micro": 0.16626036079960996,
+      "eval_f1_weighted": 0.0850951694800105,
+      "eval_loss": 2.5804367065429688,
+      "eval_precision_macro": 0.1575303519561262,
+      "eval_precision_micro": 0.16626036079960996,
+      "eval_precision_weighted": 0.14667789639701573,
+      "eval_recall_macro": 0.11376388483029318,
+      "eval_recall_micro": 0.16626036079960996,
+      "eval_recall_weighted": 0.16626036079960996,
+      "eval_runtime": 57.5878,
+      "eval_samples_per_second": 35.615,
+      "eval_steps_per_second": 4.463,
+      "step": 514
+    },
+    {
+      "epoch": 2.0234032179424672,
+      "grad_norm": 4.6980390548706055,
+      "learning_rate": 8.854166666666667e-06,
+      "loss": 2.4096,
+      "step": 520
+    },
+    {
+      "epoch": 2.062408581179912,
+      "grad_norm": 5.933006286621094,
+      "learning_rate": 8.81076388888889e-06,
+      "loss": 2.5589,
+      "step": 530
+    },
+    {
+      "epoch": 2.101413944417357,
+      "grad_norm": null,
+      "learning_rate": 8.77170138888889e-06,
+      "loss": 2.563,
+      "step": 540
+    },
+    {
+      "epoch": 2.1404193076548026,
+      "grad_norm": 5.945810794830322,
+      "learning_rate": 8.728298611111112e-06,
+      "loss": 2.5338,
+      "step": 550
+    },
+    {
+      "epoch": 2.1794246708922476,
+      "grad_norm": 5.052691459655762,
+      "learning_rate": 8.684895833333335e-06,
+      "loss": 2.501,
+      "step": 560
+    },
+    {
+      "epoch": 2.218430034129693,
+      "grad_norm": 4.916421413421631,
+      "learning_rate": 8.641493055555557e-06,
+      "loss": 2.4721,
+      "step": 570
+    },
+    {
+      "epoch": 2.257435397367138,
+      "grad_norm": 5.270256519317627,
+      "learning_rate": 8.598090277777778e-06,
+      "loss": 2.4879,
+      "step": 580
+    },
+    {
+      "epoch": 2.2964407606045834,
+      "grad_norm": 6.149162292480469,
+      "learning_rate": 8.5546875e-06,
+      "loss": 2.407,
+      "step": 590
+    },
+    {
+      "epoch": 2.3354461238420283,
+      "grad_norm": 5.327962398529053,
+      "learning_rate": 8.511284722222223e-06,
+      "loss": 2.4255,
+      "step": 600
+    },
+    {
+      "epoch": 2.3744514870794733,
+      "grad_norm": 5.612864017486572,
+      "learning_rate": 8.467881944444445e-06,
+      "loss": 2.4923,
+      "step": 610
+    },
+    {
+      "epoch": 2.4134568503169187,
+      "grad_norm": 5.927056789398193,
+      "learning_rate": 8.424479166666666e-06,
+      "loss": 2.4304,
+      "step": 620
+    },
+    {
+      "epoch": 2.4524622135543637,
+      "grad_norm": 6.483325958251953,
+      "learning_rate": 8.381076388888889e-06,
+      "loss": 2.4392,
+      "step": 630
+    },
+    {
+      "epoch": 2.491467576791809,
+      "grad_norm": 6.655641555786133,
+      "learning_rate": 8.337673611111113e-06,
+      "loss": 2.4165,
+      "step": 640
+    },
+    {
+      "epoch": 2.530472940029254,
+      "grad_norm": 6.099938869476318,
+      "learning_rate": 8.294270833333334e-06,
+      "loss": 2.4274,
+      "step": 650
+    },
+    {
+      "epoch": 2.569478303266699,
+      "grad_norm": 7.101120471954346,
+      "learning_rate": 8.250868055555556e-06,
+      "loss": 2.3871,
+      "step": 660
+    },
+    {
+      "epoch": 2.6084836665041444,
+      "grad_norm": 6.579291820526123,
+      "learning_rate": 8.207465277777779e-06,
+      "loss": 2.3718,
+      "step": 670
+    },
+    {
+      "epoch": 2.6474890297415894,
+      "grad_norm": 6.7963457107543945,
+      "learning_rate": 8.164062500000001e-06,
+      "loss": 2.3544,
+      "step": 680
+    },
+    {
+      "epoch": 2.686494392979035,
+      "grad_norm": 10.213848114013672,
+      "learning_rate": 8.120659722222224e-06,
+      "loss": 2.3501,
+      "step": 690
+    },
+    {
+      "epoch": 2.7254997562164798,
+      "grad_norm": 6.80430269241333,
+      "learning_rate": 8.077256944444444e-06,
+      "loss": 2.2806,
+      "step": 700
+    },
+    {
+      "epoch": 2.7645051194539247,
+      "grad_norm": 6.852050304412842,
+      "learning_rate": 8.033854166666667e-06,
+      "loss": 2.3389,
+      "step": 710
+    },
+    {
+      "epoch": 2.80351048269137,
+      "grad_norm": 8.63313102722168,
+      "learning_rate": 7.99045138888889e-06,
+      "loss": 2.3668,
+      "step": 720
+    },
+    {
+      "epoch": 2.842515845928815,
+      "grad_norm": 8.344212532043457,
+      "learning_rate": 7.947048611111112e-06,
+      "loss": 2.2608,
+      "step": 730
+    },
+    {
+      "epoch": 2.8815212091662605,
+      "grad_norm": 7.747754096984863,
+      "learning_rate": 7.903645833333334e-06,
+      "loss": 2.3099,
+      "step": 740
+    },
+    {
+      "epoch": 2.9205265724037055,
+      "grad_norm": 8.065759658813477,
+      "learning_rate": 7.860243055555557e-06,
+      "loss": 2.1869,
+      "step": 750
+    },
+    {
+      "epoch": 2.9595319356411505,
+      "grad_norm": 9.365443229675293,
+      "learning_rate": 7.81684027777778e-06,
+      "loss": 2.266,
+      "step": 760
+    },
+    {
+      "epoch": 2.998537298878596,
+      "grad_norm": 7.615650653839111,
+      "learning_rate": 7.7734375e-06,
+      "loss": 2.1923,
+      "step": 770
+    },
+    {
+      "epoch": 3.0,
+      "eval_accuracy": 0.27693807898586054,
+      "eval_f1_macro": 0.23444058368942994,
+      "eval_f1_micro": 0.27693807898586054,
+      "eval_f1_weighted": 0.2232954691057457,
+      "eval_loss": 2.2444159984588623,
+      "eval_precision_macro": 0.42520232898903443,
+      "eval_precision_micro": 0.27693807898586054,
+      "eval_precision_weighted": 0.36698946639719304,
+      "eval_recall_macro": 0.2559615112919232,
+      "eval_recall_micro": 0.27693807898586054,
+      "eval_recall_weighted": 0.27693807898586054,
+      "eval_runtime": 57.5648,
+      "eval_samples_per_second": 35.629,
+      "eval_steps_per_second": 4.465,
+      "step": 771
+    },
+    {
+      "epoch": 3.0351048269137006,
+      "grad_norm": 6.9213056564331055,
+      "learning_rate": 7.730034722222223e-06,
+      "loss": 1.9593,
+      "step": 780
+    },
+    {
+      "epoch": 3.0741101901511456,
+      "grad_norm": 7.0944366455078125,
+      "learning_rate": 7.686631944444445e-06,
+      "loss": 2.0703,
+      "step": 790
+    },
+    {
+      "epoch": 3.113115553388591,
+      "grad_norm": 7.207167148590088,
+      "learning_rate": 7.643229166666668e-06,
+      "loss": 2.1229,
+      "step": 800
+    },
+    {
+      "epoch": 3.152120916626036,
+      "grad_norm": 8.827300071716309,
+      "learning_rate": 7.599826388888889e-06,
+      "loss": 2.0435,
+      "step": 810
+    },
+    {
+      "epoch": 3.1911262798634814,
+      "grad_norm": 8.51149845123291,
+      "learning_rate": 7.5564236111111125e-06,
+      "loss": 2.1189,
+      "step": 820
+    },
+    {
+      "epoch": 3.2301316431009264,
+      "grad_norm": 9.00069808959961,
+      "learning_rate": 7.513020833333334e-06,
+      "loss": 1.9885,
+      "step": 830
+    },
+    {
+      "epoch": 3.2691370063383713,
+      "grad_norm": 7.135461330413818,
+      "learning_rate": 7.469618055555557e-06,
+      "loss": 2.043,
+      "step": 840
+    },
+    {
+      "epoch": 3.3081423695758168,
+      "grad_norm": 7.121860027313232,
+      "learning_rate": 7.426215277777778e-06,
+      "loss": 2.1203,
+      "step": 850
+    },
+    {
+      "epoch": 3.3471477328132617,
+      "grad_norm": 7.476314067840576,
+      "learning_rate": 7.382812500000001e-06,
+      "loss": 2.008,
+      "step": 860
+    },
+    {
+      "epoch": 3.386153096050707,
+      "grad_norm": 11.115015029907227,
+      "learning_rate": 7.339409722222222e-06,
+      "loss": 2.0098,
+      "step": 870
+    },
+    {
+      "epoch": 3.425158459288152,
+      "grad_norm": 6.821423053741455,
+      "learning_rate": 7.296006944444445e-06,
+      "loss": 2.0252,
+      "step": 880
+    },
+    {
+      "epoch": 3.464163822525597,
+      "grad_norm": 12.535731315612793,
+      "learning_rate": 7.2526041666666665e-06,
+      "loss": 1.9571,
+      "step": 890
+    },
+    {
+      "epoch": 3.5031691857630425,
+      "grad_norm": 8.49023723602295,
+      "learning_rate": 7.209201388888889e-06,
+      "loss": 1.9901,
+      "step": 900
+    },
+    {
+      "epoch": 3.5421745490004874,
+      "grad_norm": 9.62365436553955,
+      "learning_rate": 7.165798611111112e-06,
+      "loss": 1.9254,
+      "step": 910
+    },
+    {
+      "epoch": 3.581179912237933,
+      "grad_norm": 8.030123710632324,
+      "learning_rate": 7.122395833333334e-06,
+      "loss": 1.9497,
+      "step": 920
+    },
+    {
+      "epoch": 3.620185275475378,
+      "grad_norm": 9.932555198669434,
+      "learning_rate": 7.0789930555555564e-06,
+      "loss": 1.9421,
+      "step": 930
+    },
+    {
+      "epoch": 3.659190638712823,
+      "grad_norm": 10.256240844726562,
+      "learning_rate": 7.035590277777778e-06,
+      "loss": 1.8403,
+      "step": 940
+    },
+    {
+      "epoch": 3.698196001950268,
+      "grad_norm": 8.8562593460083,
+      "learning_rate": 6.9921875000000006e-06,
+      "loss": 1.835,
+      "step": 950
+    },
+    {
+      "epoch": 3.737201365187713,
+      "grad_norm": 9.009734153747559,
+      "learning_rate": 6.948784722222223e-06,
+      "loss": 1.9243,
+      "step": 960
+    },
+    {
+      "epoch": 3.7762067284251586,
+      "grad_norm": 7.639193058013916,
+      "learning_rate": 6.905381944444445e-06,
+      "loss": 1.9483,
+      "step": 970
+    },
+    {
+      "epoch": 3.8152120916626036,
+      "grad_norm": 11.056807518005371,
+      "learning_rate": 6.861979166666667e-06,
+      "loss": 1.9227,
+      "step": 980
+    },
+    {
+      "epoch": 3.8542174549000485,
+      "grad_norm": 11.807608604431152,
+      "learning_rate": 6.818576388888889e-06,
+      "loss": 1.9521,
+      "step": 990
+    },
+    {
+      "epoch": 3.893222818137494,
+      "grad_norm": 8.170421600341797,
+      "learning_rate": 6.775173611111112e-06,
+      "loss": 1.8677,
+      "step": 1000
+    },
+    {
+      "epoch": 3.932228181374939,
+      "grad_norm": 9.836169242858887,
+      "learning_rate": 6.731770833333335e-06,
+      "loss": 1.8232,
+      "step": 1010
+    },
+    {
+      "epoch": 3.9712335446123843,
+      "grad_norm": 10.409213066101074,
+      "learning_rate": 6.688368055555556e-06,
+      "loss": 1.878,
+      "step": 1020
+    },
+    {
+      "epoch": 4.0,
+      "eval_accuracy": 0.3554363725012189,
+      "eval_f1_macro": 0.3424708705030215,
+      "eval_f1_micro": 0.3554363725012189,
+      "eval_f1_weighted": 0.30902224255328264,
+      "eval_loss": 1.9913461208343506,
+      "eval_precision_macro": 0.46004367455197387,
+      "eval_precision_micro": 0.3554363725012189,
+      "eval_precision_weighted": 0.41659948847945955,
+      "eval_recall_macro": 0.36864660751423883,
+      "eval_recall_micro": 0.3554363725012189,
+      "eval_recall_weighted": 0.3554363725012189,
+      "eval_runtime": 57.605,
+      "eval_samples_per_second": 35.605,
+      "eval_steps_per_second": 4.461,
+      "step": 1028
+    },
+    {
+      "epoch": 4.007801072647489,
+      "grad_norm": 10.35783576965332,
+      "learning_rate": 6.644965277777779e-06,
+      "loss": 1.8021,
+      "step": 1030
+    },
+    {
+      "epoch": 4.0468064358849345,
+      "grad_norm": 6.1023101806640625,
+      "learning_rate": 6.6015625e-06,
+      "loss": 1.6937,
+      "step": 1040
+    },
+    {
+      "epoch": 4.0858117991223795,
+      "grad_norm": 9.223121643066406,
+      "learning_rate": 6.558159722222223e-06,
+      "loss": 1.671,
+      "step": 1050
+    },
+    {
+      "epoch": 4.124817162359824,
+      "grad_norm": 11.505966186523438,
+      "learning_rate": 6.5147569444444445e-06,
+      "loss": 1.7108,
+      "step": 1060
+    },
+    {
+      "epoch": 4.163822525597269,
+      "grad_norm": 8.100488662719727,
+      "learning_rate": 6.471354166666667e-06,
+      "loss": 1.7243,
+      "step": 1070
+    },
+    {
+      "epoch": 4.202827888834714,
+      "grad_norm": 10.167851448059082,
+      "learning_rate": 6.427951388888889e-06,
+      "loss": 1.6785,
+      "step": 1080
+    },
+    {
+      "epoch": 4.24183325207216,
+      "grad_norm": 9.894684791564941,
+      "learning_rate": 6.384548611111112e-06,
+      "loss": 1.6085,
+      "step": 1090
+    },
+    {
+      "epoch": 4.280838615309605,
+      "grad_norm": 14.413894653320312,
+      "learning_rate": 6.3411458333333344e-06,
+      "loss": 1.6503,
+      "step": 1100
+    },
+    {
+      "epoch": 4.31984397854705,
+      "grad_norm": 9.841206550598145,
+      "learning_rate": 6.297743055555556e-06,
+      "loss": 1.6533,
+      "step": 1110
+    },
+    {
+      "epoch": 4.358849341784495,
+      "grad_norm": 10.768450736999512,
+      "learning_rate": 6.2543402777777786e-06,
+      "loss": 1.6423,
+      "step": 1120
+    },
+    {
+      "epoch": 4.39785470502194,
+      "grad_norm": 10.424446105957031,
+      "learning_rate": 6.2109375e-06,
+      "loss": 1.704,
+      "step": 1130
+    },
+    {
+      "epoch": 4.436860068259386,
+      "grad_norm": 12.57535171508789,
+      "learning_rate": 6.167534722222223e-06,
+      "loss": 1.6415,
+      "step": 1140
+    },
+    {
+      "epoch": 4.475865431496831,
+      "grad_norm": 12.024733543395996,
+      "learning_rate": 6.124131944444444e-06,
+      "loss": 1.6701,
+      "step": 1150
+    },
+    {
+      "epoch": 4.514870794734276,
+      "grad_norm": 14.477334976196289,
+      "learning_rate": 6.080729166666667e-06,
+      "loss": 1.6661,
+      "step": 1160
+    },
+    {
+      "epoch": 4.553876157971721,
+      "grad_norm": 12.958348274230957,
+      "learning_rate": 6.037326388888889e-06,
+      "loss": 1.6084,
+      "step": 1170
+    },
+    {
+      "epoch": 4.592881521209167,
+      "grad_norm": 10.68494987487793,
+      "learning_rate": 5.993923611111112e-06,
+      "loss": 1.6175,
+      "step": 1180
+    },
+    {
+      "epoch": 4.631886884446612,
+      "grad_norm": 13.702882766723633,
+      "learning_rate": 5.950520833333334e-06,
+      "loss": 1.6614,
+      "step": 1190
+    },
+    {
+      "epoch": 4.670892247684057,
+      "grad_norm": 11.554649353027344,
+      "learning_rate": 5.907118055555556e-06,
+      "loss": 1.5768,
+      "step": 1200
+    },
+    {
+      "epoch": 4.709897610921502,
+      "grad_norm": 12.292317390441895,
+      "learning_rate": 5.863715277777778e-06,
+      "loss": 1.5714,
+      "step": 1210
+    },
+    {
+      "epoch": 4.748902974158947,
+      "grad_norm": 12.34539794921875,
+      "learning_rate": 5.820312500000001e-06,
+      "loss": 1.6122,
+      "step": 1220
+    },
+    {
+      "epoch": 4.7879083373963915,
+      "grad_norm": 9.150538444519043,
+      "learning_rate": 5.7769097222222225e-06,
+      "loss": 1.5502,
+      "step": 1230
+    },
+    {
+      "epoch": 4.826913700633837,
+      "grad_norm": 12.019886016845703,
+      "learning_rate": 5.733506944444445e-06,
+      "loss": 1.5283,
+      "step": 1240
+    },
+    {
+      "epoch": 4.865919063871282,
+      "grad_norm": 13.477303504943848,
+      "learning_rate": 5.690104166666667e-06,
+      "loss": 1.5673,
+      "step": 1250
+    },
+    {
+      "epoch": 4.904924427108727,
+      "grad_norm": 14.153918266296387,
+      "learning_rate": 5.646701388888889e-06,
+      "loss": 1.5456,
+      "step": 1260
+    },
+    {
+      "epoch": 4.943929790346172,
+      "grad_norm": 12.06778335571289,
+      "learning_rate": 5.6032986111111124e-06,
+      "loss": 1.5221,
+      "step": 1270
+    },
+    {
+      "epoch": 4.982935153583618,
+      "grad_norm": 14.565933227539062,
+      "learning_rate": 5.559895833333334e-06,
+      "loss": 1.4679,
+      "step": 1280
+    },
+    {
+      "epoch": 5.0,
+      "eval_accuracy": 0.3793271574841541,
+      "eval_f1_macro": 0.3788654736153261,
+      "eval_f1_micro": 0.3793271574841541,
+      "eval_f1_weighted": 0.3406548058322202,
+      "eval_loss": 1.980505347251892,
+      "eval_precision_macro": 0.40541928460663945,
+      "eval_precision_micro": 0.3793271574841541,
+      "eval_precision_weighted": 0.3634818029255939,
+      "eval_recall_macro": 0.40614544202326364,
+      "eval_recall_micro": 0.3793271574841541,
+      "eval_recall_weighted": 0.3793271574841541,
+      "eval_runtime": 57.5587,
+      "eval_samples_per_second": 35.633,
+      "eval_steps_per_second": 4.465,
+      "step": 1285
+    },
+    {
+      "epoch": 5.0195026816187225,
+      "grad_norm": 10.44895076751709,
+      "learning_rate": 5.5164930555555566e-06,
+      "loss": 1.3376,
+      "step": 1290
+    },
+    {
+      "epoch": 5.0585080448561675,
+      "grad_norm": 15.51266860961914,
+      "learning_rate": 5.4774305555555565e-06,
+      "loss": 1.479,
+      "step": 1300
+    },
+    {
+      "epoch": 5.097513408093613,
+      "grad_norm": 11.123811721801758,
+      "learning_rate": 5.434027777777778e-06,
+      "loss": 1.3313,
+      "step": 1310
+    },
+    {
+      "epoch": 5.136518771331058,
+      "grad_norm": 10.911710739135742,
+      "learning_rate": 5.390625000000001e-06,
+      "loss": 1.406,
+      "step": 1320
+    },
+    {
+      "epoch": 5.175524134568503,
+      "grad_norm": 12.338854789733887,
+      "learning_rate": 5.347222222222222e-06,
+      "loss": 1.3619,
+      "step": 1330
+    },
+    {
+      "epoch": 5.214529497805948,
+      "grad_norm": 10.681340217590332,
+      "learning_rate": 5.303819444444445e-06,
+      "loss": 1.3803,
+      "step": 1340
+    },
+    {
+      "epoch": 5.253534861043393,
+      "grad_norm": 12.806472778320312,
+      "learning_rate": 5.260416666666666e-06,
+      "loss": 1.4016,
+      "step": 1350
+    },
+    {
+      "epoch": 5.292540224280838,
+      "grad_norm": 9.82974624633789,
+      "learning_rate": 5.217013888888889e-06,
+      "loss": 1.4298,
+      "step": 1360
+    },
+    {
+      "epoch": 5.331545587518284,
+      "grad_norm": 9.38745403289795,
+      "learning_rate": 5.173611111111112e-06,
+      "loss": 1.2707,
+      "step": 1370
+    },
+    {
+      "epoch": 5.370550950755729,
+      "grad_norm": 11.31470012664795,
+      "learning_rate": 5.130208333333334e-06,
+      "loss": 1.2818,
+      "step": 1380
+    },
+    {
+      "epoch": 5.409556313993174,
+      "grad_norm": 12.014089584350586,
+      "learning_rate": 5.086805555555556e-06,
+      "loss": 1.3868,
+      "step": 1390
+    },
+    {
+      "epoch": 5.448561677230619,
+      "grad_norm": 12.203828811645508,
+      "learning_rate": 5.043402777777778e-06,
+      "loss": 1.2886,
+      "step": 1400
+    },
+    {
+      "epoch": 5.487567040468065,
+      "grad_norm": 15.790043830871582,
+      "learning_rate": 5e-06,
+      "loss": 1.2743,
+      "step": 1410
+    },
+    {
+      "epoch": 5.52657240370551,
+      "grad_norm": 13.66932201385498,
+      "learning_rate": 4.956597222222223e-06,
+      "loss": 1.2872,
+      "step": 1420
+    },
+    {
+      "epoch": 5.565577766942955,
+      "grad_norm": 11.339312553405762,
+      "learning_rate": 4.9131944444444445e-06,
+      "loss": 1.3496,
+      "step": 1430
+    },
+    {
+      "epoch": 5.6045831301804,
+      "grad_norm": 10.514497756958008,
+      "learning_rate": 4.8741319444444444e-06,
+      "loss": 1.2668,
+      "step": 1440
+    },
+    {
+      "epoch": 5.643588493417845,
+      "grad_norm": 14.161802291870117,
+      "learning_rate": 4.830729166666667e-06,
+      "loss": 1.3988,
+      "step": 1450
+    },
+    {
+      "epoch": 5.6825938566552905,
+      "grad_norm": 13.395609855651855,
+      "learning_rate": 4.787326388888889e-06,
+      "loss": 1.2777,
+      "step": 1460
+    },
+    {
+      "epoch": 5.7215992198927355,
+      "grad_norm": 16.105741500854492,
+      "learning_rate": 4.743923611111111e-06,
+      "loss": 1.3207,
+      "step": 1470
+    },
+    {
+      "epoch": 5.76060458313018,
+      "grad_norm": 12.356030464172363,
+      "learning_rate": 4.7005208333333335e-06,
+      "loss": 1.3008,
+      "step": 1480
+    },
+    {
+      "epoch": 5.799609946367625,
+      "grad_norm": 16.024171829223633,
+      "learning_rate": 4.657118055555556e-06,
+      "loss": 1.3169,
+      "step": 1490
+    },
+    {
+      "epoch": 5.83861530960507,
+      "grad_norm": 13.603280067443848,
+      "learning_rate": 4.6137152777777785e-06,
+      "loss": 1.3377,
+      "step": 1500
+    },
+    {
+      "epoch": 5.877620672842516,
+      "grad_norm": 12.428413391113281,
+      "learning_rate": 4.5703125e-06,
+      "loss": 1.3143,
+      "step": 1510
+    },
+    {
+      "epoch": 5.916626036079961,
+      "grad_norm": 12.86538028717041,
+      "learning_rate": 4.526909722222223e-06,
+      "loss": 1.3215,
+      "step": 1520
+    },
+    {
+      "epoch": 5.955631399317406,
+      "grad_norm": 17.084808349609375,
+      "learning_rate": 4.483506944444444e-06,
+      "loss": 1.3156,
+      "step": 1530
+    },
+    {
+      "epoch": 5.994636762554851,
+      "grad_norm": 11.272918701171875,
+      "learning_rate": 4.440104166666668e-06,
+      "loss": 1.2399,
+      "step": 1540
+    },
+    {
+      "epoch": 6.0,
+      "eval_accuracy": 0.40711847879083374,
+      "eval_f1_macro": 0.43647747790260216,
+      "eval_f1_micro": 0.40711847879083374,
+      "eval_f1_weighted": 0.3874051890698862,
+      "eval_loss": 1.9677170515060425,
+      "eval_precision_macro": 0.49034231056721467,
+      "eval_precision_micro": 0.40711847879083374,
+      "eval_precision_weighted": 0.4284233711977137,
+      "eval_recall_macro": 0.4407702395816866,
+      "eval_recall_micro": 0.40711847879083374,
+      "eval_recall_weighted": 0.40711847879083374,
+      "eval_runtime": 57.6083,
+      "eval_samples_per_second": 35.603,
+      "eval_steps_per_second": 4.461,
+      "step": 1542
+    }
+  ],
+  "logging_steps": 10,
+  "max_steps": 2560,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 10,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 5,
+        "early_stopping_threshold": 0.01
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 4.587586907052442e+16,
+  "train_batch_size": 4,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-1542/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9a02b0d078d86ef0a1711524deea83d7a31c2e9047f6f3914251d4766e478633
+size 5368

config.json ADDED Viewed

	@@ -0,0 +1,73 @@

+{
+  "_name_or_path": "microsoft/deberta-v3-large",
+  "_num_labels": 16,
+  "architectures": [
+    "DebertaV2ForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 1024,
+  "id2label": {
+    "0": "enfj",
+    "1": "enfp",
+    "2": "entj",
+    "3": "entp",
+    "4": "esfj",
+    "5": "esfp",
+    "6": "estj",
+    "7": "estp",
+    "8": "infj",
+    "9": "infp",
+    "10": "intj",
+    "11": "intp",
+    "12": "isfj",
+    "13": "isfp",
+    "14": "istj",
+    "15": "istp"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 4096,
+  "label2id": {
+    "enfj": 0,
+    "enfp": 1,
+    "entj": 2,
+    "entp": 3,
+    "esfj": 4,
+    "esfp": 5,
+    "estj": 6,
+    "estp": 7,
+    "infj": 8,
+    "infp": 9,
+    "intj": 10,
+    "intp": 11,
+    "isfj": 12,
+    "isfp": 13,
+    "istj": 14,
+    "istp": 15
+  },
+  "layer_norm_eps": 1e-07,
+  "legacy": true,
+  "max_position_embeddings": 512,
+  "max_relative_positions": -1,
+  "model_type": "deberta-v2",
+  "norm_rel_ebd": "layer_norm",
+  "num_attention_heads": 16,
+  "num_hidden_layers": 24,
+  "pad_token_id": 0,
+  "pooler_dropout": 0,
+  "pooler_hidden_act": "gelu",
+  "pooler_hidden_size": 1024,
+  "pos_att_type": [
+    "p2c",
+    "c2p"
+  ],
+  "position_biased_input": false,
+  "position_buckets": 256,
+  "relative_attention": true,
+  "share_att_key": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.48.0",
+  "type_vocab_size": 0,
+  "vocab_size": 128100
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0c9b5b9de47af2e45c14a96ab10be692e0caf5e1ae04b1a717235a34c072f012
+size 1740361848

runs/Jan21_15-38-16_r-idobn-twitter-mbti-2rmya185-a2492-5fds5/events.out.tfevents.1769009898.r-idobn-twitter-mbti-2rmya185-a2492-5fds5.120.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4ae04a51f32d0ff40558520b8ac6c5420853b18c481a4a3c208dac0220da9cd3
-size 63268

 version https://git-lfs.github.com/spec/v1
+oid sha256:0dd2028fa475d3218fa9bfbe2d5f1ccfd1460eeae1e4a3166dbab412489f3a2f
+size 68464

runs/Jan21_15-38-16_r-idobn-twitter-mbti-2rmya185-a2492-5fds5/events.out.tfevents.1769017304.r-idobn-twitter-mbti-2rmya185-a2492-5fds5.120.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e72f600ffc5d8ad8eeac7b8964d4b71ddaab5ae014180d5a422f8cf63fd89c37
+size 921

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "bos_token": "[CLS]",
+  "cls_token": "[CLS]",
+  "eos_token": "[SEP]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": {
+    "content": "[UNK]",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  }
+}

spm.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c679fbf93643d19aab7ee10c0b99e460bdbc02fedf34b92b05af343b4af586fd
+size 2464616

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,59 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "128000": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "[CLS]",
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "[CLS]",
+  "do_lower_case": false,
+  "eos_token": "[SEP]",
+  "extra_special_tokens": {},
+  "mask_token": "[MASK]",
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "sp_model_kwargs": {},
+  "split_by_punct": false,
+  "tokenizer_class": "DebertaV2Tokenizer",
+  "unk_token": "[UNK]",
+  "vocab_type": "spm"
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9a02b0d078d86ef0a1711524deea83d7a31c2e9047f6f3914251d4766e478633
+size 5368

training_params.json ADDED Viewed

	@@ -0,0 +1,30 @@

+{
+    "data_path": "twitter-mbti-v2/autotrain-data",
+    "model": "microsoft/deberta-v3-large",
+    "lr": 1e-05,
+    "epochs": 10,
+    "max_seq_length": 512,
+    "batch_size": 4,
+    "warmup_ratio": 0.1,
+    "gradient_accumulation": 8,
+    "optimizer": "adamw_torch",
+    "scheduler": "linear",
+    "weight_decay": 0.01,
+    "max_grad_norm": 1.0,
+    "seed": 42,
+    "train_split": "train",
+    "valid_split": "validation",
+    "text_column": "autotrain_text",
+    "target_column": "autotrain_label",
+    "logging_steps": 10,
+    "project_name": "twitter-mbti-v2",
+    "auto_find_batch_size": false,
+    "mixed_precision": "fp16",
+    "save_total_limit": 1,
+    "push_to_hub": true,
+    "eval_strategy": "epoch",
+    "username": "idobn",
+    "log": "tensorboard",
+    "early_stopping_patience": 5,
+    "early_stopping_threshold": 0.01
+}