Training in progress, epoch 1

Browse files

Files changed (14) hide show

adapter_model.safetensors +1 -1
final/adapter_config.json +2 -2
final/adapter_model.safetensors +1 -1
final/training_config.json +7 -7
logs/20260109-133806/events.out.tfevents.1767937088.r-lujin-train-search-ner-331oo3bz-6c66e-8xn59.536.0 +2 -2
logs/20260109-133806/events.out.tfevents.1767937151.r-lujin-train-search-ner-331oo3bz-6c66e-8xn59.536.1 +3 -0
logs/20260109-134833/events.out.tfevents.1767937714.r-lujin-train-search-ner-331oo3bz-6c66e-8xn59.1518.0 +3 -0
search-ner-lora-model/config.json +66 -0
search-ner-lora-model/model.safetensors +3 -0
search-ner-lora-model/special_tokens_map.json +37 -0
search-ner-lora-model/tokenizer.json +0 -0
search-ner-lora-model/tokenizer_config.json +62 -0
search-ner-lora-model/vocab.txt +0 -0
training_args.bin +1 -1

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:96416577097d4c41fc14f1d43040a8a0e724fa48c41f6ac8287fee7652dbf260
 size 5387004

 version https://git-lfs.github.com/spec/v1
+oid sha256:4633e0f7265c39f0af0d59009d7dd7030d19e65b67e36e97fcc271270d8a8ed3
 size 5387004

final/adapter_config.json CHANGED Viewed

@@ -32,9 +32,9 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "dense",
-    "key",
     "value",
     "query"
   ],
   "target_parameters": null,

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "value",
+    "key",
+    "dense",
     "query"
   ],
   "target_parameters": null,

final/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a6e4e1c1d14aa5fcce9df3ad6de1a60e7706872557589270aaaba2c5a82ee4af
 size 5387004

 version https://git-lfs.github.com/spec/v1
+oid sha256:7956fbc17bbd28e8815dad60f3a6105b92afe5ce8a6ed4e81d91ac488fe13d80
 size 5387004

final/training_config.json CHANGED Viewed

@@ -7,13 +7,13 @@
   "batch_size": 16,
   "num_epochs": 10,
   "final_metrics": {
-    "eval_loss": 0.0005899938987568021,
-    "eval_precision": 1.0,
-    "eval_recall": 1.0,
-    "eval_f1": 1.0,
-    "eval_runtime": 0.5923,
-    "eval_samples_per_second": 675.317,
-    "eval_steps_per_second": 42.207,
     "epoch": 7.0
   },
   "label_list": [

   "batch_size": 16,
   "num_epochs": 10,
   "final_metrics": {
+    "eval_loss": 0.005412294063717127,
+    "eval_precision": 0.997907949790795,
+    "eval_recall": 0.997907949790795,
+    "eval_f1": 0.997907949790795,
+    "eval_runtime": 0.6175,
+    "eval_samples_per_second": 323.895,
+    "eval_steps_per_second": 21.053,
     "epoch": 7.0
   },
   "label_list": [

logs/20260109-133806/events.out.tfevents.1767937088.r-lujin-train-search-ner-331oo3bz-6c66e-8xn59.536.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e17ee1cdc4784a9a57bf63991ce2e540bf68e8ad6a3bd2e07220adfb02ad02f3
-size 11064

 version https://git-lfs.github.com/spec/v1
+oid sha256:004a63929cb0af33fc1505555346350ad80e1dba4544131e3e1b0c45f79f0b48
+size 12260

logs/20260109-133806/events.out.tfevents.1767937151.r-lujin-train-search-ner-331oo3bz-6c66e-8xn59.536.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3c55c09bc8c4c93184cb4bf90086b97bf96290546108353cba2c1466bc774fa3
+size 508

logs/20260109-134833/events.out.tfevents.1767937714.r-lujin-train-search-ner-331oo3bz-6c66e-8xn59.1518.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:338c9dec52aea5dc301bb2978aebccbabb2ff76770b618e26607ad5f72963bfb
+size 8550

search-ner-lora-model/config.json ADDED Viewed

	@@ -0,0 +1,66 @@

+{
+  "architectures": [
+    "BertForTokenClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "dtype": "float32",
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "O",
+    "1": "B-TIME",
+    "2": "I-TIME",
+    "3": "B-LOCATION",
+    "4": "I-LOCATION",
+    "5": "B-PERSON",
+    "6": "I-PERSON",
+    "7": "B-ORGANIZATION",
+    "8": "I-ORGANIZATION",
+    "9": "B-PRODUCT",
+    "10": "I-PRODUCT",
+    "11": "B-EVENT",
+    "12": "I-EVENT",
+    "13": "B-TOPIC",
+    "14": "I-TOPIC",
+    "15": "B-CONCEPT",
+    "16": "I-CONCEPT",
+    "17": "B-SEARCH_INTENT",
+    "18": "I-SEARCH_INTENT"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "B-CONCEPT": 15,
+    "B-EVENT": 11,
+    "B-LOCATION": 3,
+    "B-ORGANIZATION": 7,
+    "B-PERSON": 5,
+    "B-PRODUCT": 9,
+    "B-SEARCH_INTENT": 17,
+    "B-TIME": 1,
+    "B-TOPIC": 13,
+    "I-CONCEPT": 16,
+    "I-EVENT": 12,
+    "I-LOCATION": 4,
+    "I-ORGANIZATION": 8,
+    "I-PERSON": 6,
+    "I-PRODUCT": 10,
+    "I-SEARCH_INTENT": 18,
+    "I-TIME": 2,
+    "I-TOPIC": 14,
+    "O": 0
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "transformers_version": "4.57.3",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 21128
+}

search-ner-lora-model/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4abc46418334e01514022ff919d1049819e86dbc8023365813babc7ba1017548
+size 406789980

search-ner-lora-model/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,37 @@

+{
+  "cls_token": {
+    "content": "[CLS]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "mask_token": {
+    "content": "[MASK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "[PAD]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "sep_token": {
+    "content": "[SEP]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "[UNK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

search-ner-lora-model/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

search-ner-lora-model/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_basic_tokenize": true,
+  "do_lower_case": true,
+  "extra_special_tokens": {},
+  "mask_token": "[MASK]",
+  "max_length": 512,
+  "model_max_length": 1000000000000000019884624838656,
+  "never_split": null,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "stride": 0,
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "truncation_side": "right",
+  "truncation_strategy": "longest_first",
+  "unk_token": "[UNK]"
+}

search-ner-lora-model/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:30bb792ac207bda2fa0a184e5a993e2146480d0e5b431fb7a1d24e11e0a7fbd4
 size 5841

 version https://git-lfs.github.com/spec/v1
+oid sha256:290380ec95c540f3947f84950f4f0f12d32b4f3b2905886d39f542a10b429ebc
 size 5841