usr256864 committed on Sep 27, 2025

Commit

6df4d35

verified ·

1 Parent(s): 0952acb

Upload folder using huggingface_hub

Browse files

Files changed (18) hide show

args.txt +13 -0
config_kwargs.json +41 -0
experiment_params.json +248 -0
log.txt +36 -0
lora_config.json +28 -0
metrics.tex +112 -0
model-epoch=03-mean_f1=0.1669_sd=42.ckpt +3 -0
predictions/predictions_0.json +1 -0
predictions/predictions_1.json +1 -0
predictions/predictions_2.json +1 -0
predictions/predictions_3.json +1 -0
predictions/predictions_4.json +1 -0
predictions/predictions_5.json +1 -0
predictions/predictions_6.json +1 -0
predictions/predictions_7.json +1 -0
qualitative_analysis.txt +0 -0
quantization_config.json +1 -0
test_metrics.tex +12 -0

args.txt ADDED Viewed

	@@ -0,0 +1,13 @@

+  --train_batch_size 1
+  --eval_batch_size 1
+  --num_train_epochs 20
+  --nbr_gpus 1
+  --learning_rate 5e-6
+  --grad_check
+  --config experiments/event_extraction/config_code_generator.json
+  --non_strict_load
+  --ds ../datasets/textee/wikievents
+  --answer_generator HiTZ/GoLLIE-7B
+  --guidelines new_Llama-31-8B-Instruct_annotation_guidelines
+  --k_schemes 10
+  --num_passages 5

config_kwargs.json ADDED Viewed

	@@ -0,0 +1,41 @@

+{
+  "monitor_metric": "mean_f1",
+  "trainer_kwargs": {
+    "class_name": "Event_Extractor_Code"
+  },
+  "trainee_kwargs": {
+    "class_name": "EE",
+    "prompt_cls": "event_extraction_code",
+    "loss": {
+      "class_name": "NLLLoss"
+    },
+    "freeze_prefixes": []
+  },
+  "data_module_kwargs": {
+    "class_name": "event_extraction_DataModule",
+    "data_processor": {
+      "class_name": "viquae_data_processor",
+      "train_path": "viquae/train/",
+      "val_path": "viquae/val/",
+      "test_path": "viquae/test/"
+    },
+    "dataloader_kwargs": {
+      "num_workers": 6,
+      "prefetch_factor": 2
+    }
+  },
+  "answer_generator_kwargs": {
+    "dividable": true,
+    "checkpoint_name": "answer_generator",
+    "rag_training": false,
+    "rag": false,
+    "wo_kb": true,
+    "generator_only": true,
+    "entity_prompt": false,
+    "beam_search": true,
+    "best_answer": false,
+    "best_entity": false,
+    "inference_path": "saved_models/wikievents/GoLLIE-7B/code_generator/train/2025-09-26/19-34-03/answer_generator"
+  },
+  "all_datasets_path": "../datasets"
+}

experiment_params.json ADDED Viewed

	@@ -0,0 +1,248 @@

+{
+  "max_seq_length": 256,
+  "question_max_seq_length": 256,
+  "RC": false,
+  "coco": false,
+  "flickr": false,
+  "aokvqa": false,
+  "grad_check": true,
+  "MJL": false,
+  "debug_run_time": false,
+  "debug_output": false,
+  "only_neighbors": false,
+  "full_kb": false,
+  "image_eval": false,
+  "embedding_column": "my_DPR_few_shot",
+  "output_ds": null,
+  "output_kb": null,
+  "embed": false,
+  "data_path": null,
+  "train_batch_size": 1,
+  "eval_batch_size": 1,
+  "viquae_dev_batch_size": 1000,
+  "transformer_model_name": "bert-base-uncased",
+  "gradient_accumulation_steps": 1,
+  "warmup_proportion": 0.1,
+  "weight_decay": 0.01,
+  "lr_decay": false,
+  "adam_beta1": 0.9,
+  "adam_beta2": 0.999,
+  "warmup_steps": 4,
+  "adam_epsilon": 1e-08,
+  "num_train_epochs": 20,
+  "learning_rate": 5e-06,
+  "dropout": 0.5,
+  "bert_hidden_size": 768,
+  "MM": null,
+  "use_graph_P": null,
+  "use_graph_Q": null,
+  "syntactic_P": null,
+  "syntactic_Q": null,
+  "NS": false,
+  "IC_Q": false,
+  "IC_P": false,
+  "gcn_lr": 2e-05,
+  "clip_lr": null,
+  "dpr_lr": null,
+  "head_lr": 2e-06,
+  "func": "cat",
+  "graph_pooling": "mean",
+  "max_nbr_nodes": 2,
+  "num_neib": 1,
+  "neib_depth": 1,
+  "undirect": false,
+  "node_hidden_size": 128,
+  "max_num_relations": null,
+  "max_num_syntactic_relations": null,
+  "map_wikidataRelCode_to_idx": null,
+  "graph_layout": "fr",
+  "residual": false,
+  "num_gcn": null,
+  "node_alias_max_len": 32,
+  "attention": false,
+  "num_paths": 1,
+  "kg_embed": false,
+  "graph_only": false,
+  "freeze": false,
+  "sanity_run": false,
+  "scale_losses": false,
+  "check_answers": false,
+  "load_4bit": false,
+  "load_8bit": false,
+  "device_id": null,
+  "drop_last": false,
+  "disable_checkpointing": false,
+  "samples": null,
+  "sample_id": null,
+  "datasets_root_dir": "../datasets",
+  "ds": "../datasets/textee/wikievents",
+  "supp_train_ds": null,
+  "guidelines": "new_Llama-31-8B-Instruct_annotation_guidelines",
+  "num_trainable_params": null,
+  "num_all_param": null,
+  "trainable_ratio": null,
+  "train_sanity_run": false,
+  "enhanced_question": false,
+  "use_entity_type": false,
+  "filter_edges": false,
+  "draw": false,
+  "layer_norm": false,
+  "filters_3": 768,
+  "tensor_neurons": 16,
+  "output_dir": "saved_models/wikievents/GoLLIE-7B/code_generator/train/2025-09-26/19-34-03",
+  "main_dir": "/fscratch/oadjali/EEE",
+  "experiment_dir": "/fscratch/oadjali/EEE/saved_models/wikievents/GoLLIE-7B/code_generator/train/2025-09-26/19-34-03",
+  "experiment_name": null,
+  "search": null,
+  "input_key": null,
+  "train_input_key": null,
+  "train_search_run": null,
+  "val_search_run": null,
+  "test_search_run": null,
+  "no_resize": false,
+  "xlnet": false,
+  "tune_loss": false,
+  "tune_dev": true,
+  "tune_valid_loss": false,
+  "sanity_val_steps": 0,
+  "cpu": false,
+  "keep_in_memory": false,
+  "nbr_gpus": 1,
+  "N": 0,
+  "nbr_workers": 1,
+  "num_proc": 1,
+  "acc": "gpu",
+  "fast_dev_run": null,
+  "local_cache": "../my_transformers_cache",
+  "IMAGE_PATH": null,
+  "transformer_path": null,
+  "resume_from": null,
+  "answer_generator": "HiTZ/GoLLIE-7B",
+  "query_model": null,
+  "context_model": null,
+  "answer_generator_2": null,
+  "checkpoint": null,
+  "query_checkpoint": null,
+  "checkpoint_2": null,
+  "non_strict_load": true,
+  "trainer_checkpoint": null,
+  "linear_MEP_checkpoint": null,
+  "linear_MLM_checkpoint": null,
+  "config": "experiments/event_extraction/config_code_generator.json",
+  "context_checkpoint": null,
+  "grad_accum": 1,
+  "cls_token": "[CLS]",
+  "sep_token": "[SEP]",
+  "pad_token": "[PAD]",
+  "cls_token_at_end": false,
+  "mask_padding_with_zero": true,
+  "pad_on_left": false,
+  "sequence_a_segment_id": 0,
+  "pad_token_segment_id": 0,
+  "cls_token_segment_id": 0,
+  "pad_token_label_id": 0,
+  "pad_token_id": 0,
+  "past_index": -1,
+  "world_size": 1,
+  "use_lstm": false,
+  "use_entity": false,
+  "use_question_graph": false,
+  "use_question_objects": false,
+  "EFeat": null,
+  "NFeat": null,
+  "ltn": false,
+  "use_kelm": false,
+  "unshared": false,
+  "mlm": false,
+  "test": false,
+  "validate": false,
+  "eval_on_start": false,
+  "predict": null,
+  "split_dpr": false,
+  "rename_model": false,
+  "mask_rate": 0.15,
+  "pretrained_triviaq": false,
+  "error_analysis": false,
+  "debug": false,
+  "stop_debug": false,
+  "entity_linking": false,
+  "entity_linking_split": false,
+  "build_entity_paths": null,
+  "object_detection": null,
+  "update_wikidata_ids": null,
+  "update_None_ids": null,
+  "dependency_parsing": null,
+  "image_captionning": null,
+  "build_graph": false,
+  "from_bert": false,
+  "fast": false,
+  "get_examples": false,
+  "get_statistics": null,
+  "word_vocab_size": 0,
+  "char_vocab_size": 0,
+  "max_word_len": 30,
+  "device": "cuda",
+  "embedding_matrix": null,
+  "new_vocab_embeddings": null,
+  "w2v_file": "word_vector_200d.vec",
+  "word_emb_dim": 200,
+  "char_lstm": false,
+  "char_cnn": false,
+  "seed": 42,
+  "tune_batch_size": false,
+  "val_check_interval": null,
+  "model_names": null,
+  "build_hf_local_cache": true,
+  "strategy": null,
+  "monitor_metric": "mean_f1",
+  "precision": 32,
+  "no_lora": false,
+  "early_stopping": true,
+  "reduce_on_plateau": true,
+  "num_generations": 2,
+  "num_passages": 5,
+  "k_schemes": 10,
+  "use_liger_loss": false,
+  "kl_beta": 0.0,
+  "TI_alpha": 1.0,
+  "TC_alpha": 1.0,
+  "AI_alpha": 1.0,
+  "AC_alpha": 1.0,
+  "schema_retrieval_val": false,
+  "schema_retrieval_train": false,
+  "EE_2steps": false,
+  "EE_SL": false,
+  "save_ckpt": false,
+  "lora_config": {
+    "peft_type": "LORA",
+    "auto_mapping": null,
+    "base_model_name_or_path": null,
+    "revision": null,
+    "task_type": "CAUSAL_LM",
+    "inference_mode": false,
+    "r": 8,
+    "target_modules": [
+      "q_proj",
+      "v_proj"
+    ],
+    "lora_alpha": 16,
+    "lora_dropout": 0.05,
+    "fan_in_fan_out": false,
+    "bias": "none",
+    "use_rslora": false,
+    "modules_to_save": null,
+    "init_lora_weights": true,
+    "layers_to_transform": null,
+    "layers_pattern": null,
+    "rank_pattern": {},
+    "alpha_pattern": {},
+    "megatron_config": null,
+    "megatron_core": "megatron.core",
+    "loftq_config": {},
+    "use_dora": false
+  },
+  "quantization_config": null,
+  "hf": false,
+  "slurm_scipt_path": null,
+  "enabled_args": "  --train_batch_size 1\n  --eval_batch_size 1\n  --num_train_epochs 20\n  --nbr_gpus 1\n  --learning_rate 5e-6\n  --grad_check\n  --config experiments/event_extraction/config_code_generator.json\n  --non_strict_load\n  --ds ../datasets/textee/wikievents\n  --answer_generator HiTZ/GoLLIE-7B\n  --guidelines new_Llama-31-8B-Instruct_annotation_guidelines\n  --k_schemes 10\n  --num_passages 5"
+}

log.txt ADDED Viewed

	@@ -0,0 +1,36 @@

+trainable params: 4194304 || all params: 6742740992 || trainable%: 0.06220473254091146
+epoch:0 {'TC_prec': 0.3167701863354037, 'TC_rec': 0.12085308056872038, 'TI_prec': 0.45962732919254656, 'TI_rec': 0.17535545023696683, 'AC_prec': 0.10723860589812333, 'AC_rec': 0.06825938566552901, 'AI_prec': 0.13404825737265416, 'AI_rec': 0.08532423208191127, 'TI': 0.2538593481989709, 'TC': 0.17495711835334476, 'AI': 0.1042752867570386, 'AC': 0.08342022940563087, 'mean_f1': 0.15412799567874627}
+avg_train_loss tensor(1.6375)
+lr 5e-06
+epoch:1 {'TC_prec': 0.3235294117647059, 'TC_rec': 0.13033175355450238, 'TI_prec': 0.4764705882352941, 'TI_rec': 0.19194312796208532, 'AC_prec': 0.1174934725848564, 'AC_rec': 0.07679180887372014, 'AI_prec': 0.1409921671018277, 'AI_rec': 0.09215017064846416, 'TI': 0.27364864864864863, 'TC': 0.18581081081081083, 'AI': 0.11145510835913311, 'AC': 0.09287925696594428, 'mean_f1': 0.1659484561961342}
+avg_train_loss tensor(1.1741)
+lr 5e-06
+epoch:2 {'TC_prec': 0.3176470588235294, 'TC_rec': 0.12796208530805686, 'TI_prec': 0.47058823529411764, 'TI_rec': 0.1895734597156398, 'AC_prec': 0.11345646437994723, 'AC_rec': 0.07337883959044368, 'AI_prec': 0.13192612137203166, 'AI_rec': 0.08532423208191127, 'TI': 0.2702702702702703, 'TC': 0.1824324324324324, 'AI': 0.10362694300518135, 'AC': 0.08911917098445596, 'mean_f1': 0.161362204173085}
+avg_train_loss tensor(1.0730)
+lr 5e-06
+epoch:3 {'TC_prec': 0.3275862068965517, 'TC_rec': 0.13507109004739337, 'TI_prec': 0.4827586206896552, 'TI_rec': 0.1990521327014218, 'AC_prec': 0.11286089238845144, 'AC_rec': 0.07337883959044368, 'AI_prec': 0.13385826771653545, 'AI_rec': 0.08703071672354949, 'TI': 0.2818791946308725, 'TC': 0.1912751677852349, 'AI': 0.10548086866597725, 'AC': 0.08893485005170632, 'mean_f1': 0.16689252028344775}
+avg_train_loss tensor(1.0316)
+lr 5e-06
+epoch:4 {'TC_prec': 0.3176470588235294, 'TC_rec': 0.12796208530805686, 'TI_prec': 0.4764705882352941, 'TI_rec': 0.19194312796208532, 'AC_prec': 0.11466666666666667, 'AC_rec': 0.07337883959044368, 'AI_prec': 0.13333333333333333, 'AI_rec': 0.08532423208191127, 'TI': 0.27364864864864863, 'TC': 0.1824324324324324, 'AI': 0.10405827263267431, 'AC': 0.08949011446409989, 'mean_f1': 0.16240736704446382}
+avg_train_loss tensor(1.0073)
+lr 5e-06
+epoch:5 {'TC_prec': 0.313953488372093, 'TC_rec': 0.12796208530805686, 'TI_prec': 0.48255813953488375, 'TI_rec': 0.1966824644549763, 'AC_prec': 0.11052631578947368, 'AC_rec': 0.07167235494880546, 'AI_prec': 0.13421052631578947, 'AI_rec': 0.08703071672354949, 'TI': 0.27946127946127947, 'TC': 0.18181818181818182, 'AI': 0.10559006211180125, 'AC': 0.08695652173913043, 'mean_f1': 0.16345651128259822}
+avg_train_loss tensor(0.9908)
+lr 5e-06
+epoch:6 {'TC_prec': 0.32335329341317365, 'TC_rec': 0.12796208530805686, 'TI_prec': 0.48502994011976047, 'TI_rec': 0.19194312796208532, 'AC_prec': 0.12054794520547946, 'AC_rec': 0.07508532423208192, 'AI_prec': 0.14246575342465753, 'AI_rec': 0.08873720136518772, 'TI': 0.2750424448217318, 'TC': 0.1833616298811545, 'AI': 0.10935856992639327, 'AC': 0.092534174553102, 'mean_f1': 0.1650742047955954}
+avg_train_loss tensor(0.9788)
+lr 5e-06
+epoch:7 {'TC_prec': 0.33532934131736525, 'TC_rec': 0.13270142180094788, 'TI_prec': 0.47904191616766467, 'TI_rec': 0.1895734597156398, 'AC_prec': 0.11653116531165311, 'AC_rec': 0.07337883959044368, 'AI_prec': 0.13821138211382114, 'AI_rec': 0.08703071672354949, 'TI': 0.27164685908319186, 'TC': 0.19015280135823429, 'AI': 0.1068062827225131, 'AC': 0.0900523560209424, 'mean_f1': 0.16466457479622043}
+avg_train_loss tensor(0.9733)
+lr 2.5e-06
+[TEST]
+{'TC_prec': 0.2796610169491525, 'TC_rec': 0.1746031746031746, 'TI_prec': 0.3728813559322034, 'TI_rec': 0.2328042328042328, 'AC_prec': 0.0947136563876652, 'AC_rec': 0.083984375, 'AI_prec': 0.11674008810572688, 'AI_rec': 0.103515625, 'TI': 0.2866449511400651, 'TC': 0.21498371335504887, 'AI': 0.10973084886128363, 'AC': 0.08902691511387163, 'mean_f1': 0.1750966071175673}

lora_config.json ADDED Viewed

	@@ -0,0 +1,28 @@

+{
+  "peft_type": "LORA",
+  "auto_mapping": null,
+  "base_model_name_or_path": null,
+  "revision": null,
+  "task_type": "CAUSAL_LM",
+  "inference_mode": false,
+  "r": 8,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "lora_alpha": 16,
+  "lora_dropout": 0.05,
+  "fan_in_fan_out": false,
+  "bias": "none",
+  "use_rslora": false,
+  "modules_to_save": null,
+  "init_lora_weights": true,
+  "layers_to_transform": null,
+  "layers_pattern": null,
+  "rank_pattern": {},
+  "alpha_pattern": {},
+  "megatron_config": null,
+  "megatron_core": "megatron.core",
+  "loftq_config": {},
+  "use_dora": false
+}

metrics.tex ADDED Viewed

	@@ -0,0 +1,112 @@

+epoch:0
+=========================================
+\begin{table}
+\caption{Evaluation Metrics}
+\label{tab:metrics}
+\begin{tabular}{rrrr}
+\toprule
+TI & TC & AI & AC \\
+\midrule
+25.39 & 17.50 & 10.43 & 8.34 \\
+\bottomrule
+\end{tabular}
+\end{table}
+epoch:1
+=========================================
+\begin{table}
+\caption{Evaluation Metrics}
+\label{tab:metrics}
+\begin{tabular}{rrrr}
+\toprule
+TI & TC & AI & AC \\
+\midrule
+27.36 & 18.58 & 11.15 & 9.29 \\
+\bottomrule
+\end{tabular}
+\end{table}
+epoch:2
+=========================================
+\begin{table}
+\caption{Evaluation Metrics}
+\label{tab:metrics}
+\begin{tabular}{rrrr}
+\toprule
+TI & TC & AI & AC \\
+\midrule
+27.03 & 18.24 & 10.36 & 8.91 \\
+\bottomrule
+\end{tabular}
+\end{table}
+epoch:3
+=========================================
+\begin{table}
+\caption{Evaluation Metrics}
+\label{tab:metrics}
+\begin{tabular}{rrrr}
+\toprule
+TI & TC & AI & AC \\
+\midrule
+28.19 & 19.13 & 10.55 & 8.89 \\
+\bottomrule
+\end{tabular}
+\end{table}
+epoch:4
+=========================================
+\begin{table}
+\caption{Evaluation Metrics}
+\label{tab:metrics}
+\begin{tabular}{rrrr}
+\toprule
+TI & TC & AI & AC \\
+\midrule
+27.36 & 18.24 & 10.41 & 8.95 \\
+\bottomrule
+\end{tabular}
+\end{table}
+epoch:5
+=========================================
+\begin{table}
+\caption{Evaluation Metrics}
+\label{tab:metrics}
+\begin{tabular}{rrrr}
+\toprule
+TI & TC & AI & AC \\
+\midrule
+27.95 & 18.18 & 10.56 & 8.70 \\
+\bottomrule
+\end{tabular}
+\end{table}
+epoch:6
+=========================================
+\begin{table}
+\caption{Evaluation Metrics}
+\label{tab:metrics}
+\begin{tabular}{rrrr}
+\toprule
+TI & TC & AI & AC \\
+\midrule
+27.50 & 18.34 & 10.94 & 9.25 \\
+\bottomrule
+\end{tabular}
+\end{table}
+epoch:7
+=========================================
+\begin{table}
+\caption{Evaluation Metrics}
+\label{tab:metrics}
+\begin{tabular}{rrrr}
+\toprule
+TI & TC & AI & AC \\
+\midrule
+27.16 & 19.02 & 10.68 & 9.01 \\
+\bottomrule
+\end{tabular}
+\end{table}

model-epoch=03-mean_f1=0.1669_sd=42.ckpt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:812d283bbcb77631a3a04b23066e0509a69b67edd8931898c49de27f72b0670f
+size 13502640837

predictions/predictions_0.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ null

predictions/predictions_1.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ null

predictions/predictions_2.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ null

predictions/predictions_3.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ null

predictions/predictions_4.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ null

predictions/predictions_5.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ null

predictions/predictions_6.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ null

predictions/predictions_7.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ null

qualitative_analysis.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

quantization_config.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ null

test_metrics.tex ADDED Viewed

	@@ -0,0 +1,12 @@

+=========================================
+\begin{table}
+\caption{Evaluation Metrics}
+\label{tab:metrics}
+\begin{tabular}{rrrr}
+\toprule
+TI & TC & AI & AC \\
+\midrule
+28.66 & 21.50 & 10.97 & 8.90 \\
+\bottomrule
+\end{tabular}
+\end{table}