unknown-JAX-MIND-small / training_run_summary.json
igor174's picture
Upload unknown (jax) trained on MIND-small — 3 seeds
6965b7b verified
{
"configuration": {
"framework": "jax",
"weights": null,
"seed": 123,
"output_base_dir": "outputs",
"device": {
"gpu_ids": [
0
],
"memory_limit": 1,
"keras_backend": "jax",
"precision": "float32"
},
"num_workers": 4,
"train": {
"batch_size": 64,
"num_epochs": 20,
"learning_rate": 5e-05,
"gradient_clip_val": 1.0,
"grad_accum_steps": 1,
"early_stopping": {
"patience": 5,
"min_improvement": 0.01
}
},
"eval": {
"fast_evaluation": true,
"batch_size": 256,
"save_predictions": true,
"predictions_dir": "predictions",
"run_initial_eval": false,
"run_test_after_training": true
},
"logging": {
"project_name": "NewsReX",
"enable_wandb": true,
"experiment_name": "jax/MIND-small/CAUM",
"wandb_group": "jax/MIND-small/CAUM",
"progress_backend": "tqdm"
},
"metrics": {
"params": {},
"_target_": "src.core.metrics.functions.NewsRecommenderMetrics"
},
"multi_seed": {
"enabled": true,
"seeds": [
42,
123,
456
]
},
"cache": {
"root_dir": ".cache",
"clear_on_start": false
},
"spec": {
"model": {
"name": "caum",
"architecture": {
"news_encoder": {
"type": "multi_head_self_attention",
"num_heads": 20,
"head_dim": 20,
"attention_hidden_dim": 200,
"entity_embedding_dim": 100,
"entity_num_heads": 4,
"entity_head_dim": 40,
"category_embedding_dim": 100
},
"user_encoder": {
"type": "candidate_aware",
"candi_selfatt": {
"num_heads": 20,
"head_dim": 20
},
"candi_cnn": {
"half_window": 1
},
"candi_att": {
"hidden_dim": 400,
"mid_dim": 256
}
},
"click_predictor": {
"type": "dot_product"
}
},
"embedding": {
"size": 300,
"trainable": true
},
"news_dim": 400,
"use_entity": true,
"use_category": true,
"dropout_rate": 0.2,
"seed": 42
},
"inputs": {
"title": {
"max_length": 30
},
"history": {
"max_length": 50
},
"impressions": {
"max_length": 5
},
"max_entities": 5,
"process_title": true,
"process_abstract": false,
"process_category": true,
"process_subcategory": false,
"process_user_id": false,
"process_entities": true
},
"training": {
"loss": {
"name": "categorical_crossentropy",
"from_logits": true,
"reduction": "sum_over_batch_size",
"label_smoothing": 0.0
},
"optimizer": "adam",
"learning_rate": 5e-05,
"batch_size": 64,
"num_epochs": 20,
"gradient_clip_val": 1.0,
"grad_accum_steps": 1,
"early_stopping": {
"patience": 5,
"min_improvement": 0.01
},
"negative_sampling": {
"strategy": "random",
"candidates": 4
}
},
"evaluation": {
"mode": "fast",
"evaluator": "caum",
"metrics": [
"auc",
"mrr",
"ndcg@5",
"ndcg@10"
],
"batch_size": 256
}
},
"dataset": {
"seed": 42,
"popularity": {
"ctr_method": "wall_clock",
"bucket_hours": 2,
"max_buckets": 1500,
"ctr_smoothing": 0.01
},
"_target_": "src.core.data.datasets.mind.MINDDataset",
"name": "MIND-small",
"version": "small",
"embedding_type": "glove",
"embedding_size": 300,
"random_train_samples": false,
"validation_split_strategy": "random",
"validation_split_percentage": 0.05,
"validation_split_seed": 42,
"data_fraction_train": 1.0,
"data_fraction_val": 1.0,
"data_fraction_test": 1.0,
"mode": "train",
"word_threshold": 5,
"urls": {
"small": {
"train": "https://huggingface.co/datasets/yjw1029/MIND/resolve/main/MINDsmall_train.zip",
"valid": "https://huggingface.co/datasets/yjw1029/MIND/resolve/main/MINDsmall_dev.zip"
},
"large": {
"train": "https://huggingface.co/datasets/yjw1029/MIND/resolve/main/MINDlarge_train.zip",
"valid": "https://huggingface.co/datasets/yjw1029/MIND/resolve/main/MINDlarge_dev.zip",
"test": "https://huggingface.co/datasets/yjw1029/MIND/resolve/main/MINDlarge_test.zip"
}
},
"max_title_length": 30,
"max_abstract_length": 50,
"max_history_length": 50,
"max_impressions_length": 5,
"use_knowledge_graph": false,
"max_entities": 5,
"max_relations": 50,
"sampling": {
"max_impressions_length": 5,
"strategy": "random",
"random_seed": 42,
"random": {
"replace": false
},
"topic_diverse": {
"min_categories": 3,
"category_weights": {
"entertainment": 1.0,
"sports": 1.0,
"technology": 1.0,
"business": 1.0,
"lifestyle": 1.0,
"news": 1.0
}
},
"temporal": {
"time_window": 24,
"recency_weight": 0.7
},
"popularity": {
"top_k_ratio": 0.8,
"popularity_metric": "clicks"
}
},
"process_title": true,
"process_abstract": false,
"process_category": true,
"process_subcategory": false,
"process_user_id": false,
"process_entities": true
},
"sampling": {
"max_impressions_length": 5,
"strategy": "random",
"random_seed": 42,
"random": {
"replace": false
},
"topic_diverse": {
"min_categories": 3,
"category_weights": {
"entertainment": 1.0,
"sports": 1.0,
"technology": 1.0,
"business": 1.0,
"lifestyle": 1.0,
"news": 1.0
}
},
"temporal": {
"time_window": 24,
"recency_weight": 0.7
},
"popularity": {
"top_k_ratio": 0.8,
"popularity_metric": "clicks"
}
},
"name": "mind_caum",
"model_name": "CAUM",
"_output_run_dir": "outputs/train/MIND-small/CAUM/jax/seed_123"
},
"initial_validation_metrics": {},
"best_validation_summary": {
"epoch_number": 10.0,
"train_loss": 1.2371471108698318,
"average_metric_value": 0.5206724943439838,
"val_loss": 4.4820805537700945,
"val_auc": 0.7497600715485296,
"val_mrr": 0.39857799672194205,
"val_ndcg@5": 0.4387125845284695,
"val_ndcg@10": 0.4956393245769941,
"val_num_impressions": 7824.0,
"timing": {
"epoch_training_times": [
152.7604115009308,
128.3657763004303,
128.71619987487793,
126.83259797096252,
126.7269389629364,
127.33337998390198,
126.36471319198608,
127.29102325439453,
126.6120913028717,
126.97762560844421
],
"epoch_validation_times": [
156.19692087173462,
156.4893136024475,
156.90509462356567,
155.93345546722412,
156.1876072883606,
154.95236468315125,
157.0661187171936,
156.74578547477722,
156.08843064308167,
156.18353486061096
],
"total_training_time": 2860.9791276454926
}
},
"final_test_metrics": {
"loss": 4.895912475360167,
"auc": 0.6746637875073116,
"mrr": 0.3214330456909908,
"ndcg@5": 0.35560859266126893,
"ndcg@10": 0.4193156331068628,
"num_impressions": 72903.0
}
}