GLORY-JAX-MIND-small / training_run_summary.json
igor174's picture
Upload GLORY (jax) trained on MIND-small — 3 seeds
378e817 verified
{
"configuration": {
"framework": "jax",
"weights": null,
"seed": 42,
"output_base_dir": "outputs",
"device": {
"gpu_ids": [
0
],
"memory_limit": 1,
"keras_backend": "jax",
"precision": "float32"
},
"num_workers": 4,
"train": {
"batch_size": 32,
"num_epochs": 20,
"learning_rate": 0.0002,
"gradient_clip_val": 1.0,
"grad_accum_steps": 1,
"early_stopping": {
"patience": 5,
"min_improvement": 0.01
}
},
"eval": {
"fast_evaluation": true,
"batch_size": 256,
"save_predictions": true,
"predictions_dir": "predictions",
"run_initial_eval": false,
"run_test_after_training": true
},
"logging": {
"project_name": "NewsReX",
"enable_wandb": true,
"experiment_name": "jax/MIND-small/GLORY",
"wandb_group": "jax/MIND-small/GLORY",
"progress_backend": "tqdm"
},
"metrics": {
"params": {},
"_target_": "src.core.metrics.functions.NewsRecommenderMetrics"
},
"multi_seed": {
"enabled": true,
"seeds": [
42,
123,
456
]
},
"cache": {
"root_dir": ".cache",
"clear_on_start": false
},
"spec": {
"model": {
"name": "glory",
"architecture": {
"news_encoder": {
"type": "mha_pool",
"head_num": 20,
"head_dim": 20,
"attention_hidden_dim": 200
},
"graph_encoder": {
"type": "gated_graph_conv",
"gnn_num_layers": 3,
"use_graph_type": 0,
"directed": true,
"k_hops": 2,
"num_neighbors": 8,
"entity_neighbors": 10
},
"click_predictor": {
"type": "dot_product"
}
},
"embedding": {
"size": 300,
"trainable": true
},
"dropout_rate": 0.2,
"seed": 42,
"use_entity": true,
"entity_emb_dim": 100
},
"inputs": {
"title": {
"max_length": 30
},
"entity": {
"max_length": 5
},
"history": {
"max_length": 50
},
"impressions": {
"max_length": 5
},
"process_title": true,
"process_abstract": false,
"process_category": true,
"process_subcategory": true,
"process_entities": true,
"process_user_id": false
},
"training": {
"loss": {
"name": "categorical_crossentropy",
"from_logits": true,
"reduction": "sum_over_batch_size",
"label_smoothing": 0.0
},
"optimizer": "adam",
"learning_rate": 0.0002,
"batch_size": 32,
"grad_accum_steps": 1,
"num_epochs": 20,
"gradient_clip_val": 1.0,
"early_stopping": {
"patience": 5,
"min_improvement": 0.01
},
"negative_sampling": {
"strategy": "random",
"candidates": 4
}
},
"evaluation": {
"mode": "fast",
"evaluator": "default",
"metrics": [
"auc",
"mrr",
"ndcg@5",
"ndcg@10"
],
"batch_size": 256
}
},
"dataset": {
"seed": 42,
"popularity": {
"ctr_method": "wall_clock",
"bucket_hours": 2,
"max_buckets": 1500,
"ctr_smoothing": 0.01
},
"_target_": "src.core.data.datasets.mind.MINDDataset",
"name": "MIND-small",
"version": "small",
"embedding_type": "glove",
"embedding_size": 300,
"random_train_samples": false,
"validation_split_strategy": "random",
"validation_split_percentage": 0.05,
"validation_split_seed": 42,
"data_fraction_train": 1.0,
"data_fraction_val": 1.0,
"data_fraction_test": 1.0,
"mode": "train",
"word_threshold": 5,
"urls": {
"small": {
"train": "https://huggingface.co/datasets/yjw1029/MIND/resolve/main/MINDsmall_train.zip",
"valid": "https://huggingface.co/datasets/yjw1029/MIND/resolve/main/MINDsmall_dev.zip"
},
"large": {
"train": "https://huggingface.co/datasets/yjw1029/MIND/resolve/main/MINDlarge_train.zip",
"valid": "https://huggingface.co/datasets/yjw1029/MIND/resolve/main/MINDlarge_dev.zip",
"test": "https://huggingface.co/datasets/yjw1029/MIND/resolve/main/MINDlarge_test.zip"
}
},
"max_title_length": 30,
"max_abstract_length": 50,
"max_history_length": 50,
"max_impressions_length": 5,
"use_knowledge_graph": false,
"max_entities": 5,
"max_relations": 50,
"sampling": {
"max_impressions_length": 5,
"strategy": "random",
"random_seed": 42,
"random": {
"replace": false
},
"topic_diverse": {
"min_categories": 3,
"category_weights": {
"entertainment": 1.0,
"sports": 1.0,
"technology": 1.0,
"business": 1.0,
"lifestyle": 1.0,
"news": 1.0
}
},
"temporal": {
"time_window": 24,
"recency_weight": 0.7
},
"popularity": {
"top_k_ratio": 0.8,
"popularity_metric": "clicks"
}
},
"process_title": true,
"process_abstract": false,
"process_category": true,
"process_subcategory": true,
"process_user_id": false,
"process_entities": true
},
"sampling": {
"max_impressions_length": 5,
"strategy": "random",
"random_seed": 42,
"random": {
"replace": false
},
"topic_diverse": {
"min_categories": 3,
"category_weights": {
"entertainment": 1.0,
"sports": 1.0,
"technology": 1.0,
"business": 1.0,
"lifestyle": 1.0,
"news": 1.0
}
},
"temporal": {
"time_window": 24,
"recency_weight": 0.7
},
"popularity": {
"top_k_ratio": 0.8,
"popularity_metric": "clicks"
}
},
"name": "mind_glory",
"model_name": "GLORY",
"_output_run_dir": "outputs/train/MIND-small/GLORY/jax/seed_42"
},
"initial_validation_metrics": {},
"best_validation_summary": {
"epoch_number": 4.0,
"train_loss": 1.2500946109834778,
"average_metric_value": 0.515969451866312,
"val_loss": 4.612048836593911,
"val_auc": 0.7439823902490937,
"val_mrr": 0.39419114946478445,
"val_ndcg@5": 0.43471800815289297,
"val_ndcg@10": 0.4909862595984772,
"val_num_impressions": 7664.0,
"timing": {
"epoch_training_times": [
2244.404512166977,
2201.9322175979614,
2199.9934306144714,
2205.808046102524,
2203.0027322769165,
2199.94650888443,
2199.697597503662
],
"epoch_validation_times": [
663.1509070396423,
80.81412124633789,
81.00111055374146,
78.61834621429443,
79.14026737213135,
80.17580127716064,
80.92336940765381
],
"total_training_time": 16599.34289455414
}
},
"final_test_metrics": {
"loss": 5.125263598847068,
"auc": 0.6653187263146543,
"mrr": 0.3200566670065452,
"ndcg@5": 0.35333528688262456,
"ndcg@10": 0.41684149154770783,
"num_impressions": 70658.0
}
}