| { |
| "configuration": { |
| "framework": "jax", |
| "weights": null, |
| "seed": 123, |
| "output_base_dir": "outputs", |
| "device": { |
| "gpu_ids": [ |
| 0 |
| ], |
| "memory_limit": 1, |
| "keras_backend": "jax", |
| "precision": "float32" |
| }, |
| "num_workers": 4, |
| "train": { |
| "batch_size": 64, |
| "num_epochs": 20, |
| "learning_rate": 5e-05, |
| "gradient_clip_val": 1.0, |
| "grad_accum_steps": 1, |
| "early_stopping": { |
| "patience": 5, |
| "min_improvement": 0.01 |
| } |
| }, |
| "eval": { |
| "fast_evaluation": true, |
| "batch_size": 256, |
| "save_predictions": true, |
| "predictions_dir": "predictions", |
| "run_initial_eval": false, |
| "run_test_after_training": true |
| }, |
| "logging": { |
| "project_name": "NewsReX", |
| "enable_wandb": true, |
| "experiment_name": "jax/MIND-small/CAUM", |
| "wandb_group": "jax/MIND-small/CAUM", |
| "progress_backend": "tqdm" |
| }, |
| "metrics": { |
| "params": {}, |
| "_target_": "src.core.metrics.functions.NewsRecommenderMetrics" |
| }, |
| "multi_seed": { |
| "enabled": true, |
| "seeds": [ |
| 42, |
| 123, |
| 456 |
| ] |
| }, |
| "cache": { |
| "root_dir": ".cache", |
| "clear_on_start": false |
| }, |
| "spec": { |
| "model": { |
| "name": "caum", |
| "architecture": { |
| "news_encoder": { |
| "type": "multi_head_self_attention", |
| "num_heads": 20, |
| "head_dim": 20, |
| "attention_hidden_dim": 200, |
| "entity_embedding_dim": 100, |
| "entity_num_heads": 4, |
| "entity_head_dim": 40, |
| "category_embedding_dim": 100 |
| }, |
| "user_encoder": { |
| "type": "candidate_aware", |
| "candi_selfatt": { |
| "num_heads": 20, |
| "head_dim": 20 |
| }, |
| "candi_cnn": { |
| "half_window": 1 |
| }, |
| "candi_att": { |
| "hidden_dim": 400, |
| "mid_dim": 256 |
| } |
| }, |
| "click_predictor": { |
| "type": "dot_product" |
| } |
| }, |
| "embedding": { |
| "size": 300, |
| "trainable": true |
| }, |
| "news_dim": 400, |
| "use_entity": true, |
| "use_category": true, |
| "dropout_rate": 0.2, |
| "seed": 42 |
| }, |
| "inputs": { |
| "title": { |
| "max_length": 30 |
| }, |
| "history": { |
| "max_length": 50 |
| }, |
| "impressions": { |
| "max_length": 5 |
| }, |
| "max_entities": 5, |
| "process_title": true, |
| "process_abstract": false, |
| "process_category": true, |
| "process_subcategory": false, |
| "process_user_id": false, |
| "process_entities": true |
| }, |
| "training": { |
| "loss": { |
| "name": "categorical_crossentropy", |
| "from_logits": true, |
| "reduction": "sum_over_batch_size", |
| "label_smoothing": 0.0 |
| }, |
| "optimizer": "adam", |
| "learning_rate": 5e-05, |
| "batch_size": 64, |
| "num_epochs": 20, |
| "gradient_clip_val": 1.0, |
| "grad_accum_steps": 1, |
| "early_stopping": { |
| "patience": 5, |
| "min_improvement": 0.01 |
| }, |
| "negative_sampling": { |
| "strategy": "random", |
| "candidates": 4 |
| } |
| }, |
| "evaluation": { |
| "mode": "fast", |
| "evaluator": "caum", |
| "metrics": [ |
| "auc", |
| "mrr", |
| "ndcg@5", |
| "ndcg@10" |
| ], |
| "batch_size": 256 |
| } |
| }, |
| "dataset": { |
| "seed": 42, |
| "popularity": { |
| "ctr_method": "wall_clock", |
| "bucket_hours": 2, |
| "max_buckets": 1500, |
| "ctr_smoothing": 0.01 |
| }, |
| "_target_": "src.core.data.datasets.mind.MINDDataset", |
| "name": "MIND-small", |
| "version": "small", |
| "embedding_type": "glove", |
| "embedding_size": 300, |
| "random_train_samples": false, |
| "validation_split_strategy": "random", |
| "validation_split_percentage": 0.05, |
| "validation_split_seed": 42, |
| "data_fraction_train": 1.0, |
| "data_fraction_val": 1.0, |
| "data_fraction_test": 1.0, |
| "mode": "train", |
| "word_threshold": 5, |
| "urls": { |
| "small": { |
| "train": "https://huggingface.co/datasets/yjw1029/MIND/resolve/main/MINDsmall_train.zip", |
| "valid": "https://huggingface.co/datasets/yjw1029/MIND/resolve/main/MINDsmall_dev.zip" |
| }, |
| "large": { |
| "train": "https://huggingface.co/datasets/yjw1029/MIND/resolve/main/MINDlarge_train.zip", |
| "valid": "https://huggingface.co/datasets/yjw1029/MIND/resolve/main/MINDlarge_dev.zip", |
| "test": "https://huggingface.co/datasets/yjw1029/MIND/resolve/main/MINDlarge_test.zip" |
| } |
| }, |
| "max_title_length": 30, |
| "max_abstract_length": 50, |
| "max_history_length": 50, |
| "max_impressions_length": 5, |
| "use_knowledge_graph": false, |
| "max_entities": 5, |
| "max_relations": 50, |
| "sampling": { |
| "max_impressions_length": 5, |
| "strategy": "random", |
| "random_seed": 42, |
| "random": { |
| "replace": false |
| }, |
| "topic_diverse": { |
| "min_categories": 3, |
| "category_weights": { |
| "entertainment": 1.0, |
| "sports": 1.0, |
| "technology": 1.0, |
| "business": 1.0, |
| "lifestyle": 1.0, |
| "news": 1.0 |
| } |
| }, |
| "temporal": { |
| "time_window": 24, |
| "recency_weight": 0.7 |
| }, |
| "popularity": { |
| "top_k_ratio": 0.8, |
| "popularity_metric": "clicks" |
| } |
| }, |
| "process_title": true, |
| "process_abstract": false, |
| "process_category": true, |
| "process_subcategory": false, |
| "process_user_id": false, |
| "process_entities": true |
| }, |
| "sampling": { |
| "max_impressions_length": 5, |
| "strategy": "random", |
| "random_seed": 42, |
| "random": { |
| "replace": false |
| }, |
| "topic_diverse": { |
| "min_categories": 3, |
| "category_weights": { |
| "entertainment": 1.0, |
| "sports": 1.0, |
| "technology": 1.0, |
| "business": 1.0, |
| "lifestyle": 1.0, |
| "news": 1.0 |
| } |
| }, |
| "temporal": { |
| "time_window": 24, |
| "recency_weight": 0.7 |
| }, |
| "popularity": { |
| "top_k_ratio": 0.8, |
| "popularity_metric": "clicks" |
| } |
| }, |
| "name": "mind_caum", |
| "model_name": "CAUM", |
| "_output_run_dir": "outputs/train/MIND-small/CAUM/jax/seed_123" |
| }, |
| "initial_validation_metrics": {}, |
| "best_validation_summary": { |
| "epoch_number": 10.0, |
| "train_loss": 1.2371471108698318, |
| "average_metric_value": 0.5206724943439838, |
| "val_loss": 4.4820805537700945, |
| "val_auc": 0.7497600715485296, |
| "val_mrr": 0.39857799672194205, |
| "val_ndcg@5": 0.4387125845284695, |
| "val_ndcg@10": 0.4956393245769941, |
| "val_num_impressions": 7824.0, |
| "timing": { |
| "epoch_training_times": [ |
| 152.7604115009308, |
| 128.3657763004303, |
| 128.71619987487793, |
| 126.83259797096252, |
| 126.7269389629364, |
| 127.33337998390198, |
| 126.36471319198608, |
| 127.29102325439453, |
| 126.6120913028717, |
| 126.97762560844421 |
| ], |
| "epoch_validation_times": [ |
| 156.19692087173462, |
| 156.4893136024475, |
| 156.90509462356567, |
| 155.93345546722412, |
| 156.1876072883606, |
| 154.95236468315125, |
| 157.0661187171936, |
| 156.74578547477722, |
| 156.08843064308167, |
| 156.18353486061096 |
| ], |
| "total_training_time": 2860.9791276454926 |
| } |
| }, |
| "final_test_metrics": { |
| "loss": 4.895912475360167, |
| "auc": 0.6746637875073116, |
| "mrr": 0.3214330456909908, |
| "ndcg@5": 0.35560859266126893, |
| "ndcg@10": 0.4193156331068628, |
| "num_impressions": 72903.0 |
| } |
| } |