Upload folder using huggingface_hub

Browse files

Files changed (7) hide show

outputs/pep-affibody-ablation-fe/libB_pseudo_bf16/best_model.pt +3 -0
outputs/pep-affibody-ablation-fe/libB_pseudo_bf16/config.json +262 -0
outputs/pep-affibody-ablation-fe/libB_pseudo_bf16/last_model.pt +3 -0
outputs/pep-affibody-ablation-fe/libB_pseudo_bf16/metrics.csv +0 -0
outputs/pep-affibody-ablation-fe/libB_pseudo_bf16/metrics.json +0 -0
outputs/pep-affibody-ablation-fe/libB_pseudo_bf16/summary.txt +407 -0
outputs/pep-affibody-ablation-fe/libB_pseudo_bf16/train.log +0 -0

outputs/pep-affibody-ablation-fe/libB_pseudo_bf16/best_model.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0d72b5aa5573b04611dde1bdb3c2815337b4ca3938b3e9077ae65267e3b67f1e
+size 3261776405

outputs/pep-affibody-ablation-fe/libB_pseudo_bf16/config.json ADDED Viewed

	@@ -0,0 +1,262 @@

+{
+  "args": {
+    "config_path": "data/esm2_t33_650M_UR50D.json",
+    "checkpoint_path": "mint.ckpt",
+    "train_csv": "data/libB/train_fold_enrichment_freqmean_pseudo_1to1.csv",
+    "val_csv": [
+      "data/libB/val_fold_enrichment_freqmean_pseudo_1to1.csv",
+      "data/libB/val_fold_enrichment_freqmean_pseudo_1to1_v2.csv"
+    ],
+    "best_val_index": 0,
+    "train_limit": null,
+    "log_transform": true,
+    "use_multimer": true,
+    "unfreeze_last_n": 5,
+    "sep_chains": true,
+    "hidden_dim": 512,
+    "dropout": 0.2,
+    "bs": 256,
+    "num_epochs": 10,
+    "lr": 0.001,
+    "backbone_lr": 0.0001,
+    "loss_fn": "mse",
+    "huber_delta": 1.0,
+    "truncation_rate": 0.0,
+    "truncation_warmup_steps": 3000,
+    "consistency_col": null,
+    "truncation_consistency_bonus": 0.5,
+    "grad_clip": 1.0,
+    "val_interval": 100,
+    "mixed_precision": "bf16",
+    "gradient_accumulation_steps": 2,
+    "activation_checkpointing": false,
+    "lr_scheduler_type": "constant",
+    "warmup_steps": 0,
+    "lr_min": 0.0,
+    "lr_scheduler_kwargs": "{}",
+    "sample_weight_col": null,
+    "negative_weight": 1.0,
+    "use_binding_quality": false,
+    "bq_w_count": 0.7,
+    "bq_w_fe": 0.3,
+    "no_wandb": false,
+    "wandb_project": "pep-affibody-ablation-fe",
+    "wandb_entity": "protein_llm",
+    "wandb_run_name": "libB_pseudo_bf16",
+    "output_dir": "/home/pj25000082/ku50001421/mint/outputs/pep-affibody-ablation-fe/libB_pseudo_bf16",
+    "seed": 42,
+    "num_workers": 4,
+    "prefetch_factor": 2,
+    "device": "cuda"
+  },
+  "model_cfg": {
+    "no_progress_bar": false,
+    "log_interval": 100,
+    "log_format": "json",
+    "azureml_logging": false,
+    "seed": 1,
+    "cpu": false,
+    "tpu": false,
+    "bf16": false,
+    "memory_efficient_bf16": false,
+    "fp16": true,
+    "memory_efficient_fp16": false,
+    "fp16_no_flatten_grads": false,
+    "fp16_init_scale": 4,
+    "fp16_scale_tolerance": 0.0,
+    "on_cpu_convert_precision": false,
+    "min_loss_scale": 0.0001,
+    "amp": false,
+    "amp_batch_retries": 2,
+    "amp_init_scale": 128,
+    "empty_cache_freq": 0,
+    "all_gather_list_size": 16384,
+    "model_parallel_size": 1,
+    "profile": false,
+    "reset_logging": false,
+    "suppress_crashes": false,
+    "use_plasma_view": false,
+    "plasma_path": "/tmp/plasma",
+    "criterion": "masked_lm",
+    "optimizer": "adam",
+    "lr_scheduler": "polynomial_decay",
+    "scoring": "bleu",
+    "task": "p_masked_lm_cluster_resample",
+    "num_workers": 0,
+    "skip_invalid_size_inputs_valid_test": true,
+    "max_tokens": 1024,
+    "required_batch_size_multiple": 8,
+    "required_seq_len_multiple": 1,
+    "dataset_impl": "fasta",
+    "data_buffer_size": 10,
+    "train_subset": "train50",
+    "valid_subset": "valid50",
+    "ignore_unused_valid_subsets": true,
+    "validate_interval": 99999,
+    "validate_interval_updates": 0,
+    "validate_after_updates": 0,
+    "disable_validation": false,
+    "max_tokens_valid": 1024,
+    "curriculum": 0,
+    "gen_subset": "test",
+    "num_shards": 1,
+    "shard_id": 0,
+    "distributed_world_size": 512,
+    "distributed_num_procs": 8,
+    "distributed_rank": 0,
+    "distributed_backend": "nccl",
+    "distributed_port": 14490,
+    "device_id": 0,
+    "distributed_no_spawn": false,
+    "ddp_backend": "c10d",
+    "ddp_comm_hook": "none",
+    "bucket_cap_mb": 25,
+    "fix_batches_to_gpus": false,
+    "find_unused_parameters": false,
+    "fast_stat_sync": false,
+    "heartbeat_timeout": 3600,
+    "broadcast_buffers": false,
+    "slowmo_algorithm": "LocalSGD",
+    "localsgd_frequency": 3,
+    "nprocs_per_node": 8,
+    "pipeline_model_parallel": false,
+    "pipeline_chunks": 0,
+    "pipeline_checkpoint": "never",
+    "zero_sharding": "none",
+    "no_reshard_after_forward": false,
+    "fp32_reduce_scatter": false,
+    "cpu_offload": false,
+    "use_sharded_state": false,
+    "arch": "p_roberta_large",
+    "max_epoch": 500,
+    "max_update": 0,
+    "stop_time_hours": 0,
+    "clip_norm": 0.0,
+    "use_inf_norm": false,
+    "sentence_avg": false,
+    "update_freq": [
+      4
+    ],
+    "lr": [
+      0.0004
+    ],
+    "stop_min_lr": -1.0,
+    "use_bmuf": false,
+    "save_dir": "/fsx-protein/halilakin/checkpoints/33layer_lr_poly.sample_ur50_to_90.ngpu512",
+    "restore_file": "checkpoint_last.pt",
+    "reset_dataloader": false,
+    "reset_lr_scheduler": false,
+    "reset_meters": false,
+    "reset_optimizer": false,
+    "optimizer_overrides": "{}",
+    "save_interval": 99999,
+    "save_interval_updates": 10000,
+    "keep_interval_updates": -1,
+    "keep_interval_updates_pattern": -1,
+    "keep_last_epochs": -1,
+    "keep_best_checkpoints": -1,
+    "no_save": false,
+    "no_epoch_checkpoints": true,
+    "no_last_checkpoints": false,
+    "no_save_optimizer_state": false,
+    "best_checkpoint_metric": "loss",
+    "maximize_best_checkpoint_metric": false,
+    "patience": -1,
+    "checkpoint_suffix": "",
+    "checkpoint_shard_count": 1,
+    "load_checkpoint_on_all_dp_ranks": false,
+    "write_checkpoints_asynchronously": false,
+    "no_mid_epoch_validate": false,
+    "encoder_layerdrop": 0,
+    "quant_noise_pq": 0,
+    "quant_noise_pq_block_size": 8,
+    "quant_noise_scalar": 0,
+    "min_params_to_wrap": 100000000,
+    "data": "/fsx-protein/zhongkai/datasets/202104esm2/03_output",
+    "sample_break_mode": "eos",
+    "tokens_per_sample": 1024,
+    "mask_prob": 0.15,
+    "leave_unmasked_prob": 0.1,
+    "random_token_prob": 0.1,
+    "freq_weighted_replacement": false,
+    "mask_whole_words": false,
+    "mask_multiple_length": 1,
+    "mask_stdev": 0.0,
+    "shorten_method": "random_crop",
+    "shorten_data_split_list": "train50",
+    "num_batch_buckets": 0,
+    "cluster_resample_fasta_path": "/fsx-protein/zhongkai/datasets/202104esm2/03_output/uniref90.filtered.fasta",
+    "cluster_resample_seq_id": 90,
+    "cluster_resample_ur50_ur90_ur100_path": "/fsx-protein/zhongkai/datasets/202104esm2/01_inputs/ur50_ur90_ur100.no_ur_id_prefix.csv",
+    "adam_betas": "[0.9,0.98]",
+    "adam_eps": 1e-08,
+    "weight_decay": 0.01,
+    "use_old_adam": false,
+    "warmup_updates": 2000,
+    "end_learning_rate": 2e-05,
+    "power": 1.0,
+    "total_num_update": "450000",
+    "pad": 1,
+    "eos": 2,
+    "unk": 3,
+    "max_positions": 1024,
+    "activation_fn": "gelu",
+    "use_rotary_embeddings": true,
+    "encoder_normalize_after": true,
+    "preact_normalize": true,
+    "token_dropout": true,
+    "layer_norm_fp32": true,
+    "attention_dropout": 0.0,
+    "dropout": 0.0,
+    "activation_dropout": 0.0,
+    "encoder_attention_heads": 20,
+    "encoder_embed_dim": 1280,
+    "encoder_ffn_embed_dim": 5120,
+    "encoder_layers": 33,
+    "no_seed_provided": false,
+    "pooler_activation_fn": "tanh",
+    "pooler_dropout": 0.0,
+    "encoder_normalize_before": false,
+    "encoder_learned_pos": false,
+    "use_bert_init": false,
+    "checkpoint_transformer_block": false,
+    "checkpoint_activations": false,
+    "effective_attention": false,
+    "_name": "p_roberta_large",
+    "untie_weights_roberta": false
+  },
+  "environment": {
+    "python_version": "3.10.19 (main, Oct 21 2025, 16:43:05) [GCC 11.2.0]",
+    "torch_version": "2.10.0+cu128",
+    "cuda_available": true,
+    "cuda_device": "NVIDIA H100 80GB HBM3",
+    "wandb_available": true
+  },
+  "git": {
+    "git_commit": "unknown",
+    "git_dirty": null
+  },
+  "timestamp": "2026-02-15 19:29:35",
+  "dataset": {
+    "train_csv": "data/libB/train_fold_enrichment_freqmean_pseudo_1to1.csv",
+    "val_csv": [
+      "data/libB/val_fold_enrichment_freqmean_pseudo_1to1.csv",
+      "data/libB/val_fold_enrichment_freqmean_pseudo_1to1_v2.csv"
+    ],
+    "train_size": 1481332,
+    "train_positive_ratio": 0.5,
+    "train_count_mean": 2.6410122781388643,
+    "train_count_std": 16.249330698762655,
+    "train_count_max": 17196.0,
+    "val_0_csv": "data/libB/val_fold_enrichment_freqmean_pseudo_1to1.csv",
+    "val_0_size": 176,
+    "val_0_positive_ratio": 0.7670454545454546,
+    "val_0_count_mean": 84.94886363636364,
+    "val_0_count_std": 426.4907605080106,
+    "val_1_csv": "data/libB/val_fold_enrichment_freqmean_pseudo_1to1_v2.csv",
+    "val_1_size": 165,
+    "val_1_positive_ratio": 0.806060606060606,
+    "val_1_count_mean": 77.43636363636364,
+    "val_1_count_std": 427.8391721268735
+  }
+}

outputs/pep-affibody-ablation-fe/libB_pseudo_bf16/last_model.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5efd660a2b0ecdf5baed0e1bcf2f8295ade391911f2e7db97d14df8c9facaf4e
+size 7524953661

outputs/pep-affibody-ablation-fe/libB_pseudo_bf16/metrics.csv ADDED Viewed

The diff for this file is too large to render. See raw diff

outputs/pep-affibody-ablation-fe/libB_pseudo_bf16/metrics.json ADDED Viewed

The diff for this file is too large to render. See raw diff

outputs/pep-affibody-ablation-fe/libB_pseudo_bf16/summary.txt ADDED Viewed

	@@ -0,0 +1,407 @@

+============================================================
+Experiment Summary
+============================================================
+Output dir: /home/pj25000082/ku50001421/mint/outputs/pep-affibody-ablation-fe/libB_pseudo_bf16
+Timestamp:  2026-02-16 18:48:31
+Duration:   83951.4 seconds (1399.2 minutes)
+--- Key Hyperparameters ---
+  lr: 0.001
+  backbone_lr: 0.0001
+  bs: 256
+  num_epochs: 10
+  unfreeze_last_n: 5
+  hidden_dim: 512
+  dropout: 0.2
+  log_transform: True
+  sep_chains: True
+  loss_fn: mse
+  huber_delta: 1.0
+  truncation_rate: 0.0
+  truncation_warmup_steps: 3000
+  truncation_consistency_bonus: 0.5
+  val_interval: 100
+  grad_clip: 1.0
+  seed: 42
+  mixed_precision: bf16
+  gradient_accumulation_steps: 2
+  lr_scheduler_type: constant
+  warmup_steps: 0
+  lr_min: 0.0
+  lr_scheduler_kwargs: {}
+  activation_checkpointing: False
+  num_workers: 4
+  prefetch_factor: 2
+  negative_weight: 1.0
+  use_binding_quality: False
+  bq_w_count: 0.7
+  bq_w_fe: 0.3
+--- Best Validation Metrics ---
+  val_0_cs0_kendall: 0.2156
+  val_0_cs0_n: 60
+  val_0_cs0_pearson: 0.21365348994731903
+  val_0_cs0_r2: -4.1103
+  val_0_cs0_rmse: 0.9724
+  val_0_cs0_spearman: 0.2781
+  val_0_cs1_kendall: 0.3810
+  val_0_cs1_n: 14
+  val_0_cs1_pearson: 0.6624651551246643
+  val_0_cs1_r2: -0.4791
+  val_0_cs1_rmse: 0.5618
+  val_0_cs1_spearman: 0.4532
+  val_0_cs2_kendall: 0.5490
+  val_0_cs2_n: 14
+  val_0_cs2_pearson: 0.8056180477142334
+  val_0_cs2_r2: 0.4388
+  val_0_cs2_rmse: 0.9954
+  val_0_cs2_spearman: 0.6675
+  val_0_cs3_kendall: 0.6030
+  val_0_cs3_n: 88
+  val_0_cs3_pearson: 0.6629645824432373
+  val_0_cs3_r2: 0.1671
+  val_0_cs3_rmse: 1.3475
+  val_0_cs3_spearman: 0.7335
+  val_0_kendall: 0.7003
+  val_0_pearson: 0.8241990208625793
+  val_0_pr_auc: 0.9677
+  val_0_r2: 0.6435
+  val_0_r2_orig: -0.0026
+  val_0_rmse: 1.1551
+  val_0_rmse_orig: 425.8286
+  val_0_roc_auc: 0.8944
+  val_0_spearman: 0.8574
+  val_0_top20_precision: 1.0000
+  val_0_top50_precision: 1.0000
+  val_1_cs0_kendall: 0.1705
+  val_1_cs0_n: 56
+  val_1_cs0_pearson: 0.1607104390859604
+  val_1_cs0_r2: -4.2089
+  val_1_cs0_rmse: 1.0479
+  val_1_cs0_spearman: 0.2263
+  val_1_cs1_kendall: 0.3552
+  val_1_cs1_n: 19
+  val_1_cs1_pearson: 0.7219028472900391
+  val_1_cs1_r2: -1.4061
+  val_1_cs1_rmse: 0.6211
+  val_1_cs1_spearman: 0.4364
+  val_1_cs2_kendall: 0.6250
+  val_1_cs2_n: 12
+  val_1_cs2_pearson: 0.8879897594451904
+  val_1_cs2_r2: 0.6522
+  val_1_cs2_rmse: 0.8304
+  val_1_cs2_spearman: 0.7666
+  val_1_cs3_kendall: 0.6641
+  val_1_cs3_n: 78
+  val_1_cs3_pearson: 0.7661534547805786
+  val_1_cs3_r2: 0.4029
+  val_1_cs3_rmse: 1.2134
+  val_1_cs3_spearman: 0.8095
+  val_1_kendall: 0.6468
+  val_1_pearson: 0.8435776829719543
+  val_1_pr_auc: 0.9530
+  val_1_r2: 0.6715
+  val_1_r2_orig: 0.0056
+  val_1_rmse: 1.0785
+  val_1_rmse_orig: 425.3369
+  val_1_roc_auc: 0.8253
+  val_1_spearman: 0.8048
+  val_1_top20_precision: 1.0000
+  val_1_top50_precision: 1.0000
+--- Best Test Metrics ---
+--- Training History (val_spearman) ---
+  step 100 (epoch 1): val_spearman=0.4002  train_loss=0.4755
+  step 200 (epoch 1): val_spearman=0.3998  train_loss=0.3835
+  step 300 (epoch 1): val_spearman=0.3618  train_loss=0.3674
+  step 400 (epoch 1): val_spearman=0.4301  train_loss=0.3556
+  step 500 (epoch 1): val_spearman=0.5208  train_loss=0.3525
+  step 600 (epoch 1): val_spearman=0.5011  train_loss=0.3524
+  step 700 (epoch 1): val_spearman=0.5102  train_loss=0.3553
+  step 800 (epoch 1): val_spearman=0.5923  train_loss=0.3336
+  step 900 (epoch 1): val_spearman=0.5592  train_loss=0.3499
+  step 1000 (epoch 1): val_spearman=0.6022  train_loss=0.3309
+  step 1100 (epoch 1): val_spearman=0.6729  train_loss=0.3378
+  step 1200 (epoch 1): val_spearman=0.6790  train_loss=0.3366
+  step 1300 (epoch 1): val_spearman=0.6750  train_loss=0.3252
+  step 1400 (epoch 1): val_spearman=0.7067  train_loss=0.3283
+  step 1500 (epoch 1): val_spearman=0.6072  train_loss=0.3320
+  step 1600 (epoch 1): val_spearman=0.6993  train_loss=0.3289
+  step 1700 (epoch 1): val_spearman=0.6476  train_loss=0.3312
+  step 1800 (epoch 1): val_spearman=0.6780  train_loss=0.3237
+  step 1900 (epoch 1): val_spearman=0.6616  train_loss=0.3295
+  step 2000 (epoch 1): val_spearman=0.6771  train_loss=0.3270
+  step 2100 (epoch 1): val_spearman=0.7104  train_loss=0.3328
+  step 2200 (epoch 1): val_spearman=0.6848  train_loss=0.3235
+  step 2300 (epoch 1): val_spearman=0.7076  train_loss=0.3243
+  step 2400 (epoch 1): val_spearman=0.6631  train_loss=0.3258
+  step 2500 (epoch 1): val_spearman=0.7335  train_loss=0.3313
+  step 2600 (epoch 1): val_spearman=0.7135  train_loss=0.3256
+  step 2700 (epoch 1): val_spearman=0.7599  train_loss=0.3250
+  step 2800 (epoch 1): val_spearman=0.7327  train_loss=0.3251
+  step 2900 (epoch 2): val_spearman=0.7286  train_loss=0.3280
+  step 3000 (epoch 2): val_spearman=0.7045  train_loss=0.3226
+  step 3100 (epoch 2): val_spearman=0.7314  train_loss=0.3182
+  step 3200 (epoch 2): val_spearman=0.7498  train_loss=0.3126
+  step 3300 (epoch 2): val_spearman=0.7618  train_loss=0.3178
+  step 3400 (epoch 2): val_spearman=0.7497  train_loss=0.3211
+  step 3500 (epoch 2): val_spearman=0.7116  train_loss=0.3228
+  step 3600 (epoch 2): val_spearman=0.7906  train_loss=0.3160
+  step 3700 (epoch 2): val_spearman=0.7276  train_loss=0.3146
+  step 3800 (epoch 2): val_spearman=0.7192  train_loss=0.3203
+  step 3900 (epoch 2): val_spearman=0.7611  train_loss=0.3152
+  step 4000 (epoch 2): val_spearman=0.7465  train_loss=0.3132
+  step 4100 (epoch 2): val_spearman=0.7588  train_loss=0.3167
+  step 4200 (epoch 2): val_spearman=0.7728  train_loss=0.3180
+  step 4300 (epoch 2): val_spearman=0.7827  train_loss=0.3137
+  step 4400 (epoch 2): val_spearman=0.7532  train_loss=0.3171
+  step 4500 (epoch 2): val_spearman=0.7677  train_loss=0.3173
+  step 4600 (epoch 2): val_spearman=0.7805  train_loss=0.3223
+  step 4700 (epoch 2): val_spearman=0.7669  train_loss=0.3137
+  step 4800 (epoch 2): val_spearman=0.7809  train_loss=0.3150
+  step 4900 (epoch 2): val_spearman=0.7627  train_loss=0.3196
+  step 5000 (epoch 2): val_spearman=0.7679  train_loss=0.3153
+  step 5100 (epoch 2): val_spearman=0.7821  train_loss=0.3182
+  step 5200 (epoch 2): val_spearman=0.7567  train_loss=0.3119
+  step 5300 (epoch 2): val_spearman=0.7915  train_loss=0.3161
+  step 5400 (epoch 2): val_spearman=0.7890  train_loss=0.3131
+  step 5500 (epoch 2): val_spearman=0.7941  train_loss=0.3148
+  step 5600 (epoch 2): val_spearman=0.7873  train_loss=0.3165
+  step 5700 (epoch 2): val_spearman=0.8025  train_loss=0.3134
+  step 5800 (epoch 3): val_spearman=0.7950  train_loss=0.3151
+  step 5900 (epoch 3): val_spearman=0.8108  train_loss=0.3074
+  step 6000 (epoch 3): val_spearman=0.8236  train_loss=0.3037
+  step 6100 (epoch 3): val_spearman=0.8253  train_loss=0.3115
+  step 6200 (epoch 3): val_spearman=0.8008  train_loss=0.3036
+  step 6300 (epoch 3): val_spearman=0.8184  train_loss=0.3031
+  step 6400 (epoch 3): val_spearman=0.8036  train_loss=0.3127
+  step 6500 (epoch 3): val_spearman=0.8262  train_loss=0.3057
+  step 6600 (epoch 3): val_spearman=0.8286  train_loss=0.3057
+  step 6700 (epoch 3): val_spearman=0.8057  train_loss=0.3049
+  step 6800 (epoch 3): val_spearman=0.8081  train_loss=0.3065
+  step 6900 (epoch 3): val_spearman=0.8071  train_loss=0.3097
+  step 7000 (epoch 3): val_spearman=0.7703  train_loss=0.3047
+  step 7100 (epoch 3): val_spearman=0.7687  train_loss=0.3128
+  step 7200 (epoch 3): val_spearman=0.8192  train_loss=0.3081
+  step 7300 (epoch 3): val_spearman=0.7907  train_loss=0.3060
+  step 7400 (epoch 3): val_spearman=0.8335  train_loss=0.3078
+  step 7500 (epoch 3): val_spearman=0.8353  train_loss=0.3058
+  step 7600 (epoch 3): val_spearman=0.8262  train_loss=0.3030
+  step 7700 (epoch 3): val_spearman=0.7816  train_loss=0.3041
+  step 7800 (epoch 3): val_spearman=0.8260  train_loss=0.3092
+  step 7900 (epoch 3): val_spearman=0.8271  train_loss=0.3121
+  step 8000 (epoch 3): val_spearman=0.8045  train_loss=0.3060
+  step 8100 (epoch 3): val_spearman=0.8065  train_loss=0.3092
+  step 8200 (epoch 3): val_spearman=0.8127  train_loss=0.3056
+  step 8300 (epoch 3): val_spearman=0.8522  train_loss=0.3035
+  step 8400 (epoch 3): val_spearman=0.8279  train_loss=0.3032
+  step 8500 (epoch 3): val_spearman=0.7696  train_loss=0.3043
+  step 8600 (epoch 3): val_spearman=0.8019  train_loss=0.3091
+  step 8700 (epoch 4): val_spearman=0.8305  train_loss=0.3000
+  step 8800 (epoch 4): val_spearman=0.8327  train_loss=0.2937
+  step 8900 (epoch 4): val_spearman=0.8328  train_loss=0.2958
+  step 9000 (epoch 4): val_spearman=0.8410  train_loss=0.2934
+  step 9100 (epoch 4): val_spearman=0.8147  train_loss=0.2920
+  step 9200 (epoch 4): val_spearman=0.8393  train_loss=0.2939
+  step 9300 (epoch 4): val_spearman=0.8374  train_loss=0.2980
+  step 9400 (epoch 4): val_spearman=0.8148  train_loss=0.2965
+  step 9500 (epoch 4): val_spearman=0.8293  train_loss=0.2966
+  step 9600 (epoch 4): val_spearman=0.8338  train_loss=0.2936
+  step 9700 (epoch 4): val_spearman=0.8351  train_loss=0.2930
+  step 9800 (epoch 4): val_spearman=0.8428  train_loss=0.2960
+  step 9900 (epoch 4): val_spearman=0.8366  train_loss=0.2918
+  step 10000 (epoch 4): val_spearman=0.8328  train_loss=0.2919
+  step 10100 (epoch 4): val_spearman=0.7875  train_loss=0.2996
+  step 10200 (epoch 4): val_spearman=0.8348  train_loss=0.2947
+  step 10300 (epoch 4): val_spearman=0.8331  train_loss=0.2984
+  step 10400 (epoch 4): val_spearman=0.8280  train_loss=0.2997
+  step 10500 (epoch 4): val_spearman=0.8456  train_loss=0.2971
+  step 10600 (epoch 4): val_spearman=0.8506  train_loss=0.2946
+  step 10700 (epoch 4): val_spearman=0.8430  train_loss=0.2898
+  step 10800 (epoch 4): val_spearman=0.8138  train_loss=0.3017
+  step 10900 (epoch 4): val_spearman=0.8340  train_loss=0.2893
+  step 11000 (epoch 4): val_spearman=0.8224  train_loss=0.2953
+  step 11100 (epoch 4): val_spearman=0.8470  train_loss=0.2918
+  step 11200 (epoch 4): val_spearman=0.8494  train_loss=0.2945
+  step 11300 (epoch 4): val_spearman=0.8489  train_loss=0.2956
+  step 11400 (epoch 4): val_spearman=0.8205  train_loss=0.2984
+  step 11500 (epoch 4): val_spearman=0.8382  train_loss=0.2965
+  step 11600 (epoch 5): val_spearman=0.8409  train_loss=0.2880
+  step 11700 (epoch 5): val_spearman=0.8279  train_loss=0.2761
+  step 11800 (epoch 5): val_spearman=0.8502  train_loss=0.2739
+  step 11900 (epoch 5): val_spearman=0.8417  train_loss=0.2820
+  step 12000 (epoch 5): val_spearman=0.8297  train_loss=0.2757
+  step 12100 (epoch 5): val_spearman=0.8439  train_loss=0.2741
+  step 12200 (epoch 5): val_spearman=0.8294  train_loss=0.2787
+  step 12300 (epoch 5): val_spearman=0.8114  train_loss=0.2780
+  step 12400 (epoch 5): val_spearman=0.8258  train_loss=0.2758
+  step 12500 (epoch 5): val_spearman=0.8336  train_loss=0.2740
+  step 12600 (epoch 5): val_spearman=0.8418  train_loss=0.2790
+  step 12700 (epoch 5): val_spearman=0.8234  train_loss=0.2784
+  step 12800 (epoch 5): val_spearman=0.8309  train_loss=0.2772
+  step 12900 (epoch 5): val_spearman=0.8363  train_loss=0.2829
+  step 13000 (epoch 5): val_spearman=0.8387  train_loss=0.2722
+  step 13100 (epoch 5): val_spearman=0.8339  train_loss=0.2735
+  step 13200 (epoch 5): val_spearman=0.8509  train_loss=0.2766
+  step 13300 (epoch 5): val_spearman=0.8283  train_loss=0.2801
+  step 13400 (epoch 5): val_spearman=0.8264  train_loss=0.2779
+  step 13500 (epoch 5): val_spearman=0.8189  train_loss=0.2802
+  step 13600 (epoch 5): val_spearman=0.8364  train_loss=0.2863
+  step 13700 (epoch 5): val_spearman=0.8282  train_loss=0.2816
+  step 13800 (epoch 5): val_spearman=0.8332  train_loss=0.2771
+  step 13900 (epoch 5): val_spearman=0.8305  train_loss=0.2797
+  step 14000 (epoch 5): val_spearman=0.8279  train_loss=0.2781
+  step 14100 (epoch 5): val_spearman=0.8404  train_loss=0.2826
+  step 14200 (epoch 5): val_spearman=0.8544  train_loss=0.2747
+  step 14300 (epoch 5): val_spearman=0.8383  train_loss=0.2831
+  step 14400 (epoch 5): val_spearman=0.8369  train_loss=0.2850
+  step 14500 (epoch 6): val_spearman=0.8354  train_loss=0.2710
+  step 14600 (epoch 6): val_spearman=0.8300  train_loss=0.2508
+  step 14700 (epoch 6): val_spearman=0.8354  train_loss=0.2515
+  step 14800 (epoch 6): val_spearman=0.8400  train_loss=0.2499
+  step 14900 (epoch 6): val_spearman=0.8379  train_loss=0.2522
+  step 15000 (epoch 6): val_spearman=0.8232  train_loss=0.2493
+  step 15100 (epoch 6): val_spearman=0.8278  train_loss=0.2523
+  step 15200 (epoch 6): val_spearman=0.8269  train_loss=0.2551
+  step 15300 (epoch 6): val_spearman=0.8331  train_loss=0.2528
+  step 15400 (epoch 6): val_spearman=0.8324  train_loss=0.2549
+  step 15500 (epoch 6): val_spearman=0.8192  train_loss=0.2558
+  step 15600 (epoch 6): val_spearman=0.8158  train_loss=0.2544
+  step 15700 (epoch 6): val_spearman=0.8011  train_loss=0.2510
+  step 15800 (epoch 6): val_spearman=0.8387  train_loss=0.2553
+  step 15900 (epoch 6): val_spearman=0.8131  train_loss=0.2565
+  step 16000 (epoch 6): val_spearman=0.7877  train_loss=0.2558
+  step 16100 (epoch 6): val_spearman=0.7925  train_loss=0.2523
+  step 16200 (epoch 6): val_spearman=0.8176  train_loss=0.2547
+  step 16300 (epoch 6): val_spearman=0.8234  train_loss=0.2538
+  step 16400 (epoch 6): val_spearman=0.8266  train_loss=0.2546
+  step 16500 (epoch 6): val_spearman=0.7923  train_loss=0.2566
+  step 16600 (epoch 6): val_spearman=0.7765  train_loss=0.2552
+  step 16700 (epoch 6): val_spearman=0.8091  train_loss=0.2558
+  step 16800 (epoch 6): val_spearman=0.8167  train_loss=0.2600
+  step 16900 (epoch 6): val_spearman=0.8427  train_loss=0.2571
+  step 17000 (epoch 6): val_spearman=0.8231  train_loss=0.2560
+  step 17100 (epoch 6): val_spearman=0.8282  train_loss=0.2524
+  step 17200 (epoch 6): val_spearman=0.8178  train_loss=0.2491
+  step 17300 (epoch 6): val_spearman=0.8430  train_loss=0.2518
+  step 17400 (epoch 7): val_spearman=0.8298  train_loss=0.2417
+  step 17500 (epoch 7): val_spearman=0.8379  train_loss=0.2157
+  step 17600 (epoch 7): val_spearman=0.8314  train_loss=0.2148
+  step 17700 (epoch 7): val_spearman=0.8321  train_loss=0.2184
+  step 17800 (epoch 7): val_spearman=0.8276  train_loss=0.2160
+  step 17900 (epoch 7): val_spearman=0.8434  train_loss=0.2202
+  step 18000 (epoch 7): val_spearman=0.8198  train_loss=0.2173
+  step 18100 (epoch 7): val_spearman=0.8182  train_loss=0.2249
+  step 18200 (epoch 7): val_spearman=0.8574  train_loss=0.2230
+  step 18300 (epoch 7): val_spearman=0.7976  train_loss=0.2188
+  step 18400 (epoch 7): val_spearman=0.8164  train_loss=0.2223
+  step 18500 (epoch 7): val_spearman=0.8203  train_loss=0.2225
+  step 18600 (epoch 7): val_spearman=0.8036  train_loss=0.2179
+  step 18700 (epoch 7): val_spearman=0.8321  train_loss=0.2166
+  step 18800 (epoch 7): val_spearman=0.8247  train_loss=0.2284
+  step 18900 (epoch 7): val_spearman=0.8291  train_loss=0.2275
+  step 19000 (epoch 7): val_spearman=0.8247  train_loss=0.2256
+  step 19100 (epoch 7): val_spearman=0.8103  train_loss=0.2252
+  step 19200 (epoch 7): val_spearman=0.8200  train_loss=0.2215
+  step 19300 (epoch 7): val_spearman=0.7826  train_loss=0.2254
+  step 19400 (epoch 7): val_spearman=0.8030  train_loss=0.2262
+  step 19500 (epoch 7): val_spearman=0.7987  train_loss=0.2239
+  step 19600 (epoch 7): val_spearman=0.8278  train_loss=0.2294
+  step 19700 (epoch 7): val_spearman=0.8073  train_loss=0.2216
+  step 19800 (epoch 7): val_spearman=0.8380  train_loss=0.2222
+  step 19900 (epoch 7): val_spearman=0.8328  train_loss=0.2188
+  step 20000 (epoch 7): val_spearman=0.8235  train_loss=0.2234
+  step 20100 (epoch 7): val_spearman=0.8227  train_loss=0.2302
+  step 20200 (epoch 7): val_spearman=0.8375  train_loss=0.2271
+  step 20300 (epoch 8): val_spearman=0.8444  train_loss=0.2103
+  step 20400 (epoch 8): val_spearman=0.8245  train_loss=0.1798
+  step 20500 (epoch 8): val_spearman=0.8064  train_loss=0.1790
+  step 20600 (epoch 8): val_spearman=0.8196  train_loss=0.1853
+  step 20700 (epoch 8): val_spearman=0.8127  train_loss=0.1830
+  step 20800 (epoch 8): val_spearman=0.8184  train_loss=0.1805
+  step 20900 (epoch 8): val_spearman=0.8061  train_loss=0.1858
+  step 21000 (epoch 8): val_spearman=0.8104  train_loss=0.1858
+  step 21100 (epoch 8): val_spearman=0.8109  train_loss=0.1849
+  step 21200 (epoch 8): val_spearman=0.8162  train_loss=0.1916
+  step 21300 (epoch 8): val_spearman=0.8056  train_loss=0.1876
+  step 21400 (epoch 8): val_spearman=0.8211  train_loss=0.1870
+  step 21500 (epoch 8): val_spearman=0.8292  train_loss=0.1864
+  step 21600 (epoch 8): val_spearman=0.8322  train_loss=0.1862
+  step 21700 (epoch 8): val_spearman=0.8245  train_loss=0.1868
+  step 21800 (epoch 8): val_spearman=0.8224  train_loss=0.1895
+  step 21900 (epoch 8): val_spearman=0.8371  train_loss=0.1901
+  step 22000 (epoch 8): val_spearman=0.8341  train_loss=0.1872
+  step 22100 (epoch 8): val_spearman=0.8309  train_loss=0.1879
+  step 22200 (epoch 8): val_spearman=0.8356  train_loss=0.1898
+  step 22300 (epoch 8): val_spearman=0.8307  train_loss=0.1876
+  step 22400 (epoch 8): val_spearman=0.8190  train_loss=0.1863
+  step 22500 (epoch 8): val_spearman=0.8232  train_loss=0.1885
+  step 22600 (epoch 8): val_spearman=0.8472  train_loss=0.1899
+  step 22700 (epoch 8): val_spearman=0.8271  train_loss=0.1910
+  step 22800 (epoch 8): val_spearman=0.8417  train_loss=0.1898
+  step 22900 (epoch 8): val_spearman=0.8468  train_loss=0.1891
+  step 23000 (epoch 8): val_spearman=0.8162  train_loss=0.1929
+  step 23100 (epoch 8): val_spearman=0.8312  train_loss=0.1861
+  step 23200 (epoch 9): val_spearman=0.8483  train_loss=0.1706
+  step 23300 (epoch 9): val_spearman=0.8381  train_loss=0.1465
+  step 23400 (epoch 9): val_spearman=0.8448  train_loss=0.1463
+  step 23500 (epoch 9): val_spearman=0.8297  train_loss=0.1476
+  step 23600 (epoch 9): val_spearman=0.8427  train_loss=0.1479
+  step 23700 (epoch 9): val_spearman=0.8299  train_loss=0.1492
+  step 23800 (epoch 9): val_spearman=0.8290  train_loss=0.1512
+  step 23900 (epoch 9): val_spearman=0.8368  train_loss=0.1505
+  step 24000 (epoch 9): val_spearman=0.8186  train_loss=0.1532
+  step 24100 (epoch 9): val_spearman=0.8286  train_loss=0.1496
+  step 24200 (epoch 9): val_spearman=0.8415  train_loss=0.1507
+  step 24300 (epoch 9): val_spearman=0.8488  train_loss=0.1513
+  step 24400 (epoch 9): val_spearman=0.8498  train_loss=0.1497
+  step 24500 (epoch 9): val_spearman=0.8522  train_loss=0.1560
+  step 24600 (epoch 9): val_spearman=0.8513  train_loss=0.1490
+  step 24700 (epoch 9): val_spearman=0.8284  train_loss=0.1543
+  step 24800 (epoch 9): val_spearman=0.8234  train_loss=0.1542
+  step 24900 (epoch 9): val_spearman=0.8147  train_loss=0.1525
+  step 25000 (epoch 9): val_spearman=0.8215  train_loss=0.1543
+  step 25100 (epoch 9): val_spearman=0.8334  train_loss=0.1550
+  step 25200 (epoch 9): val_spearman=0.8295  train_loss=0.1565
+  step 25300 (epoch 9): val_spearman=0.8220  train_loss=0.1602
+  step 25400 (epoch 9): val_spearman=0.8320  train_loss=0.1590
+  step 25500 (epoch 9): val_spearman=0.8422  train_loss=0.1617
+  step 25600 (epoch 9): val_spearman=0.8221  train_loss=0.1546
+  step 25700 (epoch 9): val_spearman=0.8255  train_loss=0.1555
+  step 25800 (epoch 9): val_spearman=0.8234  train_loss=0.1589
+  step 25900 (epoch 9): val_spearman=0.8169  train_loss=0.1547
+  step 26000 (epoch 9): val_spearman=0.8078  train_loss=0.1585
+  step 26100 (epoch 10): val_spearman=0.8251  train_loss=0.1381
+  step 26200 (epoch 10): val_spearman=0.8006  train_loss=0.1157
+  step 26300 (epoch 10): val_spearman=0.8446  train_loss=0.1167
+  step 26400 (epoch 10): val_spearman=0.8497  train_loss=0.1171
+  step 26500 (epoch 10): val_spearman=0.8121  train_loss=0.1210
+  step 26600 (epoch 10): val_spearman=0.8385  train_loss=0.1152
+  step 26700 (epoch 10): val_spearman=0.8209  train_loss=0.1181
+  step 26800 (epoch 10): val_spearman=0.8127  train_loss=0.1227
+  step 26900 (epoch 10): val_spearman=0.7972  train_loss=0.1243
+  step 27000 (epoch 10): val_spearman=0.8212  train_loss=0.1225
+  step 27100 (epoch 10): val_spearman=0.8100  train_loss=0.1228
+  step 27200 (epoch 10): val_spearman=0.8089  train_loss=0.1275
+  step 27300 (epoch 10): val_spearman=0.8190  train_loss=0.1242
+  step 27400 (epoch 10): val_spearman=0.8336  train_loss=0.1245
+  step 27500 (epoch 10): val_spearman=0.8118  train_loss=0.1229
+  step 27600 (epoch 10): val_spearman=0.8238  train_loss=0.1256
+  step 27700 (epoch 10): val_spearman=0.8090  train_loss=0.1257
+  step 27800 (epoch 10): val_spearman=0.7854  train_loss=0.1272
+  step 27900 (epoch 10): val_spearman=0.8196  train_loss=0.1283
+  step 28000 (epoch 10): val_spearman=0.8283  train_loss=0.1280
+  step 28100 (epoch 10): val_spearman=0.8144  train_loss=0.1276
+  step 28200 (epoch 10): val_spearman=0.8124  train_loss=0.1256
+  step 28300 (epoch 10): val_spearman=0.8188  train_loss=0.1299
+  step 28400 (epoch 10): val_spearman=0.7993  train_loss=0.1271
+  step 28500 (epoch 10): val_spearman=0.8174  train_loss=0.1266
+  step 28600 (epoch 10): val_spearman=0.7845  train_loss=0.1284
+  step 28700 (epoch 10): val_spearman=0.8076  train_loss=0.1269
+  step 28800 (epoch 10): val_spearman=0.8182  train_loss=0.1328
+  step 28900 (epoch 10): val_spearman=0.8231  train_loss=0.1283
+  step 28930 (epoch 11): val_spearman=0.8038  train_loss=0.1253
+============================================================

outputs/pep-affibody-ablation-fe/libB_pseudo_bf16/train.log ADDED Viewed

The diff for this file is too large to render. See raw diff