igor174 committed on
Commit
3fe92cc
·
verified ·
1 Parent(s): 06587f4

Upload CAUM (jax) trained on MIND-small — 3 seeds

Browse files
seed_42/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:46661584d959a93125cf9e06b08b854139a5e1b41f9fcaf59f431ddde61d5553
3
  size 47322396
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fdb3f797c03b0806b9d95206884cb6473b2633417d76fa09c756f15edfefa39
3
  size 47322396
seed_42/test_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "loss": 4.885279593137135,
3
- "auc": 0.6716255651925904,
4
- "mrr": 0.31951080672544796,
5
- "ndcg@5": 0.3533953887559558,
6
- "ndcg@10": 0.417788739745737,
7
  "num_impressions": 72903.0
8
  }
 
1
  {
2
+ "loss": 4.885290258142447,
3
+ "auc": 0.6716320262703661,
4
+ "mrr": 0.31951266628908737,
5
+ "ndcg@5": 0.35341487453541737,
6
+ "ndcg@10": 0.4177790125019271,
7
  "num_impressions": 72903.0
8
  }
seed_42/training_run_summary.json CHANGED
@@ -257,44 +257,44 @@
257
  "initial_validation_metrics": {},
258
  "best_validation_summary": {
259
  "epoch_number": 8.0,
260
- "train_loss": 1.2569683923193469,
261
- "average_metric_value": 0.5173871047050278,
262
- "val_loss": 4.491243967664317,
263
- "val_auc": 0.7467889007717999,
264
- "val_mrr": 0.3941287371779766,
265
- "val_ndcg@5": 0.43629077698141816,
266
- "val_ndcg@10": 0.4923400038889164,
267
  "val_num_impressions": 7824.0,
268
  "timing": {
269
  "epoch_training_times": [
270
- 163.71576189994812,
271
- 128.66470193862915,
272
- 124.40946054458618,
273
- 122.63417339324951,
274
- 123.02388978004456,
275
- 124.40860843658447,
276
- 123.64945530891418,
277
- 124.03472113609314
278
  ],
279
  "epoch_validation_times": [
280
- 225.55031847953796,
281
- 155.1456437110901,
282
- 154.2360875606537,
283
- 154.55679368972778,
284
- 155.49029302597046,
285
- 155.03285694122314,
286
- 156.5079698562622,
287
- 172.0624237060547
288
  ],
289
- "total_training_time": 2363.861449956894
290
  }
291
  },
292
  "final_test_metrics": {
293
- "loss": 4.885279593137135,
294
- "auc": 0.6716255651925904,
295
- "mrr": 0.31951080672544796,
296
- "ndcg@5": 0.3533953887559558,
297
- "ndcg@10": 0.417788739745737,
298
  "num_impressions": 72903.0
299
  }
300
  }
 
257
  "initial_validation_metrics": {},
258
  "best_validation_summary": {
259
  "epoch_number": 8.0,
260
+ "train_loss": 1.256968167472918,
261
+ "average_metric_value": 0.5174154410910897,
262
+ "val_loss": 4.49124723870549,
263
+ "val_auc": 0.7468131525042653,
264
+ "val_mrr": 0.3941594308823248,
265
+ "val_ndcg@5": 0.4363602148970487,
266
+ "val_ndcg@10": 0.49232896608071997,
267
  "val_num_impressions": 7824.0,
268
  "timing": {
269
  "epoch_training_times": [
270
+ 163.05336737632751,
271
+ 125.91719460487366,
272
+ 123.6555745601654,
273
+ 124.48746538162231,
274
+ 126.33813762664795,
275
+ 125.54173946380615,
276
+ 122.81819033622742,
277
+ 124.80581545829773
278
  ],
279
  "epoch_validation_times": [
280
+ 224.672523021698,
281
+ 151.31402707099915,
282
+ 151.30706453323364,
283
+ 151.26560187339783,
284
+ 159.7723400592804,
285
+ 153.1495270729065,
286
+ 153.66180729866028,
287
+ 155.1824631690979
288
  ],
289
+ "total_training_time": 2337.687963247299
290
  }
291
  },
292
  "final_test_metrics": {
293
+ "loss": 4.885290258142447,
294
+ "auc": 0.6716320262703661,
295
+ "mrr": 0.31951266628908737,
296
+ "ndcg@5": 0.35341487453541737,
297
+ "ndcg@10": 0.4177790125019271,
298
  "num_impressions": 72903.0
299
  }
300
  }