| { |
| "best_global_step": 2184, |
| "best_metric": 0.862, |
| "best_model_checkpoint": "dfine_squirrel/checkpoint-2184", |
| "epoch": 30.0, |
| "eval_steps": 500, |
| "global_step": 2730, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 1.0, |
| "eval_loss": 2.367178440093994, |
| "eval_map": 0.1766, |
| "eval_map_50": 0.23, |
| "eval_map_75": 0.1862, |
| "eval_map_class_0": 0.1766, |
| "eval_map_large": 0.1989, |
| "eval_map_medium": 0.0031, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.3422, |
| "eval_mar_10": 0.5248, |
| "eval_mar_100": 0.6224, |
| "eval_mar_100_class_0": 0.6224, |
| "eval_mar_large": 0.651, |
| "eval_mar_medium": 0.3462, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.6845, |
| "eval_samples_per_second": 19.149, |
| "eval_steps_per_second": 2.394, |
| "step": 91 |
| }, |
| { |
| "epoch": 2.0, |
| "eval_loss": 1.0650697946548462, |
| "eval_map": 0.7244, |
| "eval_map_50": 0.8127, |
| "eval_map_75": 0.7856, |
| "eval_map_class_0": 0.7244, |
| "eval_map_large": 0.7538, |
| "eval_map_medium": 0.4261, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.6901, |
| "eval_mar_10": 0.7888, |
| "eval_mar_100": 0.8596, |
| "eval_mar_100_class_0": 0.8596, |
| "eval_mar_large": 0.885, |
| "eval_mar_medium": 0.6385, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.633, |
| "eval_samples_per_second": 19.298, |
| "eval_steps_per_second": 2.412, |
| "step": 182 |
| }, |
| { |
| "epoch": 3.0, |
| "eval_loss": 0.8899274468421936, |
| "eval_map": 0.7577, |
| "eval_map_50": 0.8321, |
| "eval_map_75": 0.7881, |
| "eval_map_class_0": 0.7577, |
| "eval_map_large": 0.7986, |
| "eval_map_medium": 0.4732, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.7137, |
| "eval_mar_10": 0.8311, |
| "eval_mar_100": 0.8863, |
| "eval_mar_100_class_0": 0.8863, |
| "eval_mar_large": 0.9109, |
| "eval_mar_medium": 0.6769, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.5407, |
| "eval_samples_per_second": 19.57, |
| "eval_steps_per_second": 2.446, |
| "step": 273 |
| }, |
| { |
| "epoch": 4.0, |
| "eval_loss": 0.8310188055038452, |
| "eval_map": 0.7773, |
| "eval_map_50": 0.8432, |
| "eval_map_75": 0.8045, |
| "eval_map_class_0": 0.7773, |
| "eval_map_large": 0.814, |
| "eval_map_medium": 0.586, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.7124, |
| "eval_mar_10": 0.841, |
| "eval_mar_100": 0.8894, |
| "eval_mar_100_class_0": 0.8894, |
| "eval_mar_large": 0.9122, |
| "eval_mar_medium": 0.7, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.599, |
| "eval_samples_per_second": 19.397, |
| "eval_steps_per_second": 2.425, |
| "step": 364 |
| }, |
| { |
| "epoch": 5.0, |
| "eval_loss": 0.8332623243331909, |
| "eval_map": 0.7792, |
| "eval_map_50": 0.8513, |
| "eval_map_75": 0.8058, |
| "eval_map_class_0": 0.7792, |
| "eval_map_large": 0.8197, |
| "eval_map_medium": 0.6129, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.718, |
| "eval_mar_10": 0.8317, |
| "eval_mar_100": 0.9031, |
| "eval_mar_100_class_0": 0.9031, |
| "eval_mar_large": 0.9265, |
| "eval_mar_medium": 0.7077, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.61, |
| "eval_samples_per_second": 19.365, |
| "eval_steps_per_second": 2.421, |
| "step": 455 |
| }, |
| { |
| "epoch": 5.4945054945054945, |
| "grad_norm": 45.534889221191406, |
| "learning_rate": 4.086080586080586e-05, |
| "loss": 27.38396484375, |
| "step": 500 |
| }, |
| { |
| "epoch": 6.0, |
| "eval_loss": 0.8361273407936096, |
| "eval_map": 0.8008, |
| "eval_map_50": 0.8684, |
| "eval_map_75": 0.8296, |
| "eval_map_class_0": 0.8008, |
| "eval_map_large": 0.8348, |
| "eval_map_medium": 0.5788, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.723, |
| "eval_mar_10": 0.8609, |
| "eval_mar_100": 0.9124, |
| "eval_mar_100_class_0": 0.9124, |
| "eval_mar_large": 0.9367, |
| "eval_mar_medium": 0.7077, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.591, |
| "eval_samples_per_second": 19.42, |
| "eval_steps_per_second": 2.428, |
| "step": 546 |
| }, |
| { |
| "epoch": 7.0, |
| "eval_loss": 0.8077548146247864, |
| "eval_map": 0.8, |
| "eval_map_50": 0.8587, |
| "eval_map_75": 0.8191, |
| "eval_map_class_0": 0.8, |
| "eval_map_large": 0.8365, |
| "eval_map_medium": 0.5968, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.7224, |
| "eval_mar_10": 0.8739, |
| "eval_mar_100": 0.9211, |
| "eval_mar_100_class_0": 0.9211, |
| "eval_mar_large": 0.9442, |
| "eval_mar_medium": 0.7308, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.4826, |
| "eval_samples_per_second": 19.745, |
| "eval_steps_per_second": 2.468, |
| "step": 637 |
| }, |
| { |
| "epoch": 8.0, |
| "eval_loss": 0.8231956958770752, |
| "eval_map": 0.8173, |
| "eval_map_50": 0.8877, |
| "eval_map_75": 0.837, |
| "eval_map_class_0": 0.8173, |
| "eval_map_large": 0.8476, |
| "eval_map_medium": 0.6199, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.7205, |
| "eval_mar_10": 0.8677, |
| "eval_mar_100": 0.9161, |
| "eval_mar_100_class_0": 0.9161, |
| "eval_mar_large": 0.9415, |
| "eval_mar_medium": 0.7, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.4352, |
| "eval_samples_per_second": 19.891, |
| "eval_steps_per_second": 2.486, |
| "step": 728 |
| }, |
| { |
| "epoch": 9.0, |
| "eval_loss": 0.7746098041534424, |
| "eval_map": 0.8268, |
| "eval_map_50": 0.8863, |
| "eval_map_75": 0.8541, |
| "eval_map_class_0": 0.8268, |
| "eval_map_large": 0.8577, |
| "eval_map_medium": 0.6029, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.7211, |
| "eval_mar_10": 0.8702, |
| "eval_mar_100": 0.9224, |
| "eval_mar_100_class_0": 0.9224, |
| "eval_mar_large": 0.951, |
| "eval_mar_medium": 0.6692, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.6084, |
| "eval_samples_per_second": 19.369, |
| "eval_steps_per_second": 2.421, |
| "step": 819 |
| }, |
| { |
| "epoch": 10.0, |
| "eval_loss": 0.8223000764846802, |
| "eval_map": 0.8324, |
| "eval_map_50": 0.8875, |
| "eval_map_75": 0.8682, |
| "eval_map_class_0": 0.8324, |
| "eval_map_large": 0.8586, |
| "eval_map_medium": 0.6198, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.7311, |
| "eval_mar_10": 0.8801, |
| "eval_mar_100": 0.9193, |
| "eval_mar_100_class_0": 0.9193, |
| "eval_mar_large": 0.9456, |
| "eval_mar_medium": 0.6923, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.6591, |
| "eval_samples_per_second": 19.222, |
| "eval_steps_per_second": 2.403, |
| "step": 910 |
| }, |
| { |
| "epoch": 10.989010989010989, |
| "grad_norm": 34.31671142578125, |
| "learning_rate": 3.17032967032967e-05, |
| "loss": 9.0921865234375, |
| "step": 1000 |
| }, |
| { |
| "epoch": 11.0, |
| "eval_loss": 0.7678491473197937, |
| "eval_map": 0.8327, |
| "eval_map_50": 0.8851, |
| "eval_map_75": 0.8689, |
| "eval_map_class_0": 0.8327, |
| "eval_map_large": 0.8634, |
| "eval_map_medium": 0.5991, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.7422, |
| "eval_mar_10": 0.8671, |
| "eval_mar_100": 0.9255, |
| "eval_mar_100_class_0": 0.9255, |
| "eval_mar_large": 0.9531, |
| "eval_mar_medium": 0.6846, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.6366, |
| "eval_samples_per_second": 19.287, |
| "eval_steps_per_second": 2.411, |
| "step": 1001 |
| }, |
| { |
| "epoch": 12.0, |
| "eval_loss": 0.7850316166877747, |
| "eval_map": 0.8328, |
| "eval_map_50": 0.8888, |
| "eval_map_75": 0.8545, |
| "eval_map_class_0": 0.8328, |
| "eval_map_large": 0.8635, |
| "eval_map_medium": 0.6134, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.7366, |
| "eval_mar_10": 0.8752, |
| "eval_mar_100": 0.9335, |
| "eval_mar_100_class_0": 0.9335, |
| "eval_mar_large": 0.9585, |
| "eval_mar_medium": 0.7231, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.866, |
| "eval_samples_per_second": 18.643, |
| "eval_steps_per_second": 2.33, |
| "step": 1092 |
| }, |
| { |
| "epoch": 13.0, |
| "eval_loss": 0.8330104351043701, |
| "eval_map": 0.8294, |
| "eval_map_50": 0.8882, |
| "eval_map_75": 0.8485, |
| "eval_map_class_0": 0.8294, |
| "eval_map_large": 0.8585, |
| "eval_map_medium": 0.583, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.7416, |
| "eval_mar_10": 0.8689, |
| "eval_mar_100": 0.9267, |
| "eval_mar_100_class_0": 0.9267, |
| "eval_mar_large": 0.9503, |
| "eval_mar_medium": 0.7308, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.6667, |
| "eval_samples_per_second": 19.2, |
| "eval_steps_per_second": 2.4, |
| "step": 1183 |
| }, |
| { |
| "epoch": 14.0, |
| "eval_loss": 0.7800494432449341, |
| "eval_map": 0.8399, |
| "eval_map_50": 0.8977, |
| "eval_map_75": 0.8761, |
| "eval_map_class_0": 0.8399, |
| "eval_map_large": 0.87, |
| "eval_map_medium": 0.5989, |
| "eval_map_small": 0.0056, |
| "eval_mar_1": 0.741, |
| "eval_mar_10": 0.8758, |
| "eval_mar_100": 0.9348, |
| "eval_mar_100_class_0": 0.9348, |
| "eval_mar_large": 0.9517, |
| "eval_mar_medium": 0.7692, |
| "eval_mar_small": 0.6, |
| "eval_runtime": 6.5377, |
| "eval_samples_per_second": 19.579, |
| "eval_steps_per_second": 2.447, |
| "step": 1274 |
| }, |
| { |
| "epoch": 15.0, |
| "eval_loss": 0.7594577074050903, |
| "eval_map": 0.8437, |
| "eval_map_50": 0.8993, |
| "eval_map_75": 0.8771, |
| "eval_map_class_0": 0.8437, |
| "eval_map_large": 0.8731, |
| "eval_map_medium": 0.6092, |
| "eval_map_small": 0.0061, |
| "eval_mar_1": 0.7509, |
| "eval_mar_10": 0.8925, |
| "eval_mar_100": 0.9466, |
| "eval_mar_100_class_0": 0.9466, |
| "eval_mar_large": 0.9633, |
| "eval_mar_medium": 0.7846, |
| "eval_mar_small": 0.6, |
| "eval_runtime": 6.6179, |
| "eval_samples_per_second": 19.341, |
| "eval_steps_per_second": 2.418, |
| "step": 1365 |
| }, |
| { |
| "epoch": 16.0, |
| "eval_loss": 0.7757935523986816, |
| "eval_map": 0.843, |
| "eval_map_50": 0.9059, |
| "eval_map_75": 0.8657, |
| "eval_map_class_0": 0.843, |
| "eval_map_large": 0.8713, |
| "eval_map_medium": 0.6186, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.7472, |
| "eval_mar_10": 0.8783, |
| "eval_mar_100": 0.9385, |
| "eval_mar_100_class_0": 0.9385, |
| "eval_mar_large": 0.9633, |
| "eval_mar_medium": 0.7308, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.6266, |
| "eval_samples_per_second": 19.316, |
| "eval_steps_per_second": 2.415, |
| "step": 1456 |
| }, |
| { |
| "epoch": 16.483516483516482, |
| "grad_norm": 38.72512435913086, |
| "learning_rate": 2.2545787545787548e-05, |
| "loss": 8.323384765625, |
| "step": 1500 |
| }, |
| { |
| "epoch": 17.0, |
| "eval_loss": 0.8078031539916992, |
| "eval_map": 0.844, |
| "eval_map_50": 0.9017, |
| "eval_map_75": 0.8816, |
| "eval_map_class_0": 0.844, |
| "eval_map_large": 0.8754, |
| "eval_map_medium": 0.6091, |
| "eval_map_small": 0.009, |
| "eval_mar_1": 0.7453, |
| "eval_mar_10": 0.8957, |
| "eval_mar_100": 0.9366, |
| "eval_mar_100_class_0": 0.9366, |
| "eval_mar_large": 0.9592, |
| "eval_mar_medium": 0.7077, |
| "eval_mar_small": 0.6, |
| "eval_runtime": 6.5387, |
| "eval_samples_per_second": 19.576, |
| "eval_steps_per_second": 2.447, |
| "step": 1547 |
| }, |
| { |
| "epoch": 18.0, |
| "eval_loss": 0.771867036819458, |
| "eval_map": 0.8479, |
| "eval_map_50": 0.9069, |
| "eval_map_75": 0.8728, |
| "eval_map_class_0": 0.8479, |
| "eval_map_large": 0.8785, |
| "eval_map_medium": 0.6086, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.7522, |
| "eval_mar_10": 0.8882, |
| "eval_mar_100": 0.9273, |
| "eval_mar_100_class_0": 0.9273, |
| "eval_mar_large": 0.9531, |
| "eval_mar_medium": 0.7077, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.8246, |
| "eval_samples_per_second": 18.756, |
| "eval_steps_per_second": 2.344, |
| "step": 1638 |
| }, |
| { |
| "epoch": 19.0, |
| "eval_loss": 0.756177544593811, |
| "eval_map": 0.8552, |
| "eval_map_50": 0.9105, |
| "eval_map_75": 0.8779, |
| "eval_map_class_0": 0.8552, |
| "eval_map_large": 0.8853, |
| "eval_map_medium": 0.6193, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.7509, |
| "eval_mar_10": 0.8882, |
| "eval_mar_100": 0.9323, |
| "eval_mar_100_class_0": 0.9323, |
| "eval_mar_large": 0.9585, |
| "eval_mar_medium": 0.7077, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.5483, |
| "eval_samples_per_second": 19.547, |
| "eval_steps_per_second": 2.443, |
| "step": 1729 |
| }, |
| { |
| "epoch": 20.0, |
| "eval_loss": 0.8165637850761414, |
| "eval_map": 0.8478, |
| "eval_map_50": 0.9076, |
| "eval_map_75": 0.8774, |
| "eval_map_class_0": 0.8478, |
| "eval_map_large": 0.8765, |
| "eval_map_medium": 0.6428, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.7528, |
| "eval_mar_10": 0.8988, |
| "eval_mar_100": 0.9379, |
| "eval_mar_100_class_0": 0.9379, |
| "eval_mar_large": 0.9633, |
| "eval_mar_medium": 0.7231, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.5543, |
| "eval_samples_per_second": 19.529, |
| "eval_steps_per_second": 2.441, |
| "step": 1820 |
| }, |
| { |
| "epoch": 21.0, |
| "eval_loss": 0.7615771293640137, |
| "eval_map": 0.8519, |
| "eval_map_50": 0.9053, |
| "eval_map_75": 0.8843, |
| "eval_map_class_0": 0.8519, |
| "eval_map_large": 0.8818, |
| "eval_map_medium": 0.6332, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.7578, |
| "eval_mar_10": 0.8919, |
| "eval_mar_100": 0.9385, |
| "eval_mar_100_class_0": 0.9385, |
| "eval_mar_large": 0.9646, |
| "eval_mar_medium": 0.7154, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.6955, |
| "eval_samples_per_second": 19.117, |
| "eval_steps_per_second": 2.39, |
| "step": 1911 |
| }, |
| { |
| "epoch": 21.978021978021978, |
| "grad_norm": 37.53008270263672, |
| "learning_rate": 1.3388278388278389e-05, |
| "loss": 7.99486328125, |
| "step": 2000 |
| }, |
| { |
| "epoch": 22.0, |
| "eval_loss": 0.7444530129432678, |
| "eval_map": 0.857, |
| "eval_map_50": 0.9102, |
| "eval_map_75": 0.8872, |
| "eval_map_class_0": 0.857, |
| "eval_map_large": 0.8856, |
| "eval_map_medium": 0.6327, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.7497, |
| "eval_mar_10": 0.8839, |
| "eval_mar_100": 0.9354, |
| "eval_mar_100_class_0": 0.9354, |
| "eval_mar_large": 0.9605, |
| "eval_mar_medium": 0.7231, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.5313, |
| "eval_samples_per_second": 19.598, |
| "eval_steps_per_second": 2.45, |
| "step": 2002 |
| }, |
| { |
| "epoch": 23.0, |
| "eval_loss": 0.7569313645362854, |
| "eval_map": 0.85, |
| "eval_map_50": 0.9003, |
| "eval_map_75": 0.8792, |
| "eval_map_class_0": 0.85, |
| "eval_map_large": 0.8802, |
| "eval_map_medium": 0.6308, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.7516, |
| "eval_mar_10": 0.9019, |
| "eval_mar_100": 0.9366, |
| "eval_mar_100_class_0": 0.9366, |
| "eval_mar_large": 0.9626, |
| "eval_mar_medium": 0.7154, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.5869, |
| "eval_samples_per_second": 19.433, |
| "eval_steps_per_second": 2.429, |
| "step": 2093 |
| }, |
| { |
| "epoch": 24.0, |
| "eval_loss": 0.755048930644989, |
| "eval_map": 0.862, |
| "eval_map_50": 0.9093, |
| "eval_map_75": 0.8837, |
| "eval_map_class_0": 0.862, |
| "eval_map_large": 0.8917, |
| "eval_map_medium": 0.6277, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.7516, |
| "eval_mar_10": 0.8882, |
| "eval_mar_100": 0.9441, |
| "eval_mar_100_class_0": 0.9441, |
| "eval_mar_large": 0.9653, |
| "eval_mar_medium": 0.7769, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.6153, |
| "eval_samples_per_second": 19.349, |
| "eval_steps_per_second": 2.419, |
| "step": 2184 |
| }, |
| { |
| "epoch": 25.0, |
| "eval_loss": 0.7434877753257751, |
| "eval_map": 0.8561, |
| "eval_map_50": 0.9053, |
| "eval_map_75": 0.8875, |
| "eval_map_class_0": 0.8561, |
| "eval_map_large": 0.885, |
| "eval_map_medium": 0.6371, |
| "eval_map_small": 0.0055, |
| "eval_mar_1": 0.7559, |
| "eval_mar_10": 0.8981, |
| "eval_mar_100": 0.9478, |
| "eval_mar_100_class_0": 0.9478, |
| "eval_mar_large": 0.9633, |
| "eval_mar_medium": 0.7923, |
| "eval_mar_small": 0.7, |
| "eval_runtime": 6.5533, |
| "eval_samples_per_second": 19.532, |
| "eval_steps_per_second": 2.442, |
| "step": 2275 |
| }, |
| { |
| "epoch": 26.0, |
| "eval_loss": 0.7752219438552856, |
| "eval_map": 0.8441, |
| "eval_map_50": 0.8961, |
| "eval_map_75": 0.8669, |
| "eval_map_class_0": 0.8441, |
| "eval_map_large": 0.8717, |
| "eval_map_medium": 0.6392, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.7553, |
| "eval_mar_10": 0.8857, |
| "eval_mar_100": 0.9398, |
| "eval_mar_100_class_0": 0.9398, |
| "eval_mar_large": 0.9592, |
| "eval_mar_medium": 0.7923, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.5969, |
| "eval_samples_per_second": 19.403, |
| "eval_steps_per_second": 2.425, |
| "step": 2366 |
| }, |
| { |
| "epoch": 27.0, |
| "eval_loss": 0.7504961490631104, |
| "eval_map": 0.8505, |
| "eval_map_50": 0.8966, |
| "eval_map_75": 0.8745, |
| "eval_map_class_0": 0.8505, |
| "eval_map_large": 0.88, |
| "eval_map_medium": 0.6337, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.7565, |
| "eval_mar_10": 0.8857, |
| "eval_mar_100": 0.9441, |
| "eval_mar_100_class_0": 0.9441, |
| "eval_mar_large": 0.9639, |
| "eval_mar_medium": 0.7923, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.5131, |
| "eval_samples_per_second": 19.653, |
| "eval_steps_per_second": 2.457, |
| "step": 2457 |
| }, |
| { |
| "epoch": 27.47252747252747, |
| "grad_norm": 72.2485580444336, |
| "learning_rate": 4.230769230769231e-06, |
| "loss": 7.68200732421875, |
| "step": 2500 |
| }, |
| { |
| "epoch": 28.0, |
| "eval_loss": 0.7449190616607666, |
| "eval_map": 0.8533, |
| "eval_map_50": 0.9012, |
| "eval_map_75": 0.8801, |
| "eval_map_class_0": 0.8533, |
| "eval_map_large": 0.8826, |
| "eval_map_medium": 0.627, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.7553, |
| "eval_mar_10": 0.8901, |
| "eval_mar_100": 0.9416, |
| "eval_mar_100_class_0": 0.9416, |
| "eval_mar_large": 0.9626, |
| "eval_mar_medium": 0.7769, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.6251, |
| "eval_samples_per_second": 19.32, |
| "eval_steps_per_second": 2.415, |
| "step": 2548 |
| }, |
| { |
| "epoch": 29.0, |
| "eval_loss": 0.7330126166343689, |
| "eval_map": 0.8577, |
| "eval_map_50": 0.9052, |
| "eval_map_75": 0.8842, |
| "eval_map_class_0": 0.8577, |
| "eval_map_large": 0.8874, |
| "eval_map_medium": 0.6278, |
| "eval_map_small": 0.0076, |
| "eval_mar_1": 0.7571, |
| "eval_mar_10": 0.8975, |
| "eval_mar_100": 0.9497, |
| "eval_mar_100_class_0": 0.9497, |
| "eval_mar_large": 0.966, |
| "eval_mar_medium": 0.7769, |
| "eval_mar_small": 0.8, |
| "eval_runtime": 6.6188, |
| "eval_samples_per_second": 19.339, |
| "eval_steps_per_second": 2.417, |
| "step": 2639 |
| }, |
| { |
| "epoch": 30.0, |
| "eval_loss": 0.741165041923523, |
| "eval_map": 0.8559, |
| "eval_map_50": 0.9016, |
| "eval_map_75": 0.8852, |
| "eval_map_class_0": 0.8559, |
| "eval_map_large": 0.8848, |
| "eval_map_medium": 0.6332, |
| "eval_map_small": 0.0, |
| "eval_mar_1": 0.7571, |
| "eval_mar_10": 0.8957, |
| "eval_mar_100": 0.9385, |
| "eval_mar_100_class_0": 0.9385, |
| "eval_mar_large": 0.9639, |
| "eval_mar_medium": 0.7231, |
| "eval_mar_small": 0.0, |
| "eval_runtime": 6.5118, |
| "eval_samples_per_second": 19.656, |
| "eval_steps_per_second": 2.457, |
| "step": 2730 |
| }, |
| { |
| "epoch": 30.0, |
| "step": 2730, |
| "total_flos": 1.6368835442688e+18, |
| "train_loss": 11.706639954283997, |
| "train_runtime": 1986.2673, |
| "train_samples_per_second": 10.95, |
| "train_steps_per_second": 1.374 |
| } |
| ], |
| "logging_steps": 500, |
| "max_steps": 2730, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 30, |
| "save_steps": 500, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": true |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 1.6368835442688e+18, |
| "train_batch_size": 8, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|