[ { "epoch": 1, "train_loss": 5.157754315270318, "train_tool_retrieval_accuracy": 0.8961538672447205, "train_parent_retrieval_accuracy": 0.7846153974533081, "val_tool_retrieval_accuracy": 0.5192307829856873, "val_parent_retrieval_accuracy": 0.692307710647583, "val_tool_classification_accuracy": 0.0, "val_parent_classification_accuracy": 0.3076923076923077, "learning_rate": 8.181818181818183e-06, "epoch_duration_seconds": 7.761668143000861, "best_val_tool_retrieval_accuracy": 0.5192307829856873, "best_epoch": 1, "train_parent_cross_entropy": 2.3311243984434338, "train_child_cross_entropy": 2.625902043448554, "train_parent_alignment": 0.9960288206736246, "train_child_alignment": 1.0112511979209051, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.5192307692307693, "validation/tool/silhouette_score": -0.09840114414691925, "validation/tool/global_near_overlap_rate": 0.7692307692307693, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.6923076923076923, "validation/parent/silhouette_score": -0.07535062730312347, "validation/parent/global_near_overlap_rate": 0.6153846153846154, "validation/parent/top_pair/label_a": "File System", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.5, "validation/parent/top_pair/centroid_cosine": 0.896780788898468 }, { "epoch": 2, "train_loss": 4.649685700734456, "train_tool_retrieval_accuracy": 0.8730769157409668, "train_parent_retrieval_accuracy": 0.7769230604171753, "val_tool_retrieval_accuracy": 0.5192307829856873, "val_parent_retrieval_accuracy": 0.7307692170143127, "val_tool_classification_accuracy": 0.038461538461538464, "val_parent_classification_accuracy": 0.40384615384615385, "learning_rate": 1.6363636363636366e-05, "epoch_duration_seconds": 1.7147771270028898, "best_val_tool_retrieval_accuracy": 0.5192307829856873, "best_epoch": 1, "train_parent_cross_entropy": 1.930469234784444, "train_child_cross_entropy": 2.5211688147650824, "train_parent_alignment": 0.9734141098128425, "train_child_alignment": 1.0070623556772869, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.5192307692307693, "validation/tool/silhouette_score": -0.10537859797477722, "validation/tool/global_near_overlap_rate": 0.7884615384615384, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.7307692307692307, "validation/parent/silhouette_score": -0.07874973863363266, "validation/parent/global_near_overlap_rate": 0.6538461538461539, "validation/parent/top_pair/label_a": "File System", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.44999998807907104, "validation/parent/top_pair/centroid_cosine": 0.9004660844802856 }, { "epoch": 3, "train_loss": 3.500072797139486, "train_tool_retrieval_accuracy": 0.8769230842590332, "train_parent_retrieval_accuracy": 0.7846153974533081, "val_tool_retrieval_accuracy": 0.5, "val_parent_retrieval_accuracy": 0.75, "val_tool_classification_accuracy": 0.07692307692307693, "val_parent_classification_accuracy": 0.5384615384615384, "learning_rate": 1.950738916256158e-05, "epoch_duration_seconds": 1.303288903000066, "best_val_tool_retrieval_accuracy": 0.5192307829856873, "best_epoch": 1, "train_parent_cross_entropy": 1.39888596534729, "train_child_cross_entropy": 1.9089170164532132, "train_parent_alignment": 0.9373632669448853, "train_child_alignment": 0.9853348599539863, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.5, "validation/tool/silhouette_score": -0.10424783825874329, "validation/tool/global_near_overlap_rate": 0.8076923076923077, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.75, "validation/parent/silhouette_score": -0.08332549035549164, "validation/parent/global_near_overlap_rate": 0.6346153846153846, "validation/parent/top_pair/label_a": "File System", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.45000001788139343, "validation/parent/top_pair/centroid_cosine": 0.8934528231620789 }, { "epoch": 4, "train_loss": 2.730307208167182, "train_tool_retrieval_accuracy": 0.8961538672447205, "train_parent_retrieval_accuracy": 0.807692289352417, "val_tool_retrieval_accuracy": 0.5384615659713745, "val_parent_retrieval_accuracy": 0.7692307829856873, "val_tool_classification_accuracy": 0.17307692307692307, "val_parent_classification_accuracy": 0.7115384615384616, "learning_rate": 1.8620689655172415e-05, "epoch_duration_seconds": 1.3154947980001452, "best_val_tool_retrieval_accuracy": 0.5384615659713745, "best_epoch": 4, "train_parent_cross_entropy": 1.0005325476328533, "train_child_cross_entropy": 1.5424939393997192, "train_parent_alignment": 0.9058522052235074, "train_child_alignment": 0.9669552577866448, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.5384615384615384, "validation/tool/silhouette_score": -0.09466496855020523, "validation/tool/global_near_overlap_rate": 0.7884615384615384, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.7692307692307693, "validation/parent/silhouette_score": -0.0762428417801857, "validation/parent/global_near_overlap_rate": 0.5769230769230769, "validation/parent/top_pair/label_a": "Computation", "validation/parent/top_pair/label_b": "Information Retrieval", "validation/parent/top_pair/mutual_overlap": 0.44999998807907104, "validation/parent/top_pair/centroid_cosine": 0.8568636178970337 }, { "epoch": 5, "train_loss": 2.2074906561109753, "train_tool_retrieval_accuracy": 0.9076923131942749, "train_parent_retrieval_accuracy": 0.8461538553237915, "val_tool_retrieval_accuracy": 0.5961538553237915, "val_parent_retrieval_accuracy": 0.7692307829856873, "val_tool_classification_accuracy": 0.3076923076923077, "val_parent_classification_accuracy": 0.75, "learning_rate": 1.7733990147783254e-05, "epoch_duration_seconds": 1.333961725998961, "best_val_tool_retrieval_accuracy": 0.5961538553237915, "best_epoch": 5, "train_parent_cross_entropy": 0.6690340472592248, "train_child_cross_entropy": 1.3546243641111586, "train_parent_alignment": 0.8832898471090529, "train_child_alignment": 0.9550319446457757, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.5961538461538461, "validation/tool/silhouette_score": -0.0741507038474083, "validation/tool/global_near_overlap_rate": 0.7307692307692307, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.7692307692307693, "validation/parent/silhouette_score": -0.06206924095749855, "validation/parent/global_near_overlap_rate": 0.38461538461538464, "validation/parent/top_pair/label_a": "Computation", "validation/parent/top_pair/label_b": "Information Retrieval", "validation/parent/top_pair/mutual_overlap": 0.3499999940395355, "validation/parent/top_pair/centroid_cosine": 0.8201030492782593 }, { "epoch": 6, "train_loss": 1.5056148568789165, "train_tool_retrieval_accuracy": 0.9346153736114502, "train_parent_retrieval_accuracy": 0.8807692527770996, "val_tool_retrieval_accuracy": 0.6538461446762085, "val_parent_retrieval_accuracy": 0.807692289352417, "val_tool_classification_accuracy": 0.4423076923076923, "val_parent_classification_accuracy": 0.7884615384615384, "learning_rate": 1.684729064039409e-05, "epoch_duration_seconds": 2.3185505299989018, "best_val_tool_retrieval_accuracy": 0.6538461446762085, "best_epoch": 6, "train_parent_cross_entropy": 0.46070420576466453, "train_child_cross_entropy": 0.8664655850993263, "train_parent_alignment": 0.8618110550774468, "train_child_alignment": 0.9226394295692444, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.6538461538461539, "validation/tool/silhouette_score": -0.03729083389043808, "validation/tool/global_near_overlap_rate": 0.6730769230769231, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.8076923076923077, "validation/parent/silhouette_score": -0.03389709070324898, "validation/parent/global_near_overlap_rate": 0.3269230769230769, "validation/parent/top_pair/label_a": "Information Retrieval", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.21666666865348816, "validation/parent/top_pair/centroid_cosine": 0.8001468181610107 }, { "epoch": 7, "train_loss": 1.2175099054972331, "train_tool_retrieval_accuracy": 0.9461538195610046, "train_parent_retrieval_accuracy": 0.9115384817123413, "val_tool_retrieval_accuracy": 0.7115384340286255, "val_parent_retrieval_accuracy": 0.8269230723381042, "val_tool_classification_accuracy": 0.5, "val_parent_classification_accuracy": 0.8076923076923077, "learning_rate": 1.5960591133004928e-05, "epoch_duration_seconds": 1.3010024789982708, "best_val_tool_retrieval_accuracy": 0.7115384340286255, "best_epoch": 7, "train_parent_cross_entropy": 0.34940624402629006, "train_child_cross_entropy": 0.6940820945633782, "train_parent_alignment": 0.8370489080746969, "train_child_alignment": 0.9031666649712456, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.7115384615384616, "validation/tool/silhouette_score": -0.012219934724271297, "validation/tool/global_near_overlap_rate": 0.6346153846153846, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.8269230769230769, "validation/parent/silhouette_score": -0.012261098250746727, "validation/parent/global_near_overlap_rate": 0.3076923076923077, "validation/parent/top_pair/label_a": "Computation", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.20000000298023224, "validation/parent/top_pair/centroid_cosine": 0.7784289121627808 }, { "epoch": 8, "train_loss": 0.92488608095381, "train_tool_retrieval_accuracy": 0.9576923251152039, "train_parent_retrieval_accuracy": 0.9230769276618958, "val_tool_retrieval_accuracy": 0.6730769276618958, "val_parent_retrieval_accuracy": 0.8269230723381042, "val_tool_classification_accuracy": 0.5961538461538461, "val_parent_classification_accuracy": 0.8461538461538461, "learning_rate": 1.5073891625615764e-05, "epoch_duration_seconds": 1.3682630530020106, "best_val_tool_retrieval_accuracy": 0.7115384340286255, "best_epoch": 7, "train_parent_cross_entropy": 0.23755988809797499, "train_child_cross_entropy": 0.5170698364575704, "train_parent_alignment": 0.8208589951197306, "train_child_alignment": 0.8817045291264852, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.6730769230769231, "validation/tool/silhouette_score": 0.004278222564607859, "validation/tool/global_near_overlap_rate": 0.5769230769230769, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.8269230769230769, "validation/parent/silhouette_score": 0.0034682746045291424, "validation/parent/global_near_overlap_rate": 0.2692307692307692, "validation/parent/top_pair/label_a": "Computation", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.20000000298023224, "validation/parent/top_pair/centroid_cosine": 0.7186568975448608 }, { "epoch": 9, "train_loss": 0.7474626302719116, "train_tool_retrieval_accuracy": 0.9653846025466919, "train_parent_retrieval_accuracy": 0.9384615421295166, "val_tool_retrieval_accuracy": 0.6730769276618958, "val_parent_retrieval_accuracy": 0.8461538553237915, "val_tool_classification_accuracy": 0.6346153846153846, "val_parent_classification_accuracy": 0.8461538461538461, "learning_rate": 1.4187192118226602e-05, "epoch_duration_seconds": 2.020530112000415, "best_val_tool_retrieval_accuracy": 0.7115384340286255, "best_epoch": 7, "train_parent_cross_entropy": 0.19186763796541426, "train_child_cross_entropy": 0.38965080512894523, "train_parent_alignment": 0.800107995669047, "train_child_alignment": 0.8593339323997498, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.6730769230769231, "validation/tool/silhouette_score": 0.02403559535741806, "validation/tool/global_near_overlap_rate": 0.5384615384615384, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.8461538461538461, "validation/parent/silhouette_score": 0.017015840858221054, "validation/parent/global_near_overlap_rate": 0.25, "validation/parent/top_pair/label_a": "Computation", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.15000000596046448, "validation/parent/top_pair/centroid_cosine": 0.6582691669464111 }, { "epoch": 10, "train_loss": 0.560799671543969, "train_tool_retrieval_accuracy": 0.9730769395828247, "train_parent_retrieval_accuracy": 0.949999988079071, "val_tool_retrieval_accuracy": 0.692307710647583, "val_parent_retrieval_accuracy": 0.9038461446762085, "val_tool_classification_accuracy": 0.6538461538461539, "val_parent_classification_accuracy": 0.8461538461538461, "learning_rate": 1.330049261083744e-05, "epoch_duration_seconds": 1.3082187740001245, "best_val_tool_retrieval_accuracy": 0.7115384340286255, "best_epoch": 7, "train_parent_cross_entropy": 0.11244031579958068, "train_child_cross_entropy": 0.28610827691025204, "train_parent_alignment": 0.7726466457049052, "train_child_alignment": 0.8498640192879571, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.6923076923076923, "validation/tool/silhouette_score": 0.03721160441637039, "validation/tool/global_near_overlap_rate": 0.4423076923076923, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.9038461538461539, "validation/parent/silhouette_score": 0.03269634023308754, "validation/parent/global_near_overlap_rate": 0.23076923076923078, "validation/parent/top_pair/label_a": "Computation", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.15000000596046448, "validation/parent/top_pair/centroid_cosine": 0.6069332361221313 }, { "epoch": 11, "train_loss": 0.4488269024425083, "train_tool_retrieval_accuracy": 0.9769230484962463, "train_parent_retrieval_accuracy": 0.9653846025466919, "val_tool_retrieval_accuracy": 0.7307692170143127, "val_parent_retrieval_accuracy": 0.9230769276618958, "val_tool_classification_accuracy": 0.6923076923076923, "val_parent_classification_accuracy": 0.8653846153846154, "learning_rate": 1.2413793103448277e-05, "epoch_duration_seconds": 1.3191320069963695, "best_val_tool_retrieval_accuracy": 0.7307692170143127, "best_epoch": 11, "train_parent_cross_entropy": 0.09428231045603752, "train_child_cross_entropy": 0.19627481864558327, "train_parent_alignment": 0.7582567930221558, "train_child_alignment": 0.8244408766428629, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.7307692307692307, "validation/tool/silhouette_score": 0.04294625297188759, "validation/tool/global_near_overlap_rate": 0.40384615384615385, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.9230769230769231, "validation/parent/silhouette_score": 0.04077092185616493, "validation/parent/global_near_overlap_rate": 0.25, "validation/parent/top_pair/label_a": "Computation", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.15000000596046448, "validation/parent/top_pair/centroid_cosine": 0.5526243448257446 }, { "epoch": 12, "train_loss": 0.38162952330377364, "train_tool_retrieval_accuracy": 0.9846153855323792, "train_parent_retrieval_accuracy": 0.9730769395828247, "val_tool_retrieval_accuracy": 0.7692307829856873, "val_parent_retrieval_accuracy": 0.9038461446762085, "val_tool_classification_accuracy": 0.6923076923076923, "val_parent_classification_accuracy": 0.8653846153846154, "learning_rate": 1.1527093596059114e-05, "epoch_duration_seconds": 1.3753753389974008, "best_val_tool_retrieval_accuracy": 0.7692307829856873, "best_epoch": 12, "train_parent_cross_entropy": 0.07771683939629132, "train_child_cross_entropy": 0.1482034358713362, "train_parent_alignment": 0.7491327060593499, "train_child_alignment": 0.807959775129954, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.7692307692307693, "validation/tool/silhouette_score": 0.05038919299840927, "validation/tool/global_near_overlap_rate": 0.38461538461538464, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.9038461538461539, "validation/parent/silhouette_score": 0.04405605047941208, "validation/parent/global_near_overlap_rate": 0.23076923076923078, "validation/parent/top_pair/label_a": "Information Retrieval", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.13333334028720856, "validation/parent/top_pair/centroid_cosine": 0.3341650366783142 }, { "epoch": 13, "train_loss": 0.34940913650724625, "train_tool_retrieval_accuracy": 0.9846153855323792, "train_parent_retrieval_accuracy": 0.9807692170143127, "val_tool_retrieval_accuracy": 0.7692307829856873, "val_parent_retrieval_accuracy": 0.9038461446762085, "val_tool_classification_accuracy": 0.7115384615384616, "val_parent_classification_accuracy": 0.8653846153846154, "learning_rate": 1.0640394088669953e-05, "epoch_duration_seconds": 1.9898250920014107, "best_val_tool_retrieval_accuracy": 0.7692307829856873, "best_epoch": 12, "train_parent_cross_entropy": 0.05860658983389536, "train_child_cross_entropy": 0.1373151573869917, "train_parent_alignment": 0.7339069644610087, "train_child_alignment": 0.8009669250912137, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.7692307692307693, "validation/tool/silhouette_score": 0.06007323041558266, "validation/tool/global_near_overlap_rate": 0.3076923076923077, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.9038461538461539, "validation/parent/silhouette_score": 0.04259569197893143, "validation/parent/global_near_overlap_rate": 0.25, "validation/parent/top_pair/label_a": "Information Retrieval", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.13333334028720856, "validation/parent/top_pair/centroid_cosine": 0.2915511727333069 }, { "epoch": 14, "train_loss": 0.3008048352268007, "train_tool_retrieval_accuracy": 0.9884615540504456, "train_parent_retrieval_accuracy": 0.9923076629638672, "val_tool_retrieval_accuracy": 0.75, "val_parent_retrieval_accuracy": 0.9038461446762085, "val_tool_classification_accuracy": 0.7115384615384616, "val_parent_classification_accuracy": 0.8461538461538461, "learning_rate": 9.75369458128079e-06, "epoch_duration_seconds": 1.3389712629941641, "best_val_tool_retrieval_accuracy": 0.7692307829856873, "best_epoch": 12, "train_parent_cross_entropy": 0.04300534518228637, "train_child_cross_entropy": 0.10681118857529429, "train_parent_alignment": 0.7165413432651095, "train_child_alignment": 0.7933415704303317, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.75, "validation/tool/silhouette_score": 0.063718281686306, "validation/tool/global_near_overlap_rate": 0.3269230769230769, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.9038461538461539, "validation/parent/silhouette_score": 0.05269314721226692, "validation/parent/global_near_overlap_rate": 0.21153846153846154, "validation/parent/top_pair/label_a": "Information Retrieval", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.13333334028720856, "validation/parent/top_pair/centroid_cosine": 0.25321274995803833 }, { "epoch": 15, "train_loss": 0.2826983431975047, "train_tool_retrieval_accuracy": 0.9923076629638672, "train_parent_retrieval_accuracy": 0.9961538314819336, "val_tool_retrieval_accuracy": 0.7692307829856873, "val_parent_retrieval_accuracy": 0.9038461446762085, "val_tool_classification_accuracy": 0.7115384615384616, "val_parent_classification_accuracy": 0.8653846153846154, "learning_rate": 8.866995073891627e-06, "epoch_duration_seconds": 1.3003545039973687, "best_val_tool_retrieval_accuracy": 0.7692307829856873, "best_epoch": 12, "train_parent_cross_entropy": 0.04354299708373017, "train_child_cross_entropy": 0.08995897322893143, "train_parent_alignment": 0.7072291970252991, "train_child_alignment": 0.784734480910831, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.7692307692307693, "validation/tool/silhouette_score": 0.06840348988771439, "validation/tool/global_near_overlap_rate": 0.3269230769230769, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.9038461538461539, "validation/parent/silhouette_score": 0.054581109434366226, "validation/parent/global_near_overlap_rate": 0.19230769230769232, "validation/parent/top_pair/label_a": "Information Retrieval", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.13333334028720856, "validation/parent/top_pair/centroid_cosine": 0.22527211904525757 }, { "epoch": 16, "train_loss": 0.24080454806486765, "train_tool_retrieval_accuracy": 0.9961538314819336, "train_parent_retrieval_accuracy": 1.0, "val_tool_retrieval_accuracy": 0.75, "val_parent_retrieval_accuracy": 0.9038461446762085, "val_tool_classification_accuracy": 0.7307692307692307, "val_parent_classification_accuracy": 0.8846153846153846, "learning_rate": 7.980295566502464e-06, "epoch_duration_seconds": 2.0077261100013857, "best_val_tool_retrieval_accuracy": 0.7692307829856873, "best_epoch": 12, "train_parent_cross_entropy": 0.032339607261949115, "train_child_cross_entropy": 0.060213643643591136, "train_parent_alignment": 0.7098994188838534, "train_child_alignment": 0.7726135386361016, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.75, "validation/tool/silhouette_score": 0.07184359431266785, "validation/tool/global_near_overlap_rate": 0.3076923076923077, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.9038461538461539, "validation/parent/silhouette_score": 0.05527704581618309, "validation/parent/global_near_overlap_rate": 0.17307692307692307, "validation/parent/top_pair/label_a": "Information Retrieval", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.13333334028720856, "validation/parent/top_pair/centroid_cosine": 0.20723675191402435 }, { "epoch": 17, "train_loss": 0.21917742159631518, "train_tool_retrieval_accuracy": 0.9961538314819336, "train_parent_retrieval_accuracy": 1.0, "val_tool_retrieval_accuracy": 0.7692307829856873, "val_parent_retrieval_accuracy": 0.9038461446762085, "val_tool_classification_accuracy": 0.75, "val_parent_classification_accuracy": 0.9038461538461539, "learning_rate": 7.093596059113301e-06, "epoch_duration_seconds": 1.297605815998395, "best_val_tool_retrieval_accuracy": 0.7692307829856873, "best_epoch": 12, "train_parent_cross_entropy": 0.019533097743988037, "train_child_cross_entropy": 0.05424659254236354, "train_parent_alignment": 0.6934020320574442, "train_child_alignment": 0.7605752746264139, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.7692307692307693, "validation/tool/silhouette_score": 0.0746900886297226, "validation/tool/global_near_overlap_rate": 0.3076923076923077, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.9038461538461539, "validation/parent/silhouette_score": 0.06387268751859665, "validation/parent/global_near_overlap_rate": 0.17307692307692307, "validation/parent/top_pair/label_a": "Information Retrieval", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.13333334028720856, "validation/parent/top_pair/centroid_cosine": 0.17757676541805267 }, { "epoch": 18, "train_loss": 0.2239979604880015, "train_tool_retrieval_accuracy": 0.9961538314819336, "train_parent_retrieval_accuracy": 1.0, "val_tool_retrieval_accuracy": 0.7692307829856873, "val_parent_retrieval_accuracy": 0.9038461446762085, "val_tool_classification_accuracy": 0.75, "val_parent_classification_accuracy": 0.9038461538461539, "learning_rate": 6.206896551724138e-06, "epoch_duration_seconds": 1.3268793469978846, "best_val_tool_retrieval_accuracy": 0.7692307829856873, "best_epoch": 12, "train_parent_cross_entropy": 0.021013346293734178, "train_child_cross_entropy": 0.057985921286874346, "train_parent_alignment": 0.6833301186561584, "train_child_alignment": 0.766656776269277, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.7692307692307693, "validation/tool/silhouette_score": 0.07859379798173904, "validation/tool/global_near_overlap_rate": 0.3269230769230769, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.9038461538461539, "validation/parent/silhouette_score": 0.06772759556770325, "validation/parent/global_near_overlap_rate": 0.15384615384615385, "validation/parent/top_pair/label_a": "Information Retrieval", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.13333334028720856, "validation/parent/top_pair/centroid_cosine": 0.15037700533866882 }, { "epoch": 19, "train_loss": 0.2052950064341227, "train_tool_retrieval_accuracy": 0.9961538314819336, "train_parent_retrieval_accuracy": 1.0, "val_tool_retrieval_accuracy": 0.7884615659713745, "val_parent_retrieval_accuracy": 0.9038461446762085, "val_tool_classification_accuracy": 0.7692307692307693, "val_parent_classification_accuracy": 0.9038461538461539, "learning_rate": 5.320197044334976e-06, "epoch_duration_seconds": 1.2910668359982083, "best_val_tool_retrieval_accuracy": 0.7884615659713745, "best_epoch": 19, "train_parent_cross_entropy": 0.01799314386314816, "train_child_cross_entropy": 0.04309294786718157, "train_parent_alignment": 0.6805168125364516, "train_child_alignment": 0.7615723013877869, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.7884615384615384, "validation/tool/silhouette_score": 0.08252660185098648, "validation/tool/global_near_overlap_rate": 0.3269230769230769, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.9038461538461539, "validation/parent/silhouette_score": 0.0690055787563324, "validation/parent/global_near_overlap_rate": 0.17307692307692307, "validation/parent/top_pair/label_a": "Computation", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.10000000149011612, "validation/parent/top_pair/centroid_cosine": 0.3109726309776306 }, { "epoch": 20, "train_loss": 0.1988206985923979, "train_tool_retrieval_accuracy": 0.9961538314819336, "train_parent_retrieval_accuracy": 0.9961538314819336, "val_tool_retrieval_accuracy": 0.7884615659713745, "val_parent_retrieval_accuracy": 0.9038461446762085, "val_tool_classification_accuracy": 0.75, "val_parent_classification_accuracy": 0.8846153846153846, "learning_rate": 4.4334975369458135e-06, "epoch_duration_seconds": 1.9614776899979915, "best_val_tool_retrieval_accuracy": 0.7884615659713745, "best_epoch": 19, "train_parent_cross_entropy": 0.018124247073299356, "train_child_cross_entropy": 0.036885734647512436, "train_parent_alignment": 0.6738381319575839, "train_child_alignment": 0.7642690075768365, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.7884615384615384, "validation/tool/silhouette_score": 0.08244223147630692, "validation/tool/global_near_overlap_rate": 0.3076923076923077, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.9038461538461539, "validation/parent/silhouette_score": 0.07241550087928772, "validation/parent/global_near_overlap_rate": 0.17307692307692307, "validation/parent/top_pair/label_a": "Computation", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.10000000149011612, "validation/parent/top_pair/centroid_cosine": 0.2947779893875122 }, { "epoch": 21, "train_loss": 0.19204935597048867, "train_tool_retrieval_accuracy": 0.9961538314819336, "train_parent_retrieval_accuracy": 0.9961538314819336, "val_tool_retrieval_accuracy": 0.7884615659713745, "val_parent_retrieval_accuracy": 0.9038461446762085, "val_tool_classification_accuracy": 0.7307692307692307, "val_parent_classification_accuracy": 0.8653846153846154, "learning_rate": 3.5467980295566506e-06, "epoch_duration_seconds": 1.3060714730017935, "best_val_tool_retrieval_accuracy": 0.7884615659713745, "best_epoch": 19, "train_parent_cross_entropy": 0.017510208094285593, "train_child_cross_entropy": 0.03250948815710015, "train_parent_alignment": 0.6696353885862563, "train_child_alignment": 0.7506611810790168, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.7884615384615384, "validation/tool/silhouette_score": 0.0829564779996872, "validation/tool/global_near_overlap_rate": 0.3076923076923077, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.9038461538461539, "validation/parent/silhouette_score": 0.07466989010572433, "validation/parent/global_near_overlap_rate": 0.17307692307692307, "validation/parent/top_pair/label_a": "Computation", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.10000000149011612, "validation/parent/top_pair/centroid_cosine": 0.28267771005630493 }, { "epoch": 22, "train_loss": 0.1794411970509423, "train_tool_retrieval_accuracy": 0.9961538314819336, "train_parent_retrieval_accuracy": 1.0, "val_tool_retrieval_accuracy": 0.7884615659713745, "val_parent_retrieval_accuracy": 0.9038461446762085, "val_tool_classification_accuracy": 0.75, "val_parent_classification_accuracy": 0.9038461538461539, "learning_rate": 2.660098522167488e-06, "epoch_duration_seconds": 1.3172019779958646, "best_val_tool_retrieval_accuracy": 0.7884615659713745, "best_epoch": 19, "train_parent_cross_entropy": 0.014070622726447053, "train_child_cross_entropy": 0.026905071611205738, "train_parent_alignment": 0.6510205997361077, "train_child_alignment": 0.733634372552236, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.7884615384615384, "validation/tool/silhouette_score": 0.08473511040210724, "validation/tool/global_near_overlap_rate": 0.3076923076923077, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.9038461538461539, "validation/parent/silhouette_score": 0.0743960365653038, "validation/parent/global_near_overlap_rate": 0.17307692307692307, "validation/parent/top_pair/label_a": "Computation", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.10000000149011612, "validation/parent/top_pair/centroid_cosine": 0.2789847254753113 }, { "epoch": 23, "train_loss": 0.18609628081321716, "train_tool_retrieval_accuracy": 0.9961538314819336, "train_parent_retrieval_accuracy": 1.0, "val_tool_retrieval_accuracy": 0.7884615659713745, "val_parent_retrieval_accuracy": 0.9038461446762085, "val_tool_classification_accuracy": 0.75, "val_parent_classification_accuracy": 0.9038461538461539, "learning_rate": 1.7733990147783253e-06, "epoch_duration_seconds": 1.2904535019988543, "best_val_tool_retrieval_accuracy": 0.7884615659713745, "best_epoch": 19, "train_parent_cross_entropy": 0.01543032807401485, "train_child_cross_entropy": 0.030358499122990504, "train_parent_alignment": 0.6581042408943176, "train_child_alignment": 0.7449702355596755, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.7884615384615384, "validation/tool/silhouette_score": 0.08613520115613937, "validation/tool/global_near_overlap_rate": 0.3076923076923077, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.9038461538461539, "validation/parent/silhouette_score": 0.07368122041225433, "validation/parent/global_near_overlap_rate": 0.17307692307692307, "validation/parent/top_pair/label_a": "Computation", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.10000000149011612, "validation/parent/top_pair/centroid_cosine": 0.277476966381073 }, { "epoch": 24, "train_loss": 0.1794088515970442, "train_tool_retrieval_accuracy": 0.9961538314819336, "train_parent_retrieval_accuracy": 1.0, "val_tool_retrieval_accuracy": 0.7884615659713745, "val_parent_retrieval_accuracy": 0.9038461446762085, "val_tool_classification_accuracy": 0.7692307692307693, "val_parent_classification_accuracy": 0.9230769230769231, "learning_rate": 8.866995073891626e-07, "epoch_duration_seconds": 1.3085527120056213, "best_val_tool_retrieval_accuracy": 0.7884615659713745, "best_epoch": 19, "train_parent_cross_entropy": 0.01522777270939615, "train_child_cross_entropy": 0.025616472793949976, "train_parent_alignment": 0.6548879875077142, "train_child_alignment": 0.7307580312093099, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.7884615384615384, "validation/tool/silhouette_score": 0.08699968457221985, "validation/tool/global_near_overlap_rate": 0.3076923076923077, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.9038461538461539, "validation/parent/silhouette_score": 0.07333475351333618, "validation/parent/global_near_overlap_rate": 0.17307692307692307, "validation/parent/top_pair/label_a": "Computation", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.10000000149011612, "validation/parent/top_pair/centroid_cosine": 0.2760659158229828 }, { "epoch": 25, "train_loss": 0.18173575732443067, "train_tool_retrieval_accuracy": 0.9961538314819336, "train_parent_retrieval_accuracy": 1.0, "val_tool_retrieval_accuracy": 0.7884615659713745, "val_parent_retrieval_accuracy": 0.9038461446762085, "val_tool_classification_accuracy": 0.75, "val_parent_classification_accuracy": 0.9038461538461539, "learning_rate": 0.0, "epoch_duration_seconds": 1.3227032190043246, "best_val_tool_retrieval_accuracy": 0.7884615659713745, "best_epoch": 19, "train_parent_cross_entropy": 0.01568867434333596, "train_child_cross_entropy": 0.027332179869214695, "train_parent_alignment": 0.6537897917959425, "train_child_alignment": 0.733359158039093, "validation/tool/diagnostic_sample_size": 52, "validation/tool/label_count": 26, "validation/tool/subset_retrieval_accuracy": 0.7884615384615384, "validation/tool/silhouette_score": 0.08730607479810715, "validation/tool/global_near_overlap_rate": 0.3076923076923077, "validation/parent/diagnostic_sample_size": 52, "validation/parent/label_count": 6, "validation/parent/subset_retrieval_accuracy": 0.9038461538461539, "validation/parent/silhouette_score": 0.07345665991306305, "validation/parent/global_near_overlap_rate": 0.17307692307692307, "validation/parent/top_pair/label_a": "Computation", "validation/parent/top_pair/label_b": "Memory", "validation/parent/top_pair/mutual_overlap": 0.10000000149011612, "validation/parent/top_pair/centroid_cosine": 0.27413174510002136 } ]