Upload app.py with huggingface_hub
Browse files
app.py
CHANGED
|
@@ -874,9 +874,22 @@ VALIDATION = f"""
|
|
| 874 |
</div>
|
| 875 |
</div>
|
| 876 |
|
| 877 |
-
<
|
| 878 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 879 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 880 |
<div style="background:#161922;border:1px solid #252a35;border-radius:8px;overflow:hidden">
|
| 881 |
<table style="width:100%;border-collapse:collapse;font-size:0.86rem">
|
| 882 |
<thead><tr>
|
|
@@ -895,7 +908,11 @@ VALIDATION = f"""
|
|
| 895 |
<span style="color:#cbd5e1">Zero confident misclassifications across 5 unseen sites.</span>
|
| 896 |
</div>
|
| 897 |
|
| 898 |
-
<div style="
|
|
|
|
|
|
|
|
|
|
|
|
|
| 899 |
|
| 900 |
<!-- Confusion matrix (on definitive predictions only) -->
|
| 901 |
<div style="background:#161922;border:1px solid #252a35;border-radius:8px;padding:18px 20px">
|
|
|
|
| 874 |
</div>
|
| 875 |
</div>
|
| 876 |
|
| 877 |
+
<div style="margin:18px 0 8px">
|
| 878 |
+
<div style="color:#f4f4f5;font-size:0.95rem;font-weight:600;margin-bottom:4px">Demo cohort · 5 held-out sites, 10 subjects</div>
|
| 879 |
+
<div style="color:#8b95a7;font-size:0.82rem;line-height:1.6">Two subjects per site were randomly selected from the ABIDE I held-out pool. The model trained on <em>all other sites</em> was used — it has never seen any data from these institutions.</div>
|
| 880 |
+
</div>
|
| 881 |
+
<img src="data:image/png;base64,{VAL_B64}" style="width:100%;border-radius:6px;margin-bottom:22px;border:1px solid #252a35"/>
|
| 882 |
+
|
| 883 |
+
<div style="margin:0 0 8px">
|
| 884 |
+
<div style="color:#f4f4f5;font-size:0.95rem;font-weight:600;margin-bottom:4px">Full 20-fold LOSO AUC · all 1,102 subjects</div>
|
| 885 |
+
<div style="color:#8b95a7;font-size:0.82rem;line-height:1.6">Each bar is one site held out from training. AUC 0.7298 is the mean across all 20 folds — every subject appears in a test fold exactly once. Prior art uses same-site splits; this is a strictly harder evaluation.</div>
|
| 886 |
+
</div>
|
| 887 |
+
<img src="data:image/png;base64,{AUC_B64}" style="width:100%;border-radius:6px;margin-bottom:22px;border:1px solid #252a35"/>
|
| 888 |
|
| 889 |
+
<div style="margin:0 0 8px">
|
| 890 |
+
<div style="color:#f4f4f5;font-size:0.95rem;font-weight:600;margin-bottom:4px">Subject-level predictions · demo cohort</div>
|
| 891 |
+
<div style="color:#8b95a7;font-size:0.82rem;line-height:1.6">Predictions with 0.4 &lt; p &lt; 0.6 are flagged as inconclusive rather than forced to a label — surfacing borderline cases for clinical review instead of producing a confident wrong answer.</div>
|
| 892 |
+
</div>
|
| 893 |
<div style="background:#161922;border:1px solid #252a35;border-radius:8px;overflow:hidden">
|
| 894 |
<table style="width:100%;border-collapse:collapse;font-size:0.86rem">
|
| 895 |
<thead><tr>
|
|
|
|
| 908 |
<span style="color:#cbd5e1">Zero confident misclassifications across 5 unseen sites.</span>
|
| 909 |
</div>
|
| 910 |
|
| 911 |
+
<div style="margin:22px 0 8px">
|
| 912 |
+
<div style="color:#f4f4f5;font-size:0.95rem;font-weight:600;margin-bottom:4px">Diagnostic breakdown &amp; published baselines</div>
|
| 913 |
+
<div style="color:#8b95a7;font-size:0.82rem;line-height:1.6">On definitive predictions (p &gt; 0.6 or p &lt; 0.4) the model achieves 100% sensitivity and specificity on the demo cohort. Results are compared against published ABIDE benchmarks — all of which used same-site evaluation.</div>
|
| 914 |
+
</div>
|
| 915 |
+
<div style="display:grid;grid-template-columns:1fr 1fr;gap:14px">
|
| 916 |
|
| 917 |
<!-- Confusion matrix (on definitive predictions only) -->
|
| 918 |
<div style="background:#161922;border:1px solid #252a35;border-radius:8px;padding:18px 20px">
|