Upload 44 files
Browse files- .gitattributes +4 -0
- mobilenetv2/README.md +13 -0
- mobilenetv2/config_resolved.yml +61 -0
- mobilenetv2/history.json +198 -0
- mobilenetv2/inference_config.json +99 -0
- mobilenetv2/metrics_test.json +38 -0
- mobilenetv2/metrics_val.json +39 -0
- mobilenetv2/onnx/model.onnx +3 -0
- mobilenetv2/onnx/model.onnx.data +3 -0
- mobilenetv2/pr_curve_val.png +0 -0
- mobilenetv2/preprocess.json +17 -0
- mobilenetv2/roc_curve_val.png +0 -0
- mobilenetv3_large/README.md +13 -0
- mobilenetv3_large/config_resolved.yml +61 -0
- mobilenetv3_large/history.json +100 -0
- mobilenetv3_large/inference_config.json +99 -0
- mobilenetv3_large/metrics_test.json +38 -0
- mobilenetv3_large/metrics_val.json +39 -0
- mobilenetv3_large/onnx/model.onnx +3 -0
- mobilenetv3_large/onnx/model.onnx.data +3 -0
- mobilenetv3_large/pr_curve_val.png +0 -0
- mobilenetv3_large/preprocess.json +17 -0
- mobilenetv3_large/roc_curve_val.png +0 -0
- mobilenetv3_small/README.md +13 -0
- mobilenetv3_small/config_resolved.yml +61 -0
- mobilenetv3_small/history.json +142 -0
- mobilenetv3_small/inference_config.json +99 -0
- mobilenetv3_small/metrics_test.json +38 -0
- mobilenetv3_small/metrics_val.json +39 -0
- mobilenetv3_small/onnx/model.onnx +3 -0
- mobilenetv3_small/onnx/model.onnx.data +3 -0
- mobilenetv3_small/pr_curve_val.png +0 -0
- mobilenetv3_small/preprocess.json +17 -0
- mobilenetv3_small/roc_curve_val.png +0 -0
- mobilevitv2/README.md +13 -0
- mobilevitv2/config_resolved.yml +62 -0
- mobilevitv2/history.json +240 -0
- mobilevitv2/inference_config.json +99 -0
- mobilevitv2/metrics_test.json +38 -0
- mobilevitv2/metrics_val.json +39 -0
- mobilevitv2/onnx/model.onnx +3 -0
- mobilevitv2/onnx/model.onnx.data +3 -0
- mobilevitv2/pr_curve_val.png +0 -0
- mobilevitv2/preprocess.json +17 -0
- mobilevitv2/roc_curve_val.png +0 -0
.gitattributes
CHANGED
|
@@ -46,3 +46,7 @@ assets/not_illuminated/4.jpg filter=lfs diff=lfs merge=lfs -text
|
|
| 46 |
assets/not_illuminated/5.png filter=lfs diff=lfs merge=lfs -text
|
| 47 |
assets/not_illuminated/6.jpg filter=lfs diff=lfs merge=lfs -text
|
| 48 |
assets/odil-logo.png filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 46 |
assets/not_illuminated/5.png filter=lfs diff=lfs merge=lfs -text
|
| 47 |
assets/not_illuminated/6.jpg filter=lfs diff=lfs merge=lfs -text
|
| 48 |
assets/odil-logo.png filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
mobilenetv2/onnx/model.onnx.data filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
mobilenetv3_large/onnx/model.onnx.data filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
mobilenetv3_small/onnx/model.onnx.data filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
mobilevitv2/onnx/model.onnx.data filter=lfs diff=lfs merge=lfs -text
|
mobilenetv2/README.md
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Run artefacts: run_20260228_173634_timm_mobilenetv2_100.ra_in1k
|
| 2 |
+
|
| 3 |
+
This folder is **uploadable as-is** to the Hugging Face Hub.
|
| 4 |
+
|
| 5 |
+
## Files
|
| 6 |
+
- `onnx/model.onnx`: single-file ONNX model
|
| 7 |
+
- `preprocess.json`: resize/normalize info
|
| 8 |
+
- `inference_config.json`: threshold + labels + IO names
|
| 9 |
+
- `metrics_val.json`, `metrics_test.json`
|
| 10 |
+
- `pr_curve_val.png`, `roc_curve_val.png`
|
| 11 |
+
|
| 12 |
+
## Quick inference (Python)
|
| 13 |
+
Use `scripts/infer_local.py` or `scripts/infer_hf.py`.
|
mobilenetv2/config_resolved.yml
ADDED
|
@@ -0,0 +1,61 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
run:
|
| 2 |
+
out_root: artefacts
|
| 3 |
+
name: null
|
| 4 |
+
seed: 42
|
| 5 |
+
device: auto
|
| 6 |
+
num_workers: 0
|
| 7 |
+
early_stopping_patience: 5
|
| 8 |
+
metric_for_best: ap
|
| 9 |
+
data:
|
| 10 |
+
source: local
|
| 11 |
+
local:
|
| 12 |
+
root: dataset
|
| 13 |
+
splits:
|
| 14 |
+
train: train
|
| 15 |
+
val: val
|
| 16 |
+
test: test
|
| 17 |
+
classes:
|
| 18 |
+
negative: non_illustration
|
| 19 |
+
positive: illustration
|
| 20 |
+
hf:
|
| 21 |
+
dataset: null
|
| 22 |
+
image_column: image
|
| 23 |
+
label_column: label
|
| 24 |
+
splits:
|
| 25 |
+
train: train
|
| 26 |
+
val: validation
|
| 27 |
+
test: test
|
| 28 |
+
label_names:
|
| 29 |
+
- '0'
|
| 30 |
+
- '1'
|
| 31 |
+
model:
|
| 32 |
+
backend: timm
|
| 33 |
+
name: mobilenetv2_100.ra_in1k
|
| 34 |
+
pretrained: true
|
| 35 |
+
freeze_backbone: false
|
| 36 |
+
preprocess:
|
| 37 |
+
mode: auto
|
| 38 |
+
img_size: 224
|
| 39 |
+
mean:
|
| 40 |
+
- 0.485
|
| 41 |
+
- 0.456
|
| 42 |
+
- 0.406
|
| 43 |
+
std:
|
| 44 |
+
- 0.229
|
| 45 |
+
- 0.224
|
| 46 |
+
- 0.225
|
| 47 |
+
augment:
|
| 48 |
+
enabled: true
|
| 49 |
+
hflip: true
|
| 50 |
+
rotation_deg: 5
|
| 51 |
+
jitter:
|
| 52 |
+
brightness: 0.12
|
| 53 |
+
contrast: 0.12
|
| 54 |
+
saturation: 0.08
|
| 55 |
+
hue: 0.02
|
| 56 |
+
train:
|
| 57 |
+
epochs: 15
|
| 58 |
+
batch_size: 32
|
| 59 |
+
lr: 3e-4
|
| 60 |
+
export:
|
| 61 |
+
opset: 18
|
mobilenetv2/history.json
ADDED
|
@@ -0,0 +1,198 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"epoch": 1,
|
| 4 |
+
"train_loss": 0.4656901870938865,
|
| 5 |
+
"val_loss": 0.12333274091698902,
|
| 6 |
+
"ap": 0.99714547458157,
|
| 7 |
+
"auc": 0.9969433719433719,
|
| 8 |
+
"thr": 0.9971259236335754,
|
| 9 |
+
"p@0.5": 0.9557522123893806,
|
| 10 |
+
"r@0.5": 0.9642857142857143,
|
| 11 |
+
"f1@0.5": 0.96,
|
| 12 |
+
"p@thr": 1.0,
|
| 13 |
+
"r@thr": 0.9464285714285714,
|
| 14 |
+
"f1@thr": 0.9724770642201835
|
| 15 |
+
},
|
| 16 |
+
{
|
| 17 |
+
"epoch": 2,
|
| 18 |
+
"train_loss": 0.10773226243591952,
|
| 19 |
+
"val_loss": 0.11393067031193434,
|
| 20 |
+
"ap": 0.9976798953329111,
|
| 21 |
+
"auc": 0.9973455598455598,
|
| 22 |
+
"thr": 0.9217178821563721,
|
| 23 |
+
"p@0.5": 0.9646017699115044,
|
| 24 |
+
"r@0.5": 0.9732142857142857,
|
| 25 |
+
"f1@0.5": 0.9688888888888889,
|
| 26 |
+
"p@thr": 0.990909090909091,
|
| 27 |
+
"r@thr": 0.9732142857142857,
|
| 28 |
+
"f1@thr": 0.9819819819819819
|
| 29 |
+
},
|
| 30 |
+
{
|
| 31 |
+
"epoch": 3,
|
| 32 |
+
"train_loss": 0.04070160786637423,
|
| 33 |
+
"val_loss": 0.03605190674483083,
|
| 34 |
+
"ap": 0.9994047619047619,
|
| 35 |
+
"auc": 0.9993564993564993,
|
| 36 |
+
"thr": 0.878259539604187,
|
| 37 |
+
"p@0.5": 1.0,
|
| 38 |
+
"r@0.5": 0.9910714285714286,
|
| 39 |
+
"f1@0.5": 0.9955156950672646,
|
| 40 |
+
"p@thr": 1.0,
|
| 41 |
+
"r@thr": 0.9910714285714286,
|
| 42 |
+
"f1@thr": 0.9955156950672646
|
| 43 |
+
},
|
| 44 |
+
{
|
| 45 |
+
"epoch": 4,
|
| 46 |
+
"train_loss": 0.05677206691354175,
|
| 47 |
+
"val_loss": 0.024434951899300877,
|
| 48 |
+
"ap": 0.9997636390082348,
|
| 49 |
+
"auc": 0.9997586872586872,
|
| 50 |
+
"thr": 0.042775943875312805,
|
| 51 |
+
"p@0.5": 0.990990990990991,
|
| 52 |
+
"r@0.5": 0.9821428571428571,
|
| 53 |
+
"f1@0.5": 0.9865470852017937,
|
| 54 |
+
"p@thr": 0.9824561403508771,
|
| 55 |
+
"r@thr": 1.0,
|
| 56 |
+
"f1@thr": 0.9911504424778761
|
| 57 |
+
},
|
| 58 |
+
{
|
| 59 |
+
"epoch": 5,
|
| 60 |
+
"train_loss": 0.05333746283336592,
|
| 61 |
+
"val_loss": 0.09529338278794544,
|
| 62 |
+
"ap": 0.9996184371184371,
|
| 63 |
+
"auc": 0.9995978120978121,
|
| 64 |
+
"thr": 0.018688704818487167,
|
| 65 |
+
"p@0.5": 1.0,
|
| 66 |
+
"r@0.5": 0.9464285714285714,
|
| 67 |
+
"f1@0.5": 0.9724770642201835,
|
| 68 |
+
"p@thr": 1.0,
|
| 69 |
+
"r@thr": 0.9910714285714286,
|
| 70 |
+
"f1@thr": 0.9955156950672646
|
| 71 |
+
},
|
| 72 |
+
{
|
| 73 |
+
"epoch": 6,
|
| 74 |
+
"train_loss": 0.1029799613893021,
|
| 75 |
+
"val_loss": 0.03771801323897047,
|
| 76 |
+
"ap": 0.9993358913813459,
|
| 77 |
+
"auc": 0.9992760617760618,
|
| 78 |
+
"thr": 0.9908594489097595,
|
| 79 |
+
"p@0.5": 0.9910714285714286,
|
| 80 |
+
"r@0.5": 0.9910714285714286,
|
| 81 |
+
"f1@0.5": 0.9910714285714286,
|
| 82 |
+
"p@thr": 1.0,
|
| 83 |
+
"r@thr": 0.9910714285714286,
|
| 84 |
+
"f1@thr": 0.9955156950672646
|
| 85 |
+
},
|
| 86 |
+
{
|
| 87 |
+
"epoch": 7,
|
| 88 |
+
"train_loss": 0.017501240327736454,
|
| 89 |
+
"val_loss": 0.04377351038082062,
|
| 90 |
+
"ap": 0.9991359447004609,
|
| 91 |
+
"auc": 0.9990347490347491,
|
| 92 |
+
"thr": 0.9368125200271606,
|
| 93 |
+
"p@0.5": 0.9910714285714286,
|
| 94 |
+
"r@0.5": 0.9910714285714286,
|
| 95 |
+
"f1@0.5": 0.9910714285714286,
|
| 96 |
+
"p@thr": 1.0,
|
| 97 |
+
"r@thr": 0.9910714285714286,
|
| 98 |
+
"f1@thr": 0.9955156950672646
|
| 99 |
+
},
|
| 100 |
+
{
|
| 101 |
+
"epoch": 8,
|
| 102 |
+
"train_loss": 0.030610826078336463,
|
| 103 |
+
"val_loss": 0.015787792323992886,
|
| 104 |
+
"ap": 0.9998412667057974,
|
| 105 |
+
"auc": 0.9998391248391248,
|
| 106 |
+
"thr": 0.4818607568740845,
|
| 107 |
+
"p@0.5": 0.9910714285714286,
|
| 108 |
+
"r@0.5": 0.9910714285714286,
|
| 109 |
+
"f1@0.5": 0.9910714285714286,
|
| 110 |
+
"p@thr": 0.9911504424778761,
|
| 111 |
+
"r@thr": 1.0,
|
| 112 |
+
"f1@thr": 0.9955555555555555
|
| 113 |
+
},
|
| 114 |
+
{
|
| 115 |
+
"epoch": 9,
|
| 116 |
+
"train_loss": 0.006521744781084084,
|
| 117 |
+
"val_loss": 0.008422219177191437,
|
| 118 |
+
"ap": 0.9999209860935525,
|
| 119 |
+
"auc": 0.9999195624195624,
|
| 120 |
+
"thr": 0.5057958364486694,
|
| 121 |
+
"p@0.5": 0.9911504424778761,
|
| 122 |
+
"r@0.5": 1.0,
|
| 123 |
+
"f1@0.5": 0.9955555555555555,
|
| 124 |
+
"p@thr": 0.9911504424778761,
|
| 125 |
+
"r@thr": 1.0,
|
| 126 |
+
"f1@thr": 0.9955555555555555
|
| 127 |
+
},
|
| 128 |
+
{
|
| 129 |
+
"epoch": 10,
|
| 130 |
+
"train_loss": 0.02104085512313958,
|
| 131 |
+
"val_loss": 0.035103952907206804,
|
| 132 |
+
"ap": 0.9997608291253598,
|
| 133 |
+
"auc": 0.9997586872586872,
|
| 134 |
+
"thr": 0.8897470235824585,
|
| 135 |
+
"p@0.5": 0.9911504424778761,
|
| 136 |
+
"r@0.5": 1.0,
|
| 137 |
+
"f1@0.5": 0.9955555555555555,
|
| 138 |
+
"p@thr": 0.9911504424778761,
|
| 139 |
+
"r@thr": 1.0,
|
| 140 |
+
"f1@thr": 0.9955555555555555
|
| 141 |
+
},
|
| 142 |
+
{
|
| 143 |
+
"epoch": 11,
|
| 144 |
+
"train_loss": 0.009039335639143744,
|
| 145 |
+
"val_loss": 0.011095353777839989,
|
| 146 |
+
"ap": 0.9998412667057974,
|
| 147 |
+
"auc": 0.9998391248391248,
|
| 148 |
+
"thr": 0.7937497496604919,
|
| 149 |
+
"p@0.5": 0.9911504424778761,
|
| 150 |
+
"r@0.5": 1.0,
|
| 151 |
+
"f1@0.5": 0.9955555555555555,
|
| 152 |
+
"p@thr": 0.9911504424778761,
|
| 153 |
+
"r@thr": 1.0,
|
| 154 |
+
"f1@thr": 0.9955555555555555
|
| 155 |
+
},
|
| 156 |
+
{
|
| 157 |
+
"epoch": 12,
|
| 158 |
+
"train_loss": 0.044667846663854205,
|
| 159 |
+
"val_loss": 0.04292150645015421,
|
| 160 |
+
"ap": 0.9995977467948463,
|
| 161 |
+
"auc": 0.9995978120978121,
|
| 162 |
+
"thr": 0.9524211287498474,
|
| 163 |
+
"p@0.5": 0.9739130434782609,
|
| 164 |
+
"r@0.5": 1.0,
|
| 165 |
+
"f1@0.5": 0.986784140969163,
|
| 166 |
+
"p@thr": 0.9911504424778761,
|
| 167 |
+
"r@thr": 1.0,
|
| 168 |
+
"f1@thr": 0.9955555555555555
|
| 169 |
+
},
|
| 170 |
+
{
|
| 171 |
+
"epoch": 13,
|
| 172 |
+
"train_loss": 0.012496645635981064,
|
| 173 |
+
"val_loss": 0.024406921999018647,
|
| 174 |
+
"ap": 0.9996873613575865,
|
| 175 |
+
"auc": 0.9996782496782497,
|
| 176 |
+
"thr": 0.8616173267364502,
|
| 177 |
+
"p@0.5": 0.9823008849557522,
|
| 178 |
+
"r@0.5": 0.9910714285714286,
|
| 179 |
+
"f1@0.5": 0.9866666666666667,
|
| 180 |
+
"p@thr": 0.9910714285714286,
|
| 181 |
+
"r@thr": 0.9910714285714286,
|
| 182 |
+
"f1@thr": 0.9910714285714286
|
| 183 |
+
},
|
| 184 |
+
{
|
| 185 |
+
"epoch": 14,
|
| 186 |
+
"train_loss": 0.002151568810941998,
|
| 187 |
+
"val_loss": 0.019393305783328936,
|
| 188 |
+
"ap": 0.99984335839599,
|
| 189 |
+
"auc": 0.9998391248391248,
|
| 190 |
+
"thr": 0.9440849423408508,
|
| 191 |
+
"p@0.5": 0.9910714285714286,
|
| 192 |
+
"r@0.5": 0.9910714285714286,
|
| 193 |
+
"f1@0.5": 0.9910714285714286,
|
| 194 |
+
"p@thr": 1.0,
|
| 195 |
+
"r@thr": 0.9910714285714286,
|
| 196 |
+
"f1@thr": 0.9955156950672646
|
| 197 |
+
}
|
| 198 |
+
]
|
mobilenetv2/inference_config.json
ADDED
|
@@ -0,0 +1,99 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"backend": "timm",
|
| 3 |
+
"model_name": "mobilenetv2_100.ra_in1k",
|
| 4 |
+
"img_size": 224,
|
| 5 |
+
"mean": [
|
| 6 |
+
0.485,
|
| 7 |
+
0.456,
|
| 8 |
+
0.406
|
| 9 |
+
],
|
| 10 |
+
"std": [
|
| 11 |
+
0.229,
|
| 12 |
+
0.224,
|
| 13 |
+
0.225
|
| 14 |
+
],
|
| 15 |
+
"labels": [
|
| 16 |
+
"0",
|
| 17 |
+
"1"
|
| 18 |
+
],
|
| 19 |
+
"threshold": 0.5057958364486694,
|
| 20 |
+
"input_name": "pixel_values",
|
| 21 |
+
"output_name": "logits",
|
| 22 |
+
"val_metrics": {
|
| 23 |
+
"ap": 0.9999209860935525,
|
| 24 |
+
"auc": 0.9999195624195624,
|
| 25 |
+
"threshold": 0.5057958364486694,
|
| 26 |
+
"per_label": {
|
| 27 |
+
"report_by_label": {
|
| 28 |
+
"0": {
|
| 29 |
+
"precision": 1.0,
|
| 30 |
+
"recall": 0.990990990990991,
|
| 31 |
+
"f1-score": 0.995475113122172,
|
| 32 |
+
"support": 111.0
|
| 33 |
+
},
|
| 34 |
+
"1": {
|
| 35 |
+
"precision": 0.9911504424778761,
|
| 36 |
+
"recall": 1.0,
|
| 37 |
+
"f1-score": 0.9955555555555555,
|
| 38 |
+
"support": 112.0
|
| 39 |
+
}
|
| 40 |
+
},
|
| 41 |
+
"accuracy": 0.9955156950672646,
|
| 42 |
+
"confusion_matrix": {
|
| 43 |
+
"labels": [
|
| 44 |
+
"0",
|
| 45 |
+
"1"
|
| 46 |
+
],
|
| 47 |
+
"matrix": [
|
| 48 |
+
[
|
| 49 |
+
110,
|
| 50 |
+
1
|
| 51 |
+
],
|
| 52 |
+
[
|
| 53 |
+
0,
|
| 54 |
+
112
|
| 55 |
+
]
|
| 56 |
+
]
|
| 57 |
+
}
|
| 58 |
+
},
|
| 59 |
+
"threshold_best_f1_score": 0.9955555555550555
|
| 60 |
+
},
|
| 61 |
+
"test_metrics": {
|
| 62 |
+
"ap": 0.9990159004614657,
|
| 63 |
+
"auc": 0.999034749034749,
|
| 64 |
+
"threshold": 0.5057958364486694,
|
| 65 |
+
"per_label": {
|
| 66 |
+
"report_by_label": {
|
| 67 |
+
"0": {
|
| 68 |
+
"precision": 0.9736842105263158,
|
| 69 |
+
"recall": 0.9910714285714286,
|
| 70 |
+
"f1-score": 0.9823008849557522,
|
| 71 |
+
"support": 112.0
|
| 72 |
+
},
|
| 73 |
+
"1": {
|
| 74 |
+
"precision": 0.9908256880733946,
|
| 75 |
+
"recall": 0.972972972972973,
|
| 76 |
+
"f1-score": 0.9818181818181818,
|
| 77 |
+
"support": 111.0
|
| 78 |
+
}
|
| 79 |
+
},
|
| 80 |
+
"accuracy": 0.9820627802690582,
|
| 81 |
+
"confusion_matrix": {
|
| 82 |
+
"labels": [
|
| 83 |
+
"0",
|
| 84 |
+
"1"
|
| 85 |
+
],
|
| 86 |
+
"matrix": [
|
| 87 |
+
[
|
| 88 |
+
111,
|
| 89 |
+
1
|
| 90 |
+
],
|
| 91 |
+
[
|
| 92 |
+
3,
|
| 93 |
+
108
|
| 94 |
+
]
|
| 95 |
+
]
|
| 96 |
+
}
|
| 97 |
+
}
|
| 98 |
+
}
|
| 99 |
+
}
|
mobilenetv2/metrics_test.json
ADDED
|
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"ap": 0.9990159004614657,
|
| 3 |
+
"auc": 0.999034749034749,
|
| 4 |
+
"threshold": 0.5057958364486694,
|
| 5 |
+
"per_label": {
|
| 6 |
+
"report_by_label": {
|
| 7 |
+
"0": {
|
| 8 |
+
"precision": 0.9736842105263158,
|
| 9 |
+
"recall": 0.9910714285714286,
|
| 10 |
+
"f1-score": 0.9823008849557522,
|
| 11 |
+
"support": 112.0
|
| 12 |
+
},
|
| 13 |
+
"1": {
|
| 14 |
+
"precision": 0.9908256880733946,
|
| 15 |
+
"recall": 0.972972972972973,
|
| 16 |
+
"f1-score": 0.9818181818181818,
|
| 17 |
+
"support": 111.0
|
| 18 |
+
}
|
| 19 |
+
},
|
| 20 |
+
"accuracy": 0.9820627802690582,
|
| 21 |
+
"confusion_matrix": {
|
| 22 |
+
"labels": [
|
| 23 |
+
"0",
|
| 24 |
+
"1"
|
| 25 |
+
],
|
| 26 |
+
"matrix": [
|
| 27 |
+
[
|
| 28 |
+
111,
|
| 29 |
+
1
|
| 30 |
+
],
|
| 31 |
+
[
|
| 32 |
+
3,
|
| 33 |
+
108
|
| 34 |
+
]
|
| 35 |
+
]
|
| 36 |
+
}
|
| 37 |
+
}
|
| 38 |
+
}
|
mobilenetv2/metrics_val.json
ADDED
|
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"ap": 0.9999209860935525,
|
| 3 |
+
"auc": 0.9999195624195624,
|
| 4 |
+
"threshold": 0.5057958364486694,
|
| 5 |
+
"per_label": {
|
| 6 |
+
"report_by_label": {
|
| 7 |
+
"0": {
|
| 8 |
+
"precision": 1.0,
|
| 9 |
+
"recall": 0.990990990990991,
|
| 10 |
+
"f1-score": 0.995475113122172,
|
| 11 |
+
"support": 111.0
|
| 12 |
+
},
|
| 13 |
+
"1": {
|
| 14 |
+
"precision": 0.9911504424778761,
|
| 15 |
+
"recall": 1.0,
|
| 16 |
+
"f1-score": 0.9955555555555555,
|
| 17 |
+
"support": 112.0
|
| 18 |
+
}
|
| 19 |
+
},
|
| 20 |
+
"accuracy": 0.9955156950672646,
|
| 21 |
+
"confusion_matrix": {
|
| 22 |
+
"labels": [
|
| 23 |
+
"0",
|
| 24 |
+
"1"
|
| 25 |
+
],
|
| 26 |
+
"matrix": [
|
| 27 |
+
[
|
| 28 |
+
110,
|
| 29 |
+
1
|
| 30 |
+
],
|
| 31 |
+
[
|
| 32 |
+
0,
|
| 33 |
+
112
|
| 34 |
+
]
|
| 35 |
+
]
|
| 36 |
+
}
|
| 37 |
+
},
|
| 38 |
+
"threshold_best_f1_score": 0.9955555555550555
|
| 39 |
+
}
|
mobilenetv2/onnx/model.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5b3e245ce2bc82dab831778f74bf64b73b2d7d83eaa80a1412139d240a97b74f
|
| 3 |
+
size 9107464
|
mobilenetv2/onnx/model.onnx.data
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:487f35c2e3225d5ae5070b569c6609f49187554a63370546bfc4f1200e75cff3
|
| 3 |
+
size 8912896
|
mobilenetv2/pr_curve_val.png
ADDED
|
mobilenetv2/preprocess.json
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"img_size": 224,
|
| 3 |
+
"mean": [
|
| 4 |
+
0.485,
|
| 5 |
+
0.456,
|
| 6 |
+
0.406
|
| 7 |
+
],
|
| 8 |
+
"std": [
|
| 9 |
+
0.229,
|
| 10 |
+
0.224,
|
| 11 |
+
0.225
|
| 12 |
+
],
|
| 13 |
+
"labels": [
|
| 14 |
+
"non_illuminated",
|
| 15 |
+
"illuminated"
|
| 16 |
+
]
|
| 17 |
+
}
|
mobilenetv2/roc_curve_val.png
ADDED
|
mobilenetv3_large/README.md
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Run artefacts: run_20260228_171950_timm_mobilenetv3_large_100.ra_in1k
|
| 2 |
+
|
| 3 |
+
This folder is **uploadable as-is** to the Hugging Face Hub.
|
| 4 |
+
|
| 5 |
+
## Files
|
| 6 |
+
- `onnx/model.onnx`: single-file ONNX model
|
| 7 |
+
- `preprocess.json`: resize/normalize info
|
| 8 |
+
- `inference_config.json`: threshold + labels + IO names
|
| 9 |
+
- `metrics_val.json`, `metrics_test.json`
|
| 10 |
+
- `pr_curve_val.png`, `roc_curve_val.png`
|
| 11 |
+
|
| 12 |
+
## Quick inference (Python)
|
| 13 |
+
Use `scripts/infer_local.py` or `scripts/infer_hf.py`.
|
mobilenetv3_large/config_resolved.yml
ADDED
|
@@ -0,0 +1,61 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
run:
|
| 2 |
+
out_root: artefacts
|
| 3 |
+
name: null
|
| 4 |
+
seed: 42
|
| 5 |
+
device: auto
|
| 6 |
+
num_workers: 0
|
| 7 |
+
early_stopping_patience: 5
|
| 8 |
+
metric_for_best: ap
|
| 9 |
+
data:
|
| 10 |
+
source: local
|
| 11 |
+
local:
|
| 12 |
+
root: dataset
|
| 13 |
+
splits:
|
| 14 |
+
train: train
|
| 15 |
+
val: val
|
| 16 |
+
test: test
|
| 17 |
+
classes:
|
| 18 |
+
negative: non_illustration
|
| 19 |
+
positive: illustration
|
| 20 |
+
hf:
|
| 21 |
+
dataset: null
|
| 22 |
+
image_column: image
|
| 23 |
+
label_column: label
|
| 24 |
+
splits:
|
| 25 |
+
train: train
|
| 26 |
+
val: validation
|
| 27 |
+
test: test
|
| 28 |
+
label_names:
|
| 29 |
+
- '0'
|
| 30 |
+
- '1'
|
| 31 |
+
model:
|
| 32 |
+
backend: timm
|
| 33 |
+
name: mobilenetv3_large_100.ra_in1k
|
| 34 |
+
pretrained: true
|
| 35 |
+
freeze_backbone: false
|
| 36 |
+
preprocess:
|
| 37 |
+
mode: auto
|
| 38 |
+
img_size: 224
|
| 39 |
+
mean:
|
| 40 |
+
- 0.485
|
| 41 |
+
- 0.456
|
| 42 |
+
- 0.406
|
| 43 |
+
std:
|
| 44 |
+
- 0.229
|
| 45 |
+
- 0.224
|
| 46 |
+
- 0.225
|
| 47 |
+
augment:
|
| 48 |
+
enabled: true
|
| 49 |
+
hflip: true
|
| 50 |
+
rotation_deg: 5
|
| 51 |
+
jitter:
|
| 52 |
+
brightness: 0.12
|
| 53 |
+
contrast: 0.12
|
| 54 |
+
saturation: 0.08
|
| 55 |
+
hue: 0.02
|
| 56 |
+
train:
|
| 57 |
+
epochs: 15
|
| 58 |
+
batch_size: 32
|
| 59 |
+
lr: 3e-4
|
| 60 |
+
export:
|
| 61 |
+
opset: 18
|
mobilenetv3_large/history.json
ADDED
|
@@ -0,0 +1,100 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"epoch": 1,
|
| 4 |
+
"train_loss": 0.6888182502288505,
|
| 5 |
+
"val_loss": 0.09036096846866773,
|
| 6 |
+
"ap": 0.9978410242521666,
|
| 7 |
+
"auc": 0.9971846846846846,
|
| 8 |
+
"thr": 0.2575071156024933,
|
| 9 |
+
"p@0.5": 1.0,
|
| 10 |
+
"r@0.5": 0.9821428571428571,
|
| 11 |
+
"f1@0.5": 0.990990990990991,
|
| 12 |
+
"p@thr": 0.9910714285714286,
|
| 13 |
+
"r@thr": 0.9910714285714286,
|
| 14 |
+
"f1@thr": 0.9910714285714286
|
| 15 |
+
},
|
| 16 |
+
{
|
| 17 |
+
"epoch": 2,
|
| 18 |
+
"train_loss": 0.15885185961886264,
|
| 19 |
+
"val_loss": 0.0019039563731055864,
|
| 20 |
+
"ap": 1.0,
|
| 21 |
+
"auc": 1.0,
|
| 22 |
+
"thr": 0.8973163962364197,
|
| 23 |
+
"p@0.5": 1.0,
|
| 24 |
+
"r@0.5": 1.0,
|
| 25 |
+
"f1@0.5": 1.0,
|
| 26 |
+
"p@thr": 1.0,
|
| 27 |
+
"r@thr": 1.0,
|
| 28 |
+
"f1@thr": 1.0
|
| 29 |
+
},
|
| 30 |
+
{
|
| 31 |
+
"epoch": 3,
|
| 32 |
+
"train_loss": 0.10055956929316821,
|
| 33 |
+
"val_loss": 0.07646948005555844,
|
| 34 |
+
"ap": 0.9996069237771489,
|
| 35 |
+
"auc": 0.9995978120978122,
|
| 36 |
+
"thr": 0.0031442823819816113,
|
| 37 |
+
"p@0.5": 1.0,
|
| 38 |
+
"r@0.5": 0.9732142857142857,
|
| 39 |
+
"f1@0.5": 0.9864253393665159,
|
| 40 |
+
"p@thr": 0.9910714285714286,
|
| 41 |
+
"r@thr": 0.9910714285714286,
|
| 42 |
+
"f1@thr": 0.9910714285714286
|
| 43 |
+
},
|
| 44 |
+
{
|
| 45 |
+
"epoch": 4,
|
| 46 |
+
"train_loss": 0.09780621805036431,
|
| 47 |
+
"val_loss": 0.07303765171930365,
|
| 48 |
+
"ap": 0.999679660294191,
|
| 49 |
+
"auc": 0.9996782496782497,
|
| 50 |
+
"thr": 0.9988993406295776,
|
| 51 |
+
"p@0.5": 0.9824561403508771,
|
| 52 |
+
"r@0.5": 1.0,
|
| 53 |
+
"f1@0.5": 0.9911504424778761,
|
| 54 |
+
"p@thr": 0.9911504424778761,
|
| 55 |
+
"r@thr": 1.0,
|
| 56 |
+
"f1@thr": 0.9955555555555555
|
| 57 |
+
},
|
| 58 |
+
{
|
| 59 |
+
"epoch": 5,
|
| 60 |
+
"train_loss": 0.058571264585469386,
|
| 61 |
+
"val_loss": 0.07458657122999414,
|
| 62 |
+
"ap": 0.999679660294191,
|
| 63 |
+
"auc": 0.9996782496782497,
|
| 64 |
+
"thr": 0.9999737739562988,
|
| 65 |
+
"p@0.5": 0.9739130434782609,
|
| 66 |
+
"r@0.5": 1.0,
|
| 67 |
+
"f1@0.5": 0.986784140969163,
|
| 68 |
+
"p@thr": 0.9911504424778761,
|
| 69 |
+
"r@thr": 1.0,
|
| 70 |
+
"f1@thr": 0.9955555555555555
|
| 71 |
+
},
|
| 72 |
+
{
|
| 73 |
+
"epoch": 6,
|
| 74 |
+
"train_loss": 0.09667659115752363,
|
| 75 |
+
"val_loss": 0.039825086668445565,
|
| 76 |
+
"ap": 0.9996873613575865,
|
| 77 |
+
"auc": 0.9996782496782497,
|
| 78 |
+
"thr": 0.5820810794830322,
|
| 79 |
+
"p@0.5": 0.9910714285714286,
|
| 80 |
+
"r@0.5": 0.9910714285714286,
|
| 81 |
+
"f1@0.5": 0.9910714285714286,
|
| 82 |
+
"p@thr": 0.9910714285714286,
|
| 83 |
+
"r@thr": 0.9910714285714286,
|
| 84 |
+
"f1@thr": 0.9910714285714286
|
| 85 |
+
},
|
| 86 |
+
{
|
| 87 |
+
"epoch": 7,
|
| 88 |
+
"train_loss": 0.04965379409636074,
|
| 89 |
+
"val_loss": 0.017542159338566825,
|
| 90 |
+
"ap": 0.9999209860935525,
|
| 91 |
+
"auc": 0.9999195624195624,
|
| 92 |
+
"thr": 0.032808057963848114,
|
| 93 |
+
"p@0.5": 1.0,
|
| 94 |
+
"r@0.5": 0.9910714285714286,
|
| 95 |
+
"f1@0.5": 0.9955156950672646,
|
| 96 |
+
"p@thr": 0.9911504424778761,
|
| 97 |
+
"r@thr": 1.0,
|
| 98 |
+
"f1@thr": 0.9955555555555555
|
| 99 |
+
}
|
| 100 |
+
]
|
mobilenetv3_large/inference_config.json
ADDED
|
@@ -0,0 +1,99 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"backend": "timm",
|
| 3 |
+
"model_name": "mobilenetv3_large_100.ra_in1k",
|
| 4 |
+
"img_size": 224,
|
| 5 |
+
"mean": [
|
| 6 |
+
0.485,
|
| 7 |
+
0.456,
|
| 8 |
+
0.406
|
| 9 |
+
],
|
| 10 |
+
"std": [
|
| 11 |
+
0.229,
|
| 12 |
+
0.224,
|
| 13 |
+
0.225
|
| 14 |
+
],
|
| 15 |
+
"labels": [
|
| 16 |
+
"0",
|
| 17 |
+
"1"
|
| 18 |
+
],
|
| 19 |
+
"threshold": 0.8973163962364197,
|
| 20 |
+
"input_name": "pixel_values",
|
| 21 |
+
"output_name": "logits",
|
| 22 |
+
"val_metrics": {
|
| 23 |
+
"ap": 1.0,
|
| 24 |
+
"auc": 1.0,
|
| 25 |
+
"threshold": 0.8973163962364197,
|
| 26 |
+
"per_label": {
|
| 27 |
+
"report_by_label": {
|
| 28 |
+
"0": {
|
| 29 |
+
"precision": 1.0,
|
| 30 |
+
"recall": 1.0,
|
| 31 |
+
"f1-score": 1.0,
|
| 32 |
+
"support": 111.0
|
| 33 |
+
},
|
| 34 |
+
"1": {
|
| 35 |
+
"precision": 1.0,
|
| 36 |
+
"recall": 1.0,
|
| 37 |
+
"f1-score": 1.0,
|
| 38 |
+
"support": 112.0
|
| 39 |
+
}
|
| 40 |
+
},
|
| 41 |
+
"accuracy": 1.0,
|
| 42 |
+
"confusion_matrix": {
|
| 43 |
+
"labels": [
|
| 44 |
+
"0",
|
| 45 |
+
"1"
|
| 46 |
+
],
|
| 47 |
+
"matrix": [
|
| 48 |
+
[
|
| 49 |
+
111,
|
| 50 |
+
0
|
| 51 |
+
],
|
| 52 |
+
[
|
| 53 |
+
0,
|
| 54 |
+
112
|
| 55 |
+
]
|
| 56 |
+
]
|
| 57 |
+
}
|
| 58 |
+
},
|
| 59 |
+
"threshold_best_f1_score": 0.9999999999995
|
| 60 |
+
},
|
| 61 |
+
"test_metrics": {
|
| 62 |
+
"ap": 0.9943021124135675,
|
| 63 |
+
"auc": 0.9917953667953668,
|
| 64 |
+
"threshold": 0.8973163962364197,
|
| 65 |
+
"per_label": {
|
| 66 |
+
"report_by_label": {
|
| 67 |
+
"0": {
|
| 68 |
+
"precision": 0.9739130434782609,
|
| 69 |
+
"recall": 1.0,
|
| 70 |
+
"f1-score": 0.986784140969163,
|
| 71 |
+
"support": 112.0
|
| 72 |
+
},
|
| 73 |
+
"1": {
|
| 74 |
+
"precision": 1.0,
|
| 75 |
+
"recall": 0.972972972972973,
|
| 76 |
+
"f1-score": 0.9863013698630136,
|
| 77 |
+
"support": 111.0
|
| 78 |
+
}
|
| 79 |
+
},
|
| 80 |
+
"accuracy": 0.9865470852017937,
|
| 81 |
+
"confusion_matrix": {
|
| 82 |
+
"labels": [
|
| 83 |
+
"0",
|
| 84 |
+
"1"
|
| 85 |
+
],
|
| 86 |
+
"matrix": [
|
| 87 |
+
[
|
| 88 |
+
112,
|
| 89 |
+
0
|
| 90 |
+
],
|
| 91 |
+
[
|
| 92 |
+
3,
|
| 93 |
+
108
|
| 94 |
+
]
|
| 95 |
+
]
|
| 96 |
+
}
|
| 97 |
+
}
|
| 98 |
+
}
|
| 99 |
+
}
|
mobilenetv3_large/metrics_test.json
ADDED
|
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"ap": 0.9943021124135675,
|
| 3 |
+
"auc": 0.9917953667953668,
|
| 4 |
+
"threshold": 0.8973163962364197,
|
| 5 |
+
"per_label": {
|
| 6 |
+
"report_by_label": {
|
| 7 |
+
"0": {
|
| 8 |
+
"precision": 0.9739130434782609,
|
| 9 |
+
"recall": 1.0,
|
| 10 |
+
"f1-score": 0.986784140969163,
|
| 11 |
+
"support": 112.0
|
| 12 |
+
},
|
| 13 |
+
"1": {
|
| 14 |
+
"precision": 1.0,
|
| 15 |
+
"recall": 0.972972972972973,
|
| 16 |
+
"f1-score": 0.9863013698630136,
|
| 17 |
+
"support": 111.0
|
| 18 |
+
}
|
| 19 |
+
},
|
| 20 |
+
"accuracy": 0.9865470852017937,
|
| 21 |
+
"confusion_matrix": {
|
| 22 |
+
"labels": [
|
| 23 |
+
"0",
|
| 24 |
+
"1"
|
| 25 |
+
],
|
| 26 |
+
"matrix": [
|
| 27 |
+
[
|
| 28 |
+
112,
|
| 29 |
+
0
|
| 30 |
+
],
|
| 31 |
+
[
|
| 32 |
+
3,
|
| 33 |
+
108
|
| 34 |
+
]
|
| 35 |
+
]
|
| 36 |
+
}
|
| 37 |
+
}
|
| 38 |
+
}
|
mobilenetv3_large/metrics_val.json
ADDED
|
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"ap": 1.0,
|
| 3 |
+
"auc": 1.0,
|
| 4 |
+
"threshold": 0.8973163962364197,
|
| 5 |
+
"per_label": {
|
| 6 |
+
"report_by_label": {
|
| 7 |
+
"0": {
|
| 8 |
+
"precision": 1.0,
|
| 9 |
+
"recall": 1.0,
|
| 10 |
+
"f1-score": 1.0,
|
| 11 |
+
"support": 111.0
|
| 12 |
+
},
|
| 13 |
+
"1": {
|
| 14 |
+
"precision": 1.0,
|
| 15 |
+
"recall": 1.0,
|
| 16 |
+
"f1-score": 1.0,
|
| 17 |
+
"support": 112.0
|
| 18 |
+
}
|
| 19 |
+
},
|
| 20 |
+
"accuracy": 1.0,
|
| 21 |
+
"confusion_matrix": {
|
| 22 |
+
"labels": [
|
| 23 |
+
"0",
|
| 24 |
+
"1"
|
| 25 |
+
],
|
| 26 |
+
"matrix": [
|
| 27 |
+
[
|
| 28 |
+
111,
|
| 29 |
+
0
|
| 30 |
+
],
|
| 31 |
+
[
|
| 32 |
+
0,
|
| 33 |
+
112
|
| 34 |
+
]
|
| 35 |
+
]
|
| 36 |
+
}
|
| 37 |
+
},
|
| 38 |
+
"threshold_best_f1_score": 0.9999999999995
|
| 39 |
+
}
|
mobilenetv3_large/onnx/model.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2407e4aa74ea8d398144046bbc3623273f93242ec4dfdac3d155ee4f20d636a6
|
| 3 |
+
size 17138155
|
mobilenetv3_large/onnx/model.onnx.data
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d414ec76a43e02aaffc7dd8c6024567589a18cd5a7dcdcdd9ca42d4374019ad4
|
| 3 |
+
size 16777216
|
mobilenetv3_large/pr_curve_val.png
ADDED
|
mobilenetv3_large/preprocess.json
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"img_size": 224,
|
| 3 |
+
"mean": [
|
| 4 |
+
0.485,
|
| 5 |
+
0.456,
|
| 6 |
+
0.406
|
| 7 |
+
],
|
| 8 |
+
"std": [
|
| 9 |
+
0.229,
|
| 10 |
+
0.224,
|
| 11 |
+
0.225
|
| 12 |
+
],
|
| 13 |
+
"labels": [
|
| 14 |
+
"non_illuminated",
|
| 15 |
+
"illuminated"
|
| 16 |
+
]
|
| 17 |
+
}
|
mobilenetv3_large/roc_curve_val.png
ADDED
|
mobilenetv3_small/README.md
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Run artefacts: run_20260228_165352_timm_mobilenetv3_small_100.lamb_in1k
|
| 2 |
+
|
| 3 |
+
This folder is **uploadable as-is** to the Hugging Face Hub.
|
| 4 |
+
|
| 5 |
+
## Files
|
| 6 |
+
- `onnx/model.onnx`: single-file ONNX model
|
| 7 |
+
- `preprocess.json`: resize/normalize info
|
| 8 |
+
- `inference_config.json`: threshold + labels + IO names
|
| 9 |
+
- `metrics_val.json`, `metrics_test.json`
|
| 10 |
+
- `pr_curve_val.png`, `roc_curve_val.png`
|
| 11 |
+
|
| 12 |
+
## Quick inference (Python)
|
| 13 |
+
Use `scripts/infer_local.py` or `scripts/infer_hf.py`.
|
mobilenetv3_small/config_resolved.yml
ADDED
|
@@ -0,0 +1,61 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
run:
|
| 2 |
+
out_root: artefacts
|
| 3 |
+
name: null
|
| 4 |
+
seed: 42
|
| 5 |
+
device: auto
|
| 6 |
+
num_workers: 0
|
| 7 |
+
early_stopping_patience: 5
|
| 8 |
+
metric_for_best: ap
|
| 9 |
+
data:
|
| 10 |
+
source: local
|
| 11 |
+
local:
|
| 12 |
+
root: dataset
|
| 13 |
+
splits:
|
| 14 |
+
train: train
|
| 15 |
+
val: val
|
| 16 |
+
test: test
|
| 17 |
+
classes:
|
| 18 |
+
negative: non_illustration
|
| 19 |
+
positive: illustration
|
| 20 |
+
hf:
|
| 21 |
+
dataset: null
|
| 22 |
+
image_column: image
|
| 23 |
+
label_column: label
|
| 24 |
+
splits:
|
| 25 |
+
train: train
|
| 26 |
+
val: validation
|
| 27 |
+
test: test
|
| 28 |
+
label_names:
|
| 29 |
+
- non_illustration
|
| 30 |
+
- illustration
|
| 31 |
+
model:
|
| 32 |
+
backend: timm
|
| 33 |
+
name: mobilenetv3_small_100.lamb_in1k
|
| 34 |
+
pretrained: true
|
| 35 |
+
freeze_backbone: false
|
| 36 |
+
preprocess:
|
| 37 |
+
mode: auto
|
| 38 |
+
img_size: 224
|
| 39 |
+
mean:
|
| 40 |
+
- 0.485
|
| 41 |
+
- 0.456
|
| 42 |
+
- 0.406
|
| 43 |
+
std:
|
| 44 |
+
- 0.229
|
| 45 |
+
- 0.224
|
| 46 |
+
- 0.225
|
| 47 |
+
augment:
|
| 48 |
+
enabled: true
|
| 49 |
+
hflip: true
|
| 50 |
+
rotation_deg: 5
|
| 51 |
+
jitter:
|
| 52 |
+
brightness: 0.12
|
| 53 |
+
contrast: 0.12
|
| 54 |
+
saturation: 0.08
|
| 55 |
+
hue: 0.02
|
| 56 |
+
train:
|
| 57 |
+
epochs: 15
|
| 58 |
+
batch_size: 32
|
| 59 |
+
lr: 3e-4
|
| 60 |
+
export:
|
| 61 |
+
opset: 18
|
mobilenetv3_small/history.json
ADDED
|
@@ -0,0 +1,142 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"epoch": 1,
|
| 4 |
+
"train_loss": 1.0868408999705217,
|
| 5 |
+
"val_loss": 0.36503355598792303,
|
| 6 |
+
"ap": 0.9907990553365204,
|
| 7 |
+
"auc": 0.988497425997426,
|
| 8 |
+
"thr": 0.9999947547912598,
|
| 9 |
+
"p@0.5": 0.8870967741935484,
|
| 10 |
+
"r@0.5": 0.9821428571428571,
|
| 11 |
+
"f1@0.5": 0.9322033898305084,
|
| 12 |
+
"p@thr": 1.0,
|
| 13 |
+
"r@thr": 0.9196428571428571,
|
| 14 |
+
"f1@thr": 0.958139534883721
|
| 15 |
+
},
|
| 16 |
+
{
|
| 17 |
+
"epoch": 2,
|
| 18 |
+
"train_loss": 0.302987942066631,
|
| 19 |
+
"val_loss": 0.2148190059402363,
|
| 20 |
+
"ap": 0.9934472800285261,
|
| 21 |
+
"auc": 0.9906692406692407,
|
| 22 |
+
"thr": 0.016991911455988884,
|
| 23 |
+
"p@0.5": 0.9906542056074766,
|
| 24 |
+
"r@0.5": 0.9464285714285714,
|
| 25 |
+
"f1@0.5": 0.9680365296803652,
|
| 26 |
+
"p@thr": 0.972972972972973,
|
| 27 |
+
"r@thr": 0.9642857142857143,
|
| 28 |
+
"f1@thr": 0.968609865470852
|
| 29 |
+
},
|
| 30 |
+
{
|
| 31 |
+
"epoch": 3,
|
| 32 |
+
"train_loss": 0.14406887335432783,
|
| 33 |
+
"val_loss": 0.5304914396331242,
|
| 34 |
+
"ap": 0.9889334136330994,
|
| 35 |
+
"auc": 0.9851994851994852,
|
| 36 |
+
"thr": 0.00013374762784224004,
|
| 37 |
+
"p@0.5": 1.0,
|
| 38 |
+
"r@0.5": 0.8839285714285714,
|
| 39 |
+
"f1@0.5": 0.9383886255924171,
|
| 40 |
+
"p@thr": 0.9553571428571429,
|
| 41 |
+
"r@thr": 0.9553571428571429,
|
| 42 |
+
"f1@thr": 0.9553571428571429
|
| 43 |
+
},
|
| 44 |
+
{
|
| 45 |
+
"epoch": 4,
|
| 46 |
+
"train_loss": 0.1769583746228653,
|
| 47 |
+
"val_loss": 0.058696481264113184,
|
| 48 |
+
"ap": 0.9977053140096619,
|
| 49 |
+
"auc": 0.997104247104247,
|
| 50 |
+
"thr": 0.465135782957077,
|
| 51 |
+
"p@0.5": 1.0,
|
| 52 |
+
"r@0.5": 0.9732142857142857,
|
| 53 |
+
"f1@0.5": 0.9864253393665159,
|
| 54 |
+
"p@thr": 1.0,
|
| 55 |
+
"r@thr": 0.9821428571428571,
|
| 56 |
+
"f1@thr": 0.990990990990991
|
| 57 |
+
},
|
| 58 |
+
{
|
| 59 |
+
"epoch": 5,
|
| 60 |
+
"train_loss": 0.17612643633533895,
|
| 61 |
+
"val_loss": 0.03337511599862099,
|
| 62 |
+
"ap": 0.9996832014277973,
|
| 63 |
+
"auc": 0.9996782496782497,
|
| 64 |
+
"thr": 0.6726846694946289,
|
| 65 |
+
"p@0.5": 0.9739130434782609,
|
| 66 |
+
"r@0.5": 1.0,
|
| 67 |
+
"f1@0.5": 0.986784140969163,
|
| 68 |
+
"p@thr": 0.9824561403508771,
|
| 69 |
+
"r@thr": 1.0,
|
| 70 |
+
"f1@thr": 0.9911504424778761
|
| 71 |
+
},
|
| 72 |
+
{
|
| 73 |
+
"epoch": 6,
|
| 74 |
+
"train_loss": 0.14776804928613163,
|
| 75 |
+
"val_loss": 0.06837118350501571,
|
| 76 |
+
"ap": 0.9963561767309908,
|
| 77 |
+
"auc": 0.9950933075933077,
|
| 78 |
+
"thr": 0.36535075306892395,
|
| 79 |
+
"p@0.5": 0.9908256880733946,
|
| 80 |
+
"r@0.5": 0.9642857142857143,
|
| 81 |
+
"f1@0.5": 0.9773755656108597,
|
| 82 |
+
"p@thr": 0.990990990990991,
|
| 83 |
+
"r@thr": 0.9821428571428571,
|
| 84 |
+
"f1@thr": 0.9865470852017937
|
| 85 |
+
},
|
| 86 |
+
{
|
| 87 |
+
"epoch": 7,
|
| 88 |
+
"train_loss": 0.03750141184939297,
|
| 89 |
+
"val_loss": 0.08679394423565359,
|
| 90 |
+
"ap": 0.996049137237876,
|
| 91 |
+
"auc": 0.9936454311454311,
|
| 92 |
+
"thr": 0.4252488315105438,
|
| 93 |
+
"p@0.5": 0.9821428571428571,
|
| 94 |
+
"r@0.5": 0.9821428571428571,
|
| 95 |
+
"f1@0.5": 0.9821428571428571,
|
| 96 |
+
"p@thr": 0.9823008849557522,
|
| 97 |
+
"r@thr": 0.9910714285714286,
|
| 98 |
+
"f1@thr": 0.9866666666666667
|
| 99 |
+
},
|
| 100 |
+
{
|
| 101 |
+
"epoch": 8,
|
| 102 |
+
"train_loss": 0.03465930855390704,
|
| 103 |
+
"val_loss": 0.11857123919045469,
|
| 104 |
+
"ap": 0.9957081515525549,
|
| 105 |
+
"auc": 0.9922779922779923,
|
| 106 |
+
"thr": 0.05427879840135574,
|
| 107 |
+
"p@0.5": 0.990909090909091,
|
| 108 |
+
"r@0.5": 0.9732142857142857,
|
| 109 |
+
"f1@0.5": 0.9819819819819819,
|
| 110 |
+
"p@thr": 0.9910714285714286,
|
| 111 |
+
"r@thr": 0.9910714285714286,
|
| 112 |
+
"f1@thr": 0.9910714285714286
|
| 113 |
+
},
|
| 114 |
+
{
|
| 115 |
+
"epoch": 9,
|
| 116 |
+
"train_loss": 0.03247845499374142,
|
| 117 |
+
"val_loss": 0.044858380586666566,
|
| 118 |
+
"ap": 0.9973214285714286,
|
| 119 |
+
"auc": 0.9961389961389961,
|
| 120 |
+
"thr": 0.8741072416305542,
|
| 121 |
+
"p@0.5": 0.9910714285714286,
|
| 122 |
+
"r@0.5": 0.9910714285714286,
|
| 123 |
+
"f1@0.5": 0.9910714285714286,
|
| 124 |
+
"p@thr": 1.0,
|
| 125 |
+
"r@thr": 0.9910714285714286,
|
| 126 |
+
"f1@thr": 0.9955156950672646
|
| 127 |
+
},
|
| 128 |
+
{
|
| 129 |
+
"epoch": 10,
|
| 130 |
+
"train_loss": 0.0117425412234187,
|
| 131 |
+
"val_loss": 0.05417561992719909,
|
| 132 |
+
"ap": 0.9968185550082101,
|
| 133 |
+
"auc": 0.99501287001287,
|
| 134 |
+
"thr": 0.5849859714508057,
|
| 135 |
+
"p@0.5": 1.0,
|
| 136 |
+
"r@0.5": 0.9910714285714286,
|
| 137 |
+
"f1@0.5": 0.9955156950672646,
|
| 138 |
+
"p@thr": 1.0,
|
| 139 |
+
"r@thr": 0.9910714285714286,
|
| 140 |
+
"f1@thr": 0.9955156950672646
|
| 141 |
+
}
|
| 142 |
+
]
|
mobilenetv3_small/inference_config.json
ADDED
|
@@ -0,0 +1,99 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"backend": "timm",
|
| 3 |
+
"model_name": "mobilenetv3_small_100.lamb_in1k",
|
| 4 |
+
"img_size": 224,
|
| 5 |
+
"mean": [
|
| 6 |
+
0.485,
|
| 7 |
+
0.456,
|
| 8 |
+
0.406
|
| 9 |
+
],
|
| 10 |
+
"std": [
|
| 11 |
+
0.229,
|
| 12 |
+
0.224,
|
| 13 |
+
0.225
|
| 14 |
+
],
|
| 15 |
+
"labels": [
|
| 16 |
+
"0",
|
| 17 |
+
"1"
|
| 18 |
+
],
|
| 19 |
+
"threshold": 0.6726846694946289,
|
| 20 |
+
"input_name": "pixel_values",
|
| 21 |
+
"output_name": "logits",
|
| 22 |
+
"val_metrics": {
|
| 23 |
+
"ap": 0.9996832014277973,
|
| 24 |
+
"auc": 0.9996782496782497,
|
| 25 |
+
"threshold": 0.6726846694946289,
|
| 26 |
+
"per_label": {
|
| 27 |
+
"report_by_label": {
|
| 28 |
+
"0": {
|
| 29 |
+
"precision": 1.0,
|
| 30 |
+
"recall": 0.9819819819819819,
|
| 31 |
+
"f1-score": 0.990909090909091,
|
| 32 |
+
"support": 111.0
|
| 33 |
+
},
|
| 34 |
+
"1": {
|
| 35 |
+
"precision": 0.9824561403508771,
|
| 36 |
+
"recall": 1.0,
|
| 37 |
+
"f1-score": 0.9911504424778761,
|
| 38 |
+
"support": 112.0
|
| 39 |
+
}
|
| 40 |
+
},
|
| 41 |
+
"accuracy": 0.9910313901345291,
|
| 42 |
+
"confusion_matrix": {
|
| 43 |
+
"labels": [
|
| 44 |
+
"0",
|
| 45 |
+
"1"
|
| 46 |
+
],
|
| 47 |
+
"matrix": [
|
| 48 |
+
[
|
| 49 |
+
109,
|
| 50 |
+
2
|
| 51 |
+
],
|
| 52 |
+
[
|
| 53 |
+
0,
|
| 54 |
+
112
|
| 55 |
+
]
|
| 56 |
+
]
|
| 57 |
+
}
|
| 58 |
+
},
|
| 59 |
+
"threshold_best_f1_score": 0.991150442477376
|
| 60 |
+
},
|
| 61 |
+
"test_metrics": {
|
| 62 |
+
"ap": 0.9961655087392702,
|
| 63 |
+
"auc": 0.9958172458172457,
|
| 64 |
+
"threshold": 0.6726846694946289,
|
| 65 |
+
"per_label": {
|
| 66 |
+
"report_by_label": {
|
| 67 |
+
"0": {
|
| 68 |
+
"precision": 0.9565217391304348,
|
| 69 |
+
"recall": 0.9821428571428571,
|
| 70 |
+
"f1-score": 0.9691629955947136,
|
| 71 |
+
"support": 112.0
|
| 72 |
+
},
|
| 73 |
+
"1": {
|
| 74 |
+
"precision": 0.9814814814814815,
|
| 75 |
+
"recall": 0.954954954954955,
|
| 76 |
+
"f1-score": 0.9680365296803652,
|
| 77 |
+
"support": 111.0
|
| 78 |
+
}
|
| 79 |
+
},
|
| 80 |
+
"accuracy": 0.968609865470852,
|
| 81 |
+
"confusion_matrix": {
|
| 82 |
+
"labels": [
|
| 83 |
+
"0",
|
| 84 |
+
"1"
|
| 85 |
+
],
|
| 86 |
+
"matrix": [
|
| 87 |
+
[
|
| 88 |
+
110,
|
| 89 |
+
2
|
| 90 |
+
],
|
| 91 |
+
[
|
| 92 |
+
5,
|
| 93 |
+
106
|
| 94 |
+
]
|
| 95 |
+
]
|
| 96 |
+
}
|
| 97 |
+
}
|
| 98 |
+
}
|
| 99 |
+
}
|
mobilenetv3_small/metrics_test.json
ADDED
|
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"ap": 0.9961655087392702,
|
| 3 |
+
"auc": 0.9958172458172457,
|
| 4 |
+
"threshold": 0.6726846694946289,
|
| 5 |
+
"per_label": {
|
| 6 |
+
"report_by_label": {
|
| 7 |
+
"0": {
|
| 8 |
+
"precision": 0.9565217391304348,
|
| 9 |
+
"recall": 0.9821428571428571,
|
| 10 |
+
"f1-score": 0.9691629955947136,
|
| 11 |
+
"support": 112.0
|
| 12 |
+
},
|
| 13 |
+
"1": {
|
| 14 |
+
"precision": 0.9814814814814815,
|
| 15 |
+
"recall": 0.954954954954955,
|
| 16 |
+
"f1-score": 0.9680365296803652,
|
| 17 |
+
"support": 111.0
|
| 18 |
+
}
|
| 19 |
+
},
|
| 20 |
+
"accuracy": 0.968609865470852,
|
| 21 |
+
"confusion_matrix": {
|
| 22 |
+
"labels": [
|
| 23 |
+
"0",
|
| 24 |
+
"1"
|
| 25 |
+
],
|
| 26 |
+
"matrix": [
|
| 27 |
+
[
|
| 28 |
+
110,
|
| 29 |
+
2
|
| 30 |
+
],
|
| 31 |
+
[
|
| 32 |
+
5,
|
| 33 |
+
106
|
| 34 |
+
]
|
| 35 |
+
]
|
| 36 |
+
}
|
| 37 |
+
}
|
| 38 |
+
}
|
mobilenetv3_small/metrics_val.json
ADDED
|
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"ap": 0.9996832014277973,
|
| 3 |
+
"auc": 0.9996782496782497,
|
| 4 |
+
"threshold": 0.6726846694946289,
|
| 5 |
+
"per_label": {
|
| 6 |
+
"report_by_label": {
|
| 7 |
+
"0": {
|
| 8 |
+
"precision": 1.0,
|
| 9 |
+
"recall": 0.9819819819819819,
|
| 10 |
+
"f1-score": 0.990909090909091,
|
| 11 |
+
"support": 111.0
|
| 12 |
+
},
|
| 13 |
+
"1": {
|
| 14 |
+
"precision": 0.9824561403508771,
|
| 15 |
+
"recall": 1.0,
|
| 16 |
+
"f1-score": 0.9911504424778761,
|
| 17 |
+
"support": 112.0
|
| 18 |
+
}
|
| 19 |
+
},
|
| 20 |
+
"accuracy": 0.9910313901345291,
|
| 21 |
+
"confusion_matrix": {
|
| 22 |
+
"labels": [
|
| 23 |
+
"0",
|
| 24 |
+
"1"
|
| 25 |
+
],
|
| 26 |
+
"matrix": [
|
| 27 |
+
[
|
| 28 |
+
109,
|
| 29 |
+
2
|
| 30 |
+
],
|
| 31 |
+
[
|
| 32 |
+
0,
|
| 33 |
+
112
|
| 34 |
+
]
|
| 35 |
+
]
|
| 36 |
+
}
|
| 37 |
+
},
|
| 38 |
+
"threshold_best_f1_score": 0.991150442477376
|
| 39 |
+
}
|
mobilenetv3_small/onnx/model.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:69e23671aff23a61a1615e3055ce6fdba7168768a4087429e4f21539adb75374
|
| 3 |
+
size 6375702
|
mobilenetv3_small/onnx/model.onnx.data
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0c7ec5fe1621fcf920c10b1221b9e1aaa6277b754c0ad4c338b615452359131b
|
| 3 |
+
size 6094848
|
mobilenetv3_small/pr_curve_val.png
ADDED
|
mobilenetv3_small/preprocess.json
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"img_size": 224,
|
| 3 |
+
"mean": [
|
| 4 |
+
0.485,
|
| 5 |
+
0.456,
|
| 6 |
+
0.406
|
| 7 |
+
],
|
| 8 |
+
"std": [
|
| 9 |
+
0.229,
|
| 10 |
+
0.224,
|
| 11 |
+
0.225
|
| 12 |
+
],
|
| 13 |
+
"labels": [
|
| 14 |
+
"non_illuminated",
|
| 15 |
+
"illuminated"
|
| 16 |
+
]
|
| 17 |
+
}
|
mobilenetv3_small/roc_curve_val.png
ADDED
|
mobilevitv2/README.md
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Run artefacts: run_20260228_175756_transformers_apple__mobilevitv2-1.0-imagenet1k-256
|
| 2 |
+
|
| 3 |
+
This folder is **uploadable as-is** to the Hugging Face Hub.
|
| 4 |
+
|
| 5 |
+
## Files
|
| 6 |
+
- `onnx/model.onnx`: single-file ONNX model
|
| 7 |
+
- `preprocess.json`: resize/normalize info
|
| 8 |
+
- `inference_config.json`: threshold + labels + IO names
|
| 9 |
+
- `metrics_val.json`, `metrics_test.json`
|
| 10 |
+
- `pr_curve_val.png`, `roc_curve_val.png`
|
| 11 |
+
|
| 12 |
+
## Quick inference (Python)
|
| 13 |
+
Use `scripts/infer_local.py` or `scripts/infer_hf.py`.
|
mobilevitv2/config_resolved.yml
ADDED
|
@@ -0,0 +1,62 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
run:
|
| 2 |
+
out_root: artefacts
|
| 3 |
+
name: null
|
| 4 |
+
seed: 42
|
| 5 |
+
device: auto
|
| 6 |
+
num_workers: 0
|
| 7 |
+
early_stopping_patience: 5
|
| 8 |
+
metric_for_best: ap
|
| 9 |
+
data:
|
| 10 |
+
source: local
|
| 11 |
+
local:
|
| 12 |
+
root: dataset
|
| 13 |
+
splits:
|
| 14 |
+
train: train
|
| 15 |
+
val: val
|
| 16 |
+
test: test
|
| 17 |
+
classes:
|
| 18 |
+
negative: non_illustration
|
| 19 |
+
positive: illustration
|
| 20 |
+
hf:
|
| 21 |
+
dataset: null
|
| 22 |
+
image_column: image
|
| 23 |
+
label_column: label
|
| 24 |
+
splits:
|
| 25 |
+
train: train
|
| 26 |
+
val: validation
|
| 27 |
+
test: test
|
| 28 |
+
label_names:
|
| 29 |
+
- '0'
|
| 30 |
+
- '1'
|
| 31 |
+
model:
|
| 32 |
+
backend: transformers
|
| 33 |
+
name: apple/mobilevitv2-1.0-imagenet1k-256
|
| 34 |
+
pretrained: true
|
| 35 |
+
freeze_backbone: false
|
| 36 |
+
preprocess:
|
| 37 |
+
processor_use_fast: false
|
| 38 |
+
mode: auto
|
| 39 |
+
img_size: 288
|
| 40 |
+
mean:
|
| 41 |
+
- 0.485
|
| 42 |
+
- 0.456
|
| 43 |
+
- 0.406
|
| 44 |
+
std:
|
| 45 |
+
- 0.229
|
| 46 |
+
- 0.224
|
| 47 |
+
- 0.225
|
| 48 |
+
augment:
|
| 49 |
+
enabled: true
|
| 50 |
+
hflip: true
|
| 51 |
+
rotation_deg: 5
|
| 52 |
+
jitter:
|
| 53 |
+
brightness: 0.12
|
| 54 |
+
contrast: 0.12
|
| 55 |
+
saturation: 0.08
|
| 56 |
+
hue: 0.02
|
| 57 |
+
train:
|
| 58 |
+
epochs: 30
|
| 59 |
+
batch_size: 32
|
| 60 |
+
lr: 5e-5
|
| 61 |
+
export:
|
| 62 |
+
opset: 18
|
mobilevitv2/history.json
ADDED
|
@@ -0,0 +1,240 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"epoch": 1,
|
| 4 |
+
"train_loss": 0.6136224432425066,
|
| 5 |
+
"val_loss": 0.5309888805661883,
|
| 6 |
+
"ap": 0.9715995957464956,
|
| 7 |
+
"auc": 0.9679054054054054,
|
| 8 |
+
"thr": 0.4898189306259155,
|
| 9 |
+
"p@0.5": 0.9578947368421052,
|
| 10 |
+
"r@0.5": 0.8125,
|
| 11 |
+
"f1@0.5": 0.8792270531400966,
|
| 12 |
+
"p@thr": 0.96,
|
| 13 |
+
"r@thr": 0.8571428571428571,
|
| 14 |
+
"f1@thr": 0.9056603773584906
|
| 15 |
+
},
|
| 16 |
+
{
|
| 17 |
+
"epoch": 2,
|
| 18 |
+
"train_loss": 0.43488134398604883,
|
| 19 |
+
"val_loss": 0.33073335673127857,
|
| 20 |
+
"ap": 0.9852916498151716,
|
| 21 |
+
"auc": 0.9842342342342343,
|
| 22 |
+
"thr": 0.38356244564056396,
|
| 23 |
+
"p@0.5": 0.9702970297029703,
|
| 24 |
+
"r@0.5": 0.875,
|
| 25 |
+
"f1@0.5": 0.92018779342723,
|
| 26 |
+
"p@thr": 0.8934426229508197,
|
| 27 |
+
"r@thr": 0.9732142857142857,
|
| 28 |
+
"f1@thr": 0.9316239316239316
|
| 29 |
+
},
|
| 30 |
+
{
|
| 31 |
+
"epoch": 3,
|
| 32 |
+
"train_loss": 0.2495211593129418,
|
| 33 |
+
"val_loss": 0.17889929243496486,
|
| 34 |
+
"ap": 0.9933598106062923,
|
| 35 |
+
"auc": 0.9931628056628057,
|
| 36 |
+
"thr": 0.5287375450134277,
|
| 37 |
+
"p@0.5": 0.9724770642201835,
|
| 38 |
+
"r@0.5": 0.9464285714285714,
|
| 39 |
+
"f1@0.5": 0.9592760180995475,
|
| 40 |
+
"p@thr": 0.9814814814814815,
|
| 41 |
+
"r@thr": 0.9464285714285714,
|
| 42 |
+
"f1@thr": 0.9636363636363636
|
| 43 |
+
},
|
| 44 |
+
{
|
| 45 |
+
"epoch": 4,
|
| 46 |
+
"train_loss": 0.1396131490667661,
|
| 47 |
+
"val_loss": 0.11305808861340795,
|
| 48 |
+
"ap": 0.9972358158379304,
|
| 49 |
+
"auc": 0.9971846846846847,
|
| 50 |
+
"thr": 0.563666820526123,
|
| 51 |
+
"p@0.5": 0.9649122807017544,
|
| 52 |
+
"r@0.5": 0.9821428571428571,
|
| 53 |
+
"f1@0.5": 0.9734513274336283,
|
| 54 |
+
"p@thr": 0.9734513274336283,
|
| 55 |
+
"r@thr": 0.9821428571428571,
|
| 56 |
+
"f1@thr": 0.9777777777777777
|
| 57 |
+
},
|
| 58 |
+
{
|
| 59 |
+
"epoch": 5,
|
| 60 |
+
"train_loss": 0.09789776660953507,
|
| 61 |
+
"val_loss": 0.07542977162769862,
|
| 62 |
+
"ap": 0.9981531379843416,
|
| 63 |
+
"auc": 0.9981499356499356,
|
| 64 |
+
"thr": 0.6896249651908875,
|
| 65 |
+
"p@0.5": 0.9734513274336283,
|
| 66 |
+
"r@0.5": 0.9821428571428571,
|
| 67 |
+
"f1@0.5": 0.9777777777777777,
|
| 68 |
+
"p@thr": 0.990990990990991,
|
| 69 |
+
"r@thr": 0.9821428571428571,
|
| 70 |
+
"f1@thr": 0.9865470852017937
|
| 71 |
+
},
|
| 72 |
+
{
|
| 73 |
+
"epoch": 6,
|
| 74 |
+
"train_loss": 0.0681087678354798,
|
| 75 |
+
"val_loss": 0.061588000639208725,
|
| 76 |
+
"ap": 0.9985445006096151,
|
| 77 |
+
"auc": 0.9985521235521235,
|
| 78 |
+
"thr": 0.8218199014663696,
|
| 79 |
+
"p@0.5": 0.9734513274336283,
|
| 80 |
+
"r@0.5": 0.9821428571428571,
|
| 81 |
+
"f1@0.5": 0.9777777777777777,
|
| 82 |
+
"p@thr": 0.990990990990991,
|
| 83 |
+
"r@thr": 0.9821428571428571,
|
| 84 |
+
"f1@thr": 0.9865470852017937
|
| 85 |
+
},
|
| 86 |
+
{
|
| 87 |
+
"epoch": 7,
|
| 88 |
+
"train_loss": 0.05540698230492346,
|
| 89 |
+
"val_loss": 0.04914508613624743,
|
| 90 |
+
"ap": 0.9991342174369188,
|
| 91 |
+
"auc": 0.9991151866151866,
|
| 92 |
+
"thr": 0.4745059609413147,
|
| 93 |
+
"p@0.5": 0.9821428571428571,
|
| 94 |
+
"r@0.5": 0.9821428571428571,
|
| 95 |
+
"f1@0.5": 0.9821428571428571,
|
| 96 |
+
"p@thr": 0.9823008849557522,
|
| 97 |
+
"r@thr": 0.9910714285714286,
|
| 98 |
+
"f1@thr": 0.9866666666666667
|
| 99 |
+
},
|
| 100 |
+
{
|
| 101 |
+
"epoch": 8,
|
| 102 |
+
"train_loss": 0.03588254682042382,
|
| 103 |
+
"val_loss": 0.04085694852152041,
|
| 104 |
+
"ap": 0.9993688789278946,
|
| 105 |
+
"auc": 0.9993564993564994,
|
| 106 |
+
"thr": 0.7428937554359436,
|
| 107 |
+
"p@0.5": 0.9823008849557522,
|
| 108 |
+
"r@0.5": 0.9910714285714286,
|
| 109 |
+
"f1@0.5": 0.9866666666666667,
|
| 110 |
+
"p@thr": 0.9910714285714286,
|
| 111 |
+
"r@thr": 0.9910714285714286,
|
| 112 |
+
"f1@thr": 0.9910714285714286
|
| 113 |
+
},
|
| 114 |
+
{
|
| 115 |
+
"epoch": 9,
|
| 116 |
+
"train_loss": 0.030871574188385046,
|
| 117 |
+
"val_loss": 0.03756431902625731,
|
| 118 |
+
"ap": 0.9997670807453414,
|
| 119 |
+
"auc": 0.9997586872586873,
|
| 120 |
+
"thr": 0.8788256645202637,
|
| 121 |
+
"p@0.5": 0.9823008849557522,
|
| 122 |
+
"r@0.5": 0.9910714285714286,
|
| 123 |
+
"f1@0.5": 0.9866666666666667,
|
| 124 |
+
"p@thr": 1.0,
|
| 125 |
+
"r@thr": 0.9910714285714286,
|
| 126 |
+
"f1@thr": 0.9955156950672646
|
| 127 |
+
},
|
| 128 |
+
{
|
| 129 |
+
"epoch": 10,
|
| 130 |
+
"train_loss": 0.046899005813016134,
|
| 131 |
+
"val_loss": 0.038746476539277604,
|
| 132 |
+
"ap": 0.9997670807453414,
|
| 133 |
+
"auc": 0.9997586872586873,
|
| 134 |
+
"thr": 0.9239242672920227,
|
| 135 |
+
"p@0.5": 0.9823008849557522,
|
| 136 |
+
"r@0.5": 0.9910714285714286,
|
| 137 |
+
"f1@0.5": 0.9866666666666667,
|
| 138 |
+
"p@thr": 1.0,
|
| 139 |
+
"r@thr": 0.9910714285714286,
|
| 140 |
+
"f1@thr": 0.9955156950672646
|
| 141 |
+
},
|
| 142 |
+
{
|
| 143 |
+
"epoch": 11,
|
| 144 |
+
"train_loss": 0.023613250877877526,
|
| 145 |
+
"val_loss": 0.03057761028009866,
|
| 146 |
+
"ap": 0.9997670807453415,
|
| 147 |
+
"auc": 0.9997586872586873,
|
| 148 |
+
"thr": 0.868549108505249,
|
| 149 |
+
"p@0.5": 0.9823008849557522,
|
| 150 |
+
"r@0.5": 0.9910714285714286,
|
| 151 |
+
"f1@0.5": 0.9866666666666667,
|
| 152 |
+
"p@thr": 1.0,
|
| 153 |
+
"r@thr": 0.9910714285714286,
|
| 154 |
+
"f1@thr": 0.9955156950672646
|
| 155 |
+
},
|
| 156 |
+
{
|
| 157 |
+
"epoch": 12,
|
| 158 |
+
"train_loss": 0.019699306453041958,
|
| 159 |
+
"val_loss": 0.03165130536737187,
|
| 160 |
+
"ap": 0.9998433583959898,
|
| 161 |
+
"auc": 0.9998391248391248,
|
| 162 |
+
"thr": 0.91166090965271,
|
| 163 |
+
"p@0.5": 0.9823008849557522,
|
| 164 |
+
"r@0.5": 0.9910714285714286,
|
| 165 |
+
"f1@0.5": 0.9866666666666667,
|
| 166 |
+
"p@thr": 1.0,
|
| 167 |
+
"r@thr": 0.9910714285714286,
|
| 168 |
+
"f1@thr": 0.9955156950672646
|
| 169 |
+
},
|
| 170 |
+
{
|
| 171 |
+
"epoch": 13,
|
| 172 |
+
"train_loss": 0.034958065607387456,
|
| 173 |
+
"val_loss": 0.03394456846373422,
|
| 174 |
+
"ap": 0.9994747899159662,
|
| 175 |
+
"auc": 0.9994369369369369,
|
| 176 |
+
"thr": 0.8826852440834045,
|
| 177 |
+
"p@0.5": 0.9823008849557522,
|
| 178 |
+
"r@0.5": 0.9910714285714286,
|
| 179 |
+
"f1@0.5": 0.9866666666666667,
|
| 180 |
+
"p@thr": 1.0,
|
| 181 |
+
"r@thr": 0.9910714285714286,
|
| 182 |
+
"f1@thr": 0.9955156950672646
|
| 183 |
+
},
|
| 184 |
+
{
|
| 185 |
+
"epoch": 14,
|
| 186 |
+
"train_loss": 0.014708122704178095,
|
| 187 |
+
"val_loss": 0.032581535866484046,
|
| 188 |
+
"ap": 0.9997670807453414,
|
| 189 |
+
"auc": 0.9997586872586873,
|
| 190 |
+
"thr": 0.9223722219467163,
|
| 191 |
+
"p@0.5": 0.9823008849557522,
|
| 192 |
+
"r@0.5": 0.9910714285714286,
|
| 193 |
+
"f1@0.5": 0.9866666666666667,
|
| 194 |
+
"p@thr": 1.0,
|
| 195 |
+
"r@thr": 0.9910714285714286,
|
| 196 |
+
"f1@thr": 0.9955156950672646
|
| 197 |
+
},
|
| 198 |
+
{
|
| 199 |
+
"epoch": 15,
|
| 200 |
+
"train_loss": 0.010218438861722296,
|
| 201 |
+
"val_loss": 0.03164625232706645,
|
| 202 |
+
"ap": 0.9997670807453414,
|
| 203 |
+
"auc": 0.9997586872586873,
|
| 204 |
+
"thr": 0.9286591410636902,
|
| 205 |
+
"p@0.5": 0.9823008849557522,
|
| 206 |
+
"r@0.5": 0.9910714285714286,
|
| 207 |
+
"f1@0.5": 0.9866666666666667,
|
| 208 |
+
"p@thr": 1.0,
|
| 209 |
+
"r@thr": 0.9910714285714286,
|
| 210 |
+
"f1@thr": 0.9955156950672646
|
| 211 |
+
},
|
| 212 |
+
{
|
| 213 |
+
"epoch": 16,
|
| 214 |
+
"train_loss": 0.010789826745167375,
|
| 215 |
+
"val_loss": 0.03193989605642855,
|
| 216 |
+
"ap": 0.9997670807453415,
|
| 217 |
+
"auc": 0.9997586872586873,
|
| 218 |
+
"thr": 0.8773350119590759,
|
| 219 |
+
"p@0.5": 0.9823008849557522,
|
| 220 |
+
"r@0.5": 0.9910714285714286,
|
| 221 |
+
"f1@0.5": 0.9866666666666667,
|
| 222 |
+
"p@thr": 1.0,
|
| 223 |
+
"r@thr": 0.9910714285714286,
|
| 224 |
+
"f1@thr": 0.9955156950672646
|
| 225 |
+
},
|
| 226 |
+
{
|
| 227 |
+
"epoch": 17,
|
| 228 |
+
"train_loss": 0.008959678310378822,
|
| 229 |
+
"val_loss": 0.030488197691738605,
|
| 230 |
+
"ap": 0.9998433583959898,
|
| 231 |
+
"auc": 0.9998391248391248,
|
| 232 |
+
"thr": 0.9581832885742188,
|
| 233 |
+
"p@0.5": 0.9823008849557522,
|
| 234 |
+
"r@0.5": 0.9910714285714286,
|
| 235 |
+
"f1@0.5": 0.9866666666666667,
|
| 236 |
+
"p@thr": 1.0,
|
| 237 |
+
"r@thr": 0.9910714285714286,
|
| 238 |
+
"f1@thr": 0.9955156950672646
|
| 239 |
+
}
|
| 240 |
+
]
|
mobilevitv2/inference_config.json
ADDED
|
@@ -0,0 +1,99 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"backend": "transformers",
|
| 3 |
+
"model_name": "apple/mobilevitv2-1.0-imagenet1k-256",
|
| 4 |
+
"img_size": 288,
|
| 5 |
+
"mean": [
|
| 6 |
+
0.485,
|
| 7 |
+
0.456,
|
| 8 |
+
0.406
|
| 9 |
+
],
|
| 10 |
+
"std": [
|
| 11 |
+
0.229,
|
| 12 |
+
0.224,
|
| 13 |
+
0.225
|
| 14 |
+
],
|
| 15 |
+
"labels": [
|
| 16 |
+
"0",
|
| 17 |
+
"1"
|
| 18 |
+
],
|
| 19 |
+
"threshold": 0.91166090965271,
|
| 20 |
+
"input_name": "pixel_values",
|
| 21 |
+
"output_name": "logits",
|
| 22 |
+
"val_metrics": {
|
| 23 |
+
"ap": 0.9998433583959898,
|
| 24 |
+
"auc": 0.9998391248391248,
|
| 25 |
+
"threshold": 0.91166090965271,
|
| 26 |
+
"per_label": {
|
| 27 |
+
"report_by_label": {
|
| 28 |
+
"0": {
|
| 29 |
+
"precision": 0.9910714285714286,
|
| 30 |
+
"recall": 1.0,
|
| 31 |
+
"f1-score": 0.9955156950672646,
|
| 32 |
+
"support": 111.0
|
| 33 |
+
},
|
| 34 |
+
"1": {
|
| 35 |
+
"precision": 1.0,
|
| 36 |
+
"recall": 0.9910714285714286,
|
| 37 |
+
"f1-score": 0.9955156950672646,
|
| 38 |
+
"support": 112.0
|
| 39 |
+
}
|
| 40 |
+
},
|
| 41 |
+
"accuracy": 0.9955156950672646,
|
| 42 |
+
"confusion_matrix": {
|
| 43 |
+
"labels": [
|
| 44 |
+
"0",
|
| 45 |
+
"1"
|
| 46 |
+
],
|
| 47 |
+
"matrix": [
|
| 48 |
+
[
|
| 49 |
+
111,
|
| 50 |
+
0
|
| 51 |
+
],
|
| 52 |
+
[
|
| 53 |
+
1,
|
| 54 |
+
111
|
| 55 |
+
]
|
| 56 |
+
]
|
| 57 |
+
}
|
| 58 |
+
},
|
| 59 |
+
"threshold_best_f1_score": 0.9955156950667645
|
| 60 |
+
},
|
| 61 |
+
"test_metrics": {
|
| 62 |
+
"ap": 0.9991997793851138,
|
| 63 |
+
"auc": 0.9991956241956241,
|
| 64 |
+
"threshold": 0.91166090965271,
|
| 65 |
+
"per_label": {
|
| 66 |
+
"report_by_label": {
|
| 67 |
+
"0": {
|
| 68 |
+
"precision": 0.9572649572649573,
|
| 69 |
+
"recall": 1.0,
|
| 70 |
+
"f1-score": 0.9781659388646288,
|
| 71 |
+
"support": 112.0
|
| 72 |
+
},
|
| 73 |
+
"1": {
|
| 74 |
+
"precision": 1.0,
|
| 75 |
+
"recall": 0.954954954954955,
|
| 76 |
+
"f1-score": 0.9769585253456221,
|
| 77 |
+
"support": 111.0
|
| 78 |
+
}
|
| 79 |
+
},
|
| 80 |
+
"accuracy": 0.9775784753363229,
|
| 81 |
+
"confusion_matrix": {
|
| 82 |
+
"labels": [
|
| 83 |
+
"0",
|
| 84 |
+
"1"
|
| 85 |
+
],
|
| 86 |
+
"matrix": [
|
| 87 |
+
[
|
| 88 |
+
112,
|
| 89 |
+
0
|
| 90 |
+
],
|
| 91 |
+
[
|
| 92 |
+
5,
|
| 93 |
+
106
|
| 94 |
+
]
|
| 95 |
+
]
|
| 96 |
+
}
|
| 97 |
+
}
|
| 98 |
+
}
|
| 99 |
+
}
|
mobilevitv2/metrics_test.json
ADDED
|
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"ap": 0.9991997793851138,
|
| 3 |
+
"auc": 0.9991956241956241,
|
| 4 |
+
"threshold": 0.91166090965271,
|
| 5 |
+
"per_label": {
|
| 6 |
+
"report_by_label": {
|
| 7 |
+
"0": {
|
| 8 |
+
"precision": 0.9572649572649573,
|
| 9 |
+
"recall": 1.0,
|
| 10 |
+
"f1-score": 0.9781659388646288,
|
| 11 |
+
"support": 112.0
|
| 12 |
+
},
|
| 13 |
+
"1": {
|
| 14 |
+
"precision": 1.0,
|
| 15 |
+
"recall": 0.954954954954955,
|
| 16 |
+
"f1-score": 0.9769585253456221,
|
| 17 |
+
"support": 111.0
|
| 18 |
+
}
|
| 19 |
+
},
|
| 20 |
+
"accuracy": 0.9775784753363229,
|
| 21 |
+
"confusion_matrix": {
|
| 22 |
+
"labels": [
|
| 23 |
+
"0",
|
| 24 |
+
"1"
|
| 25 |
+
],
|
| 26 |
+
"matrix": [
|
| 27 |
+
[
|
| 28 |
+
112,
|
| 29 |
+
0
|
| 30 |
+
],
|
| 31 |
+
[
|
| 32 |
+
5,
|
| 33 |
+
106
|
| 34 |
+
]
|
| 35 |
+
]
|
| 36 |
+
}
|
| 37 |
+
}
|
| 38 |
+
}
|
mobilevitv2/metrics_val.json
ADDED
|
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"ap": 0.9998433583959898,
|
| 3 |
+
"auc": 0.9998391248391248,
|
| 4 |
+
"threshold": 0.91166090965271,
|
| 5 |
+
"per_label": {
|
| 6 |
+
"report_by_label": {
|
| 7 |
+
"0": {
|
| 8 |
+
"precision": 0.9910714285714286,
|
| 9 |
+
"recall": 1.0,
|
| 10 |
+
"f1-score": 0.9955156950672646,
|
| 11 |
+
"support": 111.0
|
| 12 |
+
},
|
| 13 |
+
"1": {
|
| 14 |
+
"precision": 1.0,
|
| 15 |
+
"recall": 0.9910714285714286,
|
| 16 |
+
"f1-score": 0.9955156950672646,
|
| 17 |
+
"support": 112.0
|
| 18 |
+
}
|
| 19 |
+
},
|
| 20 |
+
"accuracy": 0.9955156950672646,
|
| 21 |
+
"confusion_matrix": {
|
| 22 |
+
"labels": [
|
| 23 |
+
"0",
|
| 24 |
+
"1"
|
| 25 |
+
],
|
| 26 |
+
"matrix": [
|
| 27 |
+
[
|
| 28 |
+
111,
|
| 29 |
+
0
|
| 30 |
+
],
|
| 31 |
+
[
|
| 32 |
+
1,
|
| 33 |
+
111
|
| 34 |
+
]
|
| 35 |
+
]
|
| 36 |
+
}
|
| 37 |
+
},
|
| 38 |
+
"threshold_best_f1_score": 0.9955156950667645
|
| 39 |
+
}
|
mobilevitv2/onnx/model.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:35a22da40dff4c10f9d63c94992457aaa9e040557c2db2dba9ad91efd9c3e899
|
| 3 |
+
size 18858824
|
mobilevitv2/onnx/model.onnx.data
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:086d3a9a704ba63008d524d86dabf78978119db0c620c61615c38794543879a9
|
| 3 |
+
size 17563648
|
mobilevitv2/pr_curve_val.png
ADDED
|
mobilevitv2/preprocess.json
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"img_size": 288,
|
| 3 |
+
"mean": [
|
| 4 |
+
0.485,
|
| 5 |
+
0.456,
|
| 6 |
+
0.406
|
| 7 |
+
],
|
| 8 |
+
"std": [
|
| 9 |
+
0.229,
|
| 10 |
+
0.224,
|
| 11 |
+
0.225
|
| 12 |
+
],
|
| 13 |
+
"labels": [
|
| 14 |
+
"non_illuminated",
|
| 15 |
+
"illuminated"
|
| 16 |
+
]
|
| 17 |
+
}
|
mobilevitv2/roc_curve_val.png
ADDED
|