File size: 2,964 Bytes
5436158
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
{
  "artifacts": {
    "config_json": "model/config.json",
    "model_safetensors": "model/model.safetensors",
    "summary_json": "model/finetune_summary.json"
  },
  "base_checkpoint": "/opt/opf/privacy_filter",
  "batch_size": 4,
  "best_epoch": 3,
  "best_metric": 0.11836049943755664,
  "best_metric_name": "validation_loss",
  "checkpoint_category_version": "v2",
  "device": "cuda",
  "elapsed_s": 665.0804580459953,
  "encoding": "o200k_base",
  "epoch_metrics": [
    {
      "elapsed_s": 223.2208842949476,
      "epoch": 1,
      "optimizer_steps": 3464,
      "train_batches": 3464,
      "train_loss": 0.19966075787397533,
      "train_token_accuracy": 0.9488236304310493,
      "train_tokens": 518247,
      "validation_batches": 362,
      "validation_loss": 0.12779622916233674,
      "validation_token_accuracy": 0.9629492646418937,
      "validation_tokens": 45964
    },
    {
      "elapsed_s": 215.3937597910408,
      "epoch": 2,
      "optimizer_steps": 3464,
      "train_batches": 3464,
      "train_loss": 0.116074429763646,
      "train_token_accuracy": 0.9701956788944268,
      "train_tokens": 518247,
      "validation_batches": 362,
      "validation_loss": 0.13543586285592848,
      "validation_token_accuracy": 0.9631885823688103,
      "validation_tokens": 45964
    },
    {
      "elapsed_s": 220.0128312209854,
      "epoch": 3,
      "optimizer_steps": 3464,
      "train_batches": 3464,
      "train_loss": 0.08883532059768282,
      "train_token_accuracy": 0.9779024287646624,
      "train_tokens": 518247,
      "validation_batches": 362,
      "validation_loss": 0.11836049943755664,
      "validation_token_accuracy": 0.9700635279784179,
      "validation_tokens": 45964
    }
  ],
  "epochs": 3,
  "generated_at_unix": 1777655501.3715181,
  "grad_accum_steps": 1,
  "label_space_json_path": "model/opf_label_space.json",
  "label_space_source": "label-space-json",
  "learning_rate": 0.0001,
  "max_grad_norm": 1.0,
  "num_output_labels": 49,
  "num_train_examples": 13851,
  "num_train_windows": 13853,
  "num_validation_examples": 1445,
  "num_validation_windows": 1445,
  "output_checkpoint_dir": "model/finetuned_v3",
  "output_head_reinitialized": true,
  "output_head_rows_copied": 49,
  "output_head_rows_copied_exact": 29,
  "output_head_rows_copied_fallback": 20,
  "resolved_category_version": "screenpipe_pii_v1",
  "resolved_n_ctx": 256,
  "schema_version": 1,
  "serialized_param_dtype": "bfloat16",
  "span_class_names": [
    "O",
    "private_person",
    "private_email",
    "private_phone",
    "private_address",
    "private_url",
    "private_company",
    "private_repo",
    "private_handle",
    "private_channel",
    "private_id",
    "private_date",
    "secret"
  ],
  "train_dataset": "model/opf_train_v3.jsonl",
  "train_dataset_variant": "full",
  "validation_dataset": "model/opf_val_v3.jsonl",
  "validation_dataset_variant": "full",
  "validation_split": null,
  "weight_decay": 0.0
}