{
  "model_base": "Qwen/Qwen3-4B-Instruct-2507",
  "model_name": "RegTech-4B-Instruct",
  "dataset": "./train.jsonl",
  "env_file": "/home/ubuntu/sophia-core-server/.tuning/.env.4B",
  "train_samples": 2330,
  "eval_samples": 258,
  "params": {
    "rank": 4,
    "alpha": 8,
    "dropout": 0.05,
    "lr": 1e-05,
    "scheduler": "cosine",
    "epochs": 1,
    "effective_batch": 8,
    "max_seq_length": 4096,
    "neftune_alpha": 0.0,
    "target_modules": [
      "q_proj",
      "k_proj",
      "v_proj",
      "o_proj",
      "gate_proj",
      "up_proj",
      "down_proj"
    ]
  },
  "results": {
    "total_steps": 292,
    "final_train_loss": 1.5045,
    "best_eval_loss": 1.601854681968689,
    "best_eval_step": 240,
    "best_token_accuracy": 0.6812,
    "elapsed_minutes": 8.6
  },
  "loss_history": {
    "train": [
      [
        10,
        2.1906
      ],
      [
        20,
        2.0417
      ],
      [
        30,
        2.1217
      ],
      [
        40,
        2.0513
      ],
      [
        50,
        1.9839
      ],
      [
        60,
        1.9423
      ],
      [
        70,
        1.9321
      ],
      [
        80,
        1.8047
      ],
      [
        90,
        1.7045
      ],
      [
        100,
        1.8603
      ],
      [
        110,
        1.721
      ],
      [
        120,
        1.6419
      ],
      [
        130,
        1.5821
      ],
      [
        140,
        1.5593
      ],
      [
        150,
        1.4756
      ],
      [
        160,
        1.4945
      ],
      [
        170,
        1.5168
      ],
      [
        180,
        1.5689
      ],
      [
        190,
        1.3763
      ],
      [
        200,
        1.5759
      ],
      [
        210,
        1.477
      ],
      [
        220,
        1.4889
      ],
      [
        230,
        1.4514
      ],
      [
        240,
        1.441
      ],
      [
        250,
        1.427
      ],
      [
        260,
        1.4423
      ],
      [
        270,
        1.4199
      ],
      [
        280,
        1.457
      ],
      [
        290,
        1.5045
      ]
    ],
    "eval": [
      [
        80,
        2.036996841430664
      ],
      [
        160,
        1.6603444814682007
      ],
      [
        240,
        1.601854681968689
      ]
    ],
    "token_accuracy": [
      [
        80,
        0.661
      ],
      [
        160,
        0.6759
      ],
      [
        240,
        0.6812
      ]
    ]
  }
}