jbae1213 committed on
Commit
a9e9a58
·
verified ·
1 Parent(s): d8b30ff

Upload training_config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. training_config.json +39 -0
training_config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model": "Qwen/Qwen3-4B-Instruct-2507",
3
+ "quantization": {
4
+ "load_in_4bit": false
5
+ },
6
+ "dataset": "/root/jb/personas/finance/personal_budgeting/data/qa_pairs_train.json",
7
+ "dataset_resolved_path": "/root/jb/personas/finance/personal_budgeting/data/qa_pairs_train.json",
8
+ "num_train_samples": 5434,
9
+ "num_val_samples": 679,
10
+ "val_dataset": "/root/jb/personas/finance/personal_budgeting/data/qa_pairs_val.json",
11
+ "val_ratio": null,
12
+ "max_samples": null,
13
+ "output_dir": "/root/jb/personas/finance/personal_budgeting/sft_output/2026-03-05_23-01-53",
14
+ "save_artifact_path": "/root/jb/personas/finance/personal_budgeting/sft_output/2026-03-05_23-01-53",
15
+ "lora": {
16
+ "r": 64,
17
+ "lora_alpha": 128,
18
+ "lora_dropout": 0.05
19
+ },
20
+ "training": {
21
+ "num_train_epochs": 2.0,
22
+ "per_device_train_batch_size": 4,
23
+ "gradient_accumulation_steps": 4,
24
+ "learning_rate": 0.0002,
25
+ "max_seq_length": 2048,
26
+ "weight_decay": 0.0,
27
+ "warmup_ratio": 0.05,
28
+ "lr_scheduler_type": "cosine",
29
+ "logging_steps": 20,
30
+ "save_strategy": "steps",
31
+ "save_steps": 500,
32
+ "save_total_limit": 2,
33
+ "eval_strategy": "steps",
34
+ "eval_steps": 500,
35
+ "bf16": true,
36
+ "seed": 3407
37
+ },
38
+ "system_prompt": "You are a finance expert. Based on your financial expertise, provide your response or viewpoint on the given financial question or topic."
39
+ }