# LUNA-Training / sft_config.yaml
# ASTERIZER's picture
# Upload sft_config.yaml with huggingface_hub
# 5ea0407 verified
# ─────────────────────────────────────────────────────────────────────────────
# LUNA 100M — SFT Fine-Tuning Configuration
# ─────────────────────────────────────────────────────────────────────────────
# NOTE(review): presumably tells the training script to derive some settings
# automatically — confirm what it overrides before editing the values below.
auto_config: true
# ── Paths ─────────────────────────────────────────────────────────────────────
# Hugging Face model repo that hosts the pretrained latest.pt.
hf_model_repo: 'ASTERIZER/LUNA-100M'
# Hugging Face dataset repo that hosts the SFT data.
hf_dataset_repo: 'ASTERIZER/Luna_Dataset'
# Local path of the pretrained checkpoint (auto-downloaded).
pretrained_ckpt: 'Base/out/pretrain/luna_100m/latest.pt'
# SFT train / validation JSON files.
train_json: 'Base/Datasets/sft_clean/train.json'
val_json: 'Base/Datasets/sft_clean/val.json'
# Output directory for this SFT run.
out_dir: 'Base/out/sft/luna_100m_sft'
# Tokenizer directory (the path points at the Pythia-160M checkpoint folder).
tokenizer_dir: 'Base/checkpoints/EleutherAI/pythia-160m'
# ── Model (must match pretrained — do NOT change) ────────────────────────────
# Architecture hyperparameters, nested under `model` so they load as one
# mapping rather than as separate top-level keys.
model:
  vocab_size: 50304
  seq_len: 1024
  n_layer: 10
  n_embd: 768
  # 768 / 12 = 64 per head, assuming n_embd is split evenly across heads.
  n_head: 12
# ── Training ──────────────────────────────────────────────────────────────────
# Schedule and cadence settings, nested under `train`.
train:
  epochs: 2
  max_tokens: 0  # 0 = use epochs instead
  lr_warmup_steps: 200
  save_interval: 500
  log_interval: 10
  eval_interval: 500  # run validation + eval prompts every N steps
  max_norm: 1.0  # NOTE(review): presumably the gradient-clipping norm — confirm
# ── Optimizer (lower LR for fine-tuning) ──────────────────────────────────────
# Optimizer hyperparameters, nested under `optimizer`.
# Floats keep an explicit dot and signed exponent so YAML 1.1 loaders
# (e.g. PyYAML) read them as numbers rather than strings.
optimizer:
  lr: 1.5e-5
  min_lr: 1.0e-6
  weight_decay: 0.01
  betas: [0.9, 0.95]
  eps: 1.0e-8
# ── Batch sizing ──────────────────────────────────────────────────────────────
# Batch settings, nested under `batch`.
# NOTE(review): micro_batch × grad_accum = 8 × 8 = 64 equals global_batch for a
# single device — confirm how the trainer reconciles these on multi-GPU runs.
batch:
  global_batch: 64
  micro_batch: 8
  grad_accum: 8
# ── DataLoader ────────────────────────────────────────────────────────────────
# Data-loading settings, nested under `dataloader`.
dataloader:
  num_workers: 4
  pin_memory: true
# ── Hardware ──────────────────────────────────────────────────────────────────
# Runtime settings, nested under `hardware`.
hardware:
  # Quoted so the value always loads as a string.
  precision: "bf16"
  compile: false
# ── Eval prompts (run after each checkpoint) ──────────────────────────────────
# Fixed prompt list; the first four are identity questions, the rest are
# general-knowledge and instruction-following probes.
eval_prompts:
  - 'Who are you?'
  - 'What is your name?'
  - 'Who created you?'
  - 'Who is Asterizer?'
  - 'What is the capital of France?'
  - 'Explain photosynthesis in simple terms.'
  - 'Write a short poem about the moon.'
  - 'What is 25 times 4?'
  # Double-quoted because the text itself contains single quotes.
  - "Translate 'hello' to Spanish."
  - 'Summarize the theory of evolution in two sentences.'