# ─────────────────────────────────────────────────────────────────────────────
# LUNA 100M — SFT Fine-Tuning Configuration
#
# Settings for supervised fine-tuning of the LUNA 100M model, starting from
# the pretrained checkpoint referenced under "Paths".
# ─────────────────────────────────────────────────────────────────────────────
---
# NOTE(review): presumably lets the trainer derive some settings
# automatically — confirm which of the keys below it may override.
auto_config: true

# ── Paths ─────────────────────────────────────────────────────────────────────
hf_model_repo: "ASTERIZER/LUNA-100M"  # HF model repo with pretrained latest.pt
hf_dataset_repo: "ASTERIZER/Luna_Dataset"  # HF dataset repo with SFT data
pretrained_ckpt: "Base/out/pretrain/luna_100m/latest.pt"  # local path (auto-downloaded)
train_json: "Base/Datasets/sft_clean/train.json"
val_json: "Base/Datasets/sft_clean/val.json"
out_dir: "Base/out/sft/luna_100m_sft"
tokenizer_dir: "Base/checkpoints/EleutherAI/pythia-160m"

# ── Model (must match pretrained — do NOT change) ────────────────────────────
model:
  vocab_size: 50304
  seq_len: 1024
  n_layer: 10
  n_embd: 768
  n_head: 12

# ── Training ──────────────────────────────────────────────────────────────────
train:
  epochs: 2
  max_tokens: 0  # 0 = use epochs instead
  lr_warmup_steps: 200
  save_interval: 500
  log_interval: 10
  eval_interval: 500  # run validation + eval prompts every N steps
  max_norm: 1.0

# ── Optimizer (lower LR for fine-tuning) ──────────────────────────────────────
# Keep the decimal point and the signed exponent in these floats (1.5e-5, not
# 15e-6 or 1e-5): some YAML 1.1 loaders read the shorter forms as strings.
optimizer:
  lr: 1.5e-5
  min_lr: 1.0e-6
  weight_decay: 0.01
  betas: [0.9, 0.95]
  eps: 1.0e-8

# ── Batch sizing ──────────────────────────────────────────────────────────────
# NOTE(review): global_batch currently equals micro_batch × grad_accum
# (8 × 8 = 64); presumably the trainer expects that relation to hold — confirm
# before changing any one of the three values on its own.
batch:
  global_batch: 64
  micro_batch: 8
  grad_accum: 8

# ── DataLoader ────────────────────────────────────────────────────────────────
dataloader:
  num_workers: 4
  pin_memory: true

# ── Hardware ──────────────────────────────────────────────────────────────────
hardware:
  precision: "bf16"
  compile: false

# ── Eval prompts (run after each checkpoint) ──────────────────────────────────
eval_prompts:
  - "Who are you?"
  - "What is your name?"
  - "Who created you?"
  - "Who is Asterizer?"
  - "What is the capital of France?"
  - "Explain photosynthesis in simple terms."
  - "Write a short poem about the moon."
  - "What is 25 times 4?"
  - "Translate 'hello' to Spanish."
  - "Summarize the theory of evolution in two sentences."