# Source: OminiControlRotation/nl_tasks/config/commonsense_opt.yaml
# Uploaded by nvan15 -- "Batch upload part 2" (commit 6bb0065, verified).
# Experiment configuration with four sections: model, rotation adapter,
# dataset, and trainer arguments.
#
# NOTE(review): the nesting below was reconstructed from a copy whose
# indentation had been flattened (every key sat at column 0, which makes each
# section header parse as null). Confirm the layout against the loader's
# schema -- in particular whether `rotation_adapter_config` is a top-level
# section (as written here) or belongs under `model`.

model:
  # Other checkpoints that were tried here:
  #   "openai-community/gpt2", EleutherAI/pythia-160m, Qwen/Qwen2.5-0.5B
  model_name: facebook/opt-125m
  # adapter_path: "./nl_tasks/run_exps/ft2"
  data_collator_mode: 'dynamic'

rotation_adapter_config:
  r: 4
  num_rotations: 2
  # Names of the modules the adapter is applied to.
  target_modules: ["q_proj", "v_proj"]

data:
  dataset_name: 'math'
  # path: "./nl_tasks/data/MetaMathQA-40K" #MetaMathQA-40K.json"
  path: "./data/gsm8k_test.jsonl"
  # Quoted because the value contains `[` and `:`; the string is unchanged.
  dataset_split: 'train[:200]'
  dataset_field: [question, answer]

trainer_args:
  # Written with an explicit decimal point: YAML 1.1 loaders (e.g. PyYAML)
  # resolve a bare `2e-4` as the *string* "2e-4", not as a float.
  learning_rate: 2.0e-4
  # accumulate_grad_batches: 1
  # dataloader_workers: 5
  # save_interval: 1000
  # sample_interval: 100
  # max_steps: -1
  gradient_checkpointing: false  # (Turn off for faster training)
  output_dir: "./run_exps"
  # save_path: "runs"
  max_steps: 40
  # device: 'cuda'