#!/bin/bash
#
# Launch fairseq-train for a translation model on a binarized dataset.
#
# Usage: <this script> <exp_dir> [model_arch]
#   exp_dir     Experiment directory. Training data is read from
#               <exp_dir>/final_bin and checkpoints go to <exp_dir>/model.
#   model_arch  Value passed to --arch (default: transformer_18_18).
#
# NOTE(review): --user-dir is the relative path "model_configs", so this
# presumably must be run from the directory that contains it — confirm.
# NOTE(review): --distributed-world-size is fixed at 8 — presumably an 8-GPU
# node is expected; confirm before running on other hardware.

# Fail on references to unset variables instead of expanding them to "".
set -u

# Without an experiment directory the paths below would collapse to
# "/final_bin" and "/model", so refuse to run.
if [[ $# -lt 1 || -z "$1" ]]; then
  printf 'Usage: %s <exp_dir> [model_arch]\n' "${0##*/}" >&2
  exit 2
fi

exp_dir=$1
model_arch=${2:-transformer_18_18}

# Print a start timestamp to stdout.
date

# All expansions are quoted so paths containing spaces or glob characters
# reach fairseq-train as single arguments.
fairseq-train "${exp_dir}/final_bin" \
  --max-source-positions=256 \
  --max-target-positions=256 \
  --source-lang=SRC \
  --target-lang=TGT \
  --max-update=1000000 \
  --save-interval-updates=2500 \
  --arch="${model_arch}" \
  --activation-fn gelu \
  --criterion=label_smoothed_cross_entropy \
  --label-smoothing=0.1 \
  --optimizer adam \
  --adam-betas "(0.9, 0.98)" \
  --lr-scheduler=inverse_sqrt \
  --clip-norm 1.0 \
  --warmup-init-lr 1e-07 \
  --lr 5e-4 \
  --warmup-updates 4000 \
  --dropout 0.2 \
  --save-dir "${exp_dir}/model" \
  --keep-last-epochs 5 \
  --keep-interval-updates 3 \
  --patience 10 \
  --skip-invalid-size-inputs-valid-test \
  --fp16 \
  --user-dir model_configs \
  --update-freq=32 \
  --distributed-world-size 8 \
  --num-workers 24 \
  --max-tokens 1024 \
  --eval-bleu \
  --eval-bleu-args '{"beam": 1, "lenpen": 1.0, "max_len_a": 1.2, "max_len_b": 10}' \
  --eval-bleu-detok moses \
  --eval-bleu-remove-bpe sentencepiece \
  --eval-bleu-print-samples \
  --best-checkpoint-metric bleu \
  --maximize-best-checkpoint-metric \
  --task translation