| accum_count: 100 |
| accum_steps: 0 |
| adam_beta2: 0.998 |
| attention_dropout: 0.1 |
| batch_size: 1500 |
| batch_type: tokens |
| bucket_size: 49304 |
| data: |
| 27e6308e0faf12cd1b4bed73708fad6f: |
| path_src: dataset/vep-ru/et-synt/source.txt |
| path_tgt: dataset/vep-ru/et-synt/target.txt |
| src_prefix: et_s_Latn |
| tgt_prefix: '' |
| transforms: &id001 |
| - sentencepiece |
| - filtertoolong |
| - prefix |
| weight: 37 |
| 2caaf1b1e5e15d4a06b5b77c438ba0bc: |
| path_src: dataset/vep-ru/fin-original/source.txt |
| path_tgt: dataset/vep-ru/fin-original/target.txt |
| src_prefix: fi_Latn |
| tgt_prefix: '' |
| transforms: *id001 |
| weight: 37 |
| 3def7622ce4622202126c8828c6fae3f: |
| path_src: dataset/vep-ru/fin-synt/source.txt |
| path_tgt: dataset/vep-ru/fin-synt/target.txt |
| src_prefix: fi_s_Latn |
| tgt_prefix: '' |
| transforms: *id001 |
| weight: 37 |
| 517216e92cd45eb876c79dc3bafaad18: |
| path_src: dataset/vep-ru/var/source.txt |
| path_tgt: dataset/vep-ru/var/target.txt |
| src_prefix: '' |
| tgt_prefix: '' |
| transforms: *id001 |
| weight: 167 |
| 815e8e066d03025e82529ef5c5ad232c: |
| path_src: dataset/vep-ru/vep/source.txt |
| path_tgt: dataset/vep-ru/vep/target.txt |
| src_prefix: '' |
| tgt_prefix: '' |
| transforms: *id001 |
| weight: 6 |
| 8e6d221db9fc70bb3fd1104c24c8f25c: |
| path_src: dataset/vep-ru/vep-dic/source.txt |
| path_tgt: dataset/vep-ru/vep-dic/target.txt |
| src_prefix: '' |
| tgt_prefix: '' |
| transforms: *id001 |
| weight: 1 |
| f080464d79eb04a44e9947db1b54c17b: |
| path_src: dataset/vep-ru/et-original/source.txt |
| path_tgt: dataset/vep-ru/et-original/target.txt |
| src_prefix: et_Latn |
| tgt_prefix: '' |
| transforms: *id001 |
| weight: 37 |
| valid: |
| path_src: run/vep_ru-1.0/src-val.txt |
| path_tgt: run/vep_ru-1.0/tgt-val.txt |
| transforms: *id001 |
| dec_layers: 20 |
| decay_method: rsqrt |
| decoder_type: transformer |
| dropout: 0.1 |
| dropout_steps: 0 |
| early_stopping: 0 |
| enc_layers: 20 |
| encoder_type: transformer |
| gpu_ranks: |
| - 0 |
| - 1 |
| heads: 8 |
| hidden_size: 512 |
| keep_checkpoint: 15 |
| label_smoothing: 0.1 |
| learning_rate: 0.005 |
| max_generator_batches: 2 |
| max_grad_norm: 0 |
| max_relative_positions: 20 |
| model_dtype: fp16 |
| normalization: tokens |
| num_workers: 6 |
| optim: pagedadamw8bit |
| param_init: 0 |
| param_init_glorot: true |
| pos_ffn_activation_fn: gated-gelu |
| position_encoding: false |
| queue_size: 10000 |
| reset_optim: none |
| rnn_size: 512 |
| save_checkpoint_steps: 500 |
| save_data: run/vep_ru-1.0/opennmt |
| save_model: run/vep_ru-1.0/opennmt/openmt.model |
| share_decoder_embeddings: true |
| share_embeddings: true |
| share_vocab: true |
| skip_empty_level: silent |
| src_onmttok_kwargs: |
| lang: vep |
| mode: none |
| src_seq_length: 185 |
| src_subword_alpha: 0.0 |
| src_subword_model: run/vep_ru-1.0/sentencepiece.model |
| src_subword_nbest: 1 |
| src_subword_type: sentencepiece |
| src_vocab: run/vep_ru-1.0/opennmt/openmt.vocab |
| src_vocab_size: 32000 |
| tgt_onmttok_kwargs: |
| lang: ru |
| mode: none |
| tgt_seq_length: 185 |
| tgt_subword_alpha: 0.0 |
| tgt_subword_model: run/vep_ru-1.0/sentencepiece.model |
| tgt_subword_nbest: 1 |
| tgt_subword_type: sentencepiece |
| tgt_vocab: run/vep_ru-1.0/opennmt/openmt.vocab |
| tgt_vocab_size: 32000 |
| train_steps: 2000 |
| transformer_ff: 6144 |
| update_vocab: 'False' |
| valid_batch_size: 64 |
| valid_metrics: |
| - BLEU |
| valid_steps: 500 |
| warmup_steps: 500 |
| word_vec_size: 512 |
| world_size: 2 |
|
|