| |
| |
|
|
| |
| |
| |
|
|
| |
| model: Conformer |
| model_conf: |
| ctc_weight: 0.3 |
| lsm_weight: 0.1 |
| length_normalized_loss: false |
|
|
| |
| encoder: ConformerEncoder |
| encoder_conf: |
| output_size: 512 |
| attention_heads: 16 |
| linear_units: 1536 |
| num_blocks: 32 |
| dropout_rate: 0.1 |
| positional_dropout_rate: 0.1 |
| attention_dropout_rate: 0.0 |
| input_layer: linear |
| normalize_before: true |
| pos_enc_layer_type: rel_pos |
| selfattention_layer_type: rel_selfattn |
| activation_type: swish |
| macaron_style: true |
| use_cnn_module: true |
| cnn_module_kernel: 5 |
|
|
| |
| decoder: TransformerDecoder |
| decoder_conf: |
| attention_heads: 16 |
| linear_units: 1536 |
| num_blocks: 16 |
| dropout_rate: 0.1 |
| positional_dropout_rate: 0.1 |
| self_attention_dropout_rate: 0.0 |
| src_attention_dropout_rate: 0.0 |
|
|
|
|
| |
| frontend: WavFrontend |
| frontend_conf: |
| fs: 16000 |
| window: hamming |
| n_mels: 80 |
| frame_length: 25 |
| frame_shift: 10 |
| lfr_m: 7 |
| lfr_n: 6 |
|
|
| specaug: SpecAug |
| specaug_conf: |
| apply_time_warp: true |
| time_warp_window: 5 |
| time_warp_mode: bicubic |
| apply_freq_mask: true |
| freq_mask_width_range: |
| - 0 |
| - 30 |
| num_freq_mask: 2 |
| apply_time_mask: true |
| time_mask_width_range: |
| - 0 |
| - 40 |
| num_time_mask: 2 |
|
|
| train_conf: |
| accum_grad: 1 |
| grad_clip: 5 |
| max_epoch: 150 |
| val_scheduler_criterion: |
| - valid |
| - acc |
| best_model_criterion: |
| - - valid |
| - acc |
| - max |
| keep_nbest_models: 10 |
| log_interval: 50 |
|
|
| optim: adam |
| optim_conf: |
| lr: 0.0005 |
| scheduler: warmuplr |
| scheduler_conf: |
| warmup_steps: 30000 |
|
|
| dataset: AudioDataset |
| dataset_conf: |
| index_ds: IndexDSJsonl |
| batch_sampler: DynamicBatchLocalShuffleSampler |
| batch_type: example |
| batch_size: 1 |
| max_token_length: 2048 |
| buffer_size: 500 |
| shuffle: True |
| num_workers: 0 |
|
|
| tokenizer: CharTokenizer |
| tokenizer_conf: |
| unk_symbol: <unk> |
| split_with_space: true |
|
|
|
|
| ctc_conf: |
| dropout_rate: 0.0 |
| ctc_type: builtin |
| reduce: true |
| ignore_nan_grad: true |
| normalize: null |
|
|