| config: null |
| print_config: false |
| log_level: INFO |
| drop_last_iter: false |
| dry_run: false |
| iterator_type: sequence |
| valid_iterator_type: null |
| output_dir: exp/lm_te_lm |
| ngpu: 1 |
| seed: 0 |
| num_workers: 1 |
| num_att_plot: 3 |
| dist_backend: nccl |
| dist_init_method: env:// |
| dist_world_size: null |
| dist_rank: null |
| local_rank: 0 |
| dist_master_addr: null |
| dist_master_port: null |
| dist_launcher: null |
| multiprocessing_distributed: false |
| unused_parameters: false |
| sharded_ddp: false |
| cudnn_enabled: true |
| cudnn_benchmark: false |
| cudnn_deterministic: true |
| use_tf32: false |
| collect_stats: false |
| write_collected_feats: false |
| max_epoch: 40 |
| patience: null |
| val_scheduler_criterion: |
| - valid |
| - loss |
| early_stopping_criterion: |
| - valid |
| - loss |
| - min |
| best_model_criterion: |
| - - train |
| - loss |
| - min |
| - - valid |
| - loss |
| - min |
| - - train |
| - acc |
| - max |
| - - valid |
| - acc |
| - max |
| keep_nbest_models: |
| - 10 |
| nbest_averaging_interval: 0 |
| grad_clip: 5.0 |
| grad_clip_type: 2.0 |
| grad_noise: false |
| accum_grad: 1 |
| no_forward_run: false |
| resume: true |
| train_dtype: float32 |
| use_amp: false |
| log_interval: null |
| use_matplotlib: true |
| use_tensorboard: true |
| create_graph_in_tensorboard: false |
| use_wandb: false |
| wandb_project: null |
| wandb_id: null |
| wandb_entity: null |
| wandb_name: null |
| wandb_model_log_interval: -1 |
| detect_anomaly: false |
| use_adapter: false |
| adapter: lora |
| save_strategy: all |
| adapter_conf: {} |
| pretrain_path: null |
| init_param: [] |
| ignore_init_mismatch: false |
| freeze_param: [] |
| num_iters_per_epoch: null |
| batch_size: 20 |
| valid_batch_size: null |
| batch_bins: 1000000 |
| valid_batch_bins: null |
| train_shape_file: |
| - exp/lm_stats_en_char/train/text_shape.char |
| valid_shape_file: |
| - exp/lm_stats_en_char/valid/text_shape.char |
| batch_type: folded |
| valid_batch_type: null |
| fold_length: |
| - 150 |
| sort_in_batch: descending |
| shuffle_within_batch: false |
| sort_batch: descending |
| multiple_iterator: false |
| chunk_length: 500 |
| chunk_shift_ratio: 0.5 |
| num_cache_chunks: 1024 |
| chunk_excluded_key_prefixes: [] |
| chunk_default_fs: null |
| chunk_max_abs_length: null |
| chunk_discard_short_samples: true |
| train_data_path_and_name_and_type: |
| - - dump/raw_copy/lm_train.txt |
| - text |
| - text |
| valid_data_path_and_name_and_type: |
| - - dump/raw_copy/org/valid/text |
| - text |
| - text |
| multi_task_dataset: false |
| allow_variable_data_keys: false |
| max_cache_size: 0.0 |
| max_cache_fd: 32 |
| allow_multi_rates: false |
| valid_max_cache_size: null |
| exclude_weight_decay: false |
| exclude_weight_decay_conf: {} |
| optim: adadelta |
| optim_conf: {} |
| scheduler: null |
| scheduler_conf: {} |
| token_list: |
| - <blank> |
| - <unk> |
| - <space> |
| - ్ |
| - ి |
| - ా |
| - ు |
| - ర |
| - న |
| - ం |
| - ల |
| - క |
| - త |
| - ప |
| - వ |
| - స |
| - య |
| - ద |
| - మ |
| - చ |
| - ట |
| - గ |
| - ే |
| - ో |
| - డ |
| - ీ |
| - ె |
| - అ |
| - బ |
| - ధ |
| - జ |
| - ూ |
| - ొ |
| - ఉ |
| - ై |
| - ష |
| - ణ |
| - శ |
| - భ |
| - ఆ |
| - హ |
| - ఇ |
| - థ |
| - ఎ |
| - ఫ |
| - ఈ |
| - ఒ |
| - ళ |
| - ఖ |
| - ృ |
| - ఏ |
| - ౌ |
| - ౖ |
| - ఘ |
| - ఐ |
| - ఛ |
| - ఓ |
| - ఠ |
| - ఞ |
| - ఊ |
| - ఔ |
| - ఢ |
| - ఋ |
| - ః |
| - <sos/eos> |
| init: null |
| use_preprocessor: true |
| token_type: char |
| bpemodel: null |
| non_linguistic_symbols: null |
| cleaner: null |
| g2p: null |
| lm: seq_rnn |
| lm_conf: {} |
| model: lm |
| model_conf: {} |
| required: |
| - output_dir |
| - token_list |
| version: '202402' |
| distributed: false |
|
|