diff --git "a/exp/asr_train_asr_raw_en_word/train.log" "b/exp/asr_train_asr_raw_en_word/train.log" deleted file mode 100644--- "a/exp/asr_train_asr_raw_en_word/train.log" +++ /dev/null @@ -1,4784 +0,0 @@ -# Running on v016.ib.bridges2.psc.edu -# Started at Mon Jan 31 04:07:00 EST 2022 -# SLURMD_NODENAME=v016 -# SLURM_CLUSTER_NAME=bridges2 -# SLURM_CONF=/var/spool/slurm/d/conf-cache/slurm.conf -# SLURM_CPUS_ON_NODE=5 -# SLURM_CPUS_PER_TASK=1 -# SLURM_EXPORT_ENV=PATH -# SLURM_GET_USER_ENV=1 -# SLURM_GTIDS=0 -# SLURM_JOBID=6473876 -# SLURM_JOB_ACCOUNT=cis210027p -# SLURM_JOB_CPUS_PER_NODE=5 -# SLURM_JOB_GID=24886 -# SLURM_JOB_GPUS=2 -# SLURM_JOB_ID=6473876 -# SLURM_JOB_NAME=exp/asr_train_asr_raw_en_word/train.log -# SLURM_JOB_NODELIST=v016 -# SLURM_JOB_NUM_NODES=1 -# SLURM_JOB_PARTITION=GPU-shared -# SLURM_JOB_QOS=gpu -# SLURM_JOB_UID=82326 -# SLURM_JOB_USER=ganesank -# SLURM_LOCALID=0 -# SLURM_NNODES=1 -# SLURM_NODEID=0 -# SLURM_NODELIST=v016 -# SLURM_NODE_ALIASES='(null)' -# SLURM_OPEN_MODE=a -# SLURM_PRIO_PROCESS=0 -# SLURM_PROCID=0 -# SLURM_SUBMIT_DIR=/ocean/projects/cis210027p/ganesank/karthik_new/espnet/egs2/dstc2/asr2 -# SLURM_SUBMIT_HOST=br014.ib.bridges2.psc.edu -# SLURM_TASKS_PER_NODE=5 -# SLURM_TASK_PID=41468 -# SLURM_TOPOLOGY_ADDR=v016 -# SLURM_TOPOLOGY_ADDR_PATTERN=node -# SLURM_WORKING_CLUSTER=bridges2:br003:6814:9216:109 -# python3 -m espnet2.bin.asr_train --use_preprocessor true --bpemodel none --token_type word --token_list data/en_token_list/word/tokens.txt --non_linguistic_symbols none --cleaner none --g2p none --valid_data_path_and_name_and_type dump/raw/valid/wav.scp,speech,sound --valid_data_path_and_name_and_type dump/raw/valid/text,text,text --valid_shape_file exp/asr_stats_raw_en_word/valid/speech_shape --valid_shape_file exp/asr_stats_raw_en_word/valid/text_shape.word --resume true --fold_length 80000 --fold_length 150 --output_dir exp/asr_train_asr_raw_en_word --config conf/train_asr.yaml --frontend_conf fs=16k --normalize=global_mvn --normalize_conf stats_file=exp/asr_stats_raw_en_word/train/feats_stats.npz --train_data_path_and_name_and_type dump/raw/train/wav.scp,speech,sound --train_data_path_and_name_and_type dump/raw/train/text,text,text --train_shape_file exp/asr_stats_raw_en_word/train/speech_shape --train_shape_file exp/asr_stats_raw_en_word/train/text_shape.word --ngpu 1 --multiprocessing_distributed True -/ocean/projects/cis210027p/ganesank/karthik_new/espnet/tools/venv/bin/python3 /ocean/projects/cis210027p/ganesank/karthik_new/espnet/espnet2/bin/asr_train.py --use_preprocessor true --bpemodel none --token_type word --token_list data/en_token_list/word/tokens.txt --non_linguistic_symbols none --cleaner none --g2p none --valid_data_path_and_name_and_type dump/raw/valid/wav.scp,speech,sound --valid_data_path_and_name_and_type dump/raw/valid/text,text,text --valid_shape_file exp/asr_stats_raw_en_word/valid/speech_shape --valid_shape_file exp/asr_stats_raw_en_word/valid/text_shape.word --resume true --fold_length 80000 --fold_length 150 --output_dir exp/asr_train_asr_raw_en_word --config conf/train_asr.yaml --frontend_conf fs=16k --normalize=global_mvn --normalize_conf stats_file=exp/asr_stats_raw_en_word/train/feats_stats.npz --train_data_path_and_name_and_type dump/raw/train/wav.scp,speech,sound --train_data_path_and_name_and_type dump/raw/train/text,text,text --train_shape_file exp/asr_stats_raw_en_word/train/speech_shape --train_shape_file exp/asr_stats_raw_en_word/train/text_shape.word --ngpu 1 --multiprocessing_distributed True -[v016] 2022-01-31 04:07:56,959 (asr:382) INFO: Vocabulary size: 613 -[v016] 2022-01-31 04:08:08,479 (abs_task:1132) INFO: pytorch.version=1.8.1+cu102, cuda.available=True, cudnn.version=7605, cudnn.benchmark=False, cudnn.deterministic=True -[v016] 2022-01-31 04:08:08,484 (abs_task:1133) INFO: Model structure: -ESPnetASRModel( - (frontend): DefaultFrontend( - (stft): Stft(n_fft=512, win_length=512, hop_length=128, center=True, normalized=False, onesided=True) - (frontend): Frontend() - (logmel): LogMel(sr=16000, n_fft=512, n_mels=80, fmin=0, fmax=8000.0, htk=False) - ) - (specaug): SpecAug( - (time_warp): TimeWarp(window=5, mode=bicubic) - (freq_mask): MaskAlongAxis(mask_width_range=[0, 30], num_mask=2, axis=freq) - (time_mask): MaskAlongAxis(mask_width_range=[0, 40], num_mask=2, axis=time) - ) - (normalize): GlobalMVN(stats_file=exp/asr_stats_raw_en_word/train/feats_stats.npz, norm_means=True, norm_vars=True) - (encoder): TransformerEncoder( - (embed): Conv2dSubsampling( - (conv): Sequential( - (0): Conv2d(1, 256, kernel_size=(3, 3), stride=(2, 2)) - (1): ReLU() - (2): Conv2d(256, 256, kernel_size=(3, 3), stride=(2, 2)) - (3): ReLU() - ) - (out): Sequential( - (0): Linear(in_features=4864, out_features=256, bias=True) - (1): PositionalEncoding( - (dropout): Dropout(p=0.1, inplace=False) - ) - ) - ) - (encoders): MultiSequential( - (0): EncoderLayer( - (self_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (feed_forward): PositionwiseFeedForward( - (w_1): Linear(in_features=256, out_features=2048, bias=True) - (w_2): Linear(in_features=2048, out_features=256, bias=True) - (dropout): Dropout(p=0.1, inplace=False) - (activation): ReLU() - ) - (norm1): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm2): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (dropout): Dropout(p=0.1, inplace=False) - ) - (1): EncoderLayer( - (self_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (feed_forward): PositionwiseFeedForward( - (w_1): Linear(in_features=256, out_features=2048, bias=True) - (w_2): Linear(in_features=2048, out_features=256, bias=True) - (dropout): Dropout(p=0.1, inplace=False) - (activation): ReLU() - ) - (norm1): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm2): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (dropout): Dropout(p=0.1, inplace=False) - ) - (2): EncoderLayer( - (self_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (feed_forward): PositionwiseFeedForward( - (w_1): Linear(in_features=256, out_features=2048, bias=True) - (w_2): Linear(in_features=2048, out_features=256, bias=True) - (dropout): Dropout(p=0.1, inplace=False) - (activation): ReLU() - ) - (norm1): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm2): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (dropout): Dropout(p=0.1, inplace=False) - ) - (3): EncoderLayer( - (self_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (feed_forward): PositionwiseFeedForward( - (w_1): Linear(in_features=256, out_features=2048, bias=True) - (w_2): Linear(in_features=2048, out_features=256, bias=True) - (dropout): Dropout(p=0.1, inplace=False) - (activation): ReLU() - ) - (norm1): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm2): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (dropout): Dropout(p=0.1, inplace=False) - ) - (4): EncoderLayer( - (self_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (feed_forward): PositionwiseFeedForward( - (w_1): Linear(in_features=256, out_features=2048, bias=True) - (w_2): Linear(in_features=2048, out_features=256, bias=True) - (dropout): Dropout(p=0.1, inplace=False) - (activation): ReLU() - ) - (norm1): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm2): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (dropout): Dropout(p=0.1, inplace=False) - ) - (5): EncoderLayer( - (self_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (feed_forward): PositionwiseFeedForward( - (w_1): Linear(in_features=256, out_features=2048, bias=True) - (w_2): Linear(in_features=2048, out_features=256, bias=True) - (dropout): Dropout(p=0.1, inplace=False) - (activation): ReLU() - ) - (norm1): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm2): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (dropout): Dropout(p=0.1, inplace=False) - ) - (6): EncoderLayer( - (self_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (feed_forward): PositionwiseFeedForward( - (w_1): Linear(in_features=256, out_features=2048, bias=True) - (w_2): Linear(in_features=2048, out_features=256, bias=True) - (dropout): Dropout(p=0.1, inplace=False) - (activation): ReLU() - ) - (norm1): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm2): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (dropout): Dropout(p=0.1, inplace=False) - ) - (7): EncoderLayer( - (self_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (feed_forward): PositionwiseFeedForward( - (w_1): Linear(in_features=256, out_features=2048, bias=True) - (w_2): Linear(in_features=2048, out_features=256, bias=True) - (dropout): Dropout(p=0.1, inplace=False) - (activation): ReLU() - ) - (norm1): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm2): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (dropout): Dropout(p=0.1, inplace=False) - ) - (8): EncoderLayer( - (self_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (feed_forward): PositionwiseFeedForward( - (w_1): Linear(in_features=256, out_features=2048, bias=True) - (w_2): Linear(in_features=2048, out_features=256, bias=True) - (dropout): Dropout(p=0.1, inplace=False) - (activation): ReLU() - ) - (norm1): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm2): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (dropout): Dropout(p=0.1, inplace=False) - ) - (9): EncoderLayer( - (self_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (feed_forward): PositionwiseFeedForward( - (w_1): Linear(in_features=256, out_features=2048, bias=True) - (w_2): Linear(in_features=2048, out_features=256, bias=True) - (dropout): Dropout(p=0.1, inplace=False) - (activation): ReLU() - ) - (norm1): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm2): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (dropout): Dropout(p=0.1, inplace=False) - ) - (10): EncoderLayer( - (self_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (feed_forward): PositionwiseFeedForward( - (w_1): Linear(in_features=256, out_features=2048, bias=True) - (w_2): Linear(in_features=2048, out_features=256, bias=True) - (dropout): Dropout(p=0.1, inplace=False) - (activation): ReLU() - ) - (norm1): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm2): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (dropout): Dropout(p=0.1, inplace=False) - ) - (11): EncoderLayer( - (self_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (feed_forward): PositionwiseFeedForward( - (w_1): Linear(in_features=256, out_features=2048, bias=True) - (w_2): Linear(in_features=2048, out_features=256, bias=True) - (dropout): Dropout(p=0.1, inplace=False) - (activation): ReLU() - ) - (norm1): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm2): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (dropout): Dropout(p=0.1, inplace=False) - ) - ) - (after_norm): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - ) - (decoder): TransformerDecoder( - (embed): Sequential( - (0): Embedding(613, 256) - (1): PositionalEncoding( - (dropout): Dropout(p=0.1, inplace=False) - ) - ) - (after_norm): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (output_layer): Linear(in_features=256, out_features=613, bias=True) - (decoders): MultiSequential( - (0): DecoderLayer( - (self_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (src_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (feed_forward): PositionwiseFeedForward( - (w_1): Linear(in_features=256, out_features=2048, bias=True) - (w_2): Linear(in_features=2048, out_features=256, bias=True) - (dropout): Dropout(p=0.1, inplace=False) - (activation): ReLU() - ) - (norm1): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm2): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm3): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (dropout): Dropout(p=0.1, inplace=False) - ) - (1): DecoderLayer( - (self_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (src_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (feed_forward): PositionwiseFeedForward( - (w_1): Linear(in_features=256, out_features=2048, bias=True) - (w_2): Linear(in_features=2048, out_features=256, bias=True) - (dropout): Dropout(p=0.1, inplace=False) - (activation): ReLU() - ) - (norm1): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm2): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm3): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (dropout): Dropout(p=0.1, inplace=False) - ) - (2): DecoderLayer( - (self_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (src_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (feed_forward): PositionwiseFeedForward( - (w_1): Linear(in_features=256, out_features=2048, bias=True) - (w_2): Linear(in_features=2048, out_features=256, bias=True) - (dropout): Dropout(p=0.1, inplace=False) - (activation): ReLU() - ) - (norm1): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm2): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm3): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (dropout): Dropout(p=0.1, inplace=False) - ) - (3): DecoderLayer( - (self_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (src_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (feed_forward): PositionwiseFeedForward( - (w_1): Linear(in_features=256, out_features=2048, bias=True) - (w_2): Linear(in_features=2048, out_features=256, bias=True) - (dropout): Dropout(p=0.1, inplace=False) - (activation): ReLU() - ) - (norm1): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm2): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm3): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (dropout): Dropout(p=0.1, inplace=False) - ) - (4): DecoderLayer( - (self_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (src_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (feed_forward): PositionwiseFeedForward( - (w_1): Linear(in_features=256, out_features=2048, bias=True) - (w_2): Linear(in_features=2048, out_features=256, bias=True) - (dropout): Dropout(p=0.1, inplace=False) - (activation): ReLU() - ) - (norm1): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm2): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm3): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (dropout): Dropout(p=0.1, inplace=False) - ) - (5): DecoderLayer( - (self_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (src_attn): MultiHeadedAttention( - (linear_q): Linear(in_features=256, out_features=256, bias=True) - (linear_k): Linear(in_features=256, out_features=256, bias=True) - (linear_v): Linear(in_features=256, out_features=256, bias=True) - (linear_out): Linear(in_features=256, out_features=256, bias=True) - (dropout): Dropout(p=0.0, inplace=False) - ) - (feed_forward): PositionwiseFeedForward( - (w_1): Linear(in_features=256, out_features=2048, bias=True) - (w_2): Linear(in_features=2048, out_features=256, bias=True) - (dropout): Dropout(p=0.1, inplace=False) - (activation): ReLU() - ) - (norm1): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm2): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (norm3): LayerNorm((256,), eps=1e-12, elementwise_affine=True) - (dropout): Dropout(p=0.1, inplace=False) - ) - ) - ) - (ctc): CTC( - (ctc_lo): Linear(in_features=256, out_features=613, bias=True) - (ctc_loss): CTCLoss() - ) - (criterion_att): LabelSmoothingLoss( - (criterion): KLDivLoss() - ) -) - -Model summary: - Class Name: ESPnetASRModel - Total Number of model parameters: 27.56 M - Number of trainable parameters: 27.56 M (100.0%) - Size: 110.26 MB - Type: torch.float32 -[v016] 2022-01-31 04:08:08,485 (abs_task:1136) INFO: Optimizer: -Adam ( -Parameter Group 0 - amsgrad: False - betas: (0.9, 0.999) - eps: 1e-08 - initial_lr: 0.0002 - lr: 8e-09 - weight_decay: 0 -) -[v016] 2022-01-31 04:08:08,485 (abs_task:1137) INFO: Scheduler: WarmupLR(warmup_steps=25000) -[v016] 2022-01-31 04:08:08,487 (abs_task:1146) INFO: Saving the configuration in exp/asr_train_asr_raw_en_word/config.yaml -[v016] 2022-01-31 04:08:09,035 (abs_task:1493) INFO: [train] dataset: -ESPnetDataset( - speech: {"path": "dump/raw/train/wav.scp", "type": "sound"} - text: {"path": "dump/raw/train/text", "type": "text"} - preprocess: ) -[v016] 2022-01-31 04:08:09,035 (abs_task:1494) INFO: [train] Batch sampler: FoldedBatchSampler(N-batch=547, batch_size=20, shape_files=['exp/asr_stats_raw_en_word/train/speech_shape', 'exp/asr_stats_raw_en_word/train/text_shape.word'], sort_in_batch=descending, sort_batch=descending) -[v016] 2022-01-31 04:08:09,035 (abs_task:1495) INFO: [train] mini-batch sizes summary: N-batch=547, mean=19.9, min=6, max=20 -[v016] 2022-01-31 04:08:09,306 (abs_task:1493) INFO: [valid] dataset: -ESPnetDataset( - speech: {"path": "dump/raw/valid/wav.scp", "type": "sound"} - text: {"path": "dump/raw/valid/text", "type": "text"} - preprocess: ) -[v016] 2022-01-31 04:08:09,306 (abs_task:1494) INFO: [valid] Batch sampler: FoldedBatchSampler(N-batch=178, batch_size=20, shape_files=['exp/asr_stats_raw_en_word/valid/speech_shape', 'exp/asr_stats_raw_en_word/valid/text_shape.word'], sort_in_batch=descending, sort_batch=descending) -[v016] 2022-01-31 04:08:09,306 (abs_task:1495) INFO: [valid] mini-batch sizes summary: N-batch=178, mean=20.0, min=19, max=20 -[v016] 2022-01-31 04:08:09,335 (abs_task:1493) INFO: [plot_att] dataset: -ESPnetDataset( - speech: {"path": "dump/raw/valid/wav.scp", "type": "sound"} - text: {"path": "dump/raw/valid/text", "type": "text"} - preprocess: ) -[v016] 2022-01-31 04:08:09,335 (abs_task:1494) INFO: [plot_att] Batch sampler: UnsortedBatchSampler(N-batch=3559, batch_size=1, key_file=exp/asr_stats_raw_en_word/valid/speech_shape, -[v016] 2022-01-31 04:08:09,336 (abs_task:1495) INFO: [plot_att] mini-batch sizes summary: N-batch=3, mean=1.0, min=1, max=1 -[v016] 2022-01-31 04:08:12,793 (trainer:155) INFO: The training was resumed using exp/asr_train_asr_raw_en_word/checkpoint.pth -[v016] 2022-01-31 04:08:12,799 (trainer:273) INFO: 21/200epoch started -[v016] 2022-01-31 04:08:23,539 (trainer:653) INFO: 21epoch:train:1-27batch: iter_time=0.257, forward_time=0.053, loss=10.500, loss_att=6.421, loss_ctc=14.579, acc=0.818, backward_time=0.025, optim_step_time=0.023, optim0_lr0=8.764e-05, train_time=0.394 -[v016] 2022-01-31 04:08:32,120 (trainer:653) INFO: 21epoch:train:28-54batch: iter_time=0.217, forward_time=0.035, loss=8.680, loss_att=5.426, loss_ctc=11.934, acc=0.819, backward_time=0.024, optim_step_time=0.023, optim0_lr0=8.786e-05, train_time=0.318 -[v016] 2022-01-31 04:08:39,796 (trainer:653) INFO: 21epoch:train:55-81batch: iter_time=0.183, forward_time=0.035, loss=8.597, loss_att=5.359, loss_ctc=11.836, acc=0.828, backward_time=0.024, optim_step_time=0.023, optim0_lr0=8.807e-05, train_time=0.284 -[v016] 2022-01-31 04:08:46,904 (trainer:653) INFO: 21epoch:train:82-108batch: iter_time=0.158, forward_time=0.036, loss=10.495, loss_att=6.585, loss_ctc=14.405, acc=0.813, backward_time=0.024, optim_step_time=0.023, optim0_lr0=8.829e-05, train_time=0.263 -[v016] 2022-01-31 04:08:54,760 (trainer:653) INFO: 21epoch:train:109-135batch: iter_time=0.181, forward_time=0.036, loss=10.404, loss_att=6.396, loss_ctc=14.413, acc=0.813, backward_time=0.025, optim_step_time=0.023, optim0_lr0=8.850e-05, train_time=0.291 -[v016] 2022-01-31 04:09:01,997 (trainer:653) INFO: 21epoch:train:136-162batch: iter_time=0.168, forward_time=0.034, loss=7.216, loss_att=4.410, loss_ctc=10.021, acc=0.834, backward_time=0.024, optim_step_time=0.023, optim0_lr0=8.872e-05, train_time=0.268 -[v016] 2022-01-31 04:09:09,618 (trainer:653) INFO: 21epoch:train:163-189batch: iter_time=0.179, forward_time=0.035, loss=11.257, loss_att=7.039, loss_ctc=15.476, acc=0.797, backward_time=0.024, optim_step_time=0.023, optim0_lr0=8.894e-05, train_time=0.282 -[v016] 2022-01-31 04:09:15,380 (trainer:653) INFO: 21epoch:train:190-216batch: iter_time=0.110, forward_time=0.035, loss=8.634, loss_att=5.353, loss_ctc=11.914, acc=0.824, backward_time=0.024, optim_step_time=0.024, optim0_lr0=8.915e-05, train_time=0.212 -[v016] 2022-01-31 04:09:22,832 (trainer:653) INFO: 21epoch:train:217-243batch: iter_time=0.172, forward_time=0.035, loss=10.672, loss_att=6.522, loss_ctc=14.822, acc=0.818, backward_time=0.024, optim_step_time=0.023, optim0_lr0=8.937e-05, train_time=0.276 -[v016] 2022-01-31 04:09:29,054 (trainer:653) INFO: 21epoch:train:244-270batch: iter_time=0.129, forward_time=0.035, loss=10.486, loss_att=6.485, loss_ctc=14.487, acc=0.808, backward_time=0.024, optim_step_time=0.023, optim0_lr0=8.958e-05, train_time=0.230 -[v016] 2022-01-31 04:09:36,174 (trainer:653) INFO: 21epoch:train:271-297batch: iter_time=0.163, forward_time=0.035, loss=8.688, loss_att=5.537, loss_ctc=11.839, acc=0.825, backward_time=0.024, optim_step_time=0.023, optim0_lr0=8.980e-05, train_time=0.263 -[v016] 2022-01-31 04:09:42,787 (trainer:653) INFO: 21epoch:train:298-324batch: iter_time=0.138, forward_time=0.037, loss=11.554, loss_att=7.144, loss_ctc=15.964, acc=0.804, backward_time=0.025, optim_step_time=0.023, optim0_lr0=9.002e-05, train_time=0.245 -[v016] 2022-01-31 04:09:48,867 (trainer:653) INFO: 21epoch:train:325-351batch: iter_time=0.121, forward_time=0.036, loss=10.649, loss_att=6.650, loss_ctc=14.647, acc=0.798, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.023e-05, train_time=0.225 -[v016] 2022-01-31 04:09:54,827 (trainer:653) INFO: 21epoch:train:352-378batch: iter_time=0.121, forward_time=0.034, loss=7.120, loss_att=4.378, loss_ctc=9.862, acc=0.840, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.045e-05, train_time=0.220 -[v016] 2022-01-31 04:10:00,264 (trainer:653) INFO: 21epoch:train:379-405batch: iter_time=0.098, forward_time=0.035, loss=7.360, loss_att=4.603, loss_ctc=10.116, acc=0.837, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.066e-05, train_time=0.201 -[v016] 2022-01-31 04:10:07,350 (trainer:653) INFO: 21epoch:train:406-432batch: iter_time=0.160, forward_time=0.035, loss=9.018, loss_att=5.718, loss_ctc=12.317, acc=0.824, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.088e-05, train_time=0.262 -[v016] 2022-01-31 04:10:15,671 (trainer:653) INFO: 21epoch:train:433-459batch: iter_time=0.133, forward_time=0.097, loss=9.741, loss_att=6.145, loss_ctc=13.337, acc=0.816, backward_time=0.029, optim_step_time=0.025, optim0_lr0=9.110e-05, train_time=0.308 -[v016] 2022-01-31 04:10:22,688 (trainer:653) INFO: 21epoch:train:460-486batch: iter_time=0.155, forward_time=0.037, loss=11.695, loss_att=7.140, loss_ctc=16.250, acc=0.799, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.131e-05, train_time=0.260 -[v016] 2022-01-31 04:10:29,143 (trainer:653) INFO: 21epoch:train:487-513batch: iter_time=0.134, forward_time=0.035, loss=8.702, loss_att=5.420, loss_ctc=11.984, acc=0.816, backward_time=0.024, optim_step_time=0.026, optim0_lr0=9.153e-05, train_time=0.239 -[v016] 2022-01-31 04:10:35,020 (trainer:653) INFO: 21epoch:train:514-540batch: iter_time=0.115, forward_time=0.035, loss=8.034, loss_att=4.932, loss_ctc=11.137, acc=0.833, backward_time=0.025, optim_step_time=0.023, optim0_lr0=9.174e-05, train_time=0.217 -[v016] 2022-01-31 04:11:48,229 (trainer:328) INFO: 21epoch results: [train] iter_time=0.154, forward_time=0.039, loss=9.494, loss_att=5.897, loss_ctc=13.091, acc=0.818, backward_time=0.025, optim_step_time=0.023, optim0_lr0=8.972e-05, train_time=0.262, time=2 minutes and 23.59 seconds, total_count=11487, gpu_max_cached_mem_GB=5.195, [valid] loss=9.787, loss_att=6.687, loss_ctc=12.887, acc=0.823, cer=0.220, wer=0.663, cer_ctc=0.340, time=34.94 seconds, total_count=3738, gpu_max_cached_mem_GB=5.820, [att_plot] time=36.85 seconds, total_count=0, gpu_max_cached_mem_GB=5.820 -[v016] 2022-01-31 04:11:50,739 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc, valid.acc -[v016] 2022-01-31 04:11:50,742 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/16epoch.pth -[v016] 2022-01-31 04:11:50,742 (trainer:261) INFO: 22/200epoch started. Estimated time to finish: 10 hours, 50 minutes and 11.71 seconds -[v016] 2022-01-31 04:11:59,229 (trainer:653) INFO: 22epoch:train:1-27batch: iter_time=0.153, forward_time=0.049, loss=10.752, loss_att=6.474, loss_ctc=15.030, acc=0.806, backward_time=0.037, optim_step_time=0.024, optim0_lr0=9.202e-05, train_time=0.287 -[v016] 2022-01-31 04:12:02,989 (trainer:653) INFO: 22epoch:train:28-54batch: iter_time=0.039, forward_time=0.034, loss=6.860, loss_att=4.297, loss_ctc=9.424, acc=0.831, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.223e-05, train_time=0.139 -[v016] 2022-01-31 04:12:06,480 (trainer:653) INFO: 22epoch:train:55-81batch: iter_time=0.028, forward_time=0.034, loss=7.252, loss_att=4.563, loss_ctc=9.941, acc=0.823, backward_time=0.024, optim_step_time=0.024, optim0_lr0=9.245e-05, train_time=0.129 -[v016] 2022-01-31 04:12:10,861 (trainer:653) INFO: 22epoch:train:82-108batch: iter_time=0.059, forward_time=0.036, loss=10.101, loss_att=6.210, loss_ctc=13.992, acc=0.810, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.266e-05, train_time=0.162 -[v016] 2022-01-31 04:12:14,535 (trainer:653) INFO: 22epoch:train:109-135batch: iter_time=0.033, forward_time=0.035, loss=8.321, loss_att=5.192, loss_ctc=11.450, acc=0.829, backward_time=0.024, optim_step_time=0.024, optim0_lr0=9.288e-05, train_time=0.136 -[v016] 2022-01-31 04:12:18,571 (trainer:653) INFO: 22epoch:train:136-162batch: iter_time=0.047, forward_time=0.035, loss=10.449, loss_att=6.602, loss_ctc=14.295, acc=0.819, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.310e-05, train_time=0.149 -[v016] 2022-01-31 04:12:21,418 (trainer:653) INFO: 22epoch:train:163-189batch: iter_time=0.004, forward_time=0.034, loss=8.121, loss_att=5.081, loss_ctc=11.162, acc=0.826, backward_time=0.024, optim_step_time=0.024, optim0_lr0=9.331e-05, train_time=0.105 -[v016] 2022-01-31 04:12:26,788 (trainer:653) INFO: 22epoch:train:190-216batch: iter_time=0.017, forward_time=0.076, loss=10.028, loss_att=6.308, loss_ctc=13.748, acc=0.820, backward_time=0.032, optim_step_time=0.046, optim0_lr0=9.353e-05, train_time=0.199 -[v016] 2022-01-31 04:12:31,078 (trainer:653) INFO: 22epoch:train:217-243batch: iter_time=0.051, forward_time=0.036, loss=8.611, loss_att=5.442, loss_ctc=11.780, acc=0.837, backward_time=0.026, optim_step_time=0.024, optim0_lr0=9.374e-05, train_time=0.159 -[v016] 2022-01-31 04:12:35,076 (trainer:653) INFO: 22epoch:train:244-270batch: iter_time=0.040, forward_time=0.036, loss=9.265, loss_att=5.738, loss_ctc=12.791, acc=0.826, backward_time=0.025, optim_step_time=0.024, optim0_lr0=9.396e-05, train_time=0.148 -[v016] 2022-01-31 04:12:40,863 (trainer:653) INFO: 22epoch:train:271-297batch: iter_time=0.023, forward_time=0.099, loss=9.521, loss_att=6.017, loss_ctc=13.025, acc=0.814, backward_time=0.025, optim_step_time=0.045, optim0_lr0=9.418e-05, train_time=0.214 -[v016] 2022-01-31 04:12:45,015 (trainer:653) INFO: 22epoch:train:298-324batch: iter_time=0.016, forward_time=0.051, loss=10.448, loss_att=6.491, loss_ctc=14.404, acc=0.807, backward_time=0.032, optim_step_time=0.029, optim0_lr0=9.439e-05, train_time=0.152 -[v016] 2022-01-31 04:12:48,374 (trainer:653) INFO: 22epoch:train:325-351batch: iter_time=0.019, forward_time=0.036, loss=9.354, loss_att=5.835, loss_ctc=12.874, acc=0.807, backward_time=0.025, optim_step_time=0.024, optim0_lr0=9.461e-05, train_time=0.124 -[v016] 2022-01-31 04:12:51,780 (trainer:653) INFO: 22epoch:train:352-378batch: iter_time=0.021, forward_time=0.035, loss=9.028, loss_att=5.569, loss_ctc=12.486, acc=0.829, backward_time=0.025, optim_step_time=0.024, optim0_lr0=9.482e-05, train_time=0.126 -[v016] 2022-01-31 04:12:56,689 (trainer:653) INFO: 22epoch:train:379-405batch: iter_time=0.068, forward_time=0.039, loss=8.644, loss_att=5.332, loss_ctc=11.956, acc=0.838, backward_time=0.026, optim_step_time=0.025, optim0_lr0=9.504e-05, train_time=0.181 -[v016] 2022-01-31 04:13:02,828 (trainer:653) INFO: 22epoch:train:406-432batch: iter_time=0.125, forward_time=0.035, loss=10.646, loss_att=6.361, loss_ctc=14.931, acc=0.822, backward_time=0.023, optim_step_time=0.022, optim0_lr0=9.526e-05, train_time=0.227 -[v016] 2022-01-31 04:13:07,494 (trainer:653) INFO: 22epoch:train:433-459batch: iter_time=0.075, forward_time=0.033, loss=9.362, loss_att=5.629, loss_ctc=13.094, acc=0.832, backward_time=0.023, optim_step_time=0.022, optim0_lr0=9.547e-05, train_time=0.173 -[v016] 2022-01-31 04:13:13,080 (trainer:653) INFO: 22epoch:train:460-486batch: iter_time=0.104, forward_time=0.035, loss=9.227, loss_att=5.837, loss_ctc=12.616, acc=0.813, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.569e-05, train_time=0.207 -[v016] 2022-01-31 04:13:18,378 (trainer:653) INFO: 22epoch:train:487-513batch: iter_time=0.091, forward_time=0.036, loss=8.507, loss_att=5.196, loss_ctc=11.818, acc=0.833, backward_time=0.025, optim_step_time=0.024, optim0_lr0=9.590e-05, train_time=0.196 -[v016] 2022-01-31 04:13:25,203 (trainer:653) INFO: 22epoch:train:514-540batch: iter_time=0.146, forward_time=0.036, loss=9.622, loss_att=6.014, loss_ctc=13.231, acc=0.828, backward_time=0.025, optim_step_time=0.024, optim0_lr0=9.612e-05, train_time=0.252 -[v016] 2022-01-31 04:14:22,203 (trainer:328) INFO: 22epoch results: [train] iter_time=0.059, forward_time=0.042, loss=9.165, loss_att=5.683, loss_ctc=12.647, acc=0.823, backward_time=0.026, optim_step_time=0.026, optim0_lr0=9.410e-05, train_time=0.174, time=1 minute and 35.76 seconds, total_count=12034, gpu_max_cached_mem_GB=5.820, [valid] loss=9.840, loss_att=6.559, loss_ctc=13.121, acc=0.828, cer=0.221, wer=0.654, cer_ctc=0.349, time=18.26 seconds, total_count=3916, gpu_max_cached_mem_GB=5.820, [att_plot] time=37.13 seconds, total_count=0, gpu_max_cached_mem_GB=5.820 -[v016] 2022-01-31 04:14:24,941 (trainer:375) INFO: The best model has been updated: train.loss, train.acc, valid.acc -[v016] 2022-01-31 04:14:24,944 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/17epoch.pth -[v016] 2022-01-31 04:14:24,944 (trainer:261) INFO: 23/200epoch started. Estimated time to finish: 9 hours, 12 minutes and 0.88 seconds -[v016] 2022-01-31 04:14:31,317 (trainer:653) INFO: 23epoch:train:1-27batch: iter_time=0.087, forward_time=0.052, loss=10.071, loss_att=6.069, loss_ctc=14.073, acc=0.826, backward_time=0.040, optim_step_time=0.023, optim0_lr0=9.639e-05, train_time=0.226 -[v016] 2022-01-31 04:14:35,374 (trainer:653) INFO: 23epoch:train:28-54batch: iter_time=0.049, forward_time=0.034, loss=8.022, loss_att=4.818, loss_ctc=11.227, acc=0.841, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.661e-05, train_time=0.150 -[v016] 2022-01-31 04:14:39,199 (trainer:653) INFO: 23epoch:train:55-81batch: iter_time=0.041, forward_time=0.034, loss=7.378, loss_att=4.598, loss_ctc=10.157, acc=0.838, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.682e-05, train_time=0.141 -[v016] 2022-01-31 04:14:42,484 (trainer:653) INFO: 23epoch:train:82-108batch: iter_time=0.020, forward_time=0.034, loss=7.694, loss_att=4.780, loss_ctc=10.608, acc=0.839, backward_time=0.024, optim_step_time=0.024, optim0_lr0=9.704e-05, train_time=0.121 -[v016] 2022-01-31 04:14:48,803 (trainer:653) INFO: 23epoch:train:109-135batch: iter_time=0.055, forward_time=0.097, loss=8.698, loss_att=5.360, loss_ctc=12.037, acc=0.825, backward_time=0.031, optim_step_time=0.026, optim0_lr0=9.726e-05, train_time=0.234 -[v016] 2022-01-31 04:14:55,410 (trainer:653) INFO: 23epoch:train:136-162batch: iter_time=0.141, forward_time=0.035, loss=9.566, loss_att=5.728, loss_ctc=13.404, acc=0.835, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.747e-05, train_time=0.244 -[v016] 2022-01-31 04:14:59,806 (trainer:653) INFO: 23epoch:train:163-189batch: iter_time=0.059, forward_time=0.036, loss=9.266, loss_att=5.771, loss_ctc=12.762, acc=0.821, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.769e-05, train_time=0.163 -[v016] 2022-01-31 04:15:04,139 (trainer:653) INFO: 23epoch:train:190-216batch: iter_time=0.052, forward_time=0.040, loss=8.176, loss_att=5.111, loss_ctc=11.241, acc=0.837, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.790e-05, train_time=0.160 -[v016] 2022-01-31 04:15:08,993 (trainer:653) INFO: 23epoch:train:217-243batch: iter_time=0.075, forward_time=0.035, loss=9.492, loss_att=5.863, loss_ctc=13.121, acc=0.824, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.812e-05, train_time=0.180 -[v016] 2022-01-31 04:15:15,842 (trainer:653) INFO: 23epoch:train:244-270batch: iter_time=0.124, forward_time=0.042, loss=10.875, loss_att=6.781, loss_ctc=14.969, acc=0.812, backward_time=0.026, optim_step_time=0.024, optim0_lr0=9.834e-05, train_time=0.252 -[v016] 2022-01-31 04:15:22,067 (trainer:653) INFO: 23epoch:train:271-297batch: iter_time=0.127, forward_time=0.035, loss=9.313, loss_att=5.617, loss_ctc=13.009, acc=0.823, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.855e-05, train_time=0.232 -[v016] 2022-01-31 04:15:27,041 (trainer:653) INFO: 23epoch:train:298-324batch: iter_time=0.084, forward_time=0.034, loss=7.607, loss_att=4.626, loss_ctc=10.588, acc=0.841, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.877e-05, train_time=0.184 -[v016] 2022-01-31 04:15:31,814 (trainer:653) INFO: 23epoch:train:325-351batch: iter_time=0.074, forward_time=0.035, loss=10.085, loss_att=6.354, loss_ctc=13.816, acc=0.809, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.898e-05, train_time=0.177 -[v016] 2022-01-31 04:15:35,798 (trainer:653) INFO: 23epoch:train:352-378batch: iter_time=0.042, forward_time=0.037, loss=8.549, loss_att=5.278, loss_ctc=11.820, acc=0.831, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.920e-05, train_time=0.147 -[v016] 2022-01-31 04:15:40,658 (trainer:653) INFO: 23epoch:train:379-405batch: iter_time=0.076, forward_time=0.035, loss=8.139, loss_att=5.144, loss_ctc=11.135, acc=0.829, backward_time=0.024, optim_step_time=0.024, optim0_lr0=9.942e-05, train_time=0.180 -[v016] 2022-01-31 04:15:44,046 (trainer:653) INFO: 23epoch:train:406-432batch: iter_time=0.022, forward_time=0.036, loss=9.136, loss_att=5.573, loss_ctc=12.699, acc=0.819, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.963e-05, train_time=0.125 -[v016] 2022-01-31 04:15:47,908 (trainer:653) INFO: 23epoch:train:433-459batch: iter_time=0.042, forward_time=0.034, loss=6.734, loss_att=4.142, loss_ctc=9.327, acc=0.849, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.985e-05, train_time=0.143 -[v016] 2022-01-31 04:15:53,733 (trainer:653) INFO: 23epoch:train:460-486batch: iter_time=0.110, forward_time=0.036, loss=9.450, loss_att=5.679, loss_ctc=13.222, acc=0.836, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.001e-04, train_time=0.215 -[v016] 2022-01-31 04:15:56,990 (trainer:653) INFO: 23epoch:train:487-513batch: iter_time=0.020, forward_time=0.034, loss=7.582, loss_att=4.635, loss_ctc=10.528, acc=0.830, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.003e-04, train_time=0.120 -[v016] 2022-01-31 04:16:02,020 (trainer:653) INFO: 23epoch:train:514-540batch: iter_time=0.074, forward_time=0.038, loss=11.018, loss_att=6.727, loss_ctc=15.308, acc=0.815, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.005e-04, train_time=0.186 -[v016] 2022-01-31 04:16:57,565 (trainer:328) INFO: 23epoch results: [train] iter_time=0.069, forward_time=0.040, loss=8.874, loss_att=5.453, loss_ctc=12.295, acc=0.829, backward_time=0.025, optim_step_time=0.024, optim0_lr0=9.847e-05, train_time=0.179, time=1 minute and 38.4 seconds, total_count=12581, gpu_max_cached_mem_GB=5.820, [valid] loss=9.105, loss_att=6.232, loss_ctc=11.978, acc=0.836, cer=0.207, wer=0.621, cer_ctc=0.321, time=19.98 seconds, total_count=4094, gpu_max_cached_mem_GB=5.820, [att_plot] time=34.03 seconds, total_count=0, gpu_max_cached_mem_GB=5.820 -[v016] 2022-01-31 04:17:00,284 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc, valid.acc -[v016] 2022-01-31 04:17:00,286 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/18epoch.pth -[v016] 2022-01-31 04:17:00,286 (trainer:261) INFO: 24/200epoch started. Estimated time to finish: 8 hours, 38 minutes and 41.72 seconds -[v016] 2022-01-31 04:17:04,093 (trainer:653) INFO: 24epoch:train:1-27batch: iter_time=0.025, forward_time=0.035, loss=8.971, loss_att=5.505, loss_ctc=12.436, acc=0.827, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.008e-04, train_time=0.135 -[v016] 2022-01-31 04:17:08,396 (trainer:653) INFO: 24epoch:train:28-54batch: iter_time=0.054, forward_time=0.036, loss=8.516, loss_att=5.161, loss_ctc=11.871, acc=0.846, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.010e-04, train_time=0.159 -[v016] 2022-01-31 04:17:12,459 (trainer:653) INFO: 24epoch:train:55-81batch: iter_time=0.046, forward_time=0.036, loss=10.777, loss_att=6.695, loss_ctc=14.859, acc=0.809, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.012e-04, train_time=0.150 -[v016] 2022-01-31 04:17:15,765 (trainer:653) INFO: 24epoch:train:82-108batch: iter_time=0.020, forward_time=0.035, loss=7.361, loss_att=4.509, loss_ctc=10.212, acc=0.847, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.014e-04, train_time=0.122 -[v016] 2022-01-31 04:17:20,313 (trainer:653) INFO: 24epoch:train:109-135batch: iter_time=0.068, forward_time=0.034, loss=7.522, loss_att=4.490, loss_ctc=10.554, acc=0.839, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.016e-04, train_time=0.168 -[v016] 2022-01-31 04:17:24,224 (trainer:653) INFO: 24epoch:train:136-162batch: iter_time=0.040, forward_time=0.037, loss=9.391, loss_att=5.749, loss_ctc=13.034, acc=0.823, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.018e-04, train_time=0.145 -[v016] 2022-01-31 04:17:27,568 (trainer:653) INFO: 24epoch:train:163-189batch: iter_time=0.016, forward_time=0.038, loss=8.485, loss_att=5.189, loss_ctc=11.780, acc=0.836, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.021e-04, train_time=0.124 -[v016] 2022-01-31 04:17:32,465 (trainer:653) INFO: 24epoch:train:190-216batch: iter_time=0.075, forward_time=0.036, loss=10.512, loss_att=6.415, loss_ctc=14.609, acc=0.816, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.023e-04, train_time=0.181 -[v016] 2022-01-31 04:17:35,578 (trainer:653) INFO: 24epoch:train:217-243batch: iter_time=0.012, forward_time=0.035, loss=9.324, loss_att=5.709, loss_ctc=12.938, acc=0.812, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.025e-04, train_time=0.115 -[v016] 2022-01-31 04:17:39,263 (trainer:653) INFO: 24epoch:train:244-270batch: iter_time=0.035, forward_time=0.034, loss=7.551, loss_att=4.670, loss_ctc=10.433, acc=0.836, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.027e-04, train_time=0.136 -[v016] 2022-01-31 04:17:43,652 (trainer:653) INFO: 24epoch:train:271-297batch: iter_time=0.059, forward_time=0.035, loss=8.061, loss_att=4.983, loss_ctc=11.139, acc=0.832, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.029e-04, train_time=0.162 -[v016] 2022-01-31 04:17:49,443 (trainer:653) INFO: 24epoch:train:298-324batch: iter_time=0.018, forward_time=0.113, loss=7.815, loss_att=4.838, loss_ctc=10.792, acc=0.840, backward_time=0.035, optim_step_time=0.025, optim0_lr0=1.031e-04, train_time=0.214 -[v016] 2022-01-31 04:17:55,520 (trainer:653) INFO: 24epoch:train:325-351batch: iter_time=0.116, forward_time=0.038, loss=10.079, loss_att=6.006, loss_ctc=14.151, acc=0.833, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.034e-04, train_time=0.225 -[v016] 2022-01-31 04:17:59,578 (trainer:653) INFO: 24epoch:train:352-378batch: iter_time=0.044, forward_time=0.036, loss=9.452, loss_att=5.777, loss_ctc=13.127, acc=0.824, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.036e-04, train_time=0.150 -[v016] 2022-01-31 04:18:03,209 (trainer:653) INFO: 24epoch:train:379-405batch: iter_time=0.033, forward_time=0.035, loss=7.892, loss_att=4.790, loss_ctc=10.995, acc=0.848, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.038e-04, train_time=0.134 -[v016] 2022-01-31 04:18:09,978 (trainer:653) INFO: 24epoch:train:406-432batch: iter_time=0.085, forward_time=0.081, loss=6.568, loss_att=4.088, loss_ctc=9.048, acc=0.853, backward_time=0.028, optim_step_time=0.024, optim0_lr0=1.040e-04, train_time=0.250 -[v016] 2022-01-31 04:18:14,475 (trainer:653) INFO: 24epoch:train:433-459batch: iter_time=0.061, forward_time=0.036, loss=9.558, loss_att=5.793, loss_ctc=13.323, acc=0.826, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.042e-04, train_time=0.166 -[v016] 2022-01-31 04:18:18,792 (trainer:653) INFO: 24epoch:train:460-486batch: iter_time=0.055, forward_time=0.035, loss=8.333, loss_att=5.074, loss_ctc=11.592, acc=0.843, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.044e-04, train_time=0.160 -[v016] 2022-01-31 04:18:22,332 (trainer:653) INFO: 24epoch:train:487-513batch: iter_time=0.030, forward_time=0.035, loss=7.913, loss_att=4.798, loss_ctc=11.028, acc=0.836, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.047e-04, train_time=0.131 -[v016] 2022-01-31 04:18:26,857 (trainer:653) INFO: 24epoch:train:514-540batch: iter_time=0.062, forward_time=0.038, loss=7.856, loss_att=4.756, loss_ctc=10.955, acc=0.849, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.049e-04, train_time=0.167 -[v016] 2022-01-31 04:19:19,460 (trainer:328) INFO: 24epoch results: [train] iter_time=0.047, forward_time=0.042, loss=8.588, loss_att=5.245, loss_ctc=11.931, acc=0.834, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.028e-04, train_time=0.159, time=1 minute and 27.42 seconds, total_count=13128, gpu_max_cached_mem_GB=5.822, [valid] loss=9.055, loss_att=6.223, loss_ctc=11.888, acc=0.836, cer=0.199, wer=0.619, cer_ctc=0.326, time=18.59 seconds, total_count=4272, gpu_max_cached_mem_GB=5.822, [att_plot] time=33.06 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 04:19:22,504 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc, valid.acc -[v016] 2022-01-31 04:19:22,506 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/19epoch.pth -[v016] 2022-01-31 04:19:22,507 (trainer:261) INFO: 25/200epoch started. Estimated time to finish: 8 hours, 11 minutes and 7.11 seconds -[v016] 2022-01-31 04:19:29,051 (trainer:653) INFO: 25epoch:train:1-27batch: iter_time=0.131, forward_time=0.036, loss=8.460, loss_att=5.139, loss_ctc=11.780, acc=0.844, backward_time=0.026, optim_step_time=0.023, optim0_lr0=1.051e-04, train_time=0.238 -[v016] 2022-01-31 04:19:33,862 (trainer:653) INFO: 25epoch:train:28-54batch: iter_time=0.079, forward_time=0.033, loss=7.147, loss_att=4.401, loss_ctc=9.893, acc=0.842, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.054e-04, train_time=0.179 -[v016] 2022-01-31 04:19:38,137 (trainer:653) INFO: 25epoch:train:55-81batch: iter_time=0.047, forward_time=0.036, loss=10.011, loss_att=6.030, loss_ctc=13.992, acc=0.824, backward_time=0.024, optim_step_time=0.030, optim0_lr0=1.056e-04, train_time=0.158 -[v016] 2022-01-31 04:19:41,508 (trainer:653) INFO: 25epoch:train:82-108batch: iter_time=0.023, forward_time=0.035, loss=8.054, loss_att=4.871, loss_ctc=11.238, acc=0.834, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.058e-04, train_time=0.125 -[v016] 2022-01-31 04:19:45,402 (trainer:653) INFO: 25epoch:train:109-135batch: iter_time=0.044, forward_time=0.034, loss=7.397, loss_att=4.542, loss_ctc=10.252, acc=0.832, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.060e-04, train_time=0.144 -[v016] 2022-01-31 04:19:49,047 (trainer:653) INFO: 25epoch:train:136-162batch: iter_time=0.032, forward_time=0.035, loss=8.155, loss_att=4.899, loss_ctc=11.410, acc=0.838, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.062e-04, train_time=0.135 -[v016] 2022-01-31 04:19:53,204 (trainer:653) INFO: 25epoch:train:163-189batch: iter_time=0.044, forward_time=0.037, loss=8.673, loss_att=5.241, loss_ctc=12.104, acc=0.826, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.064e-04, train_time=0.154 -[v016] 2022-01-31 04:19:58,267 (trainer:653) INFO: 25epoch:train:190-216batch: iter_time=0.082, forward_time=0.036, loss=9.527, loss_att=5.633, loss_ctc=13.421, acc=0.842, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.067e-04, train_time=0.187 -[v016] 2022-01-31 04:20:02,626 (trainer:653) INFO: 25epoch:train:217-243batch: iter_time=0.055, forward_time=0.036, loss=8.951, loss_att=5.232, loss_ctc=12.671, acc=0.842, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.069e-04, train_time=0.161 -[v016] 2022-01-31 04:20:07,087 (trainer:653) INFO: 25epoch:train:244-270batch: iter_time=0.061, forward_time=0.036, loss=8.774, loss_att=5.312, loss_ctc=12.237, acc=0.837, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.071e-04, train_time=0.165 -[v016] 2022-01-31 04:20:11,241 (trainer:653) INFO: 25epoch:train:271-297batch: iter_time=0.048, forward_time=0.037, loss=7.178, loss_att=4.303, loss_ctc=10.054, acc=0.848, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.073e-04, train_time=0.154 -[v016] 2022-01-31 04:20:17,837 (trainer:653) INFO: 25epoch:train:298-324batch: iter_time=0.071, forward_time=0.050, loss=8.548, loss_att=5.118, loss_ctc=11.978, acc=0.835, backward_time=0.071, optim_step_time=0.026, optim0_lr0=1.075e-04, train_time=0.244 -[v016] 2022-01-31 04:20:22,561 (trainer:653) INFO: 25epoch:train:325-351batch: iter_time=0.071, forward_time=0.035, loss=8.534, loss_att=5.225, loss_ctc=11.844, acc=0.829, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.077e-04, train_time=0.175 -[v016] 2022-01-31 04:20:26,720 (trainer:653) INFO: 25epoch:train:352-378batch: iter_time=0.052, forward_time=0.035, loss=8.037, loss_att=4.819, loss_ctc=11.255, acc=0.844, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.080e-04, train_time=0.154 -[v016] 2022-01-31 04:20:30,990 (trainer:653) INFO: 25epoch:train:379-405batch: iter_time=0.054, forward_time=0.035, loss=9.108, loss_att=5.504, loss_ctc=12.711, acc=0.833, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.082e-04, train_time=0.158 -[v016] 2022-01-31 04:20:38,685 (trainer:653) INFO: 25epoch:train:406-432batch: iter_time=0.082, forward_time=0.118, loss=8.157, loss_att=4.811, loss_ctc=11.504, acc=0.849, backward_time=0.035, optim_step_time=0.023, optim0_lr0=1.084e-04, train_time=0.285 -[v016] 2022-01-31 04:20:43,561 (trainer:653) INFO: 25epoch:train:433-459batch: iter_time=0.077, forward_time=0.035, loss=9.091, loss_att=5.529, loss_ctc=12.653, acc=0.836, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.086e-04, train_time=0.180 -[v016] 2022-01-31 04:20:49,252 (trainer:653) INFO: 25epoch:train:460-486batch: iter_time=0.106, forward_time=0.036, loss=9.367, loss_att=5.604, loss_ctc=13.130, acc=0.833, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.088e-04, train_time=0.211 -[v016] 2022-01-31 04:20:54,008 (trainer:653) INFO: 25epoch:train:487-513batch: iter_time=0.073, forward_time=0.035, loss=7.754, loss_att=4.819, loss_ctc=10.689, acc=0.832, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.090e-04, train_time=0.176 -[v016] 2022-01-31 04:20:58,257 (trainer:653) INFO: 25epoch:train:514-540batch: iter_time=0.055, forward_time=0.035, loss=8.461, loss_att=5.214, loss_ctc=11.709, acc=0.837, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.092e-04, train_time=0.157 -[v016] 2022-01-31 04:21:51,032 (trainer:328) INFO: 25epoch results: [train] iter_time=0.064, forward_time=0.040, loss=8.451, loss_att=5.100, loss_ctc=11.801, acc=0.837, backward_time=0.027, optim_step_time=0.024, optim0_lr0=1.072e-04, train_time=0.176, time=1 minute and 36.74 seconds, total_count=13675, gpu_max_cached_mem_GB=5.822, [valid] loss=8.797, loss_att=6.015, loss_ctc=11.579, acc=0.844, cer=0.198, wer=0.607, cer_ctc=0.304, time=19.5 seconds, total_count=4450, gpu_max_cached_mem_GB=5.822, [att_plot] time=32.17 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 04:21:53,501 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc, valid.acc -[v016] 2022-01-31 04:21:53,504 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/20epoch.pth -[v016] 2022-01-31 04:21:53,504 (trainer:261) INFO: 26/200epoch started. Estimated time to finish: 7 hours, 58 minutes and 44.66 seconds -[v016] 2022-01-31 04:21:58,450 (trainer:653) INFO: 26epoch:train:1-27batch: iter_time=0.069, forward_time=0.036, loss=10.117, loss_att=5.996, loss_ctc=14.238, acc=0.830, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.095e-04, train_time=0.178 -[v016] 2022-01-31 04:22:02,004 (trainer:653) INFO: 26epoch:train:28-54batch: iter_time=0.031, forward_time=0.034, loss=6.945, loss_att=4.128, loss_ctc=9.761, acc=0.854, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.097e-04, train_time=0.131 -[v016] 2022-01-31 04:22:05,887 (trainer:653) INFO: 26epoch:train:55-81batch: iter_time=0.039, forward_time=0.037, loss=8.157, loss_att=4.739, loss_ctc=11.574, acc=0.853, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.100e-04, train_time=0.144 -[v016] 2022-01-31 04:22:09,369 (trainer:653) INFO: 26epoch:train:82-108batch: iter_time=0.022, forward_time=0.038, loss=9.258, loss_att=5.610, loss_ctc=12.907, acc=0.821, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.102e-04, train_time=0.129 -[v016] 2022-01-31 04:22:12,515 (trainer:653) INFO: 26epoch:train:109-135batch: iter_time=0.016, forward_time=0.034, loss=7.597, loss_att=4.684, loss_ctc=10.509, acc=0.836, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.104e-04, train_time=0.116 -[v016] 2022-01-31 04:22:15,815 (trainer:653) INFO: 26epoch:train:136-162batch: iter_time=0.021, forward_time=0.034, loss=7.090, loss_att=4.350, loss_ctc=9.829, acc=0.851, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.106e-04, train_time=0.122 -[v016] 2022-01-31 04:22:18,853 (trainer:653) INFO: 26epoch:train:163-189batch: iter_time=0.010, forward_time=0.035, loss=7.554, loss_att=4.582, loss_ctc=10.526, acc=0.858, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.108e-04, train_time=0.112 -[v016] 2022-01-31 04:22:21,671 (trainer:653) INFO: 26epoch:train:190-216batch: iter_time=0.002, forward_time=0.035, loss=8.261, loss_att=4.851, loss_ctc=11.671, acc=0.850, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.110e-04, train_time=0.104 -[v016] 2022-01-31 04:22:24,707 (trainer:653) INFO: 26epoch:train:217-243batch: iter_time=0.004, forward_time=0.036, loss=6.525, loss_att=3.949, loss_ctc=9.100, acc=0.854, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.112e-04, train_time=0.112 -[v016] 2022-01-31 04:22:31,474 (trainer:653) INFO: 26epoch:train:244-270batch: iter_time=0.049, forward_time=0.103, loss=7.584, loss_att=4.675, loss_ctc=10.494, acc=0.833, backward_time=0.031, optim_step_time=0.045, optim0_lr0=1.115e-04, train_time=0.250 -[v016] 2022-01-31 04:22:36,643 (trainer:653) INFO: 26epoch:train:271-297batch: iter_time=0.089, forward_time=0.035, loss=9.138, loss_att=5.664, loss_ctc=12.612, acc=0.824, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.117e-04, train_time=0.191 -[v016] 2022-01-31 04:22:40,153 (trainer:653) INFO: 26epoch:train:298-324batch: iter_time=0.027, forward_time=0.035, loss=8.338, loss_att=5.113, loss_ctc=11.562, acc=0.835, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.119e-04, train_time=0.130 -[v016] 2022-01-31 04:22:44,150 (trainer:653) INFO: 26epoch:train:325-351batch: iter_time=0.043, forward_time=0.035, loss=8.664, loss_att=5.220, loss_ctc=12.107, acc=0.834, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.121e-04, train_time=0.148 -[v016] 2022-01-31 04:22:49,006 (trainer:653) INFO: 26epoch:train:352-378batch: iter_time=0.076, forward_time=0.035, loss=9.626, loss_att=5.885, loss_ctc=13.367, acc=0.828, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.123e-04, train_time=0.180 -[v016] 2022-01-31 04:22:52,848 (trainer:653) INFO: 26epoch:train:379-405batch: iter_time=0.035, forward_time=0.035, loss=7.775, loss_att=4.527, loss_ctc=11.022, acc=0.848, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.125e-04, train_time=0.142 -[v016] 2022-01-31 04:22:58,617 (trainer:653) INFO: 26epoch:train:406-432batch: iter_time=0.106, forward_time=0.036, loss=9.698, loss_att=5.781, loss_ctc=13.615, acc=0.844, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.128e-04, train_time=0.213 -[v016] 2022-01-31 04:23:02,479 (trainer:653) INFO: 26epoch:train:433-459batch: iter_time=0.039, forward_time=0.035, loss=8.404, loss_att=5.139, loss_ctc=11.669, acc=0.846, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.130e-04, train_time=0.143 -[v016] 2022-01-31 04:23:06,584 (trainer:653) INFO: 26epoch:train:460-486batch: iter_time=0.051, forward_time=0.034, loss=6.900, loss_att=4.247, loss_ctc=9.553, acc=0.846, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.132e-04, train_time=0.152 -[v016] 2022-01-31 04:23:10,563 (trainer:653) INFO: 26epoch:train:487-513batch: iter_time=0.043, forward_time=0.036, loss=8.547, loss_att=5.021, loss_ctc=12.074, acc=0.852, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.134e-04, train_time=0.147 -[v016] 2022-01-31 04:23:14,840 (trainer:653) INFO: 26epoch:train:514-540batch: iter_time=0.030, forward_time=0.036, loss=7.477, loss_att=4.396, loss_ctc=10.559, acc=0.851, backward_time=0.025, optim_step_time=0.048, optim0_lr0=1.136e-04, train_time=0.158 -[v016] 2022-01-31 04:24:15,615 (trainer:328) INFO: 26epoch results: [train] iter_time=0.042, forward_time=0.041, loss=8.175, loss_att=4.923, loss_ctc=11.427, acc=0.842, backward_time=0.025, optim_step_time=0.026, optim0_lr0=1.116e-04, train_time=0.155, time=1 minute and 25.37 seconds, total_count=14222, gpu_max_cached_mem_GB=5.822, [valid] loss=8.506, loss_att=5.806, loss_ctc=11.206, acc=0.850, cer=0.187, wer=0.593, cer_ctc=0.304, time=22.32 seconds, total_count=4628, gpu_max_cached_mem_GB=5.822, [att_plot] time=34.39 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 04:24:19,165 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc, valid.acc -[v016] 2022-01-31 04:24:19,167 (trainer:261) INFO: 27/200epoch started. Estimated time to finish: 7 hours, 47 minutes and 4.65 seconds -[v016] 2022-01-31 04:24:27,734 (trainer:653) INFO: 27epoch:train:1-27batch: iter_time=0.157, forward_time=0.063, loss=7.455, loss_att=4.397, loss_ctc=10.513, acc=0.849, backward_time=0.030, optim_step_time=0.024, optim0_lr0=1.139e-04, train_time=0.304 -[v016] 2022-01-31 04:24:33,312 (trainer:653) INFO: 27epoch:train:28-54batch: iter_time=0.107, forward_time=0.034, loss=7.199, loss_att=4.337, loss_ctc=10.062, acc=0.852, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.141e-04, train_time=0.207 -[v016] 2022-01-31 04:24:38,256 (trainer:653) INFO: 27epoch:train:55-81batch: iter_time=0.079, forward_time=0.036, loss=9.956, loss_att=5.916, loss_ctc=13.997, acc=0.828, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.143e-04, train_time=0.183 -[v016] 2022-01-31 04:24:44,914 (trainer:653) INFO: 27epoch:train:82-108batch: iter_time=0.142, forward_time=0.037, loss=8.516, loss_att=5.084, loss_ctc=11.948, acc=0.841, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.145e-04, train_time=0.246 -[v016] 2022-01-31 04:24:49,658 (trainer:653) INFO: 27epoch:train:109-135batch: iter_time=0.071, forward_time=0.036, loss=9.368, loss_att=5.543, loss_ctc=13.192, acc=0.831, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.148e-04, train_time=0.175 -[v016] 2022-01-31 04:24:54,917 (trainer:653) INFO: 27epoch:train:136-162batch: iter_time=0.095, forward_time=0.034, loss=5.614, loss_att=3.522, loss_ctc=7.705, acc=0.856, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.150e-04, train_time=0.194 -[v016] 2022-01-31 04:24:59,278 (trainer:653) INFO: 27epoch:train:163-189batch: iter_time=0.059, forward_time=0.035, loss=7.289, loss_att=4.319, loss_ctc=10.259, acc=0.850, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.152e-04, train_time=0.161 -[v016] 2022-01-31 04:25:03,191 (trainer:653) INFO: 27epoch:train:190-216batch: iter_time=0.042, forward_time=0.035, loss=7.305, loss_att=4.256, loss_ctc=10.354, acc=0.867, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.154e-04, train_time=0.145 -[v016] 2022-01-31 04:25:07,580 (trainer:653) INFO: 27epoch:train:217-243batch: iter_time=0.052, forward_time=0.041, loss=7.839, loss_att=4.625, loss_ctc=11.054, acc=0.847, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.156e-04, train_time=0.162 -[v016] 2022-01-31 04:25:13,042 (trainer:653) INFO: 27epoch:train:244-270batch: iter_time=0.101, forward_time=0.034, loss=7.459, loss_att=4.502, loss_ctc=10.417, acc=0.838, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.158e-04, train_time=0.202 -[v016] 2022-01-31 04:25:18,085 (trainer:653) INFO: 27epoch:train:271-297batch: iter_time=0.061, forward_time=0.049, loss=8.082, loss_att=4.760, loss_ctc=11.403, acc=0.848, backward_time=0.027, optim_step_time=0.025, optim0_lr0=1.161e-04, train_time=0.187 -[v016] 2022-01-31 04:25:22,834 (trainer:653) INFO: 27epoch:train:298-324batch: iter_time=0.072, forward_time=0.035, loss=8.598, loss_att=4.980, loss_ctc=12.217, acc=0.843, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.163e-04, train_time=0.176 -[v016] 2022-01-31 04:25:27,318 (trainer:653) INFO: 27epoch:train:325-351batch: iter_time=0.066, forward_time=0.034, loss=8.790, loss_att=5.159, loss_ctc=12.422, acc=0.843, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.165e-04, train_time=0.166 -[v016] 2022-01-31 04:25:31,395 (trainer:653) INFO: 27epoch:train:352-378batch: iter_time=0.053, forward_time=0.033, loss=7.038, loss_att=4.190, loss_ctc=9.886, acc=0.854, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.167e-04, train_time=0.151 -[v016] 2022-01-31 04:25:36,125 (trainer:653) INFO: 27epoch:train:379-405batch: iter_time=0.076, forward_time=0.034, loss=9.478, loss_att=5.559, loss_ctc=13.397, acc=0.833, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.169e-04, train_time=0.175 -[v016] 2022-01-31 04:25:41,132 (trainer:653) INFO: 27epoch:train:406-432batch: iter_time=0.085, forward_time=0.034, loss=8.044, loss_att=4.799, loss_ctc=11.289, acc=0.838, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.171e-04, train_time=0.185 -[v016] 2022-01-31 04:25:45,964 (trainer:653) INFO: 27epoch:train:433-459batch: iter_time=0.076, forward_time=0.035, loss=7.883, loss_att=4.687, loss_ctc=11.080, acc=0.843, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.174e-04, train_time=0.179 -[v016] 2022-01-31 04:25:50,000 (trainer:653) INFO: 27epoch:train:460-486batch: iter_time=0.046, forward_time=0.035, loss=7.427, loss_att=4.488, loss_ctc=10.366, acc=0.849, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.176e-04, train_time=0.149 -[v016] 2022-01-31 04:25:55,459 (trainer:653) INFO: 27epoch:train:487-513batch: iter_time=0.030, forward_time=0.089, loss=8.408, loss_att=4.855, loss_ctc=11.960, acc=0.848, backward_time=0.027, optim_step_time=0.032, optim0_lr0=1.178e-04, train_time=0.202 -[v016] 2022-01-31 04:25:59,859 (trainer:653) INFO: 27epoch:train:514-540batch: iter_time=0.059, forward_time=0.035, loss=7.868, loss_att=4.739, loss_ctc=10.997, acc=0.848, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.180e-04, train_time=0.163 -[v016] 2022-01-31 04:27:05,346 (trainer:328) INFO: 27epoch results: [train] iter_time=0.076, forward_time=0.040, loss=8.004, loss_att=4.747, loss_ctc=11.261, acc=0.845, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.160e-04, train_time=0.185, time=1 minute and 41.83 seconds, total_count=14769, gpu_max_cached_mem_GB=5.822, [valid] loss=8.791, loss_att=5.963, loss_ctc=11.619, acc=0.846, cer=0.198, wer=0.607, cer_ctc=0.300, time=26.53 seconds, total_count=4806, gpu_max_cached_mem_GB=5.822, [att_plot] time=37.71 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 04:27:08,041 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 04:27:08,044 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/21epoch.pth, exp/asr_train_asr_raw_en_word/22epoch.pth -[v016] 2022-01-31 04:27:08,044 (trainer:261) INFO: 28/200epoch started. Estimated time to finish: 7 hours, 47 minutes and 36.77 seconds -[v016] 2022-01-31 04:27:15,466 (trainer:653) INFO: 28epoch:train:1-27batch: iter_time=0.122, forward_time=0.054, loss=9.109, loss_att=5.477, loss_ctc=12.742, acc=0.837, backward_time=0.038, optim_step_time=0.025, optim0_lr0=1.183e-04, train_time=0.266 -[v016] 2022-01-31 04:27:22,349 (trainer:653) INFO: 28epoch:train:28-54batch: iter_time=0.150, forward_time=0.035, loss=6.800, loss_att=4.121, loss_ctc=9.480, acc=0.851, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.185e-04, train_time=0.254 -[v016] 2022-01-31 04:27:27,112 (trainer:653) INFO: 28epoch:train:55-81batch: iter_time=0.068, forward_time=0.036, loss=8.871, loss_att=5.103, loss_ctc=12.639, acc=0.845, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.187e-04, train_time=0.176 -[v016] 2022-01-31 04:27:33,537 (trainer:653) INFO: 28epoch:train:82-108batch: iter_time=0.114, forward_time=0.043, loss=7.389, loss_att=4.373, loss_ctc=10.404, acc=0.857, backward_time=0.025, optim_step_time=0.032, optim0_lr0=1.189e-04, train_time=0.237 -[v016] 2022-01-31 04:27:39,019 (trainer:653) INFO: 28epoch:train:109-135batch: iter_time=0.099, forward_time=0.035, loss=7.602, loss_att=4.468, loss_ctc=10.736, acc=0.840, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.191e-04, train_time=0.203 -[v016] 2022-01-31 04:27:44,774 (trainer:653) INFO: 28epoch:train:136-162batch: iter_time=0.108, forward_time=0.036, loss=7.161, loss_att=4.209, loss_ctc=10.112, acc=0.857, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.194e-04, train_time=0.213 -[v016] 2022-01-31 04:27:50,426 (trainer:653) INFO: 28epoch:train:163-189batch: iter_time=0.107, forward_time=0.034, loss=7.554, loss_att=4.442, loss_ctc=10.666, acc=0.853, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.196e-04, train_time=0.209 -[v016] 2022-01-31 04:28:02,324 (trainer:653) INFO: 28epoch:train:190-216batch: iter_time=0.189, forward_time=0.170, loss=7.392, loss_att=4.410, loss_ctc=10.373, acc=0.852, backward_time=0.028, optim_step_time=0.024, optim0_lr0=1.198e-04, train_time=0.440 -[v016] 2022-01-31 04:28:10,627 (trainer:653) INFO: 28epoch:train:217-243batch: iter_time=0.203, forward_time=0.036, loss=8.724, loss_att=5.024, loss_ctc=12.423, acc=0.842, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.200e-04, train_time=0.307 -[v016] 2022-01-31 04:28:18,460 (trainer:653) INFO: 28epoch:train:244-270batch: iter_time=0.183, forward_time=0.036, loss=9.148, loss_att=5.221, loss_ctc=13.074, acc=0.836, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.202e-04, train_time=0.290 -[v016] 2022-01-31 04:28:24,282 (trainer:653) INFO: 28epoch:train:271-297batch: iter_time=0.110, forward_time=0.035, loss=7.601, loss_att=4.513, loss_ctc=10.689, acc=0.851, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.204e-04, train_time=0.215 -[v016] 2022-01-31 04:28:30,618 (trainer:653) INFO: 28epoch:train:298-324batch: iter_time=0.132, forward_time=0.035, loss=7.491, loss_att=4.456, loss_ctc=10.525, acc=0.856, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.206e-04, train_time=0.234 -[v016] 2022-01-31 04:28:35,521 (trainer:653) INFO: 28epoch:train:325-351batch: iter_time=0.081, forward_time=0.034, loss=7.411, loss_att=4.409, loss_ctc=10.414, acc=0.845, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.209e-04, train_time=0.181 -[v016] 2022-01-31 04:28:41,848 (trainer:653) INFO: 28epoch:train:352-378batch: iter_time=0.130, forward_time=0.035, loss=7.257, loss_att=4.353, loss_ctc=10.162, acc=0.849, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.211e-04, train_time=0.234 -[v016] 2022-01-31 04:28:48,758 (trainer:653) INFO: 28epoch:train:379-405batch: iter_time=0.155, forward_time=0.034, loss=7.746, loss_att=4.597, loss_ctc=10.896, acc=0.848, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.213e-04, train_time=0.256 -[v016] 2022-01-31 04:28:53,748 (trainer:653) INFO: 28epoch:train:406-432batch: iter_time=0.081, forward_time=0.035, loss=8.865, loss_att=5.180, loss_ctc=12.549, acc=0.834, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.215e-04, train_time=0.185 -[v016] 2022-01-31 04:28:58,946 (trainer:653) INFO: 28epoch:train:433-459batch: iter_time=0.091, forward_time=0.034, loss=8.149, loss_att=4.854, loss_ctc=11.443, acc=0.844, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.217e-04, train_time=0.192 -[v016] 2022-01-31 04:29:03,909 (trainer:653) INFO: 28epoch:train:460-486batch: iter_time=0.082, forward_time=0.035, loss=7.936, loss_att=4.686, loss_ctc=11.185, acc=0.850, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.219e-04, train_time=0.184 -[v016] 2022-01-31 04:29:09,173 (trainer:653) INFO: 28epoch:train:487-513batch: iter_time=0.086, forward_time=0.035, loss=6.943, loss_att=4.121, loss_ctc=9.766, acc=0.857, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.222e-04, train_time=0.195 -[v016] 2022-01-31 04:29:14,920 (trainer:653) INFO: 28epoch:train:514-540batch: iter_time=0.111, forward_time=0.034, loss=7.659, loss_att=4.557, loss_ctc=10.760, acc=0.848, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.224e-04, train_time=0.213 -[v016] 2022-01-31 04:30:19,377 (trainer:328) INFO: 28epoch results: [train] iter_time=0.120, forward_time=0.043, loss=7.853, loss_att=4.638, loss_ctc=11.068, acc=0.847, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.204e-04, train_time=0.234, time=2 minutes and 8.49 seconds, total_count=15316, gpu_max_cached_mem_GB=5.822, [valid] loss=8.356, loss_att=5.732, loss_ctc=10.981, acc=0.855, cer=0.175, wer=0.582, cer_ctc=0.285, time=28.84 seconds, total_count=4984, gpu_max_cached_mem_GB=5.822, [att_plot] time=33.79 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 04:30:22,433 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc, valid.acc -[v016] 2022-01-31 04:30:22,435 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/23epoch.pth -[v016] 2022-01-31 04:30:22,436 (trainer:261) INFO: 29/200epoch started. Estimated time to finish: 7 hours, 56 minutes and 27.18 seconds -[v016] 2022-01-31 04:30:29,193 (trainer:653) INFO: 29epoch:train:1-27batch: iter_time=0.055, forward_time=0.072, loss=8.919, loss_att=5.117, loss_ctc=12.720, acc=0.845, backward_time=0.028, optim_step_time=0.024, optim0_lr0=1.226e-04, train_time=0.210 -[v016] 2022-01-31 04:30:32,035 (trainer:653) INFO: 29epoch:train:28-54batch: iter_time=0.003, forward_time=0.036, loss=7.995, loss_att=4.626, loss_ctc=11.363, acc=0.847, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.229e-04, train_time=0.105 -[v016] 2022-01-31 04:30:35,265 (trainer:653) INFO: 29epoch:train:55-81batch: iter_time=0.016, forward_time=0.035, loss=7.306, loss_att=4.246, loss_ctc=10.365, acc=0.862, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.231e-04, train_time=0.119 -[v016] 2022-01-31 04:30:39,331 (trainer:653) INFO: 29epoch:train:82-108batch: iter_time=0.046, forward_time=0.036, loss=8.935, loss_att=5.156, loss_ctc=12.713, acc=0.850, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.233e-04, train_time=0.150 -[v016] 2022-01-31 04:30:43,290 (trainer:653) INFO: 29epoch:train:109-135batch: iter_time=0.043, forward_time=0.035, loss=8.356, loss_att=4.860, loss_ctc=11.852, acc=0.844, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.235e-04, train_time=0.146 -[v016] 2022-01-31 04:30:47,185 (trainer:653) INFO: 29epoch:train:136-162batch: iter_time=0.043, forward_time=0.034, loss=7.061, loss_att=4.240, loss_ctc=9.883, acc=0.858, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.237e-04, train_time=0.144 -[v016] 2022-01-31 04:30:53,678 (trainer:653) INFO: 29epoch:train:163-189batch: iter_time=0.027, forward_time=0.107, loss=7.507, loss_att=4.439, loss_ctc=10.574, acc=0.858, backward_time=0.039, optim_step_time=0.040, optim0_lr0=1.239e-04, train_time=0.239 -[v016] 2022-01-31 04:30:57,564 (trainer:653) INFO: 29epoch:train:190-216batch: iter_time=0.040, forward_time=0.035, loss=7.851, loss_att=4.704, loss_ctc=10.999, acc=0.849, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.242e-04, train_time=0.144 -[v016] 2022-01-31 04:31:01,860 (trainer:653) INFO: 29epoch:train:217-243batch: iter_time=0.055, forward_time=0.035, loss=6.931, loss_att=4.125, loss_ctc=9.737, acc=0.862, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.244e-04, train_time=0.159 -[v016] 2022-01-31 04:31:05,311 (trainer:653) INFO: 29epoch:train:244-270batch: iter_time=0.025, forward_time=0.035, loss=7.111, loss_att=4.201, loss_ctc=10.020, acc=0.860, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.246e-04, train_time=0.128 -[v016] 2022-01-31 04:31:08,435 (trainer:653) INFO: 29epoch:train:271-297batch: iter_time=0.013, forward_time=0.035, loss=8.133, loss_att=4.844, loss_ctc=11.422, acc=0.843, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.248e-04, train_time=0.115 -[v016] 2022-01-31 04:31:11,693 (trainer:653) INFO: 29epoch:train:298-324batch: iter_time=0.018, forward_time=0.035, loss=6.428, loss_att=3.953, loss_ctc=8.902, acc=0.860, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.250e-04, train_time=0.120 -[v016] 2022-01-31 04:31:15,156 (trainer:653) INFO: 29epoch:train:325-351batch: iter_time=0.018, forward_time=0.041, loss=7.712, loss_att=4.518, loss_ctc=10.907, acc=0.856, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.252e-04, train_time=0.128 -[v016] 2022-01-31 04:31:19,241 (trainer:653) INFO: 29epoch:train:352-378batch: iter_time=0.046, forward_time=0.036, loss=8.757, loss_att=5.176, loss_ctc=12.337, acc=0.835, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.255e-04, train_time=0.151 -[v016] 2022-01-31 04:31:23,278 (trainer:653) INFO: 29epoch:train:379-405batch: iter_time=0.048, forward_time=0.034, loss=7.147, loss_att=4.144, loss_ctc=10.149, acc=0.855, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.257e-04, train_time=0.149 -[v016] 2022-01-31 04:31:26,879 (trainer:653) INFO: 29epoch:train:406-432batch: iter_time=0.033, forward_time=0.034, loss=6.591, loss_att=3.964, loss_ctc=9.218, acc=0.863, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.259e-04, train_time=0.133 -[v016] 2022-01-31 04:31:30,179 (trainer:653) INFO: 29epoch:train:433-459batch: iter_time=0.017, forward_time=0.036, loss=7.958, loss_att=4.685, loss_ctc=11.232, acc=0.849, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.261e-04, train_time=0.122 -[v016] 2022-01-31 04:31:40,480 (trainer:653) INFO: 29epoch:train:460-486batch: iter_time=0.272, forward_time=0.038, loss=7.395, loss_att=4.357, loss_ctc=10.434, acc=0.853, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.263e-04, train_time=0.378 -[v016] 2022-01-31 04:31:45,435 (trainer:653) INFO: 29epoch:train:487-513batch: iter_time=0.083, forward_time=0.034, loss=7.101, loss_att=4.265, loss_ctc=9.938, acc=0.849, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.265e-04, train_time=0.183 -[v016] 2022-01-31 04:31:50,640 (trainer:653) INFO: 29epoch:train:514-540batch: iter_time=0.089, forward_time=0.035, loss=8.073, loss_att=4.766, loss_ctc=11.381, acc=0.853, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.268e-04, train_time=0.193 -[v016] 2022-01-31 04:32:36,025 (trainer:328) INFO: 29epoch results: [train] iter_time=0.051, forward_time=0.041, loss=7.649, loss_att=4.515, loss_ctc=10.784, acc=0.852, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.247e-04, train_time=0.162, time=1 minute and 29.98 seconds, total_count=15863, gpu_max_cached_mem_GB=5.822, [valid] loss=8.371, loss_att=5.719, loss_ctc=11.022, acc=0.853, cer=0.173, wer=0.574, cer_ctc=0.277, time=10.65 seconds, total_count=5162, gpu_max_cached_mem_GB=5.822, [att_plot] time=32.87 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 04:32:38,459 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 04:32:38,462 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/24epoch.pth -[v016] 2022-01-31 04:32:38,462 (trainer:261) INFO: 30/200epoch started. Estimated time to finish: 7 hours, 44 minutes and 7.58 seconds -[v016] 2022-01-31 04:32:43,778 (trainer:653) INFO: 30epoch:train:1-27batch: iter_time=0.086, forward_time=0.036, loss=7.815, loss_att=4.501, loss_ctc=11.130, acc=0.853, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.270e-04, train_time=0.193 -[v016] 2022-01-31 04:32:47,741 (trainer:653) INFO: 30epoch:train:28-54batch: iter_time=0.042, forward_time=0.036, loss=7.774, loss_att=4.552, loss_ctc=10.996, acc=0.849, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.272e-04, train_time=0.148 -[v016] 2022-01-31 04:32:52,610 (trainer:653) INFO: 30epoch:train:55-81batch: iter_time=0.077, forward_time=0.035, loss=7.662, loss_att=4.467, loss_ctc=10.856, acc=0.852, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.275e-04, train_time=0.180 -[v016] 2022-01-31 04:32:56,857 (trainer:653) INFO: 30epoch:train:82-108batch: iter_time=0.056, forward_time=0.034, loss=6.737, loss_att=3.873, loss_ctc=9.601, acc=0.856, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.277e-04, train_time=0.157 -[v016] 2022-01-31 04:33:03,192 (trainer:653) INFO: 30epoch:train:109-135batch: iter_time=0.072, forward_time=0.065, loss=6.495, loss_att=3.868, loss_ctc=9.121, acc=0.861, backward_time=0.027, optim_step_time=0.046, optim0_lr0=1.279e-04, train_time=0.234 -[v016] 2022-01-31 04:33:07,138 (trainer:653) INFO: 30epoch:train:136-162batch: iter_time=0.041, forward_time=0.036, loss=8.148, loss_att=4.656, loss_ctc=11.639, acc=0.857, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.281e-04, train_time=0.146 -[v016] 2022-01-31 04:33:11,128 (trainer:653) INFO: 30epoch:train:163-189batch: iter_time=0.045, forward_time=0.035, loss=6.719, loss_att=3.957, loss_ctc=9.482, acc=0.865, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.283e-04, train_time=0.148 -[v016] 2022-01-31 04:33:14,890 (trainer:653) INFO: 30epoch:train:190-216batch: iter_time=0.032, forward_time=0.035, loss=6.639, loss_att=4.037, loss_ctc=9.240, acc=0.861, backward_time=0.025, optim_step_time=0.026, optim0_lr0=1.285e-04, train_time=0.139 -[v016] 2022-01-31 04:33:23,145 (trainer:653) INFO: 30epoch:train:217-243batch: iter_time=0.105, forward_time=0.062, loss=7.918, loss_att=4.555, loss_ctc=11.282, acc=0.850, backward_time=0.079, optim_step_time=0.027, optim0_lr0=1.288e-04, train_time=0.306 -[v016] 2022-01-31 04:33:28,642 (trainer:653) INFO: 30epoch:train:244-270batch: iter_time=0.099, forward_time=0.035, loss=8.632, loss_att=5.040, loss_ctc=12.224, acc=0.852, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.290e-04, train_time=0.203 -[v016] 2022-01-31 04:33:35,511 (trainer:653) INFO: 30epoch:train:271-297batch: iter_time=0.139, forward_time=0.036, loss=7.254, loss_att=4.175, loss_ctc=10.334, acc=0.855, backward_time=0.034, optim_step_time=0.023, optim0_lr0=1.292e-04, train_time=0.254 -[v016] 2022-01-31 04:33:40,247 (trainer:653) INFO: 30epoch:train:298-324batch: iter_time=0.070, forward_time=0.035, loss=7.851, loss_att=4.661, loss_ctc=11.040, acc=0.856, backward_time=0.026, optim_step_time=0.023, optim0_lr0=1.294e-04, train_time=0.175 -[v016] 2022-01-31 04:33:46,131 (trainer:653) INFO: 30epoch:train:325-351batch: iter_time=0.112, forward_time=0.036, loss=7.889, loss_att=4.642, loss_ctc=11.135, acc=0.853, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.296e-04, train_time=0.218 -[v016] 2022-01-31 04:33:51,543 (trainer:653) INFO: 30epoch:train:352-378batch: iter_time=0.098, forward_time=0.035, loss=7.871, loss_att=4.673, loss_ctc=11.070, acc=0.854, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.298e-04, train_time=0.200 -[v016] 2022-01-31 04:33:56,243 (trainer:653) INFO: 30epoch:train:379-405batch: iter_time=0.073, forward_time=0.034, loss=6.927, loss_att=4.134, loss_ctc=9.719, acc=0.847, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.300e-04, train_time=0.174 -[v016] 2022-01-31 04:34:00,817 (trainer:653) INFO: 30epoch:train:406-432batch: iter_time=0.067, forward_time=0.034, loss=6.882, loss_att=4.066, loss_ctc=9.698, acc=0.862, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.303e-04, train_time=0.169 -[v016] 2022-01-31 04:34:05,904 (trainer:653) INFO: 30epoch:train:433-459batch: iter_time=0.087, forward_time=0.034, loss=6.545, loss_att=3.780, loss_ctc=9.311, acc=0.862, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.305e-04, train_time=0.188 -[v016] 2022-01-31 04:34:11,608 (trainer:653) INFO: 30epoch:train:460-486batch: iter_time=0.107, forward_time=0.035, loss=7.256, loss_att=4.258, loss_ctc=10.254, acc=0.856, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.307e-04, train_time=0.211 -[v016] 2022-01-31 04:34:16,300 (trainer:653) INFO: 30epoch:train:487-513batch: iter_time=0.069, forward_time=0.036, loss=9.233, loss_att=5.366, loss_ctc=13.100, acc=0.841, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.309e-04, train_time=0.174 -[v016] 2022-01-31 04:34:21,177 (trainer:653) INFO: 30epoch:train:514-540batch: iter_time=0.076, forward_time=0.036, loss=7.428, loss_att=4.226, loss_ctc=10.631, acc=0.858, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.311e-04, train_time=0.180 -[v016] 2022-01-31 04:35:27,427 (trainer:328) INFO: 30epoch results: [train] iter_time=0.078, forward_time=0.038, loss=7.473, loss_att=4.369, loss_ctc=10.576, acc=0.855, backward_time=0.028, optim_step_time=0.025, optim0_lr0=1.291e-04, train_time=0.190, time=1 minute and 44.17 seconds, total_count=16410, gpu_max_cached_mem_GB=5.822, [valid] loss=8.225, loss_att=5.599, loss_ctc=10.851, acc=0.856, cer=0.173, wer=0.573, cer_ctc=0.286, time=30.3 seconds, total_count=5340, gpu_max_cached_mem_GB=5.822, [att_plot] time=34.47 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 04:35:30,397 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc, valid.acc -[v016] 2022-01-31 04:35:30,401 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/25epoch.pth -[v016] 2022-01-31 04:35:30,401 (trainer:261) INFO: 31/200epoch started. Estimated time to finish: 7 hours, 43 minutes and 59.22 seconds -[v016] 2022-01-31 04:35:37,295 (trainer:653) INFO: 31epoch:train:1-27batch: iter_time=0.139, forward_time=0.038, loss=7.766, loss_att=4.538, loss_ctc=10.994, acc=0.857, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.314e-04, train_time=0.249 -[v016] 2022-01-31 04:35:42,142 (trainer:653) INFO: 31epoch:train:28-54batch: iter_time=0.073, forward_time=0.036, loss=8.770, loss_att=5.039, loss_ctc=12.501, acc=0.839, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.316e-04, train_time=0.179 -[v016] 2022-01-31 04:35:45,883 (trainer:653) INFO: 31epoch:train:55-81batch: iter_time=0.035, forward_time=0.035, loss=8.282, loss_att=4.711, loss_ctc=11.853, acc=0.844, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.318e-04, train_time=0.138 -[v016] 2022-01-31 04:35:50,453 (trainer:653) INFO: 31epoch:train:82-108batch: iter_time=0.067, forward_time=0.035, loss=7.510, loss_att=4.340, loss_ctc=10.679, acc=0.861, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.320e-04, train_time=0.169 -[v016] 2022-01-31 04:35:54,822 (trainer:653) INFO: 31epoch:train:109-135batch: iter_time=0.061, forward_time=0.034, loss=6.097, loss_att=3.604, loss_ctc=8.590, acc=0.869, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.323e-04, train_time=0.162 -[v016] 2022-01-31 04:35:58,450 (trainer:653) INFO: 31epoch:train:136-162batch: iter_time=0.033, forward_time=0.034, loss=5.965, loss_att=3.613, loss_ctc=8.316, acc=0.856, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.325e-04, train_time=0.134 -[v016] 2022-01-31 04:36:05,981 (trainer:653) INFO: 31epoch:train:163-189batch: iter_time=0.016, forward_time=0.157, loss=7.771, loss_att=4.405, loss_ctc=11.137, acc=0.861, backward_time=0.045, optim_step_time=0.029, optim0_lr0=1.327e-04, train_time=0.279 -[v016] 2022-01-31 04:36:10,980 (trainer:653) INFO: 31epoch:train:190-216batch: iter_time=0.083, forward_time=0.034, loss=6.262, loss_att=3.731, loss_ctc=8.794, acc=0.869, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.329e-04, train_time=0.185 -[v016] 2022-01-31 04:36:16,027 (trainer:653) INFO: 31epoch:train:217-243batch: iter_time=0.084, forward_time=0.035, loss=7.492, loss_att=4.259, loss_ctc=10.724, acc=0.856, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.331e-04, train_time=0.187 -[v016] 2022-01-31 04:36:21,000 (trainer:653) INFO: 31epoch:train:244-270batch: iter_time=0.075, forward_time=0.039, loss=8.580, loss_att=4.778, loss_ctc=12.383, acc=0.860, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.333e-04, train_time=0.184 -[v016] 2022-01-31 04:36:26,845 (trainer:653) INFO: 31epoch:train:271-297batch: iter_time=0.111, forward_time=0.035, loss=7.605, loss_att=4.526, loss_ctc=10.683, acc=0.854, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.336e-04, train_time=0.216 -[v016] 2022-01-31 04:36:31,115 (trainer:653) INFO: 31epoch:train:298-324batch: iter_time=0.055, forward_time=0.035, loss=5.766, loss_att=3.488, loss_ctc=8.043, acc=0.872, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.338e-04, train_time=0.158 -[v016] 2022-01-31 04:36:36,243 (trainer:653) INFO: 31epoch:train:325-351batch: iter_time=0.082, forward_time=0.036, loss=7.693, loss_att=4.515, loss_ctc=10.870, acc=0.848, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.340e-04, train_time=0.190 -[v016] 2022-01-31 04:36:42,403 (trainer:653) INFO: 31epoch:train:352-378batch: iter_time=0.126, forward_time=0.034, loss=6.393, loss_att=3.810, loss_ctc=8.976, acc=0.863, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.342e-04, train_time=0.228 -[v016] 2022-01-31 04:36:48,369 (trainer:653) INFO: 31epoch:train:379-405batch: iter_time=0.117, forward_time=0.036, loss=8.333, loss_att=4.708, loss_ctc=11.958, acc=0.851, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.344e-04, train_time=0.221 -[v016] 2022-01-31 04:36:53,481 (trainer:653) INFO: 31epoch:train:406-432batch: iter_time=0.084, forward_time=0.036, loss=8.642, loss_att=4.881, loss_ctc=12.404, acc=0.862, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.346e-04, train_time=0.189 -[v016] 2022-01-31 04:36:57,701 (trainer:653) INFO: 31epoch:train:433-459batch: iter_time=0.056, forward_time=0.034, loss=6.084, loss_att=3.622, loss_ctc=8.546, acc=0.868, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.349e-04, train_time=0.156 -[v016] 2022-01-31 04:37:02,523 (trainer:653) INFO: 31epoch:train:460-486batch: iter_time=0.078, forward_time=0.035, loss=7.025, loss_att=4.145, loss_ctc=9.905, acc=0.855, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.351e-04, train_time=0.178 -[v016] 2022-01-31 04:37:07,538 (trainer:653) INFO: 31epoch:train:487-513batch: iter_time=0.079, forward_time=0.037, loss=7.090, loss_att=4.268, loss_ctc=9.912, acc=0.851, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.353e-04, train_time=0.185 -[v016] 2022-01-31 04:37:12,951 (trainer:653) INFO: 31epoch:train:514-540batch: iter_time=0.099, forward_time=0.035, loss=7.177, loss_att=4.245, loss_ctc=10.109, acc=0.850, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.355e-04, train_time=0.200 -[v016] 2022-01-31 04:38:08,231 (trainer:328) INFO: 31epoch results: [train] iter_time=0.078, forward_time=0.041, loss=7.342, loss_att=4.273, loss_ctc=10.411, acc=0.858, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.335e-04, train_time=0.190, time=1 minute and 44.06 seconds, total_count=16957, gpu_max_cached_mem_GB=5.822, [valid] loss=8.032, loss_att=5.484, loss_ctc=10.580, acc=0.860, cer=0.173, wer=0.554, cer_ctc=0.286, time=21.47 seconds, total_count=5518, gpu_max_cached_mem_GB=5.822, [att_plot] time=32.19 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 04:38:12,292 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc, valid.acc -[v016] 2022-01-31 04:38:12,295 (trainer:261) INFO: 32/200epoch started. Estimated time to finish: 7 hours, 40 minutes and 46.79 seconds -[v016] 2022-01-31 04:38:18,712 (trainer:653) INFO: 32epoch:train:1-27batch: iter_time=0.070, forward_time=0.066, loss=8.922, loss_att=5.073, loss_ctc=12.772, acc=0.841, backward_time=0.041, optim_step_time=0.025, optim0_lr0=1.358e-04, train_time=0.231 -[v016] 2022-01-31 04:38:22,500 (trainer:653) INFO: 32epoch:train:28-54batch: iter_time=0.034, forward_time=0.036, loss=7.337, loss_att=4.272, loss_ctc=10.402, acc=0.857, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.360e-04, train_time=0.141 -[v016] 2022-01-31 04:38:27,210 (trainer:653) INFO: 32epoch:train:55-81batch: iter_time=0.071, forward_time=0.035, loss=6.794, loss_att=3.851, loss_ctc=9.737, acc=0.868, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.362e-04, train_time=0.174 -[v016] 2022-01-31 04:38:30,527 (trainer:653) INFO: 32epoch:train:82-108batch: iter_time=0.016, forward_time=0.038, loss=6.893, loss_att=3.978, loss_ctc=9.808, acc=0.859, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.364e-04, train_time=0.123 -[v016] 2022-01-31 04:38:34,117 (trainer:653) INFO: 32epoch:train:109-135batch: iter_time=0.027, forward_time=0.036, loss=8.232, loss_att=4.619, loss_ctc=11.846, acc=0.853, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.366e-04, train_time=0.133 -[v016] 2022-01-31 04:38:38,013 (trainer:653) INFO: 32epoch:train:136-162batch: iter_time=0.040, forward_time=0.035, loss=6.888, loss_att=3.886, loss_ctc=9.889, acc=0.867, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.369e-04, train_time=0.144 -[v016] 2022-01-31 04:38:41,347 (trainer:653) INFO: 32epoch:train:163-189batch: iter_time=0.029, forward_time=0.032, loss=6.115, loss_att=3.529, loss_ctc=8.700, acc=0.872, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.371e-04, train_time=0.123 -[v016] 2022-01-31 04:38:44,721 (trainer:653) INFO: 32epoch:train:190-216batch: iter_time=0.020, forward_time=0.036, loss=6.792, loss_att=3.970, loss_ctc=9.615, acc=0.870, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.373e-04, train_time=0.125 -[v016] 2022-01-31 04:38:48,293 (trainer:653) INFO: 32epoch:train:217-243batch: iter_time=0.025, forward_time=0.036, loss=6.882, loss_att=3.936, loss_ctc=9.827, acc=0.869, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.375e-04, train_time=0.132 -[v016] 2022-01-31 04:38:51,746 (trainer:653) INFO: 32epoch:train:244-270batch: iter_time=0.019, forward_time=0.037, loss=8.671, loss_att=4.999, loss_ctc=12.344, acc=0.842, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.377e-04, train_time=0.128 -[v016] 2022-01-31 04:38:59,702 (trainer:653) INFO: 32epoch:train:271-297batch: iter_time=0.069, forward_time=0.070, loss=7.020, loss_att=4.022, loss_ctc=10.019, acc=0.860, backward_time=0.093, optim_step_time=0.026, optim0_lr0=1.379e-04, train_time=0.294 -[v016] 2022-01-31 04:39:04,534 (trainer:653) INFO: 32epoch:train:298-324batch: iter_time=0.070, forward_time=0.037, loss=7.233, loss_att=4.231, loss_ctc=10.235, acc=0.859, backward_time=0.028, optim_step_time=0.024, optim0_lr0=1.382e-04, train_time=0.179 -[v016] 2022-01-31 04:39:08,410 (trainer:653) INFO: 32epoch:train:325-351batch: iter_time=0.038, forward_time=0.036, loss=5.824, loss_att=3.372, loss_ctc=8.276, acc=0.872, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.384e-04, train_time=0.143 -[v016] 2022-01-31 04:39:12,061 (trainer:653) INFO: 32epoch:train:352-378batch: iter_time=0.030, forward_time=0.036, loss=6.005, loss_att=3.626, loss_ctc=8.385, acc=0.868, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.386e-04, train_time=0.135 -[v016] 2022-01-31 04:39:18,404 (trainer:653) INFO: 32epoch:train:379-405batch: iter_time=0.134, forward_time=0.035, loss=6.993, loss_att=4.043, loss_ctc=9.944, acc=0.861, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.388e-04, train_time=0.235 -[v016] 2022-01-31 04:39:23,201 (trainer:653) INFO: 32epoch:train:406-432batch: iter_time=0.069, forward_time=0.036, loss=7.304, loss_att=4.287, loss_ctc=10.321, acc=0.869, backward_time=0.025, optim_step_time=0.025, optim0_lr0=1.390e-04, train_time=0.177 -[v016] 2022-01-31 04:39:28,761 (trainer:653) INFO: 32epoch:train:433-459batch: iter_time=0.102, forward_time=0.036, loss=7.389, loss_att=4.280, loss_ctc=10.498, acc=0.848, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.392e-04, train_time=0.206 -[v016] 2022-01-31 04:39:34,126 (trainer:653) INFO: 32epoch:train:460-486batch: iter_time=0.097, forward_time=0.034, loss=6.861, loss_att=4.068, loss_ctc=9.653, acc=0.858, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.394e-04, train_time=0.199 -[v016] 2022-01-31 04:39:38,351 (trainer:653) INFO: 32epoch:train:487-513batch: iter_time=0.056, forward_time=0.034, loss=6.610, loss_att=3.891, loss_ctc=9.328, acc=0.861, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.397e-04, train_time=0.156 -[v016] 2022-01-31 04:39:43,279 (trainer:653) INFO: 32epoch:train:514-540batch: iter_time=0.078, forward_time=0.035, loss=7.721, loss_att=4.479, loss_ctc=10.964, acc=0.865, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.399e-04, train_time=0.182 -[v016] 2022-01-31 04:40:51,230 (trainer:328) INFO: 32epoch results: [train] iter_time=0.055, forward_time=0.039, loss=7.131, loss_att=4.127, loss_ctc=10.136, acc=0.861, backward_time=0.029, optim_step_time=0.024, optim0_lr0=1.379e-04, train_time=0.168, time=1 minute and 32.39 seconds, total_count=17504, gpu_max_cached_mem_GB=5.822, [valid] loss=7.883, loss_att=5.442, loss_ctc=10.324, acc=0.865, cer=0.163, wer=0.542, cer_ctc=0.259, time=26.22 seconds, total_count=5696, gpu_max_cached_mem_GB=5.822, [att_plot] time=40.24 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 04:40:54,102 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc, valid.acc -[v016] 2022-01-31 04:40:54,105 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/26epoch.pth, exp/asr_train_asr_raw_en_word/27epoch.pth -[v016] 2022-01-31 04:40:54,105 (trainer:261) INFO: 33/200epoch started. Estimated time to finish: 7 hours, 37 minutes and 38.28 seconds -[v016] 2022-01-31 04:41:04,282 (trainer:653) INFO: 33epoch:train:1-27batch: iter_time=0.161, forward_time=0.094, loss=6.491, loss_att=3.783, loss_ctc=9.200, acc=0.868, backward_time=0.053, optim_step_time=0.025, optim0_lr0=1.402e-04, train_time=0.368 -[v016] 2022-01-31 04:41:10,370 (trainer:653) INFO: 33epoch:train:28-54batch: iter_time=0.120, forward_time=0.036, loss=7.769, loss_att=4.504, loss_ctc=11.035, acc=0.850, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.404e-04, train_time=0.226 -[v016] 2022-01-31 04:41:15,707 (trainer:653) INFO: 33epoch:train:55-81batch: iter_time=0.090, forward_time=0.039, loss=6.841, loss_att=3.920, loss_ctc=9.762, acc=0.864, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.406e-04, train_time=0.197 -[v016] 2022-01-31 04:41:20,800 (trainer:653) INFO: 33epoch:train:82-108batch: iter_time=0.083, forward_time=0.035, loss=6.892, loss_att=3.980, loss_ctc=9.803, acc=0.865, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.408e-04, train_time=0.188 -[v016] 2022-01-31 04:41:27,058 (trainer:653) INFO: 33epoch:train:109-135batch: iter_time=0.124, forward_time=0.036, loss=7.751, loss_att=4.456, loss_ctc=11.047, acc=0.865, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.410e-04, train_time=0.232 -[v016] 2022-01-31 04:41:32,943 (trainer:653) INFO: 33epoch:train:136-162batch: iter_time=0.113, forward_time=0.035, loss=6.299, loss_att=3.623, loss_ctc=8.974, acc=0.876, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.412e-04, train_time=0.218 -[v016] 2022-01-31 04:41:37,401 (trainer:653) INFO: 33epoch:train:163-189batch: iter_time=0.063, forward_time=0.034, loss=6.637, loss_att=3.871, loss_ctc=9.404, acc=0.869, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.414e-04, train_time=0.165 -[v016] 2022-01-31 04:41:42,343 (trainer:653) INFO: 33epoch:train:190-216batch: iter_time=0.083, forward_time=0.034, loss=5.294, loss_att=3.136, loss_ctc=7.451, acc=0.874, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.417e-04, train_time=0.183 -[v016] 2022-01-31 04:41:48,374 (trainer:653) INFO: 33epoch:train:217-243batch: iter_time=0.117, forward_time=0.034, loss=5.925, loss_att=3.439, loss_ctc=8.410, acc=0.868, backward_time=0.024, optim_step_time=0.027, optim0_lr0=1.419e-04, train_time=0.223 -[v016] 2022-01-31 04:41:55,252 (trainer:653) INFO: 33epoch:train:244-270batch: iter_time=0.144, forward_time=0.036, loss=6.702, loss_att=3.917, loss_ctc=9.488, acc=0.866, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.421e-04, train_time=0.250 -[v016] 2022-01-31 04:42:00,688 (trainer:653) INFO: 33epoch:train:271-297batch: iter_time=0.099, forward_time=0.034, loss=6.157, loss_att=3.618, loss_ctc=8.696, acc=0.867, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.423e-04, train_time=0.202 -[v016] 2022-01-31 04:42:05,875 (trainer:653) INFO: 33epoch:train:298-324batch: iter_time=0.091, forward_time=0.034, loss=6.459, loss_att=3.830, loss_ctc=9.087, acc=0.859, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.425e-04, train_time=0.192 -[v016] 2022-01-31 04:42:15,068 (trainer:653) INFO: 33epoch:train:325-351batch: iter_time=0.204, forward_time=0.061, loss=7.495, loss_att=4.313, loss_ctc=10.676, acc=0.857, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.427e-04, train_time=0.340 -[v016] 2022-01-31 04:42:21,847 (trainer:653) INFO: 33epoch:train:352-378batch: iter_time=0.148, forward_time=0.035, loss=7.206, loss_att=4.047, loss_ctc=10.365, acc=0.873, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.430e-04, train_time=0.251 -[v016] 2022-01-31 04:42:30,120 (trainer:653) INFO: 33epoch:train:379-405batch: iter_time=0.201, forward_time=0.036, loss=6.861, loss_att=3.985, loss_ctc=9.736, acc=0.865, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.432e-04, train_time=0.306 -[v016] 2022-01-31 04:42:36,552 (trainer:653) INFO: 33epoch:train:406-432batch: iter_time=0.136, forward_time=0.035, loss=6.314, loss_att=3.685, loss_ctc=8.944, acc=0.866, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.434e-04, train_time=0.238 -[v016] 2022-01-31 04:42:43,109 (trainer:653) INFO: 33epoch:train:433-459batch: iter_time=0.136, forward_time=0.036, loss=8.594, loss_att=4.875, loss_ctc=12.312, acc=0.854, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.436e-04, train_time=0.243 -[v016] 2022-01-31 04:42:48,922 (trainer:653) INFO: 33epoch:train:460-486batch: iter_time=0.111, forward_time=0.036, loss=8.480, loss_att=4.992, loss_ctc=11.968, acc=0.853, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.438e-04, train_time=0.215 -[v016] 2022-01-31 04:42:59,613 (trainer:653) INFO: 33epoch:train:487-513batch: iter_time=0.186, forward_time=0.108, loss=7.430, loss_att=4.270, loss_ctc=10.590, acc=0.863, backward_time=0.032, optim_step_time=0.047, optim0_lr0=1.440e-04, train_time=0.396 -[v016] 2022-01-31 04:43:06,771 (trainer:653) INFO: 33epoch:train:514-540batch: iter_time=0.161, forward_time=0.036, loss=7.086, loss_att=4.045, loss_ctc=10.128, acc=0.862, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.443e-04, train_time=0.265 -[v016] 2022-01-31 04:44:14,218 (trainer:328) INFO: 33epoch results: [train] iter_time=0.129, forward_time=0.043, loss=6.967, loss_att=4.031, loss_ctc=9.903, acc=0.864, backward_time=0.026, optim_step_time=0.025, optim0_lr0=1.422e-04, train_time=0.245, time=2 minutes and 14.35 seconds, total_count=18051, gpu_max_cached_mem_GB=5.822, [valid] loss=7.661, loss_att=5.329, loss_ctc=9.993, acc=0.867, cer=0.159, wer=0.534, cer_ctc=0.249, time=32.08 seconds, total_count=5874, gpu_max_cached_mem_GB=5.822, [att_plot] time=33.5 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 04:44:16,804 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc, valid.acc -[v016] 2022-01-31 04:44:16,807 (trainer:261) INFO: 34/200epoch started. Estimated time to finish: 7 hours, 43 minutes and 19.18 seconds -[v016] 2022-01-31 04:44:21,492 (trainer:653) INFO: 34epoch:train:1-27batch: iter_time=0.060, forward_time=0.036, loss=6.397, loss_att=3.658, loss_ctc=9.137, acc=0.879, backward_time=0.027, optim_step_time=0.023, optim0_lr0=1.445e-04, train_time=0.168 -[v016] 2022-01-31 04:44:25,588 (trainer:653) INFO: 34epoch:train:28-54batch: iter_time=0.048, forward_time=0.036, loss=7.488, loss_att=4.294, loss_ctc=10.683, acc=0.864, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.447e-04, train_time=0.151 -[v016] 2022-01-31 04:44:29,832 (trainer:653) INFO: 34epoch:train:55-81batch: iter_time=0.055, forward_time=0.035, loss=7.094, loss_att=3.965, loss_ctc=10.224, acc=0.874, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.450e-04, train_time=0.157 -[v016] 2022-01-31 04:44:33,452 (trainer:653) INFO: 34epoch:train:82-108batch: iter_time=0.032, forward_time=0.035, loss=6.465, loss_att=3.851, loss_ctc=9.079, acc=0.867, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.452e-04, train_time=0.134 -[v016] 2022-01-31 04:44:36,980 (trainer:653) INFO: 34epoch:train:109-135batch: iter_time=0.027, forward_time=0.036, loss=7.352, loss_att=4.241, loss_ctc=10.464, acc=0.855, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.454e-04, train_time=0.130 -[v016] 2022-01-31 04:44:40,621 (trainer:653) INFO: 34epoch:train:136-162batch: iter_time=0.032, forward_time=0.035, loss=7.315, loss_att=4.029, loss_ctc=10.601, acc=0.867, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.456e-04, train_time=0.135 -[v016] 2022-01-31 04:44:44,222 (trainer:653) INFO: 34epoch:train:163-189batch: iter_time=0.030, forward_time=0.035, loss=7.826, loss_att=4.394, loss_ctc=11.257, acc=0.862, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.458e-04, train_time=0.133 -[v016] 2022-01-31 04:44:47,574 (trainer:653) INFO: 34epoch:train:190-216batch: iter_time=0.018, forward_time=0.035, loss=6.966, loss_att=3.877, loss_ctc=10.056, acc=0.871, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.460e-04, train_time=0.124 -[v016] 2022-01-31 04:44:50,843 (trainer:653) INFO: 34epoch:train:217-243batch: iter_time=0.018, forward_time=0.035, loss=6.983, loss_att=3.967, loss_ctc=10.000, acc=0.865, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.463e-04, train_time=0.121 -[v016] 2022-01-31 04:44:53,952 (trainer:653) INFO: 34epoch:train:244-270batch: iter_time=0.013, forward_time=0.035, loss=6.488, loss_att=3.808, loss_ctc=9.168, acc=0.865, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.465e-04, train_time=0.115 -[v016] 2022-01-31 04:44:57,645 (trainer:653) INFO: 34epoch:train:271-297batch: iter_time=0.033, forward_time=0.035, loss=7.149, loss_att=4.138, loss_ctc=10.160, acc=0.865, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.467e-04, train_time=0.137 -[v016] 2022-01-31 04:45:01,624 (trainer:653) INFO: 34epoch:train:298-324batch: iter_time=0.045, forward_time=0.035, loss=6.651, loss_att=3.781, loss_ctc=9.520, acc=0.873, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.469e-04, train_time=0.147 -[v016] 2022-01-31 04:45:04,613 (trainer:653) INFO: 34epoch:train:325-351batch: iter_time=0.007, forward_time=0.036, loss=7.130, loss_att=4.107, loss_ctc=10.153, acc=0.862, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.471e-04, train_time=0.110 -[v016] 2022-01-31 04:45:08,312 (trainer:653) INFO: 34epoch:train:352-378batch: iter_time=0.037, forward_time=0.034, loss=5.613, loss_att=3.333, loss_ctc=7.894, acc=0.864, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.473e-04, train_time=0.137 -[v016] 2022-01-31 04:45:11,395 (trainer:653) INFO: 34epoch:train:379-405batch: iter_time=0.012, forward_time=0.035, loss=6.365, loss_att=3.706, loss_ctc=9.023, acc=0.866, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.476e-04, train_time=0.114 -[v016] 2022-01-31 04:45:19,764 (trainer:653) INFO: 34epoch:train:406-432batch: iter_time=0.028, forward_time=0.091, loss=5.213, loss_att=3.033, loss_ctc=7.393, acc=0.881, backward_time=0.134, optim_step_time=0.027, optim0_lr0=1.478e-04, train_time=0.310 -[v016] 2022-01-31 04:45:23,824 (trainer:653) INFO: 34epoch:train:433-459batch: iter_time=0.042, forward_time=0.037, loss=9.578, loss_att=5.340, loss_ctc=13.816, acc=0.839, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.480e-04, train_time=0.150 -[v016] 2022-01-31 04:45:28,908 (trainer:653) INFO: 34epoch:train:460-486batch: iter_time=0.080, forward_time=0.037, loss=7.775, loss_att=4.381, loss_ctc=11.169, acc=0.865, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.482e-04, train_time=0.188 -[v016] 2022-01-31 04:45:35,016 (trainer:653) INFO: 34epoch:train:487-513batch: iter_time=0.122, forward_time=0.037, loss=6.004, loss_att=3.551, loss_ctc=8.457, acc=0.874, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.484e-04, train_time=0.226 -[v016] 2022-01-31 04:45:39,488 (trainer:653) INFO: 34epoch:train:514-540batch: iter_time=0.064, forward_time=0.034, loss=6.015, loss_att=3.464, loss_ctc=8.565, acc=0.870, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.486e-04, train_time=0.166 -[v016] 2022-01-31 04:46:27,900 (trainer:328) INFO: 34epoch results: [train] iter_time=0.041, forward_time=0.038, loss=6.875, loss_att=3.938, loss_ctc=9.813, acc=0.867, backward_time=0.030, optim_step_time=0.023, optim0_lr0=1.466e-04, train_time=0.153, time=1 minute and 23.91 seconds, total_count=18598, gpu_max_cached_mem_GB=5.822, [valid] loss=7.956, loss_att=5.465, loss_ctc=10.448, acc=0.864, cer=0.163, wer=0.540, cer_ctc=0.268, time=11.51 seconds, total_count=6052, gpu_max_cached_mem_GB=5.822, [att_plot] time=35.62 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 04:46:30,770 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 04:46:30,773 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/28epoch.pth, exp/asr_train_asr_raw_en_word/29epoch.pth -[v016] 2022-01-31 04:46:30,774 (trainer:261) INFO: 35/200epoch started. Estimated time to finish: 7 hours, 34 minutes and 7.41 seconds -[v016] 2022-01-31 04:46:36,725 (trainer:653) INFO: 35epoch:train:1-27batch: iter_time=0.112, forward_time=0.035, loss=7.521, loss_att=4.248, loss_ctc=10.794, acc=0.859, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.489e-04, train_time=0.218 -[v016] 2022-01-31 04:46:41,342 (trainer:653) INFO: 35epoch:train:28-54batch: iter_time=0.069, forward_time=0.035, loss=6.785, loss_att=3.853, loss_ctc=9.716, acc=0.861, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.491e-04, train_time=0.171 -[v016] 2022-01-31 04:46:45,235 (trainer:653) INFO: 35epoch:train:55-81batch: iter_time=0.040, forward_time=0.035, loss=7.119, loss_att=3.992, loss_ctc=10.246, acc=0.874, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.493e-04, train_time=0.144 -[v016] 2022-01-31 04:46:48,831 (trainer:653) INFO: 35epoch:train:82-108batch: iter_time=0.030, forward_time=0.035, loss=6.531, loss_att=3.794, loss_ctc=9.267, acc=0.872, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.496e-04, train_time=0.133 -[v016] 2022-01-31 04:46:52,797 (trainer:653) INFO: 35epoch:train:109-135batch: iter_time=0.042, forward_time=0.034, loss=5.904, loss_att=3.421, loss_ctc=8.387, acc=0.873, backward_time=0.028, optim_step_time=0.023, optim0_lr0=1.498e-04, train_time=0.147 -[v016] 2022-01-31 04:46:56,186 (trainer:653) INFO: 35epoch:train:136-162batch: iter_time=0.023, forward_time=0.035, loss=5.549, loss_att=3.295, loss_ctc=7.803, acc=0.883, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.500e-04, train_time=0.125 -[v016] 2022-01-31 04:46:59,938 (trainer:653) INFO: 35epoch:train:163-189batch: iter_time=0.031, forward_time=0.037, loss=7.032, loss_att=3.914, loss_ctc=10.150, acc=0.870, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.502e-04, train_time=0.138 -[v016] 2022-01-31 04:47:04,502 (trainer:653) INFO: 35epoch:train:190-216batch: iter_time=0.063, forward_time=0.036, loss=7.283, loss_att=4.107, loss_ctc=10.459, acc=0.863, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.504e-04, train_time=0.169 -[v016] 2022-01-31 04:47:09,253 (trainer:653) INFO: 35epoch:train:217-243batch: iter_time=0.074, forward_time=0.035, loss=6.357, loss_att=3.728, loss_ctc=8.985, acc=0.875, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.506e-04, train_time=0.176 -[v016] 2022-01-31 04:47:13,269 (trainer:653) INFO: 35epoch:train:244-270batch: iter_time=0.044, forward_time=0.036, loss=7.035, loss_att=4.059, loss_ctc=10.012, acc=0.862, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.508e-04, train_time=0.148 -[v016] 2022-01-31 04:47:16,839 (trainer:653) INFO: 35epoch:train:271-297batch: iter_time=0.029, forward_time=0.035, loss=6.581, loss_att=3.768, loss_ctc=9.395, acc=0.869, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.511e-04, train_time=0.132 -[v016] 2022-01-31 04:47:21,187 (trainer:653) INFO: 35epoch:train:298-324batch: iter_time=0.059, forward_time=0.034, loss=4.942, loss_att=3.001, loss_ctc=6.884, acc=0.885, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.513e-04, train_time=0.161 -[v016] 2022-01-31 04:47:24,888 (trainer:653) INFO: 35epoch:train:325-351batch: iter_time=0.036, forward_time=0.034, loss=6.000, loss_att=3.485, loss_ctc=8.516, acc=0.873, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.515e-04, train_time=0.137 -[v016] 2022-01-31 04:47:28,922 (trainer:653) INFO: 35epoch:train:352-378batch: iter_time=0.044, forward_time=0.035, loss=6.400, loss_att=3.712, loss_ctc=9.088, acc=0.875, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.517e-04, train_time=0.149 -[v016] 2022-01-31 04:47:33,143 (trainer:653) INFO: 35epoch:train:379-405batch: iter_time=0.048, forward_time=0.038, loss=6.820, loss_att=3.912, loss_ctc=9.728, acc=0.879, backward_time=0.025, optim_step_time=0.025, optim0_lr0=1.519e-04, train_time=0.156 -[v016] 2022-01-31 04:47:38,102 (trainer:653) INFO: 35epoch:train:406-432batch: iter_time=0.079, forward_time=0.036, loss=7.838, loss_att=4.354, loss_ctc=11.322, acc=0.862, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.521e-04, train_time=0.183 -[v016] 2022-01-31 04:47:42,160 (trainer:653) INFO: 35epoch:train:433-459batch: iter_time=0.047, forward_time=0.035, loss=6.663, loss_att=3.891, loss_ctc=9.434, acc=0.865, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.524e-04, train_time=0.150 -[v016] 2022-01-31 04:47:52,109 (trainer:653) INFO: 35epoch:train:460-486batch: iter_time=0.091, forward_time=0.168, loss=7.732, loss_att=4.455, loss_ctc=11.008, acc=0.863, backward_time=0.037, optim_step_time=0.029, optim0_lr0=1.526e-04, train_time=0.366 -[v016] 2022-01-31 04:47:57,470 (trainer:653) INFO: 35epoch:train:487-513batch: iter_time=0.092, forward_time=0.036, loss=6.809, loss_att=3.950, loss_ctc=9.668, acc=0.866, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.528e-04, train_time=0.201 -[v016] 2022-01-31 04:48:02,557 (trainer:653) INFO: 35epoch:train:514-540batch: iter_time=0.086, forward_time=0.035, loss=6.517, loss_att=3.752, loss_ctc=9.282, acc=0.868, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.530e-04, train_time=0.188 -[v016] 2022-01-31 04:49:03,923 (trainer:328) INFO: 35epoch results: [train] iter_time=0.057, forward_time=0.042, loss=6.682, loss_att=3.842, loss_ctc=9.522, acc=0.870, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.510e-04, train_time=0.170, time=1 minute and 33.13 seconds, total_count=19145, gpu_max_cached_mem_GB=5.822, [valid] loss=7.530, loss_att=5.248, loss_ctc=9.812, acc=0.870, cer=0.148, wer=0.522, cer_ctc=0.239, time=25.02 seconds, total_count=6230, gpu_max_cached_mem_GB=5.822, [att_plot] time=34.95 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 04:49:06,924 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc, valid.acc -[v016] 2022-01-31 04:49:06,927 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/30epoch.pth -[v016] 2022-01-31 04:49:06,928 (trainer:261) INFO: 36/200epoch started. Estimated time to finish: 7 hours, 29 minutes and 55.41 seconds -[v016] 2022-01-31 04:49:15,717 (trainer:653) INFO: 36epoch:train:1-27batch: iter_time=0.194, forward_time=0.037, loss=5.647, loss_att=3.269, loss_ctc=8.025, acc=0.882, backward_time=0.026, optim_step_time=0.023, optim0_lr0=1.533e-04, train_time=0.311 -[v016] 2022-01-31 04:49:21,559 (trainer:653) INFO: 36epoch:train:28-54batch: iter_time=0.114, forward_time=0.035, loss=6.133, loss_att=3.481, loss_ctc=8.784, acc=0.874, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.535e-04, train_time=0.216 -[v016] 2022-01-31 04:49:26,281 (trainer:653) INFO: 36epoch:train:55-81batch: iter_time=0.060, forward_time=0.035, loss=6.267, loss_att=3.557, loss_ctc=8.978, acc=0.875, backward_time=0.028, optim_step_time=0.032, optim0_lr0=1.537e-04, train_time=0.175 -[v016] 2022-01-31 04:49:31,172 (trainer:653) INFO: 36epoch:train:82-108batch: iter_time=0.074, forward_time=0.037, loss=7.651, loss_att=4.282, loss_ctc=11.021, acc=0.873, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.539e-04, train_time=0.181 -[v016] 2022-01-31 04:49:35,015 (trainer:653) INFO: 36epoch:train:109-135batch: iter_time=0.039, forward_time=0.035, loss=6.589, loss_att=3.625, loss_ctc=9.553, acc=0.875, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.541e-04, train_time=0.142 -[v016] 2022-01-31 04:49:39,984 (trainer:653) INFO: 36epoch:train:136-162batch: iter_time=0.080, forward_time=0.036, loss=7.387, loss_att=4.122, loss_ctc=10.653, acc=0.871, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.544e-04, train_time=0.184 -[v016] 2022-01-31 04:49:44,107 (trainer:653) INFO: 36epoch:train:163-189batch: iter_time=0.052, forward_time=0.034, loss=5.597, loss_att=3.261, loss_ctc=7.933, acc=0.877, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.546e-04, train_time=0.152 -[v016] 2022-01-31 04:49:48,398 (trainer:653) INFO: 36epoch:train:190-216batch: iter_time=0.053, forward_time=0.036, loss=7.863, loss_att=4.443, loss_ctc=11.284, acc=0.872, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.548e-04, train_time=0.159 -[v016] 2022-01-31 04:49:54,205 (trainer:653) INFO: 36epoch:train:217-243batch: iter_time=0.112, forward_time=0.035, loss=6.391, loss_att=3.699, loss_ctc=9.082, acc=0.869, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.550e-04, train_time=0.215 -[v016] 2022-01-31 04:50:00,701 (trainer:653) INFO: 36epoch:train:244-270batch: iter_time=0.099, forward_time=0.067, loss=6.990, loss_att=3.960, loss_ctc=10.019, acc=0.868, backward_time=0.026, optim_step_time=0.023, optim0_lr0=1.552e-04, train_time=0.240 -[v016] 2022-01-31 04:50:07,598 (trainer:653) INFO: 36epoch:train:271-297batch: iter_time=0.151, forward_time=0.036, loss=7.020, loss_att=4.085, loss_ctc=9.956, acc=0.862, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.554e-04, train_time=0.255 -[v016] 2022-01-31 04:50:11,986 (trainer:653) INFO: 36epoch:train:298-324batch: iter_time=0.062, forward_time=0.034, loss=5.280, loss_att=3.178, loss_ctc=7.382, acc=0.889, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.557e-04, train_time=0.162 -[v016] 2022-01-31 04:50:19,095 (trainer:653) INFO: 36epoch:train:325-351batch: iter_time=0.065, forward_time=0.112, loss=5.700, loss_att=3.317, loss_ctc=8.082, acc=0.868, backward_time=0.039, optim_step_time=0.024, optim0_lr0=1.559e-04, train_time=0.263 -[v016] 2022-01-31 04:50:24,815 (trainer:653) INFO: 36epoch:train:352-378batch: iter_time=0.109, forward_time=0.035, loss=6.372, loss_att=3.601, loss_ctc=9.143, acc=0.874, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.561e-04, train_time=0.212 -[v016] 2022-01-31 04:50:29,762 (trainer:653) INFO: 36epoch:train:379-405batch: iter_time=0.086, forward_time=0.033, loss=6.063, loss_att=3.429, loss_ctc=8.697, acc=0.879, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.563e-04, train_time=0.183 -[v016] 2022-01-31 04:50:35,072 (trainer:653) INFO: 36epoch:train:406-432batch: iter_time=0.094, forward_time=0.035, loss=8.325, loss_att=4.608, loss_ctc=12.041, acc=0.860, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.565e-04, train_time=0.196 -[v016] 2022-01-31 04:50:40,203 (trainer:653) INFO: 36epoch:train:433-459batch: iter_time=0.090, forward_time=0.034, loss=6.209, loss_att=3.547, loss_ctc=8.871, acc=0.872, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.567e-04, train_time=0.190 -[v016] 2022-01-31 04:50:45,721 (trainer:653) INFO: 36epoch:train:460-486batch: iter_time=0.100, forward_time=0.036, loss=6.351, loss_att=3.624, loss_ctc=9.079, acc=0.874, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.570e-04, train_time=0.204 -[v016] 2022-01-31 04:50:51,968 (trainer:653) INFO: 36epoch:train:487-513batch: iter_time=0.129, forward_time=0.035, loss=6.509, loss_att=3.710, loss_ctc=9.308, acc=0.875, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.572e-04, train_time=0.231 -[v016] 2022-01-31 04:50:57,506 (trainer:653) INFO: 36epoch:train:514-540batch: iter_time=0.100, forward_time=0.036, loss=7.366, loss_att=4.115, loss_ctc=10.616, acc=0.870, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.574e-04, train_time=0.205 -[v016] 2022-01-31 04:51:52,974 (trainer:328) INFO: 36epoch results: [train] iter_time=0.093, forward_time=0.040, loss=6.572, loss_att=3.737, loss_ctc=9.406, acc=0.873, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.554e-04, train_time=0.204, time=1 minute and 52.03 seconds, total_count=19692, gpu_max_cached_mem_GB=5.822, [valid] loss=7.913, loss_att=5.436, loss_ctc=10.391, acc=0.865, cer=0.161, wer=0.539, cer_ctc=0.259, time=17.67 seconds, total_count=6408, gpu_max_cached_mem_GB=5.822, [att_plot] time=36.32 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 04:51:56,110 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 04:51:56,113 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/31epoch.pth -[v016] 2022-01-31 04:51:56,113 (trainer:261) INFO: 37/200epoch started. Estimated time to finish: 7 hours, 28 minutes and 8.97 seconds -[v016] 2022-01-31 04:52:02,517 (trainer:653) INFO: 37epoch:train:1-27batch: iter_time=0.082, forward_time=0.058, loss=5.500, loss_att=3.241, loss_ctc=7.759, acc=0.881, backward_time=0.040, optim_step_time=0.023, optim0_lr0=1.577e-04, train_time=0.232 -[v016] 2022-01-31 04:52:06,266 (trainer:653) INFO: 37epoch:train:28-54batch: iter_time=0.038, forward_time=0.034, loss=5.213, loss_att=2.849, loss_ctc=7.578, acc=0.892, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.579e-04, train_time=0.139 -[v016] 2022-01-31 04:52:09,638 (trainer:653) INFO: 37epoch:train:55-81batch: iter_time=0.023, forward_time=0.035, loss=6.043, loss_att=3.498, loss_ctc=8.589, acc=0.873, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.581e-04, train_time=0.125 -[v016] 2022-01-31 04:52:13,166 (trainer:653) INFO: 37epoch:train:82-108batch: iter_time=0.028, forward_time=0.035, loss=5.993, loss_att=3.486, loss_ctc=8.500, acc=0.872, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.583e-04, train_time=0.130 -[v016] 2022-01-31 04:52:17,263 (trainer:653) INFO: 37epoch:train:109-135batch: iter_time=0.048, forward_time=0.035, loss=7.146, loss_att=3.980, loss_ctc=10.311, acc=0.873, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.585e-04, train_time=0.151 -[v016] 2022-01-31 04:52:21,139 (trainer:653) INFO: 37epoch:train:136-162batch: iter_time=0.041, forward_time=0.035, loss=6.183, loss_att=3.501, loss_ctc=8.864, acc=0.870, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.587e-04, train_time=0.143 -[v016] 2022-01-31 04:52:24,895 (trainer:653) INFO: 37epoch:train:163-189batch: iter_time=0.036, forward_time=0.035, loss=6.947, loss_att=3.937, loss_ctc=9.958, acc=0.869, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.590e-04, train_time=0.139 -[v016] 2022-01-31 04:52:27,810 (trainer:653) INFO: 37epoch:train:190-216batch: iter_time=0.004, forward_time=0.035, loss=7.248, loss_att=4.016, loss_ctc=10.479, acc=0.866, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.592e-04, train_time=0.108 -[v016] 2022-01-31 04:52:30,808 (trainer:653) INFO: 37epoch:train:217-243batch: iter_time=0.007, forward_time=0.035, loss=7.058, loss_att=3.985, loss_ctc=10.132, acc=0.860, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.594e-04, train_time=0.111 -[v016] 2022-01-31 04:52:34,243 (trainer:653) INFO: 37epoch:train:244-270batch: iter_time=0.024, forward_time=0.034, loss=5.643, loss_att=3.252, loss_ctc=8.035, acc=0.873, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.596e-04, train_time=0.127 -[v016] 2022-01-31 04:52:37,450 (trainer:653) INFO: 37epoch:train:271-297batch: iter_time=0.008, forward_time=0.040, loss=7.257, loss_att=4.061, loss_ctc=10.454, acc=0.875, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.598e-04, train_time=0.118 -[v016] 2022-01-31 04:52:41,530 (trainer:653) INFO: 37epoch:train:298-324batch: iter_time=0.044, forward_time=0.036, loss=7.829, loss_att=4.401, loss_ctc=11.258, acc=0.865, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.600e-04, train_time=0.151 -[v016] 2022-01-31 04:52:45,694 (trainer:653) INFO: 37epoch:train:325-351batch: iter_time=0.052, forward_time=0.035, loss=6.941, loss_att=3.969, loss_ctc=9.913, acc=0.850, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.602e-04, train_time=0.154 -[v016] 2022-01-31 04:52:49,723 (trainer:653) INFO: 37epoch:train:352-378batch: iter_time=0.047, forward_time=0.035, loss=6.317, loss_att=3.599, loss_ctc=9.035, acc=0.875, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.605e-04, train_time=0.149 -[v016] 2022-01-31 04:52:53,746 (trainer:653) INFO: 37epoch:train:379-405batch: iter_time=0.044, forward_time=0.035, loss=7.455, loss_att=4.135, loss_ctc=10.775, acc=0.864, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.607e-04, train_time=0.149 -[v016] 2022-01-31 04:52:56,896 (trainer:653) INFO: 37epoch:train:406-432batch: iter_time=0.010, forward_time=0.036, loss=7.198, loss_att=4.125, loss_ctc=10.272, acc=0.871, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.609e-04, train_time=0.116 -[v016] 2022-01-31 04:53:00,083 (trainer:653) INFO: 37epoch:train:433-459batch: iter_time=0.014, forward_time=0.035, loss=6.183, loss_att=3.571, loss_ctc=8.796, acc=0.874, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.611e-04, train_time=0.118 -[v016] 2022-01-31 04:53:05,536 (trainer:653) INFO: 37epoch:train:460-486batch: iter_time=0.027, forward_time=0.068, loss=6.227, loss_att=3.655, loss_ctc=8.800, acc=0.862, backward_time=0.029, optim_step_time=0.049, optim0_lr0=1.613e-04, train_time=0.202 -[v016] 2022-01-31 04:53:09,546 (trainer:653) INFO: 37epoch:train:487-513batch: iter_time=0.048, forward_time=0.034, loss=4.664, loss_att=2.731, loss_ctc=6.597, acc=0.888, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.615e-04, train_time=0.148 -[v016] 2022-01-31 04:53:14,982 (trainer:653) INFO: 37epoch:train:514-540batch: iter_time=0.097, forward_time=0.035, loss=6.161, loss_att=3.390, loss_ctc=8.932, acc=0.886, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.618e-04, train_time=0.201 -[v016] 2022-01-31 04:54:12,145 (trainer:328) INFO: 37epoch results: [train] iter_time=0.037, forward_time=0.038, loss=6.459, loss_att=3.664, loss_ctc=9.255, acc=0.872, backward_time=0.025, optim_step_time=0.025, optim0_lr0=1.597e-04, train_time=0.146, time=1 minute and 20.36 seconds, total_count=20239, gpu_max_cached_mem_GB=5.822, [valid] loss=7.465, loss_att=5.287, loss_ctc=9.643, acc=0.870, cer=0.152, wer=0.521, cer_ctc=0.244, time=18.35 seconds, total_count=6586, gpu_max_cached_mem_GB=5.822, [att_plot] time=37.2 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 04:54:14,671 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss -[v016] 2022-01-31 04:54:14,674 (trainer:261) INFO: 38/200epoch started. Estimated time to finish: 7 hours, 21 minutes and 21.5 seconds -[v016] 2022-01-31 04:54:23,860 (trainer:653) INFO: 38epoch:train:1-27batch: iter_time=0.189, forward_time=0.057, loss=6.623, loss_att=3.674, loss_ctc=9.571, acc=0.880, backward_time=0.038, optim_step_time=0.024, optim0_lr0=1.620e-04, train_time=0.332 -[v016] 2022-01-31 04:54:28,857 (trainer:653) INFO: 38epoch:train:28-54batch: iter_time=0.078, forward_time=0.036, loss=5.712, loss_att=3.140, loss_ctc=8.284, acc=0.887, backward_time=0.025, optim_step_time=0.026, optim0_lr0=1.622e-04, train_time=0.185 -[v016] 2022-01-31 04:54:34,087 (trainer:653) INFO: 38epoch:train:55-81batch: iter_time=0.090, forward_time=0.036, loss=6.063, loss_att=3.439, loss_ctc=8.688, acc=0.876, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.625e-04, train_time=0.193 -[v016] 2022-01-31 04:54:39,292 (trainer:653) INFO: 38epoch:train:82-108batch: iter_time=0.089, forward_time=0.036, loss=7.549, loss_att=4.248, loss_ctc=10.849, acc=0.859, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.627e-04, train_time=0.193 -[v016] 2022-01-31 04:54:42,408 (trainer:653) INFO: 38epoch:train:109-135batch: iter_time=0.013, forward_time=0.035, loss=6.598, loss_att=3.705, loss_ctc=9.492, acc=0.868, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.629e-04, train_time=0.115 -[v016] 2022-01-31 04:54:46,818 (trainer:653) INFO: 38epoch:train:136-162batch: iter_time=0.054, forward_time=0.037, loss=6.500, loss_att=3.668, loss_ctc=9.333, acc=0.878, backward_time=0.025, optim_step_time=0.025, optim0_lr0=1.631e-04, train_time=0.163 -[v016] 2022-01-31 04:54:51,902 (trainer:653) INFO: 38epoch:train:163-189batch: iter_time=0.084, forward_time=0.036, loss=5.930, loss_att=3.305, loss_ctc=8.555, acc=0.886, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.633e-04, train_time=0.188 -[v016] 2022-01-31 04:54:56,653 (trainer:653) INFO: 38epoch:train:190-216batch: iter_time=0.074, forward_time=0.034, loss=5.153, loss_att=3.012, loss_ctc=7.293, acc=0.880, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.635e-04, train_time=0.176 -[v016] 2022-01-31 04:55:01,396 (trainer:653) INFO: 38epoch:train:217-243batch: iter_time=0.070, forward_time=0.037, loss=5.384, loss_att=3.104, loss_ctc=7.664, acc=0.874, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.638e-04, train_time=0.175 -[v016] 2022-01-31 04:55:06,807 (trainer:653) INFO: 38epoch:train:244-270batch: iter_time=0.088, forward_time=0.042, loss=7.431, loss_att=4.106, loss_ctc=10.755, acc=0.873, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.640e-04, train_time=0.200 -[v016] 2022-01-31 04:55:12,670 (trainer:653) INFO: 38epoch:train:271-297batch: iter_time=0.109, forward_time=0.037, loss=6.223, loss_att=3.435, loss_ctc=9.012, acc=0.895, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.642e-04, train_time=0.217 -[v016] 2022-01-31 04:55:18,082 (trainer:653) INFO: 38epoch:train:298-324batch: iter_time=0.094, forward_time=0.036, loss=7.089, loss_att=3.995, loss_ctc=10.183, acc=0.874, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.644e-04, train_time=0.200 -[v016] 2022-01-31 04:55:26,015 (trainer:653) INFO: 38epoch:train:325-351batch: iter_time=0.146, forward_time=0.071, loss=6.025, loss_att=3.386, loss_ctc=8.664, acc=0.876, backward_time=0.027, optim_step_time=0.025, optim0_lr0=1.646e-04, train_time=0.294 -[v016] 2022-01-31 04:55:31,421 (trainer:653) INFO: 38epoch:train:352-378batch: iter_time=0.099, forward_time=0.034, loss=5.588, loss_att=3.170, loss_ctc=8.005, acc=0.886, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.648e-04, train_time=0.200 -[v016] 2022-01-31 04:55:39,614 (trainer:653) INFO: 38epoch:train:379-405batch: iter_time=0.122, forward_time=0.093, loss=6.087, loss_att=3.430, loss_ctc=8.744, acc=0.878, backward_time=0.026, optim_step_time=0.041, optim0_lr0=1.651e-04, train_time=0.303 -[v016] 2022-01-31 04:55:47,574 (trainer:653) INFO: 38epoch:train:406-432batch: iter_time=0.194, forward_time=0.034, loss=5.797, loss_att=3.283, loss_ctc=8.311, acc=0.877, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.653e-04, train_time=0.295 -[v016] 2022-01-31 04:55:55,551 (trainer:653) INFO: 38epoch:train:433-459batch: iter_time=0.192, forward_time=0.035, loss=6.578, loss_att=3.676, loss_ctc=9.480, acc=0.879, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.655e-04, train_time=0.295 -[v016] 2022-01-31 04:56:03,179 (trainer:653) INFO: 38epoch:train:460-486batch: iter_time=0.142, forward_time=0.054, loss=6.551, loss_att=3.552, loss_ctc=9.550, acc=0.879, backward_time=0.042, optim_step_time=0.023, optim0_lr0=1.657e-04, train_time=0.282 -[v016] 2022-01-31 04:56:09,339 (trainer:653) INFO: 38epoch:train:487-513batch: iter_time=0.124, forward_time=0.035, loss=7.088, loss_att=4.069, loss_ctc=10.106, acc=0.870, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.659e-04, train_time=0.228 -[v016] 2022-01-31 04:56:15,163 (trainer:653) INFO: 38epoch:train:514-540batch: iter_time=0.115, forward_time=0.034, loss=6.068, loss_att=3.454, loss_ctc=8.683, acc=0.875, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.661e-04, train_time=0.215 -[v016] 2022-01-31 04:57:17,963 (trainer:328) INFO: 38epoch results: [train] iter_time=0.108, forward_time=0.042, loss=6.311, loss_att=3.548, loss_ctc=9.075, acc=0.877, backward_time=0.026, optim_step_time=0.025, optim0_lr0=1.641e-04, train_time=0.223, time=2 minutes and 2.14 seconds, total_count=20786, gpu_max_cached_mem_GB=5.822, [valid] loss=7.668, loss_att=5.316, loss_ctc=10.021, acc=0.870, cer=0.151, wer=0.524, cer_ctc=0.252, time=28.41 seconds, total_count=6764, gpu_max_cached_mem_GB=5.822, [att_plot] time=32.61 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 04:57:21,135 (trainer:375) INFO: The best model has been updated: train.loss, train.acc, valid.acc -[v016] 2022-01-31 04:57:21,138 (trainer:261) INFO: 39/200epoch started. Estimated time to finish: 7 hours, 22 minutes and 15.04 seconds -[v016] 2022-01-31 04:57:25,722 (trainer:653) INFO: 39epoch:train:1-27batch: iter_time=0.055, forward_time=0.036, loss=6.046, loss_att=3.403, loss_ctc=8.689, acc=0.881, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.664e-04, train_time=0.161 -[v016] 2022-01-31 04:57:31,071 (trainer:653) INFO: 39epoch:train:28-54batch: iter_time=0.092, forward_time=0.037, loss=6.496, loss_att=3.632, loss_ctc=9.361, acc=0.878, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.666e-04, train_time=0.198 -[v016] 2022-01-31 04:57:34,722 (trainer:653) INFO: 39epoch:train:55-81batch: iter_time=0.033, forward_time=0.034, loss=5.530, loss_att=3.165, loss_ctc=7.896, acc=0.879, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.668e-04, train_time=0.135 -[v016] 2022-01-31 04:57:39,003 (trainer:653) INFO: 39epoch:train:82-108batch: iter_time=0.055, forward_time=0.035, loss=5.675, loss_att=3.251, loss_ctc=8.099, acc=0.881, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.671e-04, train_time=0.158 -[v016] 2022-01-31 04:57:41,902 (trainer:653) INFO: 39epoch:train:109-135batch: iter_time=0.002, forward_time=0.036, loss=6.458, loss_att=3.595, loss_ctc=9.322, acc=0.879, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.673e-04, train_time=0.107 -[v016] 2022-01-31 04:57:45,441 (trainer:653) INFO: 39epoch:train:136-162batch: iter_time=0.028, forward_time=0.035, loss=6.791, loss_att=3.710, loss_ctc=9.872, acc=0.868, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.675e-04, train_time=0.131 -[v016] 2022-01-31 04:57:48,305 (trainer:653) INFO: 39epoch:train:163-189batch: iter_time=8.884e-04, forward_time=0.036, loss=6.825, loss_att=3.716, loss_ctc=9.935, acc=0.875, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.677e-04, train_time=0.106 -[v016] 2022-01-31 04:57:53,344 (trainer:653) INFO: 39epoch:train:190-216batch: iter_time=0.013, forward_time=0.066, loss=5.806, loss_att=3.216, loss_ctc=8.397, acc=0.885, backward_time=0.029, optim_step_time=0.027, optim0_lr0=1.679e-04, train_time=0.186 -[v016] 2022-01-31 04:57:57,112 (trainer:653) INFO: 39epoch:train:217-243batch: iter_time=0.036, forward_time=0.035, loss=6.601, loss_att=3.686, loss_ctc=9.516, acc=0.878, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.681e-04, train_time=0.139 -[v016] 2022-01-31 04:58:01,228 (trainer:653) INFO: 39epoch:train:244-270batch: iter_time=0.048, forward_time=0.036, loss=7.730, loss_att=4.233, loss_ctc=11.227, acc=0.869, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.684e-04, train_time=0.152 -[v016] 2022-01-31 04:58:04,432 (trainer:653) INFO: 39epoch:train:271-297batch: iter_time=0.015, forward_time=0.035, loss=5.721, loss_att=3.252, loss_ctc=8.190, acc=0.871, backward_time=0.024, optim_step_time=0.025, optim0_lr0=1.686e-04, train_time=0.118 -[v016] 2022-01-31 04:58:08,246 (trainer:653) INFO: 39epoch:train:298-324batch: iter_time=0.037, forward_time=0.035, loss=5.347, loss_att=3.031, loss_ctc=7.663, acc=0.894, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.688e-04, train_time=0.141 -[v016] 2022-01-31 04:58:11,305 (trainer:653) INFO: 39epoch:train:325-351batch: iter_time=0.010, forward_time=0.035, loss=5.543, loss_att=3.180, loss_ctc=7.907, acc=0.876, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.690e-04, train_time=0.113 -[v016] 2022-01-31 04:58:14,801 (trainer:653) INFO: 39epoch:train:352-378batch: iter_time=0.024, forward_time=0.036, loss=6.357, loss_att=3.444, loss_ctc=9.271, acc=0.888, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.692e-04, train_time=0.129 -[v016] 2022-01-31 04:58:17,829 (trainer:653) INFO: 39epoch:train:379-405batch: iter_time=0.003, forward_time=0.035, loss=6.739, loss_att=3.656, loss_ctc=9.823, acc=0.879, backward_time=0.025, optim_step_time=0.025, optim0_lr0=1.694e-04, train_time=0.111 -[v016] 2022-01-31 04:58:27,473 (trainer:653) INFO: 39epoch:train:406-432batch: iter_time=0.141, forward_time=0.111, loss=5.498, loss_att=3.122, loss_ctc=7.874, acc=0.884, backward_time=0.031, optim_step_time=0.029, optim0_lr0=1.696e-04, train_time=0.357 -[v016] 2022-01-31 04:58:31,844 (trainer:653) INFO: 39epoch:train:433-459batch: iter_time=0.056, forward_time=0.038, loss=5.729, loss_att=3.246, loss_ctc=8.211, acc=0.885, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.699e-04, train_time=0.162 -[v016] 2022-01-31 04:58:36,165 (trainer:653) INFO: 39epoch:train:460-486batch: iter_time=0.058, forward_time=0.034, loss=5.895, loss_att=3.291, loss_ctc=8.499, acc=0.877, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.701e-04, train_time=0.160 -[v016] 2022-01-31 04:58:39,687 (trainer:653) INFO: 39epoch:train:487-513batch: iter_time=0.027, forward_time=0.035, loss=5.302, loss_att=2.967, loss_ctc=7.638, acc=0.885, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.703e-04, train_time=0.130 -[v016] 2022-01-31 04:58:44,421 (trainer:653) INFO: 39epoch:train:514-540batch: iter_time=0.069, forward_time=0.036, loss=7.239, loss_att=4.009, loss_ctc=10.468, acc=0.881, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.705e-04, train_time=0.175 -[v016] 2022-01-31 04:59:29,324 (trainer:328) INFO: 39epoch results: [train] iter_time=0.040, forward_time=0.041, loss=6.180, loss_att=3.448, loss_ctc=8.912, acc=0.880, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.685e-04, train_time=0.153, time=1 minute and 24.26 seconds, total_count=21333, gpu_max_cached_mem_GB=5.822, [valid] loss=7.389, loss_att=5.264, loss_ctc=9.513, acc=0.876, cer=0.143, wer=0.506, cer_ctc=0.238, time=11.21 seconds, total_count=6942, gpu_max_cached_mem_GB=5.822, [att_plot] time=32.57 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 04:59:32,439 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc, valid.acc -[v016] 2022-01-31 04:59:32,442 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/32epoch.pth, exp/asr_train_asr_raw_en_word/34epoch.pth -[v016] 2022-01-31 04:59:32,443 (trainer:261) INFO: 40/200epoch started. Estimated time to finish: 7 hours, 14 minutes and 55.92 seconds -[v016] 2022-01-31 04:59:38,518 (trainer:653) INFO: 40epoch:train:1-27batch: iter_time=0.111, forward_time=0.036, loss=6.987, loss_att=3.794, loss_ctc=10.179, acc=0.880, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.708e-04, train_time=0.219 -[v016] 2022-01-31 04:59:44,140 (trainer:653) INFO: 40epoch:train:28-54batch: iter_time=0.105, forward_time=0.035, loss=6.756, loss_att=3.845, loss_ctc=9.666, acc=0.877, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.710e-04, train_time=0.208 -[v016] 2022-01-31 04:59:48,133 (trainer:653) INFO: 40epoch:train:55-81batch: iter_time=0.046, forward_time=0.035, loss=5.919, loss_att=3.255, loss_ctc=8.583, acc=0.876, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.712e-04, train_time=0.148 -[v016] 2022-01-31 04:59:52,077 (trainer:653) INFO: 40epoch:train:82-108batch: iter_time=0.044, forward_time=0.035, loss=5.097, loss_att=2.931, loss_ctc=7.264, acc=0.896, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.714e-04, train_time=0.146 -[v016] 2022-01-31 04:59:56,985 (trainer:653) INFO: 40epoch:train:109-135batch: iter_time=0.079, forward_time=0.034, loss=6.364, loss_att=3.396, loss_ctc=9.331, acc=0.886, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.716e-04, train_time=0.182 -[v016] 2022-01-31 05:00:02,224 (trainer:653) INFO: 40epoch:train:136-162batch: iter_time=0.091, forward_time=0.035, loss=5.763, loss_att=3.239, loss_ctc=8.286, acc=0.887, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.719e-04, train_time=0.194 -[v016] 2022-01-31 05:00:07,725 (trainer:653) INFO: 40epoch:train:163-189batch: iter_time=0.098, forward_time=0.036, loss=7.012, loss_att=3.985, loss_ctc=10.039, acc=0.868, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.721e-04, train_time=0.204 -[v016] 2022-01-31 05:00:12,617 (trainer:653) INFO: 40epoch:train:190-216batch: iter_time=0.078, forward_time=0.035, loss=6.835, loss_att=3.768, loss_ctc=9.903, acc=0.872, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.723e-04, train_time=0.181 -[v016] 2022-01-31 05:00:18,475 (trainer:653) INFO: 40epoch:train:217-243batch: iter_time=0.055, forward_time=0.080, loss=5.515, loss_att=3.111, loss_ctc=7.920, acc=0.889, backward_time=0.030, optim_step_time=0.027, optim0_lr0=1.725e-04, train_time=0.214 -[v016] 2022-01-31 05:00:21,917 (trainer:653) INFO: 40epoch:train:244-270batch: iter_time=0.025, forward_time=0.035, loss=5.868, loss_att=3.224, loss_ctc=8.512, acc=0.877, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.727e-04, train_time=0.127 -[v016] 2022-01-31 05:00:25,803 (trainer:653) INFO: 40epoch:train:271-297batch: iter_time=0.043, forward_time=0.034, loss=5.416, loss_att=2.982, loss_ctc=7.851, acc=0.897, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.729e-04, train_time=0.144 -[v016] 2022-01-31 05:00:30,224 (trainer:653) INFO: 40epoch:train:298-324batch: iter_time=0.054, forward_time=0.039, loss=7.067, loss_att=3.871, loss_ctc=10.262, acc=0.879, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.732e-04, train_time=0.163 -[v016] 2022-01-31 05:00:34,656 (trainer:653) INFO: 40epoch:train:325-351batch: iter_time=0.056, forward_time=0.038, loss=5.694, loss_att=3.129, loss_ctc=8.260, acc=0.881, backward_time=0.025, optim_step_time=0.025, optim0_lr0=1.734e-04, train_time=0.163 -[v016] 2022-01-31 05:00:38,627 (trainer:653) INFO: 40epoch:train:352-378batch: iter_time=0.046, forward_time=0.034, loss=5.411, loss_att=3.158, loss_ctc=7.664, acc=0.877, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.736e-04, train_time=0.147 -[v016] 2022-01-31 05:00:41,834 (trainer:653) INFO: 40epoch:train:379-405batch: iter_time=0.017, forward_time=0.034, loss=5.544, loss_att=3.124, loss_ctc=7.963, acc=0.892, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.738e-04, train_time=0.119 -[v016] 2022-01-31 05:00:46,395 (trainer:653) INFO: 40epoch:train:406-432batch: iter_time=0.061, forward_time=0.037, loss=5.613, loss_att=3.128, loss_ctc=8.098, acc=0.891, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.740e-04, train_time=0.169 -[v016] 2022-01-31 05:00:53,613 (trainer:653) INFO: 40epoch:train:433-459batch: iter_time=0.079, forward_time=0.106, loss=5.799, loss_att=3.333, loss_ctc=8.265, acc=0.876, backward_time=0.033, optim_step_time=0.023, optim0_lr0=1.742e-04, train_time=0.267 -[v016] 2022-01-31 05:00:59,525 (trainer:653) INFO: 40epoch:train:460-486batch: iter_time=0.116, forward_time=0.036, loss=5.691, loss_att=3.185, loss_ctc=8.197, acc=0.874, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.745e-04, train_time=0.219 -[v016] 2022-01-31 05:01:05,205 (trainer:653) INFO: 40epoch:train:487-513batch: iter_time=0.107, forward_time=0.036, loss=6.411, loss_att=3.568, loss_ctc=9.255, acc=0.878, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.747e-04, train_time=0.210 -[v016] 2022-01-31 05:01:12,397 (trainer:653) INFO: 40epoch:train:514-540batch: iter_time=0.163, forward_time=0.035, loss=6.478, loss_att=3.563, loss_ctc=9.392, acc=0.867, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.749e-04, train_time=0.266 -[v016] 2022-01-31 05:02:16,675 (trainer:328) INFO: 40epoch results: [train] iter_time=0.074, forward_time=0.041, loss=6.060, loss_att=3.377, loss_ctc=8.742, acc=0.881, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.729e-04, train_time=0.185, time=1 minute and 41.43 seconds, total_count=21880, gpu_max_cached_mem_GB=5.822, [valid] loss=7.456, loss_att=5.257, loss_ctc=9.656, acc=0.875, cer=0.139, wer=0.497, cer_ctc=0.232, time=26.03 seconds, total_count=7120, gpu_max_cached_mem_GB=5.822, [att_plot] time=36.69 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 05:02:19,600 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 05:02:19,603 (trainer:261) INFO: 41/200epoch started. Estimated time to finish: 7 hours, 12 minutes and 54.43 seconds -[v016] 2022-01-31 05:02:28,485 (trainer:653) INFO: 41epoch:train:1-27batch: iter_time=0.176, forward_time=0.057, loss=5.103, loss_att=2.863, loss_ctc=7.343, acc=0.895, backward_time=0.037, optim_step_time=0.025, optim0_lr0=1.752e-04, train_time=0.324 -[v016] 2022-01-31 05:02:34,145 (trainer:653) INFO: 41epoch:train:28-54batch: iter_time=0.105, forward_time=0.036, loss=6.114, loss_att=3.201, loss_ctc=9.028, acc=0.888, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.754e-04, train_time=0.210 -[v016] 2022-01-31 05:02:39,454 (trainer:653) INFO: 41epoch:train:55-81batch: iter_time=0.091, forward_time=0.038, loss=5.896, loss_att=3.179, loss_ctc=8.613, acc=0.884, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.756e-04, train_time=0.196 -[v016] 2022-01-31 05:02:44,846 (trainer:653) INFO: 41epoch:train:82-108batch: iter_time=0.097, forward_time=0.035, loss=5.404, loss_att=3.079, loss_ctc=7.730, acc=0.892, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.758e-04, train_time=0.199 -[v016] 2022-01-31 05:02:49,199 (trainer:653) INFO: 41epoch:train:109-135batch: iter_time=0.059, forward_time=0.035, loss=6.288, loss_att=3.390, loss_ctc=9.185, acc=0.878, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.760e-04, train_time=0.161 -[v016] 2022-01-31 05:02:53,983 (trainer:653) INFO: 41epoch:train:136-162batch: iter_time=0.074, forward_time=0.035, loss=5.425, loss_att=3.154, loss_ctc=7.696, acc=0.884, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.762e-04, train_time=0.177 -[v016] 2022-01-31 05:02:58,499 (trainer:653) INFO: 41epoch:train:163-189batch: iter_time=0.067, forward_time=0.035, loss=5.806, loss_att=3.143, loss_ctc=8.469, acc=0.882, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.765e-04, train_time=0.167 -[v016] 2022-01-31 05:03:03,734 (trainer:653) INFO: 41epoch:train:190-216batch: iter_time=0.095, forward_time=0.034, loss=5.994, loss_att=3.227, loss_ctc=8.762, acc=0.891, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.767e-04, train_time=0.194 -[v016] 2022-01-31 05:03:08,284 (trainer:653) INFO: 41epoch:train:217-243batch: iter_time=0.069, forward_time=0.034, loss=5.314, loss_att=2.963, loss_ctc=7.666, acc=0.885, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.769e-04, train_time=0.168 -[v016] 2022-01-31 05:03:12,970 (trainer:653) INFO: 41epoch:train:244-270batch: iter_time=0.072, forward_time=0.035, loss=4.926, loss_att=2.851, loss_ctc=7.001, acc=0.891, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.771e-04, train_time=0.173 -[v016] 2022-01-31 05:03:18,632 (trainer:653) INFO: 41epoch:train:271-297batch: iter_time=0.105, forward_time=0.035, loss=5.818, loss_att=3.279, loss_ctc=8.357, acc=0.892, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.773e-04, train_time=0.209 -[v016] 2022-01-31 05:03:23,627 (trainer:653) INFO: 41epoch:train:298-324batch: iter_time=0.081, forward_time=0.035, loss=6.219, loss_att=3.330, loss_ctc=9.109, acc=0.892, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.775e-04, train_time=0.185 -[v016] 2022-01-31 05:03:29,952 (trainer:653) INFO: 41epoch:train:325-351batch: iter_time=0.133, forward_time=0.034, loss=6.378, loss_att=3.495, loss_ctc=9.261, acc=0.885, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.778e-04, train_time=0.234 -[v016] 2022-01-31 05:03:35,390 (trainer:653) INFO: 41epoch:train:352-378batch: iter_time=0.096, forward_time=0.036, loss=6.980, loss_att=3.826, loss_ctc=10.133, acc=0.882, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.780e-04, train_time=0.201 -[v016] 2022-01-31 05:03:39,956 (trainer:653) INFO: 41epoch:train:379-405batch: iter_time=0.071, forward_time=0.033, loss=6.824, loss_att=3.759, loss_ctc=9.889, acc=0.870, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.782e-04, train_time=0.169 -[v016] 2022-01-31 05:03:44,054 (trainer:653) INFO: 41epoch:train:406-432batch: iter_time=0.049, forward_time=0.035, loss=6.665, loss_att=3.643, loss_ctc=9.687, acc=0.871, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.784e-04, train_time=0.152 -[v016] 2022-01-31 05:03:52,241 (trainer:653) INFO: 41epoch:train:433-459batch: iter_time=0.093, forward_time=0.125, loss=5.387, loss_att=3.051, loss_ctc=7.722, acc=0.888, backward_time=0.033, optim_step_time=0.024, optim0_lr0=1.786e-04, train_time=0.303 -[v016] 2022-01-31 05:03:56,865 (trainer:653) INFO: 41epoch:train:460-486batch: iter_time=0.066, forward_time=0.036, loss=6.903, loss_att=3.770, loss_ctc=10.035, acc=0.876, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.788e-04, train_time=0.171 -[v016] 2022-01-31 05:04:01,727 (trainer:653) INFO: 41epoch:train:487-513batch: iter_time=0.075, forward_time=0.036, loss=6.327, loss_att=3.434, loss_ctc=9.220, acc=0.880, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.790e-04, train_time=0.180 -[v016] 2022-01-31 05:04:06,457 (trainer:653) INFO: 41epoch:train:514-540batch: iter_time=0.069, forward_time=0.036, loss=6.886, loss_att=3.747, loss_ctc=10.024, acc=0.877, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.793e-04, train_time=0.175 -[v016] 2022-01-31 05:05:04,404 (trainer:328) INFO: 41epoch results: [train] iter_time=0.087, forward_time=0.041, loss=6.014, loss_att=3.312, loss_ctc=8.716, acc=0.884, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.772e-04, train_time=0.197, time=1 minute and 48.27 seconds, total_count=22427, gpu_max_cached_mem_GB=5.822, [valid] loss=7.299, loss_att=5.272, loss_ctc=9.327, acc=0.875, cer=0.142, wer=0.506, cer_ctc=0.233, time=26.73 seconds, total_count=7298, gpu_max_cached_mem_GB=5.822, [att_plot] time=29.73 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 05:05:06,658 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc -[v016] 2022-01-31 05:05:06,661 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/33epoch.pth -[v016] 2022-01-31 05:05:06,661 (trainer:261) INFO: 42/200epoch started. Estimated time to finish: 7 hours, 10 minutes and 47.81 seconds -[v016] 2022-01-31 05:05:10,150 (trainer:653) INFO: 42epoch:train:1-27batch: iter_time=0.023, forward_time=0.033, loss=5.365, loss_att=2.915, loss_ctc=7.815, acc=0.891, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.795e-04, train_time=0.122 -[v016] 2022-01-31 05:05:12,752 (trainer:653) INFO: 42epoch:train:28-54batch: iter_time=1.130e-04, forward_time=0.033, loss=5.562, loss_att=3.124, loss_ctc=8.001, acc=0.890, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.798e-04, train_time=0.096 -[v016] 2022-01-31 05:05:15,397 (trainer:653) INFO: 42epoch:train:55-81batch: iter_time=0.001, forward_time=0.033, loss=6.216, loss_att=3.308, loss_ctc=9.124, acc=0.883, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.800e-04, train_time=0.098 -[v016] 2022-01-31 05:05:18,248 (trainer:653) INFO: 42epoch:train:82-108batch: iter_time=0.003, forward_time=0.035, loss=7.611, loss_att=4.031, loss_ctc=11.191, acc=0.875, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.802e-04, train_time=0.105 -[v016] 2022-01-31 05:05:21,364 (trainer:653) INFO: 42epoch:train:109-135batch: iter_time=0.022, forward_time=0.032, loss=5.062, loss_att=2.825, loss_ctc=7.299, acc=0.891, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.804e-04, train_time=0.115 -[v016] 2022-01-31 05:05:24,017 (trainer:653) INFO: 42epoch:train:136-162batch: iter_time=0.003, forward_time=0.033, loss=5.694, loss_att=3.135, loss_ctc=8.253, acc=0.889, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.806e-04, train_time=0.098 -[v016] 2022-01-31 05:05:26,663 (trainer:653) INFO: 42epoch:train:163-189batch: iter_time=7.232e-04, forward_time=0.034, loss=6.529, loss_att=3.598, loss_ctc=9.460, acc=0.885, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.808e-04, train_time=0.098 -[v016] 2022-01-31 05:05:29,554 (trainer:653) INFO: 42epoch:train:190-216batch: iter_time=0.005, forward_time=0.035, loss=8.084, loss_att=4.366, loss_ctc=11.803, acc=0.865, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.810e-04, train_time=0.107 -[v016] 2022-01-31 05:05:32,099 (trainer:653) INFO: 42epoch:train:217-243batch: iter_time=9.215e-05, forward_time=0.033, loss=5.849, loss_att=3.235, loss_ctc=8.463, acc=0.876, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.813e-04, train_time=0.094 -[v016] 2022-01-31 05:05:34,631 (trainer:653) INFO: 42epoch:train:244-270batch: iter_time=9.509e-05, forward_time=0.032, loss=5.400, loss_att=2.962, loss_ctc=7.838, acc=0.885, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.815e-04, train_time=0.094 -[v016] 2022-01-31 05:05:37,210 (trainer:653) INFO: 42epoch:train:271-297batch: iter_time=9.310e-05, forward_time=0.034, loss=5.606, loss_att=3.107, loss_ctc=8.106, acc=0.891, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.817e-04, train_time=0.095 -[v016] 2022-01-31 05:05:39,739 (trainer:653) INFO: 42epoch:train:298-324batch: iter_time=1.156e-04, forward_time=0.032, loss=5.220, loss_att=3.010, loss_ctc=7.429, acc=0.879, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.819e-04, train_time=0.093 -[v016] 2022-01-31 05:05:42,225 (trainer:653) INFO: 42epoch:train:325-351batch: iter_time=9.845e-05, forward_time=0.032, loss=4.520, loss_att=2.584, loss_ctc=6.456, acc=0.900, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.821e-04, train_time=0.092 -[v016] 2022-01-31 05:05:44,820 (trainer:653) INFO: 42epoch:train:352-378batch: iter_time=2.699e-04, forward_time=0.033, loss=6.199, loss_att=3.452, loss_ctc=8.945, acc=0.881, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.823e-04, train_time=0.096 -[v016] 2022-01-31 05:05:47,957 (trainer:653) INFO: 42epoch:train:379-405batch: iter_time=0.021, forward_time=0.032, loss=5.543, loss_att=3.087, loss_ctc=8.000, acc=0.886, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.826e-04, train_time=0.116 -[v016] 2022-01-31 05:05:50,677 (trainer:653) INFO: 42epoch:train:406-432batch: iter_time=0.005, forward_time=0.033, loss=5.989, loss_att=3.346, loss_ctc=8.632, acc=0.880, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.828e-04, train_time=0.101 -[v016] 2022-01-31 05:05:53,466 (trainer:653) INFO: 42epoch:train:433-459batch: iter_time=0.006, forward_time=0.034, loss=6.370, loss_att=3.503, loss_ctc=9.237, acc=0.885, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.830e-04, train_time=0.103 -[v016] 2022-01-31 05:05:56,132 (trainer:653) INFO: 42epoch:train:460-486batch: iter_time=0.002, forward_time=0.033, loss=5.498, loss_att=3.047, loss_ctc=7.949, acc=0.883, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.832e-04, train_time=0.099 -[v016] 2022-01-31 05:05:58,721 (trainer:653) INFO: 42epoch:train:487-513batch: iter_time=0.001, forward_time=0.033, loss=5.530, loss_att=3.029, loss_ctc=8.031, acc=0.890, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.834e-04, train_time=0.096 -[v016] 2022-01-31 05:06:01,266 (trainer:653) INFO: 42epoch:train:514-540batch: iter_time=9.757e-05, forward_time=0.033, loss=5.229, loss_att=2.945, loss_ctc=7.514, acc=0.888, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.836e-04, train_time=0.094 -[v016] 2022-01-31 05:06:38,828 (trainer:328) INFO: 42epoch results: [train] iter_time=0.005, forward_time=0.033, loss=5.892, loss_att=3.251, loss_ctc=8.533, acc=0.884, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.816e-04, train_time=0.101, time=55.25 seconds, total_count=22974, gpu_max_cached_mem_GB=5.822, [valid] loss=7.219, loss_att=5.189, loss_ctc=9.248, acc=0.878, cer=0.137, wer=0.488, cer_ctc=0.228, time=8.49 seconds, total_count=7476, gpu_max_cached_mem_GB=5.822, [att_plot] time=28.3 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 05:06:41,003 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, valid.acc -[v016] 2022-01-31 05:06:41,006 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/35epoch.pth, exp/asr_train_asr_raw_en_word/36epoch.pth -[v016] 2022-01-31 05:06:41,006 (trainer:261) INFO: 43/200epoch started. Estimated time to finish: 6 hours, 59 minutes and 55.3 seconds -[v016] 2022-01-31 05:06:43,701 (trainer:653) INFO: 43epoch:train:1-27batch: iter_time=0.003, forward_time=0.034, loss=4.821, loss_att=2.773, loss_ctc=6.868, acc=0.890, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.839e-04, train_time=0.099 -[v016] 2022-01-31 05:06:46,304 (trainer:653) INFO: 43epoch:train:28-54batch: iter_time=1.157e-04, forward_time=0.034, loss=5.947, loss_att=3.226, loss_ctc=8.668, acc=0.893, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.841e-04, train_time=0.096 -[v016] 2022-01-31 05:06:48,847 (trainer:653) INFO: 43epoch:train:55-81batch: iter_time=1.000e-04, forward_time=0.033, loss=4.950, loss_att=2.667, loss_ctc=7.232, acc=0.903, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.843e-04, train_time=0.094 -[v016] 2022-01-31 05:06:51,450 (trainer:653) INFO: 43epoch:train:82-108batch: iter_time=9.298e-05, forward_time=0.034, loss=5.616, loss_att=3.075, loss_ctc=8.157, acc=0.885, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.846e-04, train_time=0.096 -[v016] 2022-01-31 05:06:54,513 (trainer:653) INFO: 43epoch:train:109-135batch: iter_time=0.015, forward_time=0.034, loss=6.244, loss_att=3.313, loss_ctc=9.176, acc=0.891, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.848e-04, train_time=0.113 -[v016] 2022-01-31 05:06:57,040 (trainer:653) INFO: 43epoch:train:136-162batch: iter_time=9.241e-05, forward_time=0.033, loss=5.790, loss_att=3.135, loss_ctc=8.445, acc=0.884, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.850e-04, train_time=0.093 -[v016] 2022-01-31 05:06:59,602 (trainer:653) INFO: 43epoch:train:163-189batch: iter_time=9.535e-05, forward_time=0.033, loss=5.651, loss_att=3.079, loss_ctc=8.222, acc=0.885, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.852e-04, train_time=0.095 -[v016] 2022-01-31 05:07:02,258 (trainer:653) INFO: 43epoch:train:190-216batch: iter_time=9.753e-05, forward_time=0.034, loss=5.793, loss_att=3.260, loss_ctc=8.327, acc=0.893, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.854e-04, train_time=0.098 -[v016] 2022-01-31 05:07:04,851 (trainer:653) INFO: 43epoch:train:217-243batch: iter_time=9.197e-05, forward_time=0.034, loss=5.344, loss_att=2.910, loss_ctc=7.779, acc=0.898, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.856e-04, train_time=0.096 -[v016] 2022-01-31 05:07:07,532 (trainer:653) INFO: 43epoch:train:244-270batch: iter_time=9.319e-05, forward_time=0.035, loss=6.977, loss_att=3.709, loss_ctc=10.244, acc=0.891, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.859e-04, train_time=0.099 -[v016] 2022-01-31 05:07:10,077 (trainer:653) INFO: 43epoch:train:271-297batch: iter_time=9.518e-05, forward_time=0.033, loss=5.841, loss_att=3.283, loss_ctc=8.399, acc=0.884, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.861e-04, train_time=0.094 -[v016] 2022-01-31 05:07:12,695 (trainer:653) INFO: 43epoch:train:298-324batch: iter_time=1.032e-04, forward_time=0.034, loss=6.514, loss_att=3.481, loss_ctc=9.546, acc=0.884, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.863e-04, train_time=0.097 -[v016] 2022-01-31 05:07:15,272 (trainer:653) INFO: 43epoch:train:325-351batch: iter_time=9.886e-05, forward_time=0.034, loss=5.709, loss_att=3.160, loss_ctc=8.258, acc=0.885, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.865e-04, train_time=0.095 -[v016] 2022-01-31 05:07:18,032 (trainer:653) INFO: 43epoch:train:352-378batch: iter_time=1.293e-04, forward_time=0.036, loss=6.310, loss_att=3.486, loss_ctc=9.134, acc=0.879, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.867e-04, train_time=0.102 -[v016] 2022-01-31 05:07:20,906 (trainer:653) INFO: 43epoch:train:379-405batch: iter_time=1.262e-04, forward_time=0.037, loss=5.357, loss_att=3.037, loss_ctc=7.677, acc=0.890, backward_time=0.026, optim_step_time=0.024, optim0_lr0=1.869e-04, train_time=0.106 -[v016] 2022-01-31 05:07:24,270 (trainer:653) INFO: 43epoch:train:406-432batch: iter_time=0.021, forward_time=0.036, loss=5.559, loss_att=3.069, loss_ctc=8.048, acc=0.882, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.872e-04, train_time=0.124 -[v016] 2022-01-31 05:07:27,135 (trainer:653) INFO: 43epoch:train:433-459batch: iter_time=1.637e-04, forward_time=0.037, loss=5.268, loss_att=2.969, loss_ctc=7.567, acc=0.888, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.874e-04, train_time=0.106 -[v016] 2022-01-31 05:07:30,023 (trainer:653) INFO: 43epoch:train:460-486batch: iter_time=1.447e-04, forward_time=0.037, loss=6.256, loss_att=3.440, loss_ctc=9.072, acc=0.890, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.876e-04, train_time=0.107 -[v016] 2022-01-31 05:07:32,858 (trainer:653) INFO: 43epoch:train:487-513batch: iter_time=1.067e-04, forward_time=0.036, loss=5.911, loss_att=3.229, loss_ctc=8.593, acc=0.884, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.878e-04, train_time=0.105 -[v016] 2022-01-31 05:07:35,639 (trainer:653) INFO: 43epoch:train:514-540batch: iter_time=1.252e-04, forward_time=0.035, loss=5.430, loss_att=2.971, loss_ctc=7.890, acc=0.879, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.880e-04, train_time=0.103 -[v016] 2022-01-31 05:08:12,861 (trainer:328) INFO: 43epoch results: [train] iter_time=0.002, forward_time=0.035, loss=5.781, loss_att=3.169, loss_ctc=8.392, acc=0.888, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.860e-04, train_time=0.101, time=55.46 seconds, total_count=23521, gpu_max_cached_mem_GB=5.822, [valid] loss=7.334, loss_att=5.291, loss_ctc=9.378, acc=0.877, cer=0.141, wer=0.493, cer_ctc=0.231, time=6.15 seconds, total_count=7654, gpu_max_cached_mem_GB=5.822, [att_plot] time=30.25 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 05:08:15,336 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 05:08:15,339 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/37epoch.pth, exp/asr_train_asr_raw_en_word/38epoch.pth -[v016] 2022-01-31 05:08:15,339 (trainer:261) INFO: 44/200epoch started. Estimated time to finish: 6 hours, 49 minutes and 51.25 seconds -[v016] 2022-01-31 05:08:18,265 (trainer:653) INFO: 44epoch:train:1-27batch: iter_time=0.003, forward_time=0.036, loss=4.796, loss_att=2.568, loss_ctc=7.024, acc=0.894, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.883e-04, train_time=0.108 -[v016] 2022-01-31 05:08:21,000 (trainer:653) INFO: 44epoch:train:28-54batch: iter_time=1.335e-04, forward_time=0.035, loss=5.385, loss_att=2.920, loss_ctc=7.850, acc=0.888, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.885e-04, train_time=0.101 -[v016] 2022-01-31 05:08:23,812 (trainer:653) INFO: 44epoch:train:55-81batch: iter_time=1.443e-04, forward_time=0.036, loss=6.376, loss_att=3.416, loss_ctc=9.335, acc=0.879, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.887e-04, train_time=0.104 -[v016] 2022-01-31 05:08:26,514 (trainer:653) INFO: 44epoch:train:82-108batch: iter_time=0.001, forward_time=0.034, loss=5.146, loss_att=2.747, loss_ctc=7.545, acc=0.901, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.889e-04, train_time=0.100 -[v016] 2022-01-31 05:08:29,304 (trainer:653) INFO: 44epoch:train:109-135batch: iter_time=1.253e-04, forward_time=0.036, loss=6.629, loss_att=3.531, loss_ctc=9.728, acc=0.881, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.892e-04, train_time=0.103 -[v016] 2022-01-31 05:08:32,135 (trainer:653) INFO: 44epoch:train:136-162batch: iter_time=1.298e-04, forward_time=0.037, loss=6.135, loss_att=3.354, loss_ctc=8.915, acc=0.878, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.894e-04, train_time=0.105 -[v016] 2022-01-31 05:08:34,838 (trainer:653) INFO: 44epoch:train:163-189batch: iter_time=9.660e-05, forward_time=0.036, loss=6.394, loss_att=3.451, loss_ctc=9.336, acc=0.884, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.896e-04, train_time=0.100 -[v016] 2022-01-31 05:08:37,418 (trainer:653) INFO: 44epoch:train:190-216batch: iter_time=9.996e-05, forward_time=0.034, loss=4.973, loss_att=2.801, loss_ctc=7.145, acc=0.899, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.898e-04, train_time=0.095 -[v016] 2022-01-31 05:08:40,008 (trainer:653) INFO: 44epoch:train:217-243batch: iter_time=1.022e-04, forward_time=0.034, loss=4.779, loss_att=2.737, loss_ctc=6.822, acc=0.902, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.900e-04, train_time=0.096 -[v016] 2022-01-31 05:08:42,631 (trainer:653) INFO: 44epoch:train:244-270batch: iter_time=9.281e-05, forward_time=0.035, loss=5.291, loss_att=3.025, loss_ctc=7.557, acc=0.886, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.902e-04, train_time=0.097 -[v016] 2022-01-31 05:08:45,247 (trainer:653) INFO: 44epoch:train:271-297batch: iter_time=9.327e-05, forward_time=0.035, loss=5.453, loss_att=2.911, loss_ctc=7.995, acc=0.890, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.904e-04, train_time=0.097 -[v016] 2022-01-31 05:08:47,888 (trainer:653) INFO: 44epoch:train:298-324batch: iter_time=9.279e-05, forward_time=0.035, loss=5.920, loss_att=3.207, loss_ctc=8.634, acc=0.894, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.907e-04, train_time=0.098 -[v016] 2022-01-31 05:08:50,597 (trainer:653) INFO: 44epoch:train:325-351batch: iter_time=9.425e-05, forward_time=0.036, loss=7.031, loss_att=3.704, loss_ctc=10.358, acc=0.891, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.909e-04, train_time=0.100 -[v016] 2022-01-31 05:08:53,213 (trainer:653) INFO: 44epoch:train:352-378batch: iter_time=9.393e-05, forward_time=0.034, loss=4.959, loss_att=2.772, loss_ctc=7.147, acc=0.905, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.911e-04, train_time=0.097 -[v016] 2022-01-31 05:08:55,796 (trainer:653) INFO: 44epoch:train:379-405batch: iter_time=9.761e-05, forward_time=0.034, loss=5.836, loss_att=3.227, loss_ctc=8.445, acc=0.875, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.913e-04, train_time=0.095 -[v016] 2022-01-31 05:08:58,716 (trainer:653) INFO: 44epoch:train:406-432batch: iter_time=0.012, forward_time=0.034, loss=5.407, loss_att=3.037, loss_ctc=7.778, acc=0.888, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.915e-04, train_time=0.108 -[v016] 2022-01-31 05:09:01,257 (trainer:653) INFO: 44epoch:train:433-459batch: iter_time=9.590e-05, forward_time=0.033, loss=4.503, loss_att=2.469, loss_ctc=6.537, acc=0.903, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.917e-04, train_time=0.094 -[v016] 2022-01-31 05:09:03,879 (trainer:653) INFO: 44epoch:train:460-486batch: iter_time=1.093e-04, forward_time=0.034, loss=6.201, loss_att=3.422, loss_ctc=8.980, acc=0.879, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.920e-04, train_time=0.097 -[v016] 2022-01-31 05:09:06,529 (trainer:653) INFO: 44epoch:train:487-513batch: iter_time=9.904e-05, forward_time=0.034, loss=6.291, loss_att=3.317, loss_ctc=9.265, acc=0.894, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.922e-04, train_time=0.098 -[v016] 2022-01-31 05:09:09,133 (trainer:653) INFO: 44epoch:train:514-540batch: iter_time=1.016e-04, forward_time=0.034, loss=5.589, loss_att=3.045, loss_ctc=8.133, acc=0.883, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.924e-04, train_time=0.096 -[v016] 2022-01-31 05:09:43,702 (trainer:328) INFO: 44epoch results: [train] iter_time=9.040e-04, forward_time=0.035, loss=5.673, loss_att=3.093, loss_ctc=8.254, acc=0.890, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.904e-04, train_time=0.099, time=54.55 seconds, total_count=24068, gpu_max_cached_mem_GB=5.822, [valid] loss=7.187, loss_att=5.260, loss_ctc=9.114, acc=0.879, cer=0.135, wer=0.486, cer_ctc=0.213, time=5.75 seconds, total_count=7832, gpu_max_cached_mem_GB=5.822, [att_plot] time=28.07 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 05:09:45,868 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc, valid.acc -[v016] 2022-01-31 05:09:45,871 (trainer:261) INFO: 45/200epoch started. Estimated time to finish: 6 hours, 40 minutes and 4.97 seconds -[v016] 2022-01-31 05:09:48,588 (trainer:653) INFO: 45epoch:train:1-27batch: iter_time=0.004, forward_time=0.034, loss=5.065, loss_att=2.729, loss_ctc=7.401, acc=0.894, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.927e-04, train_time=0.100 -[v016] 2022-01-31 05:09:51,172 (trainer:653) INFO: 45epoch:train:28-54batch: iter_time=1.006e-04, forward_time=0.034, loss=5.192, loss_att=2.847, loss_ctc=7.537, acc=0.895, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.929e-04, train_time=0.095 -[v016] 2022-01-31 05:09:53,767 (trainer:653) INFO: 45epoch:train:55-81batch: iter_time=1.098e-04, forward_time=0.034, loss=5.441, loss_att=2.863, loss_ctc=8.019, acc=0.894, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.931e-04, train_time=0.096 -[v016] 2022-01-31 05:09:56,318 (trainer:653) INFO: 45epoch:train:82-108batch: iter_time=9.949e-05, forward_time=0.033, loss=4.896, loss_att=2.619, loss_ctc=7.172, acc=0.903, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.933e-04, train_time=0.094 -[v016] 2022-01-31 05:09:58,914 (trainer:653) INFO: 45epoch:train:109-135batch: iter_time=9.968e-05, forward_time=0.034, loss=5.276, loss_att=2.882, loss_ctc=7.669, acc=0.896, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.935e-04, train_time=0.096 -[v016] 2022-01-31 05:10:01,623 (trainer:653) INFO: 45epoch:train:136-162batch: iter_time=0.006, forward_time=0.033, loss=5.172, loss_att=2.824, loss_ctc=7.520, acc=0.895, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.937e-04, train_time=0.100 -[v016] 2022-01-31 05:10:04,241 (trainer:653) INFO: 45epoch:train:163-189batch: iter_time=9.868e-05, forward_time=0.034, loss=6.235, loss_att=3.376, loss_ctc=9.094, acc=0.886, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.940e-04, train_time=0.097 -[v016] 2022-01-31 05:10:06,767 (trainer:653) INFO: 45epoch:train:190-216batch: iter_time=1.026e-04, forward_time=0.033, loss=5.187, loss_att=2.812, loss_ctc=7.563, acc=0.896, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.942e-04, train_time=0.093 -[v016] 2022-01-31 05:10:09,390 (trainer:653) INFO: 45epoch:train:217-243batch: iter_time=1.062e-04, forward_time=0.034, loss=6.346, loss_att=3.381, loss_ctc=9.311, acc=0.886, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.944e-04, train_time=0.097 -[v016] 2022-01-31 05:10:12,051 (trainer:653) INFO: 45epoch:train:244-270batch: iter_time=1.085e-04, forward_time=0.034, loss=5.175, loss_att=2.783, loss_ctc=7.566, acc=0.899, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.946e-04, train_time=0.098 -[v016] 2022-01-31 05:10:14,601 (trainer:653) INFO: 45epoch:train:271-297batch: iter_time=1.098e-04, forward_time=0.033, loss=4.593, loss_att=2.617, loss_ctc=6.569, acc=0.899, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.948e-04, train_time=0.094 -[v016] 2022-01-31 05:10:17,170 (trainer:653) INFO: 45epoch:train:298-324batch: iter_time=1.068e-04, forward_time=0.033, loss=5.897, loss_att=3.334, loss_ctc=8.460, acc=0.886, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.950e-04, train_time=0.095 -[v016] 2022-01-31 05:10:19,711 (trainer:653) INFO: 45epoch:train:325-351batch: iter_time=9.695e-05, forward_time=0.033, loss=5.016, loss_att=2.748, loss_ctc=7.284, acc=0.896, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.953e-04, train_time=0.094 -[v016] 2022-01-31 05:10:22,280 (trainer:653) INFO: 45epoch:train:352-378batch: iter_time=9.955e-05, forward_time=0.034, loss=5.199, loss_att=2.808, loss_ctc=7.591, acc=0.894, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.955e-04, train_time=0.095 -[v016] 2022-01-31 05:10:24,845 (trainer:653) INFO: 45epoch:train:379-405batch: iter_time=9.496e-05, forward_time=0.034, loss=5.616, loss_att=3.002, loss_ctc=8.229, acc=0.889, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.957e-04, train_time=0.095 -[v016] 2022-01-31 05:10:27,419 (trainer:653) INFO: 45epoch:train:406-432batch: iter_time=9.836e-05, forward_time=0.034, loss=6.227, loss_att=3.481, loss_ctc=8.973, acc=0.878, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.959e-04, train_time=0.095 -[v016] 2022-01-31 05:10:30,029 (trainer:653) INFO: 45epoch:train:433-459batch: iter_time=9.646e-05, forward_time=0.034, loss=5.972, loss_att=3.214, loss_ctc=8.731, acc=0.887, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.961e-04, train_time=0.096 -[v016] 2022-01-31 05:10:33,027 (trainer:653) INFO: 45epoch:train:460-486batch: iter_time=0.012, forward_time=0.034, loss=6.877, loss_att=3.738, loss_ctc=10.016, acc=0.881, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.963e-04, train_time=0.111 -[v016] 2022-01-31 05:10:35,574 (trainer:653) INFO: 45epoch:train:487-513batch: iter_time=9.611e-05, forward_time=0.034, loss=5.784, loss_att=3.177, loss_ctc=8.390, acc=0.882, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.966e-04, train_time=0.094 -[v016] 2022-01-31 05:10:38,172 (trainer:653) INFO: 45epoch:train:514-540batch: iter_time=9.370e-05, forward_time=0.034, loss=6.507, loss_att=3.538, loss_ctc=9.476, acc=0.882, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.968e-04, train_time=0.096 -[v016] 2022-01-31 05:11:13,357 (trainer:328) INFO: 45epoch results: [train] iter_time=0.001, forward_time=0.034, loss=5.579, loss_att=3.038, loss_ctc=8.120, acc=0.891, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.947e-04, train_time=0.097, time=53.04 seconds, total_count=24615, gpu_max_cached_mem_GB=5.822, [valid] loss=7.142, loss_att=5.219, loss_ctc=9.066, acc=0.881, cer=0.134, wer=0.481, cer_ctc=0.221, time=5.7 seconds, total_count=8010, gpu_max_cached_mem_GB=5.822, [att_plot] time=28.74 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 05:11:15,399 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc, valid.acc -[v016] 2022-01-31 05:11:15,425 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/40epoch.pth -[v016] 2022-01-31 05:11:15,425 (trainer:261) INFO: 46/200epoch started. Estimated time to finish: 6 hours, 30 minutes and 52.28 seconds -[v016] 2022-01-31 05:11:18,229 (trainer:653) INFO: 46epoch:train:1-27batch: iter_time=0.004, forward_time=0.035, loss=5.664, loss_att=2.963, loss_ctc=8.365, acc=0.900, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.970e-04, train_time=0.103 -[v016] 2022-01-31 05:11:20,738 (trainer:653) INFO: 46epoch:train:28-54batch: iter_time=9.682e-05, forward_time=0.032, loss=4.908, loss_att=2.624, loss_ctc=7.193, acc=0.905, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.973e-04, train_time=0.093 -[v016] 2022-01-31 05:11:23,320 (trainer:653) INFO: 46epoch:train:55-81batch: iter_time=1.006e-04, forward_time=0.034, loss=5.177, loss_att=2.741, loss_ctc=7.613, acc=0.893, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.975e-04, train_time=0.095 -[v016] 2022-01-31 05:11:25,840 (trainer:653) INFO: 46epoch:train:82-108batch: iter_time=9.713e-05, forward_time=0.033, loss=5.112, loss_att=2.819, loss_ctc=7.406, acc=0.889, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.977e-04, train_time=0.093 -[v016] 2022-01-31 05:11:28,392 (trainer:653) INFO: 46epoch:train:109-135batch: iter_time=9.606e-05, forward_time=0.033, loss=4.584, loss_att=2.548, loss_ctc=6.619, acc=0.893, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.979e-04, train_time=0.094 -[v016] 2022-01-31 05:11:30,984 (trainer:653) INFO: 46epoch:train:136-162batch: iter_time=9.800e-05, forward_time=0.034, loss=6.166, loss_att=3.305, loss_ctc=9.028, acc=0.888, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.981e-04, train_time=0.096 -[v016] 2022-01-31 05:11:33,542 (trainer:653) INFO: 46epoch:train:163-189batch: iter_time=9.830e-05, forward_time=0.033, loss=5.500, loss_att=3.032, loss_ctc=7.967, acc=0.884, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.983e-04, train_time=0.094 -[v016] 2022-01-31 05:11:36,196 (trainer:653) INFO: 46epoch:train:190-216batch: iter_time=1.055e-04, forward_time=0.035, loss=6.019, loss_att=3.214, loss_ctc=8.824, acc=0.896, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.986e-04, train_time=0.098 -[v016] 2022-01-31 05:11:38,831 (trainer:653) INFO: 46epoch:train:217-243batch: iter_time=1.067e-04, forward_time=0.034, loss=6.129, loss_att=3.243, loss_ctc=9.015, acc=0.886, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.988e-04, train_time=0.097 -[v016] 2022-01-31 05:11:41,429 (trainer:653) INFO: 46epoch:train:244-270batch: iter_time=1.036e-04, forward_time=0.034, loss=5.903, loss_att=3.143, loss_ctc=8.663, acc=0.882, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.990e-04, train_time=0.096 -[v016] 2022-01-31 05:11:44,036 (trainer:653) INFO: 46epoch:train:271-297batch: iter_time=9.436e-05, forward_time=0.034, loss=5.516, loss_att=2.994, loss_ctc=8.038, acc=0.881, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.992e-04, train_time=0.096 -[v016] 2022-01-31 05:11:46,682 (trainer:653) INFO: 46epoch:train:298-324batch: iter_time=1.084e-04, forward_time=0.034, loss=5.327, loss_att=2.874, loss_ctc=7.781, acc=0.904, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.994e-04, train_time=0.098 -[v016] 2022-01-31 05:11:49,165 (trainer:653) INFO: 46epoch:train:325-351batch: iter_time=1.020e-04, forward_time=0.032, loss=4.319, loss_att=2.549, loss_ctc=6.089, acc=0.889, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.996e-04, train_time=0.092 -[v016] 2022-01-31 05:11:51,790 (trainer:653) INFO: 46epoch:train:352-378batch: iter_time=9.894e-05, forward_time=0.034, loss=6.403, loss_att=3.446, loss_ctc=9.359, acc=0.885, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.998e-04, train_time=0.097 -[v016] 2022-01-31 05:11:54,405 (trainer:653) INFO: 46epoch:train:379-405batch: iter_time=1.082e-04, forward_time=0.034, loss=6.063, loss_att=3.304, loss_ctc=8.822, acc=0.891, backward_time=0.022, optim_step_time=0.021, optim0_lr0=2.000e-04, train_time=0.097 -[v016] 2022-01-31 05:11:57,024 (trainer:653) INFO: 46epoch:train:406-432batch: iter_time=1.006e-04, forward_time=0.034, loss=5.324, loss_att=2.912, loss_ctc=7.736, acc=0.898, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.999e-04, train_time=0.097 -[v016] 2022-01-31 05:11:59,539 (trainer:653) INFO: 46epoch:train:433-459batch: iter_time=9.882e-05, forward_time=0.033, loss=4.556, loss_att=2.540, loss_ctc=6.572, acc=0.901, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.998e-04, train_time=0.093 -[v016] 2022-01-31 05:12:02,106 (trainer:653) INFO: 46epoch:train:460-486batch: iter_time=1.021e-04, forward_time=0.034, loss=4.718, loss_att=2.597, loss_ctc=6.839, acc=0.904, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.996e-04, train_time=0.095 -[v016] 2022-01-31 05:12:04,864 (trainer:653) INFO: 46epoch:train:487-513batch: iter_time=0.005, forward_time=0.034, loss=6.005, loss_att=3.193, loss_ctc=8.816, acc=0.895, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.995e-04, train_time=0.102 -[v016] 2022-01-31 05:12:07,582 (trainer:653) INFO: 46epoch:train:514-540batch: iter_time=0.005, forward_time=0.033, loss=6.245, loss_att=3.383, loss_ctc=9.107, acc=0.875, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.994e-04, train_time=0.100 -[v016] 2022-01-31 05:12:46,623 (trainer:328) INFO: 46epoch results: [train] iter_time=7.440e-04, forward_time=0.034, loss=5.472, loss_att=2.967, loss_ctc=7.977, acc=0.892, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.988e-04, train_time=0.096, time=52.88 seconds, total_count=25162, gpu_max_cached_mem_GB=5.822, [valid] loss=7.274, loss_att=5.197, loss_ctc=9.351, acc=0.881, cer=0.137, wer=0.478, cer_ctc=0.233, time=5.8 seconds, total_count=8188, gpu_max_cached_mem_GB=5.822, [att_plot] time=32.52 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 05:12:48,882 (trainer:375) INFO: The best model has been updated: train.loss, train.acc, valid.acc -[v016] 2022-01-31 05:12:48,887 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/39epoch.pth -[v016] 2022-01-31 05:12:48,892 (trainer:261) INFO: 47/200epoch started. Estimated time to finish: 6 hours, 22 minutes and 38.37 seconds -[v016] 2022-01-31 05:12:51,982 (trainer:653) INFO: 47epoch:train:1-27batch: iter_time=0.005, forward_time=0.035, loss=5.879, loss_att=3.053, loss_ctc=8.704, acc=0.897, backward_time=0.023, optim_step_time=0.024, optim0_lr0=1.993e-04, train_time=0.114 -[v016] 2022-01-31 05:12:54,812 (trainer:653) INFO: 47epoch:train:28-54batch: iter_time=2.256e-04, forward_time=0.035, loss=5.321, loss_att=2.781, loss_ctc=7.861, acc=0.896, backward_time=0.022, optim_step_time=0.025, optim0_lr0=1.992e-04, train_time=0.105 -[v016] 2022-01-31 05:12:57,586 (trainer:653) INFO: 47epoch:train:55-81batch: iter_time=2.540e-04, forward_time=0.037, loss=5.347, loss_att=2.944, loss_ctc=7.750, acc=0.896, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.991e-04, train_time=0.103 -[v016] 2022-01-31 05:13:00,389 (trainer:653) INFO: 47epoch:train:82-108batch: iter_time=2.383e-04, forward_time=0.035, loss=5.753, loss_att=3.003, loss_ctc=8.503, acc=0.898, backward_time=0.022, optim_step_time=0.024, optim0_lr0=1.990e-04, train_time=0.103 -[v016] 2022-01-31 05:13:03,173 (trainer:653) INFO: 47epoch:train:109-135batch: iter_time=1.813e-04, forward_time=0.038, loss=4.584, loss_att=2.557, loss_ctc=6.610, acc=0.900, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.989e-04, train_time=0.103 -[v016] 2022-01-31 05:13:06,043 (trainer:653) INFO: 47epoch:train:136-162batch: iter_time=3.826e-04, forward_time=0.035, loss=4.494, loss_att=2.504, loss_ctc=6.484, acc=0.902, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.988e-04, train_time=0.106 -[v016] 2022-01-31 05:13:09,011 (trainer:653) INFO: 47epoch:train:163-189batch: iter_time=2.412e-04, forward_time=0.039, loss=4.823, loss_att=2.709, loss_ctc=6.936, acc=0.899, backward_time=0.023, optim_step_time=0.024, optim0_lr0=1.987e-04, train_time=0.110 -[v016] 2022-01-31 05:13:11,694 (trainer:653) INFO: 47epoch:train:190-216batch: iter_time=1.585e-04, forward_time=0.036, loss=4.797, loss_att=2.720, loss_ctc=6.874, acc=0.883, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.986e-04, train_time=0.099 -[v016] 2022-01-31 05:13:14,491 (trainer:653) INFO: 47epoch:train:217-243batch: iter_time=1.766e-04, forward_time=0.035, loss=6.033, loss_att=3.172, loss_ctc=8.894, acc=0.895, backward_time=0.023, optim_step_time=0.025, optim0_lr0=1.984e-04, train_time=0.103 -[v016] 2022-01-31 05:13:17,388 (trainer:653) INFO: 47epoch:train:244-270batch: iter_time=2.114e-04, forward_time=0.040, loss=4.313, loss_att=2.337, loss_ctc=6.289, acc=0.904, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.983e-04, train_time=0.107 -[v016] 2022-01-31 05:13:20,345 (trainer:653) INFO: 47epoch:train:271-297batch: iter_time=2.363e-04, forward_time=0.035, loss=6.626, loss_att=3.532, loss_ctc=9.720, acc=0.885, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.982e-04, train_time=0.109 -[v016] 2022-01-31 05:13:23,082 (trainer:653) INFO: 47epoch:train:298-324batch: iter_time=2.461e-04, forward_time=0.034, loss=5.843, loss_att=3.111, loss_ctc=8.575, acc=0.889, backward_time=0.022, optim_step_time=0.024, optim0_lr0=1.981e-04, train_time=0.101 -[v016] 2022-01-31 05:13:25,857 (trainer:653) INFO: 47epoch:train:325-351batch: iter_time=2.817e-04, forward_time=0.034, loss=5.889, loss_att=3.040, loss_ctc=8.738, acc=0.896, backward_time=0.022, optim_step_time=0.024, optim0_lr0=1.980e-04, train_time=0.103 -[v016] 2022-01-31 05:13:28,871 (trainer:653) INFO: 47epoch:train:352-378batch: iter_time=0.003, forward_time=0.036, loss=4.931, loss_att=2.727, loss_ctc=7.135, acc=0.900, backward_time=0.023, optim_step_time=0.025, optim0_lr0=1.979e-04, train_time=0.109 -[v016] 2022-01-31 05:13:31,558 (trainer:653) INFO: 47epoch:train:379-405batch: iter_time=1.571e-04, forward_time=0.034, loss=5.201, loss_att=2.855, loss_ctc=7.546, acc=0.896, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.978e-04, train_time=0.099 -[v016] 2022-01-31 05:13:34,286 (trainer:653) INFO: 47epoch:train:406-432batch: iter_time=3.705e-04, forward_time=0.038, loss=4.346, loss_att=2.403, loss_ctc=6.289, acc=0.908, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.977e-04, train_time=0.101 -[v016] 2022-01-31 05:13:37,185 (trainer:653) INFO: 47epoch:train:433-459batch: iter_time=3.385e-04, forward_time=0.037, loss=5.589, loss_att=3.063, loss_ctc=8.114, acc=0.889, backward_time=0.022, optim_step_time=0.025, optim0_lr0=1.976e-04, train_time=0.107 -[v016] 2022-01-31 05:13:39,795 (trainer:653) INFO: 47epoch:train:460-486batch: iter_time=0.003, forward_time=0.033, loss=4.972, loss_att=2.656, loss_ctc=7.289, acc=0.905, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.975e-04, train_time=0.097 -[v016] 2022-01-31 05:13:42,745 (trainer:653) INFO: 47epoch:train:487-513batch: iter_time=2.468e-04, forward_time=0.034, loss=5.167, loss_att=2.849, loss_ctc=7.484, acc=0.895, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.974e-04, train_time=0.109 -[v016] 2022-01-31 05:13:45,569 (trainer:653) INFO: 47epoch:train:514-540batch: iter_time=2.141e-04, forward_time=0.034, loss=5.985, loss_att=3.242, loss_ctc=8.728, acc=0.890, backward_time=0.022, optim_step_time=0.026, optim0_lr0=1.973e-04, train_time=0.104 -[v016] 2022-01-31 05:14:23,872 (trainer:328) INFO: 47epoch results: [train] iter_time=7.230e-04, forward_time=0.036, loss=5.330, loss_att=2.880, loss_ctc=7.781, acc=0.896, backward_time=0.022, optim_step_time=0.023, optim0_lr0=1.983e-04, train_time=0.105, time=57.47 seconds, total_count=25709, gpu_max_cached_mem_GB=5.822, [valid] loss=7.013, loss_att=5.152, loss_ctc=8.873, acc=0.881, cer=0.132, wer=0.491, cer_ctc=0.212, time=6.33 seconds, total_count=8366, gpu_max_cached_mem_GB=5.822, [att_plot] time=31.17 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 05:14:25,931 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc -[v016] 2022-01-31 05:14:25,957 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/41epoch.pth -[v016] 2022-01-31 05:14:25,960 (trainer:261) INFO: 48/200epoch started. Estimated time to finish: 6 hours, 15 minutes and 14.56 seconds -[v016] 2022-01-31 05:14:28,932 (trainer:653) INFO: 48epoch:train:1-27batch: iter_time=0.004, forward_time=0.040, loss=4.832, loss_att=2.551, loss_ctc=7.113, acc=0.904, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.972e-04, train_time=0.110 -[v016] 2022-01-31 05:14:31,722 (trainer:653) INFO: 48epoch:train:28-54batch: iter_time=2.109e-04, forward_time=0.037, loss=4.901, loss_att=2.611, loss_ctc=7.192, acc=0.900, backward_time=0.022, optim_step_time=0.024, optim0_lr0=1.971e-04, train_time=0.103 -[v016] 2022-01-31 05:14:34,640 (trainer:653) INFO: 48epoch:train:55-81batch: iter_time=3.751e-04, forward_time=0.035, loss=5.666, loss_att=2.863, loss_ctc=8.468, acc=0.902, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.970e-04, train_time=0.108 -[v016] 2022-01-31 05:14:37,440 (trainer:653) INFO: 48epoch:train:82-108batch: iter_time=1.768e-04, forward_time=0.040, loss=4.150, loss_att=2.319, loss_ctc=5.981, acc=0.909, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.969e-04, train_time=0.103 -[v016] 2022-01-31 05:14:40,105 (trainer:653) INFO: 48epoch:train:109-135batch: iter_time=2.020e-04, forward_time=0.033, loss=4.834, loss_att=2.661, loss_ctc=7.006, acc=0.898, backward_time=0.022, optim_step_time=0.023, optim0_lr0=1.968e-04, train_time=0.097 -[v016] 2022-01-31 05:14:42,953 (trainer:653) INFO: 48epoch:train:136-162batch: iter_time=2.795e-04, forward_time=0.034, loss=5.280, loss_att=2.774, loss_ctc=7.787, acc=0.903, backward_time=0.022, optim_step_time=0.025, optim0_lr0=1.967e-04, train_time=0.105 -[v016] 2022-01-31 05:14:45,711 (trainer:653) INFO: 48epoch:train:163-189batch: iter_time=1.920e-04, forward_time=0.035, loss=5.770, loss_att=3.061, loss_ctc=8.480, acc=0.897, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.965e-04, train_time=0.102 -[v016] 2022-01-31 05:14:48,492 (trainer:653) INFO: 48epoch:train:190-216batch: iter_time=2.818e-04, forward_time=0.035, loss=4.989, loss_att=2.664, loss_ctc=7.314, acc=0.901, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.964e-04, train_time=0.103 -[v016] 2022-01-31 05:14:51,313 (trainer:653) INFO: 48epoch:train:217-243batch: iter_time=2.165e-04, forward_time=0.037, loss=5.571, loss_att=2.911, loss_ctc=8.231, acc=0.902, backward_time=0.023, optim_step_time=0.025, optim0_lr0=1.963e-04, train_time=0.104 -[v016] 2022-01-31 05:14:54,127 (trainer:653) INFO: 48epoch:train:244-270batch: iter_time=1.555e-04, forward_time=0.038, loss=5.119, loss_att=2.761, loss_ctc=7.477, acc=0.898, backward_time=0.023, optim_step_time=0.021, optim0_lr0=1.962e-04, train_time=0.104 -[v016] 2022-01-31 05:14:56,946 (trainer:653) INFO: 48epoch:train:271-297batch: iter_time=2.547e-04, forward_time=0.034, loss=4.458, loss_att=2.530, loss_ctc=6.387, acc=0.897, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.961e-04, train_time=0.104 -[v016] 2022-01-31 05:14:59,646 (trainer:653) INFO: 48epoch:train:298-324batch: iter_time=2.033e-04, forward_time=0.034, loss=4.650, loss_att=2.473, loss_ctc=6.826, acc=0.909, backward_time=0.022, optim_step_time=0.023, optim0_lr0=1.960e-04, train_time=0.099 -[v016] 2022-01-31 05:15:02,489 (trainer:653) INFO: 48epoch:train:325-351batch: iter_time=1.190e-04, forward_time=0.041, loss=4.979, loss_att=2.709, loss_ctc=7.249, acc=0.905, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.959e-04, train_time=0.105 -[v016] 2022-01-31 05:15:05,334 (trainer:653) INFO: 48epoch:train:352-378batch: iter_time=0.002, forward_time=0.039, loss=5.310, loss_att=2.883, loss_ctc=7.737, acc=0.904, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.958e-04, train_time=0.105 -[v016] 2022-01-31 05:15:08,177 (trainer:653) INFO: 48epoch:train:379-405batch: iter_time=1.791e-04, forward_time=0.038, loss=5.637, loss_att=3.145, loss_ctc=8.130, acc=0.886, backward_time=0.023, optim_step_time=0.024, optim0_lr0=1.957e-04, train_time=0.105 -[v016] 2022-01-31 05:15:11,121 (trainer:653) INFO: 48epoch:train:406-432batch: iter_time=2.967e-04, forward_time=0.035, loss=5.645, loss_att=3.103, loss_ctc=8.187, acc=0.875, backward_time=0.022, optim_step_time=0.026, optim0_lr0=1.956e-04, train_time=0.109 -[v016] 2022-01-31 05:15:14,372 (trainer:653) INFO: 48epoch:train:433-459batch: iter_time=0.010, forward_time=0.036, loss=5.272, loss_att=2.814, loss_ctc=7.730, acc=0.905, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.955e-04, train_time=0.120 -[v016] 2022-01-31 05:15:17,091 (trainer:653) INFO: 48epoch:train:460-486batch: iter_time=1.560e-04, forward_time=0.036, loss=5.424, loss_att=2.945, loss_ctc=7.904, acc=0.893, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.954e-04, train_time=0.100 -[v016] 2022-01-31 05:15:20,154 (trainer:653) INFO: 48epoch:train:487-513batch: iter_time=2.714e-04, forward_time=0.039, loss=7.019, loss_att=3.663, loss_ctc=10.374, acc=0.885, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.953e-04, train_time=0.113 -[v016] 2022-01-31 05:15:22,922 (trainer:653) INFO: 48epoch:train:514-540batch: iter_time=1.975e-04, forward_time=0.034, loss=4.776, loss_att=2.592, loss_ctc=6.961, acc=0.901, backward_time=0.022, optim_step_time=0.025, optim0_lr0=1.952e-04, train_time=0.102 -[v016] 2022-01-31 05:16:13,230 (trainer:328) INFO: 48epoch results: [train] iter_time=9.711e-04, forward_time=0.037, loss=5.182, loss_att=2.787, loss_ctc=7.577, acc=0.899, backward_time=0.022, optim_step_time=0.023, optim0_lr0=1.962e-04, train_time=0.105, time=57.75 seconds, total_count=26256, gpu_max_cached_mem_GB=5.822, [valid] loss=7.225, loss_att=5.276, loss_ctc=9.175, acc=0.883, cer=0.129, wer=0.471, cer_ctc=0.208, time=6.54 seconds, total_count=8544, gpu_max_cached_mem_GB=5.822, [att_plot] time=42.88 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 05:16:19,477 (trainer:375) INFO: The best model has been updated: train.loss, train.acc, valid.acc -[v016] 2022-01-31 05:16:19,527 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/43epoch.pth -[v016] 2022-01-31 05:16:19,568 (trainer:261) INFO: 49/200epoch started. Estimated time to finish: 6 hours, 9 minutes and 45.13 seconds -[v016] 2022-01-31 05:16:37,155 (trainer:653) INFO: 49epoch:train:1-27batch: iter_time=0.301, forward_time=0.197, loss=4.850, loss_att=2.533, loss_ctc=7.166, acc=0.901, backward_time=0.035, optim_step_time=0.036, optim0_lr0=1.951e-04, train_time=0.629 -[v016] 2022-01-31 05:16:44,604 (trainer:653) INFO: 49epoch:train:28-54batch: iter_time=0.176, forward_time=0.033, loss=3.608, loss_att=2.071, loss_ctc=5.144, acc=0.906, backward_time=0.023, optim_step_time=0.024, optim0_lr0=1.950e-04, train_time=0.277 -[v016] 2022-01-31 05:16:50,693 (trainer:653) INFO: 49epoch:train:55-81batch: iter_time=0.130, forward_time=0.033, loss=4.970, loss_att=2.616, loss_ctc=7.323, acc=0.901, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.949e-04, train_time=0.225 -[v016] 2022-01-31 05:16:57,187 (trainer:653) INFO: 49epoch:train:82-108batch: iter_time=0.126, forward_time=0.046, loss=4.937, loss_att=2.596, loss_ctc=7.278, acc=0.902, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.948e-04, train_time=0.240 -[v016] 2022-01-31 05:17:03,368 (trainer:653) INFO: 49epoch:train:109-135batch: iter_time=0.130, forward_time=0.033, loss=5.246, loss_att=2.803, loss_ctc=7.689, acc=0.902, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.947e-04, train_time=0.229 -[v016] 2022-01-31 05:17:09,497 (trainer:653) INFO: 49epoch:train:136-162batch: iter_time=0.127, forward_time=0.035, loss=5.551, loss_att=2.928, loss_ctc=8.173, acc=0.905, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.946e-04, train_time=0.227 -[v016] 2022-01-31 05:17:15,869 (trainer:653) INFO: 49epoch:train:163-189batch: iter_time=0.133, forward_time=0.036, loss=4.763, loss_att=2.589, loss_ctc=6.937, acc=0.909, backward_time=0.023, optim_step_time=0.024, optim0_lr0=1.945e-04, train_time=0.236 -[v016] 2022-01-31 05:17:22,324 (trainer:653) INFO: 49epoch:train:190-216batch: iter_time=0.137, forward_time=0.038, loss=4.316, loss_att=2.311, loss_ctc=6.320, acc=0.911, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.944e-04, train_time=0.239 -[v016] 2022-01-31 05:17:28,038 (trainer:653) INFO: 49epoch:train:217-243batch: iter_time=0.108, forward_time=0.038, loss=5.016, loss_att=2.694, loss_ctc=7.338, acc=0.897, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.943e-04, train_time=0.211 -[v016] 2022-01-31 05:17:34,047 (trainer:653) INFO: 49epoch:train:244-270batch: iter_time=0.122, forward_time=0.033, loss=4.837, loss_att=2.467, loss_ctc=7.208, acc=0.906, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.942e-04, train_time=0.219 -[v016] 2022-01-31 05:17:39,670 (trainer:653) INFO: 49epoch:train:271-297batch: iter_time=0.112, forward_time=0.033, loss=5.102, loss_att=2.640, loss_ctc=7.564, acc=0.905, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.941e-04, train_time=0.211 -[v016] 2022-01-31 05:17:45,817 (trainer:653) INFO: 49epoch:train:298-324batch: iter_time=0.129, forward_time=0.034, loss=5.092, loss_att=2.713, loss_ctc=7.470, acc=0.906, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.940e-04, train_time=0.227 -[v016] 2022-01-31 05:17:52,310 (trainer:653) INFO: 49epoch:train:325-351batch: iter_time=0.144, forward_time=0.033, loss=5.136, loss_att=2.814, loss_ctc=7.459, acc=0.898, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.939e-04, train_time=0.240 -[v016] 2022-01-31 05:17:58,507 (trainer:653) INFO: 49epoch:train:352-378batch: iter_time=0.124, forward_time=0.038, loss=5.563, loss_att=2.918, loss_ctc=8.207, acc=0.894, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.938e-04, train_time=0.229 -[v016] 2022-01-31 05:18:04,740 (trainer:653) INFO: 49epoch:train:379-405batch: iter_time=0.128, forward_time=0.034, loss=6.239, loss_att=3.318, loss_ctc=9.161, acc=0.888, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.937e-04, train_time=0.231 -[v016] 2022-01-31 05:18:11,936 (trainer:653) INFO: 49epoch:train:406-432batch: iter_time=0.166, forward_time=0.035, loss=5.055, loss_att=2.667, loss_ctc=7.444, acc=0.906, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.936e-04, train_time=0.266 -[v016] 2022-01-31 05:18:18,726 (trainer:653) INFO: 49epoch:train:433-459batch: iter_time=0.153, forward_time=0.034, loss=5.343, loss_att=2.811, loss_ctc=7.875, acc=0.900, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.935e-04, train_time=0.251 -[v016] 2022-01-31 05:18:26,295 (trainer:653) INFO: 49epoch:train:460-486batch: iter_time=0.178, forward_time=0.034, loss=5.987, loss_att=3.135, loss_ctc=8.839, acc=0.887, backward_time=0.026, optim_step_time=0.022, optim0_lr0=1.934e-04, train_time=0.280 -[v016] 2022-01-31 05:18:32,080 (trainer:653) INFO: 49epoch:train:487-513batch: iter_time=0.118, forward_time=0.033, loss=5.503, loss_att=2.975, loss_ctc=8.030, acc=0.891, backward_time=0.023, optim_step_time=0.021, optim0_lr0=1.933e-04, train_time=0.214 -[v016] 2022-01-31 05:18:36,574 (trainer:653) INFO: 49epoch:train:514-540batch: iter_time=0.069, forward_time=0.032, loss=4.306, loss_att=2.462, loss_ctc=6.151, acc=0.898, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.932e-04, train_time=0.166 -[v016] 2022-01-31 05:19:35,833 (trainer:328) INFO: 49epoch results: [train] iter_time=0.140, forward_time=0.043, loss=5.057, loss_att=2.698, loss_ctc=7.415, acc=0.901, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.941e-04, train_time=0.252, time=2 minutes and 18.46 seconds, total_count=26803, gpu_max_cached_mem_GB=5.822, [valid] loss=7.162, loss_att=5.380, loss_ctc=8.944, acc=0.881, cer=0.132, wer=0.481, cer_ctc=0.207, time=27.32 seconds, total_count=8722, gpu_max_cached_mem_GB=5.822, [att_plot] time=30.34 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 05:19:38,075 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 05:19:38,079 (trainer:261) INFO: 50/200epoch started. Estimated time to finish: 6 hours, 11 minutes and 53 seconds -[v016] 2022-01-31 05:19:41,176 (trainer:653) INFO: 50epoch:train:1-27batch: iter_time=0.003, forward_time=0.039, loss=5.496, loss_att=2.715, loss_ctc=8.276, acc=0.907, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.931e-04, train_time=0.110 -[v016] 2022-01-31 05:19:44,005 (trainer:653) INFO: 50epoch:train:28-54batch: iter_time=2.146e-04, forward_time=0.035, loss=4.410, loss_att=2.379, loss_ctc=6.441, acc=0.901, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.930e-04, train_time=0.105 -[v016] 2022-01-31 05:19:47,242 (trainer:653) INFO: 50epoch:train:55-81batch: iter_time=2.064e-04, forward_time=0.041, loss=4.806, loss_att=2.548, loss_ctc=7.065, acc=0.909, backward_time=0.024, optim_step_time=0.029, optim0_lr0=1.929e-04, train_time=0.120 -[v016] 2022-01-31 05:19:49,985 (trainer:653) INFO: 50epoch:train:82-108batch: iter_time=1.129e-04, forward_time=0.035, loss=5.390, loss_att=2.701, loss_ctc=8.079, acc=0.907, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.928e-04, train_time=0.101 -[v016] 2022-01-31 05:19:52,576 (trainer:653) INFO: 50epoch:train:109-135batch: iter_time=1.024e-04, forward_time=0.034, loss=4.890, loss_att=2.715, loss_ctc=7.064, acc=0.895, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.927e-04, train_time=0.096 -[v016] 2022-01-31 05:19:55,174 (trainer:653) INFO: 50epoch:train:136-162batch: iter_time=9.628e-05, forward_time=0.034, loss=5.095, loss_att=2.732, loss_ctc=7.459, acc=0.899, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.926e-04, train_time=0.096 -[v016] 2022-01-31 05:19:58,322 (trainer:653) INFO: 50epoch:train:163-189batch: iter_time=2.596e-04, forward_time=0.040, loss=5.196, loss_att=2.702, loss_ctc=7.690, acc=0.905, backward_time=0.023, optim_step_time=0.027, optim0_lr0=1.925e-04, train_time=0.116 -[v016] 2022-01-31 05:20:01,034 (trainer:653) INFO: 50epoch:train:190-216batch: iter_time=0.002, forward_time=0.035, loss=5.159, loss_att=2.622, loss_ctc=7.696, acc=0.910, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.924e-04, train_time=0.100 -[v016] 2022-01-31 05:20:03,566 (trainer:653) INFO: 50epoch:train:217-243batch: iter_time=9.249e-05, forward_time=0.033, loss=3.811, loss_att=2.079, loss_ctc=5.543, acc=0.911, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.923e-04, train_time=0.094 -[v016] 2022-01-31 05:20:06,673 (trainer:653) INFO: 50epoch:train:244-270batch: iter_time=2.492e-04, forward_time=0.042, loss=4.926, loss_att=2.709, loss_ctc=7.143, acc=0.895, backward_time=0.023, optim_step_time=0.028, optim0_lr0=1.922e-04, train_time=0.115 -[v016] 2022-01-31 05:20:09,405 (trainer:653) INFO: 50epoch:train:271-297batch: iter_time=1.102e-04, forward_time=0.035, loss=5.176, loss_att=2.738, loss_ctc=7.614, acc=0.909, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.921e-04, train_time=0.101 -[v016] 2022-01-31 05:20:12,056 (trainer:653) INFO: 50epoch:train:298-324batch: iter_time=1.038e-04, forward_time=0.035, loss=5.537, loss_att=3.076, loss_ctc=7.997, acc=0.895, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.920e-04, train_time=0.098 -[v016] 2022-01-31 05:20:14,584 (trainer:653) INFO: 50epoch:train:325-351batch: iter_time=9.903e-05, forward_time=0.033, loss=4.270, loss_att=2.288, loss_ctc=6.251, acc=0.909, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.919e-04, train_time=0.093 -[v016] 2022-01-31 05:20:17,858 (trainer:653) INFO: 50epoch:train:352-378batch: iter_time=2.774e-04, forward_time=0.041, loss=3.991, loss_att=2.169, loss_ctc=5.813, acc=0.916, backward_time=0.027, optim_step_time=0.028, optim0_lr0=1.919e-04, train_time=0.121 -[v016] 2022-01-31 05:20:21,201 (trainer:653) INFO: 50epoch:train:379-405batch: iter_time=4.174e-04, forward_time=0.044, loss=5.070, loss_att=2.687, loss_ctc=7.454, acc=0.894, backward_time=0.024, optim_step_time=0.033, optim0_lr0=1.918e-04, train_time=0.124 -[v016] 2022-01-31 05:20:24,398 (trainer:653) INFO: 50epoch:train:406-432batch: iter_time=1.479e-04, forward_time=0.041, loss=4.396, loss_att=2.364, loss_ctc=6.428, acc=0.910, backward_time=0.028, optim_step_time=0.027, optim0_lr0=1.917e-04, train_time=0.118 -[v016] 2022-01-31 05:20:27,455 (trainer:653) INFO: 50epoch:train:433-459batch: iter_time=3.377e-04, forward_time=0.038, loss=4.859, loss_att=2.649, loss_ctc=7.068, acc=0.901, backward_time=0.025, optim_step_time=0.028, optim0_lr0=1.916e-04, train_time=0.113 -[v016] 2022-01-31 05:20:31,165 (trainer:653) INFO: 50epoch:train:460-486batch: iter_time=8.962e-04, forward_time=0.052, loss=4.412, loss_att=2.445, loss_ctc=6.378, acc=0.901, backward_time=0.027, optim_step_time=0.028, optim0_lr0=1.915e-04, train_time=0.137 -[v016] 2022-01-31 05:20:35,471 (trainer:653) INFO: 50epoch:train:487-513batch: iter_time=0.001, forward_time=0.049, loss=5.601, loss_att=3.043, loss_ctc=8.158, acc=0.890, backward_time=0.030, optim_step_time=0.031, optim0_lr0=1.914e-04, train_time=0.154 -[v016] 2022-01-31 05:20:44,122 (trainer:653) INFO: 50epoch:train:514-540batch: iter_time=0.006, forward_time=0.097, loss=5.268, loss_att=2.886, loss_ctc=7.650, acc=0.893, backward_time=0.029, optim_step_time=0.068, optim0_lr0=1.913e-04, train_time=0.309 -[v016] 2022-01-31 05:21:30,192 (trainer:328) INFO: 50epoch results: [train] iter_time=0.001, forward_time=0.042, loss=4.897, loss_att=2.618, loss_ctc=7.176, acc=0.902, backward_time=0.024, optim_step_time=0.027, optim0_lr0=1.922e-04, train_time=0.121, time=1 minute and 7.16 seconds, total_count=27350, gpu_max_cached_mem_GB=5.822, [valid] loss=6.922, loss_att=5.204, loss_ctc=8.640, acc=0.886, cer=0.123, wer=0.462, cer_ctc=0.198, time=9.47 seconds, total_count=8900, gpu_max_cached_mem_GB=5.822, [att_plot] time=35.42 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 05:21:33,871 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc, valid.acc -[v016] 2022-01-31 05:21:33,876 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/42epoch.pth -[v016] 2022-01-31 05:21:33,881 (trainer:261) INFO: 51/200epoch started. Estimated time to finish: 6 hours, 6 minutes and 45.39 seconds -[v016] 2022-01-31 05:21:40,514 (trainer:653) INFO: 51epoch:train:1-27batch: iter_time=0.009, forward_time=0.148, loss=4.508, loss_att=2.392, loss_ctc=6.624, acc=0.909, backward_time=0.030, optim_step_time=0.022, optim0_lr0=1.912e-04, train_time=0.237 -[v016] 2022-01-31 05:21:43,337 (trainer:653) INFO: 51epoch:train:28-54batch: iter_time=1.517e-04, forward_time=0.036, loss=4.609, loss_att=2.412, loss_ctc=6.806, acc=0.908, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.911e-04, train_time=0.104 -[v016] 2022-01-31 05:21:46,096 (trainer:653) INFO: 51epoch:train:55-81batch: iter_time=1.055e-04, forward_time=0.035, loss=5.123, loss_att=2.658, loss_ctc=7.589, acc=0.906, backward_time=0.024, optim_step_time=0.022, optim0_lr0=1.910e-04, train_time=0.102 -[v016] 2022-01-31 05:21:48,807 (trainer:653) INFO: 51epoch:train:82-108batch: iter_time=1.157e-04, forward_time=0.035, loss=4.504, loss_att=2.346, loss_ctc=6.662, acc=0.909, backward_time=0.024, optim_step_time=0.022, optim0_lr0=1.909e-04, train_time=0.100 -[v016] 2022-01-31 05:21:51,657 (trainer:653) INFO: 51epoch:train:109-135batch: iter_time=1.198e-04, forward_time=0.039, loss=5.110, loss_att=2.667, loss_ctc=7.554, acc=0.908, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.908e-04, train_time=0.105 -[v016] 2022-01-31 05:21:54,372 (trainer:653) INFO: 51epoch:train:136-162batch: iter_time=1.315e-04, forward_time=0.035, loss=4.691, loss_att=2.604, loss_ctc=6.777, acc=0.904, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.907e-04, train_time=0.100 -[v016] 2022-01-31 05:21:57,085 (trainer:653) INFO: 51epoch:train:163-189batch: iter_time=1.313e-04, forward_time=0.035, loss=5.190, loss_att=2.680, loss_ctc=7.701, acc=0.899, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.906e-04, train_time=0.100 -[v016] 2022-01-31 05:21:59,953 (trainer:653) INFO: 51epoch:train:190-216batch: iter_time=0.006, forward_time=0.035, loss=4.549, loss_att=2.451, loss_ctc=6.648, acc=0.907, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.905e-04, train_time=0.106 -[v016] 2022-01-31 05:22:02,620 (trainer:653) INFO: 51epoch:train:217-243batch: iter_time=1.002e-04, forward_time=0.034, loss=4.297, loss_att=2.365, loss_ctc=6.229, acc=0.909, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.904e-04, train_time=0.099 -[v016] 2022-01-31 05:22:05,328 (trainer:653) INFO: 51epoch:train:244-270batch: iter_time=1.198e-04, forward_time=0.035, loss=4.785, loss_att=2.461, loss_ctc=7.110, acc=0.914, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.903e-04, train_time=0.100 -[v016] 2022-01-31 05:22:08,185 (trainer:653) INFO: 51epoch:train:271-297batch: iter_time=1.156e-04, forward_time=0.037, loss=5.605, loss_att=2.926, loss_ctc=8.284, acc=0.902, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.902e-04, train_time=0.106 -[v016] 2022-01-31 05:22:10,982 (trainer:653) INFO: 51epoch:train:298-324batch: iter_time=1.325e-04, forward_time=0.036, loss=4.957, loss_att=2.610, loss_ctc=7.305, acc=0.900, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.901e-04, train_time=0.103 -[v016] 2022-01-31 05:22:13,753 (trainer:653) INFO: 51epoch:train:325-351batch: iter_time=1.279e-04, forward_time=0.035, loss=4.784, loss_att=2.526, loss_ctc=7.043, acc=0.892, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.900e-04, train_time=0.102 -[v016] 2022-01-31 05:22:16,393 (trainer:653) INFO: 51epoch:train:352-378batch: iter_time=1.184e-04, forward_time=0.034, loss=4.783, loss_att=2.536, loss_ctc=7.029, acc=0.904, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.899e-04, train_time=0.098 -[v016] 2022-01-31 05:22:19,277 (trainer:653) INFO: 51epoch:train:379-405batch: iter_time=2.811e-04, forward_time=0.035, loss=4.762, loss_att=2.407, loss_ctc=7.117, acc=0.916, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.899e-04, train_time=0.107 -[v016] 2022-01-31 05:22:21,886 (trainer:653) INFO: 51epoch:train:406-432batch: iter_time=1.156e-04, forward_time=0.034, loss=4.669, loss_att=2.501, loss_ctc=6.837, acc=0.907, backward_time=0.023, optim_step_time=0.021, optim0_lr0=1.898e-04, train_time=0.096 -[v016] 2022-01-31 05:22:24,526 (trainer:653) INFO: 51epoch:train:433-459batch: iter_time=8.982e-05, forward_time=0.035, loss=5.461, loss_att=2.810, loss_ctc=8.112, acc=0.899, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.897e-04, train_time=0.098 -[v016] 2022-01-31 05:22:27,123 (trainer:653) INFO: 51epoch:train:460-486batch: iter_time=9.714e-05, forward_time=0.034, loss=4.665, loss_att=2.553, loss_ctc=6.777, acc=0.898, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.896e-04, train_time=0.096 -[v016] 2022-01-31 05:22:29,745 (trainer:653) INFO: 51epoch:train:487-513batch: iter_time=1.154e-04, forward_time=0.035, loss=4.730, loss_att=2.533, loss_ctc=6.927, acc=0.900, backward_time=0.023, optim_step_time=0.021, optim0_lr0=1.895e-04, train_time=0.097 -[v016] 2022-01-31 05:22:32,871 (trainer:653) INFO: 51epoch:train:514-540batch: iter_time=0.016, forward_time=0.035, loss=5.285, loss_att=2.664, loss_ctc=7.906, acc=0.907, backward_time=0.023, optim_step_time=0.021, optim0_lr0=1.894e-04, train_time=0.116 -[v016] 2022-01-31 05:23:09,866 (trainer:328) INFO: 51epoch results: [train] iter_time=0.002, forward_time=0.041, loss=4.853, loss_att=2.553, loss_ctc=7.152, acc=0.905, backward_time=0.024, optim_step_time=0.022, optim0_lr0=1.903e-04, train_time=0.108, time=59.7 seconds, total_count=27897, gpu_max_cached_mem_GB=5.822, [valid] loss=6.977, loss_att=5.222, loss_ctc=8.731, acc=0.888, cer=0.123, wer=0.462, cer_ctc=0.201, time=5.97 seconds, total_count=9078, gpu_max_cached_mem_GB=5.822, [att_plot] time=30.23 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 05:23:11,979 (trainer:375) INFO: The best model has been updated: train.loss, train.acc, valid.acc -[v016] 2022-01-31 05:23:11,983 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/44epoch.pth -[v016] 2022-01-31 05:23:11,986 (trainer:261) INFO: 52/200epoch started. Estimated time to finish: 6 hours and 25.11 seconds -[v016] 2022-01-31 05:23:14,819 (trainer:653) INFO: 52epoch:train:1-27batch: iter_time=0.004, forward_time=0.036, loss=4.495, loss_att=2.362, loss_ctc=6.628, acc=0.908, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.893e-04, train_time=0.105 -[v016] 2022-01-31 05:23:17,427 (trainer:653) INFO: 52epoch:train:28-54batch: iter_time=1.133e-04, forward_time=0.034, loss=4.284, loss_att=2.349, loss_ctc=6.218, acc=0.907, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.892e-04, train_time=0.096 -[v016] 2022-01-31 05:23:20,134 (trainer:653) INFO: 52epoch:train:55-81batch: iter_time=2.684e-04, forward_time=0.035, loss=4.859, loss_att=2.568, loss_ctc=7.150, acc=0.905, backward_time=0.023, optim_step_time=0.021, optim0_lr0=1.891e-04, train_time=0.100 -[v016] 2022-01-31 05:23:22,685 (trainer:653) INFO: 52epoch:train:82-108batch: iter_time=1.118e-04, forward_time=0.034, loss=3.791, loss_att=2.040, loss_ctc=5.543, acc=0.912, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.890e-04, train_time=0.094 -[v016] 2022-01-31 05:23:25,230 (trainer:653) INFO: 52epoch:train:109-135batch: iter_time=9.460e-05, forward_time=0.033, loss=4.076, loss_att=2.072, loss_ctc=6.080, acc=0.911, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.889e-04, train_time=0.094 -[v016] 2022-01-31 05:23:28,195 (trainer:653) INFO: 52epoch:train:136-162batch: iter_time=3.362e-04, forward_time=0.041, loss=5.854, loss_att=2.900, loss_ctc=8.808, acc=0.900, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.888e-04, train_time=0.109 -[v016] 2022-01-31 05:23:30,767 (trainer:653) INFO: 52epoch:train:163-189batch: iter_time=1.254e-04, forward_time=0.034, loss=4.720, loss_att=2.494, loss_ctc=6.946, acc=0.902, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.887e-04, train_time=0.095 -[v016] 2022-01-31 05:23:33,733 (trainer:653) INFO: 52epoch:train:190-216batch: iter_time=0.010, forward_time=0.037, loss=4.740, loss_att=2.511, loss_ctc=6.970, acc=0.912, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.886e-04, train_time=0.110 -[v016] 2022-01-31 05:23:36,618 (trainer:653) INFO: 52epoch:train:217-243batch: iter_time=2.720e-04, forward_time=0.036, loss=4.865, loss_att=2.532, loss_ctc=7.199, acc=0.910, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.886e-04, train_time=0.107 -[v016] 2022-01-31 05:23:39,178 (trainer:653) INFO: 52epoch:train:244-270batch: iter_time=1.193e-04, forward_time=0.034, loss=4.417, loss_att=2.273, loss_ctc=6.561, acc=0.910, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.885e-04, train_time=0.095 -[v016] 2022-01-31 05:23:41,896 (trainer:653) INFO: 52epoch:train:271-297batch: iter_time=9.906e-05, forward_time=0.037, loss=5.124, loss_att=2.684, loss_ctc=7.564, acc=0.909, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.884e-04, train_time=0.100 -[v016] 2022-01-31 05:23:44,545 (trainer:653) INFO: 52epoch:train:298-324batch: iter_time=2.427e-04, forward_time=0.035, loss=4.813, loss_att=2.561, loss_ctc=7.064, acc=0.908, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.883e-04, train_time=0.098 -[v016] 2022-01-31 05:23:47,030 (trainer:653) INFO: 52epoch:train:325-351batch: iter_time=9.328e-05, forward_time=0.032, loss=3.897, loss_att=2.192, loss_ctc=5.603, acc=0.912, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.882e-04, train_time=0.092 -[v016] 2022-01-31 05:23:49,715 (trainer:653) INFO: 52epoch:train:352-378batch: iter_time=9.429e-05, forward_time=0.035, loss=5.670, loss_att=2.937, loss_ctc=8.403, acc=0.903, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.881e-04, train_time=0.099 -[v016] 2022-01-31 05:23:52,306 (trainer:653) INFO: 52epoch:train:379-405batch: iter_time=9.259e-05, forward_time=0.034, loss=4.703, loss_att=2.463, loss_ctc=6.944, acc=0.906, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.880e-04, train_time=0.096 -[v016] 2022-01-31 05:23:54,860 (trainer:653) INFO: 52epoch:train:406-432batch: iter_time=1.071e-04, forward_time=0.034, loss=4.406, loss_att=2.389, loss_ctc=6.423, acc=0.911, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.879e-04, train_time=0.094 -[v016] 2022-01-31 05:23:57,411 (trainer:653) INFO: 52epoch:train:433-459batch: iter_time=9.618e-05, forward_time=0.034, loss=4.231, loss_att=2.241, loss_ctc=6.221, acc=0.917, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.878e-04, train_time=0.094 -[v016] 2022-01-31 05:24:00,049 (trainer:653) INFO: 52epoch:train:460-486batch: iter_time=9.708e-05, forward_time=0.034, loss=4.299, loss_att=2.342, loss_ctc=6.256, acc=0.911, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.877e-04, train_time=0.098 -[v016] 2022-01-31 05:24:03,503 (trainer:653) INFO: 52epoch:train:487-513batch: iter_time=9.531e-05, forward_time=0.034, loss=4.805, loss_att=2.526, loss_ctc=7.084, acc=0.904, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.877e-04, train_time=0.128 -[v016] 2022-01-31 05:24:06,241 (trainer:653) INFO: 52epoch:train:514-540batch: iter_time=0.004, forward_time=0.034, loss=5.659, loss_att=2.946, loss_ctc=8.372, acc=0.899, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.876e-04, train_time=0.101 -[v016] 2022-01-31 05:24:43,934 (trainer:328) INFO: 52epoch results: [train] iter_time=0.001, forward_time=0.035, loss=4.692, loss_att=2.475, loss_ctc=6.908, acc=0.908, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.884e-04, train_time=0.100, time=54.98 seconds, total_count=28444, gpu_max_cached_mem_GB=5.822, [valid] loss=6.900, loss_att=5.146, loss_ctc=8.653, acc=0.889, cer=0.125, wer=0.453, cer_ctc=0.203, time=5.95 seconds, total_count=9256, gpu_max_cached_mem_GB=5.822, [att_plot] time=31 seconds, total_count=0, gpu_max_cached_mem_GB=5.822 -[v016] 2022-01-31 05:24:46,024 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc, valid.acc -[v016] 2022-01-31 05:24:46,031 (trainer:261) INFO: 53/200epoch started. Estimated time to finish: 5 hours, 54 minutes and 3.68 seconds -[v016] 2022-01-31 05:24:49,143 (trainer:653) INFO: 53epoch:train:1-27batch: iter_time=0.010, forward_time=0.035, loss=4.775, loss_att=2.409, loss_ctc=7.141, acc=0.906, backward_time=0.024, optim_step_time=0.021, optim0_lr0=1.875e-04, train_time=0.111 -[v016] 2022-01-31 05:24:51,759 (trainer:653) INFO: 53epoch:train:28-54batch: iter_time=1.093e-04, forward_time=0.034, loss=4.650, loss_att=2.403, loss_ctc=6.897, acc=0.909, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.874e-04, train_time=0.097 -[v016] 2022-01-31 05:24:54,449 (trainer:653) INFO: 53epoch:train:55-81batch: iter_time=1.422e-04, forward_time=0.037, loss=4.734, loss_att=2.505, loss_ctc=6.962, acc=0.903, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.873e-04, train_time=0.099 -[v016] 2022-01-31 05:24:57,130 (trainer:653) INFO: 53epoch:train:82-108batch: iter_time=1.267e-04, forward_time=0.035, loss=4.458, loss_att=2.325, loss_ctc=6.591, acc=0.915, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.872e-04, train_time=0.099 -[v016] 2022-01-31 05:24:59,677 (trainer:653) INFO: 53epoch:train:109-135batch: iter_time=1.023e-04, forward_time=0.033, loss=4.145, loss_att=2.184, loss_ctc=6.106, acc=0.917, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.871e-04, train_time=0.094 -[v016] 2022-01-31 05:25:02,198 (trainer:653) INFO: 53epoch:train:136-162batch: iter_time=9.824e-05, forward_time=0.033, loss=4.213, loss_att=2.303, loss_ctc=6.124, acc=0.908, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.870e-04, train_time=0.093 -[v016] 2022-01-31 05:25:04,933 (trainer:653) INFO: 53epoch:train:163-189batch: iter_time=9.553e-05, forward_time=0.037, loss=4.587, loss_att=2.425, loss_ctc=6.749, acc=0.916, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.869e-04, train_time=0.101 -[v016] 2022-01-31 05:25:07,870 (trainer:653) INFO: 53epoch:train:190-216batch: iter_time=0.011, forward_time=0.034, loss=4.756, loss_att=2.373, loss_ctc=7.139, acc=0.908, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.868e-04, train_time=0.109 -[v016] 2022-01-31 05:25:10,455 (trainer:653) INFO: 53epoch:train:217-243batch: iter_time=1.002e-04, forward_time=0.033, loss=4.753, loss_att=2.524, loss_ctc=6.981, acc=0.898, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.867e-04, train_time=0.095 -[v016] 2022-01-31 05:25:13,010 (trainer:653) INFO: 53epoch:train:244-270batch: iter_time=1.108e-04, forward_time=0.033, loss=3.666, loss_att=1.972, loss_ctc=5.360, acc=0.916, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.867e-04, train_time=0.094 -[v016] 2022-01-31 05:25:15,693 (trainer:653) INFO: 53epoch:train:271-297batch: iter_time=1.033e-04, forward_time=0.035, loss=4.996, loss_att=2.601, loss_ctc=7.391, acc=0.907, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.866e-04, train_time=0.099 -[v016] 2022-01-31 05:25:18,714 (trainer:653) INFO: 53epoch:train:298-324batch: iter_time=2.003e-04, forward_time=0.040, loss=3.958, loss_att=2.105, loss_ctc=5.811, acc=0.917, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.865e-04, train_time=0.112 -[v016] 2022-01-31 05:25:21,564 (trainer:653) INFO: 53epoch:train:325-351batch: iter_time=2.106e-04, forward_time=0.034, loss=4.191, loss_att=2.296, loss_ctc=6.086, acc=0.911, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.864e-04, train_time=0.105 -[v016] 2022-01-31 05:25:24,238 (trainer:653) INFO: 53epoch:train:352-378batch: iter_time=1.259e-04, forward_time=0.035, loss=4.919, loss_att=2.596, loss_ctc=7.243, acc=0.908, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.863e-04, train_time=0.099 -[v016] 2022-01-31 05:25:26,883 (trainer:653) INFO: 53epoch:train:379-405batch: iter_time=9.510e-05, forward_time=0.037, loss=4.254, loss_att=2.319, loss_ctc=6.189, acc=0.901, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.862e-04, train_time=0.098 -[v016] 2022-01-31 05:25:29,459 (trainer:653) INFO: 53epoch:train:406-432batch: iter_time=1.161e-04, forward_time=0.034, loss=4.551, loss_att=2.367, loss_ctc=6.735, acc=0.912, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.861e-04, train_time=0.095 -[v016] 2022-01-31 05:25:32,114 (trainer:653) INFO: 53epoch:train:433-459batch: iter_time=9.983e-05, forward_time=0.035, loss=5.678, loss_att=2.902, loss_ctc=8.454, acc=0.900, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.860e-04, train_time=0.098 -[v016] 2022-01-31 05:25:34,682 (trainer:653) INFO: 53epoch:train:460-486batch: iter_time=1.085e-04, forward_time=0.033, loss=4.766, loss_att=2.512, loss_ctc=7.019, acc=0.903, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.860e-04, train_time=0.095 -[v016] 2022-01-31 05:25:37,251 (trainer:653) INFO: 53epoch:train:487-513batch: iter_time=9.201e-05, forward_time=0.034, loss=5.119, loss_att=2.564, loss_ctc=7.675, acc=0.904, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.859e-04, train_time=0.095 -[v016] 2022-01-31 05:25:39,958 (trainer:653) INFO: 53epoch:train:514-540batch: iter_time=0.002, forward_time=0.035, loss=5.499, loss_att=2.802, loss_ctc=8.197, acc=0.911, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.858e-04, train_time=0.100 -[v016] 2022-01-31 05:26:19,905 (trainer:328) INFO: 53epoch results: [train] iter_time=0.001, forward_time=0.035, loss=4.626, loss_att=2.423, loss_ctc=6.829, acc=0.908, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.866e-04, train_time=0.099, time=54.63 seconds, total_count=28991, gpu_max_cached_mem_GB=5.824, [valid] loss=6.872, loss_att=5.295, loss_ctc=8.450, acc=0.888, cer=0.120, wer=0.447, cer_ctc=0.189, time=6.46 seconds, total_count=9434, gpu_max_cached_mem_GB=5.824, [att_plot] time=32.75 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 05:26:22,436 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc -[v016] 2022-01-31 05:26:22,441 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/45epoch.pth, exp/asr_train_asr_raw_en_word/46epoch.pth -[v016] 2022-01-31 05:26:22,444 (trainer:261) INFO: 54/200epoch started. Estimated time to finish: 5 hours, 48 minutes and 10.22 seconds -[v016] 2022-01-31 05:26:27,953 (trainer:653) INFO: 54epoch:train:1-27batch: iter_time=0.014, forward_time=0.058, loss=4.382, loss_att=2.311, loss_ctc=6.452, acc=0.905, backward_time=0.033, optim_step_time=0.023, optim0_lr0=1.857e-04, train_time=0.199 -[v016] 2022-01-31 05:26:30,648 (trainer:653) INFO: 54epoch:train:28-54batch: iter_time=1.126e-04, forward_time=0.036, loss=5.059, loss_att=2.618, loss_ctc=7.500, acc=0.912, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.856e-04, train_time=0.100 -[v016] 2022-01-31 05:26:33,210 (trainer:653) INFO: 54epoch:train:55-81batch: iter_time=9.142e-05, forward_time=0.033, loss=3.888, loss_att=2.054, loss_ctc=5.723, acc=0.923, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.855e-04, train_time=0.095 -[v016] 2022-01-31 05:26:36,247 (trainer:653) INFO: 54epoch:train:82-108batch: iter_time=4.351e-04, forward_time=0.039, loss=4.005, loss_att=2.142, loss_ctc=5.868, acc=0.913, backward_time=0.023, optim_step_time=0.029, optim0_lr0=1.854e-04, train_time=0.112 -[v016] 2022-01-31 05:26:38,868 (trainer:653) INFO: 54epoch:train:109-135batch: iter_time=9.144e-05, forward_time=0.034, loss=3.939, loss_att=2.104, loss_ctc=5.775, acc=0.916, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.853e-04, train_time=0.097 -[v016] 2022-01-31 05:26:41,844 (trainer:653) INFO: 54epoch:train:136-162batch: iter_time=0.014, forward_time=0.034, loss=4.630, loss_att=2.398, loss_ctc=6.861, acc=0.906, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.852e-04, train_time=0.110 -[v016] 2022-01-31 05:26:44,934 (trainer:653) INFO: 54epoch:train:163-189batch: iter_time=3.890e-04, forward_time=0.040, loss=5.093, loss_att=2.618, loss_ctc=7.568, acc=0.899, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.852e-04, train_time=0.114 -[v016] 2022-01-31 05:26:47,545 (trainer:653) INFO: 54epoch:train:190-216batch: iter_time=1.033e-04, forward_time=0.034, loss=4.380, loss_att=2.259, loss_ctc=6.501, acc=0.914, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.851e-04, train_time=0.097 -[v016] 2022-01-31 05:26:50,162 (trainer:653) INFO: 54epoch:train:217-243batch: iter_time=1.058e-04, forward_time=0.034, loss=4.313, loss_att=2.205, loss_ctc=6.420, acc=0.916, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.850e-04, train_time=0.097 -[v016] 2022-01-31 05:26:52,722 (trainer:653) INFO: 54epoch:train:244-270batch: iter_time=1.048e-04, forward_time=0.033, loss=4.396, loss_att=2.356, loss_ctc=6.436, acc=0.905, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.849e-04, train_time=0.095 -[v016] 2022-01-31 05:26:55,281 (trainer:653) INFO: 54epoch:train:271-297batch: iter_time=9.526e-05, forward_time=0.034, loss=4.208, loss_att=2.195, loss_ctc=6.220, acc=0.909, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.848e-04, train_time=0.095 -[v016] 2022-01-31 05:26:57,885 (trainer:653) INFO: 54epoch:train:298-324batch: iter_time=9.278e-05, forward_time=0.034, loss=4.668, loss_att=2.377, loss_ctc=6.960, acc=0.915, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.847e-04, train_time=0.096 -[v016] 2022-01-31 05:27:00,448 (trainer:653) INFO: 54epoch:train:325-351batch: iter_time=1.002e-04, forward_time=0.034, loss=4.050, loss_att=2.200, loss_ctc=5.901, acc=0.905, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.846e-04, train_time=0.095 -[v016] 2022-01-31 05:27:03,038 (trainer:653) INFO: 54epoch:train:352-378batch: iter_time=9.876e-05, forward_time=0.034, loss=3.795, loss_att=2.106, loss_ctc=5.484, acc=0.917, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.846e-04, train_time=0.096 -[v016] 2022-01-31 05:27:05,709 (trainer:653) INFO: 54epoch:train:379-405batch: iter_time=9.638e-05, forward_time=0.035, loss=5.446, loss_att=2.927, loss_ctc=7.965, acc=0.900, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.845e-04, train_time=0.099 -[v016] 2022-01-31 05:27:08,653 (trainer:653) INFO: 54epoch:train:406-432batch: iter_time=2.561e-04, forward_time=0.039, loss=4.797, loss_att=2.495, loss_ctc=7.098, acc=0.911, backward_time=0.023, optim_step_time=0.025, optim0_lr0=1.844e-04, train_time=0.109 -[v016] 2022-01-31 05:27:11,272 (trainer:653) INFO: 54epoch:train:433-459batch: iter_time=1.152e-04, forward_time=0.034, loss=4.299, loss_att=2.312, loss_ctc=6.286, acc=0.915, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.843e-04, train_time=0.097 -[v016] 2022-01-31 05:27:14,215 (trainer:653) INFO: 54epoch:train:460-486batch: iter_time=0.012, forward_time=0.034, loss=4.488, loss_att=2.435, loss_ctc=6.540, acc=0.906, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.842e-04, train_time=0.109 -[v016] 2022-01-31 05:27:17,114 (trainer:653) INFO: 54epoch:train:487-513batch: iter_time=2.038e-04, forward_time=0.035, loss=4.461, loss_att=2.365, loss_ctc=6.558, acc=0.920, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.841e-04, train_time=0.106 -[v016] 2022-01-31 05:27:19,789 (trainer:653) INFO: 54epoch:train:514-540batch: iter_time=9.969e-05, forward_time=0.034, loss=4.808, loss_att=2.458, loss_ctc=7.158, acc=0.919, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.841e-04, train_time=0.099 -[v016] 2022-01-31 05:27:57,126 (trainer:328) INFO: 54epoch results: [train] iter_time=0.002, forward_time=0.036, loss=4.491, loss_att=2.361, loss_ctc=6.622, acc=0.911, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.849e-04, train_time=0.106, time=58.13 seconds, total_count=29538, gpu_max_cached_mem_GB=5.824, [valid] loss=6.696, loss_att=5.122, loss_ctc=8.271, acc=0.892, cer=0.116, wer=0.437, cer_ctc=0.181, time=5.82 seconds, total_count=9612, gpu_max_cached_mem_GB=5.824, [att_plot] time=30.69 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 05:27:59,443 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc, valid.acc -[v016] 2022-01-31 05:27:59,453 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/47epoch.pth, exp/asr_train_asr_raw_en_word/48epoch.pth, exp/asr_train_asr_raw_en_word/49epoch.pth -[v016] 2022-01-31 05:27:59,460 (trainer:261) INFO: 55/200epoch started. Estimated time to finish: 5 hours, 42 minutes and 34.45 seconds -[v016] 2022-01-31 05:28:02,366 (trainer:653) INFO: 55epoch:train:1-27batch: iter_time=0.004, forward_time=0.036, loss=4.576, loss_att=2.275, loss_ctc=6.878, acc=0.917, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.839e-04, train_time=0.107 -[v016] 2022-01-31 05:28:05,094 (trainer:653) INFO: 55epoch:train:28-54batch: iter_time=1.025e-04, forward_time=0.035, loss=4.617, loss_att=2.318, loss_ctc=6.916, acc=0.919, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.839e-04, train_time=0.101 -[v016] 2022-01-31 05:28:07,697 (trainer:653) INFO: 55epoch:train:55-81batch: iter_time=9.373e-05, forward_time=0.034, loss=3.692, loss_att=1.888, loss_ctc=5.497, acc=0.931, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.838e-04, train_time=0.096 -[v016] 2022-01-31 05:28:10,512 (trainer:653) INFO: 55epoch:train:82-108batch: iter_time=1.633e-04, forward_time=0.035, loss=3.901, loss_att=2.022, loss_ctc=5.779, acc=0.920, backward_time=0.023, optim_step_time=0.027, optim0_lr0=1.837e-04, train_time=0.104 -[v016] 2022-01-31 05:28:13,130 (trainer:653) INFO: 55epoch:train:109-135batch: iter_time=1.217e-04, forward_time=0.034, loss=4.047, loss_att=2.107, loss_ctc=5.987, acc=0.913, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.836e-04, train_time=0.097 -[v016] 2022-01-31 05:28:16,207 (trainer:653) INFO: 55epoch:train:136-162batch: iter_time=0.017, forward_time=0.034, loss=4.486, loss_att=2.355, loss_ctc=6.618, acc=0.915, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.835e-04, train_time=0.114 -[v016] 2022-01-31 05:28:19,046 (trainer:653) INFO: 55epoch:train:163-189batch: iter_time=1.149e-04, forward_time=0.042, loss=4.153, loss_att=2.233, loss_ctc=6.074, acc=0.910, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.834e-04, train_time=0.105 -[v016] 2022-01-31 05:28:21,625 (trainer:653) INFO: 55epoch:train:190-216batch: iter_time=1.261e-04, forward_time=0.034, loss=4.350, loss_att=2.291, loss_ctc=6.409, acc=0.912, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.834e-04, train_time=0.095 -[v016] 2022-01-31 05:28:24,144 (trainer:653) INFO: 55epoch:train:217-243batch: iter_time=1.008e-04, forward_time=0.033, loss=3.656, loss_att=1.999, loss_ctc=5.314, acc=0.914, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.833e-04, train_time=0.093 -[v016] 2022-01-31 05:28:26,754 (trainer:653) INFO: 55epoch:train:244-270batch: iter_time=9.626e-05, forward_time=0.034, loss=4.813, loss_att=2.521, loss_ctc=7.105, acc=0.908, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.832e-04, train_time=0.096 -[v016] 2022-01-31 05:28:29,325 (trainer:653) INFO: 55epoch:train:271-297batch: iter_time=1.010e-04, forward_time=0.034, loss=4.366, loss_att=2.310, loss_ctc=6.422, acc=0.913, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.831e-04, train_time=0.095 -[v016] 2022-01-31 05:28:32,064 (trainer:653) INFO: 55epoch:train:298-324batch: iter_time=1.601e-04, forward_time=0.036, loss=4.299, loss_att=2.316, loss_ctc=6.282, acc=0.906, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.830e-04, train_time=0.101 -[v016] 2022-01-31 05:28:34,651 (trainer:653) INFO: 55epoch:train:325-351batch: iter_time=1.253e-04, forward_time=0.034, loss=4.195, loss_att=2.282, loss_ctc=6.108, acc=0.910, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.829e-04, train_time=0.096 -[v016] 2022-01-31 05:28:37,259 (trainer:653) INFO: 55epoch:train:352-378batch: iter_time=1.025e-04, forward_time=0.034, loss=4.951, loss_att=2.463, loss_ctc=7.439, acc=0.911, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.829e-04, train_time=0.096 -[v016] 2022-01-31 05:28:39,919 (trainer:653) INFO: 55epoch:train:379-405batch: iter_time=1.477e-04, forward_time=0.034, loss=3.981, loss_att=2.080, loss_ctc=5.882, acc=0.919, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.828e-04, train_time=0.098 -[v016] 2022-01-31 05:28:42,556 (trainer:653) INFO: 55epoch:train:406-432batch: iter_time=9.332e-05, forward_time=0.035, loss=4.772, loss_att=2.332, loss_ctc=7.212, acc=0.917, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.827e-04, train_time=0.097 -[v016] 2022-01-31 05:28:45,229 (trainer:653) INFO: 55epoch:train:433-459batch: iter_time=9.724e-05, forward_time=0.035, loss=5.683, loss_att=2.809, loss_ctc=8.558, acc=0.907, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.826e-04, train_time=0.099 -[v016] 2022-01-31 05:28:48,206 (trainer:653) INFO: 55epoch:train:460-486batch: iter_time=0.013, forward_time=0.034, loss=4.724, loss_att=2.441, loss_ctc=7.008, acc=0.913, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.825e-04, train_time=0.110 -[v016] 2022-01-31 05:28:50,754 (trainer:653) INFO: 55epoch:train:487-513batch: iter_time=9.574e-05, forward_time=0.033, loss=4.016, loss_att=2.157, loss_ctc=5.874, acc=0.910, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.825e-04, train_time=0.094 -[v016] 2022-01-31 05:28:53,325 (trainer:653) INFO: 55epoch:train:514-540batch: iter_time=1.011e-04, forward_time=0.034, loss=3.886, loss_att=2.143, loss_ctc=5.629, acc=0.915, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.824e-04, train_time=0.095 -[v016] 2022-01-31 05:29:29,448 (trainer:328) INFO: 55epoch results: [train] iter_time=0.002, forward_time=0.035, loss=4.355, loss_att=2.265, loss_ctc=6.444, acc=0.914, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.831e-04, train_time=0.099, time=54.62 seconds, total_count=30085, gpu_max_cached_mem_GB=5.824, [valid] loss=6.636, loss_att=5.122, loss_ctc=8.149, acc=0.891, cer=0.120, wer=0.451, cer_ctc=0.188, time=5.91 seconds, total_count=9790, gpu_max_cached_mem_GB=5.824, [att_plot] time=29.45 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 05:29:31,653 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc -[v016] 2022-01-31 05:29:31,661 (trainer:261) INFO: 56/200epoch started. Estimated time to finish: 5 hours, 36 minutes and 52.41 seconds -[v016] 2022-01-31 05:29:34,456 (trainer:653) INFO: 56epoch:train:1-27batch: iter_time=0.004, forward_time=0.035, loss=3.972, loss_att=2.016, loss_ctc=5.928, acc=0.925, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.823e-04, train_time=0.103 -[v016] 2022-01-31 05:29:37,178 (trainer:653) INFO: 56epoch:train:28-54batch: iter_time=1.035e-04, forward_time=0.034, loss=4.425, loss_att=2.315, loss_ctc=6.535, acc=0.913, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.822e-04, train_time=0.100 -[v016] 2022-01-31 05:29:39,772 (trainer:653) INFO: 56epoch:train:55-81batch: iter_time=1.928e-04, forward_time=0.035, loss=3.507, loss_att=1.833, loss_ctc=5.181, acc=0.925, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.821e-04, train_time=0.096 -[v016] 2022-01-31 05:29:42,377 (trainer:653) INFO: 56epoch:train:82-108batch: iter_time=1.055e-04, forward_time=0.034, loss=4.425, loss_att=2.300, loss_ctc=6.549, acc=0.911, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.820e-04, train_time=0.096 -[v016] 2022-01-31 05:29:45,219 (trainer:653) INFO: 56epoch:train:109-135batch: iter_time=1.956e-04, forward_time=0.038, loss=4.516, loss_att=2.295, loss_ctc=6.736, acc=0.913, backward_time=0.024, optim_step_time=0.021, optim0_lr0=1.819e-04, train_time=0.105 -[v016] 2022-01-31 05:29:47,795 (trainer:653) INFO: 56epoch:train:136-162batch: iter_time=1.219e-04, forward_time=0.034, loss=4.594, loss_att=2.352, loss_ctc=6.836, acc=0.911, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.819e-04, train_time=0.095 -[v016] 2022-01-31 05:29:50,511 (trainer:653) INFO: 56epoch:train:163-189batch: iter_time=0.004, forward_time=0.034, loss=4.309, loss_att=2.227, loss_ctc=6.391, acc=0.915, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.818e-04, train_time=0.100 -[v016] 2022-01-31 05:29:53,228 (trainer:653) INFO: 56epoch:train:190-216batch: iter_time=3.457e-04, forward_time=0.035, loss=4.662, loss_att=2.339, loss_ctc=6.984, acc=0.912, backward_time=0.022, optim_step_time=0.024, optim0_lr0=1.817e-04, train_time=0.100 -[v016] 2022-01-31 05:29:55,891 (trainer:653) INFO: 56epoch:train:217-243batch: iter_time=1.115e-04, forward_time=0.035, loss=4.568, loss_att=2.331, loss_ctc=6.804, acc=0.919, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.816e-04, train_time=0.098 -[v016] 2022-01-31 05:29:58,533 (trainer:653) INFO: 56epoch:train:244-270batch: iter_time=1.027e-04, forward_time=0.035, loss=4.286, loss_att=2.270, loss_ctc=6.303, acc=0.915, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.815e-04, train_time=0.098 -[v016] 2022-01-31 05:30:01,145 (trainer:653) INFO: 56epoch:train:271-297batch: iter_time=9.682e-05, forward_time=0.034, loss=4.498, loss_att=2.301, loss_ctc=6.695, acc=0.907, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.815e-04, train_time=0.097 -[v016] 2022-01-31 05:30:03,690 (trainer:653) INFO: 56epoch:train:298-324batch: iter_time=1.074e-04, forward_time=0.034, loss=3.758, loss_att=2.063, loss_ctc=5.452, acc=0.917, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.814e-04, train_time=0.094 -[v016] 2022-01-31 05:30:06,272 (trainer:653) INFO: 56epoch:train:325-351batch: iter_time=9.984e-05, forward_time=0.034, loss=4.319, loss_att=2.177, loss_ctc=6.461, acc=0.916, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.813e-04, train_time=0.095 -[v016] 2022-01-31 05:30:08,889 (trainer:653) INFO: 56epoch:train:352-378batch: iter_time=1.012e-04, forward_time=0.034, loss=4.569, loss_att=2.368, loss_ctc=6.770, acc=0.904, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.812e-04, train_time=0.097 -[v016] 2022-01-31 05:30:11,846 (trainer:653) INFO: 56epoch:train:379-405batch: iter_time=4.462e-04, forward_time=0.038, loss=4.714, loss_att=2.413, loss_ctc=7.015, acc=0.917, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.811e-04, train_time=0.109 -[v016] 2022-01-31 05:30:14,781 (trainer:653) INFO: 56epoch:train:406-432batch: iter_time=4.242e-04, forward_time=0.035, loss=3.162, loss_att=1.784, loss_ctc=4.540, acc=0.925, backward_time=0.024, optim_step_time=0.027, optim0_lr0=1.811e-04, train_time=0.108 -[v016] 2022-01-31 05:30:17,496 (trainer:653) INFO: 56epoch:train:433-459batch: iter_time=1.398e-04, forward_time=0.035, loss=4.002, loss_att=2.012, loss_ctc=5.991, acc=0.918, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.810e-04, train_time=0.100 -[v016] 2022-01-31 05:30:20,268 (trainer:653) INFO: 56epoch:train:460-486batch: iter_time=0.007, forward_time=0.033, loss=3.420, loss_att=1.894, loss_ctc=4.946, acc=0.924, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.809e-04, train_time=0.102 -[v016] 2022-01-31 05:30:22,961 (trainer:653) INFO: 56epoch:train:487-513batch: iter_time=1.307e-04, forward_time=0.035, loss=4.103, loss_att=2.109, loss_ctc=6.096, acc=0.925, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.808e-04, train_time=0.100 -[v016] 2022-01-31 05:30:25,743 (trainer:653) INFO: 56epoch:train:514-540batch: iter_time=1.348e-04, forward_time=0.036, loss=4.726, loss_att=2.435, loss_ctc=7.016, acc=0.917, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.807e-04, train_time=0.103 -[v016] 2022-01-31 05:31:08,584 (trainer:328) INFO: 56epoch results: [train] iter_time=8.865e-04, forward_time=0.035, loss=4.217, loss_att=2.189, loss_ctc=6.245, acc=0.916, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.815e-04, train_time=0.100, time=54.84 seconds, total_count=30632, gpu_max_cached_mem_GB=5.824, [valid] loss=6.791, loss_att=5.214, loss_ctc=8.369, acc=0.889, cer=0.117, wer=0.447, cer_ctc=0.187, time=8.65 seconds, total_count=9968, gpu_max_cached_mem_GB=5.824, [att_plot] time=33.43 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 05:31:11,057 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 05:31:11,062 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/50epoch.pth, exp/asr_train_asr_raw_en_word/51epoch.pth -[v016] 2022-01-31 05:31:11,066 (trainer:261) INFO: 57/200epoch started. Estimated time to finish: 5 hours, 31 minutes and 53.05 seconds -[v016] 2022-01-31 05:31:22,853 (trainer:653) INFO: 57epoch:train:1-27batch: iter_time=0.296, forward_time=0.062, loss=4.359, loss_att=2.242, loss_ctc=6.476, acc=0.915, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.806e-04, train_time=0.436 -[v016] 2022-01-31 05:31:31,663 (trainer:653) INFO: 57epoch:train:28-54batch: iter_time=0.181, forward_time=0.064, loss=4.176, loss_att=2.110, loss_ctc=6.243, acc=0.921, backward_time=0.025, optim_step_time=0.025, optim0_lr0=1.806e-04, train_time=0.326 -[v016] 2022-01-31 05:31:41,413 (trainer:653) INFO: 57epoch:train:55-81batch: iter_time=0.187, forward_time=0.083, loss=4.064, loss_att=2.046, loss_ctc=6.083, acc=0.928, backward_time=0.032, optim_step_time=0.024, optim0_lr0=1.805e-04, train_time=0.354 -[v016] 2022-01-31 05:31:48,325 (trainer:653) INFO: 57epoch:train:82-108batch: iter_time=0.153, forward_time=0.035, loss=4.368, loss_att=2.197, loss_ctc=6.540, acc=0.916, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.804e-04, train_time=0.257 -[v016] 2022-01-31 05:31:55,318 (trainer:653) INFO: 57epoch:train:109-135batch: iter_time=0.161, forward_time=0.035, loss=3.974, loss_att=2.202, loss_ctc=5.746, acc=0.902, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.803e-04, train_time=0.259 -[v016] 2022-01-31 05:32:02,636 (trainer:653) INFO: 57epoch:train:136-162batch: iter_time=0.169, forward_time=0.033, loss=4.974, loss_att=2.476, loss_ctc=7.471, acc=0.905, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.802e-04, train_time=0.271 -[v016] 2022-01-31 05:32:07,991 (trainer:653) INFO: 57epoch:train:163-189batch: iter_time=0.095, forward_time=0.033, loss=3.768, loss_att=2.044, loss_ctc=5.492, acc=0.919, backward_time=0.024, optim_step_time=0.022, optim0_lr0=1.802e-04, train_time=0.198 -[v016] 2022-01-31 05:32:14,766 (trainer:653) INFO: 57epoch:train:190-216batch: iter_time=0.148, forward_time=0.033, loss=4.008, loss_att=2.196, loss_ctc=5.820, acc=0.910, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.801e-04, train_time=0.251 -[v016] 2022-01-31 05:32:21,085 (trainer:653) INFO: 57epoch:train:217-243batch: iter_time=0.134, forward_time=0.037, loss=4.161, loss_att=2.073, loss_ctc=6.249, acc=0.916, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.800e-04, train_time=0.234 -[v016] 2022-01-31 05:32:28,137 (trainer:653) INFO: 57epoch:train:244-270batch: iter_time=0.155, forward_time=0.035, loss=2.917, loss_att=1.628, loss_ctc=4.207, acc=0.927, backward_time=0.023, optim_step_time=0.025, optim0_lr0=1.799e-04, train_time=0.261 -[v016] 2022-01-31 05:32:35,136 (trainer:653) INFO: 57epoch:train:271-297batch: iter_time=0.150, forward_time=0.038, loss=4.454, loss_att=2.276, loss_ctc=6.632, acc=0.921, backward_time=0.023, optim_step_time=0.025, optim0_lr0=1.798e-04, train_time=0.259 -[v016] 2022-01-31 05:32:40,085 (trainer:653) INFO: 57epoch:train:298-324batch: iter_time=0.082, forward_time=0.037, loss=3.899, loss_att=2.004, loss_ctc=5.795, acc=0.916, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.798e-04, train_time=0.183 -[v016] 2022-01-31 05:32:45,664 (trainer:653) INFO: 57epoch:train:325-351batch: iter_time=0.107, forward_time=0.033, loss=3.366, loss_att=1.809, loss_ctc=4.924, acc=0.917, backward_time=0.023, optim_step_time=0.025, optim0_lr0=1.797e-04, train_time=0.206 -[v016] 2022-01-31 05:32:52,585 (trainer:653) INFO: 57epoch:train:352-378batch: iter_time=0.151, forward_time=0.033, loss=4.482, loss_att=2.265, loss_ctc=6.699, acc=0.913, backward_time=0.023, optim_step_time=0.026, optim0_lr0=1.796e-04, train_time=0.256 -[v016] 2022-01-31 05:33:00,179 (trainer:653) INFO: 57epoch:train:379-405batch: iter_time=0.180, forward_time=0.035, loss=4.954, loss_att=2.537, loss_ctc=7.371, acc=0.922, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.795e-04, train_time=0.281 -[v016] 2022-01-31 05:33:07,383 (trainer:653) INFO: 57epoch:train:406-432batch: iter_time=0.104, forward_time=0.049, loss=3.906, loss_att=2.033, loss_ctc=5.779, acc=0.920, backward_time=0.064, optim_step_time=0.024, optim0_lr0=1.795e-04, train_time=0.267 -[v016] 2022-01-31 05:33:14,375 (trainer:653) INFO: 57epoch:train:433-459batch: iter_time=0.156, forward_time=0.034, loss=3.548, loss_att=2.001, loss_ctc=5.096, acc=0.918, backward_time=0.023, optim_step_time=0.025, optim0_lr0=1.794e-04, train_time=0.259 -[v016] 2022-01-31 05:33:22,038 (trainer:653) INFO: 57epoch:train:460-486batch: iter_time=0.178, forward_time=0.041, loss=3.856, loss_att=2.072, loss_ctc=5.639, acc=0.915, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.793e-04, train_time=0.284 -[v016] 2022-01-31 05:33:29,197 (trainer:653) INFO: 57epoch:train:487-513batch: iter_time=0.160, forward_time=0.037, loss=4.604, loss_att=2.311, loss_ctc=6.896, acc=0.921, backward_time=0.022, optim_step_time=0.024, optim0_lr0=1.792e-04, train_time=0.265 -[v016] 2022-01-31 05:33:35,561 (trainer:653) INFO: 57epoch:train:514-540batch: iter_time=0.132, forward_time=0.033, loss=4.100, loss_att=2.241, loss_ctc=5.958, acc=0.915, backward_time=0.023, optim_step_time=0.025, optim0_lr0=1.791e-04, train_time=0.232 -[v016] 2022-01-31 05:34:40,737 (trainer:328) INFO: 57epoch results: [train] iter_time=0.154, forward_time=0.041, loss=4.127, loss_att=2.149, loss_ctc=6.104, acc=0.917, backward_time=0.026, optim_step_time=0.023, optim0_lr0=1.799e-04, train_time=0.267, time=2 minutes and 26.61 seconds, total_count=31179, gpu_max_cached_mem_GB=5.824, [valid] loss=6.588, loss_att=5.169, loss_ctc=8.007, acc=0.891, cer=0.115, wer=0.446, cer_ctc=0.180, time=31.04 seconds, total_count=10146, gpu_max_cached_mem_GB=5.824, [att_plot] time=31.93 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 05:34:43,468 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc -[v016] 2022-01-31 05:34:43,476 (trainer:261) INFO: 58/200epoch started. Estimated time to finish: 5 hours, 34 minutes and 21.26 seconds -[v016] 2022-01-31 05:34:46,741 (trainer:653) INFO: 58epoch:train:1-27batch: iter_time=0.004, forward_time=0.037, loss=4.531, loss_att=2.206, loss_ctc=6.855, acc=0.918, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.790e-04, train_time=0.109 -[v016] 2022-01-31 05:34:49,552 (trainer:653) INFO: 58epoch:train:28-54batch: iter_time=1.394e-04, forward_time=0.038, loss=3.288, loss_att=1.760, loss_ctc=4.816, acc=0.928, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.790e-04, train_time=0.104 -[v016] 2022-01-31 05:34:52,341 (trainer:653) INFO: 58epoch:train:55-81batch: iter_time=2.183e-04, forward_time=0.035, loss=3.959, loss_att=2.081, loss_ctc=5.836, acc=0.914, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.789e-04, train_time=0.103 -[v016] 2022-01-31 05:34:55,280 (trainer:653) INFO: 58epoch:train:82-108batch: iter_time=1.820e-04, forward_time=0.040, loss=4.046, loss_att=2.078, loss_ctc=6.013, acc=0.924, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.788e-04, train_time=0.109 -[v016] 2022-01-31 05:34:58,090 (trainer:653) INFO: 58epoch:train:109-135batch: iter_time=2.085e-04, forward_time=0.035, loss=4.356, loss_att=2.277, loss_ctc=6.434, acc=0.916, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.787e-04, train_time=0.104 -[v016] 2022-01-31 05:35:00,669 (trainer:653) INFO: 58epoch:train:136-162batch: iter_time=1.315e-04, forward_time=0.034, loss=3.832, loss_att=2.031, loss_ctc=5.633, acc=0.911, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.787e-04, train_time=0.095 -[v016] 2022-01-31 05:35:03,561 (trainer:653) INFO: 58epoch:train:163-189batch: iter_time=0.008, forward_time=0.037, loss=3.989, loss_att=2.060, loss_ctc=5.918, acc=0.917, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.786e-04, train_time=0.107 -[v016] 2022-01-31 05:35:06,291 (trainer:653) INFO: 58epoch:train:190-216batch: iter_time=3.572e-04, forward_time=0.038, loss=3.875, loss_att=1.957, loss_ctc=5.794, acc=0.919, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.785e-04, train_time=0.101 -[v016] 2022-01-31 05:35:09,034 (trainer:653) INFO: 58epoch:train:217-243batch: iter_time=3.661e-04, forward_time=0.034, loss=3.688, loss_att=1.910, loss_ctc=5.466, acc=0.923, backward_time=0.023, optim_step_time=0.025, optim0_lr0=1.784e-04, train_time=0.101 -[v016] 2022-01-31 05:35:11,615 (trainer:653) INFO: 58epoch:train:244-270batch: iter_time=1.312e-04, forward_time=0.033, loss=3.651, loss_att=1.930, loss_ctc=5.373, acc=0.921, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.784e-04, train_time=0.095 -[v016] 2022-01-31 05:35:14,393 (trainer:653) INFO: 58epoch:train:271-297batch: iter_time=1.756e-04, forward_time=0.039, loss=3.819, loss_att=1.893, loss_ctc=5.745, acc=0.923, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.783e-04, train_time=0.103 -[v016] 2022-01-31 05:35:17,055 (trainer:653) INFO: 58epoch:train:298-324batch: iter_time=2.421e-04, forward_time=0.034, loss=3.786, loss_att=2.067, loss_ctc=5.505, acc=0.911, backward_time=0.022, optim_step_time=0.024, optim0_lr0=1.782e-04, train_time=0.098 -[v016] 2022-01-31 05:35:19,866 (trainer:653) INFO: 58epoch:train:325-351batch: iter_time=1.501e-04, forward_time=0.035, loss=4.710, loss_att=2.357, loss_ctc=7.063, acc=0.915, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.781e-04, train_time=0.104 -[v016] 2022-01-31 05:35:22,844 (trainer:653) INFO: 58epoch:train:352-378batch: iter_time=0.009, forward_time=0.034, loss=3.926, loss_att=2.115, loss_ctc=5.738, acc=0.922, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.780e-04, train_time=0.110 -[v016] 2022-01-31 05:35:25,654 (trainer:653) INFO: 58epoch:train:379-405batch: iter_time=2.148e-04, forward_time=0.035, loss=5.021, loss_att=2.478, loss_ctc=7.563, acc=0.918, backward_time=0.022, optim_step_time=0.025, optim0_lr0=1.780e-04, train_time=0.104 -[v016] 2022-01-31 05:35:28,407 (trainer:653) INFO: 58epoch:train:406-432batch: iter_time=2.217e-04, forward_time=0.034, loss=4.536, loss_att=2.295, loss_ctc=6.778, acc=0.910, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.779e-04, train_time=0.102 -[v016] 2022-01-31 05:35:31,151 (trainer:653) INFO: 58epoch:train:433-459batch: iter_time=1.963e-04, forward_time=0.034, loss=4.243, loss_att=2.123, loss_ctc=6.363, acc=0.916, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.778e-04, train_time=0.101 -[v016] 2022-01-31 05:35:33,854 (trainer:653) INFO: 58epoch:train:460-486batch: iter_time=2.003e-04, forward_time=0.033, loss=3.696, loss_att=1.915, loss_ctc=5.476, acc=0.931, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.777e-04, train_time=0.100 -[v016] 2022-01-31 05:35:36,615 (trainer:653) INFO: 58epoch:train:487-513batch: iter_time=2.231e-04, forward_time=0.035, loss=3.737, loss_att=2.015, loss_ctc=5.459, acc=0.918, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.777e-04, train_time=0.102 -[v016] 2022-01-31 05:35:39,436 (trainer:653) INFO: 58epoch:train:514-540batch: iter_time=1.709e-04, forward_time=0.035, loss=4.067, loss_att=2.046, loss_ctc=6.088, acc=0.924, backward_time=0.022, optim_step_time=0.025, optim0_lr0=1.776e-04, train_time=0.104 -[v016] 2022-01-31 05:36:16,337 (trainer:328) INFO: 58epoch results: [train] iter_time=0.001, forward_time=0.036, loss=4.068, loss_att=2.095, loss_ctc=6.042, acc=0.919, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.783e-04, train_time=0.103, time=56.74 seconds, total_count=31726, gpu_max_cached_mem_GB=5.824, [valid] loss=6.572, loss_att=5.131, loss_ctc=8.014, acc=0.896, cer=0.112, wer=0.431, cer_ctc=0.173, time=6.11 seconds, total_count=10324, gpu_max_cached_mem_GB=5.824, [att_plot] time=29.96 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 05:36:18,349 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc, valid.acc -[v016] 2022-01-31 05:36:18,354 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/52epoch.pth, exp/asr_train_asr_raw_en_word/53epoch.pth -[v016] 2022-01-31 05:36:18,357 (trainer:261) INFO: 59/200epoch started. Estimated time to finish: 5 hours, 29 minutes and 11.28 seconds -[v016] 2022-01-31 05:36:21,114 (trainer:653) INFO: 59epoch:train:1-27batch: iter_time=0.005, forward_time=0.034, loss=3.614, loss_att=1.898, loss_ctc=5.329, acc=0.918, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.775e-04, train_time=0.102 -[v016] 2022-01-31 05:36:23,748 (trainer:653) INFO: 59epoch:train:28-54batch: iter_time=1.022e-04, forward_time=0.034, loss=4.094, loss_att=2.021, loss_ctc=6.166, acc=0.928, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.774e-04, train_time=0.097 -[v016] 2022-01-31 05:36:26,463 (trainer:653) INFO: 59epoch:train:55-81batch: iter_time=3.657e-04, forward_time=0.035, loss=3.500, loss_att=1.805, loss_ctc=5.196, acc=0.930, backward_time=0.022, optim_step_time=0.024, optim0_lr0=1.773e-04, train_time=0.100 -[v016] 2022-01-31 05:36:29,097 (trainer:653) INFO: 59epoch:train:82-108batch: iter_time=1.216e-04, forward_time=0.034, loss=4.035, loss_att=2.066, loss_ctc=6.003, acc=0.920, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.773e-04, train_time=0.097 -[v016] 2022-01-31 05:36:32,114 (trainer:653) INFO: 59epoch:train:109-135batch: iter_time=4.051e-04, forward_time=0.037, loss=4.550, loss_att=2.174, loss_ctc=6.926, acc=0.927, backward_time=0.023, optim_step_time=0.026, optim0_lr0=1.772e-04, train_time=0.111 -[v016] 2022-01-31 05:36:34,878 (trainer:653) INFO: 59epoch:train:136-162batch: iter_time=0.007, forward_time=0.033, loss=3.859, loss_att=2.075, loss_ctc=5.643, acc=0.909, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.771e-04, train_time=0.102 -[v016] 2022-01-31 05:36:37,692 (trainer:653) INFO: 59epoch:train:163-189batch: iter_time=0.005, forward_time=0.037, loss=4.067, loss_att=2.079, loss_ctc=6.056, acc=0.919, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.770e-04, train_time=0.104 -[v016] 2022-01-31 05:36:40,371 (trainer:653) INFO: 59epoch:train:190-216batch: iter_time=2.151e-04, forward_time=0.034, loss=3.374, loss_att=1.771, loss_ctc=4.976, acc=0.927, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.770e-04, train_time=0.099 -[v016] 2022-01-31 05:36:43,172 (trainer:653) INFO: 59epoch:train:217-243batch: iter_time=2.050e-04, forward_time=0.039, loss=4.172, loss_att=2.078, loss_ctc=6.265, acc=0.920, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.769e-04, train_time=0.103 -[v016] 2022-01-31 05:36:45,927 (trainer:653) INFO: 59epoch:train:244-270batch: iter_time=1.884e-04, forward_time=0.034, loss=3.747, loss_att=1.976, loss_ctc=5.519, acc=0.927, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.768e-04, train_time=0.102 -[v016] 2022-01-31 05:36:48,535 (trainer:653) INFO: 59epoch:train:271-297batch: iter_time=1.273e-04, forward_time=0.034, loss=4.395, loss_att=2.225, loss_ctc=6.565, acc=0.915, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.767e-04, train_time=0.096 -[v016] 2022-01-31 05:36:51,342 (trainer:653) INFO: 59epoch:train:298-324batch: iter_time=1.782e-04, forward_time=0.035, loss=4.367, loss_att=2.218, loss_ctc=6.517, acc=0.915, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.767e-04, train_time=0.104 -[v016] 2022-01-31 05:36:54,085 (trainer:653) INFO: 59epoch:train:325-351batch: iter_time=1.229e-04, forward_time=0.039, loss=4.057, loss_att=2.054, loss_ctc=6.060, acc=0.920, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.766e-04, train_time=0.101 -[v016] 2022-01-31 05:36:56,851 (trainer:653) INFO: 59epoch:train:352-378batch: iter_time=2.296e-04, forward_time=0.035, loss=3.776, loss_att=1.934, loss_ctc=5.617, acc=0.927, backward_time=0.022, optim_step_time=0.025, optim0_lr0=1.765e-04, train_time=0.102 -[v016] 2022-01-31 05:36:59,577 (trainer:653) INFO: 59epoch:train:379-405batch: iter_time=2.982e-04, forward_time=0.038, loss=3.571, loss_att=1.900, loss_ctc=5.243, acc=0.927, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.764e-04, train_time=0.101 -[v016] 2022-01-31 05:37:02,119 (trainer:653) INFO: 59epoch:train:406-432batch: iter_time=1.356e-04, forward_time=0.033, loss=3.615, loss_att=2.027, loss_ctc=5.203, acc=0.917, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.764e-04, train_time=0.094 -[v016] 2022-01-31 05:37:04,817 (trainer:653) INFO: 59epoch:train:433-459batch: iter_time=9.985e-05, forward_time=0.037, loss=3.824, loss_att=1.945, loss_ctc=5.703, acc=0.921, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.763e-04, train_time=0.100 -[v016] 2022-01-31 05:37:07,809 (trainer:653) INFO: 59epoch:train:460-486batch: iter_time=0.009, forward_time=0.038, loss=3.900, loss_att=2.067, loss_ctc=5.732, acc=0.916, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.762e-04, train_time=0.111 -[v016] 2022-01-31 05:37:10,521 (trainer:653) INFO: 59epoch:train:487-513batch: iter_time=1.225e-04, forward_time=0.038, loss=4.209, loss_att=2.219, loss_ctc=6.199, acc=0.909, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.762e-04, train_time=0.100 -[v016] 2022-01-31 05:37:13,492 (trainer:653) INFO: 59epoch:train:514-540batch: iter_time=1.336e-04, forward_time=0.040, loss=4.601, loss_att=2.351, loss_ctc=6.850, acc=0.923, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.761e-04, train_time=0.110 -[v016] 2022-01-31 05:37:49,097 (trainer:328) INFO: 59epoch results: [train] iter_time=0.001, forward_time=0.036, loss=3.966, loss_att=2.045, loss_ctc=5.887, acc=0.921, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.768e-04, train_time=0.102, time=55.88 seconds, total_count=32273, gpu_max_cached_mem_GB=5.824, [valid] loss=6.650, loss_att=5.191, loss_ctc=8.109, acc=0.894, cer=0.114, wer=0.434, cer_ctc=0.180, time=5.88 seconds, total_count=10502, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.97 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 05:37:51,137 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 05:37:51,145 (trainer:261) INFO: 60/200epoch started. Estimated time to finish: 5 hours, 24 minutes and 4.78 seconds -[v016] 2022-01-31 05:37:53,964 (trainer:653) INFO: 60epoch:train:1-27batch: iter_time=0.004, forward_time=0.035, loss=3.945, loss_att=1.960, loss_ctc=5.931, acc=0.929, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.760e-04, train_time=0.104 -[v016] 2022-01-31 05:37:56,528 (trainer:653) INFO: 60epoch:train:28-54batch: iter_time=1.062e-04, forward_time=0.034, loss=3.443, loss_att=1.828, loss_ctc=5.057, acc=0.922, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.759e-04, train_time=0.095 -[v016] 2022-01-31 05:37:59,063 (trainer:653) INFO: 60epoch:train:55-81batch: iter_time=9.576e-05, forward_time=0.034, loss=3.698, loss_att=1.992, loss_ctc=5.405, acc=0.914, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.758e-04, train_time=0.094 -[v016] 2022-01-31 05:38:01,630 (trainer:653) INFO: 60epoch:train:82-108batch: iter_time=9.157e-05, forward_time=0.034, loss=3.667, loss_att=1.876, loss_ctc=5.459, acc=0.927, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.758e-04, train_time=0.095 -[v016] 2022-01-31 05:38:04,290 (trainer:653) INFO: 60epoch:train:109-135batch: iter_time=9.449e-05, forward_time=0.035, loss=4.128, loss_att=1.993, loss_ctc=6.264, acc=0.926, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.757e-04, train_time=0.098 -[v016] 2022-01-31 05:38:06,834 (trainer:653) INFO: 60epoch:train:136-162batch: iter_time=9.524e-05, forward_time=0.033, loss=3.005, loss_att=1.715, loss_ctc=4.296, acc=0.929, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.756e-04, train_time=0.094 -[v016] 2022-01-31 05:38:09,725 (trainer:653) INFO: 60epoch:train:163-189batch: iter_time=0.010, forward_time=0.034, loss=3.981, loss_att=2.100, loss_ctc=5.863, acc=0.919, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.755e-04, train_time=0.107 -[v016] 2022-01-31 05:38:12,327 (trainer:653) INFO: 60epoch:train:190-216batch: iter_time=9.337e-05, forward_time=0.034, loss=3.357, loss_att=1.790, loss_ctc=4.925, acc=0.932, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.755e-04, train_time=0.096 -[v016] 2022-01-31 05:38:15,013 (trainer:653) INFO: 60epoch:train:217-243batch: iter_time=9.308e-05, forward_time=0.035, loss=4.094, loss_att=2.149, loss_ctc=6.039, acc=0.922, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.754e-04, train_time=0.099 -[v016] 2022-01-31 05:38:17,587 (trainer:653) INFO: 60epoch:train:244-270batch: iter_time=9.197e-05, forward_time=0.034, loss=3.906, loss_att=1.921, loss_ctc=5.891, acc=0.927, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.753e-04, train_time=0.095 -[v016] 2022-01-31 05:38:20,132 (trainer:653) INFO: 60epoch:train:271-297batch: iter_time=9.163e-05, forward_time=0.033, loss=3.939, loss_att=2.010, loss_ctc=5.868, acc=0.920, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.753e-04, train_time=0.094 -[v016] 2022-01-31 05:38:22,778 (trainer:653) INFO: 60epoch:train:298-324batch: iter_time=9.534e-05, forward_time=0.034, loss=4.437, loss_att=2.138, loss_ctc=6.736, acc=0.922, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.752e-04, train_time=0.098 -[v016] 2022-01-31 05:38:25,357 (trainer:653) INFO: 60epoch:train:325-351batch: iter_time=9.170e-05, forward_time=0.034, loss=4.041, loss_att=2.052, loss_ctc=6.030, acc=0.921, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.751e-04, train_time=0.095 -[v016] 2022-01-31 05:38:27,891 (trainer:653) INFO: 60epoch:train:352-378batch: iter_time=9.096e-05, forward_time=0.033, loss=3.541, loss_att=1.841, loss_ctc=5.241, acc=0.925, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.750e-04, train_time=0.094 -[v016] 2022-01-31 05:38:30,388 (trainer:653) INFO: 60epoch:train:379-405batch: iter_time=9.340e-05, forward_time=0.033, loss=3.546, loss_att=1.901, loss_ctc=5.190, acc=0.922, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.750e-04, train_time=0.092 -[v016] 2022-01-31 05:38:32,969 (trainer:653) INFO: 60epoch:train:406-432batch: iter_time=9.207e-05, forward_time=0.034, loss=4.323, loss_att=2.218, loss_ctc=6.427, acc=0.917, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.749e-04, train_time=0.095 -[v016] 2022-01-31 05:38:35,546 (trainer:653) INFO: 60epoch:train:433-459batch: iter_time=9.424e-05, forward_time=0.034, loss=3.699, loss_att=1.951, loss_ctc=5.446, acc=0.928, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.748e-04, train_time=0.095 -[v016] 2022-01-31 05:38:38,163 (trainer:653) INFO: 60epoch:train:460-486batch: iter_time=9.789e-05, forward_time=0.034, loss=4.568, loss_att=2.229, loss_ctc=6.908, acc=0.923, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.747e-04, train_time=0.097 -[v016] 2022-01-31 05:38:40,711 (trainer:653) INFO: 60epoch:train:487-513batch: iter_time=4.080e-04, forward_time=0.033, loss=4.120, loss_att=2.014, loss_ctc=6.226, acc=0.920, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.747e-04, train_time=0.094 -[v016] 2022-01-31 05:38:43,337 (trainer:653) INFO: 60epoch:train:514-540batch: iter_time=9.374e-05, forward_time=0.034, loss=4.239, loss_att=2.184, loss_ctc=6.294, acc=0.915, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.746e-04, train_time=0.097 -[v016] 2022-01-31 05:39:19,574 (trainer:328) INFO: 60epoch results: [train] iter_time=8.030e-04, forward_time=0.034, loss=3.894, loss_att=1.997, loss_ctc=5.792, acc=0.923, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.753e-04, train_time=0.096, time=52.93 seconds, total_count=32820, gpu_max_cached_mem_GB=5.824, [valid] loss=6.641, loss_att=5.214, loss_ctc=8.069, acc=0.893, cer=0.113, wer=0.437, cer_ctc=0.175, time=5.86 seconds, total_count=10680, gpu_max_cached_mem_GB=5.824, [att_plot] time=29.63 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 05:39:21,958 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 05:39:21,966 (trainer:261) INFO: 61/200epoch started. Estimated time to finish: 5 hours, 19 minutes and 2.07 seconds -[v016] 2022-01-31 05:39:24,700 (trainer:653) INFO: 61epoch:train:1-27batch: iter_time=0.004, forward_time=0.034, loss=2.939, loss_att=1.545, loss_ctc=4.332, acc=0.934, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.745e-04, train_time=0.101 -[v016] 2022-01-31 05:39:27,385 (trainer:653) INFO: 61epoch:train:28-54batch: iter_time=1.132e-04, forward_time=0.037, loss=3.232, loss_att=1.633, loss_ctc=4.830, acc=0.931, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.744e-04, train_time=0.099 -[v016] 2022-01-31 05:39:29,978 (trainer:653) INFO: 61epoch:train:55-81batch: iter_time=1.310e-04, forward_time=0.034, loss=3.547, loss_att=1.832, loss_ctc=5.261, acc=0.927, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.744e-04, train_time=0.096 -[v016] 2022-01-31 05:39:32,713 (trainer:653) INFO: 61epoch:train:82-108batch: iter_time=1.310e-04, forward_time=0.034, loss=3.699, loss_att=1.892, loss_ctc=5.505, acc=0.918, backward_time=0.022, optim_step_time=0.027, optim0_lr0=1.743e-04, train_time=0.101 -[v016] 2022-01-31 05:39:35,279 (trainer:653) INFO: 61epoch:train:109-135batch: iter_time=1.104e-04, forward_time=0.033, loss=3.407, loss_att=1.753, loss_ctc=5.061, acc=0.928, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.742e-04, train_time=0.095 -[v016] 2022-01-31 05:39:37,921 (trainer:653) INFO: 61epoch:train:136-162batch: iter_time=2.704e-04, forward_time=0.034, loss=3.637, loss_att=1.823, loss_ctc=5.451, acc=0.927, backward_time=0.022, optim_step_time=0.023, optim0_lr0=1.742e-04, train_time=0.098 -[v016] 2022-01-31 05:39:40,504 (trainer:653) INFO: 61epoch:train:163-189batch: iter_time=1.231e-04, forward_time=0.034, loss=3.542, loss_att=1.933, loss_ctc=5.151, acc=0.918, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.741e-04, train_time=0.095 -[v016] 2022-01-31 05:39:43,529 (trainer:653) INFO: 61epoch:train:190-216batch: iter_time=0.012, forward_time=0.037, loss=3.917, loss_att=1.935, loss_ctc=5.900, acc=0.925, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.740e-04, train_time=0.112 -[v016] 2022-01-31 05:39:46,172 (trainer:653) INFO: 61epoch:train:217-243batch: iter_time=1.216e-04, forward_time=0.034, loss=4.032, loss_att=1.964, loss_ctc=6.099, acc=0.927, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.739e-04, train_time=0.098 -[v016] 2022-01-31 05:39:48,968 (trainer:653) INFO: 61epoch:train:244-270batch: iter_time=2.004e-04, forward_time=0.035, loss=4.126, loss_att=2.098, loss_ctc=6.154, acc=0.914, backward_time=0.022, optim_step_time=0.026, optim0_lr0=1.739e-04, train_time=0.103 -[v016] 2022-01-31 05:39:51,636 (trainer:653) INFO: 61epoch:train:271-297batch: iter_time=1.251e-04, forward_time=0.035, loss=4.233, loss_att=2.120, loss_ctc=6.346, acc=0.918, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.738e-04, train_time=0.099 -[v016] 2022-01-31 05:39:54,350 (trainer:653) INFO: 61epoch:train:298-324batch: iter_time=1.845e-04, forward_time=0.034, loss=3.663, loss_att=1.943, loss_ctc=5.383, acc=0.919, backward_time=0.022, optim_step_time=0.025, optim0_lr0=1.737e-04, train_time=0.100 -[v016] 2022-01-31 05:39:57,066 (trainer:653) INFO: 61epoch:train:325-351batch: iter_time=5.693e-04, forward_time=0.034, loss=3.793, loss_att=1.886, loss_ctc=5.701, acc=0.931, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.737e-04, train_time=0.097 -[v016] 2022-01-31 05:39:59,630 (trainer:653) INFO: 61epoch:train:352-378batch: iter_time=1.230e-04, forward_time=0.033, loss=3.702, loss_att=1.955, loss_ctc=5.449, acc=0.925, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.736e-04, train_time=0.095 -[v016] 2022-01-31 05:40:02,232 (trainer:653) INFO: 61epoch:train:379-405batch: iter_time=9.297e-05, forward_time=0.034, loss=3.796, loss_att=1.983, loss_ctc=5.609, acc=0.923, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.735e-04, train_time=0.096 -[v016] 2022-01-31 05:40:04,975 (trainer:653) INFO: 61epoch:train:406-432batch: iter_time=2.091e-04, forward_time=0.035, loss=4.044, loss_att=2.181, loss_ctc=5.906, acc=0.914, backward_time=0.022, optim_step_time=0.024, optim0_lr0=1.734e-04, train_time=0.101 -[v016] 2022-01-31 05:40:07,604 (trainer:653) INFO: 61epoch:train:433-459batch: iter_time=1.260e-04, forward_time=0.035, loss=4.090, loss_att=1.986, loss_ctc=6.194, acc=0.932, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.734e-04, train_time=0.097 -[v016] 2022-01-31 05:40:10,408 (trainer:653) INFO: 61epoch:train:460-486batch: iter_time=1.004e-04, forward_time=0.039, loss=4.303, loss_att=2.103, loss_ctc=6.504, acc=0.928, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.733e-04, train_time=0.104 -[v016] 2022-01-31 05:40:13,220 (trainer:653) INFO: 61epoch:train:487-513batch: iter_time=1.938e-04, forward_time=0.039, loss=4.339, loss_att=2.280, loss_ctc=6.397, acc=0.924, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.732e-04, train_time=0.104 -[v016] 2022-01-31 05:40:15,748 (trainer:653) INFO: 61epoch:train:514-540batch: iter_time=1.222e-04, forward_time=0.033, loss=3.280, loss_att=1.708, loss_ctc=4.851, acc=0.929, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.732e-04, train_time=0.093 -[v016] 2022-01-31 05:40:52,638 (trainer:328) INFO: 61epoch results: [train] iter_time=9.050e-04, forward_time=0.035, loss=3.784, loss_att=1.934, loss_ctc=5.633, acc=0.925, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.738e-04, train_time=0.099, time=54.57 seconds, total_count=33367, gpu_max_cached_mem_GB=5.824, [valid] loss=6.555, loss_att=5.134, loss_ctc=7.977, acc=0.897, cer=0.113, wer=0.423, cer_ctc=0.172, time=5.94 seconds, total_count=10858, gpu_max_cached_mem_GB=5.824, [att_plot] time=30.15 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 05:40:54,684 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc, valid.acc -[v016] 2022-01-31 05:40:54,689 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/56epoch.pth -[v016] 2022-01-31 05:40:54,692 (trainer:261) INFO: 62/200epoch started. Estimated time to finish: 5 hours, 14 minutes and 16.16 seconds -[v016] 2022-01-31 05:40:57,748 (trainer:653) INFO: 62epoch:train:1-27batch: iter_time=0.008, forward_time=0.036, loss=4.072, loss_att=2.018, loss_ctc=6.127, acc=0.923, backward_time=0.024, optim_step_time=0.021, optim0_lr0=1.731e-04, train_time=0.113 -[v016] 2022-01-31 05:41:00,405 (trainer:653) INFO: 62epoch:train:28-54batch: iter_time=1.380e-04, forward_time=0.035, loss=3.662, loss_att=1.765, loss_ctc=5.559, acc=0.931, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.730e-04, train_time=0.098 -[v016] 2022-01-31 05:41:02,962 (trainer:653) INFO: 62epoch:train:55-81batch: iter_time=1.065e-04, forward_time=0.034, loss=3.147, loss_att=1.605, loss_ctc=4.689, acc=0.935, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.729e-04, train_time=0.095 -[v016] 2022-01-31 05:41:05,674 (trainer:653) INFO: 62epoch:train:82-108batch: iter_time=1.345e-04, forward_time=0.035, loss=3.672, loss_att=1.850, loss_ctc=5.494, acc=0.929, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.729e-04, train_time=0.100 -[v016] 2022-01-31 05:41:08,301 (trainer:653) INFO: 62epoch:train:109-135batch: iter_time=1.158e-04, forward_time=0.035, loss=3.763, loss_att=1.828, loss_ctc=5.697, acc=0.931, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.728e-04, train_time=0.097 -[v016] 2022-01-31 05:41:11,025 (trainer:653) INFO: 62epoch:train:136-162batch: iter_time=1.699e-04, forward_time=0.035, loss=3.795, loss_att=1.858, loss_ctc=5.732, acc=0.933, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.727e-04, train_time=0.101 -[v016] 2022-01-31 05:41:13,754 (trainer:653) INFO: 62epoch:train:163-189batch: iter_time=1.478e-04, forward_time=0.035, loss=3.829, loss_att=1.967, loss_ctc=5.691, acc=0.928, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.727e-04, train_time=0.101 -[v016] 2022-01-31 05:41:16,297 (trainer:653) INFO: 62epoch:train:190-216batch: iter_time=1.039e-04, forward_time=0.033, loss=3.311, loss_att=1.662, loss_ctc=4.959, acc=0.934, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.726e-04, train_time=0.094 -[v016] 2022-01-31 05:41:19,063 (trainer:653) INFO: 62epoch:train:217-243batch: iter_time=1.707e-04, forward_time=0.035, loss=3.817, loss_att=1.880, loss_ctc=5.753, acc=0.922, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.725e-04, train_time=0.102 -[v016] 2022-01-31 05:41:21,666 (trainer:653) INFO: 62epoch:train:244-270batch: iter_time=1.228e-04, forward_time=0.034, loss=3.505, loss_att=1.810, loss_ctc=5.199, acc=0.934, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.725e-04, train_time=0.096 -[v016] 2022-01-31 05:41:24,395 (trainer:653) INFO: 62epoch:train:271-297batch: iter_time=1.398e-04, forward_time=0.035, loss=3.515, loss_att=1.772, loss_ctc=5.257, acc=0.928, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.724e-04, train_time=0.101 -[v016] 2022-01-31 05:41:27,064 (trainer:653) INFO: 62epoch:train:298-324batch: iter_time=1.250e-04, forward_time=0.035, loss=3.978, loss_att=1.927, loss_ctc=6.029, acc=0.931, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.723e-04, train_time=0.099 -[v016] 2022-01-31 05:41:29,720 (trainer:653) INFO: 62epoch:train:325-351batch: iter_time=3.055e-04, forward_time=0.034, loss=3.114, loss_att=1.737, loss_ctc=4.490, acc=0.928, backward_time=0.022, optim_step_time=0.024, optim0_lr0=1.722e-04, train_time=0.098 -[v016] 2022-01-31 05:41:32,369 (trainer:653) INFO: 62epoch:train:352-378batch: iter_time=1.079e-04, forward_time=0.035, loss=3.902, loss_att=1.940, loss_ctc=5.865, acc=0.923, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.722e-04, train_time=0.098 -[v016] 2022-01-31 05:41:35,013 (trainer:653) INFO: 62epoch:train:379-405batch: iter_time=9.228e-05, forward_time=0.035, loss=3.687, loss_att=1.945, loss_ctc=5.428, acc=0.920, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.721e-04, train_time=0.098 -[v016] 2022-01-31 05:41:37,612 (trainer:653) INFO: 62epoch:train:406-432batch: iter_time=1.291e-04, forward_time=0.033, loss=2.965, loss_att=1.610, loss_ctc=4.320, acc=0.927, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.720e-04, train_time=0.096 -[v016] 2022-01-31 05:41:40,133 (trainer:653) INFO: 62epoch:train:433-459batch: iter_time=1.159e-04, forward_time=0.033, loss=2.911, loss_att=1.533, loss_ctc=4.289, acc=0.932, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.720e-04, train_time=0.093 -[v016] 2022-01-31 05:41:43,066 (trainer:653) INFO: 62epoch:train:460-486batch: iter_time=2.424e-04, forward_time=0.038, loss=3.893, loss_att=1.978, loss_ctc=5.807, acc=0.924, backward_time=0.022, optim_step_time=0.024, optim0_lr0=1.719e-04, train_time=0.107 -[v016] 2022-01-31 05:41:45,724 (trainer:653) INFO: 62epoch:train:487-513batch: iter_time=1.246e-04, forward_time=0.035, loss=4.072, loss_att=1.939, loss_ctc=6.205, acc=0.923, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.718e-04, train_time=0.099 -[v016] 2022-01-31 05:41:48,610 (trainer:653) INFO: 62epoch:train:514-540batch: iter_time=0.010, forward_time=0.034, loss=3.674, loss_att=1.940, loss_ctc=5.407, acc=0.914, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.718e-04, train_time=0.107 -[v016] 2022-01-31 05:42:25,840 (trainer:328) INFO: 62epoch results: [train] iter_time=0.001, forward_time=0.035, loss=3.630, loss_att=1.833, loss_ctc=5.427, acc=0.928, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.724e-04, train_time=0.100, time=54.72 seconds, total_count=33914, gpu_max_cached_mem_GB=5.824, [valid] loss=6.631, loss_att=5.163, loss_ctc=8.100, acc=0.895, cer=0.111, wer=0.434, cer_ctc=0.173, time=6.51 seconds, total_count=11036, gpu_max_cached_mem_GB=5.824, [att_plot] time=29.9 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 05:42:28,154 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 05:42:28,163 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/54epoch.pth -[v016] 2022-01-31 05:42:28,169 (trainer:261) INFO: 63/200epoch started. Estimated time to finish: 5 hours, 9 minutes and 41.91 seconds -[v016] 2022-01-31 05:42:31,051 (trainer:653) INFO: 63epoch:train:1-27batch: iter_time=0.004, forward_time=0.035, loss=3.265, loss_att=1.633, loss_ctc=4.897, acc=0.934, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.717e-04, train_time=0.106 -[v016] 2022-01-31 05:42:33,882 (trainer:653) INFO: 63epoch:train:28-54batch: iter_time=1.603e-04, forward_time=0.039, loss=4.238, loss_att=2.017, loss_ctc=6.458, acc=0.925, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.716e-04, train_time=0.105 -[v016] 2022-01-31 05:42:36,583 (trainer:653) INFO: 63epoch:train:55-81batch: iter_time=1.726e-04, forward_time=0.035, loss=3.474, loss_att=1.674, loss_ctc=5.273, acc=0.933, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.715e-04, train_time=0.100 -[v016] 2022-01-31 05:42:39,217 (trainer:653) INFO: 63epoch:train:82-108batch: iter_time=1.045e-04, forward_time=0.034, loss=3.007, loss_att=1.583, loss_ctc=4.430, acc=0.937, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.715e-04, train_time=0.097 -[v016] 2022-01-31 05:42:41,846 (trainer:653) INFO: 63epoch:train:109-135batch: iter_time=9.923e-05, forward_time=0.036, loss=3.450, loss_att=1.805, loss_ctc=5.096, acc=0.925, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.714e-04, train_time=0.097 -[v016] 2022-01-31 05:42:44,579 (trainer:653) INFO: 63epoch:train:136-162batch: iter_time=1.694e-04, forward_time=0.035, loss=3.903, loss_att=1.867, loss_ctc=5.939, acc=0.928, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.713e-04, train_time=0.101 -[v016] 2022-01-31 05:42:47,172 (trainer:653) INFO: 63epoch:train:163-189batch: iter_time=1.242e-04, forward_time=0.034, loss=3.179, loss_att=1.615, loss_ctc=4.742, acc=0.929, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.713e-04, train_time=0.096 -[v016] 2022-01-31 05:42:49,931 (trainer:653) INFO: 63epoch:train:190-216batch: iter_time=1.044e-04, forward_time=0.038, loss=4.022, loss_att=1.977, loss_ctc=6.066, acc=0.926, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.712e-04, train_time=0.102 -[v016] 2022-01-31 05:42:52,634 (trainer:653) INFO: 63epoch:train:217-243batch: iter_time=2.012e-04, forward_time=0.034, loss=3.778, loss_att=2.053, loss_ctc=5.503, acc=0.912, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.711e-04, train_time=0.100 -[v016] 2022-01-31 05:42:55,244 (trainer:653) INFO: 63epoch:train:244-270batch: iter_time=1.249e-04, forward_time=0.034, loss=3.826, loss_att=1.968, loss_ctc=5.683, acc=0.921, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.711e-04, train_time=0.097 -[v016] 2022-01-31 05:42:58,000 (trainer:653) INFO: 63epoch:train:271-297batch: iter_time=1.276e-04, forward_time=0.035, loss=3.925, loss_att=1.949, loss_ctc=5.900, acc=0.923, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.710e-04, train_time=0.102 -[v016] 2022-01-31 05:43:00,651 (trainer:653) INFO: 63epoch:train:298-324batch: iter_time=3.188e-04, forward_time=0.034, loss=3.209, loss_att=1.779, loss_ctc=4.638, acc=0.917, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.709e-04, train_time=0.098 -[v016] 2022-01-31 05:43:03,251 (trainer:653) INFO: 63epoch:train:325-351batch: iter_time=9.646e-05, forward_time=0.034, loss=3.888, loss_att=1.894, loss_ctc=5.881, acc=0.928, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.709e-04, train_time=0.096 -[v016] 2022-01-31 05:43:05,950 (trainer:653) INFO: 63epoch:train:352-378batch: iter_time=1.023e-04, forward_time=0.035, loss=4.118, loss_att=1.991, loss_ctc=6.244, acc=0.930, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.708e-04, train_time=0.100 -[v016] 2022-01-31 05:43:08,629 (trainer:653) INFO: 63epoch:train:379-405batch: iter_time=2.424e-04, forward_time=0.035, loss=3.129, loss_att=1.689, loss_ctc=4.569, acc=0.923, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.707e-04, train_time=0.099 -[v016] 2022-01-31 05:43:11,446 (trainer:653) INFO: 63epoch:train:406-432batch: iter_time=2.006e-04, forward_time=0.036, loss=3.923, loss_att=1.946, loss_ctc=5.899, acc=0.927, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.707e-04, train_time=0.104 -[v016] 2022-01-31 05:43:14,114 (trainer:653) INFO: 63epoch:train:433-459batch: iter_time=1.278e-04, forward_time=0.035, loss=3.849, loss_att=1.814, loss_ctc=5.885, acc=0.938, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.706e-04, train_time=0.099 -[v016] 2022-01-31 05:43:16,869 (trainer:653) INFO: 63epoch:train:460-486batch: iter_time=1.823e-04, forward_time=0.035, loss=3.324, loss_att=1.774, loss_ctc=4.875, acc=0.932, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.705e-04, train_time=0.102 -[v016] 2022-01-31 05:43:19,477 (trainer:653) INFO: 63epoch:train:487-513batch: iter_time=1.195e-04, forward_time=0.034, loss=3.431, loss_att=1.756, loss_ctc=5.105, acc=0.926, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.705e-04, train_time=0.096 -[v016] 2022-01-31 05:43:22,216 (trainer:653) INFO: 63epoch:train:514-540batch: iter_time=0.002, forward_time=0.037, loss=3.362, loss_att=1.680, loss_ctc=5.043, acc=0.935, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.704e-04, train_time=0.101 -[v016] 2022-01-31 05:43:58,073 (trainer:328) INFO: 63epoch results: [train] iter_time=4.463e-04, forward_time=0.035, loss=3.623, loss_att=1.827, loss_ctc=5.419, acc=0.927, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.710e-04, train_time=0.100, time=54.8 seconds, total_count=34461, gpu_max_cached_mem_GB=5.824, [valid] loss=6.603, loss_att=5.174, loss_ctc=8.031, acc=0.897, cer=0.110, wer=0.423, cer_ctc=0.172, time=5.89 seconds, total_count=11214, gpu_max_cached_mem_GB=5.824, [att_plot] time=29.2 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 05:44:00,252 (trainer:375) INFO: The best model has been updated: train.loss, valid.acc -[v016] 2022-01-31 05:44:00,256 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/55epoch.pth -[v016] 2022-01-31 05:44:00,260 (trainer:261) INFO: 64/200epoch started. Estimated time to finish: 5 hours, 5 minutes and 11.66 seconds -[v016] 2022-01-31 05:44:03,176 (trainer:653) INFO: 64epoch:train:1-27batch: iter_time=0.004, forward_time=0.036, loss=3.615, loss_att=1.761, loss_ctc=5.469, acc=0.934, backward_time=0.022, optim_step_time=0.024, optim0_lr0=1.703e-04, train_time=0.108 -[v016] 2022-01-31 05:44:05,705 (trainer:653) INFO: 64epoch:train:28-54batch: iter_time=1.293e-04, forward_time=0.033, loss=2.861, loss_att=1.430, loss_ctc=4.292, acc=0.943, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.702e-04, train_time=0.094 -[v016] 2022-01-31 05:44:08,416 (trainer:653) INFO: 64epoch:train:55-81batch: iter_time=1.296e-04, forward_time=0.035, loss=3.337, loss_att=1.804, loss_ctc=4.869, acc=0.922, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.702e-04, train_time=0.100 -[v016] 2022-01-31 05:44:11,066 (trainer:653) INFO: 64epoch:train:82-108batch: iter_time=3.095e-04, forward_time=0.034, loss=2.872, loss_att=1.514, loss_ctc=4.230, acc=0.929, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.701e-04, train_time=0.098 -[v016] 2022-01-31 05:44:13,635 (trainer:653) INFO: 64epoch:train:109-135batch: iter_time=1.081e-04, forward_time=0.034, loss=3.099, loss_att=1.569, loss_ctc=4.628, acc=0.933, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.700e-04, train_time=0.095 -[v016] 2022-01-31 05:44:16,187 (trainer:653) INFO: 64epoch:train:136-162batch: iter_time=9.730e-05, forward_time=0.033, loss=3.256, loss_att=1.696, loss_ctc=4.816, acc=0.931, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.700e-04, train_time=0.094 -[v016] 2022-01-31 05:44:18,970 (trainer:653) INFO: 64epoch:train:163-189batch: iter_time=1.834e-04, forward_time=0.035, loss=4.408, loss_att=2.114, loss_ctc=6.703, acc=0.927, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.699e-04, train_time=0.103 -[v016] 2022-01-31 05:44:21,768 (trainer:653) INFO: 64epoch:train:190-216batch: iter_time=1.543e-04, forward_time=0.035, loss=4.073, loss_att=1.996, loss_ctc=6.150, acc=0.924, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.698e-04, train_time=0.103 -[v016] 2022-01-31 05:44:24,788 (trainer:653) INFO: 64epoch:train:217-243batch: iter_time=0.019, forward_time=0.033, loss=3.310, loss_att=1.649, loss_ctc=4.970, acc=0.933, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.698e-04, train_time=0.112 -[v016] 2022-01-31 05:44:27,481 (trainer:653) INFO: 64epoch:train:244-270batch: iter_time=1.468e-04, forward_time=0.035, loss=3.131, loss_att=1.629, loss_ctc=4.633, acc=0.932, backward_time=0.022, optim_step_time=0.023, optim0_lr0=1.697e-04, train_time=0.099 -[v016] 2022-01-31 05:44:30,199 (trainer:653) INFO: 64epoch:train:271-297batch: iter_time=1.950e-04, forward_time=0.035, loss=3.373, loss_att=1.725, loss_ctc=5.021, acc=0.935, backward_time=0.022, optim_step_time=0.025, optim0_lr0=1.696e-04, train_time=0.100 -[v016] 2022-01-31 05:44:32,784 (trainer:653) INFO: 64epoch:train:298-324batch: iter_time=1.104e-04, forward_time=0.034, loss=3.712, loss_att=1.873, loss_ctc=5.551, acc=0.928, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.696e-04, train_time=0.096 -[v016] 2022-01-31 05:44:35,398 (trainer:653) INFO: 64epoch:train:325-351batch: iter_time=1.096e-04, forward_time=0.034, loss=3.151, loss_att=1.612, loss_ctc=4.691, acc=0.936, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.695e-04, train_time=0.097 -[v016] 2022-01-31 05:44:38,055 (trainer:653) INFO: 64epoch:train:352-378batch: iter_time=1.466e-04, forward_time=0.033, loss=2.947, loss_att=1.637, loss_ctc=4.256, acc=0.917, backward_time=0.022, optim_step_time=0.025, optim0_lr0=1.695e-04, train_time=0.098 -[v016] 2022-01-31 05:44:40,628 (trainer:653) INFO: 64epoch:train:379-405batch: iter_time=1.147e-04, forward_time=0.034, loss=3.243, loss_att=1.649, loss_ctc=4.838, acc=0.938, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.694e-04, train_time=0.095 -[v016] 2022-01-31 05:44:43,312 (trainer:653) INFO: 64epoch:train:406-432batch: iter_time=1.589e-04, forward_time=0.034, loss=3.374, loss_att=1.712, loss_ctc=5.036, acc=0.942, backward_time=0.022, optim_step_time=0.024, optim0_lr0=1.693e-04, train_time=0.099 -[v016] 2022-01-31 05:44:46,108 (trainer:653) INFO: 64epoch:train:433-459batch: iter_time=1.656e-04, forward_time=0.039, loss=3.732, loss_att=1.826, loss_ctc=5.639, acc=0.931, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.693e-04, train_time=0.103 -[v016] 2022-01-31 05:44:49,305 (trainer:653) INFO: 64epoch:train:460-486batch: iter_time=5.520e-04, forward_time=0.039, loss=3.752, loss_att=1.985, loss_ctc=5.520, acc=0.929, backward_time=0.023, optim_step_time=0.024, optim0_lr0=1.692e-04, train_time=0.115 -[v016] 2022-01-31 05:44:53,185 (trainer:653) INFO: 64epoch:train:487-513batch: iter_time=7.741e-04, forward_time=0.045, loss=3.875, loss_att=1.947, loss_ctc=5.803, acc=0.922, backward_time=0.025, optim_step_time=0.032, optim0_lr0=1.691e-04, train_time=0.144 -[v016] 2022-01-31 05:44:56,988 (trainer:653) INFO: 64epoch:train:514-540batch: iter_time=8.450e-04, forward_time=0.053, loss=3.995, loss_att=1.948, loss_ctc=6.042, acc=0.924, backward_time=0.023, optim_step_time=0.031, optim0_lr0=1.691e-04, train_time=0.141 -[v016] 2022-01-31 05:45:48,294 (trainer:328) INFO: 64epoch results: [train] iter_time=0.001, forward_time=0.036, loss=3.484, loss_att=1.765, loss_ctc=5.202, acc=0.931, backward_time=0.022, optim_step_time=0.024, optim0_lr0=1.697e-04, train_time=0.108, time=59.29 seconds, total_count=35008, gpu_max_cached_mem_GB=5.824, [valid] loss=6.545, loss_att=5.179, loss_ctc=7.910, acc=0.895, cer=0.111, wer=0.427, cer_ctc=0.169, time=9.12 seconds, total_count=11392, gpu_max_cached_mem_GB=5.824, [att_plot] time=39.6 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 05:45:50,863 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc -[v016] 2022-01-31 05:45:50,888 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/59epoch.pth -[v016] 2022-01-31 05:45:50,891 (trainer:261) INFO: 65/200epoch started. Estimated time to finish: 5 hours, 1 minute and 46.82 seconds -[v016] 2022-01-31 05:46:03,964 (trainer:653) INFO: 65epoch:train:1-27batch: iter_time=0.271, forward_time=0.065, loss=3.248, loss_att=1.588, loss_ctc=4.909, acc=0.924, backward_time=0.057, optim_step_time=0.024, optim0_lr0=1.690e-04, train_time=0.479 -[v016] 2022-01-31 05:46:17,312 (trainer:653) INFO: 65epoch:train:28-54batch: iter_time=0.392, forward_time=0.035, loss=3.565, loss_att=1.706, loss_ctc=5.424, acc=0.939, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.689e-04, train_time=0.494 -[v016] 2022-01-31 05:46:25,578 (trainer:653) INFO: 65epoch:train:55-81batch: iter_time=0.204, forward_time=0.035, loss=3.486, loss_att=1.643, loss_ctc=5.329, acc=0.940, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.688e-04, train_time=0.306 -[v016] 2022-01-31 05:46:32,713 (trainer:653) INFO: 65epoch:train:82-108batch: iter_time=0.157, forward_time=0.039, loss=3.438, loss_att=1.699, loss_ctc=5.177, acc=0.932, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.688e-04, train_time=0.264 -[v016] 2022-01-31 05:46:39,960 (trainer:653) INFO: 65epoch:train:109-135batch: iter_time=0.167, forward_time=0.034, loss=2.894, loss_att=1.460, loss_ctc=4.329, acc=0.941, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.687e-04, train_time=0.268 -[v016] 2022-01-31 05:46:45,678 (trainer:653) INFO: 65epoch:train:136-162batch: iter_time=0.109, forward_time=0.033, loss=3.301, loss_att=1.707, loss_ctc=4.895, acc=0.928, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.687e-04, train_time=0.212 -[v016] 2022-01-31 05:46:51,978 (trainer:653) INFO: 65epoch:train:163-189batch: iter_time=0.134, forward_time=0.033, loss=3.515, loss_att=1.834, loss_ctc=5.196, acc=0.923, backward_time=0.023, optim_step_time=0.024, optim0_lr0=1.686e-04, train_time=0.233 -[v016] 2022-01-31 05:46:59,381 (trainer:653) INFO: 65epoch:train:190-216batch: iter_time=0.171, forward_time=0.035, loss=3.718, loss_att=1.759, loss_ctc=5.676, acc=0.935, backward_time=0.023, optim_step_time=0.024, optim0_lr0=1.685e-04, train_time=0.274 -[v016] 2022-01-31 05:47:06,569 (trainer:653) INFO: 65epoch:train:217-243batch: iter_time=0.158, forward_time=0.034, loss=3.399, loss_att=1.759, loss_ctc=5.038, acc=0.929, backward_time=0.024, optim_step_time=0.026, optim0_lr0=1.685e-04, train_time=0.266 -[v016] 2022-01-31 05:47:14,064 (trainer:653) INFO: 65epoch:train:244-270batch: iter_time=0.172, forward_time=0.035, loss=3.400, loss_att=1.724, loss_ctc=5.075, acc=0.936, backward_time=0.024, optim_step_time=0.026, optim0_lr0=1.684e-04, train_time=0.277 -[v016] 2022-01-31 05:47:21,826 (trainer:653) INFO: 65epoch:train:271-297batch: iter_time=0.182, forward_time=0.036, loss=4.113, loss_att=1.976, loss_ctc=6.250, acc=0.929, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.683e-04, train_time=0.287 -[v016] 2022-01-31 05:47:29,261 (trainer:653) INFO: 65epoch:train:298-324batch: iter_time=0.171, forward_time=0.035, loss=4.207, loss_att=2.063, loss_ctc=6.351, acc=0.921, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.683e-04, train_time=0.275 -[v016] 2022-01-31 05:47:38,940 (trainer:653) INFO: 65epoch:train:325-351batch: iter_time=0.260, forward_time=0.034, loss=3.589, loss_att=1.774, loss_ctc=5.404, acc=0.931, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.682e-04, train_time=0.358 -[v016] 2022-01-31 05:47:48,164 (trainer:653) INFO: 65epoch:train:352-378batch: iter_time=0.241, forward_time=0.034, loss=4.173, loss_att=1.941, loss_ctc=6.405, acc=0.928, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.681e-04, train_time=0.341 -[v016] 2022-01-31 05:47:56,351 (trainer:653) INFO: 65epoch:train:379-405batch: iter_time=0.203, forward_time=0.036, loss=3.216, loss_att=1.656, loss_ctc=4.775, acc=0.933, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.681e-04, train_time=0.303 -[v016] 2022-01-31 05:48:05,061 (trainer:653) INFO: 65epoch:train:406-432batch: iter_time=0.227, forward_time=0.033, loss=3.497, loss_att=1.799, loss_ctc=5.195, acc=0.919, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.680e-04, train_time=0.322 -[v016] 2022-01-31 05:48:11,769 (trainer:653) INFO: 65epoch:train:433-459batch: iter_time=0.147, forward_time=0.037, loss=3.447, loss_att=1.812, loss_ctc=5.082, acc=0.927, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.679e-04, train_time=0.248 -[v016] 2022-01-31 05:48:17,980 (trainer:653) INFO: 65epoch:train:460-486batch: iter_time=0.129, forward_time=0.036, loss=2.914, loss_att=1.529, loss_ctc=4.300, acc=0.935, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.679e-04, train_time=0.230 -[v016] 2022-01-31 05:48:24,134 (trainer:653) INFO: 65epoch:train:487-513batch: iter_time=0.131, forward_time=0.034, loss=3.183, loss_att=1.747, loss_ctc=4.618, acc=0.927, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.678e-04, train_time=0.228 -[v016] 2022-01-31 05:48:30,344 (trainer:653) INFO: 65epoch:train:514-540batch: iter_time=0.134, forward_time=0.033, loss=3.939, loss_att=2.037, loss_ctc=5.841, acc=0.924, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.678e-04, train_time=0.230 -[v016] 2022-01-31 05:49:29,175 (trainer:328) INFO: 65epoch results: [train] iter_time=0.187, forward_time=0.036, loss=3.512, loss_att=1.760, loss_ctc=5.265, acc=0.930, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.684e-04, train_time=0.294, time=2 minutes and 40.86 seconds, total_count=35555, gpu_max_cached_mem_GB=5.824, [valid] loss=6.517, loss_att=5.120, loss_ctc=7.913, acc=0.899, cer=0.104, wer=0.409, cer_ctc=0.166, time=27.56 seconds, total_count=11570, gpu_max_cached_mem_GB=5.824, [att_plot] time=29.79 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 05:49:31,350 (trainer:375) INFO: The best model has been updated: valid.loss, valid.acc -[v016] 2022-01-31 05:49:31,356 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/60epoch.pth -[v016] 2022-01-31 05:49:31,356 (trainer:261) INFO: 66/200epoch started. Estimated time to finish: 5 hours, 3 minutes and 55.67 seconds -[v016] 2022-01-31 05:49:34,341 (trainer:653) INFO: 66epoch:train:1-27batch: iter_time=0.007, forward_time=0.036, loss=3.270, loss_att=1.662, loss_ctc=4.879, acc=0.932, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.677e-04, train_time=0.110 -[v016] 2022-01-31 05:49:36,943 (trainer:653) INFO: 66epoch:train:28-54batch: iter_time=1.269e-04, forward_time=0.034, loss=3.033, loss_att=1.585, loss_ctc=4.480, acc=0.936, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.676e-04, train_time=0.096 -[v016] 2022-01-31 05:49:39,648 (trainer:653) INFO: 66epoch:train:55-81batch: iter_time=0.002, forward_time=0.037, loss=2.808, loss_att=1.496, loss_ctc=4.121, acc=0.932, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.675e-04, train_time=0.100 -[v016] 2022-01-31 05:49:42,377 (trainer:653) INFO: 66epoch:train:82-108batch: iter_time=1.377e-04, forward_time=0.038, loss=3.402, loss_att=1.721, loss_ctc=5.083, acc=0.934, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.675e-04, train_time=0.101 -[v016] 2022-01-31 05:49:45,025 (trainer:653) INFO: 66epoch:train:109-135batch: iter_time=1.094e-04, forward_time=0.034, loss=3.669, loss_att=1.736, loss_ctc=5.602, acc=0.936, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.674e-04, train_time=0.098 -[v016] 2022-01-31 05:49:47,846 (trainer:653) INFO: 66epoch:train:136-162batch: iter_time=3.164e-04, forward_time=0.035, loss=3.944, loss_att=1.800, loss_ctc=6.087, acc=0.939, backward_time=0.022, optim_step_time=0.025, optim0_lr0=1.674e-04, train_time=0.104 -[v016] 2022-01-31 05:49:50,438 (trainer:653) INFO: 66epoch:train:163-189batch: iter_time=1.230e-04, forward_time=0.034, loss=3.436, loss_att=1.712, loss_ctc=5.161, acc=0.935, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.673e-04, train_time=0.096 -[v016] 2022-01-31 05:49:53,156 (trainer:653) INFO: 66epoch:train:190-216batch: iter_time=3.326e-04, forward_time=0.034, loss=3.427, loss_att=1.760, loss_ctc=5.093, acc=0.928, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.672e-04, train_time=0.100 -[v016] 2022-01-31 05:49:55,788 (trainer:653) INFO: 66epoch:train:217-243batch: iter_time=1.291e-04, forward_time=0.035, loss=3.763, loss_att=1.859, loss_ctc=5.668, acc=0.929, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.672e-04, train_time=0.097 -[v016] 2022-01-31 05:49:58,519 (trainer:653) INFO: 66epoch:train:244-270batch: iter_time=1.599e-04, forward_time=0.038, loss=3.282, loss_att=1.558, loss_ctc=5.005, acc=0.931, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.671e-04, train_time=0.101 -[v016] 2022-01-31 05:50:01,230 (trainer:653) INFO: 66epoch:train:271-297batch: iter_time=1.798e-04, forward_time=0.037, loss=3.598, loss_att=1.871, loss_ctc=5.326, acc=0.929, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.670e-04, train_time=0.100 -[v016] 2022-01-31 05:50:03,836 (trainer:653) INFO: 66epoch:train:298-324batch: iter_time=1.242e-04, forward_time=0.034, loss=3.239, loss_att=1.589, loss_ctc=4.889, acc=0.937, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.670e-04, train_time=0.096 -[v016] 2022-01-31 05:50:06,523 (trainer:653) INFO: 66epoch:train:325-351batch: iter_time=1.359e-04, forward_time=0.035, loss=3.413, loss_att=1.729, loss_ctc=5.098, acc=0.927, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.669e-04, train_time=0.099 -[v016] 2022-01-31 05:50:09,287 (trainer:653) INFO: 66epoch:train:352-378batch: iter_time=0.005, forward_time=0.034, loss=3.951, loss_att=1.892, loss_ctc=6.009, acc=0.932, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.668e-04, train_time=0.102 -[v016] 2022-01-31 05:50:12,022 (trainer:653) INFO: 66epoch:train:379-405batch: iter_time=1.886e-04, forward_time=0.035, loss=3.325, loss_att=1.716, loss_ctc=4.934, acc=0.927, backward_time=0.025, optim_step_time=0.021, optim0_lr0=1.668e-04, train_time=0.101 -[v016] 2022-01-31 05:50:14,565 (trainer:653) INFO: 66epoch:train:406-432batch: iter_time=1.240e-04, forward_time=0.033, loss=3.137, loss_att=1.675, loss_ctc=4.599, acc=0.928, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.667e-04, train_time=0.094 -[v016] 2022-01-31 05:50:17,324 (trainer:653) INFO: 66epoch:train:433-459batch: iter_time=1.953e-04, forward_time=0.035, loss=3.350, loss_att=1.644, loss_ctc=5.055, acc=0.936, backward_time=0.022, optim_step_time=0.025, optim0_lr0=1.667e-04, train_time=0.102 -[v016] 2022-01-31 05:50:20,120 (trainer:653) INFO: 66epoch:train:460-486batch: iter_time=1.250e-04, forward_time=0.038, loss=3.595, loss_att=1.732, loss_ctc=5.458, acc=0.938, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.666e-04, train_time=0.103 -[v016] 2022-01-31 05:50:22,678 (trainer:653) INFO: 66epoch:train:487-513batch: iter_time=1.153e-04, forward_time=0.034, loss=3.124, loss_att=1.650, loss_ctc=4.598, acc=0.931, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.665e-04, train_time=0.095 -[v016] 2022-01-31 05:50:25,378 (trainer:653) INFO: 66epoch:train:514-540batch: iter_time=1.776e-04, forward_time=0.034, loss=3.409, loss_att=1.777, loss_ctc=5.041, acc=0.922, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.665e-04, train_time=0.100 -[v016] 2022-01-31 05:51:02,559 (trainer:328) INFO: 66epoch results: [train] iter_time=8.042e-04, forward_time=0.035, loss=3.424, loss_att=1.713, loss_ctc=5.134, acc=0.932, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.671e-04, train_time=0.100, time=54.81 seconds, total_count=36102, gpu_max_cached_mem_GB=5.824, [valid] loss=6.335, loss_att=5.123, loss_ctc=7.548, acc=0.900, cer=0.105, wer=0.410, cer_ctc=0.163, time=6 seconds, total_count=11748, gpu_max_cached_mem_GB=5.824, [att_plot] time=30.38 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 05:51:04,792 (trainer:375) INFO: The best model has been updated: train.loss, valid.loss, train.acc, valid.acc -[v016] 2022-01-31 05:51:04,797 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/57epoch.pth -[v016] 2022-01-31 05:51:04,801 (trainer:261) INFO: 67/200epoch started. Estimated time to finish: 4 hours, 59 minutes and 39.3 seconds -[v016] 2022-01-31 05:51:07,889 (trainer:653) INFO: 67epoch:train:1-27batch: iter_time=0.013, forward_time=0.035, loss=3.104, loss_att=1.585, loss_ctc=4.624, acc=0.934, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.664e-04, train_time=0.113 -[v016] 2022-01-31 05:51:10,695 (trainer:653) INFO: 67epoch:train:28-54batch: iter_time=0.005, forward_time=0.034, loss=3.037, loss_att=1.574, loss_ctc=4.501, acc=0.935, backward_time=0.022, optim_step_time=0.023, optim0_lr0=1.663e-04, train_time=0.104 -[v016] 2022-01-31 05:51:13,420 (trainer:653) INFO: 67epoch:train:55-81batch: iter_time=0.005, forward_time=0.034, loss=3.082, loss_att=1.432, loss_ctc=4.731, acc=0.942, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.663e-04, train_time=0.101 -[v016] 2022-01-31 05:51:16,145 (trainer:653) INFO: 67epoch:train:82-108batch: iter_time=2.048e-04, forward_time=0.035, loss=2.989, loss_att=1.467, loss_ctc=4.511, acc=0.939, backward_time=0.022, optim_step_time=0.025, optim0_lr0=1.662e-04, train_time=0.101 -[v016] 2022-01-31 05:51:18,915 (trainer:653) INFO: 67epoch:train:109-135batch: iter_time=1.980e-04, forward_time=0.035, loss=3.119, loss_att=1.613, loss_ctc=4.626, acc=0.931, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.661e-04, train_time=0.102 -[v016] 2022-01-31 05:51:21,495 (trainer:653) INFO: 67epoch:train:136-162batch: iter_time=1.354e-04, forward_time=0.034, loss=2.979, loss_att=1.610, loss_ctc=4.348, acc=0.937, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.661e-04, train_time=0.095 -[v016] 2022-01-31 05:51:24,225 (trainer:653) INFO: 67epoch:train:163-189batch: iter_time=1.489e-04, forward_time=0.035, loss=3.495, loss_att=1.683, loss_ctc=5.308, acc=0.936, backward_time=0.022, optim_step_time=0.025, optim0_lr0=1.660e-04, train_time=0.101 -[v016] 2022-01-31 05:51:26,975 (trainer:653) INFO: 67epoch:train:190-216batch: iter_time=1.995e-04, forward_time=0.035, loss=3.500, loss_att=1.826, loss_ctc=5.174, acc=0.928, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.660e-04, train_time=0.102 -[v016] 2022-01-31 05:51:29,652 (trainer:653) INFO: 67epoch:train:217-243batch: iter_time=1.087e-04, forward_time=0.035, loss=3.837, loss_att=1.832, loss_ctc=5.842, acc=0.936, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.659e-04, train_time=0.099 -[v016] 2022-01-31 05:51:32,418 (trainer:653) INFO: 67epoch:train:244-270batch: iter_time=1.252e-04, forward_time=0.035, loss=3.573, loss_att=1.719, loss_ctc=5.427, acc=0.935, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.658e-04, train_time=0.102 -[v016] 2022-01-31 05:51:35,044 (trainer:653) INFO: 67epoch:train:271-297batch: iter_time=1.112e-04, forward_time=0.035, loss=3.438, loss_att=1.660, loss_ctc=5.217, acc=0.933, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.658e-04, train_time=0.097 -[v016] 2022-01-31 05:51:37,833 (trainer:653) INFO: 67epoch:train:298-324batch: iter_time=0.004, forward_time=0.034, loss=3.196, loss_att=1.588, loss_ctc=4.804, acc=0.934, backward_time=0.022, optim_step_time=0.025, optim0_lr0=1.657e-04, train_time=0.103 -[v016] 2022-01-31 05:51:40,402 (trainer:653) INFO: 67epoch:train:325-351batch: iter_time=1.136e-04, forward_time=0.034, loss=3.369, loss_att=1.662, loss_ctc=5.076, acc=0.933, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.657e-04, train_time=0.095 -[v016] 2022-01-31 05:51:43,175 (trainer:653) INFO: 67epoch:train:352-378batch: iter_time=8.778e-04, forward_time=0.034, loss=2.971, loss_att=1.600, loss_ctc=4.342, acc=0.934, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.656e-04, train_time=0.102 -[v016] 2022-01-31 05:51:45,709 (trainer:653) INFO: 67epoch:train:379-405batch: iter_time=1.184e-04, forward_time=0.033, loss=2.939, loss_att=1.562, loss_ctc=4.316, acc=0.929, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.655e-04, train_time=0.094 -[v016] 2022-01-31 05:51:48,423 (trainer:653) INFO: 67epoch:train:406-432batch: iter_time=1.679e-04, forward_time=0.034, loss=3.068, loss_att=1.530, loss_ctc=4.607, acc=0.936, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.655e-04, train_time=0.100 -[v016] 2022-01-31 05:51:51,181 (trainer:653) INFO: 67epoch:train:433-459batch: iter_time=1.256e-04, forward_time=0.039, loss=3.732, loss_att=1.816, loss_ctc=5.647, acc=0.933, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.654e-04, train_time=0.102 -[v016] 2022-01-31 05:51:53,783 (trainer:653) INFO: 67epoch:train:460-486batch: iter_time=1.149e-04, forward_time=0.034, loss=3.819, loss_att=1.900, loss_ctc=5.739, acc=0.923, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.653e-04, train_time=0.096 -[v016] 2022-01-31 05:51:56,521 (trainer:653) INFO: 67epoch:train:487-513batch: iter_time=1.146e-04, forward_time=0.038, loss=3.515, loss_att=1.771, loss_ctc=5.260, acc=0.928, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.653e-04, train_time=0.101 -[v016] 2022-01-31 05:51:59,229 (trainer:653) INFO: 67epoch:train:514-540batch: iter_time=1.399e-04, forward_time=0.038, loss=3.482, loss_att=1.806, loss_ctc=5.158, acc=0.924, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.652e-04, train_time=0.100 -[v016] 2022-01-31 05:52:35,254 (trainer:328) INFO: 67epoch results: [train] iter_time=0.001, forward_time=0.035, loss=3.310, loss_att=1.660, loss_ctc=4.959, acc=0.933, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.658e-04, train_time=0.101, time=55.22 seconds, total_count=36649, gpu_max_cached_mem_GB=5.824, [valid] loss=6.477, loss_att=5.199, loss_ctc=7.756, acc=0.899, cer=0.105, wer=0.408, cer_ctc=0.163, time=5.92 seconds, total_count=11926, gpu_max_cached_mem_GB=5.824, [att_plot] time=29.3 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 05:52:37,450 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 05:52:37,455 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/58epoch.pth -[v016] 2022-01-31 05:52:37,458 (trainer:261) INFO: 68/200epoch started. Estimated time to finish: 4 hours, 55 minutes and 27.64 seconds -[v016] 2022-01-31 05:52:40,307 (trainer:653) INFO: 68epoch:train:1-27batch: iter_time=0.004, forward_time=0.035, loss=3.644, loss_att=1.681, loss_ctc=5.606, acc=0.934, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.652e-04, train_time=0.105 -[v016] 2022-01-31 05:52:43,040 (trainer:653) INFO: 68epoch:train:28-54batch: iter_time=1.591e-04, forward_time=0.037, loss=2.842, loss_att=1.351, loss_ctc=4.333, acc=0.943, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.651e-04, train_time=0.101 -[v016] 2022-01-31 05:52:45,956 (trainer:653) INFO: 68epoch:train:55-81batch: iter_time=0.011, forward_time=0.034, loss=3.175, loss_att=1.589, loss_ctc=4.760, acc=0.938, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.650e-04, train_time=0.108 -[v016] 2022-01-31 05:52:48,611 (trainer:653) INFO: 68epoch:train:82-108batch: iter_time=1.710e-04, forward_time=0.034, loss=3.213, loss_att=1.643, loss_ctc=4.782, acc=0.921, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.650e-04, train_time=0.098 -[v016] 2022-01-31 05:52:51,171 (trainer:653) INFO: 68epoch:train:109-135batch: iter_time=1.052e-04, forward_time=0.033, loss=2.773, loss_att=1.428, loss_ctc=4.118, acc=0.940, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.649e-04, train_time=0.095 -[v016] 2022-01-31 05:52:53,959 (trainer:653) INFO: 68epoch:train:136-162batch: iter_time=1.235e-04, forward_time=0.039, loss=3.678, loss_att=1.737, loss_ctc=5.619, acc=0.934, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.648e-04, train_time=0.103 -[v016] 2022-01-31 05:52:56,624 (trainer:653) INFO: 68epoch:train:163-189batch: iter_time=2.191e-04, forward_time=0.035, loss=2.644, loss_att=1.372, loss_ctc=3.916, acc=0.939, backward_time=0.022, optim_step_time=0.023, optim0_lr0=1.648e-04, train_time=0.098 -[v016] 2022-01-31 05:52:59,309 (trainer:653) INFO: 68epoch:train:190-216batch: iter_time=9.883e-05, forward_time=0.036, loss=3.271, loss_att=1.622, loss_ctc=4.920, acc=0.941, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.647e-04, train_time=0.099 -[v016] 2022-01-31 05:53:02,042 (trainer:653) INFO: 68epoch:train:217-243batch: iter_time=1.422e-04, forward_time=0.035, loss=2.998, loss_att=1.560, loss_ctc=4.437, acc=0.933, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.647e-04, train_time=0.101 -[v016] 2022-01-31 05:53:04,791 (trainer:653) INFO: 68epoch:train:244-270batch: iter_time=1.881e-04, forward_time=0.035, loss=3.363, loss_att=1.663, loss_ctc=5.064, acc=0.937, backward_time=0.023, optim_step_time=0.021, optim0_lr0=1.646e-04, train_time=0.102 -[v016] 2022-01-31 05:53:07,437 (trainer:653) INFO: 68epoch:train:271-297batch: iter_time=1.361e-04, forward_time=0.035, loss=3.019, loss_att=1.514, loss_ctc=4.523, acc=0.938, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.645e-04, train_time=0.098 -[v016] 2022-01-31 05:53:10,241 (trainer:653) INFO: 68epoch:train:298-324batch: iter_time=3.098e-04, forward_time=0.036, loss=3.386, loss_att=1.693, loss_ctc=5.078, acc=0.935, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.645e-04, train_time=0.101 -[v016] 2022-01-31 05:53:12,946 (trainer:653) INFO: 68epoch:train:325-351batch: iter_time=1.127e-04, forward_time=0.036, loss=3.367, loss_att=1.650, loss_ctc=5.084, acc=0.935, backward_time=0.023, optim_step_time=0.021, optim0_lr0=1.644e-04, train_time=0.100 -[v016] 2022-01-31 05:53:15,790 (trainer:653) INFO: 68epoch:train:352-378batch: iter_time=0.002, forward_time=0.036, loss=3.869, loss_att=1.752, loss_ctc=5.986, acc=0.941, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.644e-04, train_time=0.105 -[v016] 2022-01-31 05:53:18,558 (trainer:653) INFO: 68epoch:train:379-405batch: iter_time=0.003, forward_time=0.035, loss=3.610, loss_att=1.724, loss_ctc=5.497, acc=0.934, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.643e-04, train_time=0.102 -[v016] 2022-01-31 05:53:21,240 (trainer:653) INFO: 68epoch:train:406-432batch: iter_time=1.545e-04, forward_time=0.037, loss=2.867, loss_att=1.527, loss_ctc=4.207, acc=0.933, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.642e-04, train_time=0.099 -[v016] 2022-01-31 05:53:23,974 (trainer:653) INFO: 68epoch:train:433-459batch: iter_time=2.223e-04, forward_time=0.035, loss=2.874, loss_att=1.525, loss_ctc=4.223, acc=0.936, backward_time=0.022, optim_step_time=0.025, optim0_lr0=1.642e-04, train_time=0.101 -[v016] 2022-01-31 05:53:26,487 (trainer:653) INFO: 68epoch:train:460-486batch: iter_time=1.247e-04, forward_time=0.033, loss=3.128, loss_att=1.697, loss_ctc=4.559, acc=0.927, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.641e-04, train_time=0.093 -[v016] 2022-01-31 05:53:29,268 (trainer:653) INFO: 68epoch:train:487-513batch: iter_time=2.244e-04, forward_time=0.035, loss=3.508, loss_att=1.797, loss_ctc=5.219, acc=0.928, backward_time=0.022, optim_step_time=0.024, optim0_lr0=1.641e-04, train_time=0.103 -[v016] 2022-01-31 05:53:31,859 (trainer:653) INFO: 68epoch:train:514-540batch: iter_time=1.293e-04, forward_time=0.034, loss=3.458, loss_att=1.750, loss_ctc=5.165, acc=0.931, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.640e-04, train_time=0.096 -[v016] 2022-01-31 05:54:07,676 (trainer:328) INFO: 68epoch results: [train] iter_time=0.001, forward_time=0.035, loss=3.234, loss_att=1.617, loss_ctc=4.851, acc=0.935, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.646e-04, train_time=0.100, time=55.2 seconds, total_count=37196, gpu_max_cached_mem_GB=5.824, [valid] loss=6.424, loss_att=5.135, loss_ctc=7.713, acc=0.899, cer=0.106, wer=0.414, cer_ctc=0.158, time=5.98 seconds, total_count=12104, gpu_max_cached_mem_GB=5.824, [att_plot] time=29.02 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 05:54:09,807 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 05:54:09,812 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/61epoch.pth, exp/asr_train_asr_raw_en_word/62epoch.pth -[v016] 2022-01-31 05:54:09,816 (trainer:261) INFO: 69/200epoch started. Estimated time to finish: 4 hours, 51 minutes and 21.79 seconds -[v016] 2022-01-31 05:54:13,432 (trainer:653) INFO: 69epoch:train:1-27batch: iter_time=0.004, forward_time=0.047, loss=3.556, loss_att=1.638, loss_ctc=5.474, acc=0.942, backward_time=0.023, optim_step_time=0.024, optim0_lr0=1.639e-04, train_time=0.129 -[v016] 2022-01-31 05:54:16,012 (trainer:653) INFO: 69epoch:train:28-54batch: iter_time=1.158e-04, forward_time=0.034, loss=2.617, loss_att=1.359, loss_ctc=3.875, acc=0.935, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.639e-04, train_time=0.095 -[v016] 2022-01-31 05:54:19,112 (trainer:653) INFO: 69epoch:train:55-81batch: iter_time=0.012, forward_time=0.035, loss=3.661, loss_att=1.755, loss_ctc=5.567, acc=0.935, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.638e-04, train_time=0.115 -[v016] 2022-01-31 05:54:21,958 (trainer:653) INFO: 69epoch:train:82-108batch: iter_time=0.004, forward_time=0.038, loss=2.844, loss_att=1.332, loss_ctc=4.357, acc=0.945, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.638e-04, train_time=0.105 -[v016] 2022-01-31 05:54:24,578 (trainer:653) INFO: 69epoch:train:109-135batch: iter_time=1.162e-04, forward_time=0.034, loss=3.089, loss_att=1.460, loss_ctc=4.718, acc=0.942, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.637e-04, train_time=0.097 -[v016] 2022-01-31 05:54:27,355 (trainer:653) INFO: 69epoch:train:136-162batch: iter_time=4.062e-04, forward_time=0.035, loss=3.259, loss_att=1.571, loss_ctc=4.947, acc=0.934, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.636e-04, train_time=0.099 -[v016] 2022-01-31 05:54:29,971 (trainer:653) INFO: 69epoch:train:163-189batch: iter_time=1.248e-04, forward_time=0.034, loss=2.843, loss_att=1.452, loss_ctc=4.233, acc=0.935, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.636e-04, train_time=0.097 -[v016] 2022-01-31 05:54:32,734 (trainer:653) INFO: 69epoch:train:190-216batch: iter_time=1.823e-04, forward_time=0.035, loss=3.083, loss_att=1.458, loss_ctc=4.707, acc=0.944, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.635e-04, train_time=0.102 -[v016] 2022-01-31 05:54:35,434 (trainer:653) INFO: 69epoch:train:217-243batch: iter_time=0.001, forward_time=0.034, loss=3.473, loss_att=1.707, loss_ctc=5.239, acc=0.935, backward_time=0.022, optim_step_time=0.023, optim0_lr0=1.635e-04, train_time=0.100 -[v016] 2022-01-31 05:54:38,091 (trainer:653) INFO: 69epoch:train:244-270batch: iter_time=9.956e-05, forward_time=0.035, loss=3.559, loss_att=1.725, loss_ctc=5.394, acc=0.933, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.634e-04, train_time=0.098 -[v016] 2022-01-31 05:54:40,747 (trainer:653) INFO: 69epoch:train:271-297batch: iter_time=1.972e-04, forward_time=0.033, loss=2.525, loss_att=1.340, loss_ctc=3.709, acc=0.940, backward_time=0.022, optim_step_time=0.024, optim0_lr0=1.633e-04, train_time=0.098 -[v016] 2022-01-31 05:54:43,442 (trainer:653) INFO: 69epoch:train:298-324batch: iter_time=1.146e-04, forward_time=0.035, loss=3.547, loss_att=1.732, loss_ctc=5.362, acc=0.940, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.633e-04, train_time=0.100 -[v016] 2022-01-31 05:54:46,114 (trainer:653) INFO: 69epoch:train:325-351batch: iter_time=2.069e-04, forward_time=0.034, loss=2.789, loss_att=1.541, loss_ctc=4.037, acc=0.925, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.632e-04, train_time=0.099 -[v016] 2022-01-31 05:54:48,702 (trainer:653) INFO: 69epoch:train:352-378batch: iter_time=1.145e-04, forward_time=0.034, loss=3.002, loss_att=1.501, loss_ctc=4.503, acc=0.938, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.632e-04, train_time=0.096 -[v016] 2022-01-31 05:54:51,475 (trainer:653) INFO: 69epoch:train:379-405batch: iter_time=0.007, forward_time=0.035, loss=2.851, loss_att=1.514, loss_ctc=4.189, acc=0.936, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.631e-04, train_time=0.102 -[v016] 2022-01-31 05:54:54,047 (trainer:653) INFO: 69epoch:train:406-432batch: iter_time=1.250e-04, forward_time=0.034, loss=3.245, loss_att=1.639, loss_ctc=4.850, acc=0.934, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.630e-04, train_time=0.095 -[v016] 2022-01-31 05:54:56,715 (trainer:653) INFO: 69epoch:train:433-459batch: iter_time=1.610e-04, forward_time=0.034, loss=3.072, loss_att=1.611, loss_ctc=4.532, acc=0.930, backward_time=0.022, optim_step_time=0.025, optim0_lr0=1.630e-04, train_time=0.098 -[v016] 2022-01-31 05:54:59,446 (trainer:653) INFO: 69epoch:train:460-486batch: iter_time=1.816e-04, forward_time=0.038, loss=3.480, loss_att=1.677, loss_ctc=5.282, acc=0.933, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.629e-04, train_time=0.101 -[v016] 2022-01-31 05:55:02,027 (trainer:653) INFO: 69epoch:train:487-513batch: iter_time=1.088e-04, forward_time=0.033, loss=2.989, loss_att=1.571, loss_ctc=4.408, acc=0.926, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.629e-04, train_time=0.095 -[v016] 2022-01-31 05:55:04,706 (trainer:653) INFO: 69epoch:train:514-540batch: iter_time=1.295e-04, forward_time=0.037, loss=3.468, loss_att=1.772, loss_ctc=5.165, acc=0.932, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.628e-04, train_time=0.099 -[v016] 2022-01-31 05:55:43,681 (trainer:328) INFO: 69epoch results: [train] iter_time=0.002, forward_time=0.035, loss=3.161, loss_att=1.574, loss_ctc=4.749, acc=0.936, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.634e-04, train_time=0.101, time=55.63 seconds, total_count=37743, gpu_max_cached_mem_GB=5.824, [valid] loss=6.511, loss_att=5.234, loss_ctc=7.788, acc=0.899, cer=0.106, wer=0.417, cer_ctc=0.163, time=5.89 seconds, total_count=12282, gpu_max_cached_mem_GB=5.824, [att_plot] time=32.28 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 05:55:46,225 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 05:55:46,237 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/63epoch.pth -[v016] 2022-01-31 05:55:46,244 (trainer:261) INFO: 70/200epoch started. Estimated time to finish: 4 hours, 47 minutes and 33.07 seconds -[v016] 2022-01-31 05:55:50,254 (trainer:653) INFO: 70epoch:train:1-27batch: iter_time=0.004, forward_time=0.059, loss=3.075, loss_att=1.453, loss_ctc=4.697, acc=0.943, backward_time=0.038, optim_step_time=0.021, optim0_lr0=1.627e-04, train_time=0.145 -[v016] 2022-01-31 05:55:52,866 (trainer:653) INFO: 70epoch:train:28-54batch: iter_time=4.488e-04, forward_time=0.034, loss=2.807, loss_att=1.428, loss_ctc=4.186, acc=0.930, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.627e-04, train_time=0.097 -[v016] 2022-01-31 05:55:55,645 (trainer:653) INFO: 70epoch:train:55-81batch: iter_time=0.001, forward_time=0.035, loss=3.222, loss_att=1.698, loss_ctc=4.747, acc=0.931, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.626e-04, train_time=0.103 -[v016] 2022-01-31 05:55:58,233 (trainer:653) INFO: 70epoch:train:82-108batch: iter_time=1.296e-04, forward_time=0.033, loss=2.600, loss_att=1.404, loss_ctc=3.796, acc=0.942, backward_time=0.022, optim_step_time=0.023, optim0_lr0=1.626e-04, train_time=0.096 -[v016] 2022-01-31 05:56:01,001 (trainer:653) INFO: 70epoch:train:109-135batch: iter_time=3.750e-04, forward_time=0.035, loss=3.384, loss_att=1.590, loss_ctc=5.177, acc=0.931, backward_time=0.022, optim_step_time=0.024, optim0_lr0=1.625e-04, train_time=0.102 -[v016] 2022-01-31 05:56:03,671 (trainer:653) INFO: 70epoch:train:136-162batch: iter_time=1.180e-04, forward_time=0.035, loss=3.476, loss_att=1.586, loss_ctc=5.366, acc=0.943, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.625e-04, train_time=0.099 -[v016] 2022-01-31 05:56:08,780 (trainer:653) INFO: 70epoch:train:163-189batch: iter_time=1.975e-04, forward_time=0.080, loss=2.681, loss_att=1.423, loss_ctc=3.938, acc=0.935, backward_time=0.026, optim_step_time=0.022, optim0_lr0=1.624e-04, train_time=0.189 -[v016] 2022-01-31 05:56:11,526 (trainer:653) INFO: 70epoch:train:190-216batch: iter_time=1.450e-04, forward_time=0.035, loss=3.346, loss_att=1.652, loss_ctc=5.039, acc=0.938, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.623e-04, train_time=0.101 -[v016] 2022-01-31 05:56:14,163 (trainer:653) INFO: 70epoch:train:217-243batch: iter_time=1.429e-04, forward_time=0.034, loss=2.878, loss_att=1.387, loss_ctc=4.368, acc=0.945, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.623e-04, train_time=0.097 -[v016] 2022-01-31 05:56:16,937 (trainer:653) INFO: 70epoch:train:244-270batch: iter_time=1.877e-04, forward_time=0.035, loss=3.266, loss_att=1.557, loss_ctc=4.976, acc=0.941, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.622e-04, train_time=0.102 -[v016] 2022-01-31 05:56:19,517 (trainer:653) INFO: 70epoch:train:271-297batch: iter_time=1.136e-04, forward_time=0.034, loss=2.999, loss_att=1.483, loss_ctc=4.515, acc=0.944, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.622e-04, train_time=0.095 -[v016] 2022-01-31 05:56:22,231 (trainer:653) INFO: 70epoch:train:298-324batch: iter_time=1.890e-04, forward_time=0.034, loss=2.826, loss_att=1.386, loss_ctc=4.265, acc=0.948, backward_time=0.022, optim_step_time=0.024, optim0_lr0=1.621e-04, train_time=0.100 -[v016] 2022-01-31 05:56:25,200 (trainer:653) INFO: 70epoch:train:325-351batch: iter_time=0.013, forward_time=0.034, loss=3.312, loss_att=1.676, loss_ctc=4.948, acc=0.931, backward_time=0.023, optim_step_time=0.021, optim0_lr0=1.620e-04, train_time=0.110 -[v016] 2022-01-31 05:56:27,878 (trainer:653) INFO: 70epoch:train:352-378batch: iter_time=1.321e-04, forward_time=0.034, loss=3.211, loss_att=1.706, loss_ctc=4.716, acc=0.921, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.620e-04, train_time=0.099 -[v016] 2022-01-31 05:56:30,641 (trainer:653) INFO: 70epoch:train:379-405batch: iter_time=2.460e-04, forward_time=0.035, loss=3.793, loss_att=1.817, loss_ctc=5.768, acc=0.929, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.619e-04, train_time=0.102 -[v016] 2022-01-31 05:56:33,304 (trainer:653) INFO: 70epoch:train:406-432batch: iter_time=1.087e-04, forward_time=0.037, loss=2.964, loss_att=1.547, loss_ctc=4.381, acc=0.932, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.619e-04, train_time=0.098 -[v016] 2022-01-31 05:56:35,832 (trainer:653) INFO: 70epoch:train:433-459batch: iter_time=1.177e-04, forward_time=0.033, loss=2.894, loss_att=1.610, loss_ctc=4.178, acc=0.925, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.618e-04, train_time=0.094 -[v016] 2022-01-31 05:56:38,540 (trainer:653) INFO: 70epoch:train:460-486batch: iter_time=1.834e-04, forward_time=0.034, loss=3.079, loss_att=1.527, loss_ctc=4.631, acc=0.940, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.618e-04, train_time=0.100 -[v016] 2022-01-31 05:56:41,153 (trainer:653) INFO: 70epoch:train:487-513batch: iter_time=1.184e-04, forward_time=0.034, loss=2.966, loss_att=1.493, loss_ctc=4.439, acc=0.944, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.617e-04, train_time=0.097 -[v016] 2022-01-31 05:56:43,939 (trainer:653) INFO: 70epoch:train:514-540batch: iter_time=1.890e-04, forward_time=0.035, loss=3.354, loss_att=1.725, loss_ctc=4.982, acc=0.926, backward_time=0.022, optim_step_time=0.025, optim0_lr0=1.616e-04, train_time=0.103 -[v016] 2022-01-31 05:57:19,928 (trainer:328) INFO: 70epoch results: [train] iter_time=0.001, forward_time=0.038, loss=3.109, loss_att=1.559, loss_ctc=4.659, acc=0.936, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.622e-04, train_time=0.106, time=58.41 seconds, total_count=38290, gpu_max_cached_mem_GB=5.824, [valid] loss=6.426, loss_att=5.182, loss_ctc=7.671, acc=0.899, cer=0.106, wer=0.414, cer_ctc=0.163, time=6.26 seconds, total_count=12460, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.97 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 05:57:22,317 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 05:57:22,322 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/64epoch.pth -[v016] 2022-01-31 05:57:22,325 (trainer:261) INFO: 71/200epoch started. Estimated time to finish: 4 hours, 43 minutes and 48.76 seconds -[v016] 2022-01-31 05:57:25,186 (trainer:653) INFO: 71epoch:train:1-27batch: iter_time=0.004, forward_time=0.037, loss=2.990, loss_att=1.438, loss_ctc=4.541, acc=0.940, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.616e-04, train_time=0.105 -[v016] 2022-01-31 05:57:28,091 (trainer:653) INFO: 71epoch:train:28-54batch: iter_time=0.001, forward_time=0.036, loss=3.687, loss_att=1.693, loss_ctc=5.681, acc=0.940, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.615e-04, train_time=0.107 -[v016] 2022-01-31 05:57:30,713 (trainer:653) INFO: 71epoch:train:55-81batch: iter_time=1.281e-04, forward_time=0.034, loss=3.175, loss_att=1.513, loss_ctc=4.838, acc=0.941, backward_time=0.023, optim_step_time=0.021, optim0_lr0=1.615e-04, train_time=0.097 -[v016] 2022-01-31 05:57:33,473 (trainer:653) INFO: 71epoch:train:82-108batch: iter_time=1.496e-04, forward_time=0.035, loss=2.811, loss_att=1.466, loss_ctc=4.156, acc=0.938, backward_time=0.023, optim_step_time=0.024, optim0_lr0=1.614e-04, train_time=0.102 -[v016] 2022-01-31 05:57:36,170 (trainer:653) INFO: 71epoch:train:109-135batch: iter_time=2.680e-04, forward_time=0.037, loss=2.625, loss_att=1.410, loss_ctc=3.840, acc=0.935, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.613e-04, train_time=0.100 -[v016] 2022-01-31 05:57:38,730 (trainer:653) INFO: 71epoch:train:136-162batch: iter_time=1.025e-04, forward_time=0.033, loss=2.695, loss_att=1.391, loss_ctc=3.999, acc=0.940, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.613e-04, train_time=0.095 -[v016] 2022-01-31 05:57:41,495 (trainer:653) INFO: 71epoch:train:163-189batch: iter_time=3.141e-04, forward_time=0.035, loss=3.444, loss_att=1.585, loss_ctc=5.303, acc=0.940, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.612e-04, train_time=0.102 -[v016] 2022-01-31 05:57:44,106 (trainer:653) INFO: 71epoch:train:190-216batch: iter_time=1.305e-04, forward_time=0.034, loss=2.812, loss_att=1.417, loss_ctc=4.207, acc=0.943, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.612e-04, train_time=0.097 -[v016] 2022-01-31 05:57:46,790 (trainer:653) INFO: 71epoch:train:217-243batch: iter_time=1.174e-04, forward_time=0.037, loss=3.004, loss_att=1.492, loss_ctc=4.516, acc=0.937, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.611e-04, train_time=0.099 -[v016] 2022-01-31 05:57:49,514 (trainer:653) INFO: 71epoch:train:244-270batch: iter_time=2.022e-04, forward_time=0.035, loss=3.028, loss_att=1.493, loss_ctc=4.563, acc=0.937, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.611e-04, train_time=0.101 -[v016] 2022-01-31 05:57:52,161 (trainer:653) INFO: 71epoch:train:271-297batch: iter_time=1.192e-04, forward_time=0.035, loss=3.362, loss_att=1.641, loss_ctc=5.084, acc=0.945, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.610e-04, train_time=0.098 -[v016] 2022-01-31 05:57:54,842 (trainer:653) INFO: 71epoch:train:298-324batch: iter_time=2.401e-04, forward_time=0.034, loss=3.297, loss_att=1.637, loss_ctc=4.958, acc=0.934, backward_time=0.022, optim_step_time=0.024, optim0_lr0=1.610e-04, train_time=0.099 -[v016] 2022-01-31 05:57:57,570 (trainer:653) INFO: 71epoch:train:325-351batch: iter_time=0.004, forward_time=0.034, loss=2.936, loss_att=1.414, loss_ctc=4.459, acc=0.943, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.609e-04, train_time=0.101 -[v016] 2022-01-31 05:58:00,548 (trainer:653) INFO: 71epoch:train:352-378batch: iter_time=0.007, forward_time=0.035, loss=2.802, loss_att=1.381, loss_ctc=4.222, acc=0.947, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.608e-04, train_time=0.110 -[v016] 2022-01-31 05:58:03,197 (trainer:653) INFO: 71epoch:train:379-405batch: iter_time=1.231e-04, forward_time=0.035, loss=3.412, loss_att=1.708, loss_ctc=5.115, acc=0.926, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.608e-04, train_time=0.098 -[v016] 2022-01-31 05:58:05,992 (trainer:653) INFO: 71epoch:train:406-432batch: iter_time=1.870e-04, forward_time=0.035, loss=3.355, loss_att=1.588, loss_ctc=5.122, acc=0.941, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.607e-04, train_time=0.103 -[v016] 2022-01-31 05:58:08,805 (trainer:653) INFO: 71epoch:train:433-459batch: iter_time=2.288e-04, forward_time=0.036, loss=3.261, loss_att=1.578, loss_ctc=4.944, acc=0.931, backward_time=0.023, optim_step_time=0.024, optim0_lr0=1.607e-04, train_time=0.104 -[v016] 2022-01-31 05:58:11,449 (trainer:653) INFO: 71epoch:train:460-486batch: iter_time=1.218e-04, forward_time=0.035, loss=2.675, loss_att=1.454, loss_ctc=3.895, acc=0.939, backward_time=0.023, optim_step_time=0.021, optim0_lr0=1.606e-04, train_time=0.098 -[v016] 2022-01-31 05:58:14,131 (trainer:653) INFO: 71epoch:train:487-513batch: iter_time=1.303e-04, forward_time=0.035, loss=2.947, loss_att=1.472, loss_ctc=4.422, acc=0.938, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.606e-04, train_time=0.099 -[v016] 2022-01-31 05:58:16,763 (trainer:653) INFO: 71epoch:train:514-540batch: iter_time=1.231e-04, forward_time=0.034, loss=3.001, loss_att=1.509, loss_ctc=4.493, acc=0.934, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.605e-04, train_time=0.097 -[v016] 2022-01-31 05:58:52,918 (trainer:328) INFO: 71epoch results: [train] iter_time=9.480e-04, forward_time=0.035, loss=3.070, loss_att=1.515, loss_ctc=4.624, acc=0.938, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.610e-04, train_time=0.101, time=55.19 seconds, total_count=38837, gpu_max_cached_mem_GB=5.824, [valid] loss=6.511, loss_att=5.233, loss_ctc=7.789, acc=0.899, cer=0.106, wer=0.410, cer_ctc=0.161, time=5.74 seconds, total_count=12638, gpu_max_cached_mem_GB=5.824, [att_plot] time=29.66 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 05:58:55,398 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 05:58:55,406 (trainer:261) INFO: 72/200epoch started. Estimated time to finish: 4 hours, 40 minutes and 1.88 seconds -[v016] 2022-01-31 05:58:58,523 (trainer:653) INFO: 72epoch:train:1-27batch: iter_time=0.014, forward_time=0.034, loss=3.198, loss_att=1.490, loss_ctc=4.905, acc=0.945, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.604e-04, train_time=0.115 -[v016] 2022-01-31 05:59:01,625 (trainer:653) INFO: 72epoch:train:28-54batch: iter_time=0.017, forward_time=0.033, loss=2.470, loss_att=1.310, loss_ctc=3.630, acc=0.943, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.604e-04, train_time=0.115 -[v016] 2022-01-31 05:59:04,411 (trainer:653) INFO: 72epoch:train:55-81batch: iter_time=0.004, forward_time=0.034, loss=2.953, loss_att=1.548, loss_ctc=4.358, acc=0.933, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.603e-04, train_time=0.103 -[v016] 2022-01-31 05:59:06,988 (trainer:653) INFO: 72epoch:train:82-108batch: iter_time=9.337e-05, forward_time=0.032, loss=2.835, loss_att=1.479, loss_ctc=4.192, acc=0.940, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.603e-04, train_time=0.095 -[v016] 2022-01-31 05:59:09,566 (trainer:653) INFO: 72epoch:train:109-135batch: iter_time=9.078e-05, forward_time=0.033, loss=2.679, loss_att=1.414, loss_ctc=3.943, acc=0.937, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.602e-04, train_time=0.095 -[v016] 2022-01-31 05:59:12,217 (trainer:653) INFO: 72epoch:train:136-162batch: iter_time=1.309e-04, forward_time=0.034, loss=3.028, loss_att=1.459, loss_ctc=4.598, acc=0.939, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.602e-04, train_time=0.098 -[v016] 2022-01-31 05:59:14,598 (trainer:653) INFO: 72epoch:train:163-189batch: iter_time=7.628e-05, forward_time=0.030, loss=2.712, loss_att=1.467, loss_ctc=3.958, acc=0.935, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.601e-04, train_time=0.088 -[v016] 2022-01-31 05:59:17,193 (trainer:653) INFO: 72epoch:train:190-216batch: iter_time=0.001, forward_time=0.033, loss=3.214, loss_att=1.425, loss_ctc=5.003, acc=0.947, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.600e-04, train_time=0.096 -[v016] 2022-01-31 05:59:19,871 (trainer:653) INFO: 72epoch:train:217-243batch: iter_time=0.003, forward_time=0.033, loss=3.474, loss_att=1.648, loss_ctc=5.301, acc=0.934, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.600e-04, train_time=0.099 -[v016] 2022-01-31 05:59:22,503 (trainer:653) INFO: 72epoch:train:244-270batch: iter_time=0.002, forward_time=0.033, loss=2.895, loss_att=1.405, loss_ctc=4.385, acc=0.942, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.599e-04, train_time=0.097 -[v016] 2022-01-31 05:59:25,186 (trainer:653) INFO: 72epoch:train:271-297batch: iter_time=1.283e-04, forward_time=0.033, loss=3.012, loss_att=1.531, loss_ctc=4.493, acc=0.935, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.599e-04, train_time=0.099 -[v016] 2022-01-31 05:59:27,947 (trainer:653) INFO: 72epoch:train:298-324batch: iter_time=3.129e-04, forward_time=0.034, loss=2.391, loss_att=1.221, loss_ctc=3.560, acc=0.944, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.598e-04, train_time=0.102 -[v016] 2022-01-31 05:59:31,648 (trainer:653) INFO: 72epoch:train:325-351batch: iter_time=0.039, forward_time=0.033, loss=2.916, loss_att=1.526, loss_ctc=4.306, acc=0.936, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.598e-04, train_time=0.137 -[v016] 2022-01-31 05:59:34,299 (trainer:653) INFO: 72epoch:train:352-378batch: iter_time=1.036e-04, forward_time=0.033, loss=2.292, loss_att=1.192, loss_ctc=3.391, acc=0.948, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.597e-04, train_time=0.098 -[v016] 2022-01-31 05:59:36,978 (trainer:653) INFO: 72epoch:train:379-405batch: iter_time=1.008e-04, forward_time=0.034, loss=2.997, loss_att=1.489, loss_ctc=4.506, acc=0.938, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.597e-04, train_time=0.099 -[v016] 2022-01-31 05:59:39,690 (trainer:653) INFO: 72epoch:train:406-432batch: iter_time=1.105e-04, forward_time=0.034, loss=3.328, loss_att=1.572, loss_ctc=5.084, acc=0.938, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.596e-04, train_time=0.100 -[v016] 2022-01-31 05:59:42,532 (trainer:653) INFO: 72epoch:train:433-459batch: iter_time=0.005, forward_time=0.034, loss=3.422, loss_att=1.621, loss_ctc=5.222, acc=0.935, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.595e-04, train_time=0.105 -[v016] 2022-01-31 05:59:45,192 (trainer:653) INFO: 72epoch:train:460-486batch: iter_time=1.272e-04, forward_time=0.033, loss=3.379, loss_att=1.581, loss_ctc=5.178, acc=0.936, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.595e-04, train_time=0.098 -[v016] 2022-01-31 05:59:47,843 (trainer:653) INFO: 72epoch:train:487-513batch: iter_time=1.195e-04, forward_time=0.033, loss=2.859, loss_att=1.464, loss_ctc=4.255, acc=0.938, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.594e-04, train_time=0.098 -[v016] 2022-01-31 05:59:50,532 (trainer:653) INFO: 72epoch:train:514-540batch: iter_time=4.100e-04, forward_time=0.034, loss=3.392, loss_att=1.624, loss_ctc=5.161, acc=0.938, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.594e-04, train_time=0.099 -[v016] 2022-01-31 06:00:27,052 (trainer:328) INFO: 72epoch results: [train] iter_time=0.004, forward_time=0.033, loss=2.989, loss_att=1.481, loss_ctc=4.498, acc=0.939, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.599e-04, train_time=0.102, time=55.98 seconds, total_count=39384, gpu_max_cached_mem_GB=5.824, [valid] loss=6.548, loss_att=5.282, loss_ctc=7.814, acc=0.901, cer=0.104, wer=0.417, cer_ctc=0.161, time=7.01 seconds, total_count=12816, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.65 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:00:29,598 (trainer:375) INFO: The best model has been updated: train.loss, train.acc, valid.acc -[v016] 2022-01-31 06:00:29,604 (trainer:261) INFO: 73/200epoch started. Estimated time to finish: 4 hours, 36 minutes and 22.9 seconds -[v016] 2022-01-31 06:00:32,891 (trainer:653) INFO: 73epoch:train:1-27batch: iter_time=0.021, forward_time=0.033, loss=2.825, loss_att=1.362, loss_ctc=4.287, acc=0.938, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.593e-04, train_time=0.118 -[v016] 2022-01-31 06:00:35,443 (trainer:653) INFO: 73epoch:train:28-54batch: iter_time=0.003, forward_time=0.031, loss=2.897, loss_att=1.470, loss_ctc=4.324, acc=0.940, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.593e-04, train_time=0.094 -[v016] 2022-01-31 06:00:37,937 (trainer:653) INFO: 73epoch:train:55-81batch: iter_time=7.764e-05, forward_time=0.031, loss=3.072, loss_att=1.376, loss_ctc=4.769, acc=0.944, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.592e-04, train_time=0.092 -[v016] 2022-01-31 06:00:40,441 (trainer:653) INFO: 73epoch:train:82-108batch: iter_time=7.592e-05, forward_time=0.031, loss=2.862, loss_att=1.376, loss_ctc=4.347, acc=0.941, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.592e-04, train_time=0.093 -[v016] 2022-01-31 06:00:42,821 (trainer:653) INFO: 73epoch:train:109-135batch: iter_time=7.821e-05, forward_time=0.030, loss=2.534, loss_att=1.278, loss_ctc=3.790, acc=0.939, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.591e-04, train_time=0.088 -[v016] 2022-01-31 06:00:45,224 (trainer:653) INFO: 73epoch:train:136-162batch: iter_time=7.981e-05, forward_time=0.030, loss=3.086, loss_att=1.462, loss_ctc=4.710, acc=0.941, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.590e-04, train_time=0.089 -[v016] 2022-01-31 06:00:47,812 (trainer:653) INFO: 73epoch:train:163-189batch: iter_time=9.041e-05, forward_time=0.033, loss=3.466, loss_att=1.570, loss_ctc=5.362, acc=0.940, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.590e-04, train_time=0.096 -[v016] 2022-01-31 06:00:50,285 (trainer:653) INFO: 73epoch:train:190-216batch: iter_time=8.856e-05, forward_time=0.031, loss=3.026, loss_att=1.434, loss_ctc=4.619, acc=0.947, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.589e-04, train_time=0.091 -[v016] 2022-01-31 06:00:52,671 (trainer:653) INFO: 73epoch:train:217-243batch: iter_time=8.441e-05, forward_time=0.030, loss=2.757, loss_att=1.412, loss_ctc=4.103, acc=0.939, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.589e-04, train_time=0.088 -[v016] 2022-01-31 06:00:55,179 (trainer:653) INFO: 73epoch:train:244-270batch: iter_time=8.115e-05, forward_time=0.031, loss=3.308, loss_att=1.595, loss_ctc=5.021, acc=0.938, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.588e-04, train_time=0.093 -[v016] 2022-01-31 06:00:57,737 (trainer:653) INFO: 73epoch:train:271-297batch: iter_time=8.180e-05, forward_time=0.030, loss=2.786, loss_att=1.433, loss_ctc=4.139, acc=0.938, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.588e-04, train_time=0.095 -[v016] 2022-01-31 06:01:00,255 (trainer:653) INFO: 73epoch:train:298-324batch: iter_time=8.792e-05, forward_time=0.032, loss=3.165, loss_att=1.507, loss_ctc=4.824, acc=0.942, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.587e-04, train_time=0.093 -[v016] 2022-01-31 06:01:02,880 (trainer:653) INFO: 73epoch:train:325-351batch: iter_time=0.003, forward_time=0.033, loss=3.332, loss_att=1.475, loss_ctc=5.188, acc=0.943, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.587e-04, train_time=0.097 -[v016] 2022-01-31 06:01:05,666 (trainer:653) INFO: 73epoch:train:352-378batch: iter_time=0.012, forward_time=0.031, loss=2.684, loss_att=1.301, loss_ctc=4.068, acc=0.945, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.586e-04, train_time=0.103 -[v016] 2022-01-31 06:01:08,194 (trainer:653) INFO: 73epoch:train:379-405batch: iter_time=8.858e-05, forward_time=0.032, loss=3.074, loss_att=1.577, loss_ctc=4.571, acc=0.933, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.586e-04, train_time=0.093 -[v016] 2022-01-31 06:01:10,710 (trainer:653) INFO: 73epoch:train:406-432batch: iter_time=8.898e-05, forward_time=0.032, loss=2.835, loss_att=1.407, loss_ctc=4.263, acc=0.941, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.585e-04, train_time=0.093 -[v016] 2022-01-31 06:01:13,357 (trainer:653) INFO: 73epoch:train:433-459batch: iter_time=0.008, forward_time=0.031, loss=2.768, loss_att=1.479, loss_ctc=4.057, acc=0.928, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.584e-04, train_time=0.098 -[v016] 2022-01-31 06:01:15,763 (trainer:653) INFO: 73epoch:train:460-486batch: iter_time=8.599e-05, forward_time=0.030, loss=2.356, loss_att=1.157, loss_ctc=3.555, acc=0.947, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.584e-04, train_time=0.089 -[v016] 2022-01-31 06:01:20,597 (trainer:653) INFO: 73epoch:train:487-513batch: iter_time=9.743e-05, forward_time=0.061, loss=3.148, loss_att=1.718, loss_ctc=4.578, acc=0.921, backward_time=0.026, optim_step_time=0.029, optim0_lr0=1.583e-04, train_time=0.179 -[v016] 2022-01-31 06:01:23,104 (trainer:653) INFO: 73epoch:train:514-540batch: iter_time=8.695e-05, forward_time=0.032, loss=3.070, loss_att=1.449, loss_ctc=4.691, acc=0.944, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.583e-04, train_time=0.093 -[v016] 2022-01-31 06:01:58,620 (trainer:328) INFO: 73epoch results: [train] iter_time=0.002, forward_time=0.033, loss=2.943, loss_att=1.438, loss_ctc=4.448, acc=0.940, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.588e-04, train_time=0.098, time=54.17 seconds, total_count=39931, gpu_max_cached_mem_GB=5.824, [valid] loss=6.750, loss_att=5.404, loss_ctc=8.095, acc=0.899, cer=0.107, wer=0.406, cer_ctc=0.169, time=7.31 seconds, total_count=12994, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.54 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:02:01,001 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:02:01,006 (trainer:261) INFO: 74/200epoch started. Estimated time to finish: 4 hours, 32 minutes and 41.93 seconds -[v016] 2022-01-31 06:02:03,738 (trainer:653) INFO: 74epoch:train:1-27batch: iter_time=0.009, forward_time=0.031, loss=2.519, loss_att=1.288, loss_ctc=3.750, acc=0.942, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.582e-04, train_time=0.101 -[v016] 2022-01-31 06:02:06,467 (trainer:653) INFO: 74epoch:train:28-54batch: iter_time=0.009, forward_time=0.032, loss=3.284, loss_att=1.471, loss_ctc=5.098, acc=0.947, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.582e-04, train_time=0.101 -[v016] 2022-01-31 06:02:08,938 (trainer:653) INFO: 74epoch:train:55-81batch: iter_time=8.800e-05, forward_time=0.032, loss=2.970, loss_att=1.473, loss_ctc=4.468, acc=0.938, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.581e-04, train_time=0.091 -[v016] 2022-01-31 06:02:11,335 (trainer:653) INFO: 74epoch:train:82-108batch: iter_time=7.798e-05, forward_time=0.030, loss=2.701, loss_att=1.401, loss_ctc=4.002, acc=0.937, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.581e-04, train_time=0.089 -[v016] 2022-01-31 06:02:13,763 (trainer:653) INFO: 74epoch:train:109-135batch: iter_time=7.685e-05, forward_time=0.031, loss=2.805, loss_att=1.313, loss_ctc=4.296, acc=0.945, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.580e-04, train_time=0.090 -[v016] 2022-01-31 06:02:16,248 (trainer:653) INFO: 74epoch:train:136-162batch: iter_time=7.729e-05, forward_time=0.032, loss=2.841, loss_att=1.393, loss_ctc=4.289, acc=0.939, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.580e-04, train_time=0.092 -[v016] 2022-01-31 06:02:18,593 (trainer:653) INFO: 74epoch:train:163-189batch: iter_time=7.467e-05, forward_time=0.030, loss=2.588, loss_att=1.278, loss_ctc=3.898, acc=0.941, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.579e-04, train_time=0.087 -[v016] 2022-01-31 06:02:21,127 (trainer:653) INFO: 74epoch:train:190-216batch: iter_time=7.630e-05, forward_time=0.034, loss=3.122, loss_att=1.457, loss_ctc=4.787, acc=0.942, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.578e-04, train_time=0.094 -[v016] 2022-01-31 06:02:23,719 (trainer:653) INFO: 74epoch:train:217-243batch: iter_time=8.179e-05, forward_time=0.033, loss=3.524, loss_att=1.578, loss_ctc=5.470, acc=0.943, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.578e-04, train_time=0.096 -[v016] 2022-01-31 06:02:26,215 (trainer:653) INFO: 74epoch:train:244-270batch: iter_time=8.281e-05, forward_time=0.032, loss=3.089, loss_att=1.489, loss_ctc=4.688, acc=0.936, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.577e-04, train_time=0.092 -[v016] 2022-01-31 06:02:28,639 (trainer:653) INFO: 74epoch:train:271-297batch: iter_time=9.269e-05, forward_time=0.031, loss=2.524, loss_att=1.295, loss_ctc=3.753, acc=0.947, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.577e-04, train_time=0.090 -[v016] 2022-01-31 06:02:31,230 (trainer:653) INFO: 74epoch:train:298-324batch: iter_time=9.123e-05, forward_time=0.033, loss=3.359, loss_att=1.587, loss_ctc=5.131, acc=0.939, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.576e-04, train_time=0.096 -[v016] 2022-01-31 06:02:33,759 (trainer:653) INFO: 74epoch:train:325-351batch: iter_time=8.567e-05, forward_time=0.032, loss=2.930, loss_att=1.401, loss_ctc=4.459, acc=0.944, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.576e-04, train_time=0.093 -[v016] 2022-01-31 06:02:36,189 (trainer:653) INFO: 74epoch:train:352-378batch: iter_time=8.014e-05, forward_time=0.031, loss=2.587, loss_att=1.260, loss_ctc=3.914, acc=0.944, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.575e-04, train_time=0.090 -[v016] 2022-01-31 06:02:38,689 (trainer:653) INFO: 74epoch:train:379-405batch: iter_time=0.001, forward_time=0.031, loss=2.462, loss_att=1.315, loss_ctc=3.610, acc=0.941, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.575e-04, train_time=0.092 -[v016] 2022-01-31 06:02:41,306 (trainer:653) INFO: 74epoch:train:406-432batch: iter_time=8.331e-05, forward_time=0.033, loss=3.391, loss_att=1.564, loss_ctc=5.218, acc=0.941, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.574e-04, train_time=0.097 -[v016] 2022-01-31 06:02:43,699 (trainer:653) INFO: 74epoch:train:433-459batch: iter_time=7.777e-05, forward_time=0.030, loss=2.532, loss_att=1.327, loss_ctc=3.738, acc=0.942, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.574e-04, train_time=0.088 -[v016] 2022-01-31 06:02:46,206 (trainer:653) INFO: 74epoch:train:460-486batch: iter_time=7.842e-05, forward_time=0.032, loss=3.141, loss_att=1.575, loss_ctc=4.708, acc=0.930, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.573e-04, train_time=0.093 -[v016] 2022-01-31 06:02:48,839 (trainer:653) INFO: 74epoch:train:487-513batch: iter_time=7.960e-05, forward_time=0.031, loss=2.890, loss_att=1.464, loss_ctc=4.317, acc=0.935, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.573e-04, train_time=0.097 -[v016] 2022-01-31 06:02:51,292 (trainer:653) INFO: 74epoch:train:514-540batch: iter_time=7.907e-05, forward_time=0.031, loss=2.793, loss_att=1.394, loss_ctc=4.192, acc=0.937, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.572e-04, train_time=0.091 -[v016] 2022-01-31 06:03:25,444 (trainer:328) INFO: 74epoch results: [train] iter_time=0.001, forward_time=0.032, loss=2.895, loss_att=1.412, loss_ctc=4.377, acc=0.941, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.577e-04, train_time=0.093, time=50.97 seconds, total_count=40478, gpu_max_cached_mem_GB=5.824, [valid] loss=6.560, loss_att=5.319, loss_ctc=7.801, acc=0.899, cer=0.107, wer=0.415, cer_ctc=0.156, time=5.91 seconds, total_count=13172, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.56 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:03:27,552 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:03:27,557 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/69epoch.pth -[v016] 2022-01-31 06:03:27,557 (trainer:261) INFO: 75/200epoch started. Estimated time to finish: 4 hours, 28 minutes and 54.43 seconds -[v016] 2022-01-31 06:03:30,212 (trainer:653) INFO: 75epoch:train:1-27batch: iter_time=0.005, forward_time=0.032, loss=2.842, loss_att=1.439, loss_ctc=4.246, acc=0.940, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.571e-04, train_time=0.098 -[v016] 2022-01-31 06:03:32,678 (trainer:653) INFO: 75epoch:train:28-54batch: iter_time=8.895e-05, forward_time=0.031, loss=2.892, loss_att=1.377, loss_ctc=4.407, acc=0.944, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.571e-04, train_time=0.091 -[v016] 2022-01-31 06:03:35,173 (trainer:653) INFO: 75epoch:train:55-81batch: iter_time=8.146e-05, forward_time=0.032, loss=2.699, loss_att=1.235, loss_ctc=4.162, acc=0.949, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.570e-04, train_time=0.092 -[v016] 2022-01-31 06:03:37,577 (trainer:653) INFO: 75epoch:train:82-108batch: iter_time=7.742e-05, forward_time=0.031, loss=2.301, loss_att=1.117, loss_ctc=3.484, acc=0.950, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.570e-04, train_time=0.089 -[v016] 2022-01-31 06:03:40,352 (trainer:653) INFO: 75epoch:train:109-135batch: iter_time=0.013, forward_time=0.031, loss=3.053, loss_att=1.516, loss_ctc=4.590, acc=0.935, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.569e-04, train_time=0.103 -[v016] 2022-01-31 06:03:42,895 (trainer:653) INFO: 75epoch:train:136-162batch: iter_time=8.396e-05, forward_time=0.033, loss=2.786, loss_att=1.386, loss_ctc=4.185, acc=0.943, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.569e-04, train_time=0.094 -[v016] 2022-01-31 06:03:45,408 (trainer:653) INFO: 75epoch:train:163-189batch: iter_time=8.236e-05, forward_time=0.032, loss=2.562, loss_att=1.189, loss_ctc=3.936, acc=0.952, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.568e-04, train_time=0.093 -[v016] 2022-01-31 06:03:47,915 (trainer:653) INFO: 75epoch:train:190-216batch: iter_time=7.706e-05, forward_time=0.032, loss=2.952, loss_att=1.443, loss_ctc=4.461, acc=0.948, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.568e-04, train_time=0.093 -[v016] 2022-01-31 06:03:50,368 (trainer:653) INFO: 75epoch:train:217-243batch: iter_time=7.618e-05, forward_time=0.032, loss=2.845, loss_att=1.392, loss_ctc=4.297, acc=0.945, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.567e-04, train_time=0.091 -[v016] 2022-01-31 06:03:52,791 (trainer:653) INFO: 75epoch:train:244-270batch: iter_time=8.633e-05, forward_time=0.031, loss=3.100, loss_att=1.569, loss_ctc=4.630, acc=0.933, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.567e-04, train_time=0.090 -[v016] 2022-01-31 06:03:55,259 (trainer:653) INFO: 75epoch:train:271-297batch: iter_time=8.161e-05, forward_time=0.032, loss=2.815, loss_att=1.371, loss_ctc=4.259, acc=0.937, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.566e-04, train_time=0.091 -[v016] 2022-01-31 06:03:57,699 (trainer:653) INFO: 75epoch:train:298-324batch: iter_time=8.072e-05, forward_time=0.031, loss=2.453, loss_att=1.245, loss_ctc=3.660, acc=0.945, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.566e-04, train_time=0.090 -[v016] 2022-01-31 06:04:00,166 (trainer:653) INFO: 75epoch:train:325-351batch: iter_time=8.195e-05, forward_time=0.032, loss=2.672, loss_att=1.356, loss_ctc=3.988, acc=0.937, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.565e-04, train_time=0.091 -[v016] 2022-01-31 06:04:02,676 (trainer:653) INFO: 75epoch:train:352-378batch: iter_time=8.143e-05, forward_time=0.032, loss=3.147, loss_att=1.456, loss_ctc=4.838, acc=0.945, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.565e-04, train_time=0.093 -[v016] 2022-01-31 06:04:05,127 (trainer:653) INFO: 75epoch:train:379-405batch: iter_time=7.719e-05, forward_time=0.031, loss=2.675, loss_att=1.318, loss_ctc=4.033, acc=0.942, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.564e-04, train_time=0.091 -[v016] 2022-01-31 06:04:07,531 (trainer:653) INFO: 75epoch:train:406-432batch: iter_time=7.530e-05, forward_time=0.030, loss=2.509, loss_att=1.285, loss_ctc=3.733, acc=0.945, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.564e-04, train_time=0.089 -[v016] 2022-01-31 06:04:10,082 (trainer:653) INFO: 75epoch:train:433-459batch: iter_time=7.764e-05, forward_time=0.033, loss=3.080, loss_att=1.487, loss_ctc=4.672, acc=0.942, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.563e-04, train_time=0.094 -[v016] 2022-01-31 06:04:12,835 (trainer:653) INFO: 75epoch:train:460-486batch: iter_time=0.009, forward_time=0.032, loss=2.691, loss_att=1.239, loss_ctc=4.143, acc=0.950, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.563e-04, train_time=0.102 -[v016] 2022-01-31 06:04:15,280 (trainer:653) INFO: 75epoch:train:487-513batch: iter_time=7.651e-05, forward_time=0.031, loss=2.924, loss_att=1.383, loss_ctc=4.465, acc=0.945, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.562e-04, train_time=0.090 -[v016] 2022-01-31 06:04:17,718 (trainer:653) INFO: 75epoch:train:514-540batch: iter_time=8.140e-05, forward_time=0.032, loss=2.725, loss_att=1.440, loss_ctc=4.011, acc=0.934, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.562e-04, train_time=0.090 -[v016] 2022-01-31 06:04:52,141 (trainer:328) INFO: 75epoch results: [train] iter_time=0.001, forward_time=0.032, loss=2.803, loss_att=1.368, loss_ctc=4.237, acc=0.943, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.566e-04, train_time=0.093, time=50.93 seconds, total_count=41025, gpu_max_cached_mem_GB=5.824, [valid] loss=6.755, loss_att=5.418, loss_ctc=8.093, acc=0.899, cer=0.103, wer=0.410, cer_ctc=0.159, time=5.92 seconds, total_count=13350, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.74 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:04:54,178 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:04:54,183 (trainer:261) INFO: 76/200epoch started. Estimated time to finish: 4 hours, 25 minutes and 12.24 seconds -[v016] 2022-01-31 06:04:57,446 (trainer:653) INFO: 76epoch:train:1-27batch: iter_time=0.021, forward_time=0.034, loss=3.031, loss_att=1.358, loss_ctc=4.705, acc=0.951, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.561e-04, train_time=0.120 -[v016] 2022-01-31 06:05:00,017 (trainer:653) INFO: 76epoch:train:28-54batch: iter_time=8.246e-05, forward_time=0.033, loss=3.069, loss_att=1.466, loss_ctc=4.671, acc=0.946, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.560e-04, train_time=0.095 -[v016] 2022-01-31 06:05:02,495 (trainer:653) INFO: 76epoch:train:55-81batch: iter_time=8.651e-05, forward_time=0.032, loss=2.713, loss_att=1.324, loss_ctc=4.102, acc=0.948, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.560e-04, train_time=0.092 -[v016] 2022-01-31 06:05:05,192 (trainer:653) INFO: 76epoch:train:82-108batch: iter_time=8.905e-05, forward_time=0.035, loss=3.531, loss_att=1.517, loss_ctc=5.545, acc=0.942, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.559e-04, train_time=0.100 -[v016] 2022-01-31 06:05:07,664 (trainer:653) INFO: 76epoch:train:109-135batch: iter_time=7.558e-05, forward_time=0.031, loss=2.734, loss_att=1.325, loss_ctc=4.143, acc=0.943, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.559e-04, train_time=0.091 -[v016] 2022-01-31 06:05:10,209 (trainer:653) INFO: 76epoch:train:136-162batch: iter_time=7.753e-05, forward_time=0.032, loss=2.894, loss_att=1.310, loss_ctc=4.478, acc=0.950, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.558e-04, train_time=0.094 -[v016] 2022-01-31 06:05:12,607 (trainer:653) INFO: 76epoch:train:163-189batch: iter_time=7.719e-05, forward_time=0.030, loss=2.528, loss_att=1.261, loss_ctc=3.795, acc=0.941, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.558e-04, train_time=0.089 -[v016] 2022-01-31 06:05:15,110 (trainer:653) INFO: 76epoch:train:190-216batch: iter_time=0.003, forward_time=0.031, loss=2.739, loss_att=1.446, loss_ctc=4.031, acc=0.932, backward_time=0.020, optim_step_time=0.021, optim0_lr0=1.557e-04, train_time=0.092 -[v016] 2022-01-31 06:05:17,538 (trainer:653) INFO: 76epoch:train:217-243batch: iter_time=7.466e-05, forward_time=0.031, loss=2.475, loss_att=1.279, loss_ctc=3.671, acc=0.947, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.557e-04, train_time=0.090 -[v016] 2022-01-31 06:05:19,961 (trainer:653) INFO: 76epoch:train:244-270batch: iter_time=8.399e-05, forward_time=0.031, loss=2.360, loss_att=1.272, loss_ctc=3.448, acc=0.937, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.556e-04, train_time=0.090 -[v016] 2022-01-31 06:05:22,527 (trainer:653) INFO: 76epoch:train:271-297batch: iter_time=9.938e-05, forward_time=0.033, loss=2.882, loss_att=1.352, loss_ctc=4.413, acc=0.953, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.556e-04, train_time=0.095 -[v016] 2022-01-31 06:05:24,915 (trainer:653) INFO: 76epoch:train:298-324batch: iter_time=8.238e-05, forward_time=0.030, loss=3.118, loss_att=1.623, loss_ctc=4.614, acc=0.933, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.555e-04, train_time=0.088 -[v016] 2022-01-31 06:05:27,290 (trainer:653) INFO: 76epoch:train:325-351batch: iter_time=7.425e-05, forward_time=0.030, loss=2.488, loss_att=1.338, loss_ctc=3.638, acc=0.940, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.555e-04, train_time=0.088 -[v016] 2022-01-31 06:05:29,761 (trainer:653) INFO: 76epoch:train:352-378batch: iter_time=7.970e-05, forward_time=0.032, loss=3.136, loss_att=1.529, loss_ctc=4.744, acc=0.936, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.554e-04, train_time=0.091 -[v016] 2022-01-31 06:05:32,281 (trainer:653) INFO: 76epoch:train:379-405batch: iter_time=8.182e-05, forward_time=0.033, loss=3.024, loss_att=1.416, loss_ctc=4.632, acc=0.943, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.554e-04, train_time=0.093 -[v016] 2022-01-31 06:05:34,832 (trainer:653) INFO: 76epoch:train:406-432batch: iter_time=8.398e-05, forward_time=0.033, loss=2.924, loss_att=1.334, loss_ctc=4.514, acc=0.950, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.553e-04, train_time=0.094 -[v016] 2022-01-31 06:05:37,269 (trainer:653) INFO: 76epoch:train:433-459batch: iter_time=8.558e-05, forward_time=0.032, loss=2.505, loss_att=1.274, loss_ctc=3.736, acc=0.943, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.553e-04, train_time=0.090 -[v016] 2022-01-31 06:05:39,655 (trainer:653) INFO: 76epoch:train:460-486batch: iter_time=7.379e-05, forward_time=0.030, loss=2.496, loss_att=1.301, loss_ctc=3.692, acc=0.939, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.552e-04, train_time=0.088 -[v016] 2022-01-31 06:05:42,142 (trainer:653) INFO: 76epoch:train:487-513batch: iter_time=8.224e-05, forward_time=0.032, loss=2.838, loss_att=1.423, loss_ctc=4.253, acc=0.943, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.552e-04, train_time=0.092 -[v016] 2022-01-31 06:05:44,627 (trainer:653) INFO: 76epoch:train:514-540batch: iter_time=8.310e-05, forward_time=0.032, loss=2.827, loss_att=1.314, loss_ctc=4.339, acc=0.952, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.551e-04, train_time=0.092 -[v016] 2022-01-31 06:06:19,373 (trainer:328) INFO: 76epoch results: [train] iter_time=0.001, forward_time=0.032, loss=2.810, loss_att=1.372, loss_ctc=4.247, acc=0.943, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.556e-04, train_time=0.093, time=51.15 seconds, total_count=41572, gpu_max_cached_mem_GB=5.824, [valid] loss=6.627, loss_att=5.366, loss_ctc=7.887, acc=0.899, cer=0.107, wer=0.420, cer_ctc=0.162, time=5.62 seconds, total_count=13528, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.33 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:06:21,444 (trainer:375) INFO: The best model has been updated: train.acc -[v016] 2022-01-31 06:06:21,449 (trainer:261) INFO: 77/200epoch started. Estimated time to finish: 4 hours, 21 minutes and 36.3 seconds -[v016] 2022-01-31 06:06:24,361 (trainer:653) INFO: 77epoch:train:1-27batch: iter_time=0.010, forward_time=0.030, loss=2.239, loss_att=1.127, loss_ctc=3.351, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.551e-04, train_time=0.102 -[v016] 2022-01-31 06:06:26,973 (trainer:653) INFO: 77epoch:train:28-54batch: iter_time=6.429e-04, forward_time=0.033, loss=2.942, loss_att=1.316, loss_ctc=4.568, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.550e-04, train_time=0.097 -[v016] 2022-01-31 06:06:29,563 (trainer:653) INFO: 77epoch:train:55-81batch: iter_time=8.507e-05, forward_time=0.033, loss=2.975, loss_att=1.400, loss_ctc=4.550, acc=0.943, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.550e-04, train_time=0.096 -[v016] 2022-01-31 06:06:32,135 (trainer:653) INFO: 77epoch:train:82-108batch: iter_time=7.676e-04, forward_time=0.032, loss=2.923, loss_att=1.363, loss_ctc=4.482, acc=0.950, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.549e-04, train_time=0.095 -[v016] 2022-01-31 06:06:34,656 (trainer:653) INFO: 77epoch:train:109-135batch: iter_time=0.001, forward_time=0.032, loss=2.706, loss_att=1.308, loss_ctc=4.104, acc=0.945, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.549e-04, train_time=0.093 -[v016] 2022-01-31 06:06:37,128 (trainer:653) INFO: 77epoch:train:136-162batch: iter_time=7.578e-05, forward_time=0.032, loss=2.533, loss_att=1.337, loss_ctc=3.729, acc=0.944, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.548e-04, train_time=0.091 -[v016] 2022-01-31 06:06:39,903 (trainer:653) INFO: 77epoch:train:163-189batch: iter_time=0.009, forward_time=0.032, loss=3.290, loss_att=1.569, loss_ctc=5.010, acc=0.937, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.548e-04, train_time=0.103 -[v016] 2022-01-31 06:06:42,406 (trainer:653) INFO: 77epoch:train:190-216batch: iter_time=8.083e-05, forward_time=0.032, loss=2.579, loss_att=1.288, loss_ctc=3.870, acc=0.948, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.547e-04, train_time=0.092 -[v016] 2022-01-31 06:06:44,874 (trainer:653) INFO: 77epoch:train:217-243batch: iter_time=0.001, forward_time=0.031, loss=2.664, loss_att=1.334, loss_ctc=3.995, acc=0.940, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.547e-04, train_time=0.091 -[v016] 2022-01-31 06:06:47,395 (trainer:653) INFO: 77epoch:train:244-270batch: iter_time=7.704e-05, forward_time=0.032, loss=2.797, loss_att=1.280, loss_ctc=4.315, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.546e-04, train_time=0.093 -[v016] 2022-01-31 06:06:49,868 (trainer:653) INFO: 77epoch:train:271-297batch: iter_time=8.168e-05, forward_time=0.032, loss=2.502, loss_att=1.250, loss_ctc=3.754, acc=0.948, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.546e-04, train_time=0.091 -[v016] 2022-01-31 06:06:52,367 (trainer:653) INFO: 77epoch:train:298-324batch: iter_time=7.716e-05, forward_time=0.032, loss=2.479, loss_att=1.217, loss_ctc=3.741, acc=0.946, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.545e-04, train_time=0.092 -[v016] 2022-01-31 06:06:54,825 (trainer:653) INFO: 77epoch:train:325-351batch: iter_time=7.797e-05, forward_time=0.031, loss=2.428, loss_att=1.234, loss_ctc=3.622, acc=0.939, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.545e-04, train_time=0.091 -[v016] 2022-01-31 06:06:57,336 (trainer:653) INFO: 77epoch:train:352-378batch: iter_time=8.003e-05, forward_time=0.032, loss=2.879, loss_att=1.524, loss_ctc=4.235, acc=0.940, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.544e-04, train_time=0.093 -[v016] 2022-01-31 06:06:59,810 (trainer:653) INFO: 77epoch:train:379-405batch: iter_time=7.869e-05, forward_time=0.032, loss=2.803, loss_att=1.328, loss_ctc=4.278, acc=0.941, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.544e-04, train_time=0.091 -[v016] 2022-01-31 06:07:02,244 (trainer:653) INFO: 77epoch:train:406-432batch: iter_time=7.729e-05, forward_time=0.031, loss=2.888, loss_att=1.378, loss_ctc=4.398, acc=0.939, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.543e-04, train_time=0.090 -[v016] 2022-01-31 06:07:04,746 (trainer:653) INFO: 77epoch:train:433-459batch: iter_time=0.001, forward_time=0.031, loss=2.675, loss_att=1.348, loss_ctc=4.003, acc=0.948, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.543e-04, train_time=0.092 -[v016] 2022-01-31 06:07:07,234 (trainer:653) INFO: 77epoch:train:460-486batch: iter_time=7.357e-05, forward_time=0.032, loss=2.467, loss_att=1.235, loss_ctc=3.698, acc=0.947, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.542e-04, train_time=0.092 -[v016] 2022-01-31 06:07:09,860 (trainer:653) INFO: 77epoch:train:487-513batch: iter_time=5.343e-04, forward_time=0.036, loss=2.920, loss_att=1.354, loss_ctc=4.485, acc=0.944, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.542e-04, train_time=0.097 -[v016] 2022-01-31 06:07:12,343 (trainer:653) INFO: 77epoch:train:514-540batch: iter_time=0.001, forward_time=0.031, loss=2.576, loss_att=1.342, loss_ctc=3.809, acc=0.942, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.541e-04, train_time=0.092 -[v016] 2022-01-31 06:07:47,231 (trainer:328) INFO: 77epoch results: [train] iter_time=0.002, forward_time=0.032, loss=2.704, loss_att=1.323, loss_ctc=4.086, acc=0.945, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.546e-04, train_time=0.094, time=51.64 seconds, total_count=42119, gpu_max_cached_mem_GB=5.824, [valid] loss=6.715, loss_att=5.499, loss_ctc=7.931, acc=0.899, cer=0.106, wer=0.415, cer_ctc=0.165, time=5.93 seconds, total_count=13706, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.16 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:07:49,304 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:07:49,313 (trainer:261) INFO: 78/200epoch started. Estimated time to finish: 4 hours, 18 minutes and 6.15 seconds -[v016] 2022-01-31 06:07:53,463 (trainer:653) INFO: 78epoch:train:1-27batch: iter_time=0.061, forward_time=0.031, loss=2.445, loss_att=1.225, loss_ctc=3.664, acc=0.949, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.541e-04, train_time=0.153 -[v016] 2022-01-31 06:07:56,652 (trainer:653) INFO: 78epoch:train:28-54batch: iter_time=0.026, forward_time=0.031, loss=2.675, loss_att=1.258, loss_ctc=4.091, acc=0.949, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.540e-04, train_time=0.118 -[v016] 2022-01-31 06:07:59,761 (trainer:653) INFO: 78epoch:train:55-81batch: iter_time=0.025, forward_time=0.030, loss=2.779, loss_att=1.404, loss_ctc=4.153, acc=0.941, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.540e-04, train_time=0.115 -[v016] 2022-01-31 06:08:02,817 (trainer:653) INFO: 78epoch:train:82-108batch: iter_time=0.020, forward_time=0.031, loss=2.745, loss_att=1.347, loss_ctc=4.143, acc=0.948, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.539e-04, train_time=0.113 -[v016] 2022-01-31 06:08:06,031 (trainer:653) INFO: 78epoch:train:109-135batch: iter_time=0.023, forward_time=0.032, loss=2.810, loss_att=1.325, loss_ctc=4.296, acc=0.949, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.539e-04, train_time=0.119 -[v016] 2022-01-31 06:08:08,805 (trainer:653) INFO: 78epoch:train:136-162batch: iter_time=0.006, forward_time=0.033, loss=2.403, loss_att=1.176, loss_ctc=3.631, acc=0.950, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.538e-04, train_time=0.102 -[v016] 2022-01-31 06:08:11,498 (trainer:653) INFO: 78epoch:train:163-189batch: iter_time=0.005, forward_time=0.032, loss=2.926, loss_att=1.403, loss_ctc=4.449, acc=0.944, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.538e-04, train_time=0.100 -[v016] 2022-01-31 06:08:14,296 (trainer:653) INFO: 78epoch:train:190-216batch: iter_time=0.009, forward_time=0.032, loss=2.536, loss_att=1.232, loss_ctc=3.839, acc=0.951, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.537e-04, train_time=0.103 -[v016] 2022-01-31 06:08:16,835 (trainer:653) INFO: 78epoch:train:217-243batch: iter_time=0.004, forward_time=0.030, loss=2.134, loss_att=1.139, loss_ctc=3.130, acc=0.943, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.537e-04, train_time=0.094 -[v016] 2022-01-31 06:08:19,494 (trainer:653) INFO: 78epoch:train:244-270batch: iter_time=0.004, forward_time=0.032, loss=2.657, loss_att=1.243, loss_ctc=4.070, acc=0.946, backward_time=0.021, optim_step_time=0.022, optim0_lr0=1.536e-04, train_time=0.098 -[v016] 2022-01-31 06:08:22,058 (trainer:653) INFO: 78epoch:train:271-297batch: iter_time=0.001, forward_time=0.032, loss=2.956, loss_att=1.466, loss_ctc=4.446, acc=0.940, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.536e-04, train_time=0.095 -[v016] 2022-01-31 06:08:25,368 (trainer:653) INFO: 78epoch:train:298-324batch: iter_time=0.027, forward_time=0.032, loss=2.757, loss_att=1.397, loss_ctc=4.117, acc=0.943, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.535e-04, train_time=0.122 -[v016] 2022-01-31 06:08:28,196 (trainer:653) INFO: 78epoch:train:325-351batch: iter_time=0.005, forward_time=0.032, loss=2.922, loss_att=1.404, loss_ctc=4.439, acc=0.945, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.535e-04, train_time=0.104 -[v016] 2022-01-31 06:08:30,631 (trainer:653) INFO: 78epoch:train:352-378batch: iter_time=3.219e-04, forward_time=0.030, loss=2.320, loss_att=1.175, loss_ctc=3.466, acc=0.946, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.534e-04, train_time=0.090 -[v016] 2022-01-31 06:08:33,297 (trainer:653) INFO: 78epoch:train:379-405batch: iter_time=0.008, forward_time=0.030, loss=2.496, loss_att=1.211, loss_ctc=3.781, acc=0.942, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.534e-04, train_time=0.099 -[v016] 2022-01-31 06:08:35,903 (trainer:653) INFO: 78epoch:train:406-432batch: iter_time=0.005, forward_time=0.031, loss=2.294, loss_att=1.166, loss_ctc=3.421, acc=0.949, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.533e-04, train_time=0.096 -[v016] 2022-01-31 06:08:38,800 (trainer:653) INFO: 78epoch:train:433-459batch: iter_time=0.014, forward_time=0.032, loss=2.859, loss_att=1.422, loss_ctc=4.296, acc=0.941, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.533e-04, train_time=0.107 -[v016] 2022-01-31 06:08:41,727 (trainer:653) INFO: 78epoch:train:460-486batch: iter_time=0.016, forward_time=0.031, loss=3.013, loss_att=1.417, loss_ctc=4.609, acc=0.940, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.532e-04, train_time=0.108 -[v016] 2022-01-31 06:08:44,413 (trainer:653) INFO: 78epoch:train:487-513batch: iter_time=0.008, forward_time=0.031, loss=2.682, loss_att=1.294, loss_ctc=4.069, acc=0.948, backward_time=0.021, optim_step_time=0.022, optim0_lr0=1.532e-04, train_time=0.099 -[v016] 2022-01-31 06:08:47,180 (trainer:653) INFO: 78epoch:train:514-540batch: iter_time=0.008, forward_time=0.032, loss=3.155, loss_att=1.452, loss_ctc=4.858, acc=0.941, backward_time=0.021, optim_step_time=0.022, optim0_lr0=1.531e-04, train_time=0.102 -[v016] 2022-01-31 06:09:30,717 (trainer:328) INFO: 78epoch results: [train] iter_time=0.014, forward_time=0.031, loss=2.675, loss_att=1.306, loss_ctc=4.043, acc=0.945, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.536e-04, train_time=0.107, time=58.63 seconds, total_count=42666, gpu_max_cached_mem_GB=5.824, [valid] loss=6.545, loss_att=5.383, loss_ctc=7.707, acc=0.903, cer=0.099, wer=0.400, cer_ctc=0.148, time=14.31 seconds, total_count=13884, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.45 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:09:32,896 (trainer:375) INFO: The best model has been updated: train.loss, train.acc, valid.acc -[v016] 2022-01-31 06:09:32,919 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/65epoch.pth, exp/asr_train_asr_raw_en_word/73epoch.pth -[v016] 2022-01-31 06:09:32,922 (trainer:261) INFO: 79/200epoch started. Estimated time to finish: 4 hours, 15 minutes and 13.35 seconds -[v016] 2022-01-31 06:09:35,823 (trainer:653) INFO: 79epoch:train:1-27batch: iter_time=0.008, forward_time=0.034, loss=2.124, loss_att=1.036, loss_ctc=3.212, acc=0.950, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.531e-04, train_time=0.105 -[v016] 2022-01-31 06:09:38,284 (trainer:653) INFO: 79epoch:train:28-54batch: iter_time=8.528e-05, forward_time=0.031, loss=2.379, loss_att=1.176, loss_ctc=3.582, acc=0.950, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.530e-04, train_time=0.091 -[v016] 2022-01-31 06:09:40,757 (trainer:653) INFO: 79epoch:train:55-81batch: iter_time=9.377e-05, forward_time=0.031, loss=2.586, loss_att=1.278, loss_ctc=3.895, acc=0.946, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.530e-04, train_time=0.091 -[v016] 2022-01-31 06:09:43,309 (trainer:653) INFO: 79epoch:train:82-108batch: iter_time=8.170e-05, forward_time=0.033, loss=2.982, loss_att=1.364, loss_ctc=4.599, acc=0.946, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.529e-04, train_time=0.094 -[v016] 2022-01-31 06:09:45,933 (trainer:653) INFO: 79epoch:train:109-135batch: iter_time=0.004, forward_time=0.032, loss=3.150, loss_att=1.468, loss_ctc=4.832, acc=0.944, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.529e-04, train_time=0.097 -[v016] 2022-01-31 06:09:48,343 (trainer:653) INFO: 79epoch:train:136-162batch: iter_time=8.258e-05, forward_time=0.030, loss=2.572, loss_att=1.244, loss_ctc=3.901, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.528e-04, train_time=0.089 -[v016] 2022-01-31 06:09:51,021 (trainer:653) INFO: 79epoch:train:163-189batch: iter_time=0.005, forward_time=0.033, loss=2.793, loss_att=1.323, loss_ctc=4.263, acc=0.943, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.528e-04, train_time=0.099 -[v016] 2022-01-31 06:09:53,427 (trainer:653) INFO: 79epoch:train:190-216batch: iter_time=7.674e-05, forward_time=0.030, loss=2.824, loss_att=1.411, loss_ctc=4.238, acc=0.941, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.527e-04, train_time=0.089 -[v016] 2022-01-31 06:09:55,881 (trainer:653) INFO: 79epoch:train:217-243batch: iter_time=8.103e-05, forward_time=0.031, loss=2.621, loss_att=1.281, loss_ctc=3.961, acc=0.938, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.527e-04, train_time=0.091 -[v016] 2022-01-31 06:09:58,692 (trainer:653) INFO: 79epoch:train:244-270batch: iter_time=0.013, forward_time=0.031, loss=2.418, loss_att=1.275, loss_ctc=3.561, acc=0.944, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.526e-04, train_time=0.104 -[v016] 2022-01-31 06:10:01,245 (trainer:653) INFO: 79epoch:train:271-297batch: iter_time=7.781e-05, forward_time=0.032, loss=2.995, loss_att=1.345, loss_ctc=4.645, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.526e-04, train_time=0.094 -[v016] 2022-01-31 06:10:03,701 (trainer:653) INFO: 79epoch:train:298-324batch: iter_time=7.616e-05, forward_time=0.031, loss=2.258, loss_att=1.097, loss_ctc=3.419, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.525e-04, train_time=0.091 -[v016] 2022-01-31 06:10:06,180 (trainer:653) INFO: 79epoch:train:325-351batch: iter_time=8.108e-05, forward_time=0.032, loss=2.820, loss_att=1.396, loss_ctc=4.243, acc=0.945, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.525e-04, train_time=0.092 -[v016] 2022-01-31 06:10:08,634 (trainer:653) INFO: 79epoch:train:352-378batch: iter_time=8.412e-05, forward_time=0.031, loss=2.284, loss_att=1.188, loss_ctc=3.380, acc=0.942, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.524e-04, train_time=0.091 -[v016] 2022-01-31 06:10:11,180 (trainer:653) INFO: 79epoch:train:379-405batch: iter_time=8.370e-05, forward_time=0.032, loss=2.637, loss_att=1.189, loss_ctc=4.084, acc=0.952, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.524e-04, train_time=0.094 -[v016] 2022-01-31 06:10:13,636 (trainer:653) INFO: 79epoch:train:406-432batch: iter_time=8.264e-05, forward_time=0.031, loss=2.484, loss_att=1.233, loss_ctc=3.734, acc=0.942, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.523e-04, train_time=0.091 -[v016] 2022-01-31 06:10:16,125 (trainer:653) INFO: 79epoch:train:433-459batch: iter_time=7.770e-05, forward_time=0.031, loss=2.740, loss_att=1.311, loss_ctc=4.169, acc=0.948, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.523e-04, train_time=0.092 -[v016] 2022-01-31 06:10:18,598 (trainer:653) INFO: 79epoch:train:460-486batch: iter_time=9.368e-05, forward_time=0.031, loss=2.699, loss_att=1.340, loss_ctc=4.059, acc=0.939, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.523e-04, train_time=0.091 -[v016] 2022-01-31 06:10:21,465 (trainer:653) INFO: 79epoch:train:487-513batch: iter_time=0.012, forward_time=0.032, loss=2.911, loss_att=1.437, loss_ctc=4.384, acc=0.945, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.522e-04, train_time=0.106 -[v016] 2022-01-31 06:10:27,055 (trainer:653) INFO: 79epoch:train:514-540batch: iter_time=1.491e-04, forward_time=0.123, loss=2.539, loss_att=1.303, loss_ctc=3.775, acc=0.949, backward_time=0.037, optim_step_time=0.022, optim0_lr0=1.522e-04, train_time=0.207 -[v016] 2022-01-31 06:11:04,981 (trainer:328) INFO: 79epoch results: [train] iter_time=0.002, forward_time=0.036, loss=2.644, loss_att=1.285, loss_ctc=4.003, acc=0.946, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.526e-04, train_time=0.100, time=54.88 seconds, total_count=43213, gpu_max_cached_mem_GB=5.824, [valid] loss=6.644, loss_att=5.420, loss_ctc=7.868, acc=0.902, cer=0.103, wer=0.398, cer_ctc=0.154, time=6.13 seconds, total_count=14062, gpu_max_cached_mem_GB=5.824, [att_plot] time=31.01 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:11:09,048 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:11:09,054 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/74epoch.pth -[v016] 2022-01-31 06:11:09,057 (trainer:261) INFO: 80/200epoch started. Estimated time to finish: 4 hours, 12 minutes and 7.57 seconds -[v016] 2022-01-31 06:11:15,149 (trainer:653) INFO: 80epoch:train:1-27batch: iter_time=0.043, forward_time=0.075, loss=2.762, loss_att=1.160, loss_ctc=4.364, acc=0.957, backward_time=0.031, optim_step_time=0.029, optim0_lr0=1.521e-04, train_time=0.213 -[v016] 2022-01-31 06:11:17,859 (trainer:653) INFO: 80epoch:train:28-54batch: iter_time=0.007, forward_time=0.031, loss=2.419, loss_att=1.120, loss_ctc=3.718, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.520e-04, train_time=0.101 -[v016] 2022-01-31 06:11:20,536 (trainer:653) INFO: 80epoch:train:55-81batch: iter_time=0.002, forward_time=0.033, loss=2.666, loss_att=1.247, loss_ctc=4.085, acc=0.948, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.520e-04, train_time=0.099 -[v016] 2022-01-31 06:11:23,430 (trainer:653) INFO: 80epoch:train:82-108batch: iter_time=0.008, forward_time=0.034, loss=2.646, loss_att=1.186, loss_ctc=4.105, acc=0.953, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.520e-04, train_time=0.107 -[v016] 2022-01-31 06:11:26,728 (trainer:653) INFO: 80epoch:train:109-135batch: iter_time=0.029, forward_time=0.032, loss=2.605, loss_att=1.301, loss_ctc=3.910, acc=0.941, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.519e-04, train_time=0.122 -[v016] 2022-01-31 06:11:29,409 (trainer:653) INFO: 80epoch:train:136-162batch: iter_time=1.224e-04, forward_time=0.033, loss=2.435, loss_att=1.146, loss_ctc=3.724, acc=0.953, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.519e-04, train_time=0.099 -[v016] 2022-01-31 06:11:32,149 (trainer:653) INFO: 80epoch:train:163-189batch: iter_time=1.102e-04, forward_time=0.034, loss=2.773, loss_att=1.253, loss_ctc=4.293, acc=0.952, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.518e-04, train_time=0.101 -[v016] 2022-01-31 06:11:35,830 (trainer:653) INFO: 80epoch:train:190-216batch: iter_time=0.038, forward_time=0.034, loss=2.699, loss_att=1.348, loss_ctc=4.049, acc=0.945, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.518e-04, train_time=0.136 -[v016] 2022-01-31 06:11:38,441 (trainer:653) INFO: 80epoch:train:217-243batch: iter_time=1.020e-04, forward_time=0.033, loss=2.321, loss_att=1.203, loss_ctc=3.440, acc=0.946, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.517e-04, train_time=0.096 -[v016] 2022-01-31 06:11:41,122 (trainer:653) INFO: 80epoch:train:244-270batch: iter_time=0.001, forward_time=0.033, loss=2.480, loss_att=1.181, loss_ctc=3.780, acc=0.949, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.517e-04, train_time=0.099 -[v016] 2022-01-31 06:11:43,693 (trainer:653) INFO: 80epoch:train:271-297batch: iter_time=2.700e-04, forward_time=0.032, loss=2.325, loss_att=1.190, loss_ctc=3.461, acc=0.944, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.516e-04, train_time=0.095 -[v016] 2022-01-31 06:11:46,300 (trainer:653) INFO: 80epoch:train:298-324batch: iter_time=1.104e-04, forward_time=0.033, loss=2.494, loss_att=1.133, loss_ctc=3.855, acc=0.955, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.516e-04, train_time=0.096 -[v016] 2022-01-31 06:11:48,909 (trainer:653) INFO: 80epoch:train:325-351batch: iter_time=9.827e-05, forward_time=0.033, loss=2.685, loss_att=1.329, loss_ctc=4.040, acc=0.944, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.515e-04, train_time=0.096 -[v016] 2022-01-31 06:11:51,518 (trainer:653) INFO: 80epoch:train:352-378batch: iter_time=9.194e-05, forward_time=0.032, loss=2.395, loss_att=1.210, loss_ctc=3.580, acc=0.945, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.515e-04, train_time=0.096 -[v016] 2022-01-31 06:11:54,184 (trainer:653) INFO: 80epoch:train:379-405batch: iter_time=9.176e-04, forward_time=0.033, loss=2.993, loss_att=1.415, loss_ctc=4.571, acc=0.950, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.514e-04, train_time=0.098 -[v016] 2022-01-31 06:11:56,856 (trainer:653) INFO: 80epoch:train:406-432batch: iter_time=0.005, forward_time=0.032, loss=2.383, loss_att=1.157, loss_ctc=3.609, acc=0.953, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.514e-04, train_time=0.099 -[v016] 2022-01-31 06:11:59,283 (trainer:653) INFO: 80epoch:train:433-459batch: iter_time=2.421e-04, forward_time=0.030, loss=2.566, loss_att=1.222, loss_ctc=3.911, acc=0.951, backward_time=0.020, optim_step_time=0.021, optim0_lr0=1.513e-04, train_time=0.090 -[v016] 2022-01-31 06:12:01,717 (trainer:653) INFO: 80epoch:train:460-486batch: iter_time=8.166e-05, forward_time=0.031, loss=2.400, loss_att=1.268, loss_ctc=3.531, acc=0.942, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.513e-04, train_time=0.090 -[v016] 2022-01-31 06:12:04,600 (trainer:653) INFO: 80epoch:train:487-513batch: iter_time=0.013, forward_time=0.032, loss=2.894, loss_att=1.390, loss_ctc=4.397, acc=0.943, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.512e-04, train_time=0.107 -[v016] 2022-01-31 06:12:06,999 (trainer:653) INFO: 80epoch:train:514-540batch: iter_time=8.115e-05, forward_time=0.030, loss=2.671, loss_att=1.343, loss_ctc=4.000, acc=0.936, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.512e-04, train_time=0.089 -[v016] 2022-01-31 06:12:44,678 (trainer:328) INFO: 80epoch results: [train] iter_time=0.007, forward_time=0.035, loss=2.577, loss_att=1.239, loss_ctc=3.914, acc=0.948, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.516e-04, train_time=0.106, time=58.62 seconds, total_count=43760, gpu_max_cached_mem_GB=5.824, [valid] loss=6.777, loss_att=5.484, loss_ctc=8.071, acc=0.900, cer=0.104, wer=0.409, cer_ctc=0.158, time=9.17 seconds, total_count=14240, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.8 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:12:47,318 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:12:47,324 (trainer:261) INFO: 81/200epoch started. Estimated time to finish: 4 hours, 9 minutes and 9.05 seconds -[v016] 2022-01-31 06:12:50,368 (trainer:653) INFO: 81epoch:train:1-27batch: iter_time=0.016, forward_time=0.033, loss=2.496, loss_att=1.130, loss_ctc=3.861, acc=0.946, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.511e-04, train_time=0.112 -[v016] 2022-01-31 06:12:53,093 (trainer:653) INFO: 81epoch:train:28-54batch: iter_time=0.002, forward_time=0.033, loss=3.228, loss_att=1.421, loss_ctc=5.036, acc=0.953, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.511e-04, train_time=0.101 -[v016] 2022-01-31 06:12:55,522 (trainer:653) INFO: 81epoch:train:55-81batch: iter_time=8.338e-05, forward_time=0.031, loss=2.270, loss_att=1.125, loss_ctc=3.415, acc=0.952, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.510e-04, train_time=0.090 -[v016] 2022-01-31 06:12:58,084 (trainer:653) INFO: 81epoch:train:82-108batch: iter_time=0.005, forward_time=0.031, loss=2.518, loss_att=1.194, loss_ctc=3.841, acc=0.948, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.510e-04, train_time=0.095 -[v016] 2022-01-31 06:13:00,512 (trainer:653) INFO: 81epoch:train:109-135batch: iter_time=0.001, forward_time=0.030, loss=2.530, loss_att=1.258, loss_ctc=3.802, acc=0.946, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.510e-04, train_time=0.090 -[v016] 2022-01-31 06:13:02,939 (trainer:653) INFO: 81epoch:train:136-162batch: iter_time=8.072e-05, forward_time=0.030, loss=2.283, loss_att=1.148, loss_ctc=3.418, acc=0.945, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.509e-04, train_time=0.090 -[v016] 2022-01-31 06:13:05,459 (trainer:653) INFO: 81epoch:train:163-189batch: iter_time=9.313e-05, forward_time=0.032, loss=2.411, loss_att=1.222, loss_ctc=3.599, acc=0.950, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.509e-04, train_time=0.093 -[v016] 2022-01-31 06:13:08,039 (trainer:653) INFO: 81epoch:train:190-216batch: iter_time=1.003e-04, forward_time=0.033, loss=2.396, loss_att=1.144, loss_ctc=3.648, acc=0.952, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.508e-04, train_time=0.095 -[v016] 2022-01-31 06:13:10,555 (trainer:653) INFO: 81epoch:train:217-243batch: iter_time=4.527e-04, forward_time=0.032, loss=2.761, loss_att=1.346, loss_ctc=4.176, acc=0.940, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.508e-04, train_time=0.093 -[v016] 2022-01-31 06:13:13,080 (trainer:653) INFO: 81epoch:train:244-270batch: iter_time=8.580e-05, forward_time=0.032, loss=2.381, loss_att=1.079, loss_ctc=3.683, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.507e-04, train_time=0.093 -[v016] 2022-01-31 06:13:15,649 (trainer:653) INFO: 81epoch:train:271-297batch: iter_time=8.718e-05, forward_time=0.032, loss=2.856, loss_att=1.297, loss_ctc=4.415, acc=0.947, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.507e-04, train_time=0.095 -[v016] 2022-01-31 06:13:18,250 (trainer:653) INFO: 81epoch:train:298-324batch: iter_time=0.005, forward_time=0.031, loss=2.236, loss_att=1.049, loss_ctc=3.423, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.506e-04, train_time=0.096 -[v016] 2022-01-31 06:13:20,686 (trainer:653) INFO: 81epoch:train:325-351batch: iter_time=8.271e-05, forward_time=0.031, loss=2.616, loss_att=1.193, loss_ctc=4.040, acc=0.953, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.506e-04, train_time=0.090 -[v016] 2022-01-31 06:13:23,197 (trainer:653) INFO: 81epoch:train:352-378batch: iter_time=9.971e-05, forward_time=0.031, loss=2.448, loss_att=1.150, loss_ctc=3.746, acc=0.950, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.505e-04, train_time=0.093 -[v016] 2022-01-31 06:13:25,666 (trainer:653) INFO: 81epoch:train:379-405batch: iter_time=9.059e-05, forward_time=0.031, loss=2.550, loss_att=1.253, loss_ctc=3.847, acc=0.948, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.505e-04, train_time=0.091 -[v016] 2022-01-31 06:13:28,189 (trainer:653) INFO: 81epoch:train:406-432batch: iter_time=9.302e-05, forward_time=0.031, loss=2.707, loss_att=1.350, loss_ctc=4.064, acc=0.943, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.504e-04, train_time=0.093 -[v016] 2022-01-31 06:13:30,769 (trainer:653) INFO: 81epoch:train:433-459batch: iter_time=0.006, forward_time=0.030, loss=2.457, loss_att=1.255, loss_ctc=3.659, acc=0.940, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.504e-04, train_time=0.095 -[v016] 2022-01-31 06:13:33,233 (trainer:653) INFO: 81epoch:train:460-486batch: iter_time=7.661e-05, forward_time=0.031, loss=2.519, loss_att=1.212, loss_ctc=3.827, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.504e-04, train_time=0.091 -[v016] 2022-01-31 06:13:35,706 (trainer:653) INFO: 81epoch:train:487-513batch: iter_time=7.875e-05, forward_time=0.031, loss=2.447, loss_att=1.211, loss_ctc=3.684, acc=0.947, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.503e-04, train_time=0.091 -[v016] 2022-01-31 06:13:38,218 (trainer:653) INFO: 81epoch:train:514-540batch: iter_time=8.371e-05, forward_time=0.032, loss=2.763, loss_att=1.326, loss_ctc=4.201, acc=0.942, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.503e-04, train_time=0.093 -[v016] 2022-01-31 06:14:12,413 (trainer:328) INFO: 81epoch results: [train] iter_time=0.002, forward_time=0.031, loss=2.549, loss_att=1.218, loss_ctc=3.881, acc=0.948, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.507e-04, train_time=0.094, time=51.65 seconds, total_count=44307, gpu_max_cached_mem_GB=5.824, [valid] loss=6.573, loss_att=5.370, loss_ctc=7.776, acc=0.904, cer=0.097, wer=0.402, cer_ctc=0.152, time=6.04 seconds, total_count=14418, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.4 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:14:14,593 (trainer:375) INFO: The best model has been updated: train.loss, valid.acc -[v016] 2022-01-31 06:14:14,651 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/75epoch.pth, exp/asr_train_asr_raw_en_word/76epoch.pth -[v016] 2022-01-31 06:14:14,652 (trainer:261) INFO: 82/200epoch started. Estimated time to finish: 4 hours, 5 minutes and 51.81 seconds -[v016] 2022-01-31 06:14:17,239 (trainer:653) INFO: 82epoch:train:1-27batch: iter_time=0.005, forward_time=0.031, loss=2.392, loss_att=1.210, loss_ctc=3.574, acc=0.948, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.502e-04, train_time=0.096 -[v016] 2022-01-31 06:14:19,690 (trainer:653) INFO: 82epoch:train:28-54batch: iter_time=7.932e-05, forward_time=0.031, loss=2.389, loss_att=1.117, loss_ctc=3.661, acc=0.953, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.502e-04, train_time=0.091 -[v016] 2022-01-31 06:14:22,077 (trainer:653) INFO: 82epoch:train:55-81batch: iter_time=8.085e-05, forward_time=0.030, loss=2.344, loss_att=1.205, loss_ctc=3.484, acc=0.947, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.501e-04, train_time=0.088 -[v016] 2022-01-31 06:14:24,486 (trainer:653) INFO: 82epoch:train:82-108batch: iter_time=7.867e-05, forward_time=0.031, loss=2.390, loss_att=1.129, loss_ctc=3.651, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.501e-04, train_time=0.089 -[v016] 2022-01-31 06:14:26,942 (trainer:653) INFO: 82epoch:train:109-135batch: iter_time=8.867e-05, forward_time=0.031, loss=2.188, loss_att=1.131, loss_ctc=3.245, acc=0.947, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.500e-04, train_time=0.091 -[v016] 2022-01-31 06:14:29,491 (trainer:653) INFO: 82epoch:train:136-162batch: iter_time=0.003, forward_time=0.032, loss=2.760, loss_att=1.304, loss_ctc=4.217, acc=0.942, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.500e-04, train_time=0.094 -[v016] 2022-01-31 06:14:32,032 (trainer:653) INFO: 82epoch:train:163-189batch: iter_time=7.674e-05, forward_time=0.032, loss=2.966, loss_att=1.251, loss_ctc=4.680, acc=0.950, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.499e-04, train_time=0.094 -[v016] 2022-01-31 06:14:34,604 (trainer:653) INFO: 82epoch:train:190-216batch: iter_time=0.005, forward_time=0.031, loss=2.471, loss_att=1.188, loss_ctc=3.753, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.499e-04, train_time=0.095 -[v016] 2022-01-31 06:14:37,240 (trainer:653) INFO: 82epoch:train:217-243batch: iter_time=7.743e-05, forward_time=0.033, loss=2.555, loss_att=1.098, loss_ctc=4.012, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.498e-04, train_time=0.097 -[v016] 2022-01-31 06:14:39,694 (trainer:653) INFO: 82epoch:train:244-270batch: iter_time=7.845e-05, forward_time=0.031, loss=2.290, loss_att=1.106, loss_ctc=3.475, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.498e-04, train_time=0.091 -[v016] 2022-01-31 06:14:42,231 (trainer:653) INFO: 82epoch:train:271-297batch: iter_time=8.798e-05, forward_time=0.032, loss=2.435, loss_att=1.228, loss_ctc=3.642, acc=0.940, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.498e-04, train_time=0.094 -[v016] 2022-01-31 06:14:44,651 (trainer:653) INFO: 82epoch:train:298-324batch: iter_time=7.806e-05, forward_time=0.030, loss=2.364, loss_att=1.129, loss_ctc=3.600, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.497e-04, train_time=0.089 -[v016] 2022-01-31 06:14:47,071 (trainer:653) INFO: 82epoch:train:325-351batch: iter_time=7.657e-05, forward_time=0.030, loss=2.440, loss_att=1.183, loss_ctc=3.697, acc=0.948, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.497e-04, train_time=0.089 -[v016] 2022-01-31 06:14:49,492 (trainer:653) INFO: 82epoch:train:352-378batch: iter_time=7.469e-05, forward_time=0.030, loss=2.421, loss_att=1.132, loss_ctc=3.710, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.496e-04, train_time=0.089 -[v016] 2022-01-31 06:14:51,974 (trainer:653) INFO: 82epoch:train:379-405batch: iter_time=7.677e-05, forward_time=0.031, loss=2.752, loss_att=1.327, loss_ctc=4.177, acc=0.948, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.496e-04, train_time=0.092 -[v016] 2022-01-31 06:14:54,462 (trainer:653) INFO: 82epoch:train:406-432batch: iter_time=0.006, forward_time=0.030, loss=2.189, loss_att=1.158, loss_ctc=3.219, acc=0.947, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.495e-04, train_time=0.092 -[v016] 2022-01-31 06:14:56,991 (trainer:653) INFO: 82epoch:train:433-459batch: iter_time=8.508e-05, forward_time=0.032, loss=3.008, loss_att=1.370, loss_ctc=4.646, acc=0.942, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.495e-04, train_time=0.093 -[v016] 2022-01-31 06:14:59,500 (trainer:653) INFO: 82epoch:train:460-486batch: iter_time=8.257e-05, forward_time=0.032, loss=3.370, loss_att=1.541, loss_ctc=5.199, acc=0.942, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.494e-04, train_time=0.093 -[v016] 2022-01-31 06:15:01,984 (trainer:653) INFO: 82epoch:train:487-513batch: iter_time=7.923e-05, forward_time=0.031, loss=2.666, loss_att=1.266, loss_ctc=4.066, acc=0.945, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.494e-04, train_time=0.092 -[v016] 2022-01-31 06:15:05,109 (trainer:653) INFO: 82epoch:train:514-540batch: iter_time=0.023, forward_time=0.032, loss=2.879, loss_att=1.406, loss_ctc=4.353, acc=0.945, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.493e-04, train_time=0.116 -[v016] 2022-01-31 06:15:38,656 (trainer:328) INFO: 82epoch results: [train] iter_time=0.002, forward_time=0.031, loss=2.564, loss_att=1.226, loss_ctc=3.901, acc=0.948, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.498e-04, train_time=0.094, time=51.63 seconds, total_count=44854, gpu_max_cached_mem_GB=5.824, [valid] loss=6.665, loss_att=5.516, loss_ctc=7.814, acc=0.901, cer=0.104, wer=0.409, cer_ctc=0.156, time=5.45 seconds, total_count=14596, gpu_max_cached_mem_GB=5.824, [att_plot] time=26.91 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:15:40,762 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 06:15:40,767 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/77epoch.pth -[v016] 2022-01-31 06:15:40,767 (trainer:261) INFO: 83/200epoch started. Estimated time to finish: 4 hours, 2 minutes and 35.81 seconds -[v016] 2022-01-31 06:15:43,395 (trainer:653) INFO: 83epoch:train:1-27batch: iter_time=0.006, forward_time=0.031, loss=2.119, loss_att=1.072, loss_ctc=3.166, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.493e-04, train_time=0.097 -[v016] 2022-01-31 06:15:45,862 (trainer:653) INFO: 83epoch:train:28-54batch: iter_time=8.507e-05, forward_time=0.031, loss=2.374, loss_att=1.108, loss_ctc=3.640, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.492e-04, train_time=0.091 -[v016] 2022-01-31 06:15:48,339 (trainer:653) INFO: 83epoch:train:55-81batch: iter_time=7.510e-05, forward_time=0.031, loss=2.332, loss_att=1.115, loss_ctc=3.548, acc=0.952, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.492e-04, train_time=0.092 -[v016] 2022-01-31 06:15:50,811 (trainer:653) INFO: 83epoch:train:82-108batch: iter_time=7.656e-05, forward_time=0.031, loss=2.617, loss_att=1.236, loss_ctc=3.997, acc=0.949, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.492e-04, train_time=0.091 -[v016] 2022-01-31 06:15:53,298 (trainer:653) INFO: 83epoch:train:109-135batch: iter_time=7.487e-05, forward_time=0.031, loss=2.600, loss_att=1.150, loss_ctc=4.050, acc=0.954, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.491e-04, train_time=0.092 -[v016] 2022-01-31 06:15:55,731 (trainer:653) INFO: 83epoch:train:136-162batch: iter_time=7.542e-05, forward_time=0.031, loss=2.307, loss_att=1.137, loss_ctc=3.477, acc=0.950, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.491e-04, train_time=0.090 -[v016] 2022-01-31 06:15:58,227 (trainer:653) INFO: 83epoch:train:163-189batch: iter_time=8.048e-05, forward_time=0.032, loss=2.770, loss_att=1.272, loss_ctc=4.267, acc=0.947, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.490e-04, train_time=0.092 -[v016] 2022-01-31 06:16:00,697 (trainer:653) INFO: 83epoch:train:190-216batch: iter_time=8.222e-05, forward_time=0.031, loss=2.477, loss_att=1.131, loss_ctc=3.824, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.490e-04, train_time=0.091 -[v016] 2022-01-31 06:16:03,174 (trainer:653) INFO: 83epoch:train:217-243batch: iter_time=7.967e-05, forward_time=0.031, loss=2.355, loss_att=1.092, loss_ctc=3.618, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.489e-04, train_time=0.091 -[v016] 2022-01-31 06:16:05,586 (trainer:653) INFO: 83epoch:train:244-270batch: iter_time=8.147e-05, forward_time=0.031, loss=2.214, loss_att=1.067, loss_ctc=3.362, acc=0.952, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.489e-04, train_time=0.089 -[v016] 2022-01-31 06:16:08,001 (trainer:653) INFO: 83epoch:train:271-297batch: iter_time=8.124e-05, forward_time=0.031, loss=2.278, loss_att=1.105, loss_ctc=3.451, acc=0.953, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.488e-04, train_time=0.089 -[v016] 2022-01-31 06:16:10,458 (trainer:653) INFO: 83epoch:train:298-324batch: iter_time=7.899e-05, forward_time=0.031, loss=2.470, loss_att=1.224, loss_ctc=3.716, acc=0.950, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.488e-04, train_time=0.091 -[v016] 2022-01-31 06:16:12,973 (trainer:653) INFO: 83epoch:train:325-351batch: iter_time=7.911e-05, forward_time=0.032, loss=2.641, loss_att=1.327, loss_ctc=3.954, acc=0.948, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.488e-04, train_time=0.093 -[v016] 2022-01-31 06:16:15,430 (trainer:653) INFO: 83epoch:train:352-378batch: iter_time=7.687e-05, forward_time=0.031, loss=2.659, loss_att=1.343, loss_ctc=3.975, acc=0.939, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.487e-04, train_time=0.091 -[v016] 2022-01-31 06:16:17,823 (trainer:653) INFO: 83epoch:train:379-405batch: iter_time=8.203e-05, forward_time=0.030, loss=2.062, loss_att=1.085, loss_ctc=3.038, acc=0.952, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.487e-04, train_time=0.088 -[v016] 2022-01-31 06:16:20,248 (trainer:653) INFO: 83epoch:train:406-432batch: iter_time=7.970e-05, forward_time=0.031, loss=2.625, loss_att=1.249, loss_ctc=4.001, acc=0.949, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.486e-04, train_time=0.090 -[v016] 2022-01-31 06:16:22,731 (trainer:653) INFO: 83epoch:train:433-459batch: iter_time=7.683e-05, forward_time=0.032, loss=2.478, loss_att=1.187, loss_ctc=3.769, acc=0.952, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.486e-04, train_time=0.092 -[v016] 2022-01-31 06:16:25,250 (trainer:653) INFO: 83epoch:train:460-486batch: iter_time=7.745e-05, forward_time=0.032, loss=2.827, loss_att=1.335, loss_ctc=4.320, acc=0.946, backward_time=0.020, optim_step_time=0.021, optim0_lr0=1.485e-04, train_time=0.093 -[v016] 2022-01-31 06:16:27,846 (trainer:653) INFO: 83epoch:train:487-513batch: iter_time=8.406e-05, forward_time=0.031, loss=2.365, loss_att=1.138, loss_ctc=3.591, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.485e-04, train_time=0.096 -[v016] 2022-01-31 06:16:30,272 (trainer:653) INFO: 83epoch:train:514-540batch: iter_time=8.077e-05, forward_time=0.031, loss=2.172, loss_att=1.159, loss_ctc=3.185, acc=0.949, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.484e-04, train_time=0.090 -[v016] 2022-01-31 06:17:03,780 (trainer:328) INFO: 83epoch results: [train] iter_time=3.676e-04, forward_time=0.031, loss=2.438, loss_att=1.179, loss_ctc=3.697, acc=0.950, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.489e-04, train_time=0.091, time=50.2 seconds, total_count=45401, gpu_max_cached_mem_GB=5.824, [valid] loss=6.662, loss_att=5.496, loss_ctc=7.829, acc=0.902, cer=0.101, wer=0.407, cer_ctc=0.154, time=5.7 seconds, total_count=14774, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.1 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:17:05,873 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:17:05,919 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/72epoch.pth -[v016] 2022-01-31 06:17:05,919 (trainer:261) INFO: 84/200epoch started. Estimated time to finish: 3 hours, 59 minutes and 21.51 seconds -[v016] 2022-01-31 06:17:08,661 (trainer:653) INFO: 84epoch:train:1-27batch: iter_time=0.007, forward_time=0.032, loss=2.298, loss_att=1.109, loss_ctc=3.487, acc=0.950, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.484e-04, train_time=0.101 -[v016] 2022-01-31 06:17:11,077 (trainer:653) INFO: 84epoch:train:28-54batch: iter_time=8.011e-05, forward_time=0.031, loss=2.482, loss_att=1.145, loss_ctc=3.818, acc=0.951, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.483e-04, train_time=0.089 -[v016] 2022-01-31 06:17:13,503 (trainer:653) INFO: 84epoch:train:55-81batch: iter_time=7.911e-05, forward_time=0.031, loss=2.438, loss_att=1.204, loss_ctc=3.671, acc=0.945, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.483e-04, train_time=0.090 -[v016] 2022-01-31 06:17:15,941 (trainer:653) INFO: 84epoch:train:82-108batch: iter_time=7.954e-05, forward_time=0.031, loss=2.485, loss_att=1.197, loss_ctc=3.772, acc=0.946, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.483e-04, train_time=0.090 -[v016] 2022-01-31 06:17:18,379 (trainer:653) INFO: 84epoch:train:109-135batch: iter_time=7.634e-05, forward_time=0.031, loss=2.447, loss_att=1.178, loss_ctc=3.717, acc=0.944, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.482e-04, train_time=0.090 -[v016] 2022-01-31 06:17:20,885 (trainer:653) INFO: 84epoch:train:136-162batch: iter_time=8.679e-05, forward_time=0.032, loss=2.622, loss_att=1.137, loss_ctc=4.108, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.482e-04, train_time=0.093 -[v016] 2022-01-31 06:17:23,416 (trainer:653) INFO: 84epoch:train:163-189batch: iter_time=8.665e-05, forward_time=0.032, loss=2.385, loss_att=1.183, loss_ctc=3.587, acc=0.945, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.481e-04, train_time=0.094 -[v016] 2022-01-31 06:17:25,888 (trainer:653) INFO: 84epoch:train:190-216batch: iter_time=9.222e-05, forward_time=0.032, loss=2.252, loss_att=1.121, loss_ctc=3.382, acc=0.946, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.481e-04, train_time=0.091 -[v016] 2022-01-31 06:17:28,351 (trainer:653) INFO: 84epoch:train:217-243batch: iter_time=8.920e-05, forward_time=0.031, loss=2.031, loss_att=0.979, loss_ctc=3.083, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.480e-04, train_time=0.091 -[v016] 2022-01-31 06:17:30,820 (trainer:653) INFO: 84epoch:train:244-270batch: iter_time=9.229e-05, forward_time=0.032, loss=2.251, loss_att=1.105, loss_ctc=3.398, acc=0.949, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.480e-04, train_time=0.091 -[v016] 2022-01-31 06:17:33,310 (trainer:653) INFO: 84epoch:train:271-297batch: iter_time=9.955e-05, forward_time=0.032, loss=2.339, loss_att=1.161, loss_ctc=3.517, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.479e-04, train_time=0.092 -[v016] 2022-01-31 06:17:35,913 (trainer:653) INFO: 84epoch:train:298-324batch: iter_time=8.822e-05, forward_time=0.033, loss=2.506, loss_att=1.196, loss_ctc=3.815, acc=0.950, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.479e-04, train_time=0.096 -[v016] 2022-01-31 06:17:38,486 (trainer:653) INFO: 84epoch:train:325-351batch: iter_time=1.024e-04, forward_time=0.033, loss=2.858, loss_att=1.323, loss_ctc=4.392, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.479e-04, train_time=0.095 -[v016] 2022-01-31 06:17:41,398 (trainer:653) INFO: 84epoch:train:352-378batch: iter_time=0.018, forward_time=0.030, loss=2.726, loss_att=1.297, loss_ctc=4.156, acc=0.944, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.478e-04, train_time=0.108 -[v016] 2022-01-31 06:17:43,861 (trainer:653) INFO: 84epoch:train:379-405batch: iter_time=8.391e-05, forward_time=0.032, loss=2.582, loss_att=1.250, loss_ctc=3.914, acc=0.949, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.478e-04, train_time=0.091 -[v016] 2022-01-31 06:17:46,302 (trainer:653) INFO: 84epoch:train:406-432batch: iter_time=8.298e-05, forward_time=0.031, loss=2.356, loss_att=1.309, loss_ctc=3.403, acc=0.940, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.477e-04, train_time=0.090 -[v016] 2022-01-31 06:17:48,888 (trainer:653) INFO: 84epoch:train:433-459batch: iter_time=0.003, forward_time=0.032, loss=2.438, loss_att=1.233, loss_ctc=3.643, acc=0.946, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.477e-04, train_time=0.096 -[v016] 2022-01-31 06:17:51,338 (trainer:653) INFO: 84epoch:train:460-486batch: iter_time=8.178e-05, forward_time=0.031, loss=2.282, loss_att=1.072, loss_ctc=3.492, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.476e-04, train_time=0.090 -[v016] 2022-01-31 06:17:53,856 (trainer:653) INFO: 84epoch:train:487-513batch: iter_time=8.244e-05, forward_time=0.032, loss=2.652, loss_att=1.168, loss_ctc=4.136, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.476e-04, train_time=0.093 -[v016] 2022-01-31 06:17:56,302 (trainer:653) INFO: 84epoch:train:514-540batch: iter_time=7.666e-05, forward_time=0.032, loss=2.214, loss_att=1.135, loss_ctc=3.294, acc=0.949, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.476e-04, train_time=0.090 -[v016] 2022-01-31 06:18:30,148 (trainer:328) INFO: 84epoch results: [train] iter_time=0.001, forward_time=0.032, loss=2.434, loss_att=1.176, loss_ctc=3.691, acc=0.949, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.480e-04, train_time=0.093, time=51.07 seconds, total_count=45948, gpu_max_cached_mem_GB=5.824, [valid] loss=6.833, loss_att=5.516, loss_ctc=8.149, acc=0.900, cer=0.106, wer=0.410, cer_ctc=0.159, time=5.66 seconds, total_count=14952, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.5 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:18:32,166 (trainer:375) INFO: The best model has been updated: train.loss -[v016] 2022-01-31 06:18:32,171 (trainer:261) INFO: 85/200epoch started. Estimated time to finish: 3 hours, 56 minutes and 12.61 seconds -[v016] 2022-01-31 06:18:34,776 (trainer:653) INFO: 85epoch:train:1-27batch: iter_time=0.003, forward_time=0.032, loss=2.328, loss_att=1.002, loss_ctc=3.653, acc=0.958, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.475e-04, train_time=0.096 -[v016] 2022-01-31 06:18:37,230 (trainer:653) INFO: 85epoch:train:28-54batch: iter_time=8.151e-05, forward_time=0.032, loss=2.152, loss_att=1.012, loss_ctc=3.292, acc=0.958, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.475e-04, train_time=0.091 -[v016] 2022-01-31 06:18:39,631 (trainer:653) INFO: 85epoch:train:55-81batch: iter_time=8.088e-05, forward_time=0.031, loss=2.103, loss_att=1.094, loss_ctc=3.112, acc=0.953, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.474e-04, train_time=0.089 -[v016] 2022-01-31 06:18:42,148 (trainer:653) INFO: 85epoch:train:82-108batch: iter_time=6.790e-04, forward_time=0.032, loss=2.582, loss_att=1.200, loss_ctc=3.964, acc=0.946, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.474e-04, train_time=0.093 -[v016] 2022-01-31 06:18:44,683 (trainer:653) INFO: 85epoch:train:109-135batch: iter_time=8.378e-05, forward_time=0.032, loss=2.521, loss_att=1.199, loss_ctc=3.843, acc=0.954, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.473e-04, train_time=0.094 -[v016] 2022-01-31 06:18:47,098 (trainer:653) INFO: 85epoch:train:136-162batch: iter_time=8.039e-05, forward_time=0.031, loss=2.377, loss_att=1.189, loss_ctc=3.566, acc=0.951, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.473e-04, train_time=0.089 -[v016] 2022-01-31 06:18:49,473 (trainer:653) INFO: 85epoch:train:163-189batch: iter_time=8.070e-05, forward_time=0.031, loss=2.174, loss_att=1.191, loss_ctc=3.156, acc=0.945, backward_time=0.020, optim_step_time=0.021, optim0_lr0=1.472e-04, train_time=0.088 -[v016] 2022-01-31 06:18:52,049 (trainer:653) INFO: 85epoch:train:190-216batch: iter_time=7.971e-05, forward_time=0.033, loss=2.786, loss_att=1.270, loss_ctc=4.303, acc=0.948, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.472e-04, train_time=0.095 -[v016] 2022-01-31 06:18:54,550 (trainer:653) INFO: 85epoch:train:217-243batch: iter_time=7.699e-05, forward_time=0.032, loss=2.275, loss_att=1.061, loss_ctc=3.489, acc=0.949, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.472e-04, train_time=0.092 -[v016] 2022-01-31 06:18:56,974 (trainer:653) INFO: 85epoch:train:244-270batch: iter_time=7.998e-05, forward_time=0.031, loss=2.161, loss_att=1.067, loss_ctc=3.255, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.471e-04, train_time=0.090 -[v016] 2022-01-31 06:18:59,393 (trainer:653) INFO: 85epoch:train:271-297batch: iter_time=8.407e-05, forward_time=0.031, loss=2.133, loss_att=1.026, loss_ctc=3.240, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.471e-04, train_time=0.089 -[v016] 2022-01-31 06:19:01,894 (trainer:653) INFO: 85epoch:train:298-324batch: iter_time=7.733e-05, forward_time=0.032, loss=2.496, loss_att=1.114, loss_ctc=3.879, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.470e-04, train_time=0.092 -[v016] 2022-01-31 06:19:04,323 (trainer:653) INFO: 85epoch:train:325-351batch: iter_time=8.014e-05, forward_time=0.031, loss=2.499, loss_att=1.200, loss_ctc=3.797, acc=0.947, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.470e-04, train_time=0.090 -[v016] 2022-01-31 06:19:06,823 (trainer:653) INFO: 85epoch:train:352-378batch: iter_time=8.325e-05, forward_time=0.032, loss=2.678, loss_att=1.207, loss_ctc=4.150, acc=0.948, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.469e-04, train_time=0.092 -[v016] 2022-01-31 06:19:09,346 (trainer:653) INFO: 85epoch:train:379-405batch: iter_time=8.042e-05, forward_time=0.032, loss=2.654, loss_att=1.210, loss_ctc=4.098, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.469e-04, train_time=0.093 -[v016] 2022-01-31 06:19:11,834 (trainer:653) INFO: 85epoch:train:406-432batch: iter_time=8.067e-05, forward_time=0.032, loss=2.305, loss_att=1.117, loss_ctc=3.494, acc=0.945, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.469e-04, train_time=0.092 -[v016] 2022-01-31 06:19:14,357 (trainer:653) INFO: 85epoch:train:433-459batch: iter_time=0.001, forward_time=0.032, loss=2.288, loss_att=1.097, loss_ctc=3.478, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.468e-04, train_time=0.093 -[v016] 2022-01-31 06:19:16,849 (trainer:653) INFO: 85epoch:train:460-486batch: iter_time=7.990e-05, forward_time=0.032, loss=2.359, loss_att=1.119, loss_ctc=3.599, acc=0.950, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.468e-04, train_time=0.092 -[v016] 2022-01-31 06:19:19,353 (trainer:653) INFO: 85epoch:train:487-513batch: iter_time=7.824e-05, forward_time=0.032, loss=2.254, loss_att=1.102, loss_ctc=3.405, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.467e-04, train_time=0.093 -[v016] 2022-01-31 06:19:21,833 (trainer:653) INFO: 85epoch:train:514-540batch: iter_time=7.836e-05, forward_time=0.032, loss=2.826, loss_att=1.363, loss_ctc=4.289, acc=0.945, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.467e-04, train_time=0.092 -[v016] 2022-01-31 06:19:55,642 (trainer:328) INFO: 85epoch results: [train] iter_time=3.256e-04, forward_time=0.032, loss=2.388, loss_att=1.140, loss_ctc=3.636, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.471e-04, train_time=0.092, time=50.35 seconds, total_count=46495, gpu_max_cached_mem_GB=5.824, [valid] loss=6.739, loss_att=5.508, loss_ctc=7.969, acc=0.902, cer=0.102, wer=0.405, cer_ctc=0.152, time=5.48 seconds, total_count=15130, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.64 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:19:57,665 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:19:57,671 (trainer:261) INFO: 86/200epoch started. Estimated time to finish: 3 hours, 53 minutes and 5.54 seconds -[v016] 2022-01-31 06:20:00,431 (trainer:653) INFO: 86epoch:train:1-27batch: iter_time=0.008, forward_time=0.032, loss=2.240, loss_att=1.044, loss_ctc=3.437, acc=0.957, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.466e-04, train_time=0.102 -[v016] 2022-01-31 06:20:02,834 (trainer:653) INFO: 86epoch:train:28-54batch: iter_time=9.272e-05, forward_time=0.031, loss=1.967, loss_att=1.018, loss_ctc=2.917, acc=0.945, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.466e-04, train_time=0.089 -[v016] 2022-01-31 06:20:05,261 (trainer:653) INFO: 86epoch:train:55-81batch: iter_time=7.633e-05, forward_time=0.031, loss=1.982, loss_att=0.968, loss_ctc=2.997, acc=0.959, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.465e-04, train_time=0.090 -[v016] 2022-01-31 06:20:07,704 (trainer:653) INFO: 86epoch:train:82-108batch: iter_time=7.523e-05, forward_time=0.031, loss=2.129, loss_att=0.980, loss_ctc=3.277, acc=0.959, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.465e-04, train_time=0.090 -[v016] 2022-01-31 06:20:10,096 (trainer:653) INFO: 86epoch:train:109-135batch: iter_time=7.474e-05, forward_time=0.031, loss=2.291, loss_att=1.096, loss_ctc=3.486, acc=0.950, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.465e-04, train_time=0.088 -[v016] 2022-01-31 06:20:12,619 (trainer:653) INFO: 86epoch:train:136-162batch: iter_time=7.664e-05, forward_time=0.033, loss=2.314, loss_att=1.078, loss_ctc=3.550, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.464e-04, train_time=0.093 -[v016] 2022-01-31 06:20:15,141 (trainer:653) INFO: 86epoch:train:163-189batch: iter_time=7.913e-05, forward_time=0.032, loss=2.562, loss_att=1.136, loss_ctc=3.989, acc=0.952, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.464e-04, train_time=0.093 -[v016] 2022-01-31 06:20:17,780 (trainer:653) INFO: 86epoch:train:190-216batch: iter_time=0.006, forward_time=0.032, loss=2.059, loss_att=0.941, loss_ctc=3.178, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.463e-04, train_time=0.098 -[v016] 2022-01-31 06:20:20,239 (trainer:653) INFO: 86epoch:train:217-243batch: iter_time=8.104e-05, forward_time=0.032, loss=2.418, loss_att=1.196, loss_ctc=3.640, acc=0.948, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.463e-04, train_time=0.091 -[v016] 2022-01-31 06:20:22,642 (trainer:653) INFO: 86epoch:train:244-270batch: iter_time=7.525e-05, forward_time=0.031, loss=2.056, loss_att=0.977, loss_ctc=3.135, acc=0.953, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.462e-04, train_time=0.089 -[v016] 2022-01-31 06:20:25,086 (trainer:653) INFO: 86epoch:train:271-297batch: iter_time=8.030e-05, forward_time=0.031, loss=2.537, loss_att=1.196, loss_ctc=3.879, acc=0.945, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.462e-04, train_time=0.090 -[v016] 2022-01-31 06:20:27,646 (trainer:653) INFO: 86epoch:train:298-324batch: iter_time=7.737e-05, forward_time=0.033, loss=2.642, loss_att=1.130, loss_ctc=4.155, acc=0.958, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.462e-04, train_time=0.095 -[v016] 2022-01-31 06:20:30,037 (trainer:653) INFO: 86epoch:train:325-351batch: iter_time=7.486e-05, forward_time=0.031, loss=2.324, loss_att=1.191, loss_ctc=3.457, acc=0.947, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.461e-04, train_time=0.088 -[v016] 2022-01-31 06:20:32,512 (trainer:653) INFO: 86epoch:train:352-378batch: iter_time=8.144e-05, forward_time=0.032, loss=2.407, loss_att=1.213, loss_ctc=3.601, acc=0.948, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.461e-04, train_time=0.091 -[v016] 2022-01-31 06:20:34,961 (trainer:653) INFO: 86epoch:train:379-405batch: iter_time=8.971e-05, forward_time=0.032, loss=2.438, loss_att=1.224, loss_ctc=3.653, acc=0.947, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.460e-04, train_time=0.091 -[v016] 2022-01-31 06:20:37,490 (trainer:653) INFO: 86epoch:train:406-432batch: iter_time=8.009e-05, forward_time=0.032, loss=2.498, loss_att=1.159, loss_ctc=3.836, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.460e-04, train_time=0.093 -[v016] 2022-01-31 06:20:40,007 (trainer:653) INFO: 86epoch:train:433-459batch: iter_time=7.784e-05, forward_time=0.033, loss=2.531, loss_att=1.169, loss_ctc=3.893, acc=0.953, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.460e-04, train_time=0.093 -[v016] 2022-01-31 06:20:42,562 (trainer:653) INFO: 86epoch:train:460-486batch: iter_time=8.052e-05, forward_time=0.033, loss=2.571, loss_att=1.365, loss_ctc=3.777, acc=0.939, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.459e-04, train_time=0.094 -[v016] 2022-01-31 06:20:45,085 (trainer:653) INFO: 86epoch:train:487-513batch: iter_time=7.645e-05, forward_time=0.032, loss=2.453, loss_att=1.087, loss_ctc=3.819, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.459e-04, train_time=0.093 -[v016] 2022-01-31 06:20:47,501 (trainer:653) INFO: 86epoch:train:514-540batch: iter_time=7.984e-05, forward_time=0.031, loss=2.206, loss_att=1.061, loss_ctc=3.352, acc=0.953, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.458e-04, train_time=0.089 -[v016] 2022-01-31 06:21:21,518 (trainer:328) INFO: 86epoch results: [train] iter_time=7.478e-04, forward_time=0.032, loss=2.336, loss_att=1.111, loss_ctc=3.561, acc=0.953, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.462e-04, train_time=0.092, time=50.58 seconds, total_count=47042, gpu_max_cached_mem_GB=5.824, [valid] loss=6.727, loss_att=5.544, loss_ctc=7.910, acc=0.903, cer=0.102, wer=0.399, cer_ctc=0.151, time=5.47 seconds, total_count=15308, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.8 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:21:24,258 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:21:24,298 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/79epoch.pth, exp/asr_train_asr_raw_en_word/82epoch.pth -[v016] 2022-01-31 06:21:24,298 (trainer:261) INFO: 87/200epoch started. Estimated time to finish: 3 hours, 50 minutes and 3.5 seconds -[v016] 2022-01-31 06:21:27,492 (trainer:653) INFO: 87epoch:train:1-27batch: iter_time=0.015, forward_time=0.033, loss=2.016, loss_att=1.003, loss_ctc=3.029, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.458e-04, train_time=0.113 -[v016] 2022-01-31 06:21:29,911 (trainer:653) INFO: 87epoch:train:28-54batch: iter_time=8.301e-05, forward_time=0.031, loss=2.423, loss_att=1.126, loss_ctc=3.720, acc=0.953, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.457e-04, train_time=0.089 -[v016] 2022-01-31 06:21:32,422 (trainer:653) INFO: 87epoch:train:55-81batch: iter_time=0.002, forward_time=0.031, loss=2.226, loss_att=1.081, loss_ctc=3.371, acc=0.953, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.457e-04, train_time=0.093 -[v016] 2022-01-31 06:21:34,876 (trainer:653) INFO: 87epoch:train:82-108batch: iter_time=8.060e-05, forward_time=0.031, loss=2.729, loss_att=1.228, loss_ctc=4.231, acc=0.950, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.457e-04, train_time=0.091 -[v016] 2022-01-31 06:21:37,389 (trainer:653) INFO: 87epoch:train:109-135batch: iter_time=8.130e-05, forward_time=0.032, loss=2.243, loss_att=1.016, loss_ctc=3.470, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.456e-04, train_time=0.093 -[v016] 2022-01-31 06:21:39,888 (trainer:653) INFO: 87epoch:train:136-162batch: iter_time=9.964e-05, forward_time=0.032, loss=2.414, loss_att=1.083, loss_ctc=3.745, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.456e-04, train_time=0.092 -[v016] 2022-01-31 06:21:42,403 (trainer:653) INFO: 87epoch:train:163-189batch: iter_time=7.866e-05, forward_time=0.032, loss=2.461, loss_att=1.212, loss_ctc=3.711, acc=0.948, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.455e-04, train_time=0.093 -[v016] 2022-01-31 06:21:44,877 (trainer:653) INFO: 87epoch:train:190-216batch: iter_time=8.411e-05, forward_time=0.031, loss=2.339, loss_att=1.121, loss_ctc=3.556, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.455e-04, train_time=0.091 -[v016] 2022-01-31 06:21:47,394 (trainer:653) INFO: 87epoch:train:217-243batch: iter_time=7.985e-05, forward_time=0.032, loss=2.231, loss_att=1.026, loss_ctc=3.437, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.454e-04, train_time=0.093 -[v016] 2022-01-31 06:21:49,834 (trainer:653) INFO: 87epoch:train:244-270batch: iter_time=8.254e-05, forward_time=0.031, loss=2.304, loss_att=1.103, loss_ctc=3.505, acc=0.952, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.454e-04, train_time=0.090 -[v016] 2022-01-31 06:21:52,508 (trainer:653) INFO: 87epoch:train:271-297batch: iter_time=0.011, forward_time=0.030, loss=2.035, loss_att=1.036, loss_ctc=3.035, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.454e-04, train_time=0.099 -[v016] 2022-01-31 06:21:54,905 (trainer:653) INFO: 87epoch:train:298-324batch: iter_time=8.404e-05, forward_time=0.031, loss=2.061, loss_att=1.023, loss_ctc=3.100, acc=0.948, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.453e-04, train_time=0.089 -[v016] 2022-01-31 06:21:57,410 (trainer:653) INFO: 87epoch:train:325-351batch: iter_time=7.481e-05, forward_time=0.032, loss=2.437, loss_att=1.126, loss_ctc=3.749, acc=0.953, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.453e-04, train_time=0.093 -[v016] 2022-01-31 06:21:59,879 (trainer:653) INFO: 87epoch:train:352-378batch: iter_time=7.724e-05, forward_time=0.031, loss=2.378, loss_att=1.122, loss_ctc=3.635, acc=0.948, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.452e-04, train_time=0.091 -[v016] 2022-01-31 06:22:02,300 (trainer:653) INFO: 87epoch:train:379-405batch: iter_time=7.621e-05, forward_time=0.031, loss=2.231, loss_att=1.118, loss_ctc=3.343, acc=0.950, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.452e-04, train_time=0.089 -[v016] 2022-01-31 06:22:04,777 (trainer:653) INFO: 87epoch:train:406-432batch: iter_time=7.562e-05, forward_time=0.032, loss=2.630, loss_att=1.225, loss_ctc=4.034, acc=0.949, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.452e-04, train_time=0.092 -[v016] 2022-01-31 06:22:07,264 (trainer:653) INFO: 87epoch:train:433-459batch: iter_time=7.540e-05, forward_time=0.031, loss=2.150, loss_att=1.070, loss_ctc=3.229, acc=0.950, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.451e-04, train_time=0.092 -[v016] 2022-01-31 06:22:09,702 (trainer:653) INFO: 87epoch:train:460-486batch: iter_time=7.734e-05, forward_time=0.032, loss=2.080, loss_att=1.052, loss_ctc=3.107, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.451e-04, train_time=0.090 -[v016] 2022-01-31 06:22:12,273 (trainer:653) INFO: 87epoch:train:487-513batch: iter_time=8.406e-05, forward_time=0.033, loss=2.942, loss_att=1.361, loss_ctc=4.523, acc=0.949, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.450e-04, train_time=0.095 -[v016] 2022-01-31 06:22:14,710 (trainer:653) INFO: 87epoch:train:514-540batch: iter_time=7.938e-05, forward_time=0.031, loss=2.297, loss_att=1.095, loss_ctc=3.498, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.450e-04, train_time=0.090 -[v016] 2022-01-31 06:22:49,905 (trainer:328) INFO: 87epoch results: [train] iter_time=0.001, forward_time=0.032, loss=2.326, loss_att=1.109, loss_ctc=3.543, acc=0.952, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.454e-04, train_time=0.093, time=51.12 seconds, total_count=47589, gpu_max_cached_mem_GB=5.824, [valid] loss=6.520, loss_att=5.414, loss_ctc=7.626, acc=0.903, cer=0.097, wer=0.401, cer_ctc=0.148, time=5.72 seconds, total_count=15486, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.75 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:22:52,442 (trainer:375) INFO: The best model has been updated: train.loss -[v016] 2022-01-31 06:22:52,448 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/80epoch.pth -[v016] 2022-01-31 06:22:52,448 (trainer:261) INFO: 88/200epoch started. Estimated time to finish: 3 hours, 47 minutes and 6.87 seconds -[v016] 2022-01-31 06:22:57,402 (trainer:653) INFO: 88epoch:train:1-27batch: iter_time=0.077, forward_time=0.035, loss=2.304, loss_att=1.109, loss_ctc=3.500, acc=0.950, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.449e-04, train_time=0.181 -[v016] 2022-01-31 06:23:00,569 (trainer:653) INFO: 88epoch:train:28-54batch: iter_time=0.015, forward_time=0.034, loss=2.036, loss_att=0.925, loss_ctc=3.148, acc=0.960, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.449e-04, train_time=0.118 -[v016] 2022-01-31 06:23:05,801 (trainer:653) INFO: 88epoch:train:55-81batch: iter_time=0.016, forward_time=0.072, loss=2.342, loss_att=1.133, loss_ctc=3.550, acc=0.949, backward_time=0.028, optim_step_time=0.047, optim0_lr0=1.449e-04, train_time=0.194 -[v016] 2022-01-31 06:23:09,838 (trainer:653) INFO: 88epoch:train:82-108batch: iter_time=0.043, forward_time=0.036, loss=2.258, loss_att=0.973, loss_ctc=3.544, acc=0.964, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.448e-04, train_time=0.149 -[v016] 2022-01-31 06:23:12,885 (trainer:653) INFO: 88epoch:train:109-135batch: iter_time=0.012, forward_time=0.034, loss=2.153, loss_att=0.995, loss_ctc=3.311, acc=0.957, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.448e-04, train_time=0.113 -[v016] 2022-01-31 06:23:16,154 (trainer:653) INFO: 88epoch:train:136-162batch: iter_time=0.028, forward_time=0.032, loss=2.160, loss_att=1.021, loss_ctc=3.300, acc=0.956, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.447e-04, train_time=0.121 -[v016] 2022-01-31 06:23:18,721 (trainer:653) INFO: 88epoch:train:163-189batch: iter_time=0.002, forward_time=0.032, loss=2.124, loss_att=1.114, loss_ctc=3.135, acc=0.947, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.447e-04, train_time=0.095 -[v016] 2022-01-31 06:23:21,366 (trainer:653) INFO: 88epoch:train:190-216batch: iter_time=0.003, forward_time=0.033, loss=2.201, loss_att=1.121, loss_ctc=3.281, acc=0.951, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.446e-04, train_time=0.098 -[v016] 2022-01-31 06:23:24,076 (trainer:653) INFO: 88epoch:train:217-243batch: iter_time=0.008, forward_time=0.031, loss=2.192, loss_att=1.096, loss_ctc=3.289, acc=0.948, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.446e-04, train_time=0.100 -[v016] 2022-01-31 06:23:27,479 (trainer:653) INFO: 88epoch:train:244-270batch: iter_time=0.024, forward_time=0.035, loss=2.358, loss_att=1.085, loss_ctc=3.630, acc=0.953, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.446e-04, train_time=0.126 -[v016] 2022-01-31 06:23:30,391 (trainer:653) INFO: 88epoch:train:271-297batch: iter_time=0.006, forward_time=0.035, loss=2.395, loss_att=1.023, loss_ctc=3.767, acc=0.957, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.445e-04, train_time=0.108 -[v016] 2022-01-31 06:23:33,220 (trainer:653) INFO: 88epoch:train:298-324batch: iter_time=0.006, forward_time=0.034, loss=2.445, loss_att=1.182, loss_ctc=3.707, acc=0.948, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.445e-04, train_time=0.105 -[v016] 2022-01-31 06:23:36,625 (trainer:653) INFO: 88epoch:train:325-351batch: iter_time=0.028, forward_time=0.033, loss=2.177, loss_att=1.062, loss_ctc=3.292, acc=0.954, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.444e-04, train_time=0.126 -[v016] 2022-01-31 06:23:39,336 (trainer:653) INFO: 88epoch:train:352-378batch: iter_time=0.002, forward_time=0.033, loss=2.220, loss_att=1.003, loss_ctc=3.437, acc=0.954, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.444e-04, train_time=0.100 -[v016] 2022-01-31 06:23:41,987 (trainer:653) INFO: 88epoch:train:379-405batch: iter_time=0.002, forward_time=0.033, loss=2.299, loss_att=1.190, loss_ctc=3.407, acc=0.945, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.444e-04, train_time=0.098 -[v016] 2022-01-31 06:23:44,910 (trainer:653) INFO: 88epoch:train:406-432batch: iter_time=0.009, forward_time=0.033, loss=2.582, loss_att=1.206, loss_ctc=3.958, acc=0.947, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.443e-04, train_time=0.108 -[v016] 2022-01-31 06:23:47,482 (trainer:653) INFO: 88epoch:train:433-459batch: iter_time=1.098e-04, forward_time=0.032, loss=2.337, loss_att=1.165, loss_ctc=3.509, acc=0.943, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.443e-04, train_time=0.095 -[v016] 2022-01-31 06:23:50,129 (trainer:653) INFO: 88epoch:train:460-486batch: iter_time=1.086e-04, forward_time=0.033, loss=2.364, loss_att=1.038, loss_ctc=3.690, acc=0.955, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.442e-04, train_time=0.098 -[v016] 2022-01-31 06:23:52,903 (trainer:653) INFO: 88epoch:train:487-513batch: iter_time=0.005, forward_time=0.033, loss=2.069, loss_att=1.040, loss_ctc=3.098, acc=0.952, backward_time=0.022, optim_step_time=0.023, optim0_lr0=1.442e-04, train_time=0.103 -[v016] 2022-01-31 06:23:55,835 (trainer:653) INFO: 88epoch:train:514-540batch: iter_time=0.013, forward_time=0.033, loss=2.407, loss_att=1.217, loss_ctc=3.597, acc=0.949, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.442e-04, train_time=0.108 -[v016] 2022-01-31 06:24:35,509 (trainer:328) INFO: 88epoch results: [train] iter_time=0.015, forward_time=0.035, loss=2.274, loss_att=1.088, loss_ctc=3.460, acc=0.952, backward_time=0.023, optim_step_time=0.024, optim0_lr0=1.445e-04, train_time=0.117, time=1 minute and 4.13 seconds, total_count=48136, gpu_max_cached_mem_GB=5.824, [valid] loss=6.638, loss_att=5.491, loss_ctc=7.785, acc=0.904, cer=0.100, wer=0.397, cer_ctc=0.151, time=11.58 seconds, total_count=15664, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.35 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:24:38,184 (trainer:375) INFO: The best model has been updated: train.loss, valid.acc -[v016] 2022-01-31 06:24:38,190 (trainer:261) INFO: 89/200epoch started. Estimated time to finish: 3 hours, 44 minutes and 41.82 seconds -[v016] 2022-01-31 06:24:41,102 (trainer:653) INFO: 89epoch:train:1-27batch: iter_time=0.015, forward_time=0.031, loss=2.018, loss_att=0.918, loss_ctc=3.118, acc=0.957, backward_time=0.023, optim_step_time=0.021, optim0_lr0=1.441e-04, train_time=0.107 -[v016] 2022-01-31 06:24:43,547 (trainer:653) INFO: 89epoch:train:28-54batch: iter_time=8.028e-05, forward_time=0.031, loss=2.159, loss_att=1.060, loss_ctc=3.258, acc=0.952, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.441e-04, train_time=0.090 -[v016] 2022-01-31 06:24:46,035 (trainer:653) INFO: 89epoch:train:55-81batch: iter_time=7.918e-05, forward_time=0.032, loss=2.300, loss_att=1.122, loss_ctc=3.479, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.440e-04, train_time=0.092 -[v016] 2022-01-31 06:24:48,504 (trainer:653) INFO: 89epoch:train:82-108batch: iter_time=8.571e-05, forward_time=0.031, loss=2.254, loss_att=1.066, loss_ctc=3.441, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.440e-04, train_time=0.091 -[v016] 2022-01-31 06:24:51,007 (trainer:653) INFO: 89epoch:train:109-135batch: iter_time=7.690e-05, forward_time=0.032, loss=2.503, loss_att=1.124, loss_ctc=3.882, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.439e-04, train_time=0.093 -[v016] 2022-01-31 06:24:53,496 (trainer:653) INFO: 89epoch:train:136-162batch: iter_time=7.441e-05, forward_time=0.032, loss=2.400, loss_att=1.166, loss_ctc=3.633, acc=0.948, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.439e-04, train_time=0.092 -[v016] 2022-01-31 06:24:56,221 (trainer:653) INFO: 89epoch:train:163-189batch: iter_time=0.006, forward_time=0.032, loss=2.402, loss_att=0.974, loss_ctc=3.830, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.439e-04, train_time=0.101 -[v016] 2022-01-31 06:24:58,627 (trainer:653) INFO: 89epoch:train:190-216batch: iter_time=0.001, forward_time=0.030, loss=1.840, loss_att=1.006, loss_ctc=2.674, acc=0.944, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.438e-04, train_time=0.089 -[v016] 2022-01-31 06:25:01,745 (trainer:653) INFO: 89epoch:train:217-243batch: iter_time=0.022, forward_time=0.032, loss=2.281, loss_att=1.084, loss_ctc=3.478, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.438e-04, train_time=0.115 -[v016] 2022-01-31 06:25:04,577 (trainer:653) INFO: 89epoch:train:244-270batch: iter_time=9.555e-05, forward_time=0.033, loss=2.303, loss_att=1.032, loss_ctc=3.573, acc=0.957, backward_time=0.021, optim_step_time=0.031, optim0_lr0=1.437e-04, train_time=0.105 -[v016] 2022-01-31 06:25:07,098 (trainer:653) INFO: 89epoch:train:271-297batch: iter_time=7.943e-05, forward_time=0.032, loss=2.350, loss_att=1.091, loss_ctc=3.609, acc=0.952, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.437e-04, train_time=0.093 -[v016] 2022-01-31 06:25:09,581 (trainer:653) INFO: 89epoch:train:298-324batch: iter_time=7.605e-05, forward_time=0.031, loss=2.356, loss_att=1.150, loss_ctc=3.561, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.437e-04, train_time=0.092 -[v016] 2022-01-31 06:25:12,052 (trainer:653) INFO: 89epoch:train:325-351batch: iter_time=7.741e-05, forward_time=0.032, loss=2.118, loss_att=1.059, loss_ctc=3.177, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.436e-04, train_time=0.091 -[v016] 2022-01-31 06:25:14,596 (trainer:653) INFO: 89epoch:train:352-378batch: iter_time=8.406e-05, forward_time=0.032, loss=2.288, loss_att=0.981, loss_ctc=3.595, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.436e-04, train_time=0.094 -[v016] 2022-01-31 06:25:17,001 (trainer:653) INFO: 89epoch:train:379-405batch: iter_time=7.481e-05, forward_time=0.030, loss=2.133, loss_att=1.135, loss_ctc=3.132, acc=0.942, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.435e-04, train_time=0.089 -[v016] 2022-01-31 06:25:19,475 (trainer:653) INFO: 89epoch:train:406-432batch: iter_time=8.480e-05, forward_time=0.031, loss=2.274, loss_att=1.041, loss_ctc=3.506, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.435e-04, train_time=0.091 -[v016] 2022-01-31 06:25:21,997 (trainer:653) INFO: 89epoch:train:433-459batch: iter_time=2.017e-04, forward_time=0.032, loss=2.359, loss_att=1.083, loss_ctc=3.635, acc=0.953, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.435e-04, train_time=0.093 -[v016] 2022-01-31 06:25:24,499 (trainer:653) INFO: 89epoch:train:460-486batch: iter_time=7.899e-05, forward_time=0.032, loss=2.279, loss_att=1.096, loss_ctc=3.461, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.434e-04, train_time=0.092 -[v016] 2022-01-31 06:25:27,075 (trainer:653) INFO: 89epoch:train:487-513batch: iter_time=3.158e-04, forward_time=0.033, loss=2.339, loss_att=1.086, loss_ctc=3.592, acc=0.951, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.434e-04, train_time=0.095 -[v016] 2022-01-31 06:25:29,558 (trainer:653) INFO: 89epoch:train:514-540batch: iter_time=8.386e-05, forward_time=0.031, loss=2.145, loss_att=1.066, loss_ctc=3.224, acc=0.951, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.433e-04, train_time=0.092 -[v016] 2022-01-31 06:26:05,580 (trainer:328) INFO: 89epoch results: [train] iter_time=0.002, forward_time=0.032, loss=2.257, loss_att=1.067, loss_ctc=3.447, acc=0.953, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.437e-04, train_time=0.095, time=52.09 seconds, total_count=48683, gpu_max_cached_mem_GB=5.824, [valid] loss=6.835, loss_att=5.620, loss_ctc=8.051, acc=0.901, cer=0.103, wer=0.414, cer_ctc=0.152, time=7.2 seconds, total_count=15842, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.1 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:26:08,164 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:26:08,203 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/83epoch.pth, exp/asr_train_asr_raw_en_word/84epoch.pth -[v016] 2022-01-31 06:26:08,203 (trainer:261) INFO: 90/200epoch started. Estimated time to finish: 3 hours, 41 minutes and 52.61 seconds -[v016] 2022-01-31 06:26:11,498 (trainer:653) INFO: 90epoch:train:1-27batch: iter_time=0.019, forward_time=0.033, loss=2.010, loss_att=1.018, loss_ctc=3.002, acc=0.948, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.433e-04, train_time=0.115 -[v016] 2022-01-31 06:26:13,902 (trainer:653) INFO: 90epoch:train:28-54batch: iter_time=8.091e-05, forward_time=0.030, loss=1.891, loss_att=0.886, loss_ctc=2.897, acc=0.953, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.433e-04, train_time=0.089 -[v016] 2022-01-31 06:26:16,311 (trainer:653) INFO: 90epoch:train:55-81batch: iter_time=1.069e-04, forward_time=0.030, loss=1.937, loss_att=0.945, loss_ctc=2.930, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.432e-04, train_time=0.089 -[v016] 2022-01-31 06:26:18,789 (trainer:653) INFO: 90epoch:train:82-108batch: iter_time=8.382e-05, forward_time=0.032, loss=2.012, loss_att=0.946, loss_ctc=3.078, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.432e-04, train_time=0.092 -[v016] 2022-01-31 06:26:21,316 (trainer:653) INFO: 90epoch:train:109-135batch: iter_time=9.245e-05, forward_time=0.033, loss=2.095, loss_att=0.947, loss_ctc=3.242, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.431e-04, train_time=0.093 -[v016] 2022-01-31 06:26:23,775 (trainer:653) INFO: 90epoch:train:136-162batch: iter_time=9.289e-05, forward_time=0.031, loss=2.225, loss_att=1.046, loss_ctc=3.403, acc=0.950, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.431e-04, train_time=0.091 -[v016] 2022-01-31 06:26:26,419 (trainer:653) INFO: 90epoch:train:163-189batch: iter_time=8.473e-05, forward_time=0.034, loss=2.463, loss_att=1.087, loss_ctc=3.839, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.431e-04, train_time=0.098 -[v016] 2022-01-31 06:26:28,948 (trainer:653) INFO: 90epoch:train:190-216batch: iter_time=7.766e-05, forward_time=0.032, loss=2.281, loss_att=1.064, loss_ctc=3.498, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.430e-04, train_time=0.093 -[v016] 2022-01-31 06:26:31,611 (trainer:653) INFO: 90epoch:train:217-243batch: iter_time=8.048e-05, forward_time=0.034, loss=2.626, loss_att=1.091, loss_ctc=4.160, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.430e-04, train_time=0.098 -[v016] 2022-01-31 06:26:34,753 (trainer:653) INFO: 90epoch:train:244-270batch: iter_time=0.015, forward_time=0.032, loss=1.977, loss_att=0.996, loss_ctc=2.959, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.429e-04, train_time=0.116 -[v016] 2022-01-31 06:26:37,336 (trainer:653) INFO: 90epoch:train:271-297batch: iter_time=8.429e-05, forward_time=0.033, loss=2.500, loss_att=1.142, loss_ctc=3.859, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.429e-04, train_time=0.095 -[v016] 2022-01-31 06:26:39,867 (trainer:653) INFO: 90epoch:train:298-324batch: iter_time=8.122e-05, forward_time=0.033, loss=1.974, loss_att=0.871, loss_ctc=3.078, acc=0.966, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.429e-04, train_time=0.094 -[v016] 2022-01-31 06:26:42,379 (trainer:653) INFO: 90epoch:train:325-351batch: iter_time=8.474e-05, forward_time=0.032, loss=2.297, loss_att=1.092, loss_ctc=3.503, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.428e-04, train_time=0.093 -[v016] 2022-01-31 06:26:44,817 (trainer:653) INFO: 90epoch:train:352-378batch: iter_time=7.789e-05, forward_time=0.031, loss=1.829, loss_att=0.888, loss_ctc=2.769, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.428e-04, train_time=0.090 -[v016] 2022-01-31 06:26:47,229 (trainer:653) INFO: 90epoch:train:379-405batch: iter_time=7.880e-05, forward_time=0.031, loss=2.164, loss_att=1.100, loss_ctc=3.228, acc=0.950, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.427e-04, train_time=0.089 -[v016] 2022-01-31 06:26:49,770 (trainer:653) INFO: 90epoch:train:406-432batch: iter_time=7.703e-05, forward_time=0.033, loss=2.264, loss_att=1.004, loss_ctc=3.524, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.427e-04, train_time=0.094 -[v016] 2022-01-31 06:26:52,270 (trainer:653) INFO: 90epoch:train:433-459batch: iter_time=8.357e-05, forward_time=0.032, loss=2.502, loss_att=1.176, loss_ctc=3.829, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.427e-04, train_time=0.092 -[v016] 2022-01-31 06:26:54,748 (trainer:653) INFO: 90epoch:train:460-486batch: iter_time=8.194e-05, forward_time=0.032, loss=2.026, loss_att=0.969, loss_ctc=3.082, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.426e-04, train_time=0.092 -[v016] 2022-01-31 06:26:57,207 (trainer:653) INFO: 90epoch:train:487-513batch: iter_time=8.101e-05, forward_time=0.032, loss=2.194, loss_att=1.102, loss_ctc=3.286, acc=0.949, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.426e-04, train_time=0.091 -[v016] 2022-01-31 06:26:59,723 (trainer:653) INFO: 90epoch:train:514-540batch: iter_time=8.241e-05, forward_time=0.032, loss=2.376, loss_att=1.132, loss_ctc=3.620, acc=0.948, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.426e-04, train_time=0.093 -[v016] 2022-01-31 06:27:33,564 (trainer:328) INFO: 90epoch results: [train] iter_time=0.002, forward_time=0.032, loss=2.183, loss_att=1.027, loss_ctc=3.338, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.429e-04, train_time=0.095, time=52.17 seconds, total_count=49230, gpu_max_cached_mem_GB=5.824, [valid] loss=6.887, loss_att=5.631, loss_ctc=8.143, acc=0.903, cer=0.102, wer=0.408, cer_ctc=0.152, time=6.24 seconds, total_count=16020, gpu_max_cached_mem_GB=5.824, [att_plot] time=26.9 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:27:35,651 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:27:35,657 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/85epoch.pth -[v016] 2022-01-31 06:27:35,658 (trainer:261) INFO: 91/200epoch started. Estimated time to finish: 3 hours, 39 minutes and 1.63 seconds -[v016] 2022-01-31 06:27:38,708 (trainer:653) INFO: 91epoch:train:1-27batch: iter_time=0.014, forward_time=0.034, loss=2.509, loss_att=0.984, loss_ctc=4.035, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.425e-04, train_time=0.111 -[v016] 2022-01-31 06:27:41,230 (trainer:653) INFO: 91epoch:train:28-54batch: iter_time=9.573e-05, forward_time=0.032, loss=2.029, loss_att=0.892, loss_ctc=3.166, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.425e-04, train_time=0.093 -[v016] 2022-01-31 06:27:43,693 (trainer:653) INFO: 91epoch:train:55-81batch: iter_time=9.441e-05, forward_time=0.031, loss=1.995, loss_att=0.924, loss_ctc=3.067, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.424e-04, train_time=0.091 -[v016] 2022-01-31 06:27:46,104 (trainer:653) INFO: 91epoch:train:82-108batch: iter_time=7.837e-05, forward_time=0.031, loss=1.878, loss_att=0.936, loss_ctc=2.820, acc=0.956, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.424e-04, train_time=0.089 -[v016] 2022-01-31 06:27:48,511 (trainer:653) INFO: 91epoch:train:109-135batch: iter_time=8.440e-05, forward_time=0.031, loss=1.998, loss_att=0.916, loss_ctc=3.080, acc=0.961, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.423e-04, train_time=0.089 -[v016] 2022-01-31 06:27:50,958 (trainer:653) INFO: 91epoch:train:136-162batch: iter_time=8.821e-05, forward_time=0.031, loss=1.889, loss_att=0.941, loss_ctc=2.838, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.423e-04, train_time=0.090 -[v016] 2022-01-31 06:27:53,412 (trainer:653) INFO: 91epoch:train:163-189batch: iter_time=8.364e-05, forward_time=0.031, loss=2.234, loss_att=1.012, loss_ctc=3.456, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.423e-04, train_time=0.091 -[v016] 2022-01-31 06:27:55,889 (trainer:653) INFO: 91epoch:train:190-216batch: iter_time=8.592e-05, forward_time=0.032, loss=2.378, loss_att=1.133, loss_ctc=3.622, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.422e-04, train_time=0.092 -[v016] 2022-01-31 06:27:58,303 (trainer:653) INFO: 91epoch:train:217-243batch: iter_time=8.263e-05, forward_time=0.031, loss=2.062, loss_att=0.900, loss_ctc=3.224, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.422e-04, train_time=0.089 -[v016] 2022-01-31 06:28:00,862 (trainer:653) INFO: 91epoch:train:244-270batch: iter_time=8.720e-05, forward_time=0.033, loss=2.182, loss_att=0.931, loss_ctc=3.434, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.422e-04, train_time=0.095 -[v016] 2022-01-31 06:28:03,253 (trainer:653) INFO: 91epoch:train:271-297batch: iter_time=8.226e-05, forward_time=0.030, loss=2.350, loss_att=1.154, loss_ctc=3.546, acc=0.947, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.421e-04, train_time=0.088 -[v016] 2022-01-31 06:28:05,664 (trainer:653) INFO: 91epoch:train:298-324batch: iter_time=8.996e-05, forward_time=0.031, loss=2.344, loss_att=1.099, loss_ctc=3.588, acc=0.944, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.421e-04, train_time=0.089 -[v016] 2022-01-31 06:28:08,079 (trainer:653) INFO: 91epoch:train:325-351batch: iter_time=9.947e-05, forward_time=0.031, loss=1.850, loss_att=0.935, loss_ctc=2.765, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.420e-04, train_time=0.089 -[v016] 2022-01-31 06:28:10,533 (trainer:653) INFO: 91epoch:train:352-378batch: iter_time=9.249e-05, forward_time=0.032, loss=2.249, loss_att=1.088, loss_ctc=3.411, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.420e-04, train_time=0.091 -[v016] 2022-01-31 06:28:13,062 (trainer:653) INFO: 91epoch:train:379-405batch: iter_time=8.830e-05, forward_time=0.033, loss=2.283, loss_att=1.046, loss_ctc=3.520, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.420e-04, train_time=0.093 -[v016] 2022-01-31 06:28:15,644 (trainer:653) INFO: 91epoch:train:406-432batch: iter_time=9.242e-05, forward_time=0.033, loss=2.298, loss_att=1.040, loss_ctc=3.555, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.419e-04, train_time=0.095 -[v016] 2022-01-31 06:28:18,123 (trainer:653) INFO: 91epoch:train:433-459batch: iter_time=9.032e-05, forward_time=0.032, loss=2.409, loss_att=1.093, loss_ctc=3.725, acc=0.948, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.419e-04, train_time=0.092 -[v016] 2022-01-31 06:28:20,612 (trainer:653) INFO: 91epoch:train:460-486batch: iter_time=8.040e-05, forward_time=0.032, loss=2.314, loss_att=1.041, loss_ctc=3.588, acc=0.951, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.418e-04, train_time=0.092 -[v016] 2022-01-31 06:28:23,045 (trainer:653) INFO: 91epoch:train:487-513batch: iter_time=7.632e-05, forward_time=0.031, loss=2.126, loss_att=1.061, loss_ctc=3.191, acc=0.950, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.418e-04, train_time=0.090 -[v016] 2022-01-31 06:28:25,496 (trainer:653) INFO: 91epoch:train:514-540batch: iter_time=7.835e-05, forward_time=0.031, loss=2.218, loss_att=1.053, loss_ctc=3.382, acc=0.957, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.418e-04, train_time=0.091 -[v016] 2022-01-31 06:28:59,149 (trainer:328) INFO: 91epoch results: [train] iter_time=7.705e-04, forward_time=0.032, loss=2.178, loss_att=1.008, loss_ctc=3.347, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.421e-04, train_time=0.092, time=50.52 seconds, total_count=49777, gpu_max_cached_mem_GB=5.824, [valid] loss=6.791, loss_att=5.566, loss_ctc=8.016, acc=0.904, cer=0.100, wer=0.400, cer_ctc=0.144, time=5.57 seconds, total_count=16198, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.37 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:29:01,191 (trainer:375) INFO: The best model has been updated: train.loss, train.acc, valid.acc -[v016] 2022-01-31 06:29:01,197 (trainer:261) INFO: 92/200epoch started. Estimated time to finish: 3 hours, 36 minutes and 10.07 seconds -[v016] 2022-01-31 06:29:04,051 (trainer:653) INFO: 92epoch:train:1-27batch: iter_time=0.009, forward_time=0.033, loss=1.972, loss_att=0.960, loss_ctc=2.983, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.417e-04, train_time=0.104 -[v016] 2022-01-31 06:29:06,563 (trainer:653) INFO: 92epoch:train:28-54batch: iter_time=8.774e-05, forward_time=0.032, loss=2.044, loss_att=0.939, loss_ctc=3.149, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.417e-04, train_time=0.093 -[v016] 2022-01-31 06:29:08,985 (trainer:653) INFO: 92epoch:train:55-81batch: iter_time=8.150e-05, forward_time=0.031, loss=2.121, loss_att=1.051, loss_ctc=3.191, acc=0.950, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.416e-04, train_time=0.090 -[v016] 2022-01-31 06:29:11,810 (trainer:653) INFO: 92epoch:train:82-108batch: iter_time=0.013, forward_time=0.032, loss=2.287, loss_att=0.998, loss_ctc=3.577, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.416e-04, train_time=0.104 -[v016] 2022-01-31 06:29:14,315 (trainer:653) INFO: 92epoch:train:109-135batch: iter_time=7.610e-05, forward_time=0.032, loss=2.275, loss_att=1.042, loss_ctc=3.508, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.416e-04, train_time=0.093 -[v016] 2022-01-31 06:29:16,737 (trainer:653) INFO: 92epoch:train:136-162batch: iter_time=7.603e-05, forward_time=0.031, loss=2.072, loss_att=0.978, loss_ctc=3.166, acc=0.957, backward_time=0.020, optim_step_time=0.021, optim0_lr0=1.415e-04, train_time=0.089 -[v016] 2022-01-31 06:29:19,318 (trainer:653) INFO: 92epoch:train:163-189batch: iter_time=7.853e-05, forward_time=0.033, loss=2.540, loss_att=1.047, loss_ctc=4.032, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.415e-04, train_time=0.095 -[v016] 2022-01-31 06:29:21,856 (trainer:653) INFO: 92epoch:train:190-216batch: iter_time=9.075e-04, forward_time=0.033, loss=2.377, loss_att=1.098, loss_ctc=3.656, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.414e-04, train_time=0.094 -[v016] 2022-01-31 06:29:24,281 (trainer:653) INFO: 92epoch:train:217-243batch: iter_time=7.426e-05, forward_time=0.032, loss=1.850, loss_att=0.941, loss_ctc=2.758, acc=0.955, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.414e-04, train_time=0.090 -[v016] 2022-01-31 06:29:26,844 (trainer:653) INFO: 92epoch:train:244-270batch: iter_time=7.574e-05, forward_time=0.033, loss=2.544, loss_att=1.123, loss_ctc=3.965, acc=0.952, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.414e-04, train_time=0.095 -[v016] 2022-01-31 06:29:29,274 (trainer:653) INFO: 92epoch:train:271-297batch: iter_time=7.510e-05, forward_time=0.031, loss=2.032, loss_att=1.006, loss_ctc=3.058, acc=0.952, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.413e-04, train_time=0.090 -[v016] 2022-01-31 06:29:31,708 (trainer:653) INFO: 92epoch:train:298-324batch: iter_time=7.710e-05, forward_time=0.032, loss=2.064, loss_att=1.047, loss_ctc=3.080, acc=0.951, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.413e-04, train_time=0.090 -[v016] 2022-01-31 06:29:34,241 (trainer:653) INFO: 92epoch:train:325-351batch: iter_time=7.775e-05, forward_time=0.033, loss=2.302, loss_att=1.089, loss_ctc=3.514, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.413e-04, train_time=0.094 -[v016] 2022-01-31 06:29:36,712 (trainer:653) INFO: 92epoch:train:352-378batch: iter_time=8.310e-05, forward_time=0.032, loss=2.133, loss_att=1.007, loss_ctc=3.259, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.412e-04, train_time=0.091 -[v016] 2022-01-31 06:29:39,305 (trainer:653) INFO: 92epoch:train:379-405batch: iter_time=8.070e-05, forward_time=0.034, loss=2.362, loss_att=1.091, loss_ctc=3.633, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.412e-04, train_time=0.096 -[v016] 2022-01-31 06:29:41,747 (trainer:653) INFO: 92epoch:train:406-432batch: iter_time=8.410e-05, forward_time=0.032, loss=1.933, loss_att=0.974, loss_ctc=2.892, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.411e-04, train_time=0.090 -[v016] 2022-01-31 06:29:44,484 (trainer:653) INFO: 92epoch:train:433-459batch: iter_time=0.009, forward_time=0.032, loss=2.208, loss_att=1.059, loss_ctc=3.357, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.411e-04, train_time=0.101 -[v016] 2022-01-31 06:29:47,026 (trainer:653) INFO: 92epoch:train:460-486batch: iter_time=7.824e-05, forward_time=0.031, loss=1.826, loss_att=0.885, loss_ctc=2.768, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.411e-04, train_time=0.094 -[v016] 2022-01-31 06:29:49,465 (trainer:653) INFO: 92epoch:train:487-513batch: iter_time=7.784e-05, forward_time=0.031, loss=2.029, loss_att=0.944, loss_ctc=3.114, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.410e-04, train_time=0.090 -[v016] 2022-01-31 06:29:51,891 (trainer:653) INFO: 92epoch:train:514-540batch: iter_time=7.839e-05, forward_time=0.032, loss=1.821, loss_att=0.828, loss_ctc=2.815, acc=0.961, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.410e-04, train_time=0.090 -[v016] 2022-01-31 06:30:25,147 (trainer:328) INFO: 92epoch results: [train] iter_time=0.002, forward_time=0.032, loss=2.154, loss_att=1.008, loss_ctc=3.299, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.413e-04, train_time=0.094, time=51.47 seconds, total_count=50324, gpu_max_cached_mem_GB=5.824, [valid] loss=6.777, loss_att=5.584, loss_ctc=7.969, acc=0.905, cer=0.099, wer=0.394, cer_ctc=0.151, time=5.46 seconds, total_count=16376, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.02 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:30:27,126 (trainer:375) INFO: The best model has been updated: train.loss, valid.acc -[v016] 2022-01-31 06:30:27,173 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/87epoch.pth -[v016] 2022-01-31 06:30:27,173 (trainer:261) INFO: 93/200epoch started. Estimated time to finish: 3 hours, 33 minutes and 21.56 seconds -[v016] 2022-01-31 06:30:29,918 (trainer:653) INFO: 93epoch:train:1-27batch: iter_time=0.003, forward_time=0.033, loss=2.086, loss_att=0.953, loss_ctc=3.219, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.409e-04, train_time=0.099 -[v016] 2022-01-31 06:30:32,393 (trainer:653) INFO: 93epoch:train:28-54batch: iter_time=8.115e-05, forward_time=0.031, loss=1.913, loss_att=0.929, loss_ctc=2.896, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.409e-04, train_time=0.094 -[v016] 2022-01-31 06:30:34,845 (trainer:653) INFO: 93epoch:train:55-81batch: iter_time=7.564e-05, forward_time=0.031, loss=2.233, loss_att=1.033, loss_ctc=3.432, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.409e-04, train_time=0.091 -[v016] 2022-01-31 06:30:37,339 (trainer:653) INFO: 93epoch:train:82-108batch: iter_time=7.545e-05, forward_time=0.032, loss=2.097, loss_att=0.920, loss_ctc=3.274, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.408e-04, train_time=0.092 -[v016] 2022-01-31 06:30:39,838 (trainer:653) INFO: 93epoch:train:109-135batch: iter_time=7.456e-05, forward_time=0.031, loss=2.101, loss_att=0.904, loss_ctc=3.297, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.408e-04, train_time=0.092 -[v016] 2022-01-31 06:30:42,445 (trainer:653) INFO: 93epoch:train:136-162batch: iter_time=0.004, forward_time=0.032, loss=2.290, loss_att=0.997, loss_ctc=3.584, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.408e-04, train_time=0.096 -[v016] 2022-01-31 06:30:45,590 (trainer:653) INFO: 93epoch:train:163-189batch: iter_time=0.026, forward_time=0.031, loss=2.001, loss_att=1.036, loss_ctc=2.965, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.407e-04, train_time=0.116 -[v016] 2022-01-31 06:30:47,973 (trainer:653) INFO: 93epoch:train:190-216batch: iter_time=5.946e-04, forward_time=0.030, loss=1.779, loss_att=0.898, loss_ctc=2.659, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.407e-04, train_time=0.088 -[v016] 2022-01-31 06:30:50,409 (trainer:653) INFO: 93epoch:train:217-243batch: iter_time=7.743e-05, forward_time=0.032, loss=2.227, loss_att=1.101, loss_ctc=3.353, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.406e-04, train_time=0.090 -[v016] 2022-01-31 06:30:52,961 (trainer:653) INFO: 93epoch:train:244-270batch: iter_time=7.701e-05, forward_time=0.033, loss=2.375, loss_att=1.062, loss_ctc=3.689, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.406e-04, train_time=0.094 -[v016] 2022-01-31 06:30:55,422 (trainer:653) INFO: 93epoch:train:271-297batch: iter_time=7.069e-04, forward_time=0.031, loss=2.025, loss_att=0.937, loss_ctc=3.114, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.406e-04, train_time=0.091 -[v016] 2022-01-31 06:30:57,923 (trainer:653) INFO: 93epoch:train:298-324batch: iter_time=7.392e-04, forward_time=0.032, loss=1.975, loss_att=1.026, loss_ctc=2.923, acc=0.944, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.405e-04, train_time=0.092 -[v016] 2022-01-31 06:31:00,453 (trainer:653) INFO: 93epoch:train:325-351batch: iter_time=8.520e-05, forward_time=0.032, loss=2.035, loss_att=0.898, loss_ctc=3.172, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.405e-04, train_time=0.093 -[v016] 2022-01-31 06:31:02,928 (trainer:653) INFO: 93epoch:train:352-378batch: iter_time=8.328e-05, forward_time=0.032, loss=2.084, loss_att=1.002, loss_ctc=3.167, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.405e-04, train_time=0.091 -[v016] 2022-01-31 06:31:05,562 (trainer:653) INFO: 93epoch:train:379-405batch: iter_time=9.166e-05, forward_time=0.034, loss=2.291, loss_att=1.040, loss_ctc=3.542, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.404e-04, train_time=0.097 -[v016] 2022-01-31 06:31:08,670 (trainer:653) INFO: 93epoch:train:406-432batch: iter_time=0.024, forward_time=0.032, loss=2.032, loss_att=0.966, loss_ctc=3.099, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.404e-04, train_time=0.115 -[v016] 2022-01-31 06:31:11,136 (trainer:653) INFO: 93epoch:train:433-459batch: iter_time=8.973e-05, forward_time=0.032, loss=1.973, loss_att=1.051, loss_ctc=2.895, acc=0.953, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.403e-04, train_time=0.091 -[v016] 2022-01-31 06:31:13,633 (trainer:653) INFO: 93epoch:train:460-486batch: iter_time=9.382e-05, forward_time=0.032, loss=1.934, loss_att=0.965, loss_ctc=2.903, acc=0.953, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.403e-04, train_time=0.092 -[v016] 2022-01-31 06:31:16,235 (trainer:653) INFO: 93epoch:train:487-513batch: iter_time=0.001, forward_time=0.033, loss=2.609, loss_att=1.175, loss_ctc=4.044, acc=0.953, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.403e-04, train_time=0.096 -[v016] 2022-01-31 06:31:18,770 (trainer:653) INFO: 93epoch:train:514-540batch: iter_time=8.886e-05, forward_time=0.032, loss=2.100, loss_att=0.966, loss_ctc=3.234, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.402e-04, train_time=0.094 -[v016] 2022-01-31 06:31:52,943 (trainer:328) INFO: 93epoch results: [train] iter_time=0.003, forward_time=0.032, loss=2.106, loss_att=0.992, loss_ctc=3.220, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.406e-04, train_time=0.095, time=52.3 seconds, total_count=50871, gpu_max_cached_mem_GB=5.824, [valid] loss=6.848, loss_att=5.653, loss_ctc=8.042, acc=0.904, cer=0.099, wer=0.404, cer_ctc=0.148, time=5.53 seconds, total_count=16554, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.94 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:31:54,990 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:31:54,996 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/78epoch.pth, exp/asr_train_asr_raw_en_word/86epoch.pth -[v016] 2022-01-31 06:31:55,000 (trainer:261) INFO: 94/200epoch started. Estimated time to finish: 3 hours, 30 minutes and 38.01 seconds -[v016] 2022-01-31 06:31:57,925 (trainer:653) INFO: 94epoch:train:1-27batch: iter_time=0.014, forward_time=0.031, loss=1.937, loss_att=0.893, loss_ctc=2.981, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.402e-04, train_time=0.108 -[v016] 2022-01-31 06:32:00,385 (trainer:653) INFO: 94epoch:train:28-54batch: iter_time=9.676e-05, forward_time=0.031, loss=2.232, loss_att=1.064, loss_ctc=3.401, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.401e-04, train_time=0.091 -[v016] 2022-01-31 06:32:02,959 (trainer:653) INFO: 94epoch:train:55-81batch: iter_time=8.681e-05, forward_time=0.034, loss=2.014, loss_att=0.813, loss_ctc=3.216, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.401e-04, train_time=0.095 -[v016] 2022-01-31 06:32:05,516 (trainer:653) INFO: 94epoch:train:82-108batch: iter_time=8.189e-05, forward_time=0.033, loss=2.339, loss_att=1.107, loss_ctc=3.570, acc=0.953, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.401e-04, train_time=0.095 -[v016] 2022-01-31 06:32:08,071 (trainer:653) INFO: 94epoch:train:109-135batch: iter_time=5.155e-04, forward_time=0.033, loss=1.919, loss_att=0.929, loss_ctc=2.910, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.400e-04, train_time=0.094 -[v016] 2022-01-31 06:32:10,505 (trainer:653) INFO: 94epoch:train:136-162batch: iter_time=7.658e-05, forward_time=0.031, loss=1.913, loss_att=0.949, loss_ctc=2.877, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.400e-04, train_time=0.090 -[v016] 2022-01-31 06:32:12,980 (trainer:653) INFO: 94epoch:train:163-189batch: iter_time=7.937e-05, forward_time=0.032, loss=1.978, loss_att=0.981, loss_ctc=2.975, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.400e-04, train_time=0.091 -[v016] 2022-01-31 06:32:15,476 (trainer:653) INFO: 94epoch:train:190-216batch: iter_time=7.592e-05, forward_time=0.032, loss=2.148, loss_att=0.972, loss_ctc=3.325, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.399e-04, train_time=0.092 -[v016] 2022-01-31 06:32:18,092 (trainer:653) INFO: 94epoch:train:217-243batch: iter_time=0.002, forward_time=0.033, loss=2.296, loss_att=0.970, loss_ctc=3.621, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.399e-04, train_time=0.097 -[v016] 2022-01-31 06:32:21,121 (trainer:653) INFO: 94epoch:train:244-270batch: iter_time=0.018, forward_time=0.032, loss=2.211, loss_att=0.950, loss_ctc=3.472, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.399e-04, train_time=0.112 -[v016] 2022-01-31 06:32:23,575 (trainer:653) INFO: 94epoch:train:271-297batch: iter_time=4.073e-04, forward_time=0.031, loss=2.042, loss_att=0.997, loss_ctc=3.088, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.398e-04, train_time=0.091 -[v016] 2022-01-31 06:32:26,108 (trainer:653) INFO: 94epoch:train:298-324batch: iter_time=8.670e-05, forward_time=0.032, loss=1.914, loss_att=0.878, loss_ctc=2.951, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.398e-04, train_time=0.094 -[v016] 2022-01-31 06:32:28,733 (trainer:653) INFO: 94epoch:train:325-351batch: iter_time=0.006, forward_time=0.032, loss=2.160, loss_att=1.075, loss_ctc=3.246, acc=0.953, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.397e-04, train_time=0.097 -[v016] 2022-01-31 06:32:31,255 (trainer:653) INFO: 94epoch:train:352-378batch: iter_time=9.518e-04, forward_time=0.032, loss=2.070, loss_att=0.977, loss_ctc=3.163, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.397e-04, train_time=0.093 -[v016] 2022-01-31 06:32:33,855 (trainer:653) INFO: 94epoch:train:379-405batch: iter_time=0.001, forward_time=0.033, loss=2.514, loss_att=1.138, loss_ctc=3.890, acc=0.956, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.397e-04, train_time=0.096 -[v016] 2022-01-31 06:32:36,689 (trainer:653) INFO: 94epoch:train:406-432batch: iter_time=0.012, forward_time=0.032, loss=2.076, loss_att=1.014, loss_ctc=3.139, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.396e-04, train_time=0.105 -[v016] 2022-01-31 06:32:39,125 (trainer:653) INFO: 94epoch:train:433-459batch: iter_time=8.189e-05, forward_time=0.031, loss=1.827, loss_att=0.964, loss_ctc=2.690, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.396e-04, train_time=0.090 -[v016] 2022-01-31 06:32:41,534 (trainer:653) INFO: 94epoch:train:460-486batch: iter_time=8.116e-05, forward_time=0.030, loss=1.921, loss_att=1.001, loss_ctc=2.841, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.396e-04, train_time=0.089 -[v016] 2022-01-31 06:32:43,977 (trainer:653) INFO: 94epoch:train:487-513batch: iter_time=8.524e-05, forward_time=0.031, loss=1.966, loss_att=0.932, loss_ctc=3.001, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.395e-04, train_time=0.090 -[v016] 2022-01-31 06:32:46,425 (trainer:653) INFO: 94epoch:train:514-540batch: iter_time=0.001, forward_time=0.030, loss=2.160, loss_att=1.066, loss_ctc=3.254, acc=0.952, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.395e-04, train_time=0.090 -[v016] 2022-01-31 06:33:22,911 (trainer:328) INFO: 94epoch results: [train] iter_time=0.003, forward_time=0.032, loss=2.076, loss_att=0.980, loss_ctc=3.171, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.398e-04, train_time=0.095, time=52.11 seconds, total_count=51418, gpu_max_cached_mem_GB=5.824, [valid] loss=6.862, loss_att=5.651, loss_ctc=8.072, acc=0.904, cer=0.099, wer=0.400, cer_ctc=0.151, time=6.41 seconds, total_count=16732, gpu_max_cached_mem_GB=5.824, [att_plot] time=29.39 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:33:25,006 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:33:25,050 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/89epoch.pth -[v016] 2022-01-31 06:33:25,050 (trainer:261) INFO: 95/200epoch started. Estimated time to finish: 3 hours, 27 minutes and 59.71 seconds -[v016] 2022-01-31 06:33:29,054 (trainer:653) INFO: 95epoch:train:1-27batch: iter_time=0.010, forward_time=0.054, loss=1.776, loss_att=0.826, loss_ctc=2.726, acc=0.961, backward_time=0.037, optim_step_time=0.021, optim0_lr0=1.394e-04, train_time=0.147 -[v016] 2022-01-31 06:33:31,504 (trainer:653) INFO: 95epoch:train:28-54batch: iter_time=4.092e-04, forward_time=0.031, loss=1.902, loss_att=0.933, loss_ctc=2.871, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.394e-04, train_time=0.091 -[v016] 2022-01-31 06:33:33,932 (trainer:653) INFO: 95epoch:train:55-81batch: iter_time=0.002, forward_time=0.030, loss=1.735, loss_att=0.900, loss_ctc=2.569, acc=0.950, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.394e-04, train_time=0.090 -[v016] 2022-01-31 06:33:36,629 (trainer:653) INFO: 95epoch:train:82-108batch: iter_time=0.009, forward_time=0.031, loss=1.804, loss_att=0.966, loss_ctc=2.643, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.393e-04, train_time=0.100 -[v016] 2022-01-31 06:33:39,065 (trainer:653) INFO: 95epoch:train:109-135batch: iter_time=7.947e-05, forward_time=0.031, loss=1.730, loss_att=0.839, loss_ctc=2.621, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.393e-04, train_time=0.090 -[v016] 2022-01-31 06:33:41,677 (trainer:653) INFO: 95epoch:train:136-162batch: iter_time=7.735e-05, forward_time=0.033, loss=2.309, loss_att=0.991, loss_ctc=3.626, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.393e-04, train_time=0.097 -[v016] 2022-01-31 06:33:44,165 (trainer:653) INFO: 95epoch:train:163-189batch: iter_time=7.923e-05, forward_time=0.031, loss=2.162, loss_att=1.005, loss_ctc=3.319, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.392e-04, train_time=0.092 -[v016] 2022-01-31 06:33:46,604 (trainer:653) INFO: 95epoch:train:190-216batch: iter_time=8.036e-05, forward_time=0.031, loss=2.113, loss_att=1.025, loss_ctc=3.201, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.392e-04, train_time=0.090 -[v016] 2022-01-31 06:33:49,184 (trainer:653) INFO: 95epoch:train:217-243batch: iter_time=0.002, forward_time=0.032, loss=2.195, loss_att=0.999, loss_ctc=3.391, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.391e-04, train_time=0.095 -[v016] 2022-01-31 06:33:51,590 (trainer:653) INFO: 95epoch:train:244-270batch: iter_time=8.610e-04, forward_time=0.031, loss=1.710, loss_att=0.935, loss_ctc=2.486, acc=0.956, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.391e-04, train_time=0.089 -[v016] 2022-01-31 06:33:54,828 (trainer:653) INFO: 95epoch:train:271-297batch: iter_time=0.026, forward_time=0.032, loss=2.092, loss_att=0.944, loss_ctc=3.241, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.391e-04, train_time=0.120 -[v016] 2022-01-31 06:33:58,119 (trainer:653) INFO: 95epoch:train:298-324batch: iter_time=0.028, forward_time=0.032, loss=2.247, loss_att=0.958, loss_ctc=3.537, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.390e-04, train_time=0.122 -[v016] 2022-01-31 06:34:00,607 (trainer:653) INFO: 95epoch:train:325-351batch: iter_time=8.570e-05, forward_time=0.031, loss=2.222, loss_att=1.053, loss_ctc=3.391, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.390e-04, train_time=0.092 -[v016] 2022-01-31 06:34:03,112 (trainer:653) INFO: 95epoch:train:352-378batch: iter_time=8.203e-04, forward_time=0.032, loss=2.132, loss_att=0.960, loss_ctc=3.305, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.390e-04, train_time=0.093 -[v016] 2022-01-31 06:34:05,547 (trainer:653) INFO: 95epoch:train:379-405batch: iter_time=7.805e-05, forward_time=0.030, loss=2.134, loss_att=1.097, loss_ctc=3.170, acc=0.950, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.389e-04, train_time=0.090 -[v016] 2022-01-31 06:34:07,967 (trainer:653) INFO: 95epoch:train:406-432batch: iter_time=2.068e-04, forward_time=0.030, loss=1.822, loss_att=0.893, loss_ctc=2.751, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.389e-04, train_time=0.089 -[v016] 2022-01-31 06:34:10,467 (trainer:653) INFO: 95epoch:train:433-459batch: iter_time=7.882e-05, forward_time=0.032, loss=2.087, loss_att=0.984, loss_ctc=3.190, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.389e-04, train_time=0.092 -[v016] 2022-01-31 06:34:12,935 (trainer:653) INFO: 95epoch:train:460-486batch: iter_time=8.755e-05, forward_time=0.031, loss=2.229, loss_att=1.095, loss_ctc=3.362, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.388e-04, train_time=0.091 -[v016] 2022-01-31 06:34:15,398 (trainer:653) INFO: 95epoch:train:487-513batch: iter_time=7.801e-05, forward_time=0.031, loss=2.030, loss_att=0.866, loss_ctc=3.194, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.388e-04, train_time=0.091 -[v016] 2022-01-31 06:34:17,948 (trainer:653) INFO: 95epoch:train:514-540batch: iter_time=7.864e-05, forward_time=0.032, loss=2.260, loss_att=0.992, loss_ctc=3.528, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.387e-04, train_time=0.094 -[v016] 2022-01-31 06:34:54,320 (trainer:328) INFO: 95epoch results: [train] iter_time=0.004, forward_time=0.032, loss=2.027, loss_att=0.961, loss_ctc=3.094, acc=0.958, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.391e-04, train_time=0.098, time=53.56 seconds, total_count=51965, gpu_max_cached_mem_GB=5.824, [valid] loss=6.773, loss_att=5.552, loss_ctc=7.994, acc=0.902, cer=0.100, wer=0.403, cer_ctc=0.147, time=6.83 seconds, total_count=16910, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.86 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:34:58,377 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:34:58,427 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/90epoch.pth -[v016] 2022-01-31 06:34:58,428 (trainer:261) INFO: 96/200epoch started. Estimated time to finish: 3 hours, 25 minutes and 27.88 seconds -[v016] 2022-01-31 06:35:04,040 (trainer:653) INFO: 96epoch:train:1-27batch: iter_time=0.088, forward_time=0.036, loss=1.809, loss_att=0.909, loss_ctc=2.709, acc=0.957, backward_time=0.030, optim_step_time=0.023, optim0_lr0=1.387e-04, train_time=0.202 -[v016] 2022-01-31 06:35:08,108 (trainer:653) INFO: 96epoch:train:28-54batch: iter_time=0.048, forward_time=0.035, loss=1.764, loss_att=0.861, loss_ctc=2.666, acc=0.959, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.387e-04, train_time=0.150 -[v016] 2022-01-31 06:35:11,224 (trainer:653) INFO: 96epoch:train:55-81batch: iter_time=0.013, forward_time=0.034, loss=1.761, loss_att=0.835, loss_ctc=2.686, acc=0.959, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.386e-04, train_time=0.115 -[v016] 2022-01-31 06:35:14,299 (trainer:653) INFO: 96epoch:train:82-108batch: iter_time=0.016, forward_time=0.034, loss=2.052, loss_att=0.844, loss_ctc=3.261, acc=0.963, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.386e-04, train_time=0.114 -[v016] 2022-01-31 06:35:17,122 (trainer:653) INFO: 96epoch:train:109-135batch: iter_time=0.011, forward_time=0.032, loss=2.293, loss_att=1.008, loss_ctc=3.578, acc=0.959, backward_time=0.021, optim_step_time=0.022, optim0_lr0=1.386e-04, train_time=0.104 -[v016] 2022-01-31 06:35:21,190 (trainer:653) INFO: 96epoch:train:136-162batch: iter_time=0.060, forward_time=0.031, loss=1.867, loss_att=0.915, loss_ctc=2.819, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.385e-04, train_time=0.150 -[v016] 2022-01-31 06:35:24,273 (trainer:653) INFO: 96epoch:train:163-189batch: iter_time=0.016, forward_time=0.034, loss=1.976, loss_att=0.922, loss_ctc=3.030, acc=0.956, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.385e-04, train_time=0.114 -[v016] 2022-01-31 06:35:26,985 (trainer:653) INFO: 96epoch:train:190-216batch: iter_time=0.002, forward_time=0.033, loss=1.587, loss_att=0.752, loss_ctc=2.423, acc=0.965, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.385e-04, train_time=0.100 -[v016] 2022-01-31 06:35:29,891 (trainer:653) INFO: 96epoch:train:217-243batch: iter_time=0.013, forward_time=0.032, loss=1.908, loss_att=0.915, loss_ctc=2.901, acc=0.960, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.384e-04, train_time=0.107 -[v016] 2022-01-31 06:35:32,792 (trainer:653) INFO: 96epoch:train:244-270batch: iter_time=0.008, forward_time=0.034, loss=2.391, loss_att=1.105, loss_ctc=3.677, acc=0.956, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.384e-04, train_time=0.107 -[v016] 2022-01-31 06:35:35,714 (trainer:653) INFO: 96epoch:train:271-297batch: iter_time=0.011, forward_time=0.033, loss=1.893, loss_att=0.915, loss_ctc=2.872, acc=0.961, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.383e-04, train_time=0.108 -[v016] 2022-01-31 06:35:38,449 (trainer:653) INFO: 96epoch:train:298-324batch: iter_time=0.002, forward_time=0.033, loss=2.128, loss_att=0.954, loss_ctc=3.302, acc=0.958, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.383e-04, train_time=0.101 -[v016] 2022-01-31 06:35:41,651 (trainer:653) INFO: 96epoch:train:325-351batch: iter_time=0.021, forward_time=0.033, loss=2.047, loss_att=1.038, loss_ctc=3.056, acc=0.953, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.383e-04, train_time=0.118 -[v016] 2022-01-31 06:35:44,304 (trainer:653) INFO: 96epoch:train:352-378batch: iter_time=0.001, forward_time=0.034, loss=2.096, loss_att=0.997, loss_ctc=3.196, acc=0.955, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.382e-04, train_time=0.098 -[v016] 2022-01-31 06:35:47,064 (trainer:653) INFO: 96epoch:train:379-405batch: iter_time=0.002, forward_time=0.034, loss=2.520, loss_att=1.124, loss_ctc=3.917, acc=0.960, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.382e-04, train_time=0.102 -[v016] 2022-01-31 06:35:49,842 (trainer:653) INFO: 96epoch:train:406-432batch: iter_time=0.005, forward_time=0.033, loss=2.005, loss_att=0.959, loss_ctc=3.051, acc=0.960, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.382e-04, train_time=0.103 -[v016] 2022-01-31 06:35:52,593 (trainer:653) INFO: 96epoch:train:433-459batch: iter_time=0.002, forward_time=0.034, loss=2.282, loss_att=1.014, loss_ctc=3.550, acc=0.954, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.381e-04, train_time=0.102 -[v016] 2022-01-31 06:35:55,502 (trainer:653) INFO: 96epoch:train:460-486batch: iter_time=0.010, forward_time=0.033, loss=2.126, loss_att=0.995, loss_ctc=3.257, acc=0.956, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.381e-04, train_time=0.108 -[v016] 2022-01-31 06:35:58,033 (trainer:653) INFO: 96epoch:train:487-513batch: iter_time=9.741e-04, forward_time=0.031, loss=1.827, loss_att=0.905, loss_ctc=2.749, acc=0.960, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.381e-04, train_time=0.094 -[v016] 2022-01-31 06:36:01,622 (trainer:653) INFO: 96epoch:train:514-540batch: iter_time=0.043, forward_time=0.031, loss=1.773, loss_att=0.878, loss_ctc=2.669, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.380e-04, train_time=0.133 -[v016] 2022-01-31 06:36:44,168 (trainer:328) INFO: 96epoch results: [train] iter_time=0.019, forward_time=0.033, loss=1.998, loss_att=0.939, loss_ctc=3.057, acc=0.958, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.384e-04, train_time=0.117, time=1 minute and 4.08 seconds, total_count=52512, gpu_max_cached_mem_GB=5.824, [valid] loss=6.818, loss_att=5.684, loss_ctc=7.952, acc=0.905, cer=0.100, wer=0.395, cer_ctc=0.147, time=13.98 seconds, total_count=17088, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.64 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:36:46,611 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:36:46,617 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/81epoch.pth -[v016] 2022-01-31 06:36:46,617 (trainer:261) INFO: 97/200epoch started. Estimated time to finish: 3 hours, 23 minutes and 17.86 seconds -[v016] 2022-01-31 06:36:49,922 (trainer:653) INFO: 97epoch:train:1-27batch: iter_time=0.027, forward_time=0.031, loss=1.830, loss_att=0.875, loss_ctc=2.785, acc=0.955, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.380e-04, train_time=0.120 -[v016] 2022-01-31 06:36:52,392 (trainer:653) INFO: 97epoch:train:28-54batch: iter_time=0.001, forward_time=0.031, loss=1.989, loss_att=0.943, loss_ctc=3.035, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.379e-04, train_time=0.092 -[v016] 2022-01-31 06:36:55,913 (trainer:653) INFO: 97epoch:train:55-81batch: iter_time=0.033, forward_time=0.034, loss=2.153, loss_att=0.945, loss_ctc=3.361, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.379e-04, train_time=0.130 -[v016] 2022-01-31 06:36:58,498 (trainer:653) INFO: 97epoch:train:82-108batch: iter_time=0.002, forward_time=0.032, loss=1.841, loss_att=0.847, loss_ctc=2.834, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.379e-04, train_time=0.096 -[v016] 2022-01-31 06:37:02,975 (trainer:653) INFO: 97epoch:train:109-135batch: iter_time=0.006, forward_time=0.044, loss=2.386, loss_att=1.074, loss_ctc=3.699, acc=0.953, backward_time=0.068, optim_step_time=0.022, optim0_lr0=1.378e-04, train_time=0.166 -[v016] 2022-01-31 06:37:05,499 (trainer:653) INFO: 97epoch:train:136-162batch: iter_time=0.001, forward_time=0.032, loss=1.705, loss_att=0.844, loss_ctc=2.566, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.378e-04, train_time=0.093 -[v016] 2022-01-31 06:37:08,064 (trainer:653) INFO: 97epoch:train:163-189batch: iter_time=8.931e-05, forward_time=0.033, loss=2.099, loss_att=0.863, loss_ctc=3.335, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.378e-04, train_time=0.095 -[v016] 2022-01-31 06:37:10,564 (trainer:653) INFO: 97epoch:train:190-216batch: iter_time=8.028e-05, forward_time=0.032, loss=2.015, loss_att=0.964, loss_ctc=3.067, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.377e-04, train_time=0.092 -[v016] 2022-01-31 06:37:13,047 (trainer:653) INFO: 97epoch:train:217-243batch: iter_time=3.484e-04, forward_time=0.031, loss=2.037, loss_att=0.878, loss_ctc=3.197, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.377e-04, train_time=0.092 -[v016] 2022-01-31 06:37:15,626 (trainer:653) INFO: 97epoch:train:244-270batch: iter_time=0.005, forward_time=0.032, loss=2.183, loss_att=0.948, loss_ctc=3.418, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.377e-04, train_time=0.095 -[v016] 2022-01-31 06:37:18,032 (trainer:653) INFO: 97epoch:train:271-297batch: iter_time=7.758e-05, forward_time=0.031, loss=1.909, loss_att=0.994, loss_ctc=2.825, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.376e-04, train_time=0.089 -[v016] 2022-01-31 06:37:20,568 (trainer:653) INFO: 97epoch:train:298-324batch: iter_time=8.938e-05, forward_time=0.032, loss=2.077, loss_att=1.060, loss_ctc=3.095, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.376e-04, train_time=0.094 -[v016] 2022-01-31 06:37:23,059 (trainer:653) INFO: 97epoch:train:325-351batch: iter_time=0.001, forward_time=0.031, loss=2.007, loss_att=0.992, loss_ctc=3.022, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.376e-04, train_time=0.092 -[v016] 2022-01-31 06:37:25,480 (trainer:653) INFO: 97epoch:train:352-378batch: iter_time=0.001, forward_time=0.030, loss=1.693, loss_att=0.830, loss_ctc=2.556, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.375e-04, train_time=0.089 -[v016] 2022-01-31 06:37:27,981 (trainer:653) INFO: 97epoch:train:379-405batch: iter_time=3.623e-04, forward_time=0.032, loss=1.915, loss_att=0.890, loss_ctc=2.940, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.375e-04, train_time=0.092 -[v016] 2022-01-31 06:37:30,412 (trainer:653) INFO: 97epoch:train:406-432batch: iter_time=8.711e-05, forward_time=0.031, loss=1.876, loss_att=0.959, loss_ctc=2.792, acc=0.950, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.374e-04, train_time=0.090 -[v016] 2022-01-31 06:37:33,818 (trainer:653) INFO: 97epoch:train:433-459batch: iter_time=0.036, forward_time=0.031, loss=1.987, loss_att=0.988, loss_ctc=2.987, acc=0.952, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.374e-04, train_time=0.126 -[v016] 2022-01-31 06:37:36,342 (trainer:653) INFO: 97epoch:train:460-486batch: iter_time=8.347e-05, forward_time=0.032, loss=1.975, loss_att=0.869, loss_ctc=3.081, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.374e-04, train_time=0.093 -[v016] 2022-01-31 06:37:39,015 (trainer:653) INFO: 97epoch:train:487-513batch: iter_time=8.787e-05, forward_time=0.034, loss=2.317, loss_att=0.958, loss_ctc=3.677, acc=0.961, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.373e-04, train_time=0.099 -[v016] 2022-01-31 06:37:41,490 (trainer:653) INFO: 97epoch:train:514-540batch: iter_time=2.374e-04, forward_time=0.032, loss=1.982, loss_att=1.034, loss_ctc=2.930, acc=0.948, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.373e-04, train_time=0.091 -[v016] 2022-01-31 06:38:15,965 (trainer:328) INFO: 97epoch results: [train] iter_time=0.006, forward_time=0.032, loss=2.005, loss_att=0.941, loss_ctc=3.069, acc=0.958, backward_time=0.023, optim_step_time=0.021, optim0_lr0=1.376e-04, train_time=0.101, time=55.59 seconds, total_count=53059, gpu_max_cached_mem_GB=5.824, [valid] loss=6.961, loss_att=5.720, loss_ctc=8.202, acc=0.904, cer=0.099, wer=0.399, cer_ctc=0.146, time=5.72 seconds, total_count=17266, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.04 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:38:18,150 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 06:38:18,156 (trainer:261) INFO: 98/200epoch started. Estimated time to finish: 3 hours, 20 minutes and 46.13 seconds -[v016] 2022-01-31 06:38:20,911 (trainer:653) INFO: 98epoch:train:1-27batch: iter_time=0.005, forward_time=0.033, loss=2.228, loss_att=0.933, loss_ctc=3.524, acc=0.963, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.373e-04, train_time=0.102 -[v016] 2022-01-31 06:38:23,446 (trainer:653) INFO: 98epoch:train:28-54batch: iter_time=8.881e-05, forward_time=0.032, loss=2.020, loss_att=0.993, loss_ctc=3.047, acc=0.949, backward_time=0.021, optim_step_time=0.022, optim0_lr0=1.372e-04, train_time=0.094 -[v016] 2022-01-31 06:38:25,951 (trainer:653) INFO: 98epoch:train:55-81batch: iter_time=5.840e-04, forward_time=0.031, loss=1.888, loss_att=0.939, loss_ctc=2.838, acc=0.956, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.372e-04, train_time=0.093 -[v016] 2022-01-31 06:38:28,523 (trainer:653) INFO: 98epoch:train:82-108batch: iter_time=9.092e-05, forward_time=0.033, loss=1.979, loss_att=0.862, loss_ctc=3.096, acc=0.959, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.372e-04, train_time=0.095 -[v016] 2022-01-31 06:38:30,965 (trainer:653) INFO: 98epoch:train:109-135batch: iter_time=7.824e-05, forward_time=0.031, loss=1.724, loss_att=0.967, loss_ctc=2.481, acc=0.950, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.371e-04, train_time=0.090 -[v016] 2022-01-31 06:38:33,545 (trainer:653) INFO: 98epoch:train:136-162batch: iter_time=8.894e-05, forward_time=0.033, loss=1.855, loss_att=0.765, loss_ctc=2.944, acc=0.969, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.371e-04, train_time=0.095 -[v016] 2022-01-31 06:38:36,334 (trainer:653) INFO: 98epoch:train:163-189batch: iter_time=0.012, forward_time=0.031, loss=1.866, loss_att=0.999, loss_ctc=2.733, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.371e-04, train_time=0.103 -[v016] 2022-01-31 06:38:38,801 (trainer:653) INFO: 98epoch:train:190-216batch: iter_time=8.252e-05, forward_time=0.031, loss=1.905, loss_att=0.978, loss_ctc=2.833, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.370e-04, train_time=0.091 -[v016] 2022-01-31 06:38:41,314 (trainer:653) INFO: 98epoch:train:217-243batch: iter_time=8.043e-05, forward_time=0.032, loss=1.931, loss_att=0.920, loss_ctc=2.943, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.370e-04, train_time=0.093 -[v016] 2022-01-31 06:38:43,980 (trainer:653) INFO: 98epoch:train:244-270batch: iter_time=1.078e-04, forward_time=0.034, loss=2.351, loss_att=0.931, loss_ctc=3.772, acc=0.960, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.370e-04, train_time=0.099 -[v016] 2022-01-31 06:38:46,496 (trainer:653) INFO: 98epoch:train:271-297batch: iter_time=8.237e-05, forward_time=0.032, loss=1.907, loss_att=0.905, loss_ctc=2.908, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.369e-04, train_time=0.093 -[v016] 2022-01-31 06:38:48,983 (trainer:653) INFO: 98epoch:train:298-324batch: iter_time=7.950e-05, forward_time=0.031, loss=2.126, loss_att=1.015, loss_ctc=3.238, acc=0.953, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.369e-04, train_time=0.092 -[v016] 2022-01-31 06:38:51,520 (trainer:653) INFO: 98epoch:train:325-351batch: iter_time=8.409e-04, forward_time=0.032, loss=2.302, loss_att=1.016, loss_ctc=3.588, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.368e-04, train_time=0.094 -[v016] 2022-01-31 06:38:53,895 (trainer:653) INFO: 98epoch:train:352-378batch: iter_time=7.619e-05, forward_time=0.030, loss=1.866, loss_att=0.929, loss_ctc=2.804, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.368e-04, train_time=0.088 -[v016] 2022-01-31 06:38:56,362 (trainer:653) INFO: 98epoch:train:379-405batch: iter_time=7.668e-05, forward_time=0.031, loss=2.153, loss_att=0.974, loss_ctc=3.332, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.368e-04, train_time=0.091 -[v016] 2022-01-31 06:38:58,892 (trainer:653) INFO: 98epoch:train:406-432batch: iter_time=8.808e-05, forward_time=0.032, loss=1.897, loss_att=0.878, loss_ctc=2.916, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.367e-04, train_time=0.093 -[v016] 2022-01-31 06:39:01,435 (trainer:653) INFO: 98epoch:train:433-459batch: iter_time=8.608e-05, forward_time=0.032, loss=2.123, loss_att=0.980, loss_ctc=3.267, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.367e-04, train_time=0.094 -[v016] 2022-01-31 06:39:03,944 (trainer:653) INFO: 98epoch:train:460-486batch: iter_time=7.948e-05, forward_time=0.032, loss=1.954, loss_att=1.019, loss_ctc=2.888, acc=0.950, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.367e-04, train_time=0.093 -[v016] 2022-01-31 06:39:06,529 (trainer:653) INFO: 98epoch:train:487-513batch: iter_time=7.911e-05, forward_time=0.032, loss=2.052, loss_att=0.892, loss_ctc=3.213, acc=0.961, backward_time=0.021, optim_step_time=0.022, optim0_lr0=1.366e-04, train_time=0.096 -[v016] 2022-01-31 06:39:09,218 (trainer:653) INFO: 98epoch:train:514-540batch: iter_time=0.006, forward_time=0.032, loss=1.905, loss_att=0.988, loss_ctc=2.822, acc=0.955, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.366e-04, train_time=0.099 -[v016] 2022-01-31 06:39:42,983 (trainer:328) INFO: 98epoch results: [train] iter_time=0.001, forward_time=0.032, loss=2.000, loss_att=0.944, loss_ctc=3.055, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.369e-04, train_time=0.094, time=51.79 seconds, total_count=53606, gpu_max_cached_mem_GB=5.824, [valid] loss=6.958, loss_att=5.728, loss_ctc=8.188, acc=0.903, cer=0.102, wer=0.407, cer_ctc=0.147, time=5.63 seconds, total_count=17444, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.4 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:39:45,146 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 06:39:45,153 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/93epoch.pth -[v016] 2022-01-31 06:39:45,153 (trainer:261) INFO: 99/200epoch started. Estimated time to finish: 3 hours, 18 minutes and 10 seconds -[v016] 2022-01-31 06:39:47,857 (trainer:653) INFO: 99epoch:train:1-27batch: iter_time=0.003, forward_time=0.033, loss=1.809, loss_att=0.787, loss_ctc=2.832, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.366e-04, train_time=0.100 -[v016] 2022-01-31 06:39:50,268 (trainer:653) INFO: 99epoch:train:28-54batch: iter_time=8.093e-05, forward_time=0.030, loss=1.620, loss_att=0.769, loss_ctc=2.471, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.365e-04, train_time=0.089 -[v016] 2022-01-31 06:39:52,766 (trainer:653) INFO: 99epoch:train:55-81batch: iter_time=7.649e-05, forward_time=0.031, loss=1.792, loss_att=0.783, loss_ctc=2.802, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.365e-04, train_time=0.092 -[v016] 2022-01-31 06:39:55,246 (trainer:653) INFO: 99epoch:train:82-108batch: iter_time=7.821e-05, forward_time=0.032, loss=2.082, loss_att=0.983, loss_ctc=3.181, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.365e-04, train_time=0.092 -[v016] 2022-01-31 06:39:57,647 (trainer:653) INFO: 99epoch:train:109-135batch: iter_time=7.634e-05, forward_time=0.030, loss=1.763, loss_att=0.874, loss_ctc=2.651, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.364e-04, train_time=0.089 -[v016] 2022-01-31 06:40:00,077 (trainer:653) INFO: 99epoch:train:136-162batch: iter_time=7.354e-05, forward_time=0.031, loss=1.640, loss_att=0.847, loss_ctc=2.433, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.364e-04, train_time=0.090 -[v016] 2022-01-31 06:40:02,580 (trainer:653) INFO: 99epoch:train:163-189batch: iter_time=8.107e-05, forward_time=0.032, loss=2.218, loss_att=0.980, loss_ctc=3.457, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.364e-04, train_time=0.093 -[v016] 2022-01-31 06:40:05,043 (trainer:653) INFO: 99epoch:train:190-216batch: iter_time=8.398e-05, forward_time=0.031, loss=2.012, loss_att=0.941, loss_ctc=3.084, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.363e-04, train_time=0.091 -[v016] 2022-01-31 06:40:07,438 (trainer:653) INFO: 99epoch:train:217-243batch: iter_time=8.128e-05, forward_time=0.031, loss=1.973, loss_att=1.008, loss_ctc=2.939, acc=0.943, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.363e-04, train_time=0.088 -[v016] 2022-01-31 06:40:10,176 (trainer:653) INFO: 99epoch:train:244-270batch: iter_time=0.011, forward_time=0.031, loss=2.159, loss_att=0.945, loss_ctc=3.373, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.363e-04, train_time=0.101 -[v016] 2022-01-31 06:40:12,588 (trainer:653) INFO: 99epoch:train:271-297batch: iter_time=7.582e-05, forward_time=0.031, loss=2.211, loss_att=1.007, loss_ctc=3.415, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.362e-04, train_time=0.089 -[v016] 2022-01-31 06:40:15,046 (trainer:653) INFO: 99epoch:train:298-324batch: iter_time=7.461e-05, forward_time=0.031, loss=1.866, loss_att=0.889, loss_ctc=2.843, acc=0.960, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.362e-04, train_time=0.091 -[v016] 2022-01-31 06:40:17,545 (trainer:653) INFO: 99epoch:train:325-351batch: iter_time=7.614e-05, forward_time=0.032, loss=2.171, loss_att=1.021, loss_ctc=3.320, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.362e-04, train_time=0.092 -[v016] 2022-01-31 06:40:20,606 (trainer:653) INFO: 99epoch:train:352-378batch: iter_time=0.020, forward_time=0.032, loss=1.909, loss_att=0.906, loss_ctc=2.912, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.361e-04, train_time=0.113 -[v016] 2022-01-31 06:40:23,026 (trainer:653) INFO: 99epoch:train:379-405batch: iter_time=7.893e-05, forward_time=0.031, loss=2.062, loss_att=0.991, loss_ctc=3.132, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.361e-04, train_time=0.089 -[v016] 2022-01-31 06:40:25,590 (trainer:653) INFO: 99epoch:train:406-432batch: iter_time=2.157e-04, forward_time=0.033, loss=2.026, loss_att=1.022, loss_ctc=3.030, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.361e-04, train_time=0.094 -[v016] 2022-01-31 06:40:28,759 (trainer:653) INFO: 99epoch:train:433-459batch: iter_time=1.033e-04, forward_time=0.049, loss=1.984, loss_att=0.954, loss_ctc=3.014, acc=0.957, backward_time=0.029, optim_step_time=0.021, optim0_lr0=1.360e-04, train_time=0.117 -[v016] 2022-01-31 06:40:31,251 (trainer:653) INFO: 99epoch:train:460-486batch: iter_time=7.789e-05, forward_time=0.032, loss=2.150, loss_att=0.944, loss_ctc=3.356, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.360e-04, train_time=0.092 -[v016] 2022-01-31 06:40:33,681 (trainer:653) INFO: 99epoch:train:487-513batch: iter_time=7.523e-05, forward_time=0.031, loss=1.782, loss_att=0.882, loss_ctc=2.682, acc=0.956, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.359e-04, train_time=0.090 -[v016] 2022-01-31 06:40:36,210 (trainer:653) INFO: 99epoch:train:514-540batch: iter_time=8.537e-05, forward_time=0.032, loss=2.125, loss_att=0.941, loss_ctc=3.309, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.359e-04, train_time=0.093 -[v016] 2022-01-31 06:41:10,316 (trainer:328) INFO: 99epoch results: [train] iter_time=0.002, forward_time=0.032, loss=1.971, loss_att=0.923, loss_ctc=3.018, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.362e-04, train_time=0.094, time=51.78 seconds, total_count=54153, gpu_max_cached_mem_GB=5.824, [valid] loss=7.002, loss_att=5.777, loss_ctc=8.226, acc=0.902, cer=0.101, wer=0.407, cer_ctc=0.151, time=6.06 seconds, total_count=17622, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.29 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:41:13,674 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:41:13,683 (trainer:261) INFO: 100/200epoch started. Estimated time to finish: 3 hours, 15 minutes and 37.58 seconds -[v016] 2022-01-31 06:41:17,381 (trainer:653) INFO: 100epoch:train:1-27batch: iter_time=0.036, forward_time=0.032, loss=1.763, loss_att=0.798, loss_ctc=2.728, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.359e-04, train_time=0.131 -[v016] 2022-01-31 06:41:19,841 (trainer:653) INFO: 100epoch:train:28-54batch: iter_time=8.614e-05, forward_time=0.031, loss=1.953, loss_att=0.775, loss_ctc=3.132, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.358e-04, train_time=0.091 -[v016] 2022-01-31 06:41:22,326 (trainer:653) INFO: 100epoch:train:55-81batch: iter_time=7.465e-05, forward_time=0.032, loss=2.141, loss_att=0.916, loss_ctc=3.367, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.358e-04, train_time=0.092 -[v016] 2022-01-31 06:41:25,266 (trainer:653) INFO: 100epoch:train:82-108batch: iter_time=0.016, forward_time=0.032, loss=1.940, loss_att=0.879, loss_ctc=3.002, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.358e-04, train_time=0.109 -[v016] 2022-01-31 06:41:27,855 (trainer:653) INFO: 100epoch:train:109-135batch: iter_time=1.147e-04, forward_time=0.032, loss=2.174, loss_att=0.968, loss_ctc=3.381, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.357e-04, train_time=0.096 -[v016] 2022-01-31 06:41:30,620 (trainer:653) INFO: 100epoch:train:136-162batch: iter_time=0.011, forward_time=0.031, loss=1.857, loss_att=0.923, loss_ctc=2.792, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.357e-04, train_time=0.102 -[v016] 2022-01-31 06:41:33,181 (trainer:653) INFO: 100epoch:train:163-189batch: iter_time=8.241e-05, forward_time=0.032, loss=1.852, loss_att=0.876, loss_ctc=2.828, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.357e-04, train_time=0.095 -[v016] 2022-01-31 06:41:35,640 (trainer:653) INFO: 100epoch:train:190-216batch: iter_time=8.433e-05, forward_time=0.031, loss=1.903, loss_att=0.899, loss_ctc=2.908, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.356e-04, train_time=0.091 -[v016] 2022-01-31 06:41:38,105 (trainer:653) INFO: 100epoch:train:217-243batch: iter_time=8.714e-05, forward_time=0.031, loss=2.115, loss_att=1.020, loss_ctc=3.209, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.356e-04, train_time=0.091 -[v016] 2022-01-31 06:41:40,653 (trainer:653) INFO: 100epoch:train:244-270batch: iter_time=9.737e-05, forward_time=0.032, loss=2.004, loss_att=0.958, loss_ctc=3.050, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.356e-04, train_time=0.094 -[v016] 2022-01-31 06:41:43,175 (trainer:653) INFO: 100epoch:train:271-297batch: iter_time=0.004, forward_time=0.031, loss=1.673, loss_att=0.831, loss_ctc=2.514, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.355e-04, train_time=0.093 -[v016] 2022-01-31 06:41:45,913 (trainer:653) INFO: 100epoch:train:298-324batch: iter_time=0.011, forward_time=0.031, loss=1.715, loss_att=0.760, loss_ctc=2.670, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.355e-04, train_time=0.101 -[v016] 2022-01-31 06:41:48,334 (trainer:653) INFO: 100epoch:train:325-351batch: iter_time=8.025e-05, forward_time=0.031, loss=1.607, loss_att=0.778, loss_ctc=2.437, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.355e-04, train_time=0.089 -[v016] 2022-01-31 06:41:50,851 (trainer:653) INFO: 100epoch:train:352-378batch: iter_time=0.002, forward_time=0.031, loss=1.916, loss_att=0.843, loss_ctc=2.990, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.354e-04, train_time=0.093 -[v016] 2022-01-31 06:41:53,330 (trainer:653) INFO: 100epoch:train:379-405batch: iter_time=7.668e-05, forward_time=0.032, loss=1.957, loss_att=1.001, loss_ctc=2.914, acc=0.952, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.354e-04, train_time=0.092 -[v016] 2022-01-31 06:41:55,882 (trainer:653) INFO: 100epoch:train:406-432batch: iter_time=8.486e-05, forward_time=0.032, loss=2.444, loss_att=1.040, loss_ctc=3.847, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.354e-04, train_time=0.094 -[v016] 2022-01-31 06:41:58,344 (trainer:653) INFO: 100epoch:train:433-459batch: iter_time=8.203e-05, forward_time=0.031, loss=2.024, loss_att=1.049, loss_ctc=2.999, acc=0.952, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.353e-04, train_time=0.091 -[v016] 2022-01-31 06:42:01,361 (trainer:653) INFO: 100epoch:train:460-486batch: iter_time=0.021, forward_time=0.031, loss=2.063, loss_att=0.946, loss_ctc=3.181, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.353e-04, train_time=0.112 -[v016] 2022-01-31 06:42:04,088 (trainer:653) INFO: 100epoch:train:487-513batch: iter_time=0.008, forward_time=0.032, loss=2.004, loss_att=0.932, loss_ctc=3.077, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.353e-04, train_time=0.101 -[v016] 2022-01-31 06:42:06,549 (trainer:653) INFO: 100epoch:train:514-540batch: iter_time=7.525e-05, forward_time=0.031, loss=1.922, loss_att=0.873, loss_ctc=2.971, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.352e-04, train_time=0.091 -[v016] 2022-01-31 06:42:43,869 (trainer:328) INFO: 100epoch results: [train] iter_time=0.005, forward_time=0.031, loss=1.952, loss_att=0.903, loss_ctc=3.001, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.355e-04, train_time=0.097, time=53.55 seconds, total_count=54700, gpu_max_cached_mem_GB=5.824, [valid] loss=6.879, loss_att=5.703, loss_ctc=8.056, acc=0.904, cer=0.099, wer=0.394, cer_ctc=0.145, time=6.41 seconds, total_count=17800, gpu_max_cached_mem_GB=5.824, [att_plot] time=30.18 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:42:46,370 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:42:46,408 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/94epoch.pth, exp/asr_train_asr_raw_en_word/95epoch.pth -[v016] 2022-01-31 06:42:46,411 (trainer:261) INFO: 101/200epoch started. Estimated time to finish: 3 hours, 13 minutes and 12.01 seconds -[v016] 2022-01-31 06:42:50,937 (trainer:653) INFO: 101epoch:train:1-27batch: iter_time=0.029, forward_time=0.047, loss=1.976, loss_att=0.894, loss_ctc=3.058, acc=0.960, backward_time=0.042, optim_step_time=0.023, optim0_lr0=1.352e-04, train_time=0.164 -[v016] 2022-01-31 06:42:54,384 (trainer:653) INFO: 101epoch:train:28-54batch: iter_time=0.034, forward_time=0.032, loss=1.762, loss_att=0.912, loss_ctc=2.611, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.352e-04, train_time=0.127 -[v016] 2022-01-31 06:42:57,118 (trainer:653) INFO: 101epoch:train:55-81batch: iter_time=0.004, forward_time=0.036, loss=1.919, loss_att=0.794, loss_ctc=3.045, acc=0.966, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.351e-04, train_time=0.101 -[v016] 2022-01-31 06:42:59,987 (trainer:653) INFO: 101epoch:train:82-108batch: iter_time=0.015, forward_time=0.031, loss=2.170, loss_att=0.918, loss_ctc=3.423, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.351e-04, train_time=0.106 -[v016] 2022-01-31 06:43:03,332 (trainer:653) INFO: 101epoch:train:109-135batch: iter_time=0.034, forward_time=0.030, loss=1.676, loss_att=0.803, loss_ctc=2.549, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.351e-04, train_time=0.124 -[v016] 2022-01-31 06:43:06,118 (trainer:653) INFO: 101epoch:train:136-162batch: iter_time=0.011, forward_time=0.031, loss=1.601, loss_att=0.761, loss_ctc=2.441, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.350e-04, train_time=0.103 -[v016] 2022-01-31 06:43:09,337 (trainer:653) INFO: 101epoch:train:163-189batch: iter_time=0.024, forward_time=0.033, loss=1.680, loss_att=0.825, loss_ctc=2.534, acc=0.963, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.350e-04, train_time=0.119 -[v016] 2022-01-31 06:43:11,954 (trainer:653) INFO: 101epoch:train:190-216batch: iter_time=0.002, forward_time=0.033, loss=2.170, loss_att=0.944, loss_ctc=3.396, acc=0.962, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.350e-04, train_time=0.097 -[v016] 2022-01-31 06:43:14,632 (trainer:653) INFO: 101epoch:train:217-243batch: iter_time=0.006, forward_time=0.032, loss=1.654, loss_att=0.750, loss_ctc=2.558, acc=0.964, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.349e-04, train_time=0.099 -[v016] 2022-01-31 06:43:17,499 (trainer:653) INFO: 101epoch:train:244-270batch: iter_time=0.014, forward_time=0.031, loss=1.880, loss_att=0.998, loss_ctc=2.763, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.349e-04, train_time=0.106 -[v016] 2022-01-31 06:43:20,662 (trainer:653) INFO: 101epoch:train:271-297batch: iter_time=0.027, forward_time=0.031, loss=1.820, loss_att=0.853, loss_ctc=2.787, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.349e-04, train_time=0.117 -[v016] 2022-01-31 06:43:23,939 (trainer:653) INFO: 101epoch:train:298-324batch: iter_time=0.028, forward_time=0.032, loss=1.855, loss_att=0.766, loss_ctc=2.943, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.348e-04, train_time=0.121 -[v016] 2022-01-31 06:43:26,957 (trainer:653) INFO: 101epoch:train:325-351batch: iter_time=0.018, forward_time=0.032, loss=2.107, loss_att=0.977, loss_ctc=3.236, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.348e-04, train_time=0.112 -[v016] 2022-01-31 06:43:29,813 (trainer:653) INFO: 101epoch:train:352-378batch: iter_time=0.013, forward_time=0.032, loss=2.048, loss_att=0.887, loss_ctc=3.209, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.348e-04, train_time=0.106 -[v016] 2022-01-31 06:43:32,784 (trainer:653) INFO: 101epoch:train:379-405batch: iter_time=0.019, forward_time=0.031, loss=1.963, loss_att=0.918, loss_ctc=3.007, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.347e-04, train_time=0.110 -[v016] 2022-01-31 06:43:35,542 (trainer:653) INFO: 101epoch:train:406-432batch: iter_time=0.010, forward_time=0.031, loss=1.844, loss_att=0.854, loss_ctc=2.834, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.347e-04, train_time=0.102 -[v016] 2022-01-31 06:43:38,066 (trainer:653) INFO: 101epoch:train:433-459batch: iter_time=0.003, forward_time=0.031, loss=2.255, loss_att=1.087, loss_ctc=3.422, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.347e-04, train_time=0.093 -[v016] 2022-01-31 06:43:40,572 (trainer:653) INFO: 101epoch:train:460-486batch: iter_time=8.280e-05, forward_time=0.031, loss=2.189, loss_att=1.009, loss_ctc=3.369, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.346e-04, train_time=0.093 -[v016] 2022-01-31 06:43:43,347 (trainer:653) INFO: 101epoch:train:487-513batch: iter_time=0.011, forward_time=0.031, loss=1.974, loss_att=0.897, loss_ctc=3.052, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.346e-04, train_time=0.103 -[v016] 2022-01-31 06:43:46,148 (trainer:653) INFO: 101epoch:train:514-540batch: iter_time=0.011, forward_time=0.032, loss=2.003, loss_att=0.953, loss_ctc=3.054, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.346e-04, train_time=0.103 -[v016] 2022-01-31 06:44:25,822 (trainer:328) INFO: 101epoch results: [train] iter_time=0.016, forward_time=0.032, loss=1.939, loss_att=0.892, loss_ctc=2.986, acc=0.961, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.349e-04, train_time=0.111, time=1 minute and 0.82 seconds, total_count=55247, gpu_max_cached_mem_GB=5.824, [valid] loss=7.030, loss_att=5.700, loss_ctc=8.360, acc=0.904, cer=0.102, wer=0.403, cer_ctc=0.149, time=10.82 seconds, total_count=17978, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.69 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:44:28,010 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:44:28,017 (trainer:261) INFO: 102/200epoch started. Estimated time to finish: 3 hours, 10 minutes and 58.6 seconds -[v016] 2022-01-31 06:44:31,411 (trainer:653) INFO: 102epoch:train:1-27batch: iter_time=0.029, forward_time=0.032, loss=1.677, loss_att=0.813, loss_ctc=2.541, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.345e-04, train_time=0.123 -[v016] 2022-01-31 06:44:34,768 (trainer:653) INFO: 102epoch:train:28-54batch: iter_time=0.034, forward_time=0.031, loss=1.916, loss_att=0.904, loss_ctc=2.928, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.345e-04, train_time=0.125 -[v016] 2022-01-31 06:44:37,583 (trainer:653) INFO: 102epoch:train:55-81batch: iter_time=0.013, forward_time=0.031, loss=1.922, loss_att=0.874, loss_ctc=2.971, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.345e-04, train_time=0.104 -[v016] 2022-01-31 06:44:40,180 (trainer:653) INFO: 102epoch:train:82-108batch: iter_time=0.004, forward_time=0.032, loss=1.584, loss_att=0.754, loss_ctc=2.413, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.344e-04, train_time=0.096 -[v016] 2022-01-31 06:44:42,738 (trainer:653) INFO: 102epoch:train:109-135batch: iter_time=5.752e-04, forward_time=0.032, loss=1.808, loss_att=0.792, loss_ctc=2.823, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.344e-04, train_time=0.095 -[v016] 2022-01-31 06:44:45,409 (trainer:653) INFO: 102epoch:train:136-162batch: iter_time=0.005, forward_time=0.032, loss=1.762, loss_att=0.854, loss_ctc=2.669, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.344e-04, train_time=0.099 -[v016] 2022-01-31 06:44:49,054 (trainer:653) INFO: 102epoch:train:163-189batch: iter_time=0.042, forward_time=0.031, loss=1.870, loss_att=0.910, loss_ctc=2.829, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.343e-04, train_time=0.135 -[v016] 2022-01-31 06:44:54,643 (trainer:653) INFO: 102epoch:train:190-216batch: iter_time=0.060, forward_time=0.044, loss=1.920, loss_att=0.849, loss_ctc=2.991, acc=0.959, backward_time=0.055, optim_step_time=0.023, optim0_lr0=1.343e-04, train_time=0.207 -[v016] 2022-01-31 06:44:58,838 (trainer:653) INFO: 102epoch:train:217-243batch: iter_time=0.063, forward_time=0.032, loss=1.850, loss_att=0.887, loss_ctc=2.814, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.343e-04, train_time=0.155 -[v016] 2022-01-31 06:45:01,842 (trainer:653) INFO: 102epoch:train:244-270batch: iter_time=0.022, forward_time=0.030, loss=1.883, loss_att=0.892, loss_ctc=2.873, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.342e-04, train_time=0.111 -[v016] 2022-01-31 06:45:04,596 (trainer:653) INFO: 102epoch:train:271-297batch: iter_time=0.008, forward_time=0.032, loss=1.982, loss_att=0.874, loss_ctc=3.090, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.342e-04, train_time=0.102 -[v016] 2022-01-31 06:45:07,171 (trainer:653) INFO: 102epoch:train:298-324batch: iter_time=2.329e-04, forward_time=0.034, loss=1.762, loss_att=0.857, loss_ctc=2.667, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.342e-04, train_time=0.095 -[v016] 2022-01-31 06:45:09,706 (trainer:653) INFO: 102epoch:train:325-351batch: iter_time=8.202e-05, forward_time=0.032, loss=1.855, loss_att=0.806, loss_ctc=2.904, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.341e-04, train_time=0.094 -[v016] 2022-01-31 06:45:12,286 (trainer:653) INFO: 102epoch:train:352-378batch: iter_time=0.002, forward_time=0.032, loss=1.944, loss_att=0.880, loss_ctc=3.007, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.341e-04, train_time=0.095 -[v016] 2022-01-31 06:45:15,032 (trainer:653) INFO: 102epoch:train:379-405batch: iter_time=0.011, forward_time=0.031, loss=1.669, loss_att=0.764, loss_ctc=2.574, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.341e-04, train_time=0.101 -[v016] 2022-01-31 06:45:17,771 (trainer:653) INFO: 102epoch:train:406-432batch: iter_time=0.005, forward_time=0.032, loss=1.766, loss_att=0.872, loss_ctc=2.661, acc=0.960, backward_time=0.021, optim_step_time=0.022, optim0_lr0=1.340e-04, train_time=0.100 -[v016] 2022-01-31 06:45:20,343 (trainer:653) INFO: 102epoch:train:433-459batch: iter_time=0.004, forward_time=0.031, loss=1.956, loss_att=0.977, loss_ctc=2.935, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.340e-04, train_time=0.095 -[v016] 2022-01-31 06:45:23,904 (trainer:653) INFO: 102epoch:train:460-486batch: iter_time=0.040, forward_time=0.031, loss=2.298, loss_att=1.044, loss_ctc=3.553, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.340e-04, train_time=0.132 -[v016] 2022-01-31 06:45:26,378 (trainer:653) INFO: 102epoch:train:487-513batch: iter_time=2.289e-04, forward_time=0.031, loss=1.830, loss_att=0.853, loss_ctc=2.808, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.339e-04, train_time=0.091 -[v016] 2022-01-31 06:45:29,325 (trainer:653) INFO: 102epoch:train:514-540batch: iter_time=0.015, forward_time=0.032, loss=1.826, loss_att=0.768, loss_ctc=2.883, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.339e-04, train_time=0.109 -[v016] 2022-01-31 06:46:15,254 (trainer:328) INFO: 102epoch results: [train] iter_time=0.018, forward_time=0.032, loss=1.856, loss_att=0.861, loss_ctc=2.850, acc=0.962, backward_time=0.023, optim_step_time=0.021, optim0_lr0=1.342e-04, train_time=0.114, time=1 minute and 2.48 seconds, total_count=55794, gpu_max_cached_mem_GB=5.824, [valid] loss=6.952, loss_att=5.735, loss_ctc=8.170, acc=0.905, cer=0.101, wer=0.404, cer_ctc=0.150, time=12.56 seconds, total_count=18156, gpu_max_cached_mem_GB=5.824, [att_plot] time=32.2 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:46:17,284 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:46:17,318 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/88epoch.pth, exp/asr_train_asr_raw_en_word/97epoch.pth, exp/asr_train_asr_raw_en_word/98epoch.pth -[v016] 2022-01-31 06:46:17,319 (trainer:261) INFO: 103/200epoch started. Estimated time to finish: 3 hours, 8 minutes and 55.16 seconds -[v016] 2022-01-31 06:46:19,942 (trainer:653) INFO: 103epoch:train:1-27batch: iter_time=0.005, forward_time=0.031, loss=1.640, loss_att=0.739, loss_ctc=2.542, acc=0.968, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.339e-04, train_time=0.097 -[v016] 2022-01-31 06:46:22,348 (trainer:653) INFO: 103epoch:train:28-54batch: iter_time=8.042e-05, forward_time=0.031, loss=1.971, loss_att=0.909, loss_ctc=3.033, acc=0.960, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.338e-04, train_time=0.089 -[v016] 2022-01-31 06:46:25,071 (trainer:653) INFO: 103epoch:train:55-81batch: iter_time=0.010, forward_time=0.031, loss=1.830, loss_att=0.834, loss_ctc=2.826, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.338e-04, train_time=0.101 -[v016] 2022-01-31 06:46:27,536 (trainer:653) INFO: 103epoch:train:82-108batch: iter_time=0.002, forward_time=0.031, loss=1.759, loss_att=0.828, loss_ctc=2.691, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.338e-04, train_time=0.091 -[v016] 2022-01-31 06:46:29,959 (trainer:653) INFO: 103epoch:train:109-135batch: iter_time=7.741e-05, forward_time=0.031, loss=1.873, loss_att=0.852, loss_ctc=2.894, acc=0.965, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.337e-04, train_time=0.090 -[v016] 2022-01-31 06:46:32,381 (trainer:653) INFO: 103epoch:train:136-162batch: iter_time=8.342e-05, forward_time=0.031, loss=1.576, loss_att=0.759, loss_ctc=2.392, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.337e-04, train_time=0.089 -[v016] 2022-01-31 06:46:34,845 (trainer:653) INFO: 103epoch:train:163-189batch: iter_time=7.622e-05, forward_time=0.031, loss=1.813, loss_att=0.875, loss_ctc=2.751, acc=0.959, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.337e-04, train_time=0.091 -[v016] 2022-01-31 06:46:37,381 (trainer:653) INFO: 103epoch:train:190-216batch: iter_time=7.769e-05, forward_time=0.033, loss=1.835, loss_att=0.803, loss_ctc=2.867, acc=0.969, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.336e-04, train_time=0.094 -[v016] 2022-01-31 06:46:39,766 (trainer:653) INFO: 103epoch:train:217-243batch: iter_time=7.491e-05, forward_time=0.031, loss=1.703, loss_att=0.868, loss_ctc=2.539, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.336e-04, train_time=0.088 -[v016] 2022-01-31 06:46:42,304 (trainer:653) INFO: 103epoch:train:244-270batch: iter_time=7.679e-05, forward_time=0.032, loss=2.056, loss_att=0.957, loss_ctc=3.155, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.336e-04, train_time=0.094 -[v016] 2022-01-31 06:46:44,777 (trainer:653) INFO: 103epoch:train:271-297batch: iter_time=7.733e-05, forward_time=0.032, loss=1.813, loss_att=0.872, loss_ctc=2.755, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.335e-04, train_time=0.091 -[v016] 2022-01-31 06:46:47,319 (trainer:653) INFO: 103epoch:train:298-324batch: iter_time=8.940e-05, forward_time=0.032, loss=1.985, loss_att=0.886, loss_ctc=3.084, acc=0.957, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.335e-04, train_time=0.094 -[v016] 2022-01-31 06:46:50,230 (trainer:653) INFO: 103epoch:train:325-351batch: iter_time=1.339e-04, forward_time=0.037, loss=2.081, loss_att=0.955, loss_ctc=3.207, acc=0.960, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.335e-04, train_time=0.108 -[v016] 2022-01-31 06:46:52,997 (trainer:653) INFO: 103epoch:train:352-378batch: iter_time=1.271e-04, forward_time=0.035, loss=2.074, loss_att=0.977, loss_ctc=3.171, acc=0.955, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.334e-04, train_time=0.102 -[v016] 2022-01-31 06:46:55,805 (trainer:653) INFO: 103epoch:train:379-405batch: iter_time=1.666e-04, forward_time=0.036, loss=2.045, loss_att=0.857, loss_ctc=3.234, acc=0.963, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.334e-04, train_time=0.104 -[v016] 2022-01-31 06:46:58,756 (trainer:653) INFO: 103epoch:train:406-432batch: iter_time=0.003, forward_time=0.040, loss=2.019, loss_att=0.908, loss_ctc=3.129, acc=0.960, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.334e-04, train_time=0.109 -[v016] 2022-01-31 06:47:01,581 (trainer:653) INFO: 103epoch:train:433-459batch: iter_time=1.178e-04, forward_time=0.036, loss=2.071, loss_att=0.907, loss_ctc=3.235, acc=0.963, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.333e-04, train_time=0.104 -[v016] 2022-01-31 06:47:04,359 (trainer:653) INFO: 103epoch:train:460-486batch: iter_time=1.123e-04, forward_time=0.035, loss=1.833, loss_att=0.926, loss_ctc=2.741, acc=0.959, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.333e-04, train_time=0.103 -[v016] 2022-01-31 06:47:07,180 (trainer:653) INFO: 103epoch:train:487-513batch: iter_time=1.250e-04, forward_time=0.036, loss=1.877, loss_att=0.866, loss_ctc=2.889, acc=0.959, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.333e-04, train_time=0.104 -[v016] 2022-01-31 06:47:10,001 (trainer:653) INFO: 103epoch:train:514-540batch: iter_time=1.118e-04, forward_time=0.036, loss=1.993, loss_att=0.927, loss_ctc=3.059, acc=0.961, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.332e-04, train_time=0.104 -[v016] 2022-01-31 06:47:46,364 (trainer:328) INFO: 103epoch results: [train] iter_time=0.001, forward_time=0.033, loss=1.889, loss_att=0.874, loss_ctc=2.904, acc=0.961, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.335e-04, train_time=0.097, time=53.46 seconds, total_count=56341, gpu_max_cached_mem_GB=5.824, [valid] loss=6.997, loss_att=5.761, loss_ctc=8.233, acc=0.904, cer=0.100, wer=0.402, cer_ctc=0.149, time=6.36 seconds, total_count=18334, gpu_max_cached_mem_GB=5.824, [att_plot] time=29.22 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:47:49,422 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 06:47:49,429 (trainer:261) INFO: 104/200epoch started. Estimated time to finish: 3 hours, 6 minutes and 31.96 seconds -[v016] 2022-01-31 06:47:53,180 (trainer:653) INFO: 104epoch:train:1-27batch: iter_time=0.032, forward_time=0.034, loss=1.852, loss_att=0.776, loss_ctc=2.927, acc=0.965, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.332e-04, train_time=0.133 -[v016] 2022-01-31 06:47:56,567 (trainer:653) INFO: 104epoch:train:28-54batch: iter_time=0.027, forward_time=0.034, loss=2.014, loss_att=0.904, loss_ctc=3.123, acc=0.962, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.332e-04, train_time=0.125 -[v016] 2022-01-31 06:47:59,222 (trainer:653) INFO: 104epoch:train:55-81batch: iter_time=0.002, forward_time=0.033, loss=2.006, loss_att=0.871, loss_ctc=3.141, acc=0.963, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.331e-04, train_time=0.098 -[v016] 2022-01-31 06:48:02,603 (trainer:653) INFO: 104epoch:train:82-108batch: iter_time=0.031, forward_time=0.032, loss=1.884, loss_att=0.861, loss_ctc=2.907, acc=0.963, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.331e-04, train_time=0.125 -[v016] 2022-01-31 06:48:05,083 (trainer:653) INFO: 104epoch:train:109-135batch: iter_time=8.047e-05, forward_time=0.031, loss=1.911, loss_att=0.920, loss_ctc=2.901, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.331e-04, train_time=0.092 -[v016] 2022-01-31 06:48:07,936 (trainer:653) INFO: 104epoch:train:136-162batch: iter_time=0.014, forward_time=0.031, loss=1.841, loss_att=0.796, loss_ctc=2.886, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.330e-04, train_time=0.105 -[v016] 2022-01-31 06:48:10,600 (trainer:653) INFO: 104epoch:train:163-189batch: iter_time=0.004, forward_time=0.032, loss=1.774, loss_att=0.796, loss_ctc=2.752, acc=0.966, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.330e-04, train_time=0.098 -[v016] 2022-01-31 06:48:13,044 (trainer:653) INFO: 104epoch:train:190-216batch: iter_time=9.111e-05, forward_time=0.031, loss=1.765, loss_att=0.909, loss_ctc=2.621, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.330e-04, train_time=0.090 -[v016] 2022-01-31 06:48:15,545 (trainer:653) INFO: 104epoch:train:217-243batch: iter_time=8.503e-05, forward_time=0.032, loss=1.689, loss_att=0.739, loss_ctc=2.638, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.330e-04, train_time=0.092 -[v016] 2022-01-31 06:48:18,161 (trainer:653) INFO: 104epoch:train:244-270batch: iter_time=0.005, forward_time=0.032, loss=1.518, loss_att=0.788, loss_ctc=2.248, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.329e-04, train_time=0.097 -[v016] 2022-01-31 06:48:20,690 (trainer:653) INFO: 104epoch:train:271-297batch: iter_time=8.827e-05, forward_time=0.032, loss=1.674, loss_att=0.761, loss_ctc=2.586, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.329e-04, train_time=0.093 -[v016] 2022-01-31 06:48:23,680 (trainer:653) INFO: 104epoch:train:298-324batch: iter_time=0.018, forward_time=0.032, loss=1.857, loss_att=0.881, loss_ctc=2.833, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.329e-04, train_time=0.111 -[v016] 2022-01-31 06:48:26,120 (trainer:653) INFO: 104epoch:train:325-351batch: iter_time=7.720e-05, forward_time=0.031, loss=1.615, loss_att=0.777, loss_ctc=2.453, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.328e-04, train_time=0.090 -[v016] 2022-01-31 06:48:28,571 (trainer:653) INFO: 104epoch:train:352-378batch: iter_time=0.002, forward_time=0.030, loss=1.575, loss_att=0.763, loss_ctc=2.386, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.328e-04, train_time=0.091 -[v016] 2022-01-31 06:48:32,564 (trainer:653) INFO: 104epoch:train:379-405batch: iter_time=0.057, forward_time=0.031, loss=1.687, loss_att=0.741, loss_ctc=2.633, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.328e-04, train_time=0.148 -[v016] 2022-01-31 06:48:35,123 (trainer:653) INFO: 104epoch:train:406-432batch: iter_time=9.397e-04, forward_time=0.032, loss=1.976, loss_att=0.922, loss_ctc=3.029, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.327e-04, train_time=0.095 -[v016] 2022-01-31 06:48:37,668 (trainer:653) INFO: 104epoch:train:433-459batch: iter_time=0.001, forward_time=0.032, loss=1.991, loss_att=0.903, loss_ctc=3.078, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.327e-04, train_time=0.094 -[v016] 2022-01-31 06:48:40,234 (trainer:653) INFO: 104epoch:train:460-486batch: iter_time=0.002, forward_time=0.032, loss=1.945, loss_att=0.896, loss_ctc=2.993, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.327e-04, train_time=0.095 -[v016] 2022-01-31 06:48:42,913 (trainer:653) INFO: 104epoch:train:487-513batch: iter_time=0.006, forward_time=0.032, loss=2.361, loss_att=1.002, loss_ctc=3.719, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.326e-04, train_time=0.099 -[v016] 2022-01-31 06:48:45,804 (trainer:653) INFO: 104epoch:train:514-540batch: iter_time=0.015, forward_time=0.031, loss=2.046, loss_att=0.970, loss_ctc=3.123, acc=0.952, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.326e-04, train_time=0.107 -[v016] 2022-01-31 06:49:20,004 (trainer:328) INFO: 104epoch results: [train] iter_time=0.012, forward_time=0.032, loss=1.846, loss_att=0.848, loss_ctc=2.845, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.329e-04, train_time=0.105, time=57.52 seconds, total_count=56888, gpu_max_cached_mem_GB=5.824, [valid] loss=7.028, loss_att=5.757, loss_ctc=8.298, acc=0.903, cer=0.098, wer=0.401, cer_ctc=0.147, time=5.78 seconds, total_count=18512, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.27 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:49:22,571 (trainer:375) INFO: The best model has been updated: train.loss -[v016] 2022-01-31 06:49:22,578 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/99epoch.pth -[v016] 2022-01-31 06:49:22,579 (trainer:261) INFO: 105/200epoch started. Estimated time to finish: 3 hours, 4 minutes and 11.18 seconds -[v016] 2022-01-31 06:49:26,056 (trainer:653) INFO: 105epoch:train:1-27batch: iter_time=0.033, forward_time=0.031, loss=1.861, loss_att=0.931, loss_ctc=2.790, acc=0.954, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.326e-04, train_time=0.125 -[v016] 2022-01-31 06:49:28,574 (trainer:653) INFO: 105epoch:train:28-54batch: iter_time=8.392e-05, forward_time=0.032, loss=1.768, loss_att=0.753, loss_ctc=2.783, acc=0.966, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.325e-04, train_time=0.094 -[v016] 2022-01-31 06:49:31,027 (trainer:653) INFO: 105epoch:train:55-81batch: iter_time=0.001, forward_time=0.030, loss=1.675, loss_att=0.799, loss_ctc=2.551, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.325e-04, train_time=0.091 -[v016] 2022-01-31 06:49:33,465 (trainer:653) INFO: 105epoch:train:82-108batch: iter_time=7.377e-05, forward_time=0.031, loss=1.668, loss_att=0.777, loss_ctc=2.558, acc=0.966, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.325e-04, train_time=0.090 -[v016] 2022-01-31 06:49:36,006 (trainer:653) INFO: 105epoch:train:109-135batch: iter_time=0.003, forward_time=0.031, loss=1.700, loss_att=0.795, loss_ctc=2.604, acc=0.964, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.324e-04, train_time=0.094 -[v016] 2022-01-31 06:49:38,491 (trainer:653) INFO: 105epoch:train:136-162batch: iter_time=8.108e-05, forward_time=0.031, loss=1.766, loss_att=0.863, loss_ctc=2.668, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.324e-04, train_time=0.092 -[v016] 2022-01-31 06:49:41,113 (trainer:653) INFO: 105epoch:train:163-189batch: iter_time=0.005, forward_time=0.031, loss=1.723, loss_att=0.785, loss_ctc=2.662, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.324e-04, train_time=0.097 -[v016] 2022-01-31 06:49:43,972 (trainer:653) INFO: 105epoch:train:190-216batch: iter_time=0.015, forward_time=0.031, loss=1.918, loss_att=0.907, loss_ctc=2.929, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.323e-04, train_time=0.106 -[v016] 2022-01-31 06:49:46,435 (trainer:653) INFO: 105epoch:train:217-243batch: iter_time=7.644e-05, forward_time=0.032, loss=2.001, loss_att=0.886, loss_ctc=3.117, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.323e-04, train_time=0.091 -[v016] 2022-01-31 06:49:48,931 (trainer:653) INFO: 105epoch:train:244-270batch: iter_time=7.998e-05, forward_time=0.032, loss=1.934, loss_att=0.883, loss_ctc=2.985, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.323e-04, train_time=0.092 -[v016] 2022-01-31 06:49:51,386 (trainer:653) INFO: 105epoch:train:271-297batch: iter_time=8.719e-05, forward_time=0.032, loss=1.703, loss_att=0.698, loss_ctc=2.709, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.323e-04, train_time=0.091 -[v016] 2022-01-31 06:49:53,916 (trainer:653) INFO: 105epoch:train:298-324batch: iter_time=0.001, forward_time=0.032, loss=1.501, loss_att=0.673, loss_ctc=2.328, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.322e-04, train_time=0.094 -[v016] 2022-01-31 06:49:56,471 (trainer:653) INFO: 105epoch:train:325-351batch: iter_time=8.770e-05, forward_time=0.033, loss=2.066, loss_att=0.872, loss_ctc=3.261, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.322e-04, train_time=0.094 -[v016] 2022-01-31 06:49:58,853 (trainer:653) INFO: 105epoch:train:352-378batch: iter_time=7.420e-05, forward_time=0.030, loss=1.452, loss_att=0.750, loss_ctc=2.154, acc=0.966, backward_time=0.020, optim_step_time=0.021, optim0_lr0=1.322e-04, train_time=0.088 -[v016] 2022-01-31 06:50:01,490 (trainer:653) INFO: 105epoch:train:379-405batch: iter_time=0.004, forward_time=0.032, loss=1.936, loss_att=0.874, loss_ctc=2.999, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.321e-04, train_time=0.097 -[v016] 2022-01-31 06:50:03,952 (trainer:653) INFO: 105epoch:train:406-432batch: iter_time=7.782e-05, forward_time=0.032, loss=1.691, loss_att=0.812, loss_ctc=2.569, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.321e-04, train_time=0.091 -[v016] 2022-01-31 06:50:07,130 (trainer:653) INFO: 105epoch:train:433-459batch: iter_time=0.026, forward_time=0.032, loss=1.979, loss_att=0.879, loss_ctc=3.079, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.321e-04, train_time=0.117 -[v016] 2022-01-31 06:50:09,676 (trainer:653) INFO: 105epoch:train:460-486batch: iter_time=0.002, forward_time=0.032, loss=2.017, loss_att=0.945, loss_ctc=3.089, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.320e-04, train_time=0.094 -[v016] 2022-01-31 06:50:12,274 (trainer:653) INFO: 105epoch:train:487-513batch: iter_time=0.004, forward_time=0.032, loss=1.577, loss_att=0.740, loss_ctc=2.414, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.320e-04, train_time=0.096 -[v016] 2022-01-31 06:50:14,849 (trainer:653) INFO: 105epoch:train:514-540batch: iter_time=0.002, forward_time=0.032, loss=2.056, loss_att=0.946, loss_ctc=3.167, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.320e-04, train_time=0.095 -[v016] 2022-01-31 06:50:49,254 (trainer:328) INFO: 105epoch results: [train] iter_time=0.005, forward_time=0.032, loss=1.801, loss_att=0.829, loss_ctc=2.772, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.323e-04, train_time=0.097, time=53.11 seconds, total_count=57435, gpu_max_cached_mem_GB=5.824, [valid] loss=6.949, loss_att=5.759, loss_ctc=8.140, acc=0.904, cer=0.102, wer=0.398, cer_ctc=0.146, time=5.66 seconds, total_count=18690, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.9 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:50:51,791 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:50:51,798 (trainer:261) INFO: 106/200epoch started. Estimated time to finish: 3 hours, 1 minute and 47.12 seconds -[v016] 2022-01-31 06:50:56,546 (trainer:653) INFO: 106epoch:train:1-27batch: iter_time=0.033, forward_time=0.056, loss=1.508, loss_att=0.746, loss_ctc=2.270, acc=0.961, backward_time=0.024, optim_step_time=0.028, optim0_lr0=1.319e-04, train_time=0.169 -[v016] 2022-01-31 06:50:59,154 (trainer:653) INFO: 106epoch:train:28-54batch: iter_time=0.003, forward_time=0.032, loss=1.724, loss_att=0.816, loss_ctc=2.632, acc=0.968, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.319e-04, train_time=0.096 -[v016] 2022-01-31 06:51:01,755 (trainer:653) INFO: 106epoch:train:55-81batch: iter_time=0.003, forward_time=0.031, loss=1.908, loss_att=0.859, loss_ctc=2.958, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.319e-04, train_time=0.096 -[v016] 2022-01-31 06:51:04,314 (trainer:653) INFO: 106epoch:train:82-108batch: iter_time=8.378e-05, forward_time=0.032, loss=1.898, loss_att=0.776, loss_ctc=3.021, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.318e-04, train_time=0.095 -[v016] 2022-01-31 06:51:06,922 (trainer:653) INFO: 106epoch:train:109-135batch: iter_time=0.003, forward_time=0.032, loss=1.791, loss_att=0.766, loss_ctc=2.816, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.318e-04, train_time=0.096 -[v016] 2022-01-31 06:51:09,664 (trainer:653) INFO: 106epoch:train:136-162batch: iter_time=0.009, forward_time=0.031, loss=2.140, loss_att=0.959, loss_ctc=3.320, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.318e-04, train_time=0.101 -[v016] 2022-01-31 06:51:12,092 (trainer:653) INFO: 106epoch:train:163-189batch: iter_time=7.804e-05, forward_time=0.031, loss=1.658, loss_att=0.749, loss_ctc=2.567, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.317e-04, train_time=0.090 -[v016] 2022-01-31 06:51:14,680 (trainer:653) INFO: 106epoch:train:190-216batch: iter_time=0.001, forward_time=0.032, loss=2.121, loss_att=0.960, loss_ctc=3.282, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.317e-04, train_time=0.096 -[v016] 2022-01-31 06:51:17,414 (trainer:653) INFO: 106epoch:train:217-243batch: iter_time=0.004, forward_time=0.033, loss=1.851, loss_att=0.829, loss_ctc=2.873, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.317e-04, train_time=0.101 -[v016] 2022-01-31 06:51:20,102 (trainer:653) INFO: 106epoch:train:244-270batch: iter_time=0.004, forward_time=0.032, loss=1.932, loss_att=0.821, loss_ctc=3.044, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.317e-04, train_time=0.099 -[v016] 2022-01-31 06:51:22,550 (trainer:653) INFO: 106epoch:train:271-297batch: iter_time=7.924e-05, forward_time=0.031, loss=1.655, loss_att=0.758, loss_ctc=2.552, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.316e-04, train_time=0.090 -[v016] 2022-01-31 06:51:25,131 (trainer:653) INFO: 106epoch:train:298-324batch: iter_time=0.003, forward_time=0.032, loss=1.818, loss_att=0.773, loss_ctc=2.864, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.316e-04, train_time=0.095 -[v016] 2022-01-31 06:51:27,559 (trainer:653) INFO: 106epoch:train:325-351batch: iter_time=8.266e-05, forward_time=0.030, loss=1.926, loss_att=0.903, loss_ctc=2.948, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.316e-04, train_time=0.090 -[v016] 2022-01-31 06:51:30,013 (trainer:653) INFO: 106epoch:train:352-378batch: iter_time=3.086e-04, forward_time=0.031, loss=1.499, loss_att=0.724, loss_ctc=2.274, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.315e-04, train_time=0.091 -[v016] 2022-01-31 06:51:32,542 (trainer:653) INFO: 106epoch:train:379-405batch: iter_time=0.003, forward_time=0.031, loss=1.726, loss_att=0.776, loss_ctc=2.676, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.315e-04, train_time=0.093 -[v016] 2022-01-31 06:51:35,123 (trainer:653) INFO: 106epoch:train:406-432batch: iter_time=0.003, forward_time=0.032, loss=1.936, loss_att=0.900, loss_ctc=2.972, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.315e-04, train_time=0.095 -[v016] 2022-01-31 06:51:37,628 (trainer:653) INFO: 106epoch:train:433-459batch: iter_time=0.003, forward_time=0.030, loss=1.687, loss_att=0.825, loss_ctc=2.548, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.314e-04, train_time=0.093 -[v016] 2022-01-31 06:51:40,618 (trainer:653) INFO: 106epoch:train:460-486batch: iter_time=0.018, forward_time=0.032, loss=1.829, loss_att=0.882, loss_ctc=2.777, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.314e-04, train_time=0.111 -[v016] 2022-01-31 06:51:43,015 (trainer:653) INFO: 106epoch:train:487-513batch: iter_time=7.644e-05, forward_time=0.030, loss=1.713, loss_att=0.838, loss_ctc=2.588, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.314e-04, train_time=0.089 -[v016] 2022-01-31 06:51:45,465 (trainer:653) INFO: 106epoch:train:514-540batch: iter_time=7.872e-05, forward_time=0.031, loss=1.743, loss_att=0.842, loss_ctc=2.644, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.313e-04, train_time=0.091 -[v016] 2022-01-31 06:52:26,356 (trainer:328) INFO: 106epoch results: [train] iter_time=0.005, forward_time=0.033, loss=1.795, loss_att=0.822, loss_ctc=2.768, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.316e-04, train_time=0.099, time=54.38 seconds, total_count=57982, gpu_max_cached_mem_GB=5.824, [valid] loss=7.009, loss_att=5.800, loss_ctc=8.219, acc=0.903, cer=0.102, wer=0.404, cer_ctc=0.149, time=11.42 seconds, total_count=18868, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.76 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:52:28,410 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:52:28,417 (trainer:261) INFO: 107/200epoch started. Estimated time to finish: 2 hours, 59 minutes and 32.42 seconds -[v016] 2022-01-31 06:52:31,272 (trainer:653) INFO: 107epoch:train:1-27batch: iter_time=0.009, forward_time=0.033, loss=1.383, loss_att=0.610, loss_ctc=2.157, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.313e-04, train_time=0.105 -[v016] 2022-01-31 06:52:33,867 (trainer:653) INFO: 107epoch:train:28-54batch: iter_time=0.005, forward_time=0.031, loss=1.704, loss_att=0.775, loss_ctc=2.634, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.313e-04, train_time=0.096 -[v016] 2022-01-31 06:52:36,367 (trainer:653) INFO: 107epoch:train:55-81batch: iter_time=8.197e-05, forward_time=0.032, loss=1.595, loss_att=0.721, loss_ctc=2.468, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.312e-04, train_time=0.092 -[v016] 2022-01-31 06:52:38,943 (trainer:653) INFO: 107epoch:train:82-108batch: iter_time=8.599e-05, forward_time=0.033, loss=1.847, loss_att=0.790, loss_ctc=2.905, acc=0.967, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.312e-04, train_time=0.095 -[v016] 2022-01-31 06:52:41,521 (trainer:653) INFO: 107epoch:train:109-135batch: iter_time=9.058e-05, forward_time=0.033, loss=1.984, loss_att=0.855, loss_ctc=3.114, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.312e-04, train_time=0.095 -[v016] 2022-01-31 06:52:44,104 (trainer:653) INFO: 107epoch:train:136-162batch: iter_time=0.006, forward_time=0.030, loss=1.843, loss_att=0.960, loss_ctc=2.726, acc=0.952, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.312e-04, train_time=0.095 -[v016] 2022-01-31 06:52:46,607 (trainer:653) INFO: 107epoch:train:163-189batch: iter_time=7.990e-05, forward_time=0.032, loss=1.853, loss_att=0.824, loss_ctc=2.883, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.311e-04, train_time=0.092 -[v016] 2022-01-31 06:52:49,400 (trainer:653) INFO: 107epoch:train:190-216batch: iter_time=0.008, forward_time=0.033, loss=1.879, loss_att=0.827, loss_ctc=2.931, acc=0.966, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.311e-04, train_time=0.103 -[v016] 2022-01-31 06:52:51,919 (trainer:653) INFO: 107epoch:train:217-243batch: iter_time=1.175e-04, forward_time=0.032, loss=1.612, loss_att=0.856, loss_ctc=2.369, acc=0.956, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.311e-04, train_time=0.093 -[v016] 2022-01-31 06:52:54,594 (trainer:653) INFO: 107epoch:train:244-270batch: iter_time=3.726e-04, forward_time=0.032, loss=1.973, loss_att=0.905, loss_ctc=3.040, acc=0.955, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.310e-04, train_time=0.099 -[v016] 2022-01-31 06:52:57,057 (trainer:653) INFO: 107epoch:train:271-297batch: iter_time=1.159e-04, forward_time=0.031, loss=1.609, loss_att=0.760, loss_ctc=2.459, acc=0.967, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.310e-04, train_time=0.091 -[v016] 2022-01-31 06:52:59,546 (trainer:653) INFO: 107epoch:train:298-324batch: iter_time=7.942e-05, forward_time=0.032, loss=1.689, loss_att=0.752, loss_ctc=2.625, acc=0.966, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.310e-04, train_time=0.092 -[v016] 2022-01-31 06:53:02,152 (trainer:653) INFO: 107epoch:train:325-351batch: iter_time=8.296e-05, forward_time=0.034, loss=2.014, loss_att=0.923, loss_ctc=3.105, acc=0.964, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.309e-04, train_time=0.096 -[v016] 2022-01-31 06:53:04,615 (trainer:653) INFO: 107epoch:train:352-378batch: iter_time=7.897e-05, forward_time=0.031, loss=1.714, loss_att=0.836, loss_ctc=2.593, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.309e-04, train_time=0.091 -[v016] 2022-01-31 06:53:07,219 (trainer:653) INFO: 107epoch:train:379-405batch: iter_time=8.341e-05, forward_time=0.033, loss=1.781, loss_att=0.819, loss_ctc=2.744, acc=0.964, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.309e-04, train_time=0.096 -[v016] 2022-01-31 06:53:09,706 (trainer:653) INFO: 107epoch:train:406-432batch: iter_time=8.876e-05, forward_time=0.032, loss=1.514, loss_att=0.764, loss_ctc=2.263, acc=0.963, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.309e-04, train_time=0.092 -[v016] 2022-01-31 06:53:12,272 (trainer:653) INFO: 107epoch:train:433-459batch: iter_time=8.711e-05, forward_time=0.033, loss=2.114, loss_att=0.980, loss_ctc=3.248, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.308e-04, train_time=0.095 -[v016] 2022-01-31 06:53:15,094 (trainer:653) INFO: 107epoch:train:460-486batch: iter_time=0.012, forward_time=0.032, loss=1.736, loss_att=0.881, loss_ctc=2.591, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.308e-04, train_time=0.104 -[v016] 2022-01-31 06:53:17,605 (trainer:653) INFO: 107epoch:train:487-513batch: iter_time=8.238e-05, forward_time=0.032, loss=1.822, loss_att=0.789, loss_ctc=2.855, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.308e-04, train_time=0.093 -[v016] 2022-01-31 06:53:20,050 (trainer:653) INFO: 107epoch:train:514-540batch: iter_time=7.937e-05, forward_time=0.031, loss=1.848, loss_att=0.853, loss_ctc=2.843, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.307e-04, train_time=0.090 -[v016] 2022-01-31 06:53:53,975 (trainer:328) INFO: 107epoch results: [train] iter_time=0.002, forward_time=0.032, loss=1.772, loss_att=0.823, loss_ctc=2.720, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.310e-04, train_time=0.095, time=52.32 seconds, total_count=58529, gpu_max_cached_mem_GB=5.824, [valid] loss=7.013, loss_att=5.760, loss_ctc=8.265, acc=0.905, cer=0.100, wer=0.393, cer_ctc=0.145, time=5.9 seconds, total_count=19046, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.34 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:53:56,159 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:53:56,283 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/91epoch.pth, exp/asr_train_asr_raw_en_word/101epoch.pth, exp/asr_train_asr_raw_en_word/103epoch.pth -[v016] 2022-01-31 06:53:56,287 (trainer:261) INFO: 108/200epoch started. Estimated time to finish: 2 hours, 57 minutes and 9.24 seconds -[v016] 2022-01-31 06:53:59,028 (trainer:653) INFO: 108epoch:train:1-27batch: iter_time=0.008, forward_time=0.031, loss=1.407, loss_att=0.687, loss_ctc=2.128, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.307e-04, train_time=0.101 -[v016] 2022-01-31 06:54:01,521 (trainer:653) INFO: 108epoch:train:28-54batch: iter_time=8.065e-05, forward_time=0.031, loss=1.893, loss_att=0.789, loss_ctc=2.997, acc=0.966, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.307e-04, train_time=0.092 -[v016] 2022-01-31 06:54:03,861 (trainer:653) INFO: 108epoch:train:55-81batch: iter_time=7.594e-05, forward_time=0.030, loss=1.465, loss_att=0.784, loss_ctc=2.145, acc=0.953, backward_time=0.020, optim_step_time=0.021, optim0_lr0=1.306e-04, train_time=0.086 -[v016] 2022-01-31 06:54:06,351 (trainer:653) INFO: 108epoch:train:82-108batch: iter_time=7.668e-05, forward_time=0.032, loss=1.996, loss_att=0.973, loss_ctc=3.018, acc=0.962, backward_time=0.020, optim_step_time=0.021, optim0_lr0=1.306e-04, train_time=0.092 -[v016] 2022-01-31 06:54:08,851 (trainer:653) INFO: 108epoch:train:109-135batch: iter_time=7.789e-05, forward_time=0.032, loss=1.945, loss_att=0.870, loss_ctc=3.019, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.306e-04, train_time=0.092 -[v016] 2022-01-31 06:54:11,423 (trainer:653) INFO: 108epoch:train:136-162batch: iter_time=8.054e-05, forward_time=0.033, loss=2.268, loss_att=0.887, loss_ctc=3.649, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.305e-04, train_time=0.095 -[v016] 2022-01-31 06:54:13,978 (trainer:653) INFO: 108epoch:train:163-189batch: iter_time=7.982e-05, forward_time=0.033, loss=1.755, loss_att=0.778, loss_ctc=2.731, acc=0.966, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.305e-04, train_time=0.094 -[v016] 2022-01-31 06:54:16,389 (trainer:653) INFO: 108epoch:train:190-216batch: iter_time=7.647e-05, forward_time=0.031, loss=1.764, loss_att=0.850, loss_ctc=2.679, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.305e-04, train_time=0.089 -[v016] 2022-01-31 06:54:19,745 (trainer:653) INFO: 108epoch:train:217-243batch: iter_time=0.034, forward_time=0.031, loss=1.587, loss_att=0.748, loss_ctc=2.427, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.305e-04, train_time=0.124 -[v016] 2022-01-31 06:54:22,245 (trainer:653) INFO: 108epoch:train:244-270batch: iter_time=7.890e-05, forward_time=0.032, loss=1.857, loss_att=0.860, loss_ctc=2.854, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.304e-04, train_time=0.092 -[v016] 2022-01-31 06:54:24,694 (trainer:653) INFO: 108epoch:train:271-297batch: iter_time=7.689e-05, forward_time=0.032, loss=1.598, loss_att=0.804, loss_ctc=2.393, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.304e-04, train_time=0.091 -[v016] 2022-01-31 06:54:27,105 (trainer:653) INFO: 108epoch:train:298-324batch: iter_time=8.231e-05, forward_time=0.031, loss=1.696, loss_att=0.783, loss_ctc=2.609, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.304e-04, train_time=0.089 -[v016] 2022-01-31 06:54:29,555 (trainer:653) INFO: 108epoch:train:325-351batch: iter_time=8.434e-05, forward_time=0.032, loss=1.596, loss_att=0.753, loss_ctc=2.439, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.303e-04, train_time=0.091 -[v016] 2022-01-31 06:54:31,996 (trainer:653) INFO: 108epoch:train:352-378batch: iter_time=7.886e-05, forward_time=0.031, loss=1.700, loss_att=0.813, loss_ctc=2.587, acc=0.963, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.303e-04, train_time=0.090 -[v016] 2022-01-31 06:54:34,571 (trainer:653) INFO: 108epoch:train:379-405batch: iter_time=7.844e-05, forward_time=0.033, loss=1.907, loss_att=0.835, loss_ctc=2.979, acc=0.966, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.303e-04, train_time=0.095 -[v016] 2022-01-31 06:54:37,006 (trainer:653) INFO: 108epoch:train:406-432batch: iter_time=7.711e-05, forward_time=0.032, loss=1.864, loss_att=0.853, loss_ctc=2.874, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.302e-04, train_time=0.090 -[v016] 2022-01-31 06:54:39,465 (trainer:653) INFO: 108epoch:train:433-459batch: iter_time=7.807e-05, forward_time=0.032, loss=1.837, loss_att=0.854, loss_ctc=2.819, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.302e-04, train_time=0.091 -[v016] 2022-01-31 06:54:41,947 (trainer:653) INFO: 108epoch:train:460-486batch: iter_time=7.695e-05, forward_time=0.032, loss=1.740, loss_att=0.746, loss_ctc=2.733, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.302e-04, train_time=0.092 -[v016] 2022-01-31 06:54:44,451 (trainer:653) INFO: 108epoch:train:487-513batch: iter_time=8.401e-05, forward_time=0.032, loss=1.735, loss_att=0.775, loss_ctc=2.694, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.302e-04, train_time=0.093 -[v016] 2022-01-31 06:54:46,939 (trainer:653) INFO: 108epoch:train:514-540batch: iter_time=7.846e-05, forward_time=0.032, loss=1.649, loss_att=0.806, loss_ctc=2.493, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.301e-04, train_time=0.092 -[v016] 2022-01-31 06:55:21,580 (trainer:328) INFO: 108epoch results: [train] iter_time=0.002, forward_time=0.032, loss=1.759, loss_att=0.811, loss_ctc=2.707, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.304e-04, train_time=0.094, time=51.4 seconds, total_count=59076, gpu_max_cached_mem_GB=5.824, [valid] loss=7.145, loss_att=5.920, loss_ctc=8.369, acc=0.903, cer=0.104, wer=0.409, cer_ctc=0.149, time=6.37 seconds, total_count=19224, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.53 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:55:23,605 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:55:23,613 (trainer:261) INFO: 109/200epoch started. Estimated time to finish: 2 hours, 54 minutes and 46.76 seconds -[v016] 2022-01-31 06:55:26,608 (trainer:653) INFO: 109epoch:train:1-27batch: iter_time=0.012, forward_time=0.033, loss=1.732, loss_att=0.763, loss_ctc=2.701, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.301e-04, train_time=0.108 -[v016] 2022-01-31 06:55:29,105 (trainer:653) INFO: 109epoch:train:28-54batch: iter_time=8.131e-05, forward_time=0.032, loss=1.429, loss_att=0.626, loss_ctc=2.232, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.301e-04, train_time=0.092 -[v016] 2022-01-31 06:55:31,546 (trainer:653) INFO: 109epoch:train:55-81batch: iter_time=8.140e-05, forward_time=0.031, loss=1.666, loss_att=0.778, loss_ctc=2.554, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.300e-04, train_time=0.090 -[v016] 2022-01-31 06:55:33,959 (trainer:653) INFO: 109epoch:train:82-108batch: iter_time=7.760e-05, forward_time=0.031, loss=1.390, loss_att=0.667, loss_ctc=2.114, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.300e-04, train_time=0.089 -[v016] 2022-01-31 06:55:36,609 (trainer:653) INFO: 109epoch:train:109-135batch: iter_time=0.005, forward_time=0.032, loss=1.861, loss_att=0.775, loss_ctc=2.948, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.300e-04, train_time=0.098 -[v016] 2022-01-31 06:55:39,115 (trainer:653) INFO: 109epoch:train:136-162batch: iter_time=7.875e-05, forward_time=0.032, loss=1.580, loss_att=0.748, loss_ctc=2.413, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.299e-04, train_time=0.093 -[v016] 2022-01-31 06:55:41,712 (trainer:653) INFO: 109epoch:train:163-189batch: iter_time=7.523e-05, forward_time=0.033, loss=1.905, loss_att=0.714, loss_ctc=3.095, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.299e-04, train_time=0.096 -[v016] 2022-01-31 06:55:44,116 (trainer:653) INFO: 109epoch:train:190-216batch: iter_time=8.156e-05, forward_time=0.030, loss=1.644, loss_att=0.821, loss_ctc=2.468, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.299e-04, train_time=0.089 -[v016] 2022-01-31 06:55:46,565 (trainer:653) INFO: 109epoch:train:217-243batch: iter_time=7.882e-05, forward_time=0.031, loss=1.722, loss_att=0.769, loss_ctc=2.676, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.299e-04, train_time=0.090 -[v016] 2022-01-31 06:55:49,107 (trainer:653) INFO: 109epoch:train:244-270batch: iter_time=8.370e-05, forward_time=0.033, loss=1.796, loss_att=0.784, loss_ctc=2.807, acc=0.966, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.298e-04, train_time=0.094 -[v016] 2022-01-31 06:55:51,864 (trainer:653) INFO: 109epoch:train:271-297batch: iter_time=0.014, forward_time=0.030, loss=1.653, loss_att=0.776, loss_ctc=2.530, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.298e-04, train_time=0.102 -[v016] 2022-01-31 06:55:54,287 (trainer:653) INFO: 109epoch:train:298-324batch: iter_time=8.124e-05, forward_time=0.031, loss=1.485, loss_att=0.703, loss_ctc=2.266, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.298e-04, train_time=0.090 -[v016] 2022-01-31 06:55:56,754 (trainer:653) INFO: 109epoch:train:325-351batch: iter_time=8.392e-05, forward_time=0.031, loss=1.749, loss_att=0.868, loss_ctc=2.631, acc=0.955, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.297e-04, train_time=0.091 -[v016] 2022-01-31 06:55:59,222 (trainer:653) INFO: 109epoch:train:352-378batch: iter_time=7.758e-05, forward_time=0.032, loss=1.665, loss_att=0.799, loss_ctc=2.531, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.297e-04, train_time=0.091 -[v016] 2022-01-31 06:56:01,757 (trainer:653) INFO: 109epoch:train:379-405batch: iter_time=7.648e-05, forward_time=0.033, loss=1.952, loss_att=0.815, loss_ctc=3.089, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.297e-04, train_time=0.094 -[v016] 2022-01-31 06:56:04,164 (trainer:653) INFO: 109epoch:train:406-432batch: iter_time=7.751e-05, forward_time=0.031, loss=1.854, loss_att=0.933, loss_ctc=2.776, acc=0.951, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.296e-04, train_time=0.089 -[v016] 2022-01-31 06:56:06,705 (trainer:653) INFO: 109epoch:train:433-459batch: iter_time=8.103e-05, forward_time=0.032, loss=1.793, loss_att=0.779, loss_ctc=2.808, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.296e-04, train_time=0.094 -[v016] 2022-01-31 06:56:09,196 (trainer:653) INFO: 109epoch:train:460-486batch: iter_time=7.873e-05, forward_time=0.032, loss=1.859, loss_att=0.825, loss_ctc=2.892, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.296e-04, train_time=0.092 -[v016] 2022-01-31 06:56:11,679 (trainer:653) INFO: 109epoch:train:487-513batch: iter_time=7.803e-05, forward_time=0.032, loss=1.806, loss_att=0.893, loss_ctc=2.719, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.296e-04, train_time=0.092 -[v016] 2022-01-31 06:56:14,108 (trainer:653) INFO: 109epoch:train:514-540batch: iter_time=7.649e-05, forward_time=0.031, loss=1.695, loss_att=0.833, loss_ctc=2.556, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.295e-04, train_time=0.090 -[v016] 2022-01-31 06:56:47,416 (trainer:328) INFO: 109epoch results: [train] iter_time=0.002, forward_time=0.032, loss=1.708, loss_att=0.783, loss_ctc=2.633, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.298e-04, train_time=0.093, time=51.16 seconds, total_count=59623, gpu_max_cached_mem_GB=5.824, [valid] loss=7.162, loss_att=5.816, loss_ctc=8.508, acc=0.902, cer=0.103, wer=0.411, cer_ctc=0.152, time=5.48 seconds, total_count=19402, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.14 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:56:49,938 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:56:49,984 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/104epoch.pth -[v016] 2022-01-31 06:56:49,984 (trainer:261) INFO: 110/200epoch started. Estimated time to finish: 2 hours, 52 minutes and 24.54 seconds -[v016] 2022-01-31 06:56:53,169 (trainer:653) INFO: 110epoch:train:1-27batch: iter_time=0.020, forward_time=0.032, loss=1.685, loss_att=0.785, loss_ctc=2.586, acc=0.967, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.295e-04, train_time=0.115 -[v016] 2022-01-31 06:56:55,899 (trainer:653) INFO: 110epoch:train:28-54batch: iter_time=0.007, forward_time=0.032, loss=1.821, loss_att=0.743, loss_ctc=2.899, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.295e-04, train_time=0.101 -[v016] 2022-01-31 06:56:58,712 (trainer:653) INFO: 110epoch:train:55-81batch: iter_time=0.011, forward_time=0.032, loss=1.853, loss_att=0.758, loss_ctc=2.947, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.294e-04, train_time=0.104 -[v016] 2022-01-31 06:57:01,232 (trainer:653) INFO: 110epoch:train:82-108batch: iter_time=0.001, forward_time=0.032, loss=1.629, loss_att=0.728, loss_ctc=2.529, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.294e-04, train_time=0.093 -[v016] 2022-01-31 06:57:03,806 (trainer:653) INFO: 110epoch:train:109-135batch: iter_time=0.002, forward_time=0.032, loss=1.823, loss_att=0.801, loss_ctc=2.845, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.294e-04, train_time=0.095 -[v016] 2022-01-31 06:57:06,303 (trainer:653) INFO: 110epoch:train:136-162batch: iter_time=4.525e-04, forward_time=0.032, loss=1.604, loss_att=0.672, loss_ctc=2.537, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.293e-04, train_time=0.092 -[v016] 2022-01-31 06:57:08,839 (trainer:653) INFO: 110epoch:train:163-189batch: iter_time=0.003, forward_time=0.031, loss=1.745, loss_att=0.816, loss_ctc=2.673, acc=0.957, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.293e-04, train_time=0.094 -[v016] 2022-01-31 06:57:11,263 (trainer:653) INFO: 110epoch:train:190-216batch: iter_time=8.223e-05, forward_time=0.030, loss=1.634, loss_att=0.820, loss_ctc=2.448, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.293e-04, train_time=0.090 -[v016] 2022-01-31 06:57:13,674 (trainer:653) INFO: 110epoch:train:217-243batch: iter_time=4.835e-04, forward_time=0.030, loss=1.716, loss_att=0.785, loss_ctc=2.647, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.293e-04, train_time=0.089 -[v016] 2022-01-31 06:57:16,109 (trainer:653) INFO: 110epoch:train:244-270batch: iter_time=7.534e-05, forward_time=0.030, loss=1.518, loss_att=0.761, loss_ctc=2.275, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.292e-04, train_time=0.090 -[v016] 2022-01-31 06:57:18,702 (trainer:653) INFO: 110epoch:train:271-297batch: iter_time=0.004, forward_time=0.031, loss=1.954, loss_att=0.911, loss_ctc=2.997, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.292e-04, train_time=0.096 -[v016] 2022-01-31 06:57:21,406 (trainer:653) INFO: 110epoch:train:298-324batch: iter_time=0.008, forward_time=0.032, loss=1.825, loss_att=0.838, loss_ctc=2.813, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.292e-04, train_time=0.100 -[v016] 2022-01-31 06:57:23,917 (trainer:653) INFO: 110epoch:train:325-351batch: iter_time=9.676e-04, forward_time=0.031, loss=1.729, loss_att=0.807, loss_ctc=2.652, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.291e-04, train_time=0.093 -[v016] 2022-01-31 06:57:26,867 (trainer:653) INFO: 110epoch:train:352-378batch: iter_time=0.014, forward_time=0.033, loss=1.681, loss_att=0.768, loss_ctc=2.594, acc=0.966, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.291e-04, train_time=0.109 -[v016] 2022-01-31 06:57:29,450 (trainer:653) INFO: 110epoch:train:379-405batch: iter_time=0.003, forward_time=0.032, loss=1.781, loss_att=0.864, loss_ctc=2.699, acc=0.956, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.291e-04, train_time=0.095 -[v016] 2022-01-31 06:57:31,982 (trainer:653) INFO: 110epoch:train:406-432batch: iter_time=7.354e-04, forward_time=0.031, loss=1.570, loss_att=0.786, loss_ctc=2.354, acc=0.968, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.291e-04, train_time=0.094 -[v016] 2022-01-31 06:57:34,821 (trainer:653) INFO: 110epoch:train:433-459batch: iter_time=0.011, forward_time=0.032, loss=1.894, loss_att=0.768, loss_ctc=3.020, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.290e-04, train_time=0.105 -[v016] 2022-01-31 06:57:37,378 (trainer:653) INFO: 110epoch:train:460-486batch: iter_time=0.004, forward_time=0.030, loss=1.862, loss_att=0.911, loss_ctc=2.813, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.290e-04, train_time=0.095 -[v016] 2022-01-31 06:57:39,912 (trainer:653) INFO: 110epoch:train:487-513batch: iter_time=3.815e-04, forward_time=0.032, loss=1.712, loss_att=0.721, loss_ctc=2.702, acc=0.970, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.290e-04, train_time=0.094 -[v016] 2022-01-31 06:57:42,482 (trainer:653) INFO: 110epoch:train:514-540batch: iter_time=0.002, forward_time=0.032, loss=1.869, loss_att=0.906, loss_ctc=2.832, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.289e-04, train_time=0.095 -[v016] 2022-01-31 06:58:17,530 (trainer:328) INFO: 110epoch results: [train] iter_time=0.005, forward_time=0.031, loss=1.740, loss_att=0.795, loss_ctc=2.686, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.292e-04, train_time=0.097, time=53.21 seconds, total_count=60170, gpu_max_cached_mem_GB=5.824, [valid] loss=7.067, loss_att=5.829, loss_ctc=8.304, acc=0.903, cer=0.101, wer=0.405, cer_ctc=0.151, time=6.58 seconds, total_count=19580, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.76 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:58:19,644 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 06:58:19,652 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/105epoch.pth -[v016] 2022-01-31 06:58:19,652 (trainer:261) INFO: 111/200epoch started. Estimated time to finish: 2 hours, 50 minutes and 6.85 seconds -[v016] 2022-01-31 06:58:22,806 (trainer:653) INFO: 111epoch:train:1-27batch: iter_time=0.021, forward_time=0.033, loss=1.642, loss_att=0.756, loss_ctc=2.528, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.289e-04, train_time=0.115 -[v016] 2022-01-31 06:58:25,938 (trainer:653) INFO: 111epoch:train:28-54batch: iter_time=0.024, forward_time=0.031, loss=1.707, loss_att=0.742, loss_ctc=2.673, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.289e-04, train_time=0.116 -[v016] 2022-01-31 06:58:29,158 (trainer:653) INFO: 111epoch:train:55-81batch: iter_time=0.029, forward_time=0.031, loss=1.404, loss_att=0.671, loss_ctc=2.137, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.288e-04, train_time=0.119 -[v016] 2022-01-31 06:58:31,961 (trainer:653) INFO: 111epoch:train:82-108batch: iter_time=0.009, forward_time=0.032, loss=1.806, loss_att=0.835, loss_ctc=2.777, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.288e-04, train_time=0.104 -[v016] 2022-01-31 06:58:34,907 (trainer:653) INFO: 111epoch:train:109-135batch: iter_time=0.017, forward_time=0.032, loss=1.836, loss_att=0.840, loss_ctc=2.833, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.288e-04, train_time=0.109 -[v016] 2022-01-31 06:58:37,314 (trainer:653) INFO: 111epoch:train:136-162batch: iter_time=7.581e-05, forward_time=0.030, loss=1.573, loss_att=0.770, loss_ctc=2.377, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.288e-04, train_time=0.089 -[v016] 2022-01-31 06:58:39,803 (trainer:653) INFO: 111epoch:train:163-189batch: iter_time=7.619e-05, forward_time=0.032, loss=1.818, loss_att=0.766, loss_ctc=2.869, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.287e-04, train_time=0.092 -[v016] 2022-01-31 06:58:42,311 (trainer:653) INFO: 111epoch:train:190-216batch: iter_time=7.754e-04, forward_time=0.031, loss=1.647, loss_att=0.750, loss_ctc=2.543, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.287e-04, train_time=0.093 -[v016] 2022-01-31 06:58:45,091 (trainer:653) INFO: 111epoch:train:217-243batch: iter_time=0.012, forward_time=0.031, loss=1.899, loss_att=0.883, loss_ctc=2.915, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.287e-04, train_time=0.103 -[v016] 2022-01-31 06:58:47,831 (trainer:653) INFO: 111epoch:train:244-270batch: iter_time=0.002, forward_time=0.034, loss=1.770, loss_att=0.829, loss_ctc=2.710, acc=0.960, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.286e-04, train_time=0.101 -[v016] 2022-01-31 06:58:50,535 (trainer:653) INFO: 111epoch:train:271-297batch: iter_time=1.024e-04, forward_time=0.035, loss=1.866, loss_att=0.785, loss_ctc=2.947, acc=0.969, backward_time=0.024, optim_step_time=0.022, optim0_lr0=1.286e-04, train_time=0.100 -[v016] 2022-01-31 06:58:53,246 (trainer:653) INFO: 111epoch:train:298-324batch: iter_time=1.053e-04, forward_time=0.035, loss=1.429, loss_att=0.658, loss_ctc=2.201, acc=0.969, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.286e-04, train_time=0.100 -[v016] 2022-01-31 06:58:55,965 (trainer:653) INFO: 111epoch:train:325-351batch: iter_time=0.002, forward_time=0.034, loss=1.760, loss_att=0.792, loss_ctc=2.729, acc=0.962, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.286e-04, train_time=0.100 -[v016] 2022-01-31 06:58:59,111 (trainer:653) INFO: 111epoch:train:352-378batch: iter_time=0.015, forward_time=0.035, loss=1.663, loss_att=0.668, loss_ctc=2.659, acc=0.974, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.285e-04, train_time=0.116 -[v016] 2022-01-31 06:59:02,134 (trainer:653) INFO: 111epoch:train:379-405batch: iter_time=0.009, forward_time=0.035, loss=1.646, loss_att=0.699, loss_ctc=2.594, acc=0.965, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.285e-04, train_time=0.112 -[v016] 2022-01-31 06:59:05,046 (trainer:653) INFO: 111epoch:train:406-432batch: iter_time=0.005, forward_time=0.035, loss=1.732, loss_att=0.754, loss_ctc=2.710, acc=0.965, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.285e-04, train_time=0.108 -[v016] 2022-01-31 06:59:07,779 (trainer:653) INFO: 111epoch:train:433-459batch: iter_time=1.189e-04, forward_time=0.034, loss=1.642, loss_att=0.718, loss_ctc=2.565, acc=0.964, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.284e-04, train_time=0.101 -[v016] 2022-01-31 06:59:10,520 (trainer:653) INFO: 111epoch:train:460-486batch: iter_time=1.264e-04, forward_time=0.035, loss=1.746, loss_att=0.733, loss_ctc=2.760, acc=0.967, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.284e-04, train_time=0.101 -[v016] 2022-01-31 06:59:13,438 (trainer:653) INFO: 111epoch:train:487-513batch: iter_time=1.219e-04, forward_time=0.040, loss=1.812, loss_att=0.767, loss_ctc=2.857, acc=0.966, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.284e-04, train_time=0.108 -[v016] 2022-01-31 06:59:16,044 (trainer:653) INFO: 111epoch:train:514-540batch: iter_time=2.861e-04, forward_time=0.033, loss=1.701, loss_att=0.876, loss_ctc=2.526, acc=0.962, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.284e-04, train_time=0.096 -[v016] 2022-01-31 06:59:53,773 (trainer:328) INFO: 111epoch results: [train] iter_time=0.008, forward_time=0.033, loss=1.702, loss_att=0.763, loss_ctc=2.642, acc=0.965, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.286e-04, train_time=0.105, time=57.44 seconds, total_count=60717, gpu_max_cached_mem_GB=5.824, [valid] loss=7.185, loss_att=5.919, loss_ctc=8.451, acc=0.904, cer=0.098, wer=0.400, cer_ctc=0.149, time=6.65 seconds, total_count=19758, gpu_max_cached_mem_GB=5.824, [att_plot] time=30.03 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 06:59:56,175 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 06:59:56,220 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/106epoch.pth -[v016] 2022-01-31 06:59:56,220 (trainer:261) INFO: 112/200epoch started. Estimated time to finish: 2 hours, 47 minutes and 56.97 seconds -[v016] 2022-01-31 06:59:59,911 (trainer:653) INFO: 112epoch:train:1-27batch: iter_time=0.039, forward_time=0.033, loss=1.785, loss_att=0.848, loss_ctc=2.722, acc=0.961, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.283e-04, train_time=0.136 -[v016] 2022-01-31 07:00:03,905 (trainer:653) INFO: 112epoch:train:28-54batch: iter_time=0.053, forward_time=0.032, loss=1.546, loss_att=0.634, loss_ctc=2.458, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.283e-04, train_time=0.148 -[v016] 2022-01-31 07:00:06,760 (trainer:653) INFO: 112epoch:train:55-81batch: iter_time=0.016, forward_time=0.030, loss=1.514, loss_att=0.773, loss_ctc=2.254, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.283e-04, train_time=0.106 -[v016] 2022-01-31 07:00:09,481 (trainer:653) INFO: 112epoch:train:82-108batch: iter_time=0.010, forward_time=0.031, loss=1.647, loss_att=0.770, loss_ctc=2.525, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.282e-04, train_time=0.101 -[v016] 2022-01-31 07:00:12,380 (trainer:653) INFO: 112epoch:train:109-135batch: iter_time=0.016, forward_time=0.031, loss=1.814, loss_att=0.789, loss_ctc=2.839, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.282e-04, train_time=0.107 -[v016] 2022-01-31 07:00:14,973 (trainer:653) INFO: 112epoch:train:136-162batch: iter_time=0.006, forward_time=0.030, loss=1.843, loss_att=0.937, loss_ctc=2.750, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.282e-04, train_time=0.096 -[v016] 2022-01-31 07:00:18,227 (trainer:653) INFO: 112epoch:train:163-189batch: iter_time=0.026, forward_time=0.032, loss=1.681, loss_att=0.709, loss_ctc=2.652, acc=0.966, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.281e-04, train_time=0.120 -[v016] 2022-01-31 07:00:20,826 (trainer:653) INFO: 112epoch:train:190-216batch: iter_time=0.001, forward_time=0.032, loss=1.790, loss_att=0.739, loss_ctc=2.842, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.281e-04, train_time=0.096 -[v016] 2022-01-31 07:00:24,114 (trainer:653) INFO: 112epoch:train:217-243batch: iter_time=0.031, forward_time=0.031, loss=1.611, loss_att=0.748, loss_ctc=2.474, acc=0.966, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.281e-04, train_time=0.122 -[v016] 2022-01-31 07:00:28,584 (trainer:653) INFO: 112epoch:train:244-270batch: iter_time=0.072, forward_time=0.032, loss=1.967, loss_att=0.769, loss_ctc=3.166, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.281e-04, train_time=0.165 -[v016] 2022-01-31 07:00:31,111 (trainer:653) INFO: 112epoch:train:271-297batch: iter_time=0.001, forward_time=0.031, loss=2.017, loss_att=0.928, loss_ctc=3.106, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.280e-04, train_time=0.093 -[v016] 2022-01-31 07:00:35,242 (trainer:653) INFO: 112epoch:train:298-324batch: iter_time=0.060, forward_time=0.032, loss=1.855, loss_att=0.761, loss_ctc=2.948, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.280e-04, train_time=0.153 -[v016] 2022-01-31 07:00:38,464 (trainer:653) INFO: 112epoch:train:325-351batch: iter_time=0.027, forward_time=0.031, loss=1.742, loss_att=0.781, loss_ctc=2.702, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.280e-04, train_time=0.119 -[v016] 2022-01-31 07:00:41,139 (trainer:653) INFO: 112epoch:train:352-378batch: iter_time=0.006, forward_time=0.031, loss=1.630, loss_att=0.793, loss_ctc=2.467, acc=0.966, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.279e-04, train_time=0.099 -[v016] 2022-01-31 07:00:44,209 (trainer:653) INFO: 112epoch:train:379-405batch: iter_time=0.023, forward_time=0.030, loss=1.596, loss_att=0.736, loss_ctc=2.457, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.279e-04, train_time=0.114 -[v016] 2022-01-31 07:00:49,453 (trainer:653) INFO: 112epoch:train:406-432batch: iter_time=0.023, forward_time=0.101, loss=1.897, loss_att=0.785, loss_ctc=3.009, acc=0.965, backward_time=0.026, optim_step_time=0.025, optim0_lr0=1.279e-04, train_time=0.194 -[v016] 2022-01-31 07:00:52,214 (trainer:653) INFO: 112epoch:train:433-459batch: iter_time=0.010, forward_time=0.032, loss=1.827, loss_att=0.817, loss_ctc=2.838, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.279e-04, train_time=0.102 -[v016] 2022-01-31 07:00:55,384 (trainer:653) INFO: 112epoch:train:460-486batch: iter_time=0.030, forward_time=0.030, loss=1.568, loss_att=0.811, loss_ctc=2.325, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.278e-04, train_time=0.117 -[v016] 2022-01-31 07:00:58,465 (trainer:653) INFO: 112epoch:train:487-513batch: iter_time=0.023, forward_time=0.031, loss=1.648, loss_att=0.824, loss_ctc=2.472, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.278e-04, train_time=0.114 -[v016] 2022-01-31 07:01:01,440 (trainer:653) INFO: 112epoch:train:514-540batch: iter_time=0.018, forward_time=0.031, loss=1.639, loss_att=0.680, loss_ctc=2.599, acc=0.972, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.278e-04, train_time=0.110 -[v016] 2022-01-31 07:01:46,117 (trainer:328) INFO: 112epoch results: [train] iter_time=0.024, forward_time=0.035, loss=1.725, loss_att=0.780, loss_ctc=2.671, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.280e-04, train_time=0.120, time=1 minute and 5.97 seconds, total_count=61264, gpu_max_cached_mem_GB=5.824, [valid] loss=7.016, loss_att=5.861, loss_ctc=8.171, acc=0.904, cer=0.101, wer=0.398, cer_ctc=0.149, time=16.34 seconds, total_count=19936, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.58 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:01:48,452 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 07:01:48,460 (trainer:261) INFO: 113/200epoch started. Estimated time to finish: 2 hours, 46 minutes and 2.81 seconds -[v016] 2022-01-31 07:01:51,352 (trainer:653) INFO: 113epoch:train:1-27batch: iter_time=0.009, forward_time=0.033, loss=1.757, loss_att=0.697, loss_ctc=2.816, acc=0.974, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.277e-04, train_time=0.107 -[v016] 2022-01-31 07:01:53,845 (trainer:653) INFO: 113epoch:train:28-54batch: iter_time=8.397e-05, forward_time=0.032, loss=1.998, loss_att=0.849, loss_ctc=3.147, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.277e-04, train_time=0.092 -[v016] 2022-01-31 07:01:56,245 (trainer:653) INFO: 113epoch:train:55-81batch: iter_time=7.539e-05, forward_time=0.030, loss=1.321, loss_att=0.680, loss_ctc=1.961, acc=0.966, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.277e-04, train_time=0.089 -[v016] 2022-01-31 07:01:58,766 (trainer:653) INFO: 113epoch:train:82-108batch: iter_time=7.381e-05, forward_time=0.032, loss=1.743, loss_att=0.790, loss_ctc=2.695, acc=0.962, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.277e-04, train_time=0.093 -[v016] 2022-01-31 07:02:01,268 (trainer:653) INFO: 113epoch:train:109-135batch: iter_time=7.409e-05, forward_time=0.032, loss=1.993, loss_att=0.846, loss_ctc=3.140, acc=0.960, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.276e-04, train_time=0.092 -[v016] 2022-01-31 07:02:03,665 (trainer:653) INFO: 113epoch:train:136-162batch: iter_time=7.275e-05, forward_time=0.030, loss=1.685, loss_att=0.781, loss_ctc=2.589, acc=0.959, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.276e-04, train_time=0.089 -[v016] 2022-01-31 07:02:06,083 (trainer:653) INFO: 113epoch:train:163-189batch: iter_time=7.216e-05, forward_time=0.031, loss=1.591, loss_att=0.713, loss_ctc=2.469, acc=0.966, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.276e-04, train_time=0.089 -[v016] 2022-01-31 07:02:08,567 (trainer:653) INFO: 113epoch:train:190-216batch: iter_time=7.900e-05, forward_time=0.032, loss=1.857, loss_att=0.820, loss_ctc=2.895, acc=0.967, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.275e-04, train_time=0.092 -[v016] 2022-01-31 07:02:11,121 (trainer:653) INFO: 113epoch:train:217-243batch: iter_time=0.004, forward_time=0.031, loss=1.655, loss_att=0.724, loss_ctc=2.586, acc=0.969, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.275e-04, train_time=0.094 -[v016] 2022-01-31 07:02:13,597 (trainer:653) INFO: 113epoch:train:244-270batch: iter_time=7.238e-05, forward_time=0.032, loss=1.640, loss_att=0.801, loss_ctc=2.479, acc=0.964, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.275e-04, train_time=0.091 -[v016] 2022-01-31 07:02:15,953 (trainer:653) INFO: 113epoch:train:271-297batch: iter_time=7.615e-05, forward_time=0.030, loss=1.431, loss_att=0.719, loss_ctc=2.143, acc=0.964, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.275e-04, train_time=0.087 -[v016] 2022-01-31 07:02:18,381 (trainer:653) INFO: 113epoch:train:298-324batch: iter_time=7.442e-05, forward_time=0.031, loss=1.838, loss_att=0.773, loss_ctc=2.902, acc=0.968, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.274e-04, train_time=0.090 -[v016] 2022-01-31 07:02:20,786 (trainer:653) INFO: 113epoch:train:325-351batch: iter_time=7.394e-05, forward_time=0.031, loss=1.618, loss_att=0.736, loss_ctc=2.500, acc=0.963, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.274e-04, train_time=0.089 -[v016] 2022-01-31 07:02:23,247 (trainer:653) INFO: 113epoch:train:352-378batch: iter_time=7.537e-05, forward_time=0.031, loss=1.590, loss_att=0.701, loss_ctc=2.478, acc=0.965, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.274e-04, train_time=0.091 -[v016] 2022-01-31 07:02:25,656 (trainer:653) INFO: 113epoch:train:379-405batch: iter_time=8.117e-05, forward_time=0.031, loss=1.697, loss_att=0.771, loss_ctc=2.624, acc=0.965, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.274e-04, train_time=0.089 -[v016] 2022-01-31 07:02:28,108 (trainer:653) INFO: 113epoch:train:406-432batch: iter_time=7.919e-05, forward_time=0.031, loss=1.700, loss_att=0.783, loss_ctc=2.618, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.273e-04, train_time=0.091 -[v016] 2022-01-31 07:02:30,620 (trainer:653) INFO: 113epoch:train:433-459batch: iter_time=8.643e-05, forward_time=0.032, loss=2.045, loss_att=0.930, loss_ctc=3.160, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.273e-04, train_time=0.093 -[v016] 2022-01-31 07:02:33,126 (trainer:653) INFO: 113epoch:train:460-486batch: iter_time=8.210e-05, forward_time=0.032, loss=1.696, loss_att=0.743, loss_ctc=2.649, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.273e-04, train_time=0.093 -[v016] 2022-01-31 07:02:35,558 (trainer:653) INFO: 113epoch:train:487-513batch: iter_time=7.756e-05, forward_time=0.031, loss=1.812, loss_att=0.917, loss_ctc=2.706, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.272e-04, train_time=0.090 -[v016] 2022-01-31 07:02:38,510 (trainer:653) INFO: 113epoch:train:514-540batch: iter_time=0.017, forward_time=0.032, loss=1.666, loss_att=0.840, loss_ctc=2.492, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.272e-04, train_time=0.109 -[v016] 2022-01-31 07:03:11,679 (trainer:328) INFO: 113epoch results: [train] iter_time=0.002, forward_time=0.031, loss=1.721, loss_att=0.781, loss_ctc=2.660, acc=0.964, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.275e-04, train_time=0.092, time=50.79 seconds, total_count=61811, gpu_max_cached_mem_GB=5.824, [valid] loss=7.104, loss_att=5.793, loss_ctc=8.415, acc=0.904, cer=0.098, wer=0.394, cer_ctc=0.146, time=5.45 seconds, total_count=20114, gpu_max_cached_mem_GB=5.824, [att_plot] time=26.98 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:03:13,666 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 07:03:13,710 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/108epoch.pth -[v016] 2022-01-31 07:03:13,710 (trainer:261) INFO: 114/200epoch started. Estimated time to finish: 2 hours, 43 minutes and 43.43 seconds -[v016] 2022-01-31 07:03:16,412 (trainer:653) INFO: 114epoch:train:1-27batch: iter_time=0.004, forward_time=0.033, loss=1.560, loss_att=0.664, loss_ctc=2.457, acc=0.973, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.272e-04, train_time=0.100 -[v016] 2022-01-31 07:03:18,939 (trainer:653) INFO: 114epoch:train:28-54batch: iter_time=8.323e-05, forward_time=0.033, loss=1.734, loss_att=0.755, loss_ctc=2.713, acc=0.967, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.272e-04, train_time=0.093 -[v016] 2022-01-31 07:03:21,385 (trainer:653) INFO: 114epoch:train:55-81batch: iter_time=7.653e-05, forward_time=0.032, loss=1.737, loss_att=0.748, loss_ctc=2.726, acc=0.968, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.271e-04, train_time=0.090 -[v016] 2022-01-31 07:03:23,838 (trainer:653) INFO: 114epoch:train:82-108batch: iter_time=7.480e-05, forward_time=0.031, loss=1.673, loss_att=0.740, loss_ctc=2.605, acc=0.966, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.271e-04, train_time=0.091 -[v016] 2022-01-31 07:03:26,400 (trainer:653) INFO: 114epoch:train:109-135batch: iter_time=7.593e-05, forward_time=0.033, loss=1.612, loss_att=0.731, loss_ctc=2.493, acc=0.966, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.271e-04, train_time=0.095 -[v016] 2022-01-31 07:03:28,841 (trainer:653) INFO: 114epoch:train:136-162batch: iter_time=8.006e-05, forward_time=0.032, loss=1.894, loss_att=0.920, loss_ctc=2.868, acc=0.956, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.270e-04, train_time=0.090 -[v016] 2022-01-31 07:03:31,340 (trainer:653) INFO: 114epoch:train:163-189batch: iter_time=7.855e-05, forward_time=0.032, loss=1.565, loss_att=0.647, loss_ctc=2.483, acc=0.970, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.270e-04, train_time=0.092 -[v016] 2022-01-31 07:03:33,740 (trainer:653) INFO: 114epoch:train:190-216batch: iter_time=7.494e-05, forward_time=0.031, loss=1.460, loss_att=0.704, loss_ctc=2.217, acc=0.965, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.270e-04, train_time=0.089 -[v016] 2022-01-31 07:03:36,155 (trainer:653) INFO: 114epoch:train:217-243batch: iter_time=7.483e-05, forward_time=0.031, loss=1.840, loss_att=0.846, loss_ctc=2.834, acc=0.965, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.270e-04, train_time=0.089 -[v016] 2022-01-31 07:03:38,599 (trainer:653) INFO: 114epoch:train:244-270batch: iter_time=7.474e-05, forward_time=0.031, loss=1.466, loss_att=0.651, loss_ctc=2.280, acc=0.969, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.269e-04, train_time=0.090 -[v016] 2022-01-31 07:03:41,027 (trainer:653) INFO: 114epoch:train:271-297batch: iter_time=7.502e-05, forward_time=0.031, loss=1.532, loss_att=0.681, loss_ctc=2.384, acc=0.969, backward_time=0.020, optim_step_time=0.021, optim0_lr0=1.269e-04, train_time=0.090 -[v016] 2022-01-31 07:03:43,404 (trainer:653) INFO: 114epoch:train:298-324batch: iter_time=7.681e-05, forward_time=0.030, loss=1.687, loss_att=0.817, loss_ctc=2.557, acc=0.963, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.269e-04, train_time=0.088 -[v016] 2022-01-31 07:03:45,906 (trainer:653) INFO: 114epoch:train:325-351batch: iter_time=8.458e-05, forward_time=0.032, loss=1.539, loss_att=0.772, loss_ctc=2.306, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.268e-04, train_time=0.092 -[v016] 2022-01-31 07:03:48,407 (trainer:653) INFO: 114epoch:train:352-378batch: iter_time=8.090e-05, forward_time=0.033, loss=1.917, loss_att=0.778, loss_ctc=3.057, acc=0.970, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.268e-04, train_time=0.092 -[v016] 2022-01-31 07:03:50,881 (trainer:653) INFO: 114epoch:train:379-405batch: iter_time=7.852e-05, forward_time=0.032, loss=1.392, loss_att=0.664, loss_ctc=2.121, acc=0.970, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.268e-04, train_time=0.091 -[v016] 2022-01-31 07:03:53,331 (trainer:653) INFO: 114epoch:train:406-432batch: iter_time=7.468e-05, forward_time=0.032, loss=1.864, loss_att=0.805, loss_ctc=2.924, acc=0.967, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.268e-04, train_time=0.091 -[v016] 2022-01-31 07:03:55,734 (trainer:653) INFO: 114epoch:train:433-459batch: iter_time=7.436e-05, forward_time=0.031, loss=1.726, loss_att=0.832, loss_ctc=2.619, acc=0.964, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.267e-04, train_time=0.089 -[v016] 2022-01-31 07:03:58,119 (trainer:653) INFO: 114epoch:train:460-486batch: iter_time=7.420e-05, forward_time=0.031, loss=1.471, loss_att=0.697, loss_ctc=2.245, acc=0.968, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.267e-04, train_time=0.088 -[v016] 2022-01-31 07:04:00,528 (trainer:653) INFO: 114epoch:train:487-513batch: iter_time=7.606e-05, forward_time=0.031, loss=1.583, loss_att=0.824, loss_ctc=2.342, acc=0.960, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.267e-04, train_time=0.089 -[v016] 2022-01-31 07:04:03,101 (trainer:653) INFO: 114epoch:train:514-540batch: iter_time=9.025e-05, forward_time=0.031, loss=1.743, loss_att=0.819, loss_ctc=2.667, acc=0.965, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.267e-04, train_time=0.095 -[v016] 2022-01-31 07:04:36,220 (trainer:328) INFO: 114epoch results: [train] iter_time=2.814e-04, forward_time=0.032, loss=1.658, loss_att=0.758, loss_ctc=2.559, acc=0.966, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.269e-04, train_time=0.091, time=50.11 seconds, total_count=62358, gpu_max_cached_mem_GB=5.824, [valid] loss=7.210, loss_att=5.965, loss_ctc=8.454, acc=0.903, cer=0.104, wer=0.405, cer_ctc=0.150, time=5.46 seconds, total_count=20292, gpu_max_cached_mem_GB=5.824, [att_plot] time=26.93 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:04:38,309 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 07:04:38,337 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/110epoch.pth -[v016] 2022-01-31 07:04:38,337 (trainer:261) INFO: 115/200epoch started. Estimated time to finish: 2 hours, 41 minutes and 24.64 seconds -[v016] 2022-01-31 07:04:40,954 (trainer:653) INFO: 115epoch:train:1-27batch: iter_time=0.003, forward_time=0.033, loss=1.424, loss_att=0.647, loss_ctc=2.200, acc=0.968, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.266e-04, train_time=0.097 -[v016] 2022-01-31 07:04:43,554 (trainer:653) INFO: 115epoch:train:28-54batch: iter_time=0.006, forward_time=0.032, loss=1.658, loss_att=0.706, loss_ctc=2.611, acc=0.968, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.266e-04, train_time=0.096 -[v016] 2022-01-31 07:04:46,031 (trainer:653) INFO: 115epoch:train:55-81batch: iter_time=7.618e-05, forward_time=0.033, loss=1.476, loss_att=0.747, loss_ctc=2.205, acc=0.964, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.266e-04, train_time=0.092 -[v016] 2022-01-31 07:04:48,424 (trainer:653) INFO: 115epoch:train:82-108batch: iter_time=8.204e-05, forward_time=0.031, loss=1.429, loss_att=0.682, loss_ctc=2.176, acc=0.962, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.265e-04, train_time=0.088 -[v016] 2022-01-31 07:04:50,853 (trainer:653) INFO: 115epoch:train:109-135batch: iter_time=7.980e-05, forward_time=0.031, loss=1.533, loss_att=0.665, loss_ctc=2.400, acc=0.966, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.265e-04, train_time=0.090 -[v016] 2022-01-31 07:04:53,299 (trainer:653) INFO: 115epoch:train:136-162batch: iter_time=7.573e-05, forward_time=0.032, loss=1.843, loss_att=0.876, loss_ctc=2.809, acc=0.958, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.265e-04, train_time=0.090 -[v016] 2022-01-31 07:04:55,824 (trainer:653) INFO: 115epoch:train:163-189batch: iter_time=7.701e-05, forward_time=0.033, loss=1.857, loss_att=0.740, loss_ctc=2.975, acc=0.969, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.265e-04, train_time=0.093 -[v016] 2022-01-31 07:04:58,301 (trainer:653) INFO: 115epoch:train:190-216batch: iter_time=8.134e-05, forward_time=0.032, loss=1.890, loss_att=0.823, loss_ctc=2.957, acc=0.959, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.264e-04, train_time=0.092 -[v016] 2022-01-31 07:05:00,695 (trainer:653) INFO: 115epoch:train:217-243batch: iter_time=7.916e-05, forward_time=0.031, loss=1.598, loss_att=0.761, loss_ctc=2.434, acc=0.961, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.264e-04, train_time=0.088 -[v016] 2022-01-31 07:05:03,128 (trainer:653) INFO: 115epoch:train:244-270batch: iter_time=7.737e-05, forward_time=0.031, loss=1.726, loss_att=0.707, loss_ctc=2.745, acc=0.968, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.264e-04, train_time=0.090 -[v016] 2022-01-31 07:05:05,582 (trainer:653) INFO: 115epoch:train:271-297batch: iter_time=9.010e-05, forward_time=0.032, loss=1.787, loss_att=0.834, loss_ctc=2.739, acc=0.962, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.263e-04, train_time=0.091 -[v016] 2022-01-31 07:05:07,995 (trainer:653) INFO: 115epoch:train:298-324batch: iter_time=7.960e-05, forward_time=0.031, loss=1.890, loss_att=0.935, loss_ctc=2.846, acc=0.956, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.263e-04, train_time=0.089 -[v016] 2022-01-31 07:05:10,507 (trainer:653) INFO: 115epoch:train:325-351batch: iter_time=7.763e-05, forward_time=0.032, loss=1.702, loss_att=0.709, loss_ctc=2.694, acc=0.967, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.263e-04, train_time=0.093 -[v016] 2022-01-31 07:05:13,135 (trainer:653) INFO: 115epoch:train:352-378batch: iter_time=0.005, forward_time=0.032, loss=1.560, loss_att=0.698, loss_ctc=2.422, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.263e-04, train_time=0.097 -[v016] 2022-01-31 07:05:15,776 (trainer:653) INFO: 115epoch:train:379-405batch: iter_time=0.005, forward_time=0.032, loss=1.658, loss_att=0.786, loss_ctc=2.530, acc=0.960, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.262e-04, train_time=0.098 -[v016] 2022-01-31 07:05:18,291 (trainer:653) INFO: 115epoch:train:406-432batch: iter_time=7.932e-05, forward_time=0.033, loss=1.738, loss_att=0.779, loss_ctc=2.697, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.262e-04, train_time=0.093 -[v016] 2022-01-31 07:05:20,749 (trainer:653) INFO: 115epoch:train:433-459batch: iter_time=8.329e-05, forward_time=0.031, loss=1.457, loss_att=0.688, loss_ctc=2.227, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.262e-04, train_time=0.091 -[v016] 2022-01-31 07:05:23,310 (trainer:653) INFO: 115epoch:train:460-486batch: iter_time=8.264e-05, forward_time=0.033, loss=1.996, loss_att=0.892, loss_ctc=3.100, acc=0.966, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.262e-04, train_time=0.095 -[v016] 2022-01-31 07:05:25,841 (trainer:653) INFO: 115epoch:train:487-513batch: iter_time=8.213e-05, forward_time=0.032, loss=1.736, loss_att=0.757, loss_ctc=2.716, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.261e-04, train_time=0.094 -[v016] 2022-01-31 07:05:28,378 (trainer:653) INFO: 115epoch:train:514-540batch: iter_time=7.817e-05, forward_time=0.033, loss=1.764, loss_att=0.716, loss_ctc=2.812, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.261e-04, train_time=0.094 -[v016] 2022-01-31 07:06:02,283 (trainer:328) INFO: 115epoch results: [train] iter_time=9.803e-04, forward_time=0.032, loss=1.686, loss_att=0.758, loss_ctc=2.614, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.264e-04, train_time=0.092, time=50.74 seconds, total_count=62905, gpu_max_cached_mem_GB=5.824, [valid] loss=7.226, loss_att=5.918, loss_ctc=8.533, acc=0.905, cer=0.099, wer=0.396, cer_ctc=0.146, time=5.46 seconds, total_count=20470, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.74 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:06:04,849 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 07:06:04,858 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/100epoch.pth -[v016] 2022-01-31 07:06:04,858 (trainer:261) INFO: 116/200epoch started. Estimated time to finish: 2 hours, 39 minutes and 8.68 seconds -[v016] 2022-01-31 07:06:08,592 (trainer:653) INFO: 116epoch:train:1-27batch: iter_time=0.035, forward_time=0.032, loss=1.837, loss_att=0.817, loss_ctc=2.857, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.261e-04, train_time=0.132 -[v016] 2022-01-31 07:06:11,101 (trainer:653) INFO: 116epoch:train:28-54batch: iter_time=8.823e-05, forward_time=0.032, loss=1.582, loss_att=0.706, loss_ctc=2.458, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.260e-04, train_time=0.093 -[v016] 2022-01-31 07:06:13,510 (trainer:653) INFO: 116epoch:train:55-81batch: iter_time=7.877e-05, forward_time=0.030, loss=1.497, loss_att=0.748, loss_ctc=2.245, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.260e-04, train_time=0.089 -[v016] 2022-01-31 07:06:16,423 (trainer:653) INFO: 116epoch:train:82-108batch: iter_time=0.015, forward_time=0.031, loss=1.615, loss_att=0.657, loss_ctc=2.574, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.260e-04, train_time=0.108 -[v016] 2022-01-31 07:06:19,635 (trainer:653) INFO: 116epoch:train:109-135batch: iter_time=0.028, forward_time=0.031, loss=1.544, loss_att=0.615, loss_ctc=2.473, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.260e-04, train_time=0.119 -[v016] 2022-01-31 07:06:22,004 (trainer:653) INFO: 116epoch:train:136-162batch: iter_time=7.520e-05, forward_time=0.030, loss=1.696, loss_att=0.812, loss_ctc=2.580, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.259e-04, train_time=0.088 -[v016] 2022-01-31 07:06:24,491 (trainer:653) INFO: 116epoch:train:163-189batch: iter_time=7.782e-05, forward_time=0.031, loss=1.421, loss_att=0.669, loss_ctc=2.174, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.259e-04, train_time=0.092 -[v016] 2022-01-31 07:06:27,355 (trainer:653) INFO: 116epoch:train:190-216batch: iter_time=0.016, forward_time=0.031, loss=1.831, loss_att=0.825, loss_ctc=2.837, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.259e-04, train_time=0.106 -[v016] 2022-01-31 07:06:29,787 (trainer:653) INFO: 116epoch:train:217-243batch: iter_time=7.739e-05, forward_time=0.030, loss=1.519, loss_att=0.708, loss_ctc=2.330, acc=0.966, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.259e-04, train_time=0.090 -[v016] 2022-01-31 07:06:32,410 (trainer:653) INFO: 116epoch:train:244-270batch: iter_time=0.005, forward_time=0.031, loss=1.778, loss_att=0.769, loss_ctc=2.786, acc=0.967, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.258e-04, train_time=0.097 -[v016] 2022-01-31 07:06:34,909 (trainer:653) INFO: 116epoch:train:271-297batch: iter_time=0.003, forward_time=0.030, loss=1.658, loss_att=0.821, loss_ctc=2.495, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.258e-04, train_time=0.092 -[v016] 2022-01-31 07:06:37,348 (trainer:653) INFO: 116epoch:train:298-324batch: iter_time=7.959e-05, forward_time=0.030, loss=1.726, loss_att=0.773, loss_ctc=2.679, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.258e-04, train_time=0.090 -[v016] 2022-01-31 07:06:39,925 (trainer:653) INFO: 116epoch:train:325-351batch: iter_time=0.005, forward_time=0.031, loss=1.689, loss_att=0.783, loss_ctc=2.594, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.257e-04, train_time=0.095 -[v016] 2022-01-31 07:06:42,359 (trainer:653) INFO: 116epoch:train:352-378batch: iter_time=8.429e-05, forward_time=0.031, loss=1.594, loss_att=0.743, loss_ctc=2.445, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.257e-04, train_time=0.090 -[v016] 2022-01-31 07:06:44,758 (trainer:653) INFO: 116epoch:train:379-405batch: iter_time=7.600e-05, forward_time=0.030, loss=1.710, loss_att=0.762, loss_ctc=2.657, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.257e-04, train_time=0.089 -[v016] 2022-01-31 07:06:47,706 (trainer:653) INFO: 116epoch:train:406-432batch: iter_time=0.014, forward_time=0.032, loss=1.724, loss_att=0.732, loss_ctc=2.716, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.257e-04, train_time=0.109 -[v016] 2022-01-31 07:06:50,099 (trainer:653) INFO: 116epoch:train:433-459batch: iter_time=7.657e-05, forward_time=0.030, loss=1.777, loss_att=0.863, loss_ctc=2.691, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.256e-04, train_time=0.088 -[v016] 2022-01-31 07:06:53,519 (trainer:653) INFO: 116epoch:train:460-486batch: iter_time=0.033, forward_time=0.032, loss=1.714, loss_att=0.741, loss_ctc=2.688, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.256e-04, train_time=0.126 -[v016] 2022-01-31 07:06:55,952 (trainer:653) INFO: 116epoch:train:487-513batch: iter_time=7.037e-04, forward_time=0.030, loss=1.658, loss_att=0.828, loss_ctc=2.489, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.256e-04, train_time=0.090 -[v016] 2022-01-31 07:06:58,495 (trainer:653) INFO: 116epoch:train:514-540batch: iter_time=0.003, forward_time=0.031, loss=1.787, loss_att=0.815, loss_ctc=2.759, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.256e-04, train_time=0.094 -[v016] 2022-01-31 07:07:31,945 (trainer:328) INFO: 116epoch results: [train] iter_time=0.008, forward_time=0.031, loss=1.669, loss_att=0.759, loss_ctc=2.578, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.258e-04, train_time=0.099, time=54.32 seconds, total_count=63452, gpu_max_cached_mem_GB=5.824, [valid] loss=7.095, loss_att=5.936, loss_ctc=8.254, acc=0.905, cer=0.098, wer=0.392, cer_ctc=0.143, time=5.29 seconds, total_count=20648, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.44 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:07:33,994 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 07:07:34,058 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/102epoch.pth, exp/asr_train_asr_raw_en_word/113epoch.pth -[v016] 2022-01-31 07:07:34,058 (trainer:261) INFO: 117/200epoch started. Estimated time to finish: 2 hours, 36 minutes and 56.1 seconds -[v016] 2022-01-31 07:07:36,674 (trainer:653) INFO: 117epoch:train:1-27batch: iter_time=0.003, forward_time=0.031, loss=1.501, loss_att=0.667, loss_ctc=2.335, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.255e-04, train_time=0.097 -[v016] 2022-01-31 07:07:39,222 (trainer:653) INFO: 117epoch:train:28-54batch: iter_time=8.770e-05, forward_time=0.033, loss=1.618, loss_att=0.681, loss_ctc=2.555, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.255e-04, train_time=0.094 -[v016] 2022-01-31 07:07:41,697 (trainer:653) INFO: 117epoch:train:55-81batch: iter_time=8.061e-05, forward_time=0.032, loss=1.588, loss_att=0.698, loss_ctc=2.478, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.255e-04, train_time=0.091 -[v016] 2022-01-31 07:07:44,207 (trainer:653) INFO: 117epoch:train:82-108batch: iter_time=8.290e-05, forward_time=0.032, loss=1.610, loss_att=0.701, loss_ctc=2.519, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.254e-04, train_time=0.093 -[v016] 2022-01-31 07:07:46,714 (trainer:653) INFO: 117epoch:train:109-135batch: iter_time=8.460e-05, forward_time=0.032, loss=1.652, loss_att=0.780, loss_ctc=2.525, acc=0.960, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.254e-04, train_time=0.093 -[v016] 2022-01-31 07:07:49,431 (trainer:653) INFO: 117epoch:train:136-162batch: iter_time=0.008, forward_time=0.032, loss=1.454, loss_att=0.618, loss_ctc=2.290, acc=0.972, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.254e-04, train_time=0.100 -[v016] 2022-01-31 07:07:51,896 (trainer:653) INFO: 117epoch:train:163-189batch: iter_time=0.001, forward_time=0.031, loss=1.530, loss_att=0.689, loss_ctc=2.371, acc=0.969, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.254e-04, train_time=0.091 -[v016] 2022-01-31 07:07:54,348 (trainer:653) INFO: 117epoch:train:190-216batch: iter_time=7.743e-05, forward_time=0.031, loss=1.543, loss_att=0.637, loss_ctc=2.450, acc=0.971, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.253e-04, train_time=0.091 -[v016] 2022-01-31 07:07:56,831 (trainer:653) INFO: 117epoch:train:217-243batch: iter_time=7.885e-05, forward_time=0.032, loss=1.630, loss_att=0.734, loss_ctc=2.527, acc=0.963, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.253e-04, train_time=0.092 -[v016] 2022-01-31 07:07:59,270 (trainer:653) INFO: 117epoch:train:244-270batch: iter_time=8.018e-05, forward_time=0.032, loss=1.724, loss_att=0.835, loss_ctc=2.613, acc=0.963, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.253e-04, train_time=0.090 -[v016] 2022-01-31 07:08:01,784 (trainer:653) INFO: 117epoch:train:271-297batch: iter_time=8.955e-05, forward_time=0.032, loss=1.638, loss_att=0.724, loss_ctc=2.552, acc=0.966, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.253e-04, train_time=0.093 -[v016] 2022-01-31 07:08:04,161 (trainer:653) INFO: 117epoch:train:298-324batch: iter_time=7.768e-05, forward_time=0.030, loss=1.657, loss_att=0.756, loss_ctc=2.558, acc=0.965, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.252e-04, train_time=0.088 -[v016] 2022-01-31 07:08:06,604 (trainer:653) INFO: 117epoch:train:325-351batch: iter_time=8.428e-05, forward_time=0.031, loss=1.534, loss_att=0.720, loss_ctc=2.348, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.252e-04, train_time=0.090 -[v016] 2022-01-31 07:08:09,113 (trainer:653) INFO: 117epoch:train:352-378batch: iter_time=8.762e-05, forward_time=0.032, loss=1.697, loss_att=0.718, loss_ctc=2.676, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.252e-04, train_time=0.093 -[v016] 2022-01-31 07:08:11,597 (trainer:653) INFO: 117epoch:train:379-405batch: iter_time=8.863e-05, forward_time=0.032, loss=1.623, loss_att=0.751, loss_ctc=2.496, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.252e-04, train_time=0.092 -[v016] 2022-01-31 07:08:14,104 (trainer:653) INFO: 117epoch:train:406-432batch: iter_time=8.463e-05, forward_time=0.033, loss=1.854, loss_att=0.825, loss_ctc=2.883, acc=0.963, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.251e-04, train_time=0.093 -[v016] 2022-01-31 07:08:16,624 (trainer:653) INFO: 117epoch:train:433-459batch: iter_time=8.196e-05, forward_time=0.033, loss=1.679, loss_att=0.777, loss_ctc=2.582, acc=0.968, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.251e-04, train_time=0.093 -[v016] 2022-01-31 07:08:19,073 (trainer:653) INFO: 117epoch:train:460-486batch: iter_time=8.482e-05, forward_time=0.032, loss=1.555, loss_att=0.754, loss_ctc=2.355, acc=0.966, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.251e-04, train_time=0.091 -[v016] 2022-01-31 07:08:22,175 (trainer:653) INFO: 117epoch:train:487-513batch: iter_time=0.026, forward_time=0.031, loss=1.608, loss_att=0.817, loss_ctc=2.400, acc=0.964, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.250e-04, train_time=0.115 -[v016] 2022-01-31 07:08:24,595 (trainer:653) INFO: 117epoch:train:514-540batch: iter_time=7.735e-05, forward_time=0.031, loss=1.562, loss_att=0.663, loss_ctc=2.461, acc=0.967, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.250e-04, train_time=0.089 -[v016] 2022-01-31 07:08:57,989 (trainer:328) INFO: 117epoch results: [train] iter_time=0.002, forward_time=0.032, loss=1.614, loss_att=0.726, loss_ctc=2.502, acc=0.967, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.253e-04, train_time=0.093, time=51.23 seconds, total_count=63999, gpu_max_cached_mem_GB=5.824, [valid] loss=7.283, loss_att=5.968, loss_ctc=8.598, acc=0.901, cer=0.100, wer=0.405, cer_ctc=0.147, time=5.35 seconds, total_count=20826, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.34 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:08:59,945 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 07:08:59,974 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/109epoch.pth -[v016] 2022-01-31 07:08:59,974 (trainer:261) INFO: 118/200epoch started. Estimated time to finish: 2 hours, 34 minutes and 41.6 seconds -[v016] 2022-01-31 07:09:02,493 (trainer:653) INFO: 118epoch:train:1-27batch: iter_time=0.003, forward_time=0.031, loss=1.249, loss_att=0.681, loss_ctc=1.816, acc=0.962, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.250e-04, train_time=0.093 -[v016] 2022-01-31 07:09:05,020 (trainer:653) INFO: 118epoch:train:28-54batch: iter_time=9.095e-05, forward_time=0.032, loss=1.691, loss_att=0.722, loss_ctc=2.661, acc=0.967, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.250e-04, train_time=0.093 -[v016] 2022-01-31 07:09:07,496 (trainer:653) INFO: 118epoch:train:55-81batch: iter_time=8.364e-05, forward_time=0.032, loss=1.622, loss_att=0.745, loss_ctc=2.499, acc=0.964, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.249e-04, train_time=0.091 -[v016] 2022-01-31 07:09:09,984 (trainer:653) INFO: 118epoch:train:82-108batch: iter_time=7.681e-05, forward_time=0.032, loss=1.516, loss_att=0.629, loss_ctc=2.403, acc=0.972, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.249e-04, train_time=0.092 -[v016] 2022-01-31 07:09:12,394 (trainer:653) INFO: 118epoch:train:109-135batch: iter_time=7.513e-05, forward_time=0.031, loss=1.491, loss_att=0.691, loss_ctc=2.291, acc=0.966, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.249e-04, train_time=0.089 -[v016] 2022-01-31 07:09:14,833 (trainer:653) INFO: 118epoch:train:136-162batch: iter_time=7.893e-05, forward_time=0.031, loss=1.810, loss_att=0.778, loss_ctc=2.841, acc=0.966, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.249e-04, train_time=0.090 -[v016] 2022-01-31 07:09:17,275 (trainer:653) INFO: 118epoch:train:163-189batch: iter_time=7.640e-05, forward_time=0.031, loss=1.482, loss_att=0.635, loss_ctc=2.330, acc=0.971, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.248e-04, train_time=0.090 -[v016] 2022-01-31 07:09:19,774 (trainer:653) INFO: 118epoch:train:190-216batch: iter_time=7.644e-05, forward_time=0.032, loss=1.724, loss_att=0.719, loss_ctc=2.730, acc=0.965, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.248e-04, train_time=0.092 -[v016] 2022-01-31 07:09:22,249 (trainer:653) INFO: 118epoch:train:217-243batch: iter_time=8.139e-05, forward_time=0.032, loss=1.674, loss_att=0.718, loss_ctc=2.631, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.248e-04, train_time=0.091 -[v016] 2022-01-31 07:09:25,012 (trainer:653) INFO: 118epoch:train:244-270batch: iter_time=0.010, forward_time=0.032, loss=1.725, loss_att=0.733, loss_ctc=2.716, acc=0.969, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.247e-04, train_time=0.102 -[v016] 2022-01-31 07:09:27,460 (trainer:653) INFO: 118epoch:train:271-297batch: iter_time=7.638e-05, forward_time=0.031, loss=1.683, loss_att=0.750, loss_ctc=2.615, acc=0.961, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.247e-04, train_time=0.090 -[v016] 2022-01-31 07:09:29,923 (trainer:653) INFO: 118epoch:train:298-324batch: iter_time=7.598e-05, forward_time=0.031, loss=1.625, loss_att=0.729, loss_ctc=2.521, acc=0.968, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.247e-04, train_time=0.091 -[v016] 2022-01-31 07:09:32,292 (trainer:653) INFO: 118epoch:train:325-351batch: iter_time=7.452e-05, forward_time=0.030, loss=1.722, loss_att=0.849, loss_ctc=2.595, acc=0.959, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.247e-04, train_time=0.088 -[v016] 2022-01-31 07:09:34,669 (trainer:653) INFO: 118epoch:train:352-378batch: iter_time=7.404e-05, forward_time=0.030, loss=1.388, loss_att=0.656, loss_ctc=2.120, acc=0.967, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.246e-04, train_time=0.088 -[v016] 2022-01-31 07:09:37,067 (trainer:653) INFO: 118epoch:train:379-405batch: iter_time=8.740e-05, forward_time=0.031, loss=1.618, loss_att=0.803, loss_ctc=2.432, acc=0.959, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.246e-04, train_time=0.089 -[v016] 2022-01-31 07:09:39,616 (trainer:653) INFO: 118epoch:train:406-432batch: iter_time=8.176e-05, forward_time=0.033, loss=1.726, loss_att=0.755, loss_ctc=2.698, acc=0.966, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.246e-04, train_time=0.094 -[v016] 2022-01-31 07:09:42,063 (trainer:653) INFO: 118epoch:train:433-459batch: iter_time=7.528e-05, forward_time=0.031, loss=1.561, loss_att=0.707, loss_ctc=2.416, acc=0.966, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.246e-04, train_time=0.090 -[v016] 2022-01-31 07:09:44,441 (trainer:653) INFO: 118epoch:train:460-486batch: iter_time=7.610e-05, forward_time=0.030, loss=1.451, loss_att=0.714, loss_ctc=2.189, acc=0.964, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.245e-04, train_time=0.088 -[v016] 2022-01-31 07:09:46,797 (trainer:653) INFO: 118epoch:train:487-513batch: iter_time=7.372e-05, forward_time=0.030, loss=1.505, loss_att=0.788, loss_ctc=2.221, acc=0.963, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.245e-04, train_time=0.087 -[v016] 2022-01-31 07:09:49,148 (trainer:653) INFO: 118epoch:train:514-540batch: iter_time=7.401e-05, forward_time=0.030, loss=1.336, loss_att=0.729, loss_ctc=1.943, acc=0.965, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.245e-04, train_time=0.087 -[v016] 2022-01-31 07:10:22,773 (trainer:328) INFO: 118epoch results: [train] iter_time=7.359e-04, forward_time=0.031, loss=1.585, loss_att=0.729, loss_ctc=2.441, acc=0.966, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.247e-04, train_time=0.091, time=49.92 seconds, total_count=64546, gpu_max_cached_mem_GB=5.824, [valid] loss=7.108, loss_att=5.834, loss_ctc=8.382, acc=0.903, cer=0.102, wer=0.407, cer_ctc=0.148, time=6.25 seconds, total_count=21004, gpu_max_cached_mem_GB=5.824, [att_plot] time=26.63 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:10:24,857 (trainer:375) INFO: The best model has been updated: train.loss -[v016] 2022-01-31 07:10:24,885 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/112epoch.pth -[v016] 2022-01-31 07:10:24,885 (trainer:261) INFO: 119/200epoch started. Estimated time to finish: 2 hours, 32 minutes and 27.26 seconds -[v016] 2022-01-31 07:10:27,728 (trainer:653) INFO: 119epoch:train:1-27batch: iter_time=0.011, forward_time=0.033, loss=1.636, loss_att=0.761, loss_ctc=2.510, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.245e-04, train_time=0.105 -[v016] 2022-01-31 07:10:30,145 (trainer:653) INFO: 119epoch:train:28-54batch: iter_time=7.837e-05, forward_time=0.031, loss=1.453, loss_att=0.646, loss_ctc=2.261, acc=0.966, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.244e-04, train_time=0.089 -[v016] 2022-01-31 07:10:32,528 (trainer:653) INFO: 119epoch:train:55-81batch: iter_time=7.497e-05, forward_time=0.031, loss=1.494, loss_att=0.699, loss_ctc=2.288, acc=0.969, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.244e-04, train_time=0.088 -[v016] 2022-01-31 07:10:34,901 (trainer:653) INFO: 119epoch:train:82-108batch: iter_time=7.583e-05, forward_time=0.030, loss=1.313, loss_att=0.600, loss_ctc=2.025, acc=0.970, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.244e-04, train_time=0.088 -[v016] 2022-01-31 07:10:37,302 (trainer:653) INFO: 119epoch:train:109-135batch: iter_time=7.562e-05, forward_time=0.031, loss=1.422, loss_att=0.693, loss_ctc=2.151, acc=0.967, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.244e-04, train_time=0.089 -[v016] 2022-01-31 07:10:39,739 (trainer:653) INFO: 119epoch:train:136-162batch: iter_time=7.791e-05, forward_time=0.032, loss=1.594, loss_att=0.704, loss_ctc=2.485, acc=0.972, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.243e-04, train_time=0.090 -[v016] 2022-01-31 07:10:42,409 (trainer:653) INFO: 119epoch:train:163-189batch: iter_time=1.041e-04, forward_time=0.034, loss=1.828, loss_att=0.758, loss_ctc=2.898, acc=0.967, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.243e-04, train_time=0.099 -[v016] 2022-01-31 07:10:45,256 (trainer:653) INFO: 119epoch:train:190-216batch: iter_time=0.005, forward_time=0.034, loss=1.648, loss_att=0.757, loss_ctc=2.539, acc=0.966, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.243e-04, train_time=0.105 -[v016] 2022-01-31 07:10:47,934 (trainer:653) INFO: 119epoch:train:217-243batch: iter_time=9.588e-05, forward_time=0.034, loss=1.752, loss_att=0.733, loss_ctc=2.772, acc=0.968, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.242e-04, train_time=0.099 -[v016] 2022-01-31 07:10:50,492 (trainer:653) INFO: 119epoch:train:244-270batch: iter_time=1.010e-04, forward_time=0.033, loss=1.598, loss_att=0.782, loss_ctc=2.415, acc=0.962, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.242e-04, train_time=0.095 -[v016] 2022-01-31 07:10:53,088 (trainer:653) INFO: 119epoch:train:271-297batch: iter_time=1.022e-04, forward_time=0.034, loss=1.677, loss_att=0.692, loss_ctc=2.662, acc=0.972, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.242e-04, train_time=0.096 -[v016] 2022-01-31 07:10:55,636 (trainer:653) INFO: 119epoch:train:298-324batch: iter_time=1.267e-04, forward_time=0.033, loss=1.473, loss_att=0.722, loss_ctc=2.223, acc=0.964, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.242e-04, train_time=0.094 -[v016] 2022-01-31 07:10:58,241 (trainer:653) INFO: 119epoch:train:325-351batch: iter_time=0.002, forward_time=0.033, loss=1.433, loss_att=0.653, loss_ctc=2.214, acc=0.968, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.241e-04, train_time=0.096 -[v016] 2022-01-31 07:11:00,807 (trainer:653) INFO: 119epoch:train:352-378batch: iter_time=1.206e-04, forward_time=0.033, loss=1.565, loss_att=0.728, loss_ctc=2.401, acc=0.964, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.241e-04, train_time=0.095 -[v016] 2022-01-31 07:11:03,348 (trainer:653) INFO: 119epoch:train:379-405batch: iter_time=1.275e-04, forward_time=0.033, loss=1.502, loss_att=0.736, loss_ctc=2.268, acc=0.966, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.241e-04, train_time=0.094 -[v016] 2022-01-31 07:11:05,964 (trainer:653) INFO: 119epoch:train:406-432batch: iter_time=1.338e-04, forward_time=0.034, loss=1.420, loss_att=0.683, loss_ctc=2.157, acc=0.968, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.241e-04, train_time=0.097 -[v016] 2022-01-31 07:11:08,605 (trainer:653) INFO: 119epoch:train:433-459batch: iter_time=1.232e-04, forward_time=0.034, loss=1.521, loss_att=0.661, loss_ctc=2.381, acc=0.971, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.240e-04, train_time=0.098 -[v016] 2022-01-31 07:11:11,073 (trainer:653) INFO: 119epoch:train:460-486batch: iter_time=9.761e-05, forward_time=0.032, loss=1.508, loss_att=0.664, loss_ctc=2.352, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.240e-04, train_time=0.091 -[v016] 2022-01-31 07:11:13,556 (trainer:653) INFO: 119epoch:train:487-513batch: iter_time=8.583e-05, forward_time=0.032, loss=1.467, loss_att=0.697, loss_ctc=2.237, acc=0.969, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.240e-04, train_time=0.092 -[v016] 2022-01-31 07:11:16,060 (trainer:653) INFO: 119epoch:train:514-540batch: iter_time=9.220e-05, forward_time=0.032, loss=1.772, loss_att=0.839, loss_ctc=2.706, acc=0.964, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.240e-04, train_time=0.093 -[v016] 2022-01-31 07:11:51,450 (trainer:328) INFO: 119epoch results: [train] iter_time=9.675e-04, forward_time=0.033, loss=1.555, loss_att=0.712, loss_ctc=2.398, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.242e-04, train_time=0.095, time=51.91 seconds, total_count=65093, gpu_max_cached_mem_GB=5.824, [valid] loss=7.248, loss_att=5.902, loss_ctc=8.593, acc=0.905, cer=0.100, wer=0.395, cer_ctc=0.146, time=5.74 seconds, total_count=21182, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.91 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:11:53,567 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 07:11:53,598 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/96epoch.pth, exp/asr_train_asr_raw_en_word/111epoch.pth -[v016] 2022-01-31 07:11:53,598 (trainer:261) INFO: 120/200epoch started. Estimated time to finish: 2 hours, 30 minutes and 17.02 seconds -[v016] 2022-01-31 07:11:56,192 (trainer:653) INFO: 120epoch:train:1-27batch: iter_time=0.003, forward_time=0.033, loss=1.695, loss_att=0.722, loss_ctc=2.668, acc=0.966, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.239e-04, train_time=0.096 -[v016] 2022-01-31 07:11:58,573 (trainer:653) INFO: 120epoch:train:28-54batch: iter_time=7.851e-05, forward_time=0.031, loss=1.535, loss_att=0.711, loss_ctc=2.360, acc=0.965, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.239e-04, train_time=0.088 -[v016] 2022-01-31 07:12:01,351 (trainer:653) INFO: 120epoch:train:55-81batch: iter_time=0.013, forward_time=0.031, loss=1.494, loss_att=0.655, loss_ctc=2.333, acc=0.965, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.239e-04, train_time=0.103 -[v016] 2022-01-31 07:12:03,777 (trainer:653) INFO: 120epoch:train:82-108batch: iter_time=7.500e-05, forward_time=0.032, loss=1.279, loss_att=0.624, loss_ctc=1.934, acc=0.970, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.239e-04, train_time=0.090 -[v016] 2022-01-31 07:12:06,196 (trainer:653) INFO: 120epoch:train:109-135batch: iter_time=7.455e-05, forward_time=0.031, loss=1.636, loss_att=0.787, loss_ctc=2.486, acc=0.958, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.238e-04, train_time=0.089 -[v016] 2022-01-31 07:12:08,633 (trainer:653) INFO: 120epoch:train:136-162batch: iter_time=8.194e-05, forward_time=0.032, loss=1.269, loss_att=0.614, loss_ctc=1.924, acc=0.969, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.238e-04, train_time=0.090 -[v016] 2022-01-31 07:12:11,141 (trainer:653) INFO: 120epoch:train:163-189batch: iter_time=7.779e-05, forward_time=0.032, loss=1.432, loss_att=0.630, loss_ctc=2.233, acc=0.972, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.238e-04, train_time=0.093 -[v016] 2022-01-31 07:12:13,633 (trainer:653) INFO: 120epoch:train:190-216batch: iter_time=7.508e-05, forward_time=0.032, loss=1.645, loss_att=0.656, loss_ctc=2.634, acc=0.973, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.238e-04, train_time=0.092 -[v016] 2022-01-31 07:12:16,196 (trainer:653) INFO: 120epoch:train:217-243batch: iter_time=7.861e-05, forward_time=0.033, loss=1.469, loss_att=0.585, loss_ctc=2.354, acc=0.974, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.237e-04, train_time=0.095 -[v016] 2022-01-31 07:12:18,628 (trainer:653) INFO: 120epoch:train:244-270batch: iter_time=7.534e-05, forward_time=0.031, loss=1.422, loss_att=0.572, loss_ctc=2.271, acc=0.974, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.237e-04, train_time=0.090 -[v016] 2022-01-31 07:12:21,172 (trainer:653) INFO: 120epoch:train:271-297batch: iter_time=7.759e-05, forward_time=0.033, loss=1.610, loss_att=0.667, loss_ctc=2.553, acc=0.972, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.237e-04, train_time=0.094 -[v016] 2022-01-31 07:12:23,644 (trainer:653) INFO: 120epoch:train:298-324batch: iter_time=8.659e-05, forward_time=0.033, loss=1.834, loss_att=0.846, loss_ctc=2.821, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.237e-04, train_time=0.091 -[v016] 2022-01-31 07:12:26,190 (trainer:653) INFO: 120epoch:train:325-351batch: iter_time=8.194e-05, forward_time=0.033, loss=1.733, loss_att=0.727, loss_ctc=2.738, acc=0.965, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.236e-04, train_time=0.094 -[v016] 2022-01-31 07:12:28,655 (trainer:653) INFO: 120epoch:train:352-378batch: iter_time=8.578e-05, forward_time=0.032, loss=1.415, loss_att=0.641, loss_ctc=2.188, acc=0.971, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.236e-04, train_time=0.091 -[v016] 2022-01-31 07:12:31,394 (trainer:653) INFO: 120epoch:train:379-405batch: iter_time=0.011, forward_time=0.032, loss=1.580, loss_att=0.823, loss_ctc=2.337, acc=0.953, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.236e-04, train_time=0.101 -[v016] 2022-01-31 07:12:33,840 (trainer:653) INFO: 120epoch:train:406-432batch: iter_time=8.195e-05, forward_time=0.032, loss=1.494, loss_att=0.724, loss_ctc=2.265, acc=0.969, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.235e-04, train_time=0.090 -[v016] 2022-01-31 07:12:36,266 (trainer:653) INFO: 120epoch:train:433-459batch: iter_time=7.666e-05, forward_time=0.032, loss=1.486, loss_att=0.658, loss_ctc=2.313, acc=0.971, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.235e-04, train_time=0.090 -[v016] 2022-01-31 07:12:38,742 (trainer:653) INFO: 120epoch:train:460-486batch: iter_time=8.493e-05, forward_time=0.032, loss=1.643, loss_att=0.761, loss_ctc=2.524, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.235e-04, train_time=0.091 -[v016] 2022-01-31 07:12:41,255 (trainer:653) INFO: 120epoch:train:487-513batch: iter_time=8.401e-05, forward_time=0.033, loss=1.767, loss_att=0.771, loss_ctc=2.762, acc=0.958, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.235e-04, train_time=0.093 -[v016] 2022-01-31 07:12:43,678 (trainer:653) INFO: 120epoch:train:514-540batch: iter_time=7.819e-05, forward_time=0.032, loss=1.691, loss_att=0.720, loss_ctc=2.662, acc=0.966, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.234e-04, train_time=0.090 -[v016] 2022-01-31 07:13:16,968 (trainer:328) INFO: 120epoch results: [train] iter_time=0.001, forward_time=0.032, loss=1.559, loss_att=0.696, loss_ctc=2.423, acc=0.967, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.237e-04, train_time=0.093, time=50.82 seconds, total_count=65640, gpu_max_cached_mem_GB=5.824, [valid] loss=7.289, loss_att=5.934, loss_ctc=8.645, acc=0.903, cer=0.102, wer=0.396, cer_ctc=0.152, time=5.44 seconds, total_count=21360, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.12 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:13:18,908 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 07:13:18,916 (trainer:261) INFO: 121/200epoch started. Estimated time to finish: 2 hours, 28 minutes and 4.89 seconds -[v016] 2022-01-31 07:13:21,463 (trainer:653) INFO: 121epoch:train:1-27batch: iter_time=0.004, forward_time=0.031, loss=1.812, loss_att=0.816, loss_ctc=2.808, acc=0.961, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.234e-04, train_time=0.094 -[v016] 2022-01-31 07:13:23,899 (trainer:653) INFO: 121epoch:train:28-54batch: iter_time=8.139e-05, forward_time=0.031, loss=1.640, loss_att=0.697, loss_ctc=2.583, acc=0.966, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.234e-04, train_time=0.090 -[v016] 2022-01-31 07:13:26,293 (trainer:653) INFO: 121epoch:train:55-81batch: iter_time=7.591e-05, forward_time=0.031, loss=1.436, loss_att=0.663, loss_ctc=2.208, acc=0.971, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.234e-04, train_time=0.088 -[v016] 2022-01-31 07:13:28,749 (trainer:653) INFO: 121epoch:train:82-108batch: iter_time=8.082e-05, forward_time=0.032, loss=1.469, loss_att=0.630, loss_ctc=2.308, acc=0.972, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.233e-04, train_time=0.091 -[v016] 2022-01-31 07:13:31,116 (trainer:653) INFO: 121epoch:train:109-135batch: iter_time=7.307e-05, forward_time=0.030, loss=1.409, loss_att=0.688, loss_ctc=2.130, acc=0.965, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.233e-04, train_time=0.087 -[v016] 2022-01-31 07:13:33,679 (trainer:653) INFO: 121epoch:train:136-162batch: iter_time=0.006, forward_time=0.030, loss=1.613, loss_att=0.703, loss_ctc=2.523, acc=0.967, backward_time=0.020, optim_step_time=0.021, optim0_lr0=1.233e-04, train_time=0.095 -[v016] 2022-01-31 07:13:36,049 (trainer:653) INFO: 121epoch:train:163-189batch: iter_time=8.001e-05, forward_time=0.031, loss=1.407, loss_att=0.653, loss_ctc=2.160, acc=0.968, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.233e-04, train_time=0.088 -[v016] 2022-01-31 07:13:38,431 (trainer:653) INFO: 121epoch:train:190-216batch: iter_time=7.555e-05, forward_time=0.031, loss=1.484, loss_att=0.678, loss_ctc=2.291, acc=0.961, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.232e-04, train_time=0.088 -[v016] 2022-01-31 07:13:40,911 (trainer:653) INFO: 121epoch:train:217-243batch: iter_time=7.647e-05, forward_time=0.032, loss=1.531, loss_att=0.693, loss_ctc=2.370, acc=0.967, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.232e-04, train_time=0.092 -[v016] 2022-01-31 07:13:43,434 (trainer:653) INFO: 121epoch:train:244-270batch: iter_time=8.440e-05, forward_time=0.033, loss=1.637, loss_att=0.624, loss_ctc=2.650, acc=0.976, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.232e-04, train_time=0.093 -[v016] 2022-01-31 07:13:45,833 (trainer:653) INFO: 121epoch:train:271-297batch: iter_time=7.786e-05, forward_time=0.031, loss=1.444, loss_att=0.706, loss_ctc=2.183, acc=0.965, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.232e-04, train_time=0.089 -[v016] 2022-01-31 07:13:48,236 (trainer:653) INFO: 121epoch:train:298-324batch: iter_time=7.578e-05, forward_time=0.031, loss=1.413, loss_att=0.672, loss_ctc=2.154, acc=0.969, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.231e-04, train_time=0.089 -[v016] 2022-01-31 07:13:50,712 (trainer:653) INFO: 121epoch:train:325-351batch: iter_time=7.576e-05, forward_time=0.032, loss=1.602, loss_att=0.741, loss_ctc=2.464, acc=0.962, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.231e-04, train_time=0.092 -[v016] 2022-01-31 07:13:53,154 (trainer:653) INFO: 121epoch:train:352-378batch: iter_time=7.593e-05, forward_time=0.032, loss=1.679, loss_att=0.735, loss_ctc=2.624, acc=0.965, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.231e-04, train_time=0.090 -[v016] 2022-01-31 07:13:55,505 (trainer:653) INFO: 121epoch:train:379-405batch: iter_time=7.420e-05, forward_time=0.030, loss=1.471, loss_att=0.695, loss_ctc=2.248, acc=0.962, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.231e-04, train_time=0.087 -[v016] 2022-01-31 07:13:57,984 (trainer:653) INFO: 121epoch:train:406-432batch: iter_time=7.657e-05, forward_time=0.032, loss=1.731, loss_att=0.694, loss_ctc=2.768, acc=0.970, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.230e-04, train_time=0.092 -[v016] 2022-01-31 07:14:00,439 (trainer:653) INFO: 121epoch:train:433-459batch: iter_time=8.201e-05, forward_time=0.032, loss=1.558, loss_att=0.746, loss_ctc=2.370, acc=0.963, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.230e-04, train_time=0.091 -[v016] 2022-01-31 07:14:02,905 (trainer:653) INFO: 121epoch:train:460-486batch: iter_time=7.684e-05, forward_time=0.032, loss=1.901, loss_att=0.779, loss_ctc=3.023, acc=0.969, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.230e-04, train_time=0.091 -[v016] 2022-01-31 07:14:05,811 (trainer:653) INFO: 121epoch:train:487-513batch: iter_time=0.014, forward_time=0.033, loss=1.655, loss_att=0.744, loss_ctc=2.566, acc=0.971, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.230e-04, train_time=0.107 -[v016] 2022-01-31 07:14:08,374 (trainer:653) INFO: 121epoch:train:514-540batch: iter_time=7.713e-05, forward_time=0.033, loss=1.763, loss_att=0.703, loss_ctc=2.823, acc=0.971, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.229e-04, train_time=0.095 -[v016] 2022-01-31 07:14:41,440 (trainer:328) INFO: 121epoch results: [train] iter_time=0.001, forward_time=0.031, loss=1.579, loss_att=0.704, loss_ctc=2.455, acc=0.967, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.232e-04, train_time=0.091, time=50.14 seconds, total_count=66187, gpu_max_cached_mem_GB=5.824, [valid] loss=7.167, loss_att=5.912, loss_ctc=8.422, acc=0.905, cer=0.100, wer=0.400, cer_ctc=0.144, time=5.41 seconds, total_count=21538, gpu_max_cached_mem_GB=5.824, [att_plot] time=26.98 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:14:43,392 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 07:14:43,400 (trainer:261) INFO: 122/200epoch started. Estimated time to finish: 2 hours, 25 minutes and 53.04 seconds -[v016] 2022-01-31 07:14:45,983 (trainer:653) INFO: 122epoch:train:1-27batch: iter_time=0.003, forward_time=0.032, loss=1.536, loss_att=0.646, loss_ctc=2.426, acc=0.975, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.229e-04, train_time=0.095 -[v016] 2022-01-31 07:14:48,470 (trainer:653) INFO: 122epoch:train:28-54batch: iter_time=8.612e-05, forward_time=0.032, loss=1.485, loss_att=0.620, loss_ctc=2.351, acc=0.969, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.229e-04, train_time=0.092 -[v016] 2022-01-31 07:14:50,811 (trainer:653) INFO: 122epoch:train:55-81batch: iter_time=7.438e-05, forward_time=0.030, loss=1.236, loss_att=0.642, loss_ctc=1.830, acc=0.967, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.229e-04, train_time=0.087 -[v016] 2022-01-31 07:14:53,313 (trainer:653) INFO: 122epoch:train:82-108batch: iter_time=7.432e-05, forward_time=0.032, loss=1.664, loss_att=0.697, loss_ctc=2.632, acc=0.969, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.228e-04, train_time=0.092 -[v016] 2022-01-31 07:14:55,702 (trainer:653) INFO: 122epoch:train:109-135batch: iter_time=7.414e-05, forward_time=0.031, loss=1.370, loss_att=0.634, loss_ctc=2.106, acc=0.967, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.228e-04, train_time=0.088 -[v016] 2022-01-31 07:14:58,162 (trainer:653) INFO: 122epoch:train:136-162batch: iter_time=7.401e-05, forward_time=0.032, loss=1.730, loss_att=0.754, loss_ctc=2.707, acc=0.967, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.228e-04, train_time=0.091 -[v016] 2022-01-31 07:15:00,659 (trainer:653) INFO: 122epoch:train:163-189batch: iter_time=7.493e-05, forward_time=0.032, loss=1.700, loss_att=0.711, loss_ctc=2.690, acc=0.967, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.228e-04, train_time=0.092 -[v016] 2022-01-31 07:15:03,110 (trainer:653) INFO: 122epoch:train:190-216batch: iter_time=7.723e-05, forward_time=0.032, loss=1.344, loss_att=0.649, loss_ctc=2.040, acc=0.966, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.227e-04, train_time=0.091 -[v016] 2022-01-31 07:15:05,565 (trainer:653) INFO: 122epoch:train:217-243batch: iter_time=7.567e-05, forward_time=0.032, loss=1.547, loss_att=0.692, loss_ctc=2.402, acc=0.969, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.227e-04, train_time=0.091 -[v016] 2022-01-31 07:15:08,303 (trainer:653) INFO: 122epoch:train:244-270batch: iter_time=0.013, forward_time=0.030, loss=1.446, loss_att=0.685, loss_ctc=2.207, acc=0.968, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.227e-04, train_time=0.101 -[v016] 2022-01-31 07:15:10,687 (trainer:653) INFO: 122epoch:train:271-297batch: iter_time=7.479e-05, forward_time=0.030, loss=1.576, loss_att=0.724, loss_ctc=2.429, acc=0.963, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.227e-04, train_time=0.088 -[v016] 2022-01-31 07:15:13,122 (trainer:653) INFO: 122epoch:train:298-324batch: iter_time=7.382e-05, forward_time=0.031, loss=1.599, loss_att=0.766, loss_ctc=2.431, acc=0.964, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.226e-04, train_time=0.090 -[v016] 2022-01-31 07:15:15,578 (trainer:653) INFO: 122epoch:train:325-351batch: iter_time=7.371e-05, forward_time=0.032, loss=1.618, loss_att=0.777, loss_ctc=2.459, acc=0.964, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.226e-04, train_time=0.091 -[v016] 2022-01-31 07:15:18,011 (trainer:653) INFO: 122epoch:train:352-378batch: iter_time=7.920e-05, forward_time=0.031, loss=1.382, loss_att=0.595, loss_ctc=2.169, acc=0.971, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.226e-04, train_time=0.090 -[v016] 2022-01-31 07:15:20,463 (trainer:653) INFO: 122epoch:train:379-405batch: iter_time=8.263e-05, forward_time=0.031, loss=1.459, loss_att=0.662, loss_ctc=2.255, acc=0.967, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.226e-04, train_time=0.091 -[v016] 2022-01-31 07:15:22,924 (trainer:653) INFO: 122epoch:train:406-432batch: iter_time=7.530e-05, forward_time=0.032, loss=1.388, loss_att=0.634, loss_ctc=2.142, acc=0.969, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.225e-04, train_time=0.091 -[v016] 2022-01-31 07:15:25,375 (trainer:653) INFO: 122epoch:train:433-459batch: iter_time=7.460e-05, forward_time=0.032, loss=1.751, loss_att=0.846, loss_ctc=2.656, acc=0.962, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.225e-04, train_time=0.091 -[v016] 2022-01-31 07:15:27,839 (trainer:653) INFO: 122epoch:train:460-486batch: iter_time=7.555e-05, forward_time=0.032, loss=1.586, loss_att=0.720, loss_ctc=2.452, acc=0.968, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.225e-04, train_time=0.091 -[v016] 2022-01-31 07:15:30,233 (trainer:653) INFO: 122epoch:train:487-513batch: iter_time=7.663e-05, forward_time=0.031, loss=1.392, loss_att=0.703, loss_ctc=2.080, acc=0.967, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.225e-04, train_time=0.088 -[v016] 2022-01-31 07:15:32,731 (trainer:653) INFO: 122epoch:train:514-540batch: iter_time=7.730e-05, forward_time=0.032, loss=1.655, loss_att=0.679, loss_ctc=2.632, acc=0.970, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.224e-04, train_time=0.092 -[v016] 2022-01-31 07:16:06,088 (trainer:328) INFO: 122epoch results: [train] iter_time=8.965e-04, forward_time=0.031, loss=1.516, loss_att=0.689, loss_ctc=2.342, acc=0.968, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.227e-04, train_time=0.091, time=49.99 seconds, total_count=66734, gpu_max_cached_mem_GB=5.824, [valid] loss=7.173, loss_att=5.917, loss_ctc=8.429, acc=0.904, cer=0.101, wer=0.400, cer_ctc=0.146, time=6.15 seconds, total_count=21716, gpu_max_cached_mem_GB=5.824, [att_plot] time=26.55 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:16:08,298 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 07:16:08,332 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/114epoch.pth -[v016] 2022-01-31 07:16:08,333 (trainer:261) INFO: 123/200epoch started. Estimated time to finish: 2 hours, 23 minutes and 42.47 seconds -[v016] 2022-01-31 07:16:11,002 (trainer:653) INFO: 123epoch:train:1-27batch: iter_time=0.003, forward_time=0.033, loss=1.698, loss_att=0.732, loss_ctc=2.665, acc=0.968, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.224e-04, train_time=0.099 -[v016] 2022-01-31 07:16:13,474 (trainer:653) INFO: 123epoch:train:28-54batch: iter_time=7.987e-05, forward_time=0.032, loss=1.408, loss_att=0.615, loss_ctc=2.202, acc=0.971, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.224e-04, train_time=0.091 -[v016] 2022-01-31 07:16:15,908 (trainer:653) INFO: 123epoch:train:55-81batch: iter_time=7.698e-05, forward_time=0.031, loss=1.571, loss_att=0.749, loss_ctc=2.394, acc=0.961, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.223e-04, train_time=0.090 -[v016] 2022-01-31 07:16:18,311 (trainer:653) INFO: 123epoch:train:82-108batch: iter_time=7.496e-05, forward_time=0.031, loss=1.456, loss_att=0.705, loss_ctc=2.208, acc=0.966, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.223e-04, train_time=0.089 -[v016] 2022-01-31 07:16:20,705 (trainer:653) INFO: 123epoch:train:109-135batch: iter_time=7.454e-05, forward_time=0.031, loss=1.202, loss_att=0.559, loss_ctc=1.846, acc=0.974, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.223e-04, train_time=0.088 -[v016] 2022-01-31 07:16:23,227 (trainer:653) INFO: 123epoch:train:136-162batch: iter_time=7.939e-05, forward_time=0.033, loss=1.595, loss_att=0.616, loss_ctc=2.575, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.223e-04, train_time=0.093 -[v016] 2022-01-31 07:16:25,675 (trainer:653) INFO: 123epoch:train:163-189batch: iter_time=8.000e-05, forward_time=0.031, loss=1.379, loss_att=0.640, loss_ctc=2.118, acc=0.971, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.223e-04, train_time=0.090 -[v016] 2022-01-31 07:16:28,053 (trainer:653) INFO: 123epoch:train:190-216batch: iter_time=7.382e-05, forward_time=0.030, loss=1.618, loss_att=0.773, loss_ctc=2.464, acc=0.965, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.222e-04, train_time=0.088 -[v016] 2022-01-31 07:16:30,481 (trainer:653) INFO: 123epoch:train:217-243batch: iter_time=7.297e-05, forward_time=0.031, loss=1.527, loss_att=0.732, loss_ctc=2.322, acc=0.966, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.222e-04, train_time=0.090 -[v016] 2022-01-31 07:16:32,995 (trainer:653) INFO: 123epoch:train:244-270batch: iter_time=7.627e-05, forward_time=0.032, loss=1.482, loss_att=0.632, loss_ctc=2.332, acc=0.971, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.222e-04, train_time=0.093 -[v016] 2022-01-31 07:16:35,489 (trainer:653) INFO: 123epoch:train:271-297batch: iter_time=7.699e-05, forward_time=0.032, loss=1.665, loss_att=0.679, loss_ctc=2.652, acc=0.972, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.222e-04, train_time=0.092 -[v016] 2022-01-31 07:16:37,902 (trainer:653) INFO: 123epoch:train:298-324batch: iter_time=7.494e-05, forward_time=0.031, loss=1.501, loss_att=0.718, loss_ctc=2.285, acc=0.965, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.221e-04, train_time=0.089 -[v016] 2022-01-31 07:16:40,383 (trainer:653) INFO: 123epoch:train:325-351batch: iter_time=0.002, forward_time=0.031, loss=1.685, loss_att=0.724, loss_ctc=2.646, acc=0.968, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.221e-04, train_time=0.092 -[v016] 2022-01-31 07:16:42,789 (trainer:653) INFO: 123epoch:train:352-378batch: iter_time=7.674e-05, forward_time=0.031, loss=1.638, loss_att=0.789, loss_ctc=2.487, acc=0.961, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.221e-04, train_time=0.089 -[v016] 2022-01-31 07:16:45,217 (trainer:653) INFO: 123epoch:train:379-405batch: iter_time=7.449e-05, forward_time=0.031, loss=1.736, loss_att=0.761, loss_ctc=2.711, acc=0.962, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.221e-04, train_time=0.090 -[v016] 2022-01-31 07:16:47,624 (trainer:653) INFO: 123epoch:train:406-432batch: iter_time=7.395e-05, forward_time=0.031, loss=1.622, loss_att=0.728, loss_ctc=2.516, acc=0.967, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.220e-04, train_time=0.089 -[v016] 2022-01-31 07:16:50,075 (trainer:653) INFO: 123epoch:train:433-459batch: iter_time=7.542e-05, forward_time=0.031, loss=1.599, loss_att=0.707, loss_ctc=2.492, acc=0.971, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.220e-04, train_time=0.091 -[v016] 2022-01-31 07:16:52,545 (trainer:653) INFO: 123epoch:train:460-486batch: iter_time=7.517e-05, forward_time=0.032, loss=1.527, loss_att=0.646, loss_ctc=2.408, acc=0.971, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.220e-04, train_time=0.091 -[v016] 2022-01-31 07:16:54,908 (trainer:653) INFO: 123epoch:train:487-513batch: iter_time=7.560e-05, forward_time=0.030, loss=1.326, loss_att=0.673, loss_ctc=1.980, acc=0.961, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.220e-04, train_time=0.087 -[v016] 2022-01-31 07:16:57,389 (trainer:653) INFO: 123epoch:train:514-540batch: iter_time=7.974e-05, forward_time=0.032, loss=1.633, loss_att=0.730, loss_ctc=2.536, acc=0.965, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.219e-04, train_time=0.092 -[v016] 2022-01-31 07:17:30,260 (trainer:328) INFO: 123epoch results: [train] iter_time=2.967e-04, forward_time=0.031, loss=1.548, loss_att=0.695, loss_ctc=2.400, acc=0.968, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.222e-04, train_time=0.091, time=49.77 seconds, total_count=67281, gpu_max_cached_mem_GB=5.824, [valid] loss=7.163, loss_att=5.909, loss_ctc=8.416, acc=0.906, cer=0.097, wer=0.394, cer_ctc=0.141, time=5.37 seconds, total_count=21894, gpu_max_cached_mem_GB=5.824, [att_plot] time=26.78 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:17:32,362 (trainer:375) INFO: The best model has been updated: valid.acc -[v016] 2022-01-31 07:17:32,410 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/107epoch.pth, exp/asr_train_asr_raw_en_word/117epoch.pth, exp/asr_train_asr_raw_en_word/118epoch.pth -[v016] 2022-01-31 07:17:32,410 (trainer:261) INFO: 124/200epoch started. Estimated time to finish: 2 hours, 21 minutes and 32.14 seconds -[v016] 2022-01-31 07:17:35,055 (trainer:653) INFO: 124epoch:train:1-27batch: iter_time=0.003, forward_time=0.033, loss=1.583, loss_att=0.710, loss_ctc=2.456, acc=0.966, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.219e-04, train_time=0.098 -[v016] 2022-01-31 07:17:37,531 (trainer:653) INFO: 124epoch:train:28-54batch: iter_time=8.435e-05, forward_time=0.032, loss=1.309, loss_att=0.580, loss_ctc=2.038, acc=0.969, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.219e-04, train_time=0.092 -[v016] 2022-01-31 07:17:40,072 (trainer:653) INFO: 124epoch:train:55-81batch: iter_time=8.377e-05, forward_time=0.033, loss=1.612, loss_att=0.671, loss_ctc=2.553, acc=0.973, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.219e-04, train_time=0.094 -[v016] 2022-01-31 07:17:42,620 (trainer:653) INFO: 124epoch:train:82-108batch: iter_time=8.214e-05, forward_time=0.033, loss=1.782, loss_att=0.750, loss_ctc=2.814, acc=0.969, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.218e-04, train_time=0.094 -[v016] 2022-01-31 07:17:45,114 (trainer:653) INFO: 124epoch:train:109-135batch: iter_time=8.284e-05, forward_time=0.033, loss=1.578, loss_att=0.648, loss_ctc=2.508, acc=0.971, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.218e-04, train_time=0.092 -[v016] 2022-01-31 07:17:47,562 (trainer:653) INFO: 124epoch:train:136-162batch: iter_time=7.687e-05, forward_time=0.032, loss=1.490, loss_att=0.704, loss_ctc=2.276, acc=0.965, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.218e-04, train_time=0.090 -[v016] 2022-01-31 07:17:50,010 (trainer:653) INFO: 124epoch:train:163-189batch: iter_time=7.933e-05, forward_time=0.032, loss=1.616, loss_att=0.722, loss_ctc=2.510, acc=0.968, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.218e-04, train_time=0.090 -[v016] 2022-01-31 07:17:52,586 (trainer:653) INFO: 124epoch:train:190-216batch: iter_time=8.770e-05, forward_time=0.033, loss=1.697, loss_att=0.838, loss_ctc=2.556, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.217e-04, train_time=0.095 -[v016] 2022-01-31 07:17:55,024 (trainer:653) INFO: 124epoch:train:217-243batch: iter_time=8.026e-05, forward_time=0.031, loss=1.317, loss_att=0.696, loss_ctc=1.939, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.217e-04, train_time=0.090 -[v016] 2022-01-31 07:17:57,657 (trainer:653) INFO: 124epoch:train:244-270batch: iter_time=8.013e-05, forward_time=0.034, loss=1.819, loss_att=0.735, loss_ctc=2.902, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.217e-04, train_time=0.097 -[v016] 2022-01-31 07:18:00,155 (trainer:653) INFO: 124epoch:train:271-297batch: iter_time=8.990e-05, forward_time=0.033, loss=1.337, loss_att=0.594, loss_ctc=2.081, acc=0.971, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.217e-04, train_time=0.092 -[v016] 2022-01-31 07:18:02,697 (trainer:653) INFO: 124epoch:train:298-324batch: iter_time=8.600e-05, forward_time=0.032, loss=1.667, loss_att=0.703, loss_ctc=2.631, acc=0.968, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.216e-04, train_time=0.094 -[v016] 2022-01-31 07:18:05,264 (trainer:653) INFO: 124epoch:train:325-351batch: iter_time=8.234e-05, forward_time=0.033, loss=1.331, loss_att=0.618, loss_ctc=2.044, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.216e-04, train_time=0.095 -[v016] 2022-01-31 07:18:07,950 (trainer:653) INFO: 124epoch:train:352-378batch: iter_time=9.194e-05, forward_time=0.035, loss=1.469, loss_att=0.632, loss_ctc=2.307, acc=0.978, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.216e-04, train_time=0.099 -[v016] 2022-01-31 07:18:10,527 (trainer:653) INFO: 124epoch:train:379-405batch: iter_time=1.007e-04, forward_time=0.034, loss=1.479, loss_att=0.648, loss_ctc=2.310, acc=0.966, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.216e-04, train_time=0.095 -[v016] 2022-01-31 07:18:13,084 (trainer:653) INFO: 124epoch:train:406-432batch: iter_time=8.779e-05, forward_time=0.033, loss=1.175, loss_att=0.618, loss_ctc=1.732, acc=0.970, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.215e-04, train_time=0.094 -[v016] 2022-01-31 07:18:15,653 (trainer:653) INFO: 124epoch:train:433-459batch: iter_time=2.124e-04, forward_time=0.033, loss=1.452, loss_att=0.645, loss_ctc=2.259, acc=0.971, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.215e-04, train_time=0.095 -[v016] 2022-01-31 07:18:18,162 (trainer:653) INFO: 124epoch:train:460-486batch: iter_time=8.469e-05, forward_time=0.032, loss=1.399, loss_att=0.671, loss_ctc=2.128, acc=0.959, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.215e-04, train_time=0.093 -[v016] 2022-01-31 07:18:20,629 (trainer:653) INFO: 124epoch:train:487-513batch: iter_time=8.170e-05, forward_time=0.032, loss=1.295, loss_att=0.606, loss_ctc=1.984, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.215e-04, train_time=0.091 -[v016] 2022-01-31 07:18:23,043 (trainer:653) INFO: 124epoch:train:514-540batch: iter_time=7.461e-05, forward_time=0.031, loss=1.416, loss_att=0.647, loss_ctc=2.185, acc=0.973, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.214e-04, train_time=0.089 -[v016] 2022-01-31 07:18:57,131 (trainer:328) INFO: 124epoch results: [train] iter_time=2.321e-04, forward_time=0.033, loss=1.498, loss_att=0.675, loss_ctc=2.320, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.217e-04, train_time=0.094, time=51.35 seconds, total_count=67828, gpu_max_cached_mem_GB=5.824, [valid] loss=7.180, loss_att=5.945, loss_ctc=8.415, acc=0.904, cer=0.101, wer=0.400, cer_ctc=0.147, time=5.32 seconds, total_count=22072, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.05 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:18:59,127 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 07:18:59,158 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/121epoch.pth -[v016] 2022-01-31 07:18:59,158 (trainer:261) INFO: 125/200epoch started. Estimated time to finish: 2 hours, 19 minutes and 24.65 seconds -[v016] 2022-01-31 07:19:01,721 (trainer:653) INFO: 125epoch:train:1-27batch: iter_time=0.004, forward_time=0.031, loss=1.226, loss_att=0.612, loss_ctc=1.839, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.214e-04, train_time=0.095 -[v016] 2022-01-31 07:19:04,218 (trainer:653) INFO: 125epoch:train:28-54batch: iter_time=8.690e-05, forward_time=0.032, loss=1.647, loss_att=0.716, loss_ctc=2.579, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.214e-04, train_time=0.092 -[v016] 2022-01-31 07:19:06,682 (trainer:653) INFO: 125epoch:train:55-81batch: iter_time=9.168e-05, forward_time=0.031, loss=1.367, loss_att=0.554, loss_ctc=2.180, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.214e-04, train_time=0.091 -[v016] 2022-01-31 07:19:09,145 (trainer:653) INFO: 125epoch:train:82-108batch: iter_time=8.220e-05, forward_time=0.031, loss=1.553, loss_att=0.682, loss_ctc=2.424, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.213e-04, train_time=0.091 -[v016] 2022-01-31 07:19:11,607 (trainer:653) INFO: 125epoch:train:109-135batch: iter_time=8.474e-05, forward_time=0.032, loss=1.384, loss_att=0.614, loss_ctc=2.154, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.213e-04, train_time=0.091 -[v016] 2022-01-31 07:19:14,123 (trainer:653) INFO: 125epoch:train:136-162batch: iter_time=8.752e-05, forward_time=0.032, loss=1.602, loss_att=0.743, loss_ctc=2.461, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.213e-04, train_time=0.093 -[v016] 2022-01-31 07:19:17,085 (trainer:653) INFO: 125epoch:train:163-189batch: iter_time=0.019, forward_time=0.031, loss=1.572, loss_att=0.709, loss_ctc=2.436, acc=0.964, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.213e-04, train_time=0.109 -[v016] 2022-01-31 07:19:19,518 (trainer:653) INFO: 125epoch:train:190-216batch: iter_time=7.797e-05, forward_time=0.031, loss=1.453, loss_att=0.665, loss_ctc=2.240, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.212e-04, train_time=0.090 -[v016] 2022-01-31 07:19:21,980 (trainer:653) INFO: 125epoch:train:217-243batch: iter_time=8.370e-05, forward_time=0.031, loss=1.294, loss_att=0.588, loss_ctc=2.000, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.212e-04, train_time=0.091 -[v016] 2022-01-31 07:19:24,416 (trainer:653) INFO: 125epoch:train:244-270batch: iter_time=7.608e-05, forward_time=0.031, loss=1.336, loss_att=0.576, loss_ctc=2.096, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.212e-04, train_time=0.090 -[v016] 2022-01-31 07:19:26,998 (trainer:653) INFO: 125epoch:train:271-297batch: iter_time=7.881e-05, forward_time=0.033, loss=1.689, loss_att=0.740, loss_ctc=2.637, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.212e-04, train_time=0.095 -[v016] 2022-01-31 07:19:29,450 (trainer:653) INFO: 125epoch:train:298-324batch: iter_time=1.539e-04, forward_time=0.031, loss=1.619, loss_att=0.680, loss_ctc=2.558, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.211e-04, train_time=0.091 -[v016] 2022-01-31 07:19:31,841 (trainer:653) INFO: 125epoch:train:325-351batch: iter_time=7.630e-05, forward_time=0.030, loss=1.474, loss_att=0.743, loss_ctc=2.205, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.211e-04, train_time=0.088 -[v016] 2022-01-31 07:19:34,206 (trainer:653) INFO: 125epoch:train:352-378batch: iter_time=7.428e-05, forward_time=0.030, loss=1.359, loss_att=0.687, loss_ctc=2.031, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.211e-04, train_time=0.087 -[v016] 2022-01-31 07:19:36,686 (trainer:653) INFO: 125epoch:train:379-405batch: iter_time=8.409e-05, forward_time=0.031, loss=1.533, loss_att=0.665, loss_ctc=2.402, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.211e-04, train_time=0.092 -[v016] 2022-01-31 07:19:39,119 (trainer:653) INFO: 125epoch:train:406-432batch: iter_time=8.167e-05, forward_time=0.030, loss=1.506, loss_att=0.675, loss_ctc=2.337, acc=0.966, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.210e-04, train_time=0.090 -[v016] 2022-01-31 07:19:41,749 (trainer:653) INFO: 125epoch:train:433-459batch: iter_time=7.686e-05, forward_time=0.033, loss=1.497, loss_att=0.549, loss_ctc=2.444, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.210e-04, train_time=0.097 -[v016] 2022-01-31 07:19:44,226 (trainer:653) INFO: 125epoch:train:460-486batch: iter_time=8.382e-05, forward_time=0.031, loss=1.520, loss_att=0.690, loss_ctc=2.350, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.210e-04, train_time=0.092 -[v016] 2022-01-31 07:19:46,826 (trainer:653) INFO: 125epoch:train:487-513batch: iter_time=7.928e-05, forward_time=0.031, loss=1.417, loss_att=0.617, loss_ctc=2.216, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.210e-04, train_time=0.096 -[v016] 2022-01-31 07:19:49,264 (trainer:653) INFO: 125epoch:train:514-540batch: iter_time=1.713e-04, forward_time=0.031, loss=1.542, loss_att=0.726, loss_ctc=2.358, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.210e-04, train_time=0.090 -[v016] 2022-01-31 07:20:22,390 (trainer:328) INFO: 125epoch results: [train] iter_time=0.001, forward_time=0.031, loss=1.476, loss_att=0.661, loss_ctc=2.292, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.212e-04, train_time=0.093, time=50.8 seconds, total_count=68375, gpu_max_cached_mem_GB=5.824, [valid] loss=7.268, loss_att=5.988, loss_ctc=8.548, acc=0.905, cer=0.101, wer=0.405, cer_ctc=0.141, time=5.35 seconds, total_count=22250, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.08 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:20:24,348 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 07:20:24,375 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/120epoch.pth -[v016] 2022-01-31 07:20:24,376 (trainer:261) INFO: 126/200epoch started. Estimated time to finish: 2 hours, 17 minutes and 16.84 seconds -[v016] 2022-01-31 07:20:26,922 (trainer:653) INFO: 126epoch:train:1-27batch: iter_time=0.004, forward_time=0.031, loss=1.459, loss_att=0.689, loss_ctc=2.229, acc=0.967, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.209e-04, train_time=0.094 -[v016] 2022-01-31 07:20:29,330 (trainer:653) INFO: 126epoch:train:28-54batch: iter_time=8.311e-05, forward_time=0.030, loss=1.358, loss_att=0.653, loss_ctc=2.064, acc=0.966, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.209e-04, train_time=0.089 -[v016] 2022-01-31 07:20:31,771 (trainer:653) INFO: 126epoch:train:55-81batch: iter_time=7.444e-05, forward_time=0.031, loss=1.400, loss_att=0.637, loss_ctc=2.163, acc=0.974, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.209e-04, train_time=0.090 -[v016] 2022-01-31 07:20:34,220 (trainer:653) INFO: 126epoch:train:82-108batch: iter_time=7.343e-05, forward_time=0.031, loss=1.397, loss_att=0.612, loss_ctc=2.183, acc=0.971, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.209e-04, train_time=0.090 -[v016] 2022-01-31 07:20:36,599 (trainer:653) INFO: 126epoch:train:109-135batch: iter_time=7.382e-05, forward_time=0.030, loss=1.739, loss_att=0.839, loss_ctc=2.640, acc=0.964, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.208e-04, train_time=0.088 -[v016] 2022-01-31 07:20:39,080 (trainer:653) INFO: 126epoch:train:136-162batch: iter_time=7.437e-05, forward_time=0.032, loss=1.573, loss_att=0.715, loss_ctc=2.431, acc=0.968, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.208e-04, train_time=0.092 -[v016] 2022-01-31 07:20:41,530 (trainer:653) INFO: 126epoch:train:163-189batch: iter_time=8.096e-05, forward_time=0.032, loss=1.476, loss_att=0.688, loss_ctc=2.263, acc=0.962, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.208e-04, train_time=0.091 -[v016] 2022-01-31 07:20:43,890 (trainer:653) INFO: 126epoch:train:190-216batch: iter_time=7.377e-05, forward_time=0.030, loss=1.249, loss_att=0.599, loss_ctc=1.898, acc=0.971, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.208e-04, train_time=0.087 -[v016] 2022-01-31 07:20:46,380 (trainer:653) INFO: 126epoch:train:217-243batch: iter_time=7.425e-05, forward_time=0.032, loss=1.430, loss_att=0.622, loss_ctc=2.238, acc=0.977, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.207e-04, train_time=0.092 -[v016] 2022-01-31 07:20:48,826 (trainer:653) INFO: 126epoch:train:244-270batch: iter_time=7.694e-05, forward_time=0.031, loss=1.493, loss_att=0.570, loss_ctc=2.416, acc=0.973, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.207e-04, train_time=0.090 -[v016] 2022-01-31 07:20:51,619 (trainer:653) INFO: 126epoch:train:271-297batch: iter_time=0.014, forward_time=0.031, loss=1.342, loss_att=0.687, loss_ctc=1.997, acc=0.968, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.207e-04, train_time=0.103 -[v016] 2022-01-31 07:20:54,003 (trainer:653) INFO: 126epoch:train:298-324batch: iter_time=7.934e-05, forward_time=0.030, loss=1.472, loss_att=0.708, loss_ctc=2.237, acc=0.968, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.207e-04, train_time=0.088 -[v016] 2022-01-31 07:20:56,506 (trainer:653) INFO: 126epoch:train:325-351batch: iter_time=8.745e-05, forward_time=0.032, loss=1.493, loss_att=0.698, loss_ctc=2.288, acc=0.970, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.206e-04, train_time=0.093 -[v016] 2022-01-31 07:20:58,994 (trainer:653) INFO: 126epoch:train:352-378batch: iter_time=7.936e-05, forward_time=0.032, loss=1.618, loss_att=0.729, loss_ctc=2.508, acc=0.968, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.206e-04, train_time=0.092 -[v016] 2022-01-31 07:21:01,468 (trainer:653) INFO: 126epoch:train:379-405batch: iter_time=7.577e-05, forward_time=0.032, loss=1.484, loss_att=0.633, loss_ctc=2.335, acc=0.974, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.206e-04, train_time=0.091 -[v016] 2022-01-31 07:21:03,842 (trainer:653) INFO: 126epoch:train:406-432batch: iter_time=7.984e-05, forward_time=0.031, loss=1.358, loss_att=0.656, loss_ctc=2.059, acc=0.965, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.206e-04, train_time=0.088 -[v016] 2022-01-31 07:21:06,251 (trainer:653) INFO: 126epoch:train:433-459batch: iter_time=7.625e-05, forward_time=0.031, loss=1.494, loss_att=0.630, loss_ctc=2.359, acc=0.970, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.205e-04, train_time=0.089 -[v016] 2022-01-31 07:21:08,776 (trainer:653) INFO: 126epoch:train:460-486batch: iter_time=7.825e-05, forward_time=0.032, loss=1.514, loss_att=0.652, loss_ctc=2.375, acc=0.972, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.205e-04, train_time=0.093 -[v016] 2022-01-31 07:21:11,171 (trainer:653) INFO: 126epoch:train:487-513batch: iter_time=7.607e-05, forward_time=0.031, loss=1.449, loss_att=0.651, loss_ctc=2.248, acc=0.972, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.205e-04, train_time=0.088 -[v016] 2022-01-31 07:21:13,653 (trainer:653) INFO: 126epoch:train:514-540batch: iter_time=8.391e-05, forward_time=0.032, loss=1.302, loss_att=0.568, loss_ctc=2.035, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.205e-04, train_time=0.092 -[v016] 2022-01-31 07:21:47,219 (trainer:328) INFO: 126epoch results: [train] iter_time=9.420e-04, forward_time=0.031, loss=1.459, loss_att=0.662, loss_ctc=2.255, acc=0.970, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.207e-04, train_time=0.091, time=49.96 seconds, total_count=68922, gpu_max_cached_mem_GB=5.824, [valid] loss=7.221, loss_att=5.912, loss_ctc=8.530, acc=0.907, cer=0.095, wer=0.387, cer_ctc=0.144, time=5.35 seconds, total_count=22428, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.53 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:21:49,154 (trainer:375) INFO: The best model has been updated: train.loss, train.acc, valid.acc -[v016] 2022-01-31 07:21:49,182 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/115epoch.pth -[v016] 2022-01-31 07:21:49,182 (trainer:261) INFO: 127/200epoch started. Estimated time to finish: 2 hours, 15 minutes and 9.55 seconds -[v016] 2022-01-31 07:21:51,749 (trainer:653) INFO: 127epoch:train:1-27batch: iter_time=0.003, forward_time=0.031, loss=1.409, loss_att=0.575, loss_ctc=2.242, acc=0.973, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.204e-04, train_time=0.095 -[v016] 2022-01-31 07:21:54,177 (trainer:653) INFO: 127epoch:train:28-54batch: iter_time=0.003, forward_time=0.030, loss=1.225, loss_att=0.584, loss_ctc=1.866, acc=0.970, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.204e-04, train_time=0.090 -[v016] 2022-01-31 07:21:56,666 (trainer:653) INFO: 127epoch:train:55-81batch: iter_time=7.670e-05, forward_time=0.032, loss=1.552, loss_att=0.655, loss_ctc=2.449, acc=0.972, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.204e-04, train_time=0.092 -[v016] 2022-01-31 07:21:59,234 (trainer:653) INFO: 127epoch:train:82-108batch: iter_time=8.037e-05, forward_time=0.033, loss=1.702, loss_att=0.629, loss_ctc=2.776, acc=0.975, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.204e-04, train_time=0.095 -[v016] 2022-01-31 07:22:01,742 (trainer:653) INFO: 127epoch:train:109-135batch: iter_time=7.894e-05, forward_time=0.032, loss=1.387, loss_att=0.576, loss_ctc=2.199, acc=0.975, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.203e-04, train_time=0.093 -[v016] 2022-01-31 07:22:04,134 (trainer:653) INFO: 127epoch:train:136-162batch: iter_time=7.684e-05, forward_time=0.030, loss=1.418, loss_att=0.651, loss_ctc=2.185, acc=0.967, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.203e-04, train_time=0.088 -[v016] 2022-01-31 07:22:06,467 (trainer:653) INFO: 127epoch:train:163-189batch: iter_time=7.555e-05, forward_time=0.030, loss=1.263, loss_att=0.614, loss_ctc=1.913, acc=0.965, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.203e-04, train_time=0.086 -[v016] 2022-01-31 07:22:09,078 (trainer:653) INFO: 127epoch:train:190-216batch: iter_time=7.764e-05, forward_time=0.033, loss=1.804, loss_att=0.689, loss_ctc=2.920, acc=0.973, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.203e-04, train_time=0.097 -[v016] 2022-01-31 07:22:11,484 (trainer:653) INFO: 127epoch:train:217-243batch: iter_time=7.405e-05, forward_time=0.031, loss=1.369, loss_att=0.575, loss_ctc=2.163, acc=0.972, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.203e-04, train_time=0.089 -[v016] 2022-01-31 07:22:13,916 (trainer:653) INFO: 127epoch:train:244-270batch: iter_time=7.632e-05, forward_time=0.031, loss=1.488, loss_att=0.682, loss_ctc=2.295, acc=0.966, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.202e-04, train_time=0.090 -[v016] 2022-01-31 07:22:16,376 (trainer:653) INFO: 127epoch:train:271-297batch: iter_time=8.017e-05, forward_time=0.032, loss=1.251, loss_att=0.579, loss_ctc=1.923, acc=0.970, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.202e-04, train_time=0.091 -[v016] 2022-01-31 07:22:18,830 (trainer:653) INFO: 127epoch:train:298-324batch: iter_time=7.596e-05, forward_time=0.031, loss=1.312, loss_att=0.587, loss_ctc=2.036, acc=0.974, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.202e-04, train_time=0.091 -[v016] 2022-01-31 07:22:21,235 (trainer:653) INFO: 127epoch:train:325-351batch: iter_time=7.530e-05, forward_time=0.031, loss=1.439, loss_att=0.679, loss_ctc=2.198, acc=0.973, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.202e-04, train_time=0.089 -[v016] 2022-01-31 07:22:23,719 (trainer:653) INFO: 127epoch:train:352-378batch: iter_time=0.003, forward_time=0.030, loss=1.494, loss_att=0.774, loss_ctc=2.214, acc=0.960, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.201e-04, train_time=0.092 -[v016] 2022-01-31 07:22:26,160 (trainer:653) INFO: 127epoch:train:379-405batch: iter_time=7.554e-05, forward_time=0.031, loss=1.291, loss_att=0.560, loss_ctc=2.023, acc=0.975, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.201e-04, train_time=0.090 -[v016] 2022-01-31 07:22:28,645 (trainer:653) INFO: 127epoch:train:406-432batch: iter_time=8.064e-05, forward_time=0.032, loss=1.497, loss_att=0.677, loss_ctc=2.317, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.201e-04, train_time=0.092 -[v016] 2022-01-31 07:22:31,129 (trainer:653) INFO: 127epoch:train:433-459batch: iter_time=8.408e-05, forward_time=0.032, loss=1.360, loss_att=0.636, loss_ctc=2.084, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.201e-04, train_time=0.092 -[v016] 2022-01-31 07:22:33,800 (trainer:653) INFO: 127epoch:train:460-486batch: iter_time=1.030e-04, forward_time=0.035, loss=1.593, loss_att=0.682, loss_ctc=2.504, acc=0.970, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.200e-04, train_time=0.099 -[v016] 2022-01-31 07:22:36,347 (trainer:653) INFO: 127epoch:train:487-513batch: iter_time=9.375e-05, forward_time=0.033, loss=1.372, loss_att=0.565, loss_ctc=2.179, acc=0.977, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.200e-04, train_time=0.094 -[v016] 2022-01-31 07:22:38,939 (trainer:653) INFO: 127epoch:train:514-540batch: iter_time=1.110e-04, forward_time=0.034, loss=1.468, loss_att=0.698, loss_ctc=2.238, acc=0.964, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.200e-04, train_time=0.096 -[v016] 2022-01-31 07:23:14,537 (trainer:328) INFO: 127epoch results: [train] iter_time=5.164e-04, forward_time=0.032, loss=1.433, loss_att=0.631, loss_ctc=2.236, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.202e-04, train_time=0.092, time=50.52 seconds, total_count=69469, gpu_max_cached_mem_GB=5.824, [valid] loss=7.391, loss_att=6.033, loss_ctc=8.748, acc=0.905, cer=0.100, wer=0.397, cer_ctc=0.148, time=5.69 seconds, total_count=22606, gpu_max_cached_mem_GB=5.824, [att_plot] time=29.15 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:23:16,577 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 07:23:16,586 (trainer:261) INFO: 128/200epoch started. Estimated time to finish: 2 hours, 13 minutes and 4.83 seconds -[v016] 2022-01-31 07:23:19,458 (trainer:653) INFO: 128epoch:train:1-27batch: iter_time=0.004, forward_time=0.035, loss=1.493, loss_att=0.696, loss_ctc=2.290, acc=0.965, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.200e-04, train_time=0.106 -[v016] 2022-01-31 07:23:22,120 (trainer:653) INFO: 128epoch:train:28-54batch: iter_time=1.191e-04, forward_time=0.035, loss=1.517, loss_att=0.725, loss_ctc=2.308, acc=0.965, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.199e-04, train_time=0.098 -[v016] 2022-01-31 07:23:24,842 (trainer:653) INFO: 128epoch:train:55-81batch: iter_time=9.640e-05, forward_time=0.036, loss=1.479, loss_att=0.698, loss_ctc=2.259, acc=0.970, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.199e-04, train_time=0.101 -[v016] 2022-01-31 07:23:27,677 (trainer:653) INFO: 128epoch:train:82-108batch: iter_time=0.009, forward_time=0.034, loss=1.484, loss_att=0.671, loss_ctc=2.296, acc=0.968, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.199e-04, train_time=0.105 -[v016] 2022-01-31 07:23:30,254 (trainer:653) INFO: 128epoch:train:109-135batch: iter_time=1.098e-04, forward_time=0.033, loss=1.300, loss_att=0.614, loss_ctc=1.985, acc=0.971, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.199e-04, train_time=0.095 -[v016] 2022-01-31 07:23:32,839 (trainer:653) INFO: 128epoch:train:136-162batch: iter_time=9.848e-05, forward_time=0.033, loss=1.504, loss_att=0.630, loss_ctc=2.378, acc=0.971, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.198e-04, train_time=0.095 -[v016] 2022-01-31 07:23:35,393 (trainer:653) INFO: 128epoch:train:163-189batch: iter_time=1.043e-04, forward_time=0.033, loss=1.216, loss_att=0.567, loss_ctc=1.865, acc=0.974, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.198e-04, train_time=0.094 -[v016] 2022-01-31 07:23:37,995 (trainer:653) INFO: 128epoch:train:190-216batch: iter_time=1.001e-04, forward_time=0.033, loss=1.559, loss_att=0.648, loss_ctc=2.470, acc=0.972, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.198e-04, train_time=0.096 -[v016] 2022-01-31 07:23:40,582 (trainer:653) INFO: 128epoch:train:217-243batch: iter_time=1.104e-04, forward_time=0.033, loss=1.329, loss_att=0.614, loss_ctc=2.044, acc=0.976, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.198e-04, train_time=0.096 -[v016] 2022-01-31 07:23:43,244 (trainer:653) INFO: 128epoch:train:244-270batch: iter_time=1.091e-04, forward_time=0.034, loss=1.527, loss_att=0.707, loss_ctc=2.346, acc=0.970, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.198e-04, train_time=0.098 -[v016] 2022-01-31 07:23:45,908 (trainer:653) INFO: 128epoch:train:271-297batch: iter_time=1.076e-04, forward_time=0.034, loss=1.445, loss_att=0.636, loss_ctc=2.255, acc=0.973, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.197e-04, train_time=0.098 -[v016] 2022-01-31 07:23:48,399 (trainer:653) INFO: 128epoch:train:298-324batch: iter_time=7.943e-05, forward_time=0.032, loss=1.531, loss_att=0.778, loss_ctc=2.284, acc=0.958, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.197e-04, train_time=0.092 -[v016] 2022-01-31 07:23:50,881 (trainer:653) INFO: 128epoch:train:325-351batch: iter_time=8.229e-05, forward_time=0.032, loss=1.277, loss_att=0.617, loss_ctc=1.937, acc=0.970, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.197e-04, train_time=0.092 -[v016] 2022-01-31 07:23:53,326 (trainer:653) INFO: 128epoch:train:352-378batch: iter_time=8.158e-05, forward_time=0.031, loss=1.454, loss_att=0.694, loss_ctc=2.213, acc=0.966, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.197e-04, train_time=0.090 -[v016] 2022-01-31 07:23:55,694 (trainer:653) INFO: 128epoch:train:379-405batch: iter_time=8.195e-05, forward_time=0.030, loss=1.431, loss_att=0.644, loss_ctc=2.219, acc=0.971, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.196e-04, train_time=0.087 -[v016] 2022-01-31 07:23:58,714 (trainer:653) INFO: 128epoch:train:406-432batch: iter_time=0.019, forward_time=0.032, loss=1.700, loss_att=0.703, loss_ctc=2.697, acc=0.969, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.196e-04, train_time=0.112 -[v016] 2022-01-31 07:24:01,167 (trainer:653) INFO: 128epoch:train:433-459batch: iter_time=7.780e-05, forward_time=0.031, loss=1.432, loss_att=0.635, loss_ctc=2.229, acc=0.970, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.196e-04, train_time=0.091 -[v016] 2022-01-31 07:24:03,519 (trainer:653) INFO: 128epoch:train:460-486batch: iter_time=7.679e-05, forward_time=0.030, loss=1.173, loss_att=0.553, loss_ctc=1.792, acc=0.967, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.196e-04, train_time=0.087 -[v016] 2022-01-31 07:24:05,932 (trainer:653) INFO: 128epoch:train:487-513batch: iter_time=7.598e-05, forward_time=0.031, loss=1.613, loss_att=0.768, loss_ctc=2.458, acc=0.963, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.195e-04, train_time=0.089 -[v016] 2022-01-31 07:24:08,408 (trainer:653) INFO: 128epoch:train:514-540batch: iter_time=8.306e-05, forward_time=0.032, loss=1.781, loss_att=0.789, loss_ctc=2.773, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.195e-04, train_time=0.091 -[v016] 2022-01-31 07:24:41,719 (trainer:328) INFO: 128epoch results: [train] iter_time=0.002, forward_time=0.033, loss=1.464, loss_att=0.669, loss_ctc=2.260, acc=0.969, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.197e-04, train_time=0.096, time=52.55 seconds, total_count=70016, gpu_max_cached_mem_GB=5.824, [valid] loss=7.205, loss_att=5.962, loss_ctc=8.447, acc=0.905, cer=0.099, wer=0.398, cer_ctc=0.144, time=5.41 seconds, total_count=22784, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.17 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:24:43,662 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 07:24:43,710 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/119epoch.pth, exp/asr_train_asr_raw_en_word/122epoch.pth -[v016] 2022-01-31 07:24:43,710 (trainer:261) INFO: 129/200epoch started. Estimated time to finish: 2 hours, 11 minutes and 0.61 seconds -[v016] 2022-01-31 07:24:46,311 (trainer:653) INFO: 129epoch:train:1-27batch: iter_time=0.003, forward_time=0.031, loss=1.360, loss_att=0.639, loss_ctc=2.081, acc=0.970, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.195e-04, train_time=0.096 -[v016] 2022-01-31 07:24:48,700 (trainer:653) INFO: 129epoch:train:28-54batch: iter_time=8.248e-05, forward_time=0.031, loss=1.310, loss_att=0.605, loss_ctc=2.015, acc=0.971, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.195e-04, train_time=0.088 -[v016] 2022-01-31 07:24:51,116 (trainer:653) INFO: 129epoch:train:55-81batch: iter_time=7.673e-05, forward_time=0.031, loss=1.171, loss_att=0.540, loss_ctc=1.802, acc=0.973, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.195e-04, train_time=0.089 -[v016] 2022-01-31 07:24:53,540 (trainer:653) INFO: 129epoch:train:82-108batch: iter_time=7.512e-05, forward_time=0.031, loss=1.445, loss_att=0.660, loss_ctc=2.230, acc=0.968, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.194e-04, train_time=0.090 -[v016] 2022-01-31 07:24:56,020 (trainer:653) INFO: 129epoch:train:109-135batch: iter_time=8.214e-05, forward_time=0.032, loss=1.433, loss_att=0.672, loss_ctc=2.194, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.194e-04, train_time=0.092 -[v016] 2022-01-31 07:24:58,598 (trainer:653) INFO: 129epoch:train:136-162batch: iter_time=7.914e-05, forward_time=0.033, loss=1.424, loss_att=0.580, loss_ctc=2.268, acc=0.977, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.194e-04, train_time=0.095 -[v016] 2022-01-31 07:25:01,199 (trainer:653) INFO: 129epoch:train:163-189batch: iter_time=0.007, forward_time=0.031, loss=1.444, loss_att=0.618, loss_ctc=2.271, acc=0.970, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.194e-04, train_time=0.096 -[v016] 2022-01-31 07:25:03,720 (trainer:653) INFO: 129epoch:train:190-216batch: iter_time=7.533e-05, forward_time=0.032, loss=1.497, loss_att=0.658, loss_ctc=2.336, acc=0.971, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.193e-04, train_time=0.093 -[v016] 2022-01-31 07:25:06,147 (trainer:653) INFO: 129epoch:train:217-243batch: iter_time=7.471e-05, forward_time=0.031, loss=1.604, loss_att=0.726, loss_ctc=2.482, acc=0.965, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.193e-04, train_time=0.090 -[v016] 2022-01-31 07:25:08,621 (trainer:653) INFO: 129epoch:train:244-270batch: iter_time=7.517e-05, forward_time=0.032, loss=1.420, loss_att=0.583, loss_ctc=2.257, acc=0.972, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.193e-04, train_time=0.091 -[v016] 2022-01-31 07:25:11,014 (trainer:653) INFO: 129epoch:train:271-297batch: iter_time=7.782e-05, forward_time=0.031, loss=1.293, loss_att=0.620, loss_ctc=1.966, acc=0.965, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.193e-04, train_time=0.088 -[v016] 2022-01-31 07:25:13,430 (trainer:653) INFO: 129epoch:train:298-324batch: iter_time=8.016e-05, forward_time=0.031, loss=1.383, loss_att=0.607, loss_ctc=2.159, acc=0.970, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.192e-04, train_time=0.089 -[v016] 2022-01-31 07:25:15,932 (trainer:653) INFO: 129epoch:train:325-351batch: iter_time=7.830e-05, forward_time=0.032, loss=1.341, loss_att=0.619, loss_ctc=2.063, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.192e-04, train_time=0.092 -[v016] 2022-01-31 07:25:18,378 (trainer:653) INFO: 129epoch:train:352-378batch: iter_time=7.706e-05, forward_time=0.032, loss=1.442, loss_att=0.698, loss_ctc=2.186, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.192e-04, train_time=0.090 -[v016] 2022-01-31 07:25:20,929 (trainer:653) INFO: 129epoch:train:379-405batch: iter_time=7.623e-05, forward_time=0.033, loss=1.508, loss_att=0.664, loss_ctc=2.353, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.192e-04, train_time=0.094 -[v016] 2022-01-31 07:25:23,423 (trainer:653) INFO: 129epoch:train:406-432batch: iter_time=7.684e-05, forward_time=0.032, loss=1.619, loss_att=0.653, loss_ctc=2.585, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.192e-04, train_time=0.092 -[v016] 2022-01-31 07:25:25,898 (trainer:653) INFO: 129epoch:train:433-459batch: iter_time=7.688e-05, forward_time=0.032, loss=1.235, loss_att=0.590, loss_ctc=1.879, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.191e-04, train_time=0.091 -[v016] 2022-01-31 07:25:28,327 (trainer:653) INFO: 129epoch:train:460-486batch: iter_time=8.117e-05, forward_time=0.031, loss=1.489, loss_att=0.721, loss_ctc=2.257, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.191e-04, train_time=0.090 -[v016] 2022-01-31 07:25:30,806 (trainer:653) INFO: 129epoch:train:487-513batch: iter_time=7.907e-05, forward_time=0.032, loss=1.560, loss_att=0.698, loss_ctc=2.422, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.191e-04, train_time=0.092 -[v016] 2022-01-31 07:25:33,539 (trainer:653) INFO: 129epoch:train:514-540batch: iter_time=0.007, forward_time=0.032, loss=1.503, loss_att=0.653, loss_ctc=2.352, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.191e-04, train_time=0.101 -[v016] 2022-01-31 07:26:07,208 (trainer:328) INFO: 129epoch results: [train] iter_time=9.454e-04, forward_time=0.032, loss=1.426, loss_att=0.640, loss_ctc=2.212, acc=0.970, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.193e-04, train_time=0.092, time=50.54 seconds, total_count=70563, gpu_max_cached_mem_GB=5.824, [valid] loss=7.379, loss_att=6.030, loss_ctc=8.729, acc=0.903, cer=0.100, wer=0.408, cer_ctc=0.145, time=5.56 seconds, total_count=22962, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.4 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:26:09,300 (trainer:375) INFO: The best model has been updated: train.loss -[v016] 2022-01-31 07:26:09,332 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/124epoch.pth -[v016] 2022-01-31 07:26:09,332 (trainer:261) INFO: 130/200epoch started. Estimated time to finish: 2 hours, 8 minutes and 56.09 seconds -[v016] 2022-01-31 07:26:12,034 (trainer:653) INFO: 130epoch:train:1-27batch: iter_time=0.003, forward_time=0.033, loss=1.409, loss_att=0.627, loss_ctc=2.192, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.190e-04, train_time=0.100 -[v016] 2022-01-31 07:26:14,440 (trainer:653) INFO: 130epoch:train:28-54batch: iter_time=8.061e-05, forward_time=0.031, loss=1.358, loss_att=0.672, loss_ctc=2.044, acc=0.966, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.190e-04, train_time=0.089 -[v016] 2022-01-31 07:26:16,920 (trainer:653) INFO: 130epoch:train:55-81batch: iter_time=8.291e-05, forward_time=0.032, loss=1.390, loss_att=0.604, loss_ctc=2.176, acc=0.970, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.190e-04, train_time=0.092 -[v016] 2022-01-31 07:26:19,362 (trainer:653) INFO: 130epoch:train:82-108batch: iter_time=7.507e-05, forward_time=0.032, loss=1.343, loss_att=0.611, loss_ctc=2.075, acc=0.971, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.190e-04, train_time=0.090 -[v016] 2022-01-31 07:26:21,794 (trainer:653) INFO: 130epoch:train:109-135batch: iter_time=7.372e-05, forward_time=0.031, loss=1.380, loss_att=0.630, loss_ctc=2.130, acc=0.972, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.189e-04, train_time=0.090 -[v016] 2022-01-31 07:26:24,291 (trainer:653) INFO: 130epoch:train:136-162batch: iter_time=7.495e-05, forward_time=0.032, loss=1.364, loss_att=0.554, loss_ctc=2.174, acc=0.975, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.189e-04, train_time=0.092 -[v016] 2022-01-31 07:26:26,734 (trainer:653) INFO: 130epoch:train:163-189batch: iter_time=7.528e-05, forward_time=0.032, loss=1.385, loss_att=0.586, loss_ctc=2.185, acc=0.973, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.189e-04, train_time=0.090 -[v016] 2022-01-31 07:26:29,305 (trainer:653) INFO: 130epoch:train:190-216batch: iter_time=7.525e-05, forward_time=0.033, loss=1.683, loss_att=0.620, loss_ctc=2.745, acc=0.975, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.189e-04, train_time=0.095 -[v016] 2022-01-31 07:26:31,752 (trainer:653) INFO: 130epoch:train:217-243batch: iter_time=9.267e-05, forward_time=0.031, loss=1.205, loss_att=0.523, loss_ctc=1.887, acc=0.974, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.189e-04, train_time=0.090 -[v016] 2022-01-31 07:26:34,190 (trainer:653) INFO: 130epoch:train:244-270batch: iter_time=0.002, forward_time=0.031, loss=1.420, loss_att=0.700, loss_ctc=2.139, acc=0.962, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.188e-04, train_time=0.090 -[v016] 2022-01-31 07:26:36,870 (trainer:653) INFO: 130epoch:train:271-297batch: iter_time=0.007, forward_time=0.032, loss=1.504, loss_att=0.632, loss_ctc=2.377, acc=0.971, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.188e-04, train_time=0.099 -[v016] 2022-01-31 07:26:39,326 (trainer:653) INFO: 130epoch:train:298-324batch: iter_time=7.538e-05, forward_time=0.031, loss=1.360, loss_att=0.570, loss_ctc=2.150, acc=0.972, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.188e-04, train_time=0.091 -[v016] 2022-01-31 07:26:41,813 (trainer:653) INFO: 130epoch:train:325-351batch: iter_time=7.680e-05, forward_time=0.032, loss=1.566, loss_att=0.662, loss_ctc=2.469, acc=0.970, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.188e-04, train_time=0.092 -[v016] 2022-01-31 07:26:44,252 (trainer:653) INFO: 130epoch:train:352-378batch: iter_time=7.551e-05, forward_time=0.032, loss=1.533, loss_att=0.683, loss_ctc=2.383, acc=0.969, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.187e-04, train_time=0.090 -[v016] 2022-01-31 07:26:46,714 (trainer:653) INFO: 130epoch:train:379-405batch: iter_time=7.765e-05, forward_time=0.032, loss=1.305, loss_att=0.568, loss_ctc=2.043, acc=0.972, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.187e-04, train_time=0.091 -[v016] 2022-01-31 07:26:49,134 (trainer:653) INFO: 130epoch:train:406-432batch: iter_time=8.164e-05, forward_time=0.031, loss=1.487, loss_att=0.685, loss_ctc=2.288, acc=0.966, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.187e-04, train_time=0.089 -[v016] 2022-01-31 07:26:51,538 (trainer:653) INFO: 130epoch:train:433-459batch: iter_time=7.747e-05, forward_time=0.031, loss=1.533, loss_att=0.685, loss_ctc=2.382, acc=0.969, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.187e-04, train_time=0.089 -[v016] 2022-01-31 07:26:53,984 (trainer:653) INFO: 130epoch:train:460-486batch: iter_time=7.530e-05, forward_time=0.032, loss=1.586, loss_att=0.715, loss_ctc=2.457, acc=0.966, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.186e-04, train_time=0.090 -[v016] 2022-01-31 07:26:56,495 (trainer:653) INFO: 130epoch:train:487-513batch: iter_time=7.551e-05, forward_time=0.032, loss=1.481, loss_att=0.716, loss_ctc=2.247, acc=0.969, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.186e-04, train_time=0.093 -[v016] 2022-01-31 07:26:58,899 (trainer:653) INFO: 130epoch:train:514-540batch: iter_time=7.542e-05, forward_time=0.031, loss=1.438, loss_att=0.659, loss_ctc=2.218, acc=0.970, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.186e-04, train_time=0.089 -[v016] 2022-01-31 07:27:31,949 (trainer:328) INFO: 130epoch results: [train] iter_time=6.756e-04, forward_time=0.032, loss=1.433, loss_att=0.634, loss_ctc=2.231, acc=0.970, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.188e-04, train_time=0.092, time=50.26 seconds, total_count=71110, gpu_max_cached_mem_GB=5.824, [valid] loss=7.461, loss_att=6.065, loss_ctc=8.858, acc=0.904, cer=0.099, wer=0.397, cer_ctc=0.142, time=5.53 seconds, total_count=23140, gpu_max_cached_mem_GB=5.824, [att_plot] time=26.82 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:27:34,088 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 07:27:34,096 (trainer:261) INFO: 131/200epoch started. Estimated time to finish: 2 hours, 6 minutes and 51.73 seconds -[v016] 2022-01-31 07:27:37,323 (trainer:653) INFO: 131epoch:train:1-27batch: iter_time=0.024, forward_time=0.033, loss=1.301, loss_att=0.545, loss_ctc=2.057, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.186e-04, train_time=0.119 -[v016] 2022-01-31 07:27:39,989 (trainer:653) INFO: 131epoch:train:28-54batch: iter_time=0.003, forward_time=0.034, loss=1.494, loss_att=0.619, loss_ctc=2.370, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.186e-04, train_time=0.099 -[v016] 2022-01-31 07:27:42,521 (trainer:653) INFO: 131epoch:train:55-81batch: iter_time=8.079e-05, forward_time=0.033, loss=1.260, loss_att=0.563, loss_ctc=1.957, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.185e-04, train_time=0.094 -[v016] 2022-01-31 07:27:44,957 (trainer:653) INFO: 131epoch:train:82-108batch: iter_time=7.976e-05, forward_time=0.032, loss=1.351, loss_att=0.608, loss_ctc=2.095, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.185e-04, train_time=0.090 -[v016] 2022-01-31 07:27:47,384 (trainer:653) INFO: 131epoch:train:109-135batch: iter_time=7.927e-05, forward_time=0.031, loss=1.322, loss_att=0.633, loss_ctc=2.011, acc=0.966, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.185e-04, train_time=0.090 -[v016] 2022-01-31 07:27:49,762 (trainer:653) INFO: 131epoch:train:136-162batch: iter_time=7.712e-05, forward_time=0.031, loss=1.217, loss_att=0.569, loss_ctc=1.866, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.185e-04, train_time=0.088 -[v016] 2022-01-31 07:27:52,278 (trainer:653) INFO: 131epoch:train:163-189batch: iter_time=8.424e-05, forward_time=0.033, loss=1.595, loss_att=0.679, loss_ctc=2.510, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.184e-04, train_time=0.093 -[v016] 2022-01-31 07:27:54,742 (trainer:653) INFO: 131epoch:train:190-216batch: iter_time=7.791e-05, forward_time=0.032, loss=1.159, loss_att=0.547, loss_ctc=1.772, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.184e-04, train_time=0.091 -[v016] 2022-01-31 07:27:57,214 (trainer:653) INFO: 131epoch:train:217-243batch: iter_time=7.863e-05, forward_time=0.032, loss=1.090, loss_att=0.482, loss_ctc=1.698, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.184e-04, train_time=0.091 -[v016] 2022-01-31 07:27:59,678 (trainer:653) INFO: 131epoch:train:244-270batch: iter_time=7.776e-05, forward_time=0.031, loss=1.475, loss_att=0.689, loss_ctc=2.261, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.184e-04, train_time=0.091 -[v016] 2022-01-31 07:28:02,212 (trainer:653) INFO: 131epoch:train:271-297batch: iter_time=7.837e-05, forward_time=0.033, loss=1.795, loss_att=0.750, loss_ctc=2.840, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.183e-04, train_time=0.094 -[v016] 2022-01-31 07:28:04,685 (trainer:653) INFO: 131epoch:train:298-324batch: iter_time=7.757e-05, forward_time=0.032, loss=1.387, loss_att=0.584, loss_ctc=2.190, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.183e-04, train_time=0.091 -[v016] 2022-01-31 07:28:07,271 (trainer:653) INFO: 131epoch:train:325-351batch: iter_time=9.585e-05, forward_time=0.034, loss=1.426, loss_att=0.640, loss_ctc=2.213, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.183e-04, train_time=0.096 -[v016] 2022-01-31 07:28:10,159 (trainer:653) INFO: 131epoch:train:352-378batch: iter_time=0.012, forward_time=0.033, loss=1.629, loss_att=0.707, loss_ctc=2.551, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.183e-04, train_time=0.107 -[v016] 2022-01-31 07:28:12,674 (trainer:653) INFO: 131epoch:train:379-405batch: iter_time=8.741e-05, forward_time=0.033, loss=1.133, loss_att=0.553, loss_ctc=1.712, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.183e-04, train_time=0.093 -[v016] 2022-01-31 07:28:15,233 (trainer:653) INFO: 131epoch:train:406-432batch: iter_time=8.542e-05, forward_time=0.033, loss=1.164, loss_att=0.533, loss_ctc=1.796, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.182e-04, train_time=0.095 -[v016] 2022-01-31 07:28:17,771 (trainer:653) INFO: 131epoch:train:433-459batch: iter_time=8.369e-05, forward_time=0.033, loss=1.445, loss_att=0.584, loss_ctc=2.306, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.182e-04, train_time=0.094 -[v016] 2022-01-31 07:28:20,179 (trainer:653) INFO: 131epoch:train:460-486batch: iter_time=7.825e-05, forward_time=0.031, loss=1.350, loss_att=0.638, loss_ctc=2.063, acc=0.967, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.182e-04, train_time=0.089 -[v016] 2022-01-31 07:28:22,558 (trainer:653) INFO: 131epoch:train:487-513batch: iter_time=7.530e-05, forward_time=0.031, loss=1.378, loss_att=0.614, loss_ctc=2.143, acc=0.974, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.182e-04, train_time=0.088 -[v016] 2022-01-31 07:28:25,058 (trainer:653) INFO: 131epoch:train:514-540batch: iter_time=7.992e-05, forward_time=0.032, loss=1.701, loss_att=0.770, loss_ctc=2.631, acc=0.967, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.181e-04, train_time=0.092 -[v016] 2022-01-31 07:28:58,357 (trainer:328) INFO: 131epoch results: [train] iter_time=0.002, forward_time=0.032, loss=1.388, loss_att=0.619, loss_ctc=2.158, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.184e-04, train_time=0.094, time=51.67 seconds, total_count=71657, gpu_max_cached_mem_GB=5.824, [valid] loss=7.434, loss_att=6.022, loss_ctc=8.845, acc=0.904, cer=0.104, wer=0.402, cer_ctc=0.153, time=5.39 seconds, total_count=23318, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.2 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:29:00,451 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 07:29:00,475 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/125epoch.pth -[v016] 2022-01-31 07:29:00,475 (trainer:261) INFO: 132/200epoch started. Estimated time to finish: 2 hours, 4 minutes and 49.1 seconds -[v016] 2022-01-31 07:29:03,104 (trainer:653) INFO: 132epoch:train:1-27batch: iter_time=0.003, forward_time=0.032, loss=1.353, loss_att=0.567, loss_ctc=2.139, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.181e-04, train_time=0.097 -[v016] 2022-01-31 07:29:05,589 (trainer:653) INFO: 132epoch:train:28-54batch: iter_time=9.768e-05, forward_time=0.032, loss=1.175, loss_att=0.548, loss_ctc=1.803, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.181e-04, train_time=0.092 -[v016] 2022-01-31 07:29:08,056 (trainer:653) INFO: 132epoch:train:55-81batch: iter_time=9.767e-05, forward_time=0.032, loss=1.353, loss_att=0.626, loss_ctc=2.079, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.181e-04, train_time=0.091 -[v016] 2022-01-31 07:29:10,448 (trainer:653) INFO: 132epoch:train:82-108batch: iter_time=7.439e-05, forward_time=0.031, loss=1.274, loss_att=0.678, loss_ctc=1.870, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.181e-04, train_time=0.088 -[v016] 2022-01-31 07:29:13,024 (trainer:653) INFO: 132epoch:train:109-135batch: iter_time=8.174e-05, forward_time=0.032, loss=1.446, loss_att=0.670, loss_ctc=2.223, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.180e-04, train_time=0.095 -[v016] 2022-01-31 07:29:15,519 (trainer:653) INFO: 132epoch:train:136-162batch: iter_time=7.675e-05, forward_time=0.032, loss=1.319, loss_att=0.570, loss_ctc=2.068, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.180e-04, train_time=0.092 -[v016] 2022-01-31 07:29:17,974 (trainer:653) INFO: 132epoch:train:163-189batch: iter_time=7.832e-05, forward_time=0.032, loss=1.559, loss_att=0.611, loss_ctc=2.506, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.180e-04, train_time=0.091 -[v016] 2022-01-31 07:29:20,386 (trainer:653) INFO: 132epoch:train:190-216batch: iter_time=7.762e-05, forward_time=0.031, loss=1.482, loss_att=0.712, loss_ctc=2.251, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.180e-04, train_time=0.089 -[v016] 2022-01-31 07:29:22,900 (trainer:653) INFO: 132epoch:train:217-243batch: iter_time=7.746e-05, forward_time=0.032, loss=1.309, loss_att=0.511, loss_ctc=2.107, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.179e-04, train_time=0.093 -[v016] 2022-01-31 07:29:25,393 (trainer:653) INFO: 132epoch:train:244-270batch: iter_time=8.260e-05, forward_time=0.032, loss=1.193, loss_att=0.510, loss_ctc=1.875, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.179e-04, train_time=0.092 -[v016] 2022-01-31 07:29:27,924 (trainer:653) INFO: 132epoch:train:271-297batch: iter_time=8.256e-05, forward_time=0.033, loss=1.362, loss_att=0.604, loss_ctc=2.120, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.179e-04, train_time=0.094 -[v016] 2022-01-31 07:29:30,394 (trainer:653) INFO: 132epoch:train:298-324batch: iter_time=8.575e-05, forward_time=0.032, loss=1.365, loss_att=0.600, loss_ctc=2.129, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.179e-04, train_time=0.091 -[v016] 2022-01-31 07:29:32,831 (trainer:653) INFO: 132epoch:train:325-351batch: iter_time=7.650e-05, forward_time=0.032, loss=1.318, loss_att=0.622, loss_ctc=2.015, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.179e-04, train_time=0.090 -[v016] 2022-01-31 07:29:35,340 (trainer:653) INFO: 132epoch:train:352-378batch: iter_time=7.693e-05, forward_time=0.032, loss=1.306, loss_att=0.538, loss_ctc=2.073, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.178e-04, train_time=0.093 -[v016] 2022-01-31 07:29:37,808 (trainer:653) INFO: 132epoch:train:379-405batch: iter_time=7.897e-05, forward_time=0.032, loss=1.346, loss_att=0.728, loss_ctc=1.964, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.178e-04, train_time=0.091 -[v016] 2022-01-31 07:29:40,270 (trainer:653) INFO: 132epoch:train:406-432batch: iter_time=8.081e-05, forward_time=0.032, loss=1.421, loss_att=0.659, loss_ctc=2.183, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.178e-04, train_time=0.091 -[v016] 2022-01-31 07:29:42,986 (trainer:653) INFO: 132epoch:train:433-459batch: iter_time=0.009, forward_time=0.032, loss=1.312, loss_att=0.574, loss_ctc=2.050, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.178e-04, train_time=0.100 -[v016] 2022-01-31 07:29:45,636 (trainer:653) INFO: 132epoch:train:460-486batch: iter_time=8.293e-05, forward_time=0.035, loss=1.487, loss_att=0.593, loss_ctc=2.381, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.177e-04, train_time=0.098 -[v016] 2022-01-31 07:29:48,207 (trainer:653) INFO: 132epoch:train:487-513batch: iter_time=7.721e-05, forward_time=0.033, loss=1.642, loss_att=0.693, loss_ctc=2.592, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.177e-04, train_time=0.095 -[v016] 2022-01-31 07:29:50,656 (trainer:653) INFO: 132epoch:train:514-540batch: iter_time=7.694e-05, forward_time=0.032, loss=1.470, loss_att=0.623, loss_ctc=2.316, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.177e-04, train_time=0.090 -[v016] 2022-01-31 07:30:24,292 (trainer:328) INFO: 132epoch results: [train] iter_time=6.559e-04, forward_time=0.032, loss=1.372, loss_att=0.610, loss_ctc=2.133, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.179e-04, train_time=0.093, time=50.88 seconds, total_count=72204, gpu_max_cached_mem_GB=5.824, [valid] loss=7.221, loss_att=5.935, loss_ctc=8.507, acc=0.906, cer=0.098, wer=0.396, cer_ctc=0.141, time=5.52 seconds, total_count=23496, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.41 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:30:26,431 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 07:30:26,460 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/116epoch.pth -[v016] 2022-01-31 07:30:26,461 (trainer:261) INFO: 133/200epoch started. Estimated time to finish: 2 hours, 2 minutes and 46.87 seconds -[v016] 2022-01-31 07:30:29,092 (trainer:653) INFO: 133epoch:train:1-27batch: iter_time=0.003, forward_time=0.033, loss=1.221, loss_att=0.553, loss_ctc=1.890, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.177e-04, train_time=0.097 -[v016] 2022-01-31 07:30:31,581 (trainer:653) INFO: 133epoch:train:28-54batch: iter_time=8.314e-05, forward_time=0.032, loss=1.282, loss_att=0.500, loss_ctc=2.064, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.177e-04, train_time=0.092 -[v016] 2022-01-31 07:30:34,104 (trainer:653) INFO: 133epoch:train:55-81batch: iter_time=8.701e-05, forward_time=0.033, loss=1.659, loss_att=0.694, loss_ctc=2.625, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.176e-04, train_time=0.093 -[v016] 2022-01-31 07:30:36,566 (trainer:653) INFO: 133epoch:train:82-108batch: iter_time=8.548e-05, forward_time=0.031, loss=1.163, loss_att=0.531, loss_ctc=1.795, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.176e-04, train_time=0.091 -[v016] 2022-01-31 07:30:39,276 (trainer:653) INFO: 133epoch:train:109-135batch: iter_time=1.069e-04, forward_time=0.035, loss=1.420, loss_att=0.544, loss_ctc=2.296, acc=0.975, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.176e-04, train_time=0.100 -[v016] 2022-01-31 07:30:41,937 (trainer:653) INFO: 133epoch:train:136-162batch: iter_time=9.082e-05, forward_time=0.034, loss=1.551, loss_att=0.661, loss_ctc=2.440, acc=0.973, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.176e-04, train_time=0.098 -[v016] 2022-01-31 07:30:44,650 (trainer:653) INFO: 133epoch:train:163-189batch: iter_time=0.002, forward_time=0.034, loss=1.295, loss_att=0.535, loss_ctc=2.055, acc=0.977, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.175e-04, train_time=0.100 -[v016] 2022-01-31 07:30:47,143 (trainer:653) INFO: 133epoch:train:190-216batch: iter_time=8.853e-05, forward_time=0.032, loss=1.596, loss_att=0.736, loss_ctc=2.455, acc=0.964, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.175e-04, train_time=0.092 -[v016] 2022-01-31 07:30:49,704 (trainer:653) INFO: 133epoch:train:217-243batch: iter_time=1.122e-04, forward_time=0.033, loss=1.233, loss_att=0.509, loss_ctc=1.957, acc=0.975, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.175e-04, train_time=0.095 -[v016] 2022-01-31 07:30:52,223 (trainer:653) INFO: 133epoch:train:244-270batch: iter_time=8.845e-05, forward_time=0.032, loss=1.373, loss_att=0.600, loss_ctc=2.146, acc=0.977, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.175e-04, train_time=0.093 -[v016] 2022-01-31 07:30:54,825 (trainer:653) INFO: 133epoch:train:271-297batch: iter_time=9.527e-05, forward_time=0.033, loss=1.415, loss_att=0.592, loss_ctc=2.237, acc=0.975, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.175e-04, train_time=0.096 -[v016] 2022-01-31 07:30:57,287 (trainer:653) INFO: 133epoch:train:298-324batch: iter_time=8.047e-05, forward_time=0.032, loss=1.416, loss_att=0.687, loss_ctc=2.146, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.174e-04, train_time=0.091 -[v016] 2022-01-31 07:30:59,788 (trainer:653) INFO: 133epoch:train:325-351batch: iter_time=9.354e-05, forward_time=0.032, loss=1.386, loss_att=0.638, loss_ctc=2.135, acc=0.971, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.174e-04, train_time=0.092 -[v016] 2022-01-31 07:31:02,362 (trainer:653) INFO: 133epoch:train:352-378batch: iter_time=1.163e-04, forward_time=0.034, loss=1.557, loss_att=0.679, loss_ctc=2.434, acc=0.970, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.174e-04, train_time=0.095 -[v016] 2022-01-31 07:31:04,827 (trainer:653) INFO: 133epoch:train:379-405batch: iter_time=9.156e-05, forward_time=0.031, loss=1.410, loss_att=0.721, loss_ctc=2.098, acc=0.968, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.174e-04, train_time=0.091 -[v016] 2022-01-31 07:31:07,918 (trainer:653) INFO: 133epoch:train:406-432batch: iter_time=0.020, forward_time=0.033, loss=1.359, loss_att=0.611, loss_ctc=2.108, acc=0.972, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.173e-04, train_time=0.114 -[v016] 2022-01-31 07:31:10,369 (trainer:653) INFO: 133epoch:train:433-459batch: iter_time=8.882e-05, forward_time=0.031, loss=1.245, loss_att=0.619, loss_ctc=1.871, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.173e-04, train_time=0.091 -[v016] 2022-01-31 07:31:12,842 (trainer:653) INFO: 133epoch:train:460-486batch: iter_time=8.791e-05, forward_time=0.032, loss=1.232, loss_att=0.657, loss_ctc=1.807, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.173e-04, train_time=0.091 -[v016] 2022-01-31 07:31:15,359 (trainer:653) INFO: 133epoch:train:487-513batch: iter_time=9.094e-05, forward_time=0.032, loss=1.566, loss_att=0.707, loss_ctc=2.425, acc=0.970, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.173e-04, train_time=0.093 -[v016] 2022-01-31 07:31:17,946 (trainer:653) INFO: 133epoch:train:514-540batch: iter_time=1.006e-04, forward_time=0.033, loss=1.501, loss_att=0.681, loss_ctc=2.321, acc=0.971, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.173e-04, train_time=0.096 -[v016] 2022-01-31 07:31:52,268 (trainer:328) INFO: 133epoch results: [train] iter_time=0.001, forward_time=0.033, loss=1.396, loss_att=0.623, loss_ctc=2.170, acc=0.972, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.175e-04, train_time=0.095, time=52.3 seconds, total_count=72751, gpu_max_cached_mem_GB=5.824, [valid] loss=7.627, loss_att=6.209, loss_ctc=9.044, acc=0.904, cer=0.103, wer=0.401, cer_ctc=0.151, time=5.56 seconds, total_count=23674, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.94 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:31:54,271 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 07:31:54,280 (trainer:261) INFO: 134/200epoch started. Estimated time to finish: 2 hours and 46.36 seconds -[v016] 2022-01-31 07:31:56,919 (trainer:653) INFO: 134epoch:train:1-27batch: iter_time=0.003, forward_time=0.032, loss=1.454, loss_att=0.628, loss_ctc=2.279, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.172e-04, train_time=0.097 -[v016] 2022-01-31 07:31:59,403 (trainer:653) INFO: 134epoch:train:28-54batch: iter_time=7.972e-05, forward_time=0.031, loss=1.329, loss_att=0.542, loss_ctc=2.115, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.172e-04, train_time=0.092 -[v016] 2022-01-31 07:32:01,824 (trainer:653) INFO: 134epoch:train:55-81batch: iter_time=7.185e-05, forward_time=0.030, loss=1.234, loss_att=0.581, loss_ctc=1.887, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.172e-04, train_time=0.089 -[v016] 2022-01-31 07:32:04,268 (trainer:653) INFO: 134epoch:train:82-108batch: iter_time=7.605e-05, forward_time=0.031, loss=1.276, loss_att=0.628, loss_ctc=1.923, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.172e-04, train_time=0.090 -[v016] 2022-01-31 07:32:06,794 (trainer:653) INFO: 134epoch:train:109-135batch: iter_time=7.632e-05, forward_time=0.032, loss=1.445, loss_att=0.634, loss_ctc=2.257, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.171e-04, train_time=0.093 -[v016] 2022-01-31 07:32:09,196 (trainer:653) INFO: 134epoch:train:136-162batch: iter_time=7.674e-05, forward_time=0.030, loss=1.301, loss_att=0.600, loss_ctc=2.003, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.171e-04, train_time=0.089 -[v016] 2022-01-31 07:32:11,669 (trainer:653) INFO: 134epoch:train:163-189batch: iter_time=9.112e-05, forward_time=0.032, loss=1.408, loss_att=0.604, loss_ctc=2.211, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.171e-04, train_time=0.091 -[v016] 2022-01-31 07:32:14,111 (trainer:653) INFO: 134epoch:train:190-216batch: iter_time=7.589e-05, forward_time=0.031, loss=1.439, loss_att=0.628, loss_ctc=2.251, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.171e-04, train_time=0.090 -[v016] 2022-01-31 07:32:16,500 (trainer:653) INFO: 134epoch:train:217-243batch: iter_time=7.548e-05, forward_time=0.030, loss=1.155, loss_att=0.508, loss_ctc=1.801, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.171e-04, train_time=0.088 -[v016] 2022-01-31 07:32:19,163 (trainer:653) INFO: 134epoch:train:244-270batch: iter_time=0.009, forward_time=0.030, loss=1.254, loss_att=0.514, loss_ctc=1.995, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.170e-04, train_time=0.098 -[v016] 2022-01-31 07:32:21,559 (trainer:653) INFO: 134epoch:train:271-297batch: iter_time=7.866e-05, forward_time=0.031, loss=1.352, loss_att=0.625, loss_ctc=2.080, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.170e-04, train_time=0.089 -[v016] 2022-01-31 07:32:24,039 (trainer:653) INFO: 134epoch:train:298-324batch: iter_time=7.685e-05, forward_time=0.031, loss=1.328, loss_att=0.594, loss_ctc=2.062, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.170e-04, train_time=0.092 -[v016] 2022-01-31 07:32:26,507 (trainer:653) INFO: 134epoch:train:325-351batch: iter_time=8.353e-05, forward_time=0.032, loss=1.283, loss_att=0.613, loss_ctc=1.953, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.170e-04, train_time=0.091 -[v016] 2022-01-31 07:32:29,002 (trainer:653) INFO: 134epoch:train:352-378batch: iter_time=8.552e-05, forward_time=0.032, loss=1.466, loss_att=0.667, loss_ctc=2.265, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.169e-04, train_time=0.092 -[v016] 2022-01-31 07:32:31,435 (trainer:653) INFO: 134epoch:train:379-405batch: iter_time=8.288e-05, forward_time=0.031, loss=1.162, loss_att=0.644, loss_ctc=1.679, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.169e-04, train_time=0.090 -[v016] 2022-01-31 07:32:33,971 (trainer:653) INFO: 134epoch:train:406-432batch: iter_time=8.225e-05, forward_time=0.033, loss=1.444, loss_att=0.637, loss_ctc=2.252, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.169e-04, train_time=0.094 -[v016] 2022-01-31 07:32:36,481 (trainer:653) INFO: 134epoch:train:433-459batch: iter_time=7.632e-05, forward_time=0.032, loss=1.498, loss_att=0.683, loss_ctc=2.314, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.169e-04, train_time=0.093 -[v016] 2022-01-31 07:32:39,017 (trainer:653) INFO: 134epoch:train:460-486batch: iter_time=8.478e-05, forward_time=0.033, loss=1.485, loss_att=0.673, loss_ctc=2.297, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.169e-04, train_time=0.094 -[v016] 2022-01-31 07:32:41,535 (trainer:653) INFO: 134epoch:train:487-513batch: iter_time=8.140e-05, forward_time=0.032, loss=1.385, loss_att=0.618, loss_ctc=2.152, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.168e-04, train_time=0.093 -[v016] 2022-01-31 07:32:44,112 (trainer:653) INFO: 134epoch:train:514-540batch: iter_time=8.517e-05, forward_time=0.033, loss=1.261, loss_att=0.555, loss_ctc=1.966, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.168e-04, train_time=0.095 -[v016] 2022-01-31 07:33:18,883 (trainer:328) INFO: 134epoch results: [train] iter_time=7.129e-04, forward_time=0.031, loss=1.347, loss_att=0.609, loss_ctc=2.085, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.170e-04, train_time=0.092, time=50.58 seconds, total_count=73298, gpu_max_cached_mem_GB=5.824, [valid] loss=7.655, loss_att=6.183, loss_ctc=9.127, acc=0.903, cer=0.102, wer=0.400, cer_ctc=0.149, time=6.4 seconds, total_count=23852, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.61 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:33:21,190 (trainer:375) INFO: The best model has been updated: train.loss -[v016] 2022-01-31 07:33:21,218 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/130epoch.pth -[v016] 2022-01-31 07:33:21,218 (trainer:261) INFO: 135/200epoch started. Estimated time to finish: 1 hour, 58 minutes and 45.93 seconds -[v016] 2022-01-31 07:33:23,869 (trainer:653) INFO: 135epoch:train:1-27batch: iter_time=0.005, forward_time=0.032, loss=1.196, loss_att=0.573, loss_ctc=1.818, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.168e-04, train_time=0.098 -[v016] 2022-01-31 07:33:26,393 (trainer:653) INFO: 135epoch:train:28-54batch: iter_time=8.321e-05, forward_time=0.032, loss=1.321, loss_att=0.541, loss_ctc=2.100, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.168e-04, train_time=0.093 -[v016] 2022-01-31 07:33:28,886 (trainer:653) INFO: 135epoch:train:55-81batch: iter_time=8.101e-05, forward_time=0.032, loss=1.325, loss_att=0.582, loss_ctc=2.068, acc=0.966, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.167e-04, train_time=0.092 -[v016] 2022-01-31 07:33:31,395 (trainer:653) INFO: 135epoch:train:82-108batch: iter_time=8.204e-05, forward_time=0.032, loss=1.417, loss_att=0.623, loss_ctc=2.212, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.167e-04, train_time=0.093 -[v016] 2022-01-31 07:33:33,837 (trainer:653) INFO: 135epoch:train:109-135batch: iter_time=7.732e-05, forward_time=0.031, loss=1.381, loss_att=0.633, loss_ctc=2.130, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.167e-04, train_time=0.090 -[v016] 2022-01-31 07:33:36,387 (trainer:653) INFO: 135epoch:train:136-162batch: iter_time=7.562e-05, forward_time=0.032, loss=1.517, loss_att=0.663, loss_ctc=2.371, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.167e-04, train_time=0.094 -[v016] 2022-01-31 07:33:38,830 (trainer:653) INFO: 135epoch:train:163-189batch: iter_time=7.718e-05, forward_time=0.032, loss=1.313, loss_att=0.604, loss_ctc=2.021, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.167e-04, train_time=0.090 -[v016] 2022-01-31 07:33:41,267 (trainer:653) INFO: 135epoch:train:190-216batch: iter_time=7.493e-05, forward_time=0.032, loss=1.326, loss_att=0.609, loss_ctc=2.043, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.166e-04, train_time=0.090 -[v016] 2022-01-31 07:33:43,846 (trainer:653) INFO: 135epoch:train:217-243batch: iter_time=7.603e-05, forward_time=0.034, loss=1.414, loss_att=0.578, loss_ctc=2.250, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.166e-04, train_time=0.095 -[v016] 2022-01-31 07:33:46,369 (trainer:653) INFO: 135epoch:train:244-270batch: iter_time=7.607e-05, forward_time=0.032, loss=1.353, loss_att=0.581, loss_ctc=2.124, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.166e-04, train_time=0.093 -[v016] 2022-01-31 07:33:48,886 (trainer:653) INFO: 135epoch:train:271-297batch: iter_time=8.499e-05, forward_time=0.033, loss=1.331, loss_att=0.643, loss_ctc=2.018, acc=0.965, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.166e-04, train_time=0.093 -[v016] 2022-01-31 07:33:51,412 (trainer:653) INFO: 135epoch:train:298-324batch: iter_time=7.907e-05, forward_time=0.032, loss=1.385, loss_att=0.531, loss_ctc=2.239, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.166e-04, train_time=0.093 -[v016] 2022-01-31 07:33:54,202 (trainer:653) INFO: 135epoch:train:325-351batch: iter_time=0.013, forward_time=0.031, loss=1.384, loss_att=0.683, loss_ctc=2.084, acc=0.966, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.165e-04, train_time=0.103 -[v016] 2022-01-31 07:33:56,655 (trainer:653) INFO: 135epoch:train:352-378batch: iter_time=7.661e-05, forward_time=0.031, loss=1.251, loss_att=0.657, loss_ctc=1.845, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.165e-04, train_time=0.091 -[v016] 2022-01-31 07:33:59,121 (trainer:653) INFO: 135epoch:train:379-405batch: iter_time=7.770e-05, forward_time=0.031, loss=1.313, loss_att=0.639, loss_ctc=1.987, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.165e-04, train_time=0.091 -[v016] 2022-01-31 07:34:01,579 (trainer:653) INFO: 135epoch:train:406-432batch: iter_time=7.728e-05, forward_time=0.031, loss=1.172, loss_att=0.529, loss_ctc=1.815, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.165e-04, train_time=0.091 -[v016] 2022-01-31 07:34:04,109 (trainer:653) INFO: 135epoch:train:433-459batch: iter_time=8.750e-05, forward_time=0.033, loss=1.345, loss_att=0.609, loss_ctc=2.082, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.164e-04, train_time=0.094 -[v016] 2022-01-31 07:34:06,592 (trainer:653) INFO: 135epoch:train:460-486batch: iter_time=8.037e-05, forward_time=0.032, loss=1.378, loss_att=0.606, loss_ctc=2.150, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.164e-04, train_time=0.092 -[v016] 2022-01-31 07:34:09,098 (trainer:653) INFO: 135epoch:train:487-513batch: iter_time=7.786e-05, forward_time=0.032, loss=1.424, loss_att=0.652, loss_ctc=2.195, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.164e-04, train_time=0.093 -[v016] 2022-01-31 07:34:11,596 (trainer:653) INFO: 135epoch:train:514-540batch: iter_time=8.535e-05, forward_time=0.032, loss=1.258, loss_att=0.548, loss_ctc=1.967, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.164e-04, train_time=0.092 -[v016] 2022-01-31 07:34:46,609 (trainer:328) INFO: 135epoch results: [train] iter_time=9.470e-04, forward_time=0.032, loss=1.341, loss_att=0.606, loss_ctc=2.076, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.166e-04, train_time=0.093, time=51.09 seconds, total_count=73845, gpu_max_cached_mem_GB=5.824, [valid] loss=7.527, loss_att=6.199, loss_ctc=8.855, acc=0.904, cer=0.102, wer=0.400, cer_ctc=0.145, time=5.48 seconds, total_count=24030, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.83 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:34:48,838 (trainer:375) INFO: The best model has been updated: train.loss -[v016] 2022-01-31 07:34:48,885 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/127epoch.pth, exp/asr_train_asr_raw_en_word/129epoch.pth -[v016] 2022-01-31 07:34:48,885 (trainer:261) INFO: 136/200epoch started. Estimated time to finish: 1 hour, 56 minutes and 46.48 seconds -[v016] 2022-01-31 07:34:51,681 (trainer:653) INFO: 136epoch:train:1-27batch: iter_time=0.004, forward_time=0.034, loss=1.283, loss_att=0.578, loss_ctc=1.988, acc=0.971, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.164e-04, train_time=0.103 -[v016] 2022-01-31 07:34:54,384 (trainer:653) INFO: 136epoch:train:28-54batch: iter_time=1.151e-04, forward_time=0.034, loss=1.339, loss_att=0.634, loss_ctc=2.043, acc=0.968, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.163e-04, train_time=0.100 -[v016] 2022-01-31 07:34:57,002 (trainer:653) INFO: 136epoch:train:55-81batch: iter_time=0.001, forward_time=0.033, loss=1.148, loss_att=0.531, loss_ctc=1.764, acc=0.973, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.163e-04, train_time=0.097 -[v016] 2022-01-31 07:34:59,773 (trainer:653) INFO: 136epoch:train:82-108batch: iter_time=1.060e-04, forward_time=0.035, loss=1.503, loss_att=0.609, loss_ctc=2.396, acc=0.975, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.163e-04, train_time=0.102 -[v016] 2022-01-31 07:35:02,467 (trainer:653) INFO: 136epoch:train:109-135batch: iter_time=1.021e-04, forward_time=0.034, loss=1.632, loss_att=0.667, loss_ctc=2.596, acc=0.970, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.163e-04, train_time=0.100 -[v016] 2022-01-31 07:35:05,081 (trainer:653) INFO: 136epoch:train:136-162batch: iter_time=1.060e-04, forward_time=0.034, loss=1.397, loss_att=0.575, loss_ctc=2.219, acc=0.976, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.163e-04, train_time=0.097 -[v016] 2022-01-31 07:35:07,475 (trainer:653) INFO: 136epoch:train:163-189batch: iter_time=7.461e-05, forward_time=0.031, loss=1.261, loss_att=0.519, loss_ctc=2.002, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.162e-04, train_time=0.088 -[v016] 2022-01-31 07:35:10,038 (trainer:653) INFO: 136epoch:train:190-216batch: iter_time=9.372e-05, forward_time=0.033, loss=1.211, loss_att=0.601, loss_ctc=1.820, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.162e-04, train_time=0.095 -[v016] 2022-01-31 07:35:12,562 (trainer:653) INFO: 136epoch:train:217-243batch: iter_time=9.110e-05, forward_time=0.033, loss=1.261, loss_att=0.576, loss_ctc=1.947, acc=0.973, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.162e-04, train_time=0.093 -[v016] 2022-01-31 07:35:15,292 (trainer:653) INFO: 136epoch:train:244-270batch: iter_time=1.072e-04, forward_time=0.035, loss=1.107, loss_att=0.506, loss_ctc=1.709, acc=0.976, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.162e-04, train_time=0.101 -[v016] 2022-01-31 07:35:17,933 (trainer:653) INFO: 136epoch:train:271-297batch: iter_time=1.055e-04, forward_time=0.034, loss=1.206, loss_att=0.568, loss_ctc=1.844, acc=0.975, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.161e-04, train_time=0.098 -[v016] 2022-01-31 07:35:20,630 (trainer:653) INFO: 136epoch:train:298-324batch: iter_time=1.081e-04, forward_time=0.035, loss=1.434, loss_att=0.568, loss_ctc=2.300, acc=0.973, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.161e-04, train_time=0.100 -[v016] 2022-01-31 07:35:23,252 (trainer:653) INFO: 136epoch:train:325-351batch: iter_time=1.098e-04, forward_time=0.034, loss=1.392, loss_att=0.609, loss_ctc=2.176, acc=0.971, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.161e-04, train_time=0.097 -[v016] 2022-01-31 07:35:25,909 (trainer:653) INFO: 136epoch:train:352-378batch: iter_time=9.388e-05, forward_time=0.034, loss=1.275, loss_att=0.585, loss_ctc=1.965, acc=0.974, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.161e-04, train_time=0.098 -[v016] 2022-01-31 07:35:28,813 (trainer:653) INFO: 136epoch:train:379-405batch: iter_time=0.013, forward_time=0.033, loss=1.062, loss_att=0.474, loss_ctc=1.650, acc=0.981, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.161e-04, train_time=0.107 -[v016] 2022-01-31 07:35:31,376 (trainer:653) INFO: 136epoch:train:406-432batch: iter_time=1.259e-04, forward_time=0.033, loss=1.429, loss_att=0.731, loss_ctc=2.128, acc=0.966, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.160e-04, train_time=0.095 -[v016] 2022-01-31 07:35:34,044 (trainer:653) INFO: 136epoch:train:433-459batch: iter_time=9.784e-05, forward_time=0.034, loss=1.353, loss_att=0.666, loss_ctc=2.040, acc=0.967, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.160e-04, train_time=0.099 -[v016] 2022-01-31 07:35:36,722 (trainer:653) INFO: 136epoch:train:460-486batch: iter_time=9.966e-05, forward_time=0.035, loss=1.214, loss_att=0.501, loss_ctc=1.927, acc=0.976, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.160e-04, train_time=0.099 -[v016] 2022-01-31 07:35:39,329 (trainer:653) INFO: 136epoch:train:487-513batch: iter_time=9.377e-05, forward_time=0.033, loss=1.326, loss_att=0.647, loss_ctc=2.005, acc=0.968, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.160e-04, train_time=0.096 -[v016] 2022-01-31 07:35:41,976 (trainer:653) INFO: 136epoch:train:514-540batch: iter_time=1.056e-04, forward_time=0.034, loss=1.338, loss_att=0.632, loss_ctc=2.044, acc=0.971, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.160e-04, train_time=0.098 -[v016] 2022-01-31 07:36:15,937 (trainer:328) INFO: 136epoch results: [train] iter_time=9.617e-04, forward_time=0.034, loss=1.308, loss_att=0.588, loss_ctc=2.029, acc=0.973, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.162e-04, train_time=0.098, time=53.87 seconds, total_count=74392, gpu_max_cached_mem_GB=5.824, [valid] loss=7.483, loss_att=6.068, loss_ctc=8.899, acc=0.905, cer=0.099, wer=0.396, cer_ctc=0.146, time=5.5 seconds, total_count=24208, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.68 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:36:17,963 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 07:36:17,974 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/92epoch.pth -[v016] 2022-01-31 07:36:17,974 (trainer:261) INFO: 137/200epoch started. Estimated time to finish: 1 hour, 54 minutes and 48.37 seconds -[v016] 2022-01-31 07:36:20,736 (trainer:653) INFO: 137epoch:train:1-27batch: iter_time=0.003, forward_time=0.035, loss=1.160, loss_att=0.437, loss_ctc=1.883, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.159e-04, train_time=0.102 -[v016] 2022-01-31 07:36:23,263 (trainer:653) INFO: 137epoch:train:28-54batch: iter_time=8.140e-05, forward_time=0.033, loss=1.278, loss_att=0.598, loss_ctc=1.958, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.159e-04, train_time=0.093 -[v016] 2022-01-31 07:36:25,740 (trainer:653) INFO: 137epoch:train:55-81batch: iter_time=7.775e-05, forward_time=0.032, loss=1.117, loss_att=0.447, loss_ctc=1.788, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.159e-04, train_time=0.092 -[v016] 2022-01-31 07:36:28,269 (trainer:653) INFO: 137epoch:train:82-108batch: iter_time=8.496e-05, forward_time=0.033, loss=1.302, loss_att=0.595, loss_ctc=2.009, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.159e-04, train_time=0.093 -[v016] 2022-01-31 07:36:31,108 (trainer:653) INFO: 137epoch:train:109-135batch: iter_time=0.014, forward_time=0.031, loss=1.146, loss_att=0.491, loss_ctc=1.800, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.158e-04, train_time=0.105 -[v016] 2022-01-31 07:36:33,620 (trainer:653) INFO: 137epoch:train:136-162batch: iter_time=7.661e-05, forward_time=0.033, loss=1.525, loss_att=0.742, loss_ctc=2.308, acc=0.961, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.158e-04, train_time=0.093 -[v016] 2022-01-31 07:36:36,123 (trainer:653) INFO: 137epoch:train:163-189batch: iter_time=9.843e-05, forward_time=0.033, loss=1.065, loss_att=0.498, loss_ctc=1.633, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.158e-04, train_time=0.093 -[v016] 2022-01-31 07:36:38,569 (trainer:653) INFO: 137epoch:train:190-216batch: iter_time=8.262e-05, forward_time=0.032, loss=1.364, loss_att=0.602, loss_ctc=2.126, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.158e-04, train_time=0.090 -[v016] 2022-01-31 07:36:41,119 (trainer:653) INFO: 137epoch:train:217-243batch: iter_time=8.069e-05, forward_time=0.033, loss=1.655, loss_att=0.703, loss_ctc=2.607, acc=0.963, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.158e-04, train_time=0.094 -[v016] 2022-01-31 07:36:43,622 (trainer:653) INFO: 137epoch:train:244-270batch: iter_time=8.093e-05, forward_time=0.032, loss=1.203, loss_att=0.534, loss_ctc=1.873, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.157e-04, train_time=0.092 -[v016] 2022-01-31 07:36:46,064 (trainer:653) INFO: 137epoch:train:271-297batch: iter_time=7.780e-05, forward_time=0.032, loss=1.309, loss_att=0.560, loss_ctc=2.057, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.157e-04, train_time=0.090 -[v016] 2022-01-31 07:36:48,586 (trainer:653) INFO: 137epoch:train:298-324batch: iter_time=8.468e-05, forward_time=0.033, loss=1.253, loss_att=0.615, loss_ctc=1.892, acc=0.966, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.157e-04, train_time=0.093 -[v016] 2022-01-31 07:36:51,111 (trainer:653) INFO: 137epoch:train:325-351batch: iter_time=9.220e-05, forward_time=0.033, loss=1.242, loss_att=0.605, loss_ctc=1.879, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.157e-04, train_time=0.093 -[v016] 2022-01-31 07:36:53,610 (trainer:653) INFO: 137epoch:train:352-378batch: iter_time=8.042e-05, forward_time=0.032, loss=1.671, loss_att=0.798, loss_ctc=2.543, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.157e-04, train_time=0.092 -[v016] 2022-01-31 07:36:56,118 (trainer:653) INFO: 137epoch:train:379-405batch: iter_time=7.707e-05, forward_time=0.032, loss=1.291, loss_att=0.532, loss_ctc=2.050, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.156e-04, train_time=0.093 -[v016] 2022-01-31 07:36:58,664 (trainer:653) INFO: 137epoch:train:406-432batch: iter_time=8.139e-05, forward_time=0.033, loss=1.299, loss_att=0.539, loss_ctc=2.059, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.156e-04, train_time=0.094 -[v016] 2022-01-31 07:37:01,551 (trainer:653) INFO: 137epoch:train:433-459batch: iter_time=0.013, forward_time=0.033, loss=1.219, loss_att=0.544, loss_ctc=1.895, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.156e-04, train_time=0.107 -[v016] 2022-01-31 07:37:04,002 (trainer:653) INFO: 137epoch:train:460-486batch: iter_time=7.751e-05, forward_time=0.032, loss=1.331, loss_att=0.630, loss_ctc=2.032, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.156e-04, train_time=0.091 -[v016] 2022-01-31 07:37:06,506 (trainer:653) INFO: 137epoch:train:487-513batch: iter_time=7.965e-05, forward_time=0.033, loss=1.298, loss_att=0.590, loss_ctc=2.005, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.156e-04, train_time=0.093 -[v016] 2022-01-31 07:37:09,006 (trainer:653) INFO: 137epoch:train:514-540batch: iter_time=7.906e-05, forward_time=0.033, loss=1.307, loss_att=0.669, loss_ctc=1.946, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.155e-04, train_time=0.092 -[v016] 2022-01-31 07:37:43,230 (trainer:328) INFO: 137epoch results: [train] iter_time=0.002, forward_time=0.033, loss=1.299, loss_att=0.584, loss_ctc=2.014, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.157e-04, train_time=0.094, time=51.72 seconds, total_count=74939, gpu_max_cached_mem_GB=5.824, [valid] loss=7.544, loss_att=6.138, loss_ctc=8.949, acc=0.907, cer=0.099, wer=0.393, cer_ctc=0.145, time=5.6 seconds, total_count=24386, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.93 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:37:45,507 (trainer:375) INFO: The best model has been updated: train.loss -[v016] 2022-01-31 07:37:45,534 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/128epoch.pth -[v016] 2022-01-31 07:37:45,534 (trainer:261) INFO: 138/200epoch started. Estimated time to finish: 1 hour, 52 minutes and 49.93 seconds -[v016] 2022-01-31 07:37:48,290 (trainer:653) INFO: 138epoch:train:1-27batch: iter_time=0.003, forward_time=0.034, loss=1.385, loss_att=0.573, loss_ctc=2.197, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.155e-04, train_time=0.102 -[v016] 2022-01-31 07:37:50,732 (trainer:653) INFO: 138epoch:train:28-54batch: iter_time=8.061e-05, forward_time=0.032, loss=1.111, loss_att=0.553, loss_ctc=1.669, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.155e-04, train_time=0.090 -[v016] 2022-01-31 07:37:53,220 (trainer:653) INFO: 138epoch:train:55-81batch: iter_time=7.942e-05, forward_time=0.032, loss=1.304, loss_att=0.512, loss_ctc=2.096, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.155e-04, train_time=0.092 -[v016] 2022-01-31 07:37:55,769 (trainer:653) INFO: 138epoch:train:82-108batch: iter_time=8.484e-05, forward_time=0.033, loss=1.267, loss_att=0.508, loss_ctc=2.026, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.154e-04, train_time=0.094 -[v016] 2022-01-31 07:37:58,341 (trainer:653) INFO: 138epoch:train:109-135batch: iter_time=7.657e-05, forward_time=0.033, loss=1.396, loss_att=0.503, loss_ctc=2.288, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.154e-04, train_time=0.095 -[v016] 2022-01-31 07:38:00,878 (trainer:653) INFO: 138epoch:train:136-162batch: iter_time=7.702e-05, forward_time=0.033, loss=1.298, loss_att=0.516, loss_ctc=2.081, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.154e-04, train_time=0.094 -[v016] 2022-01-31 07:38:03,585 (trainer:653) INFO: 138epoch:train:163-189batch: iter_time=0.008, forward_time=0.033, loss=1.260, loss_att=0.509, loss_ctc=2.010, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.154e-04, train_time=0.100 -[v016] 2022-01-31 07:38:06,008 (trainer:653) INFO: 138epoch:train:190-216batch: iter_time=8.522e-05, forward_time=0.031, loss=1.205, loss_att=0.574, loss_ctc=1.836, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.154e-04, train_time=0.090 -[v016] 2022-01-31 07:38:08,534 (trainer:653) INFO: 138epoch:train:217-243batch: iter_time=8.600e-05, forward_time=0.033, loss=1.266, loss_att=0.576, loss_ctc=1.957, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.153e-04, train_time=0.093 -[v016] 2022-01-31 07:38:11,198 (trainer:653) INFO: 138epoch:train:244-270batch: iter_time=9.051e-05, forward_time=0.035, loss=1.521, loss_att=0.636, loss_ctc=2.406, acc=0.974, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.153e-04, train_time=0.098 -[v016] 2022-01-31 07:38:13,725 (trainer:653) INFO: 138epoch:train:271-297batch: iter_time=8.406e-05, forward_time=0.033, loss=1.229, loss_att=0.545, loss_ctc=1.912, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.153e-04, train_time=0.093 -[v016] 2022-01-31 07:38:16,217 (trainer:653) INFO: 138epoch:train:298-324batch: iter_time=8.031e-05, forward_time=0.032, loss=1.286, loss_att=0.591, loss_ctc=1.981, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.153e-04, train_time=0.092 -[v016] 2022-01-31 07:38:18,657 (trainer:653) INFO: 138epoch:train:325-351batch: iter_time=7.853e-05, forward_time=0.031, loss=1.310, loss_att=0.637, loss_ctc=1.982, acc=0.966, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.153e-04, train_time=0.090 -[v016] 2022-01-31 07:38:21,022 (trainer:653) INFO: 138epoch:train:352-378batch: iter_time=7.636e-05, forward_time=0.031, loss=1.155, loss_att=0.578, loss_ctc=1.732, acc=0.967, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.152e-04, train_time=0.087 -[v016] 2022-01-31 07:38:23,514 (trainer:653) INFO: 138epoch:train:379-405batch: iter_time=7.495e-05, forward_time=0.032, loss=1.162, loss_att=0.510, loss_ctc=1.815, acc=0.976, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.152e-04, train_time=0.092 -[v016] 2022-01-31 07:38:25,923 (trainer:653) INFO: 138epoch:train:406-432batch: iter_time=7.372e-05, forward_time=0.031, loss=1.223, loss_att=0.501, loss_ctc=1.945, acc=0.974, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.152e-04, train_time=0.089 -[v016] 2022-01-31 07:38:28,401 (trainer:653) INFO: 138epoch:train:433-459batch: iter_time=8.183e-05, forward_time=0.032, loss=1.240, loss_att=0.543, loss_ctc=1.936, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.152e-04, train_time=0.092 -[v016] 2022-01-31 07:38:30,894 (trainer:653) INFO: 138epoch:train:460-486batch: iter_time=7.465e-05, forward_time=0.032, loss=1.481, loss_att=0.630, loss_ctc=2.332, acc=0.971, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.152e-04, train_time=0.092 -[v016] 2022-01-31 07:38:33,292 (trainer:653) INFO: 138epoch:train:487-513batch: iter_time=7.411e-05, forward_time=0.031, loss=1.239, loss_att=0.586, loss_ctc=1.892, acc=0.972, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.151e-04, train_time=0.089 -[v016] 2022-01-31 07:38:35,676 (trainer:653) INFO: 138epoch:train:514-540batch: iter_time=4.656e-04, forward_time=0.031, loss=1.309, loss_att=0.656, loss_ctc=1.961, acc=0.969, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.151e-04, train_time=0.088 -[v016] 2022-01-31 07:39:09,426 (trainer:328) INFO: 138epoch results: [train] iter_time=6.259e-04, forward_time=0.032, loss=1.282, loss_att=0.562, loss_ctc=2.001, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.153e-04, train_time=0.093, time=50.87 seconds, total_count=75486, gpu_max_cached_mem_GB=5.824, [valid] loss=7.524, loss_att=6.159, loss_ctc=8.888, acc=0.904, cer=0.102, wer=0.409, cer_ctc=0.145, time=5.48 seconds, total_count=24564, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.54 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:39:11,498 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 07:39:11,525 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/131epoch.pth -[v016] 2022-01-31 07:39:11,526 (trainer:261) INFO: 139/200epoch started. Estimated time to finish: 1 hour, 50 minutes and 51.2 seconds -[v016] 2022-01-31 07:39:14,164 (trainer:653) INFO: 139epoch:train:1-27batch: iter_time=0.003, forward_time=0.033, loss=1.386, loss_att=0.631, loss_ctc=2.142, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.151e-04, train_time=0.097 -[v016] 2022-01-31 07:39:16,634 (trainer:653) INFO: 139epoch:train:28-54batch: iter_time=1.032e-04, forward_time=0.032, loss=1.224, loss_att=0.536, loss_ctc=1.912, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.151e-04, train_time=0.091 -[v016] 2022-01-31 07:39:19,140 (trainer:653) INFO: 139epoch:train:55-81batch: iter_time=7.579e-05, forward_time=0.032, loss=1.408, loss_att=0.674, loss_ctc=2.141, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.150e-04, train_time=0.093 -[v016] 2022-01-31 07:39:21,568 (trainer:653) INFO: 139epoch:train:82-108batch: iter_time=7.491e-05, forward_time=0.031, loss=1.145, loss_att=0.524, loss_ctc=1.767, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.150e-04, train_time=0.090 -[v016] 2022-01-31 07:39:23,991 (trainer:653) INFO: 139epoch:train:109-135batch: iter_time=7.448e-05, forward_time=0.031, loss=1.605, loss_att=0.813, loss_ctc=2.397, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.150e-04, train_time=0.090 -[v016] 2022-01-31 07:39:26,511 (trainer:653) INFO: 139epoch:train:136-162batch: iter_time=7.556e-05, forward_time=0.033, loss=1.365, loss_att=0.588, loss_ctc=2.143, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.150e-04, train_time=0.093 -[v016] 2022-01-31 07:39:29,044 (trainer:653) INFO: 139epoch:train:163-189batch: iter_time=7.568e-05, forward_time=0.033, loss=1.153, loss_att=0.476, loss_ctc=1.830, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.150e-04, train_time=0.094 -[v016] 2022-01-31 07:39:31,560 (trainer:653) INFO: 139epoch:train:190-216batch: iter_time=7.948e-05, forward_time=0.033, loss=1.283, loss_att=0.654, loss_ctc=1.911, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.149e-04, train_time=0.093 -[v016] 2022-01-31 07:39:34,135 (trainer:653) INFO: 139epoch:train:217-243batch: iter_time=7.751e-05, forward_time=0.034, loss=1.591, loss_att=0.558, loss_ctc=2.625, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.149e-04, train_time=0.095 -[v016] 2022-01-31 07:39:36,656 (trainer:653) INFO: 139epoch:train:244-270batch: iter_time=8.004e-05, forward_time=0.033, loss=1.450, loss_att=0.642, loss_ctc=2.257, acc=0.966, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.149e-04, train_time=0.093 -[v016] 2022-01-31 07:39:39,336 (trainer:653) INFO: 139epoch:train:271-297batch: iter_time=0.007, forward_time=0.032, loss=1.111, loss_att=0.494, loss_ctc=1.728, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.149e-04, train_time=0.099 -[v016] 2022-01-31 07:39:41,918 (trainer:653) INFO: 139epoch:train:298-324batch: iter_time=7.925e-05, forward_time=0.033, loss=1.396, loss_att=0.606, loss_ctc=2.186, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.149e-04, train_time=0.095 -[v016] 2022-01-31 07:39:44,406 (trainer:653) INFO: 139epoch:train:325-351batch: iter_time=8.372e-05, forward_time=0.032, loss=1.196, loss_att=0.547, loss_ctc=1.844, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.148e-04, train_time=0.092 -[v016] 2022-01-31 07:39:46,897 (trainer:653) INFO: 139epoch:train:352-378batch: iter_time=8.035e-05, forward_time=0.032, loss=1.302, loss_att=0.686, loss_ctc=1.919, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.148e-04, train_time=0.092 -[v016] 2022-01-31 07:39:49,307 (trainer:653) INFO: 139epoch:train:379-405batch: iter_time=7.918e-05, forward_time=0.031, loss=1.222, loss_att=0.550, loss_ctc=1.895, acc=0.970, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.148e-04, train_time=0.089 -[v016] 2022-01-31 07:39:51,769 (trainer:653) INFO: 139epoch:train:406-432batch: iter_time=7.511e-05, forward_time=0.032, loss=1.187, loss_att=0.567, loss_ctc=1.807, acc=0.975, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.148e-04, train_time=0.091 -[v016] 2022-01-31 07:39:54,276 (trainer:653) INFO: 139epoch:train:433-459batch: iter_time=7.437e-05, forward_time=0.032, loss=1.362, loss_att=0.553, loss_ctc=2.170, acc=0.976, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.148e-04, train_time=0.093 -[v016] 2022-01-31 07:39:56,769 (trainer:653) INFO: 139epoch:train:460-486batch: iter_time=7.828e-05, forward_time=0.032, loss=1.371, loss_att=0.620, loss_ctc=2.122, acc=0.973, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.147e-04, train_time=0.092 -[v016] 2022-01-31 07:39:59,239 (trainer:653) INFO: 139epoch:train:487-513batch: iter_time=7.532e-05, forward_time=0.032, loss=1.322, loss_att=0.581, loss_ctc=2.064, acc=0.975, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.147e-04, train_time=0.091 -[v016] 2022-01-31 07:40:01,666 (trainer:653) INFO: 139epoch:train:514-540batch: iter_time=7.620e-05, forward_time=0.032, loss=1.267, loss_att=0.574, loss_ctc=1.959, acc=0.970, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.147e-04, train_time=0.090 -[v016] 2022-01-31 07:40:35,291 (trainer:328) INFO: 139epoch results: [train] iter_time=5.835e-04, forward_time=0.032, loss=1.318, loss_att=0.597, loss_ctc=2.039, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.149e-04, train_time=0.093, time=50.84 seconds, total_count=76033, gpu_max_cached_mem_GB=5.824, [valid] loss=7.593, loss_att=6.178, loss_ctc=9.007, acc=0.905, cer=0.099, wer=0.404, cer_ctc=0.147, time=5.54 seconds, total_count=24742, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.38 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:40:37,400 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 07:40:37,440 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/133epoch.pth, exp/asr_train_asr_raw_en_word/134epoch.pth -[v016] 2022-01-31 07:40:37,440 (trainer:261) INFO: 140/200epoch started. Estimated time to finish: 1 hour, 48 minutes and 52.97 seconds -[v016] 2022-01-31 07:40:40,210 (trainer:653) INFO: 140epoch:train:1-27batch: iter_time=0.003, forward_time=0.035, loss=1.225, loss_att=0.480, loss_ctc=1.970, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.147e-04, train_time=0.102 -[v016] 2022-01-31 07:40:42,858 (trainer:653) INFO: 140epoch:train:28-54batch: iter_time=0.007, forward_time=0.032, loss=1.264, loss_att=0.572, loss_ctc=1.955, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.147e-04, train_time=0.098 -[v016] 2022-01-31 07:40:45,389 (trainer:653) INFO: 140epoch:train:55-81batch: iter_time=7.665e-05, forward_time=0.033, loss=1.138, loss_att=0.419, loss_ctc=1.857, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.146e-04, train_time=0.094 -[v016] 2022-01-31 07:40:47,881 (trainer:653) INFO: 140epoch:train:82-108batch: iter_time=7.864e-05, forward_time=0.033, loss=1.440, loss_att=0.683, loss_ctc=2.197, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.146e-04, train_time=0.092 -[v016] 2022-01-31 07:40:50,402 (trainer:653) INFO: 140epoch:train:109-135batch: iter_time=7.689e-05, forward_time=0.033, loss=1.344, loss_att=0.557, loss_ctc=2.130, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.146e-04, train_time=0.093 -[v016] 2022-01-31 07:40:52,968 (trainer:653) INFO: 140epoch:train:136-162batch: iter_time=8.118e-05, forward_time=0.033, loss=1.344, loss_att=0.567, loss_ctc=2.122, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.146e-04, train_time=0.095 -[v016] 2022-01-31 07:40:55,488 (trainer:653) INFO: 140epoch:train:163-189batch: iter_time=7.989e-05, forward_time=0.033, loss=1.261, loss_att=0.518, loss_ctc=2.004, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.145e-04, train_time=0.093 -[v016] 2022-01-31 07:40:57,895 (trainer:653) INFO: 140epoch:train:190-216batch: iter_time=7.510e-05, forward_time=0.031, loss=1.100, loss_att=0.545, loss_ctc=1.656, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.145e-04, train_time=0.089 -[v016] 2022-01-31 07:41:00,328 (trainer:653) INFO: 140epoch:train:217-243batch: iter_time=7.741e-05, forward_time=0.031, loss=1.331, loss_att=0.632, loss_ctc=2.031, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.145e-04, train_time=0.090 -[v016] 2022-01-31 07:41:02,791 (trainer:653) INFO: 140epoch:train:244-270batch: iter_time=7.764e-05, forward_time=0.032, loss=1.250, loss_att=0.551, loss_ctc=1.948, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.145e-04, train_time=0.091 -[v016] 2022-01-31 07:41:05,241 (trainer:653) INFO: 140epoch:train:271-297batch: iter_time=7.730e-05, forward_time=0.032, loss=1.208, loss_att=0.512, loss_ctc=1.903, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.145e-04, train_time=0.091 -[v016] 2022-01-31 07:41:07,747 (trainer:653) INFO: 140epoch:train:298-324batch: iter_time=0.002, forward_time=0.032, loss=1.516, loss_att=0.761, loss_ctc=2.271, acc=0.960, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.144e-04, train_time=0.093 -[v016] 2022-01-31 07:41:10,247 (trainer:653) INFO: 140epoch:train:325-351batch: iter_time=8.192e-05, forward_time=0.033, loss=1.435, loss_att=0.573, loss_ctc=2.297, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.144e-04, train_time=0.092 -[v016] 2022-01-31 07:41:13,080 (trainer:653) INFO: 140epoch:train:352-378batch: iter_time=0.014, forward_time=0.032, loss=1.286, loss_att=0.574, loss_ctc=1.998, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.144e-04, train_time=0.105 -[v016] 2022-01-31 07:41:15,618 (trainer:653) INFO: 140epoch:train:379-405batch: iter_time=8.107e-05, forward_time=0.033, loss=1.404, loss_att=0.560, loss_ctc=2.248, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.144e-04, train_time=0.094 -[v016] 2022-01-31 07:41:18,157 (trainer:653) INFO: 140epoch:train:406-432batch: iter_time=7.757e-05, forward_time=0.033, loss=1.440, loss_att=0.603, loss_ctc=2.277, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.144e-04, train_time=0.094 -[v016] 2022-01-31 07:41:20,655 (trainer:653) INFO: 140epoch:train:433-459batch: iter_time=7.656e-05, forward_time=0.032, loss=1.188, loss_att=0.629, loss_ctc=1.747, acc=0.966, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.143e-04, train_time=0.092 -[v016] 2022-01-31 07:41:23,116 (trainer:653) INFO: 140epoch:train:460-486batch: iter_time=7.599e-05, forward_time=0.032, loss=1.416, loss_att=0.650, loss_ctc=2.183, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.143e-04, train_time=0.091 -[v016] 2022-01-31 07:41:25,699 (trainer:653) INFO: 140epoch:train:487-513batch: iter_time=8.581e-05, forward_time=0.034, loss=1.387, loss_att=0.550, loss_ctc=2.225, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.143e-04, train_time=0.095 -[v016] 2022-01-31 07:41:28,148 (trainer:653) INFO: 140epoch:train:514-540batch: iter_time=8.369e-05, forward_time=0.031, loss=1.404, loss_att=0.648, loss_ctc=2.160, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.143e-04, train_time=0.090 -[v016] 2022-01-31 07:42:02,109 (trainer:328) INFO: 140epoch results: [train] iter_time=0.001, forward_time=0.032, loss=1.320, loss_att=0.579, loss_ctc=2.060, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.145e-04, train_time=0.094, time=51.4 seconds, total_count=76580, gpu_max_cached_mem_GB=5.824, [valid] loss=7.673, loss_att=6.200, loss_ctc=9.146, acc=0.903, cer=0.100, wer=0.401, cer_ctc=0.150, time=5.47 seconds, total_count=24920, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.79 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:42:04,089 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 07:42:04,114 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/135epoch.pth -[v016] 2022-01-31 07:42:04,115 (trainer:261) INFO: 141/200epoch started. Estimated time to finish: 1 hour, 46 minutes and 55.66 seconds -[v016] 2022-01-31 07:42:06,729 (trainer:653) INFO: 141epoch:train:1-27batch: iter_time=0.004, forward_time=0.032, loss=1.142, loss_att=0.493, loss_ctc=1.792, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.143e-04, train_time=0.096 -[v016] 2022-01-31 07:42:09,098 (trainer:653) INFO: 141epoch:train:28-54batch: iter_time=5.277e-04, forward_time=0.030, loss=1.206, loss_att=0.618, loss_ctc=1.794, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.142e-04, train_time=0.088 -[v016] 2022-01-31 07:42:11,571 (trainer:653) INFO: 141epoch:train:55-81batch: iter_time=7.813e-05, forward_time=0.032, loss=1.219, loss_att=0.520, loss_ctc=1.918, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.142e-04, train_time=0.091 -[v016] 2022-01-31 07:42:14,040 (trainer:653) INFO: 141epoch:train:82-108batch: iter_time=8.635e-05, forward_time=0.032, loss=1.118, loss_att=0.553, loss_ctc=1.683, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.142e-04, train_time=0.091 -[v016] 2022-01-31 07:42:16,649 (trainer:653) INFO: 141epoch:train:109-135batch: iter_time=0.004, forward_time=0.032, loss=1.328, loss_att=0.597, loss_ctc=2.059, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.142e-04, train_time=0.096 -[v016] 2022-01-31 07:42:19,133 (trainer:653) INFO: 141epoch:train:136-162batch: iter_time=8.308e-05, forward_time=0.032, loss=1.380, loss_att=0.617, loss_ctc=2.143, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.142e-04, train_time=0.092 -[v016] 2022-01-31 07:42:21,662 (trainer:653) INFO: 141epoch:train:163-189batch: iter_time=8.096e-05, forward_time=0.033, loss=1.309, loss_att=0.529, loss_ctc=2.088, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.141e-04, train_time=0.093 -[v016] 2022-01-31 07:42:24,260 (trainer:653) INFO: 141epoch:train:190-216batch: iter_time=8.031e-05, forward_time=0.034, loss=1.574, loss_att=0.636, loss_ctc=2.512, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.141e-04, train_time=0.096 -[v016] 2022-01-31 07:42:26,741 (trainer:653) INFO: 141epoch:train:217-243batch: iter_time=7.944e-05, forward_time=0.032, loss=1.169, loss_att=0.495, loss_ctc=1.842, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.141e-04, train_time=0.092 -[v016] 2022-01-31 07:42:29,287 (trainer:653) INFO: 141epoch:train:244-270batch: iter_time=8.747e-05, forward_time=0.033, loss=1.578, loss_att=0.673, loss_ctc=2.484, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.141e-04, train_time=0.094 -[v016] 2022-01-31 07:42:31,773 (trainer:653) INFO: 141epoch:train:271-297batch: iter_time=8.622e-05, forward_time=0.032, loss=1.194, loss_att=0.525, loss_ctc=1.862, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.141e-04, train_time=0.092 -[v016] 2022-01-31 07:42:34,264 (trainer:653) INFO: 141epoch:train:298-324batch: iter_time=9.986e-05, forward_time=0.033, loss=1.203, loss_att=0.470, loss_ctc=1.935, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.140e-04, train_time=0.092 -[v016] 2022-01-31 07:42:36,792 (trainer:653) INFO: 141epoch:train:325-351batch: iter_time=8.786e-05, forward_time=0.032, loss=1.426, loss_att=0.656, loss_ctc=2.195, acc=0.962, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.140e-04, train_time=0.093 -[v016] 2022-01-31 07:42:39,320 (trainer:653) INFO: 141epoch:train:352-378batch: iter_time=8.815e-05, forward_time=0.033, loss=1.347, loss_att=0.572, loss_ctc=2.121, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.140e-04, train_time=0.093 -[v016] 2022-01-31 07:42:41,781 (trainer:653) INFO: 141epoch:train:379-405batch: iter_time=8.043e-05, forward_time=0.032, loss=1.284, loss_att=0.582, loss_ctc=1.986, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.140e-04, train_time=0.091 -[v016] 2022-01-31 07:42:44,302 (trainer:653) INFO: 141epoch:train:406-432batch: iter_time=8.233e-05, forward_time=0.033, loss=1.116, loss_att=0.487, loss_ctc=1.746, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.140e-04, train_time=0.093 -[v016] 2022-01-31 07:42:46,779 (trainer:653) INFO: 141epoch:train:433-459batch: iter_time=0.002, forward_time=0.031, loss=1.216, loss_att=0.572, loss_ctc=1.860, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.139e-04, train_time=0.092 -[v016] 2022-01-31 07:42:49,154 (trainer:653) INFO: 141epoch:train:460-486batch: iter_time=7.756e-05, forward_time=0.030, loss=1.289, loss_att=0.651, loss_ctc=1.927, acc=0.967, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.139e-04, train_time=0.088 -[v016] 2022-01-31 07:42:51,635 (trainer:653) INFO: 141epoch:train:487-513batch: iter_time=7.941e-05, forward_time=0.032, loss=1.509, loss_att=0.668, loss_ctc=2.349, acc=0.966, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.139e-04, train_time=0.092 -[v016] 2022-01-31 07:42:54,206 (trainer:653) INFO: 141epoch:train:514-540batch: iter_time=8.114e-05, forward_time=0.033, loss=1.405, loss_att=0.553, loss_ctc=2.257, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.139e-04, train_time=0.095 -[v016] 2022-01-31 07:43:28,484 (trainer:328) INFO: 141epoch results: [train] iter_time=5.493e-04, forward_time=0.032, loss=1.300, loss_att=0.572, loss_ctc=2.028, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.141e-04, train_time=0.093, time=50.84 seconds, total_count=77127, gpu_max_cached_mem_GB=5.824, [valid] loss=7.588, loss_att=6.229, loss_ctc=8.948, acc=0.905, cer=0.101, wer=0.401, cer_ctc=0.145, time=5.64 seconds, total_count=25098, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.89 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:43:30,541 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 07:43:30,550 (trainer:261) INFO: 142/200epoch started. Estimated time to finish: 1 hour, 44 minutes and 58.74 seconds -[v016] 2022-01-31 07:43:33,309 (trainer:653) INFO: 142epoch:train:1-27batch: iter_time=0.004, forward_time=0.034, loss=1.317, loss_att=0.565, loss_ctc=2.070, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.139e-04, train_time=0.102 -[v016] 2022-01-31 07:43:35,763 (trainer:653) INFO: 142epoch:train:28-54batch: iter_time=8.349e-05, forward_time=0.032, loss=1.343, loss_att=0.574, loss_ctc=2.112, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.138e-04, train_time=0.091 -[v016] 2022-01-31 07:43:38,207 (trainer:653) INFO: 142epoch:train:55-81batch: iter_time=7.616e-05, forward_time=0.032, loss=1.203, loss_att=0.619, loss_ctc=1.787, acc=0.967, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.138e-04, train_time=0.090 -[v016] 2022-01-31 07:43:40,670 (trainer:653) INFO: 142epoch:train:82-108batch: iter_time=7.923e-05, forward_time=0.032, loss=1.231, loss_att=0.571, loss_ctc=1.891, acc=0.975, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.138e-04, train_time=0.091 -[v016] 2022-01-31 07:43:43,081 (trainer:653) INFO: 142epoch:train:109-135batch: iter_time=0.001, forward_time=0.031, loss=1.391, loss_att=0.634, loss_ctc=2.149, acc=0.969, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.138e-04, train_time=0.089 -[v016] 2022-01-31 07:43:45,565 (trainer:653) INFO: 142epoch:train:136-162batch: iter_time=7.540e-05, forward_time=0.032, loss=1.265, loss_att=0.520, loss_ctc=2.011, acc=0.978, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.138e-04, train_time=0.092 -[v016] 2022-01-31 07:43:47,948 (trainer:653) INFO: 142epoch:train:163-189batch: iter_time=7.935e-05, forward_time=0.031, loss=1.168, loss_att=0.595, loss_ctc=1.742, acc=0.967, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.137e-04, train_time=0.088 -[v016] 2022-01-31 07:43:51,038 (trainer:653) INFO: 142epoch:train:190-216batch: iter_time=0.018, forward_time=0.034, loss=1.331, loss_att=0.541, loss_ctc=2.120, acc=0.980, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.137e-04, train_time=0.114 -[v016] 2022-01-31 07:43:53,483 (trainer:653) INFO: 142epoch:train:217-243batch: iter_time=7.534e-05, forward_time=0.032, loss=1.233, loss_att=0.535, loss_ctc=1.932, acc=0.977, backward_time=0.020, optim_step_time=0.020, optim0_lr0=1.137e-04, train_time=0.090 -[v016] 2022-01-31 07:43:55,906 (trainer:653) INFO: 142epoch:train:244-270batch: iter_time=7.733e-05, forward_time=0.031, loss=1.175, loss_att=0.515, loss_ctc=1.835, acc=0.974, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.137e-04, train_time=0.090 -[v016] 2022-01-31 07:43:58,382 (trainer:653) INFO: 142epoch:train:271-297batch: iter_time=8.167e-05, forward_time=0.032, loss=1.231, loss_att=0.553, loss_ctc=1.908, acc=0.974, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.137e-04, train_time=0.091 -[v016] 2022-01-31 07:44:00,888 (trainer:653) INFO: 142epoch:train:298-324batch: iter_time=7.604e-05, forward_time=0.032, loss=1.322, loss_att=0.619, loss_ctc=2.025, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.136e-04, train_time=0.093 -[v016] 2022-01-31 07:44:03,251 (trainer:653) INFO: 142epoch:train:325-351batch: iter_time=7.500e-05, forward_time=0.031, loss=1.012, loss_att=0.539, loss_ctc=1.485, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.136e-04, train_time=0.087 -[v016] 2022-01-31 07:44:05,687 (trainer:653) INFO: 142epoch:train:352-378batch: iter_time=8.363e-05, forward_time=0.032, loss=1.276, loss_att=0.643, loss_ctc=1.910, acc=0.966, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.136e-04, train_time=0.090 -[v016] 2022-01-31 07:44:08,163 (trainer:653) INFO: 142epoch:train:379-405batch: iter_time=7.675e-05, forward_time=0.032, loss=1.249, loss_att=0.461, loss_ctc=2.037, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.136e-04, train_time=0.092 -[v016] 2022-01-31 07:44:10,664 (trainer:653) INFO: 142epoch:train:406-432batch: iter_time=7.889e-05, forward_time=0.032, loss=1.359, loss_att=0.530, loss_ctc=2.187, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.136e-04, train_time=0.092 -[v016] 2022-01-31 07:44:13,131 (trainer:653) INFO: 142epoch:train:433-459batch: iter_time=7.667e-05, forward_time=0.032, loss=1.156, loss_att=0.544, loss_ctc=1.768, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.135e-04, train_time=0.091 -[v016] 2022-01-31 07:44:15,675 (trainer:653) INFO: 142epoch:train:460-486batch: iter_time=7.795e-05, forward_time=0.033, loss=1.342, loss_att=0.594, loss_ctc=2.089, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.135e-04, train_time=0.094 -[v016] 2022-01-31 07:44:18,273 (trainer:653) INFO: 142epoch:train:487-513batch: iter_time=7.966e-05, forward_time=0.033, loss=1.320, loss_att=0.534, loss_ctc=2.106, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.135e-04, train_time=0.096 -[v016] 2022-01-31 07:44:21,155 (trainer:653) INFO: 142epoch:train:514-540batch: iter_time=0.015, forward_time=0.031, loss=1.003, loss_att=0.509, loss_ctc=1.497, acc=0.973, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.135e-04, train_time=0.107 -[v016] 2022-01-31 07:44:56,201 (trainer:328) INFO: 142epoch results: [train] iter_time=0.002, forward_time=0.032, loss=1.246, loss_att=0.561, loss_ctc=1.931, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.137e-04, train_time=0.094, time=51.35 seconds, total_count=77674, gpu_max_cached_mem_GB=5.824, [valid] loss=7.574, loss_att=6.201, loss_ctc=8.947, acc=0.906, cer=0.095, wer=0.391, cer_ctc=0.141, time=5.73 seconds, total_count=25276, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.57 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:44:58,176 (trainer:375) INFO: The best model has been updated: train.loss -[v016] 2022-01-31 07:44:58,205 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/139epoch.pth -[v016] 2022-01-31 07:44:58,206 (trainer:261) INFO: 143/200epoch started. Estimated time to finish: 1 hour, 43 minutes and 2.9 seconds -[v016] 2022-01-31 07:45:00,856 (trainer:653) INFO: 143epoch:train:1-27batch: iter_time=0.004, forward_time=0.032, loss=1.439, loss_att=0.643, loss_ctc=2.236, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.135e-04, train_time=0.098 -[v016] 2022-01-31 07:45:03,353 (trainer:653) INFO: 143epoch:train:28-54batch: iter_time=1.001e-04, forward_time=0.032, loss=1.020, loss_att=0.425, loss_ctc=1.616, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.134e-04, train_time=0.092 -[v016] 2022-01-31 07:45:05,784 (trainer:653) INFO: 143epoch:train:55-81batch: iter_time=1.021e-04, forward_time=0.031, loss=1.020, loss_att=0.421, loss_ctc=1.619, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.134e-04, train_time=0.090 -[v016] 2022-01-31 07:45:08,240 (trainer:653) INFO: 143epoch:train:82-108batch: iter_time=9.534e-05, forward_time=0.031, loss=1.262, loss_att=0.565, loss_ctc=1.958, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.134e-04, train_time=0.091 -[v016] 2022-01-31 07:45:10,763 (trainer:653) INFO: 143epoch:train:109-135batch: iter_time=1.045e-04, forward_time=0.032, loss=1.279, loss_att=0.566, loss_ctc=1.993, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.134e-04, train_time=0.093 -[v016] 2022-01-31 07:45:13,264 (trainer:653) INFO: 143epoch:train:136-162batch: iter_time=9.479e-05, forward_time=0.032, loss=1.373, loss_att=0.642, loss_ctc=2.103, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.134e-04, train_time=0.092 -[v016] 2022-01-31 07:45:15,672 (trainer:653) INFO: 143epoch:train:163-189batch: iter_time=9.269e-05, forward_time=0.031, loss=1.227, loss_att=0.561, loss_ctc=1.892, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.133e-04, train_time=0.089 -[v016] 2022-01-31 07:45:18,113 (trainer:653) INFO: 143epoch:train:190-216batch: iter_time=7.703e-05, forward_time=0.031, loss=1.453, loss_att=0.589, loss_ctc=2.316, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.133e-04, train_time=0.090 -[v016] 2022-01-31 07:45:20,589 (trainer:653) INFO: 143epoch:train:217-243batch: iter_time=7.657e-05, forward_time=0.032, loss=1.283, loss_att=0.572, loss_ctc=1.995, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.133e-04, train_time=0.091 -[v016] 2022-01-31 07:45:23,494 (trainer:653) INFO: 143epoch:train:244-270batch: iter_time=0.015, forward_time=0.032, loss=1.188, loss_att=0.538, loss_ctc=1.838, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.133e-04, train_time=0.107 -[v016] 2022-01-31 07:45:26,085 (trainer:653) INFO: 143epoch:train:271-297batch: iter_time=8.137e-05, forward_time=0.033, loss=1.248, loss_att=0.488, loss_ctc=2.008, acc=0.979, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.133e-04, train_time=0.096 -[v016] 2022-01-31 07:45:28,596 (trainer:653) INFO: 143epoch:train:298-324batch: iter_time=8.030e-05, forward_time=0.032, loss=1.214, loss_att=0.542, loss_ctc=1.887, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.132e-04, train_time=0.093 -[v016] 2022-01-31 07:45:31,001 (trainer:653) INFO: 143epoch:train:325-351batch: iter_time=7.572e-05, forward_time=0.031, loss=1.188, loss_att=0.598, loss_ctc=1.778, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.132e-04, train_time=0.089 -[v016] 2022-01-31 07:45:33,505 (trainer:653) INFO: 143epoch:train:352-378batch: iter_time=8.015e-05, forward_time=0.032, loss=1.188, loss_att=0.479, loss_ctc=1.896, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.132e-04, train_time=0.093 -[v016] 2022-01-31 07:45:36,035 (trainer:653) INFO: 143epoch:train:379-405batch: iter_time=7.713e-05, forward_time=0.032, loss=1.355, loss_att=0.579, loss_ctc=2.130, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.132e-04, train_time=0.093 -[v016] 2022-01-31 07:45:38,492 (trainer:653) INFO: 143epoch:train:406-432batch: iter_time=7.625e-05, forward_time=0.031, loss=1.265, loss_att=0.602, loss_ctc=1.927, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.132e-04, train_time=0.091 -[v016] 2022-01-31 07:45:41,089 (trainer:653) INFO: 143epoch:train:433-459batch: iter_time=7.774e-05, forward_time=0.033, loss=1.419, loss_att=0.571, loss_ctc=2.267, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.131e-04, train_time=0.096 -[v016] 2022-01-31 07:45:43,572 (trainer:653) INFO: 143epoch:train:460-486batch: iter_time=9.956e-05, forward_time=0.032, loss=1.165, loss_att=0.564, loss_ctc=1.766, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.131e-04, train_time=0.092 -[v016] 2022-01-31 07:45:45,970 (trainer:653) INFO: 143epoch:train:487-513batch: iter_time=7.558e-05, forward_time=0.030, loss=1.106, loss_att=0.570, loss_ctc=1.642, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.131e-04, train_time=0.089 -[v016] 2022-01-31 07:45:48,388 (trainer:653) INFO: 143epoch:train:514-540batch: iter_time=7.677e-05, forward_time=0.031, loss=1.401, loss_att=0.583, loss_ctc=2.218, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.131e-04, train_time=0.089 -[v016] 2022-01-31 07:46:23,798 (trainer:328) INFO: 143epoch results: [train] iter_time=0.001, forward_time=0.032, loss=1.253, loss_att=0.555, loss_ctc=1.952, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.133e-04, train_time=0.093, time=50.91 seconds, total_count=78221, gpu_max_cached_mem_GB=5.824, [valid] loss=7.624, loss_att=6.261, loss_ctc=8.986, acc=0.904, cer=0.101, wer=0.403, cer_ctc=0.143, time=5.95 seconds, total_count=25454, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.63 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:46:25,981 (trainer:375) INFO: The best model has been updated: train.acc -[v016] 2022-01-31 07:46:26,006 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/136epoch.pth -[v016] 2022-01-31 07:46:26,006 (trainer:261) INFO: 144/200epoch started. Estimated time to finish: 1 hour, 41 minutes and 7.58 seconds -[v016] 2022-01-31 07:46:28,881 (trainer:653) INFO: 144epoch:train:1-27batch: iter_time=0.004, forward_time=0.038, loss=1.568, loss_att=0.661, loss_ctc=2.476, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.131e-04, train_time=0.106 -[v016] 2022-01-31 07:46:31,448 (trainer:653) INFO: 144epoch:train:28-54batch: iter_time=9.463e-05, forward_time=0.033, loss=0.987, loss_att=0.409, loss_ctc=1.564, acc=0.983, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.130e-04, train_time=0.095 -[v016] 2022-01-31 07:46:34,064 (trainer:653) INFO: 144epoch:train:55-81batch: iter_time=1.172e-04, forward_time=0.034, loss=1.061, loss_att=0.485, loss_ctc=1.638, acc=0.976, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.130e-04, train_time=0.097 -[v016] 2022-01-31 07:46:36,716 (trainer:653) INFO: 144epoch:train:82-108batch: iter_time=1.281e-04, forward_time=0.034, loss=1.197, loss_att=0.449, loss_ctc=1.944, acc=0.979, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.130e-04, train_time=0.098 -[v016] 2022-01-31 07:46:39,351 (trainer:653) INFO: 144epoch:train:109-135batch: iter_time=1.315e-04, forward_time=0.034, loss=1.324, loss_att=0.600, loss_ctc=2.047, acc=0.971, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.130e-04, train_time=0.097 -[v016] 2022-01-31 07:46:41,947 (trainer:653) INFO: 144epoch:train:136-162batch: iter_time=1.265e-04, forward_time=0.033, loss=1.232, loss_att=0.554, loss_ctc=1.911, acc=0.972, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.130e-04, train_time=0.096 -[v016] 2022-01-31 07:46:44,581 (trainer:653) INFO: 144epoch:train:163-189batch: iter_time=1.282e-04, forward_time=0.034, loss=1.248, loss_att=0.592, loss_ctc=1.904, acc=0.974, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.129e-04, train_time=0.097 -[v016] 2022-01-31 07:46:47,263 (trainer:653) INFO: 144epoch:train:190-216batch: iter_time=1.154e-04, forward_time=0.034, loss=1.190, loss_att=0.562, loss_ctc=1.819, acc=0.973, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.129e-04, train_time=0.099 -[v016] 2022-01-31 07:46:49,969 (trainer:653) INFO: 144epoch:train:217-243batch: iter_time=1.092e-04, forward_time=0.035, loss=1.255, loss_att=0.541, loss_ctc=1.968, acc=0.974, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.129e-04, train_time=0.100 -[v016] 2022-01-31 07:46:52,720 (trainer:653) INFO: 144epoch:train:244-270batch: iter_time=0.003, forward_time=0.034, loss=1.391, loss_att=0.584, loss_ctc=2.198, acc=0.971, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.129e-04, train_time=0.102 -[v016] 2022-01-31 07:46:55,348 (trainer:653) INFO: 144epoch:train:271-297batch: iter_time=9.341e-05, forward_time=0.033, loss=1.232, loss_att=0.561, loss_ctc=1.903, acc=0.971, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.129e-04, train_time=0.097 -[v016] 2022-01-31 07:46:57,971 (trainer:653) INFO: 144epoch:train:298-324batch: iter_time=1.007e-04, forward_time=0.034, loss=1.055, loss_att=0.553, loss_ctc=1.556, acc=0.972, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.128e-04, train_time=0.097 -[v016] 2022-01-31 07:47:00,482 (trainer:653) INFO: 144epoch:train:325-351batch: iter_time=9.226e-05, forward_time=0.033, loss=1.099, loss_att=0.535, loss_ctc=1.664, acc=0.973, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.128e-04, train_time=0.093 -[v016] 2022-01-31 07:47:02,944 (trainer:653) INFO: 144epoch:train:352-378batch: iter_time=8.084e-05, forward_time=0.032, loss=1.288, loss_att=0.578, loss_ctc=1.997, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.128e-04, train_time=0.091 -[v016] 2022-01-31 07:47:05,740 (trainer:653) INFO: 144epoch:train:379-405batch: iter_time=9.457e-05, forward_time=0.037, loss=1.557, loss_att=0.597, loss_ctc=2.517, acc=0.978, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.128e-04, train_time=0.103 -[v016] 2022-01-31 07:47:08,250 (trainer:653) INFO: 144epoch:train:406-432batch: iter_time=8.937e-05, forward_time=0.033, loss=1.136, loss_att=0.566, loss_ctc=1.707, acc=0.971, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.128e-04, train_time=0.093 -[v016] 2022-01-31 07:47:10,965 (trainer:653) INFO: 144epoch:train:433-459batch: iter_time=1.169e-04, forward_time=0.035, loss=1.281, loss_att=0.548, loss_ctc=2.014, acc=0.978, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.127e-04, train_time=0.100 -[v016] 2022-01-31 07:47:13,580 (trainer:653) INFO: 144epoch:train:460-486batch: iter_time=1.170e-04, forward_time=0.033, loss=1.214, loss_att=0.547, loss_ctc=1.881, acc=0.977, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.127e-04, train_time=0.097 -[v016] 2022-01-31 07:47:16,271 (trainer:653) INFO: 144epoch:train:487-513batch: iter_time=1.204e-04, forward_time=0.035, loss=1.258, loss_att=0.508, loss_ctc=2.008, acc=0.975, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.127e-04, train_time=0.099 -[v016] 2022-01-31 07:47:18,997 (trainer:653) INFO: 144epoch:train:514-540batch: iter_time=1.077e-04, forward_time=0.035, loss=1.496, loss_att=0.682, loss_ctc=2.310, acc=0.972, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.127e-04, train_time=0.101 -[v016] 2022-01-31 07:47:56,316 (trainer:328) INFO: 144epoch results: [train] iter_time=4.538e-04, forward_time=0.034, loss=1.250, loss_att=0.555, loss_ctc=1.944, acc=0.974, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.129e-04, train_time=0.098, time=53.73 seconds, total_count=78768, gpu_max_cached_mem_GB=5.824, [valid] loss=7.573, loss_att=6.217, loss_ctc=8.928, acc=0.906, cer=0.099, wer=0.396, cer_ctc=0.145, time=6.21 seconds, total_count=25632, gpu_max_cached_mem_GB=5.824, [att_plot] time=30.37 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:47:59,042 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 07:47:59,097 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/123epoch.pth, exp/asr_train_asr_raw_en_word/140epoch.pth -[v016] 2022-01-31 07:47:59,097 (trainer:261) INFO: 145/200epoch started. Estimated time to finish: 1 hour, 39 minutes and 15.1 seconds -[v016] 2022-01-31 07:48:01,974 (trainer:653) INFO: 145epoch:train:1-27batch: iter_time=0.004, forward_time=0.035, loss=1.252, loss_att=0.578, loss_ctc=1.925, acc=0.970, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.127e-04, train_time=0.104 -[v016] 2022-01-31 07:48:04,539 (trainer:653) INFO: 145epoch:train:28-54batch: iter_time=1.293e-04, forward_time=0.033, loss=1.188, loss_att=0.549, loss_ctc=1.828, acc=0.974, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.126e-04, train_time=0.095 -[v016] 2022-01-31 07:48:07,225 (trainer:653) INFO: 145epoch:train:55-81batch: iter_time=1.151e-04, forward_time=0.035, loss=1.233, loss_att=0.555, loss_ctc=1.911, acc=0.978, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.126e-04, train_time=0.099 -[v016] 2022-01-31 07:48:09,850 (trainer:653) INFO: 145epoch:train:82-108batch: iter_time=1.058e-04, forward_time=0.034, loss=1.202, loss_att=0.567, loss_ctc=1.838, acc=0.974, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.126e-04, train_time=0.097 -[v016] 2022-01-31 07:48:12,556 (trainer:653) INFO: 145epoch:train:109-135batch: iter_time=1.178e-04, forward_time=0.035, loss=1.170, loss_att=0.552, loss_ctc=1.788, acc=0.974, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.126e-04, train_time=0.100 -[v016] 2022-01-31 07:48:15,318 (trainer:653) INFO: 145epoch:train:136-162batch: iter_time=1.397e-04, forward_time=0.035, loss=1.197, loss_att=0.543, loss_ctc=1.851, acc=0.974, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.126e-04, train_time=0.102 -[v016] 2022-01-31 07:48:18,062 (trainer:653) INFO: 145epoch:train:163-189batch: iter_time=1.339e-04, forward_time=0.035, loss=1.187, loss_att=0.445, loss_ctc=1.930, acc=0.981, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.125e-04, train_time=0.101 -[v016] 2022-01-31 07:48:20,734 (trainer:653) INFO: 145epoch:train:190-216batch: iter_time=1.155e-04, forward_time=0.034, loss=1.120, loss_att=0.463, loss_ctc=1.777, acc=0.980, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.125e-04, train_time=0.099 -[v016] 2022-01-31 07:48:23,307 (trainer:653) INFO: 145epoch:train:217-243batch: iter_time=9.424e-05, forward_time=0.033, loss=1.254, loss_att=0.536, loss_ctc=1.972, acc=0.975, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.125e-04, train_time=0.095 -[v016] 2022-01-31 07:48:25,784 (trainer:653) INFO: 145epoch:train:244-270batch: iter_time=7.777e-05, forward_time=0.032, loss=1.167, loss_att=0.492, loss_ctc=1.841, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.125e-04, train_time=0.092 -[v016] 2022-01-31 07:48:28,536 (trainer:653) INFO: 145epoch:train:271-297batch: iter_time=1.162e-04, forward_time=0.036, loss=1.129, loss_att=0.468, loss_ctc=1.790, acc=0.982, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.125e-04, train_time=0.102 -[v016] 2022-01-31 07:48:31,311 (trainer:653) INFO: 145epoch:train:298-324batch: iter_time=1.231e-04, forward_time=0.036, loss=1.351, loss_att=0.589, loss_ctc=2.113, acc=0.972, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.125e-04, train_time=0.103 -[v016] 2022-01-31 07:48:34,152 (trainer:653) INFO: 145epoch:train:325-351batch: iter_time=1.345e-04, forward_time=0.037, loss=1.281, loss_att=0.555, loss_ctc=2.007, acc=0.973, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.124e-04, train_time=0.105 -[v016] 2022-01-31 07:48:36,862 (trainer:653) INFO: 145epoch:train:352-378batch: iter_time=1.186e-04, forward_time=0.035, loss=1.169, loss_att=0.554, loss_ctc=1.783, acc=0.971, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.124e-04, train_time=0.100 -[v016] 2022-01-31 07:48:39,627 (trainer:653) INFO: 145epoch:train:379-405batch: iter_time=1.150e-04, forward_time=0.036, loss=1.250, loss_att=0.503, loss_ctc=1.996, acc=0.975, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.124e-04, train_time=0.102 -[v016] 2022-01-31 07:48:42,332 (trainer:653) INFO: 145epoch:train:406-432batch: iter_time=1.337e-04, forward_time=0.035, loss=1.202, loss_att=0.578, loss_ctc=1.827, acc=0.970, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.124e-04, train_time=0.100 -[v016] 2022-01-31 07:48:45,186 (trainer:653) INFO: 145epoch:train:433-459batch: iter_time=1.319e-04, forward_time=0.037, loss=1.384, loss_att=0.577, loss_ctc=2.190, acc=0.977, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.124e-04, train_time=0.105 -[v016] 2022-01-31 07:48:50,641 (trainer:653) INFO: 145epoch:train:460-486batch: iter_time=0.003, forward_time=0.113, loss=1.340, loss_att=0.619, loss_ctc=2.060, acc=0.973, backward_time=0.037, optim_step_time=0.024, optim0_lr0=1.123e-04, train_time=0.201 -[v016] 2022-01-31 07:48:53,407 (trainer:653) INFO: 145epoch:train:487-513batch: iter_time=2.854e-04, forward_time=0.034, loss=1.392, loss_att=0.654, loss_ctc=2.129, acc=0.967, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.123e-04, train_time=0.103 -[v016] 2022-01-31 07:48:57,276 (trainer:653) INFO: 145epoch:train:514-540batch: iter_time=0.038, forward_time=0.036, loss=1.324, loss_att=0.532, loss_ctc=2.117, acc=0.973, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.123e-04, train_time=0.143 -[v016] 2022-01-31 07:49:46,584 (trainer:328) INFO: 145epoch results: [train] iter_time=0.002, forward_time=0.039, loss=1.241, loss_att=0.545, loss_ctc=1.936, acc=0.974, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.125e-04, train_time=0.108, time=59.03 seconds, total_count=79315, gpu_max_cached_mem_GB=5.824, [valid] loss=7.557, loss_att=6.155, loss_ctc=8.960, acc=0.906, cer=0.099, wer=0.393, cer_ctc=0.145, time=19.69 seconds, total_count=25810, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.67 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:49:48,903 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 07:49:48,913 (trainer:261) INFO: 146/200epoch started. Estimated time to finish: 1 hour, 37 minutes and 30.29 seconds -[v016] 2022-01-31 07:49:56,280 (trainer:653) INFO: 146epoch:train:1-27batch: iter_time=0.115, forward_time=0.063, loss=1.082, loss_att=0.445, loss_ctc=1.719, acc=0.980, backward_time=0.042, optim_step_time=0.023, optim0_lr0=1.123e-04, train_time=0.267 -[v016] 2022-01-31 07:50:01,122 (trainer:653) INFO: 146epoch:train:28-54batch: iter_time=0.089, forward_time=0.031, loss=1.319, loss_att=0.634, loss_ctc=2.004, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.123e-04, train_time=0.179 -[v016] 2022-01-31 07:50:06,838 (trainer:653) INFO: 146epoch:train:55-81batch: iter_time=0.118, forward_time=0.032, loss=1.330, loss_att=0.567, loss_ctc=2.093, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.122e-04, train_time=0.211 -[v016] 2022-01-31 07:50:11,250 (trainer:653) INFO: 146epoch:train:82-108batch: iter_time=0.069, forward_time=0.032, loss=1.425, loss_att=0.593, loss_ctc=2.257, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.122e-04, train_time=0.163 -[v016] 2022-01-31 07:50:15,035 (trainer:653) INFO: 146epoch:train:109-135batch: iter_time=0.046, forward_time=0.032, loss=1.178, loss_att=0.497, loss_ctc=1.858, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.122e-04, train_time=0.140 -[v016] 2022-01-31 07:50:18,863 (trainer:653) INFO: 146epoch:train:136-162batch: iter_time=0.051, forward_time=0.030, loss=1.363, loss_att=0.612, loss_ctc=2.114, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.122e-04, train_time=0.142 -[v016] 2022-01-31 07:50:22,434 (trainer:653) INFO: 146epoch:train:163-189batch: iter_time=0.040, forward_time=0.031, loss=1.330, loss_att=0.605, loss_ctc=2.055, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.122e-04, train_time=0.132 -[v016] 2022-01-31 07:50:27,136 (trainer:653) INFO: 146epoch:train:190-216batch: iter_time=0.082, forward_time=0.031, loss=1.170, loss_att=0.602, loss_ctc=1.738, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.121e-04, train_time=0.174 -[v016] 2022-01-31 07:50:30,315 (trainer:653) INFO: 146epoch:train:217-243batch: iter_time=0.024, forward_time=0.032, loss=1.193, loss_att=0.491, loss_ctc=1.894, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.121e-04, train_time=0.118 -[v016] 2022-01-31 07:50:33,371 (trainer:653) INFO: 146epoch:train:244-270batch: iter_time=0.020, forward_time=0.032, loss=1.177, loss_att=0.471, loss_ctc=1.882, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.121e-04, train_time=0.113 -[v016] 2022-01-31 07:50:37,995 (trainer:653) INFO: 146epoch:train:271-297batch: iter_time=0.082, forward_time=0.030, loss=0.945, loss_att=0.476, loss_ctc=1.414, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.121e-04, train_time=0.171 -[v016] 2022-01-31 07:50:41,606 (trainer:653) INFO: 146epoch:train:298-324batch: iter_time=0.039, forward_time=0.032, loss=1.254, loss_att=0.524, loss_ctc=1.984, acc=0.977, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.121e-04, train_time=0.134 -[v016] 2022-01-31 07:50:45,331 (trainer:653) INFO: 146epoch:train:325-351batch: iter_time=0.044, forward_time=0.031, loss=1.319, loss_att=0.570, loss_ctc=2.068, acc=0.974, backward_time=0.021, optim_step_time=0.022, optim0_lr0=1.120e-04, train_time=0.138 -[v016] 2022-01-31 07:50:50,163 (trainer:653) INFO: 146epoch:train:352-378batch: iter_time=0.084, forward_time=0.032, loss=1.447, loss_att=0.614, loss_ctc=2.280, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.120e-04, train_time=0.179 -[v016] 2022-01-31 07:50:53,492 (trainer:653) INFO: 146epoch:train:379-405batch: iter_time=0.031, forward_time=0.031, loss=1.120, loss_att=0.543, loss_ctc=1.696, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.120e-04, train_time=0.123 -[v016] 2022-01-31 07:50:56,347 (trainer:653) INFO: 146epoch:train:406-432batch: iter_time=0.015, forward_time=0.031, loss=1.251, loss_att=0.555, loss_ctc=1.947, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.120e-04, train_time=0.106 -[v016] 2022-01-31 07:50:59,679 (trainer:653) INFO: 146epoch:train:433-459batch: iter_time=0.032, forward_time=0.031, loss=1.191, loss_att=0.528, loss_ctc=1.854, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.120e-04, train_time=0.123 -[v016] 2022-01-31 07:51:04,893 (trainer:653) INFO: 146epoch:train:460-486batch: iter_time=0.098, forward_time=0.032, loss=1.266, loss_att=0.522, loss_ctc=2.011, acc=0.975, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.120e-04, train_time=0.193 -[v016] 2022-01-31 07:51:10,667 (trainer:653) INFO: 146epoch:train:487-513batch: iter_time=0.123, forward_time=0.031, loss=1.124, loss_att=0.485, loss_ctc=1.764, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.119e-04, train_time=0.214 -[v016] 2022-01-31 07:51:14,735 (trainer:653) INFO: 146epoch:train:514-540batch: iter_time=0.058, forward_time=0.032, loss=1.335, loss_att=0.621, loss_ctc=2.050, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.119e-04, train_time=0.150 -[v016] 2022-01-31 07:51:50,719 (trainer:328) INFO: 146epoch results: [train] iter_time=0.065, forward_time=0.033, loss=1.239, loss_att=0.547, loss_ctc=1.930, acc=0.974, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.121e-04, train_time=0.161, time=1 minute and 28.13 seconds, total_count=79862, gpu_max_cached_mem_GB=5.824, [valid] loss=7.553, loss_att=6.205, loss_ctc=8.900, acc=0.905, cer=0.097, wer=0.402, cer_ctc=0.141, time=6.04 seconds, total_count=25988, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.57 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:51:52,810 (trainer:375) INFO: The best model has been updated: train.loss -[v016] 2022-01-31 07:51:52,839 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/141epoch.pth -[v016] 2022-01-31 07:51:52,840 (trainer:261) INFO: 147/200epoch started. Estimated time to finish: 1 hour, 35 minutes and 51.45 seconds -[v016] 2022-01-31 07:51:55,566 (trainer:653) INFO: 147epoch:train:1-27batch: iter_time=0.004, forward_time=0.032, loss=1.255, loss_att=0.507, loss_ctc=2.004, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.119e-04, train_time=0.101 -[v016] 2022-01-31 07:51:58,026 (trainer:653) INFO: 147epoch:train:28-54batch: iter_time=8.387e-05, forward_time=0.031, loss=1.239, loss_att=0.590, loss_ctc=1.889, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.119e-04, train_time=0.091 -[v016] 2022-01-31 07:52:00,638 (trainer:653) INFO: 147epoch:train:55-81batch: iter_time=0.004, forward_time=0.032, loss=1.090, loss_att=0.513, loss_ctc=1.666, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.119e-04, train_time=0.097 -[v016] 2022-01-31 07:52:03,632 (trainer:653) INFO: 147epoch:train:82-108batch: iter_time=0.020, forward_time=0.031, loss=1.211, loss_att=0.531, loss_ctc=1.891, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.118e-04, train_time=0.111 -[v016] 2022-01-31 07:52:06,128 (trainer:653) INFO: 147epoch:train:109-135batch: iter_time=7.633e-05, forward_time=0.032, loss=1.217, loss_att=0.488, loss_ctc=1.946, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.118e-04, train_time=0.092 -[v016] 2022-01-31 07:52:08,600 (trainer:653) INFO: 147epoch:train:136-162batch: iter_time=7.666e-05, forward_time=0.032, loss=1.250, loss_att=0.541, loss_ctc=1.960, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.118e-04, train_time=0.091 -[v016] 2022-01-31 07:52:11,027 (trainer:653) INFO: 147epoch:train:163-189batch: iter_time=7.781e-05, forward_time=0.031, loss=1.268, loss_att=0.610, loss_ctc=1.927, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.118e-04, train_time=0.090 -[v016] 2022-01-31 07:52:13,485 (trainer:653) INFO: 147epoch:train:190-216batch: iter_time=8.838e-05, forward_time=0.031, loss=1.252, loss_att=0.534, loss_ctc=1.970, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.118e-04, train_time=0.091 -[v016] 2022-01-31 07:52:15,954 (trainer:653) INFO: 147epoch:train:217-243batch: iter_time=8.338e-05, forward_time=0.032, loss=1.210, loss_att=0.551, loss_ctc=1.868, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.117e-04, train_time=0.091 -[v016] 2022-01-31 07:52:18,426 (trainer:653) INFO: 147epoch:train:244-270batch: iter_time=7.738e-05, forward_time=0.032, loss=1.188, loss_att=0.532, loss_ctc=1.843, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.117e-04, train_time=0.091 -[v016] 2022-01-31 07:52:20,928 (trainer:653) INFO: 147epoch:train:271-297batch: iter_time=7.493e-05, forward_time=0.032, loss=1.222, loss_att=0.453, loss_ctc=1.991, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.117e-04, train_time=0.092 -[v016] 2022-01-31 07:52:23,376 (trainer:653) INFO: 147epoch:train:298-324batch: iter_time=8.135e-05, forward_time=0.031, loss=1.059, loss_att=0.489, loss_ctc=1.630, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.117e-04, train_time=0.090 -[v016] 2022-01-31 07:52:25,852 (trainer:653) INFO: 147epoch:train:325-351batch: iter_time=8.475e-05, forward_time=0.032, loss=1.144, loss_att=0.535, loss_ctc=1.753, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.117e-04, train_time=0.091 -[v016] 2022-01-31 07:52:28,424 (trainer:653) INFO: 147epoch:train:352-378batch: iter_time=8.268e-05, forward_time=0.033, loss=1.359, loss_att=0.523, loss_ctc=2.195, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.116e-04, train_time=0.095 -[v016] 2022-01-31 07:52:31,277 (trainer:653) INFO: 147epoch:train:379-405batch: iter_time=0.009, forward_time=0.033, loss=1.331, loss_att=0.548, loss_ctc=2.115, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.116e-04, train_time=0.105 -[v016] 2022-01-31 07:52:33,860 (trainer:653) INFO: 147epoch:train:406-432batch: iter_time=8.735e-05, forward_time=0.033, loss=1.190, loss_att=0.530, loss_ctc=1.850, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.116e-04, train_time=0.095 -[v016] 2022-01-31 07:52:36,659 (trainer:653) INFO: 147epoch:train:433-459batch: iter_time=0.013, forward_time=0.031, loss=1.118, loss_att=0.544, loss_ctc=1.693, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.116e-04, train_time=0.103 -[v016] 2022-01-31 07:52:39,112 (trainer:653) INFO: 147epoch:train:460-486batch: iter_time=8.237e-05, forward_time=0.031, loss=1.181, loss_att=0.575, loss_ctc=1.786, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.116e-04, train_time=0.091 -[v016] 2022-01-31 07:52:41,550 (trainer:653) INFO: 147epoch:train:487-513batch: iter_time=7.943e-05, forward_time=0.031, loss=1.307, loss_att=0.565, loss_ctc=2.048, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.116e-04, train_time=0.090 -[v016] 2022-01-31 07:52:44,292 (trainer:653) INFO: 147epoch:train:514-540batch: iter_time=8.531e-05, forward_time=0.034, loss=1.332, loss_att=0.536, loss_ctc=2.128, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.115e-04, train_time=0.101 -[v016] 2022-01-31 07:53:18,542 (trainer:328) INFO: 147epoch results: [train] iter_time=0.003, forward_time=0.032, loss=1.226, loss_att=0.538, loss_ctc=1.914, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.117e-04, train_time=0.095, time=52.17 seconds, total_count=80409, gpu_max_cached_mem_GB=5.824, [valid] loss=7.647, loss_att=6.235, loss_ctc=9.060, acc=0.904, cer=0.100, wer=0.402, cer_ctc=0.148, time=5.65 seconds, total_count=26166, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.88 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:53:20,532 (trainer:375) INFO: The best model has been updated: train.loss -[v016] 2022-01-31 07:53:20,571 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/138epoch.pth -[v016] 2022-01-31 07:53:20,572 (trainer:261) INFO: 148/200epoch started. Estimated time to finish: 1 hour, 33 minutes and 57.1 seconds -[v016] 2022-01-31 07:53:23,287 (trainer:653) INFO: 148epoch:train:1-27batch: iter_time=0.003, forward_time=0.034, loss=1.146, loss_att=0.519, loss_ctc=1.773, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.115e-04, train_time=0.100 -[v016] 2022-01-31 07:53:25,757 (trainer:653) INFO: 148epoch:train:28-54batch: iter_time=8.578e-05, forward_time=0.032, loss=1.214, loss_att=0.560, loss_ctc=1.868, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.115e-04, train_time=0.091 -[v016] 2022-01-31 07:53:28,324 (trainer:653) INFO: 148epoch:train:55-81batch: iter_time=7.848e-05, forward_time=0.033, loss=1.275, loss_att=0.512, loss_ctc=2.038, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.115e-04, train_time=0.095 -[v016] 2022-01-31 07:53:30,816 (trainer:653) INFO: 148epoch:train:82-108batch: iter_time=7.769e-05, forward_time=0.032, loss=1.109, loss_att=0.552, loss_ctc=1.666, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.115e-04, train_time=0.092 -[v016] 2022-01-31 07:53:33,327 (trainer:653) INFO: 148epoch:train:109-135batch: iter_time=7.599e-05, forward_time=0.033, loss=1.202, loss_att=0.510, loss_ctc=1.894, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.114e-04, train_time=0.093 -[v016] 2022-01-31 07:53:35,878 (trainer:653) INFO: 148epoch:train:136-162batch: iter_time=8.211e-05, forward_time=0.033, loss=1.427, loss_att=0.620, loss_ctc=2.234, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.114e-04, train_time=0.094 -[v016] 2022-01-31 07:53:38,572 (trainer:653) INFO: 148epoch:train:163-189batch: iter_time=0.007, forward_time=0.032, loss=1.158, loss_att=0.492, loss_ctc=1.823, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.114e-04, train_time=0.100 -[v016] 2022-01-31 07:53:41,055 (trainer:653) INFO: 148epoch:train:190-216batch: iter_time=7.777e-05, forward_time=0.032, loss=1.230, loss_att=0.541, loss_ctc=1.919, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.114e-04, train_time=0.092 -[v016] 2022-01-31 07:53:43,558 (trainer:653) INFO: 148epoch:train:217-243batch: iter_time=7.657e-05, forward_time=0.033, loss=1.313, loss_att=0.572, loss_ctc=2.054, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.114e-04, train_time=0.092 -[v016] 2022-01-31 07:53:46,013 (trainer:653) INFO: 148epoch:train:244-270batch: iter_time=7.533e-05, forward_time=0.032, loss=1.282, loss_att=0.602, loss_ctc=1.963, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.113e-04, train_time=0.091 -[v016] 2022-01-31 07:53:48,435 (trainer:653) INFO: 148epoch:train:271-297batch: iter_time=7.557e-05, forward_time=0.031, loss=1.160, loss_att=0.543, loss_ctc=1.777, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.113e-04, train_time=0.090 -[v016] 2022-01-31 07:53:50,927 (trainer:653) INFO: 148epoch:train:298-324batch: iter_time=7.622e-05, forward_time=0.032, loss=1.176, loss_att=0.532, loss_ctc=1.820, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.113e-04, train_time=0.092 -[v016] 2022-01-31 07:53:53,378 (trainer:653) INFO: 148epoch:train:325-351batch: iter_time=8.316e-05, forward_time=0.032, loss=1.255, loss_att=0.652, loss_ctc=1.857, acc=0.964, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.113e-04, train_time=0.091 -[v016] 2022-01-31 07:53:55,912 (trainer:653) INFO: 148epoch:train:352-378batch: iter_time=7.727e-05, forward_time=0.033, loss=1.490, loss_att=0.574, loss_ctc=2.406, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.113e-04, train_time=0.094 -[v016] 2022-01-31 07:53:58,345 (trainer:653) INFO: 148epoch:train:379-405batch: iter_time=7.584e-05, forward_time=0.031, loss=1.105, loss_att=0.460, loss_ctc=1.750, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.112e-04, train_time=0.090 -[v016] 2022-01-31 07:54:00,821 (trainer:653) INFO: 148epoch:train:406-432batch: iter_time=7.780e-05, forward_time=0.033, loss=1.173, loss_att=0.505, loss_ctc=1.841, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.112e-04, train_time=0.091 -[v016] 2022-01-31 07:54:03,303 (trainer:653) INFO: 148epoch:train:433-459batch: iter_time=7.724e-05, forward_time=0.032, loss=1.327, loss_att=0.560, loss_ctc=2.094, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.112e-04, train_time=0.092 -[v016] 2022-01-31 07:54:05,688 (trainer:653) INFO: 148epoch:train:460-486batch: iter_time=7.971e-05, forward_time=0.031, loss=0.987, loss_att=0.461, loss_ctc=1.513, acc=0.976, backward_time=0.020, optim_step_time=0.021, optim0_lr0=1.112e-04, train_time=0.088 -[v016] 2022-01-31 07:54:08,206 (trainer:653) INFO: 148epoch:train:487-513batch: iter_time=8.049e-05, forward_time=0.033, loss=1.172, loss_att=0.506, loss_ctc=1.839, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.112e-04, train_time=0.093 -[v016] 2022-01-31 07:54:11,109 (trainer:653) INFO: 148epoch:train:514-540batch: iter_time=0.014, forward_time=0.032, loss=1.358, loss_att=0.593, loss_ctc=2.123, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.112e-04, train_time=0.107 -[v016] 2022-01-31 07:54:44,931 (trainer:328) INFO: 148epoch results: [train] iter_time=0.001, forward_time=0.032, loss=1.233, loss_att=0.543, loss_ctc=1.924, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.113e-04, train_time=0.093, time=51.29 seconds, total_count=80956, gpu_max_cached_mem_GB=5.824, [valid] loss=7.668, loss_att=6.274, loss_ctc=9.063, acc=0.905, cer=0.099, wer=0.398, cer_ctc=0.145, time=5.59 seconds, total_count=26344, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.47 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:54:46,896 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 07:54:46,906 (trainer:261) INFO: 149/200epoch started. Estimated time to finish: 1 hour, 32 minutes and 2.61 seconds -[v016] 2022-01-31 07:54:49,544 (trainer:653) INFO: 149epoch:train:1-27batch: iter_time=0.003, forward_time=0.033, loss=1.322, loss_att=0.501, loss_ctc=2.143, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.111e-04, train_time=0.097 -[v016] 2022-01-31 07:54:52,164 (trainer:653) INFO: 149epoch:train:28-54batch: iter_time=0.001, forward_time=0.034, loss=1.127, loss_att=0.468, loss_ctc=1.786, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.111e-04, train_time=0.097 -[v016] 2022-01-31 07:54:54,696 (trainer:653) INFO: 149epoch:train:55-81batch: iter_time=7.751e-05, forward_time=0.033, loss=1.206, loss_att=0.526, loss_ctc=1.885, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.111e-04, train_time=0.094 -[v016] 2022-01-31 07:54:57,165 (trainer:653) INFO: 149epoch:train:82-108batch: iter_time=8.522e-05, forward_time=0.032, loss=0.971, loss_att=0.448, loss_ctc=1.494, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.111e-04, train_time=0.091 -[v016] 2022-01-31 07:54:59,518 (trainer:653) INFO: 149epoch:train:109-135batch: iter_time=7.543e-05, forward_time=0.030, loss=0.986, loss_att=0.496, loss_ctc=1.477, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.111e-04, train_time=0.087 -[v016] 2022-01-31 07:55:01,950 (trainer:653) INFO: 149epoch:train:136-162batch: iter_time=7.520e-05, forward_time=0.031, loss=1.076, loss_att=0.510, loss_ctc=1.641, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.110e-04, train_time=0.090 -[v016] 2022-01-31 07:55:04,369 (trainer:653) INFO: 149epoch:train:163-189batch: iter_time=7.507e-05, forward_time=0.031, loss=1.006, loss_att=0.477, loss_ctc=1.535, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.110e-04, train_time=0.089 -[v016] 2022-01-31 07:55:07,258 (trainer:653) INFO: 149epoch:train:190-216batch: iter_time=0.013, forward_time=0.033, loss=1.204, loss_att=0.501, loss_ctc=1.906, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.110e-04, train_time=0.107 -[v016] 2022-01-31 07:55:09,848 (trainer:653) INFO: 149epoch:train:217-243batch: iter_time=7.776e-05, forward_time=0.033, loss=1.319, loss_att=0.492, loss_ctc=2.145, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.110e-04, train_time=0.096 -[v016] 2022-01-31 07:55:12,361 (trainer:653) INFO: 149epoch:train:244-270batch: iter_time=0.001, forward_time=0.032, loss=1.090, loss_att=0.478, loss_ctc=1.702, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.110e-04, train_time=0.093 -[v016] 2022-01-31 07:55:14,859 (trainer:653) INFO: 149epoch:train:271-297batch: iter_time=9.073e-05, forward_time=0.032, loss=1.395, loss_att=0.585, loss_ctc=2.204, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.109e-04, train_time=0.092 -[v016] 2022-01-31 07:55:17,343 (trainer:653) INFO: 149epoch:train:298-324batch: iter_time=7.845e-05, forward_time=0.032, loss=1.180, loss_att=0.471, loss_ctc=1.888, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.109e-04, train_time=0.092 -[v016] 2022-01-31 07:55:19,765 (trainer:653) INFO: 149epoch:train:325-351batch: iter_time=7.671e-05, forward_time=0.031, loss=1.301, loss_att=0.654, loss_ctc=1.948, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.109e-04, train_time=0.089 -[v016] 2022-01-31 07:55:22,249 (trainer:653) INFO: 149epoch:train:352-378batch: iter_time=7.639e-05, forward_time=0.032, loss=1.217, loss_att=0.476, loss_ctc=1.958, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.109e-04, train_time=0.092 -[v016] 2022-01-31 07:55:24,770 (trainer:653) INFO: 149epoch:train:379-405batch: iter_time=7.660e-05, forward_time=0.033, loss=1.376, loss_att=0.601, loss_ctc=2.151, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.109e-04, train_time=0.093 -[v016] 2022-01-31 07:55:27,205 (trainer:653) INFO: 149epoch:train:406-432batch: iter_time=7.818e-05, forward_time=0.031, loss=1.143, loss_att=0.497, loss_ctc=1.789, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.109e-04, train_time=0.090 -[v016] 2022-01-31 07:55:29,846 (trainer:653) INFO: 149epoch:train:433-459batch: iter_time=9.011e-05, forward_time=0.034, loss=1.338, loss_att=0.538, loss_ctc=2.138, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.108e-04, train_time=0.098 -[v016] 2022-01-31 07:55:32,410 (trainer:653) INFO: 149epoch:train:460-486batch: iter_time=0.004, forward_time=0.031, loss=1.218, loss_att=0.525, loss_ctc=1.912, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.108e-04, train_time=0.095 -[v016] 2022-01-31 07:55:34,870 (trainer:653) INFO: 149epoch:train:487-513batch: iter_time=7.936e-05, forward_time=0.032, loss=1.086, loss_att=0.541, loss_ctc=1.631, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.108e-04, train_time=0.091 -[v016] 2022-01-31 07:55:37,666 (trainer:653) INFO: 149epoch:train:514-540batch: iter_time=0.011, forward_time=0.032, loss=1.245, loss_att=0.576, loss_ctc=1.914, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.108e-04, train_time=0.103 -[v016] 2022-01-31 07:56:12,025 (trainer:328) INFO: 149epoch results: [train] iter_time=0.002, forward_time=0.032, loss=1.189, loss_att=0.520, loss_ctc=1.857, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.110e-04, train_time=0.094, time=51.46 seconds, total_count=81503, gpu_max_cached_mem_GB=5.824, [valid] loss=7.724, loss_att=6.301, loss_ctc=9.147, acc=0.905, cer=0.100, wer=0.403, cer_ctc=0.145, time=5.77 seconds, total_count=26522, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.89 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:56:14,478 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 07:56:14,488 (trainer:261) INFO: 150/200epoch started. Estimated time to finish: 1 hour, 30 minutes and 9.04 seconds -[v016] 2022-01-31 07:56:17,214 (trainer:653) INFO: 150epoch:train:1-27batch: iter_time=0.004, forward_time=0.034, loss=1.217, loss_att=0.480, loss_ctc=1.954, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.108e-04, train_time=0.101 -[v016] 2022-01-31 07:56:19,680 (trainer:653) INFO: 150epoch:train:28-54batch: iter_time=7.813e-05, forward_time=0.032, loss=1.039, loss_att=0.437, loss_ctc=1.641, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.107e-04, train_time=0.091 -[v016] 2022-01-31 07:56:22,204 (trainer:653) INFO: 150epoch:train:55-81batch: iter_time=7.604e-05, forward_time=0.032, loss=1.140, loss_att=0.479, loss_ctc=1.801, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.107e-04, train_time=0.093 -[v016] 2022-01-31 07:56:24,688 (trainer:653) INFO: 150epoch:train:82-108batch: iter_time=7.473e-05, forward_time=0.032, loss=1.114, loss_att=0.533, loss_ctc=1.695, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.107e-04, train_time=0.092 -[v016] 2022-01-31 07:56:27,106 (trainer:653) INFO: 150epoch:train:109-135batch: iter_time=7.453e-05, forward_time=0.031, loss=1.263, loss_att=0.558, loss_ctc=1.968, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.107e-04, train_time=0.089 -[v016] 2022-01-31 07:56:29,584 (trainer:653) INFO: 150epoch:train:136-162batch: iter_time=7.359e-05, forward_time=0.032, loss=1.201, loss_att=0.577, loss_ctc=1.826, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.107e-04, train_time=0.092 -[v016] 2022-01-31 07:56:32,062 (trainer:653) INFO: 150epoch:train:163-189batch: iter_time=8.168e-05, forward_time=0.033, loss=1.051, loss_att=0.513, loss_ctc=1.589, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.106e-04, train_time=0.092 -[v016] 2022-01-31 07:56:34,617 (trainer:653) INFO: 150epoch:train:190-216batch: iter_time=7.907e-05, forward_time=0.033, loss=1.275, loss_att=0.612, loss_ctc=1.938, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.106e-04, train_time=0.094 -[v016] 2022-01-31 07:56:37,158 (trainer:653) INFO: 150epoch:train:217-243batch: iter_time=7.541e-05, forward_time=0.033, loss=1.337, loss_att=0.490, loss_ctc=2.185, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.106e-04, train_time=0.094 -[v016] 2022-01-31 07:56:39,870 (trainer:653) INFO: 150epoch:train:244-270batch: iter_time=0.008, forward_time=0.032, loss=1.228, loss_att=0.541, loss_ctc=1.915, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.106e-04, train_time=0.100 -[v016] 2022-01-31 07:56:42,317 (trainer:653) INFO: 150epoch:train:271-297batch: iter_time=7.546e-05, forward_time=0.031, loss=1.162, loss_att=0.496, loss_ctc=1.828, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.106e-04, train_time=0.090 -[v016] 2022-01-31 07:56:44,790 (trainer:653) INFO: 150epoch:train:298-324batch: iter_time=7.409e-05, forward_time=0.032, loss=1.192, loss_att=0.579, loss_ctc=1.805, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.106e-04, train_time=0.091 -[v016] 2022-01-31 07:56:47,365 (trainer:653) INFO: 150epoch:train:325-351batch: iter_time=7.813e-05, forward_time=0.034, loss=1.234, loss_att=0.513, loss_ctc=1.956, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.105e-04, train_time=0.095 -[v016] 2022-01-31 07:56:49,951 (trainer:653) INFO: 150epoch:train:352-378batch: iter_time=8.239e-05, forward_time=0.033, loss=1.245, loss_att=0.475, loss_ctc=2.016, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.105e-04, train_time=0.096 -[v016] 2022-01-31 07:56:52,397 (trainer:653) INFO: 150epoch:train:379-405batch: iter_time=7.463e-05, forward_time=0.032, loss=0.961, loss_att=0.446, loss_ctc=1.475, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.105e-04, train_time=0.090 -[v016] 2022-01-31 07:56:54,844 (trainer:653) INFO: 150epoch:train:406-432batch: iter_time=7.574e-05, forward_time=0.032, loss=1.044, loss_att=0.544, loss_ctc=1.543, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.105e-04, train_time=0.090 -[v016] 2022-01-31 07:56:57,329 (trainer:653) INFO: 150epoch:train:433-459batch: iter_time=8.134e-05, forward_time=0.032, loss=1.124, loss_att=0.504, loss_ctc=1.744, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.105e-04, train_time=0.092 -[v016] 2022-01-31 07:56:59,849 (trainer:653) INFO: 150epoch:train:460-486batch: iter_time=7.523e-05, forward_time=0.032, loss=0.993, loss_att=0.456, loss_ctc=1.530, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.104e-04, train_time=0.093 -[v016] 2022-01-31 07:57:02,290 (trainer:653) INFO: 150epoch:train:487-513batch: iter_time=7.539e-05, forward_time=0.032, loss=1.305, loss_att=0.570, loss_ctc=2.041, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.104e-04, train_time=0.090 -[v016] 2022-01-31 07:57:04,765 (trainer:653) INFO: 150epoch:train:514-540batch: iter_time=8.207e-05, forward_time=0.032, loss=1.264, loss_att=0.597, loss_ctc=1.932, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.104e-04, train_time=0.091 -[v016] 2022-01-31 07:57:39,885 (trainer:328) INFO: 150epoch results: [train] iter_time=6.389e-04, forward_time=0.032, loss=1.168, loss_att=0.520, loss_ctc=1.817, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.106e-04, train_time=0.093, time=50.99 seconds, total_count=82050, gpu_max_cached_mem_GB=5.824, [valid] loss=7.718, loss_att=6.347, loss_ctc=9.089, acc=0.905, cer=0.099, wer=0.400, cer_ctc=0.141, time=6.69 seconds, total_count=26700, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.72 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:57:42,230 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 07:57:42,258 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/144epoch.pth -[v016] 2022-01-31 07:57:42,258 (trainer:261) INFO: 151/200epoch started. Estimated time to finish: 1 hour, 28 minutes and 15.95 seconds -[v016] 2022-01-31 07:57:45,258 (trainer:653) INFO: 151epoch:train:1-27batch: iter_time=0.016, forward_time=0.033, loss=1.152, loss_att=0.518, loss_ctc=1.786, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.104e-04, train_time=0.111 -[v016] 2022-01-31 07:57:47,754 (trainer:653) INFO: 151epoch:train:28-54batch: iter_time=8.164e-05, forward_time=0.033, loss=1.323, loss_att=0.535, loss_ctc=2.111, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.104e-04, train_time=0.092 -[v016] 2022-01-31 07:57:50,217 (trainer:653) INFO: 151epoch:train:55-81batch: iter_time=7.766e-05, forward_time=0.032, loss=0.986, loss_att=0.373, loss_ctc=1.598, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.104e-04, train_time=0.091 -[v016] 2022-01-31 07:57:52,727 (trainer:653) INFO: 151epoch:train:82-108batch: iter_time=8.432e-05, forward_time=0.033, loss=1.236, loss_att=0.561, loss_ctc=1.912, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.103e-04, train_time=0.093 -[v016] 2022-01-31 07:57:55,290 (trainer:653) INFO: 151epoch:train:109-135batch: iter_time=8.247e-05, forward_time=0.034, loss=1.286, loss_att=0.535, loss_ctc=2.038, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.103e-04, train_time=0.095 -[v016] 2022-01-31 07:57:57,760 (trainer:653) INFO: 151epoch:train:136-162batch: iter_time=7.807e-05, forward_time=0.032, loss=1.028, loss_att=0.444, loss_ctc=1.613, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.103e-04, train_time=0.091 -[v016] 2022-01-31 07:58:00,195 (trainer:653) INFO: 151epoch:train:163-189batch: iter_time=7.755e-05, forward_time=0.032, loss=1.128, loss_att=0.534, loss_ctc=1.723, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.103e-04, train_time=0.090 -[v016] 2022-01-31 07:58:02,745 (trainer:653) INFO: 151epoch:train:190-216batch: iter_time=7.929e-05, forward_time=0.033, loss=1.146, loss_att=0.526, loss_ctc=1.766, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.103e-04, train_time=0.094 -[v016] 2022-01-31 07:58:05,232 (trainer:653) INFO: 151epoch:train:217-243batch: iter_time=7.782e-05, forward_time=0.033, loss=1.159, loss_att=0.502, loss_ctc=1.816, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.102e-04, train_time=0.092 -[v016] 2022-01-31 07:58:07,863 (trainer:653) INFO: 151epoch:train:244-270batch: iter_time=1.016e-04, forward_time=0.034, loss=0.957, loss_att=0.447, loss_ctc=1.468, acc=0.979, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.102e-04, train_time=0.097 -[v016] 2022-01-31 07:58:10,703 (trainer:653) INFO: 151epoch:train:271-297batch: iter_time=1.163e-04, forward_time=0.037, loss=1.300, loss_att=0.519, loss_ctc=2.082, acc=0.976, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.102e-04, train_time=0.105 -[v016] 2022-01-31 07:58:14,068 (trainer:653) INFO: 151epoch:train:298-324batch: iter_time=0.008, forward_time=0.043, loss=1.207, loss_att=0.453, loss_ctc=1.961, acc=0.976, backward_time=0.022, optim_step_time=0.033, optim0_lr0=1.102e-04, train_time=0.124 -[v016] 2022-01-31 07:58:16,686 (trainer:653) INFO: 151epoch:train:325-351batch: iter_time=0.004, forward_time=0.032, loss=1.265, loss_att=0.616, loss_ctc=1.915, acc=0.968, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.102e-04, train_time=0.097 -[v016] 2022-01-31 07:58:19,283 (trainer:653) INFO: 151epoch:train:352-378batch: iter_time=1.075e-04, forward_time=0.033, loss=1.227, loss_att=0.583, loss_ctc=1.871, acc=0.975, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.102e-04, train_time=0.096 -[v016] 2022-01-31 07:58:22,035 (trainer:653) INFO: 151epoch:train:379-405batch: iter_time=1.095e-04, forward_time=0.035, loss=1.009, loss_att=0.458, loss_ctc=1.560, acc=0.976, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.101e-04, train_time=0.098 -[v016] 2022-01-31 07:58:24,754 (trainer:653) INFO: 151epoch:train:406-432batch: iter_time=0.002, forward_time=0.034, loss=1.375, loss_att=0.546, loss_ctc=2.204, acc=0.976, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.101e-04, train_time=0.104 -[v016] 2022-01-31 07:58:27,267 (trainer:653) INFO: 151epoch:train:433-459batch: iter_time=8.197e-05, forward_time=0.032, loss=1.129, loss_att=0.542, loss_ctc=1.717, acc=0.973, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.101e-04, train_time=0.093 -[v016] 2022-01-31 07:58:30,027 (trainer:653) INFO: 151epoch:train:460-486batch: iter_time=0.005, forward_time=0.033, loss=1.195, loss_att=0.512, loss_ctc=1.878, acc=0.978, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.101e-04, train_time=0.102 -[v016] 2022-01-31 07:58:32,561 (trainer:653) INFO: 151epoch:train:487-513batch: iter_time=8.067e-05, forward_time=0.032, loss=1.284, loss_att=0.553, loss_ctc=2.016, acc=0.972, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.101e-04, train_time=0.094 -[v016] 2022-01-31 07:58:35,141 (trainer:653) INFO: 151epoch:train:514-540batch: iter_time=8.025e-05, forward_time=0.033, loss=1.183, loss_att=0.510, loss_ctc=1.855, acc=0.977, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.100e-04, train_time=0.095 -[v016] 2022-01-31 07:59:11,291 (trainer:328) INFO: 151epoch results: [train] iter_time=0.002, forward_time=0.034, loss=1.178, loss_att=0.514, loss_ctc=1.842, acc=0.975, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.102e-04, train_time=0.098, time=53.63 seconds, total_count=82597, gpu_max_cached_mem_GB=5.824, [valid] loss=7.742, loss_att=6.320, loss_ctc=9.165, acc=0.905, cer=0.099, wer=0.404, cer_ctc=0.146, time=6.3 seconds, total_count=26878, gpu_max_cached_mem_GB=5.824, [att_plot] time=29.09 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 07:59:13,405 (trainer:375) INFO: The best model has been updated: train.acc -[v016] 2022-01-31 07:59:13,446 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/143epoch.pth -[v016] 2022-01-31 07:59:13,449 (trainer:261) INFO: 152/200epoch started. Estimated time to finish: 1 hour, 26 minutes and 24.52 seconds -[v016] 2022-01-31 07:59:16,611 (trainer:653) INFO: 152epoch:train:1-27batch: iter_time=0.024, forward_time=0.031, loss=0.870, loss_att=0.419, loss_ctc=1.321, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.100e-04, train_time=0.117 -[v016] 2022-01-31 07:59:19,064 (trainer:653) INFO: 152epoch:train:28-54batch: iter_time=8.611e-05, forward_time=0.031, loss=1.195, loss_att=0.519, loss_ctc=1.871, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.100e-04, train_time=0.091 -[v016] 2022-01-31 07:59:21,506 (trainer:653) INFO: 152epoch:train:55-81batch: iter_time=7.724e-05, forward_time=0.031, loss=1.124, loss_att=0.542, loss_ctc=1.705, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.100e-04, train_time=0.090 -[v016] 2022-01-31 07:59:24,003 (trainer:653) INFO: 152epoch:train:82-108batch: iter_time=7.829e-05, forward_time=0.032, loss=1.182, loss_att=0.553, loss_ctc=1.812, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.100e-04, train_time=0.092 -[v016] 2022-01-31 07:59:26,564 (trainer:653) INFO: 152epoch:train:109-135batch: iter_time=1.680e-04, forward_time=0.032, loss=1.090, loss_att=0.414, loss_ctc=1.766, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.099e-04, train_time=0.095 -[v016] 2022-01-31 07:59:29,017 (trainer:653) INFO: 152epoch:train:136-162batch: iter_time=8.798e-05, forward_time=0.031, loss=1.004, loss_att=0.439, loss_ctc=1.569, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.099e-04, train_time=0.091 -[v016] 2022-01-31 07:59:31,543 (trainer:653) INFO: 152epoch:train:163-189batch: iter_time=9.968e-05, forward_time=0.032, loss=1.168, loss_att=0.535, loss_ctc=1.801, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.099e-04, train_time=0.093 -[v016] 2022-01-31 07:59:34,127 (trainer:653) INFO: 152epoch:train:190-216batch: iter_time=9.299e-05, forward_time=0.032, loss=1.172, loss_att=0.467, loss_ctc=1.877, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.099e-04, train_time=0.095 -[v016] 2022-01-31 07:59:36,850 (trainer:653) INFO: 152epoch:train:217-243batch: iter_time=0.002, forward_time=0.032, loss=1.281, loss_att=0.571, loss_ctc=1.991, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.099e-04, train_time=0.101 -[v016] 2022-01-31 07:59:39,511 (trainer:653) INFO: 152epoch:train:244-270batch: iter_time=0.003, forward_time=0.033, loss=1.306, loss_att=0.578, loss_ctc=2.034, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.099e-04, train_time=0.098 -[v016] 2022-01-31 07:59:42,024 (trainer:653) INFO: 152epoch:train:271-297batch: iter_time=8.516e-05, forward_time=0.032, loss=1.284, loss_att=0.545, loss_ctc=2.024, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.098e-04, train_time=0.093 -[v016] 2022-01-31 07:59:44,536 (trainer:653) INFO: 152epoch:train:298-324batch: iter_time=8.946e-05, forward_time=0.032, loss=1.245, loss_att=0.553, loss_ctc=1.938, acc=0.973, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.098e-04, train_time=0.093 -[v016] 2022-01-31 07:59:47,285 (trainer:653) INFO: 152epoch:train:325-351batch: iter_time=1.296e-04, forward_time=0.034, loss=1.295, loss_att=0.522, loss_ctc=2.069, acc=0.976, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.098e-04, train_time=0.102 -[v016] 2022-01-31 07:59:50,023 (trainer:653) INFO: 152epoch:train:352-378batch: iter_time=0.004, forward_time=0.033, loss=1.318, loss_att=0.577, loss_ctc=2.060, acc=0.975, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.098e-04, train_time=0.101 -[v016] 2022-01-31 07:59:52,700 (trainer:653) INFO: 152epoch:train:379-405batch: iter_time=1.103e-04, forward_time=0.034, loss=1.176, loss_att=0.543, loss_ctc=1.810, acc=0.973, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.098e-04, train_time=0.099 -[v016] 2022-01-31 07:59:55,363 (trainer:653) INFO: 152epoch:train:406-432batch: iter_time=5.984e-04, forward_time=0.033, loss=1.142, loss_att=0.542, loss_ctc=1.742, acc=0.975, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.098e-04, train_time=0.098 -[v016] 2022-01-31 07:59:58,106 (trainer:653) INFO: 152epoch:train:433-459batch: iter_time=1.111e-04, forward_time=0.035, loss=1.347, loss_att=0.558, loss_ctc=2.136, acc=0.975, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.097e-04, train_time=0.101 -[v016] 2022-01-31 08:00:00,860 (trainer:653) INFO: 152epoch:train:460-486batch: iter_time=1.076e-04, forward_time=0.035, loss=0.880, loss_att=0.391, loss_ctc=1.369, acc=0.982, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.097e-04, train_time=0.102 -[v016] 2022-01-31 08:00:03,481 (trainer:653) INFO: 152epoch:train:487-513batch: iter_time=1.086e-04, forward_time=0.033, loss=1.024, loss_att=0.463, loss_ctc=1.586, acc=0.977, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.097e-04, train_time=0.097 -[v016] 2022-01-31 08:00:06,133 (trainer:653) INFO: 152epoch:train:514-540batch: iter_time=1.050e-04, forward_time=0.034, loss=1.285, loss_att=0.484, loss_ctc=2.085, acc=0.978, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.097e-04, train_time=0.098 -[v016] 2022-01-31 08:00:44,234 (trainer:328) INFO: 152epoch results: [train] iter_time=0.002, forward_time=0.033, loss=1.170, loss_att=0.511, loss_ctc=1.829, acc=0.976, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.098e-04, train_time=0.097, time=53.45 seconds, total_count=83144, gpu_max_cached_mem_GB=5.824, [valid] loss=7.624, loss_att=6.304, loss_ctc=8.944, acc=0.904, cer=0.101, wer=0.408, cer_ctc=0.143, time=5.93 seconds, total_count=27056, gpu_max_cached_mem_GB=5.824, [att_plot] time=31.41 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:00:46,470 (trainer:375) INFO: The best model has been updated: train.acc -[v016] 2022-01-31 08:00:46,533 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/146epoch.pth, exp/asr_train_asr_raw_en_word/148epoch.pth -[v016] 2022-01-31 08:00:46,533 (trainer:261) INFO: 153/200epoch started. Estimated time to finish: 1 hour, 24 minutes and 34.09 seconds -[v016] 2022-01-31 08:00:49,892 (trainer:653) INFO: 153epoch:train:1-27batch: iter_time=0.023, forward_time=0.033, loss=1.101, loss_att=0.518, loss_ctc=1.683, acc=0.974, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.097e-04, train_time=0.122 -[v016] 2022-01-31 08:00:53,091 (trainer:653) INFO: 153epoch:train:28-54batch: iter_time=0.021, forward_time=0.033, loss=0.996, loss_att=0.416, loss_ctc=1.577, acc=0.981, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.096e-04, train_time=0.120 -[v016] 2022-01-31 08:00:56,060 (trainer:653) INFO: 153epoch:train:55-81batch: iter_time=0.018, forward_time=0.031, loss=1.078, loss_att=0.536, loss_ctc=1.620, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.096e-04, train_time=0.110 -[v016] 2022-01-31 08:00:58,793 (trainer:653) INFO: 153epoch:train:82-108batch: iter_time=1.030e-04, forward_time=0.035, loss=1.149, loss_att=0.514, loss_ctc=1.784, acc=0.971, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.096e-04, train_time=0.101 -[v016] 2022-01-31 08:01:01,725 (trainer:653) INFO: 153epoch:train:109-135batch: iter_time=0.005, forward_time=0.036, loss=1.247, loss_att=0.455, loss_ctc=2.039, acc=0.980, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.096e-04, train_time=0.108 -[v016] 2022-01-31 08:01:04,439 (trainer:653) INFO: 153epoch:train:136-162batch: iter_time=1.105e-04, forward_time=0.034, loss=1.194, loss_att=0.528, loss_ctc=1.861, acc=0.974, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.096e-04, train_time=0.100 -[v016] 2022-01-31 08:01:07,213 (trainer:653) INFO: 153epoch:train:163-189batch: iter_time=0.006, forward_time=0.033, loss=1.089, loss_att=0.476, loss_ctc=1.702, acc=0.979, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.096e-04, train_time=0.103 -[v016] 2022-01-31 08:01:09,985 (trainer:653) INFO: 153epoch:train:190-216batch: iter_time=1.379e-04, forward_time=0.035, loss=1.143, loss_att=0.483, loss_ctc=1.803, acc=0.980, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.095e-04, train_time=0.102 -[v016] 2022-01-31 08:01:13,217 (trainer:653) INFO: 153epoch:train:217-243batch: iter_time=0.022, forward_time=0.034, loss=0.978, loss_att=0.468, loss_ctc=1.488, acc=0.977, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.095e-04, train_time=0.119 -[v016] 2022-01-31 08:01:15,916 (trainer:653) INFO: 153epoch:train:244-270batch: iter_time=1.135e-04, forward_time=0.033, loss=1.277, loss_att=0.576, loss_ctc=1.978, acc=0.972, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.095e-04, train_time=0.100 -[v016] 2022-01-31 08:01:18,711 (trainer:653) INFO: 153epoch:train:271-297batch: iter_time=0.002, forward_time=0.035, loss=1.227, loss_att=0.504, loss_ctc=1.949, acc=0.974, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.095e-04, train_time=0.103 -[v016] 2022-01-31 08:01:24,378 (trainer:653) INFO: 153epoch:train:298-324batch: iter_time=9.927e-05, forward_time=0.125, loss=1.101, loss_att=0.550, loss_ctc=1.651, acc=0.972, backward_time=0.041, optim_step_time=0.023, optim0_lr0=1.095e-04, train_time=0.210 -[v016] 2022-01-31 08:01:27,562 (trainer:653) INFO: 153epoch:train:325-351batch: iter_time=0.019, forward_time=0.033, loss=1.072, loss_att=0.452, loss_ctc=1.692, acc=0.979, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.094e-04, train_time=0.118 -[v016] 2022-01-31 08:01:30,239 (trainer:653) INFO: 153epoch:train:352-378batch: iter_time=0.002, forward_time=0.033, loss=1.366, loss_att=0.657, loss_ctc=2.075, acc=0.971, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.094e-04, train_time=0.099 -[v016] 2022-01-31 08:01:33,706 (trainer:653) INFO: 153epoch:train:379-405batch: iter_time=0.031, forward_time=0.033, loss=0.984, loss_att=0.438, loss_ctc=1.530, acc=0.979, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.094e-04, train_time=0.128 -[v016] 2022-01-31 08:01:36,991 (trainer:653) INFO: 153epoch:train:406-432batch: iter_time=0.024, forward_time=0.033, loss=1.373, loss_att=0.622, loss_ctc=2.124, acc=0.969, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.094e-04, train_time=0.121 -[v016] 2022-01-31 08:01:39,550 (trainer:653) INFO: 153epoch:train:433-459batch: iter_time=0.003, forward_time=0.031, loss=1.289, loss_att=0.514, loss_ctc=2.065, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.094e-04, train_time=0.095 -[v016] 2022-01-31 08:01:43,511 (trainer:653) INFO: 153epoch:train:460-486batch: iter_time=0.038, forward_time=0.037, loss=1.247, loss_att=0.590, loss_ctc=1.905, acc=0.971, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.094e-04, train_time=0.144 -[v016] 2022-01-31 08:01:46,302 (trainer:653) INFO: 153epoch:train:487-513batch: iter_time=0.004, forward_time=0.033, loss=1.231, loss_att=0.572, loss_ctc=1.890, acc=0.972, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.093e-04, train_time=0.105 -[v016] 2022-01-31 08:01:49,171 (trainer:653) INFO: 153epoch:train:514-540batch: iter_time=0.005, forward_time=0.035, loss=1.549, loss_att=0.601, loss_ctc=2.497, acc=0.977, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.093e-04, train_time=0.106 -[v016] 2022-01-31 08:02:32,266 (trainer:328) INFO: 153epoch results: [train] iter_time=0.011, forward_time=0.038, loss=1.184, loss_att=0.524, loss_ctc=1.843, acc=0.975, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.095e-04, train_time=0.115, time=1 minute and 3.4 seconds, total_count=83691, gpu_max_cached_mem_GB=5.824, [valid] loss=7.608, loss_att=6.317, loss_ctc=8.900, acc=0.905, cer=0.099, wer=0.396, cer_ctc=0.141, time=13.48 seconds, total_count=27234, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.85 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:02:34,808 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 08:02:34,838 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/147epoch.pth -[v016] 2022-01-31 08:02:34,838 (trainer:261) INFO: 154/200epoch started. Estimated time to finish: 1 hour, 22 minutes and 49.29 seconds -[v016] 2022-01-31 08:02:38,931 (trainer:653) INFO: 154epoch:train:1-27batch: iter_time=0.005, forward_time=0.053, loss=0.709, loss_att=0.322, loss_ctc=1.096, acc=0.984, backward_time=0.048, optim_step_time=0.022, optim0_lr0=1.093e-04, train_time=0.149 -[v016] 2022-01-31 08:02:41,502 (trainer:653) INFO: 154epoch:train:28-54batch: iter_time=8.480e-05, forward_time=0.033, loss=1.193, loss_att=0.509, loss_ctc=1.878, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.093e-04, train_time=0.095 -[v016] 2022-01-31 08:02:44,049 (trainer:653) INFO: 154epoch:train:55-81batch: iter_time=8.787e-04, forward_time=0.033, loss=1.299, loss_att=0.568, loss_ctc=2.029, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.093e-04, train_time=0.094 -[v016] 2022-01-31 08:02:46,522 (trainer:653) INFO: 154epoch:train:82-108batch: iter_time=8.753e-05, forward_time=0.032, loss=1.114, loss_att=0.520, loss_ctc=1.709, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.092e-04, train_time=0.091 -[v016] 2022-01-31 08:02:49,213 (trainer:653) INFO: 154epoch:train:109-135batch: iter_time=0.010, forward_time=0.031, loss=1.094, loss_att=0.544, loss_ctc=1.644, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.092e-04, train_time=0.099 -[v016] 2022-01-31 08:02:51,623 (trainer:653) INFO: 154epoch:train:136-162batch: iter_time=7.639e-04, forward_time=0.030, loss=0.875, loss_att=0.445, loss_ctc=1.306, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.092e-04, train_time=0.089 -[v016] 2022-01-31 08:02:54,164 (trainer:653) INFO: 154epoch:train:163-189batch: iter_time=0.004, forward_time=0.030, loss=1.034, loss_att=0.471, loss_ctc=1.596, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.092e-04, train_time=0.094 -[v016] 2022-01-31 08:02:56,620 (trainer:653) INFO: 154epoch:train:190-216batch: iter_time=6.097e-04, forward_time=0.030, loss=0.966, loss_att=0.410, loss_ctc=1.523, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.092e-04, train_time=0.091 -[v016] 2022-01-31 08:02:59,672 (trainer:653) INFO: 154epoch:train:217-243batch: iter_time=0.018, forward_time=0.033, loss=1.156, loss_att=0.500, loss_ctc=1.812, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.092e-04, train_time=0.113 -[v016] 2022-01-31 08:03:02,325 (trainer:653) INFO: 154epoch:train:244-270batch: iter_time=0.003, forward_time=0.033, loss=1.287, loss_att=0.505, loss_ctc=2.069, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.091e-04, train_time=0.098 -[v016] 2022-01-31 08:03:04,767 (trainer:653) INFO: 154epoch:train:271-297batch: iter_time=8.408e-05, forward_time=0.031, loss=1.123, loss_att=0.474, loss_ctc=1.773, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.091e-04, train_time=0.090 -[v016] 2022-01-31 08:03:07,461 (trainer:653) INFO: 154epoch:train:298-324batch: iter_time=8.974e-05, forward_time=0.034, loss=1.416, loss_att=0.545, loss_ctc=2.286, acc=0.977, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.091e-04, train_time=0.100 -[v016] 2022-01-31 08:03:10,023 (trainer:653) INFO: 154epoch:train:325-351batch: iter_time=9.158e-05, forward_time=0.033, loss=1.129, loss_att=0.486, loss_ctc=1.773, acc=0.975, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.091e-04, train_time=0.095 -[v016] 2022-01-31 08:03:13,054 (trainer:653) INFO: 154epoch:train:352-378batch: iter_time=0.017, forward_time=0.033, loss=1.239, loss_att=0.493, loss_ctc=1.985, acc=0.977, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.091e-04, train_time=0.112 -[v016] 2022-01-31 08:03:15,806 (trainer:653) INFO: 154epoch:train:379-405batch: iter_time=0.007, forward_time=0.033, loss=1.357, loss_att=0.581, loss_ctc=2.132, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.091e-04, train_time=0.102 -[v016] 2022-01-31 08:03:18,262 (trainer:653) INFO: 154epoch:train:406-432batch: iter_time=8.464e-05, forward_time=0.031, loss=1.138, loss_att=0.527, loss_ctc=1.749, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.090e-04, train_time=0.091 -[v016] 2022-01-31 08:03:20,743 (trainer:653) INFO: 154epoch:train:433-459batch: iter_time=0.004, forward_time=0.030, loss=1.129, loss_att=0.539, loss_ctc=1.719, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.090e-04, train_time=0.092 -[v016] 2022-01-31 08:03:23,360 (trainer:653) INFO: 154epoch:train:460-486batch: iter_time=5.575e-04, forward_time=0.031, loss=1.232, loss_att=0.514, loss_ctc=1.950, acc=0.978, backward_time=0.021, optim_step_time=0.026, optim0_lr0=1.090e-04, train_time=0.097 -[v016] 2022-01-31 08:03:25,802 (trainer:653) INFO: 154epoch:train:487-513batch: iter_time=8.334e-05, forward_time=0.031, loss=1.137, loss_att=0.576, loss_ctc=1.698, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.090e-04, train_time=0.090 -[v016] 2022-01-31 08:03:28,958 (trainer:653) INFO: 154epoch:train:514-540batch: iter_time=0.021, forward_time=0.033, loss=1.323, loss_att=0.504, loss_ctc=2.143, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.090e-04, train_time=0.117 -[v016] 2022-01-31 08:04:02,840 (trainer:328) INFO: 154epoch results: [train] iter_time=0.005, forward_time=0.033, loss=1.145, loss_att=0.501, loss_ctc=1.789, acc=0.976, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.091e-04, train_time=0.100, time=54.81 seconds, total_count=84238, gpu_max_cached_mem_GB=5.824, [valid] loss=7.651, loss_att=6.280, loss_ctc=9.021, acc=0.907, cer=0.098, wer=0.398, cer_ctc=0.138, time=5.6 seconds, total_count=27412, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.57 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:04:05,304 (trainer:375) INFO: The best model has been updated: train.loss -[v016] 2022-01-31 08:04:05,315 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/145epoch.pth -[v016] 2022-01-31 08:04:05,315 (trainer:261) INFO: 155/200epoch started. Estimated time to finish: 1 hour, 20 minutes and 58.33 seconds -[v016] 2022-01-31 08:04:07,995 (trainer:653) INFO: 155epoch:train:1-27batch: iter_time=0.004, forward_time=0.033, loss=1.244, loss_att=0.560, loss_ctc=1.928, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.089e-04, train_time=0.099 -[v016] 2022-01-31 08:04:10,426 (trainer:653) INFO: 155epoch:train:28-54batch: iter_time=8.170e-05, forward_time=0.031, loss=1.196, loss_att=0.574, loss_ctc=1.818, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.089e-04, train_time=0.090 -[v016] 2022-01-31 08:04:12,860 (trainer:653) INFO: 155epoch:train:55-81batch: iter_time=7.719e-05, forward_time=0.031, loss=1.049, loss_att=0.496, loss_ctc=1.603, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.089e-04, train_time=0.090 -[v016] 2022-01-31 08:04:15,372 (trainer:653) INFO: 155epoch:train:82-108batch: iter_time=7.788e-05, forward_time=0.032, loss=1.393, loss_att=0.565, loss_ctc=2.220, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.089e-04, train_time=0.093 -[v016] 2022-01-31 08:04:17,801 (trainer:653) INFO: 155epoch:train:109-135batch: iter_time=7.608e-05, forward_time=0.032, loss=0.950, loss_att=0.450, loss_ctc=1.449, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.089e-04, train_time=0.090 -[v016] 2022-01-31 08:04:20,394 (trainer:653) INFO: 155epoch:train:136-162batch: iter_time=7.826e-05, forward_time=0.033, loss=1.225, loss_att=0.492, loss_ctc=1.957, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.089e-04, train_time=0.096 -[v016] 2022-01-31 08:04:22,898 (trainer:653) INFO: 155epoch:train:163-189batch: iter_time=8.465e-05, forward_time=0.032, loss=1.095, loss_att=0.497, loss_ctc=1.692, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.088e-04, train_time=0.092 -[v016] 2022-01-31 08:04:25,389 (trainer:653) INFO: 155epoch:train:190-216batch: iter_time=7.763e-05, forward_time=0.032, loss=1.302, loss_att=0.601, loss_ctc=2.003, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.088e-04, train_time=0.092 -[v016] 2022-01-31 08:04:27,793 (trainer:653) INFO: 155epoch:train:217-243batch: iter_time=7.627e-05, forward_time=0.031, loss=1.020, loss_att=0.528, loss_ctc=1.513, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.088e-04, train_time=0.089 -[v016] 2022-01-31 08:04:30,580 (trainer:653) INFO: 155epoch:train:244-270batch: iter_time=0.010, forward_time=0.032, loss=1.273, loss_att=0.469, loss_ctc=2.077, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.088e-04, train_time=0.103 -[v016] 2022-01-31 08:04:33,101 (trainer:653) INFO: 155epoch:train:271-297batch: iter_time=7.771e-05, forward_time=0.033, loss=1.177, loss_att=0.495, loss_ctc=1.860, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.088e-04, train_time=0.093 -[v016] 2022-01-31 08:04:35,627 (trainer:653) INFO: 155epoch:train:298-324batch: iter_time=7.818e-05, forward_time=0.032, loss=1.106, loss_att=0.482, loss_ctc=1.729, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.088e-04, train_time=0.093 -[v016] 2022-01-31 08:04:38,039 (trainer:653) INFO: 155epoch:train:325-351batch: iter_time=7.448e-05, forward_time=0.031, loss=1.052, loss_att=0.497, loss_ctc=1.608, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.087e-04, train_time=0.089 -[v016] 2022-01-31 08:04:40,564 (trainer:653) INFO: 155epoch:train:352-378batch: iter_time=9.032e-05, forward_time=0.033, loss=1.255, loss_att=0.497, loss_ctc=2.013, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.087e-04, train_time=0.093 -[v016] 2022-01-31 08:04:43,070 (trainer:653) INFO: 155epoch:train:379-405batch: iter_time=7.582e-05, forward_time=0.032, loss=1.091, loss_att=0.463, loss_ctc=1.718, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.087e-04, train_time=0.093 -[v016] 2022-01-31 08:04:45,541 (trainer:653) INFO: 155epoch:train:406-432batch: iter_time=7.804e-05, forward_time=0.032, loss=1.080, loss_att=0.462, loss_ctc=1.698, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.087e-04, train_time=0.091 -[v016] 2022-01-31 08:04:48,114 (trainer:653) INFO: 155epoch:train:433-459batch: iter_time=8.259e-05, forward_time=0.033, loss=1.258, loss_att=0.481, loss_ctc=2.035, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.087e-04, train_time=0.095 -[v016] 2022-01-31 08:04:50,583 (trainer:653) INFO: 155epoch:train:460-486batch: iter_time=8.028e-05, forward_time=0.032, loss=1.286, loss_att=0.557, loss_ctc=2.014, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.086e-04, train_time=0.091 -[v016] 2022-01-31 08:04:53,088 (trainer:653) INFO: 155epoch:train:487-513batch: iter_time=7.852e-05, forward_time=0.032, loss=1.286, loss_att=0.590, loss_ctc=1.982, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.086e-04, train_time=0.093 -[v016] 2022-01-31 08:04:55,600 (trainer:653) INFO: 155epoch:train:514-540batch: iter_time=8.299e-05, forward_time=0.032, loss=1.235, loss_att=0.541, loss_ctc=1.928, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.086e-04, train_time=0.093 -[v016] 2022-01-31 08:05:30,447 (trainer:328) INFO: 155epoch results: [train] iter_time=7.278e-04, forward_time=0.032, loss=1.179, loss_att=0.515, loss_ctc=1.844, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.088e-04, train_time=0.093, time=51.01 seconds, total_count=84785, gpu_max_cached_mem_GB=5.824, [valid] loss=7.787, loss_att=6.424, loss_ctc=9.150, acc=0.904, cer=0.099, wer=0.400, cer_ctc=0.142, time=6.49 seconds, total_count=27590, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.63 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:05:32,558 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 08:05:32,593 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/153epoch.pth -[v016] 2022-01-31 08:05:32,593 (trainer:261) INFO: 156/200epoch started. Estimated time to finish: 1 hour, 19 minutes and 6.6 seconds -[v016] 2022-01-31 08:05:35,231 (trainer:653) INFO: 156epoch:train:1-27batch: iter_time=0.003, forward_time=0.033, loss=1.097, loss_att=0.451, loss_ctc=1.742, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.086e-04, train_time=0.097 -[v016] 2022-01-31 08:05:37,775 (trainer:653) INFO: 156epoch:train:28-54batch: iter_time=8.637e-05, forward_time=0.033, loss=1.187, loss_att=0.494, loss_ctc=1.880, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.086e-04, train_time=0.094 -[v016] 2022-01-31 08:05:40,165 (trainer:653) INFO: 156epoch:train:55-81batch: iter_time=7.639e-05, forward_time=0.031, loss=0.943, loss_att=0.422, loss_ctc=1.464, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.086e-04, train_time=0.088 -[v016] 2022-01-31 08:05:42,684 (trainer:653) INFO: 156epoch:train:82-108batch: iter_time=7.735e-05, forward_time=0.032, loss=1.180, loss_att=0.482, loss_ctc=1.879, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.085e-04, train_time=0.093 -[v016] 2022-01-31 08:05:45,139 (trainer:653) INFO: 156epoch:train:109-135batch: iter_time=8.117e-05, forward_time=0.032, loss=0.995, loss_att=0.533, loss_ctc=1.456, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.085e-04, train_time=0.091 -[v016] 2022-01-31 08:05:47,675 (trainer:653) INFO: 156epoch:train:136-162batch: iter_time=7.675e-05, forward_time=0.033, loss=1.095, loss_att=0.405, loss_ctc=1.784, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.085e-04, train_time=0.094 -[v016] 2022-01-31 08:05:50,565 (trainer:653) INFO: 156epoch:train:163-189batch: iter_time=0.014, forward_time=0.033, loss=0.906, loss_att=0.385, loss_ctc=1.427, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.085e-04, train_time=0.107 -[v016] 2022-01-31 08:05:53,102 (trainer:653) INFO: 156epoch:train:190-216batch: iter_time=7.781e-05, forward_time=0.033, loss=1.152, loss_att=0.502, loss_ctc=1.801, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.085e-04, train_time=0.094 -[v016] 2022-01-31 08:05:55,663 (trainer:653) INFO: 156epoch:train:217-243batch: iter_time=7.720e-05, forward_time=0.033, loss=1.157, loss_att=0.514, loss_ctc=1.799, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.085e-04, train_time=0.095 -[v016] 2022-01-31 08:05:58,193 (trainer:653) INFO: 156epoch:train:244-270batch: iter_time=7.727e-05, forward_time=0.033, loss=1.272, loss_att=0.534, loss_ctc=2.010, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.084e-04, train_time=0.093 -[v016] 2022-01-31 08:06:00,772 (trainer:653) INFO: 156epoch:train:271-297batch: iter_time=8.683e-05, forward_time=0.034, loss=1.275, loss_att=0.561, loss_ctc=1.988, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.084e-04, train_time=0.095 -[v016] 2022-01-31 08:06:03,822 (trainer:653) INFO: 156epoch:train:298-324batch: iter_time=0.021, forward_time=0.032, loss=1.096, loss_att=0.451, loss_ctc=1.742, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.084e-04, train_time=0.113 -[v016] 2022-01-31 08:06:06,385 (trainer:653) INFO: 156epoch:train:325-351batch: iter_time=7.755e-05, forward_time=0.033, loss=1.105, loss_att=0.446, loss_ctc=1.763, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.084e-04, train_time=0.095 -[v016] 2022-01-31 08:06:08,865 (trainer:653) INFO: 156epoch:train:352-378batch: iter_time=9.537e-04, forward_time=0.032, loss=1.026, loss_att=0.492, loss_ctc=1.560, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.084e-04, train_time=0.092 -[v016] 2022-01-31 08:06:11,278 (trainer:653) INFO: 156epoch:train:379-405batch: iter_time=7.687e-05, forward_time=0.032, loss=1.226, loss_att=0.517, loss_ctc=1.936, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.084e-04, train_time=0.089 -[v016] 2022-01-31 08:06:13,815 (trainer:653) INFO: 156epoch:train:406-432batch: iter_time=0.001, forward_time=0.032, loss=1.198, loss_att=0.511, loss_ctc=1.884, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.083e-04, train_time=0.094 -[v016] 2022-01-31 08:06:16,326 (trainer:653) INFO: 156epoch:train:433-459batch: iter_time=8.472e-05, forward_time=0.033, loss=1.114, loss_att=0.521, loss_ctc=1.708, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.083e-04, train_time=0.093 -[v016] 2022-01-31 08:06:18,731 (trainer:653) INFO: 156epoch:train:460-486batch: iter_time=7.652e-05, forward_time=0.031, loss=1.130, loss_att=0.570, loss_ctc=1.690, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.083e-04, train_time=0.089 -[v016] 2022-01-31 08:06:21,214 (trainer:653) INFO: 156epoch:train:487-513batch: iter_time=7.882e-05, forward_time=0.032, loss=1.191, loss_att=0.534, loss_ctc=1.848, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.083e-04, train_time=0.092 -[v016] 2022-01-31 08:06:23,707 (trainer:653) INFO: 156epoch:train:514-540batch: iter_time=7.631e-05, forward_time=0.032, loss=1.128, loss_att=0.508, loss_ctc=1.747, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.083e-04, train_time=0.092 -[v016] 2022-01-31 08:06:57,267 (trainer:328) INFO: 156epoch results: [train] iter_time=0.002, forward_time=0.032, loss=1.127, loss_att=0.494, loss_ctc=1.760, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.084e-04, train_time=0.094, time=51.86 seconds, total_count=85332, gpu_max_cached_mem_GB=5.824, [valid] loss=7.735, loss_att=6.401, loss_ctc=9.069, acc=0.905, cer=0.097, wer=0.397, cer_ctc=0.140, time=5.55 seconds, total_count=27768, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.25 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:06:59,397 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 08:06:59,449 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/149epoch.pth, exp/asr_train_asr_raw_en_word/155epoch.pth -[v016] 2022-01-31 08:06:59,449 (trainer:261) INFO: 157/200epoch started. Estimated time to finish: 1 hour, 17 minutes and 15.09 seconds -[v016] 2022-01-31 08:07:02,091 (trainer:653) INFO: 157epoch:train:1-27batch: iter_time=0.003, forward_time=0.033, loss=1.075, loss_att=0.495, loss_ctc=1.654, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.082e-04, train_time=0.097 -[v016] 2022-01-31 08:07:04,618 (trainer:653) INFO: 157epoch:train:28-54batch: iter_time=8.452e-05, forward_time=0.033, loss=0.944, loss_att=0.416, loss_ctc=1.472, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.082e-04, train_time=0.093 -[v016] 2022-01-31 08:07:07,218 (trainer:653) INFO: 157epoch:train:55-81batch: iter_time=0.006, forward_time=0.031, loss=1.060, loss_att=0.437, loss_ctc=1.683, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.082e-04, train_time=0.096 -[v016] 2022-01-31 08:07:09,674 (trainer:653) INFO: 157epoch:train:82-108batch: iter_time=7.570e-05, forward_time=0.032, loss=0.939, loss_att=0.418, loss_ctc=1.461, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.082e-04, train_time=0.091 -[v016] 2022-01-31 08:07:12,199 (trainer:653) INFO: 157epoch:train:109-135batch: iter_time=7.943e-05, forward_time=0.033, loss=1.171, loss_att=0.478, loss_ctc=1.864, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.082e-04, train_time=0.093 -[v016] 2022-01-31 08:07:14,722 (trainer:653) INFO: 157epoch:train:136-162batch: iter_time=7.815e-05, forward_time=0.033, loss=1.155, loss_att=0.420, loss_ctc=1.891, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.082e-04, train_time=0.093 -[v016] 2022-01-31 08:07:17,188 (trainer:653) INFO: 157epoch:train:163-189batch: iter_time=7.547e-05, forward_time=0.032, loss=1.214, loss_att=0.542, loss_ctc=1.885, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.081e-04, train_time=0.091 -[v016] 2022-01-31 08:07:19,634 (trainer:653) INFO: 157epoch:train:190-216batch: iter_time=8.124e-05, forward_time=0.032, loss=1.059, loss_att=0.487, loss_ctc=1.631, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.081e-04, train_time=0.090 -[v016] 2022-01-31 08:07:22,181 (trainer:653) INFO: 157epoch:train:217-243batch: iter_time=7.955e-05, forward_time=0.033, loss=1.398, loss_att=0.602, loss_ctc=2.195, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.081e-04, train_time=0.094 -[v016] 2022-01-31 08:07:24,659 (trainer:653) INFO: 157epoch:train:244-270batch: iter_time=7.747e-05, forward_time=0.032, loss=1.140, loss_att=0.494, loss_ctc=1.787, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.081e-04, train_time=0.092 -[v016] 2022-01-31 08:07:27,129 (trainer:653) INFO: 157epoch:train:271-297batch: iter_time=8.151e-05, forward_time=0.032, loss=1.303, loss_att=0.587, loss_ctc=2.019, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.081e-04, train_time=0.091 -[v016] 2022-01-31 08:07:29,682 (trainer:653) INFO: 157epoch:train:298-324batch: iter_time=9.425e-05, forward_time=0.033, loss=1.190, loss_att=0.546, loss_ctc=1.834, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.081e-04, train_time=0.094 -[v016] 2022-01-31 08:07:32,210 (trainer:653) INFO: 157epoch:train:325-351batch: iter_time=8.303e-05, forward_time=0.033, loss=1.214, loss_att=0.535, loss_ctc=1.894, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.080e-04, train_time=0.093 -[v016] 2022-01-31 08:07:34,733 (trainer:653) INFO: 157epoch:train:352-378batch: iter_time=8.496e-05, forward_time=0.033, loss=1.017, loss_att=0.458, loss_ctc=1.576, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.080e-04, train_time=0.093 -[v016] 2022-01-31 08:07:37,661 (trainer:653) INFO: 157epoch:train:379-405batch: iter_time=0.016, forward_time=0.032, loss=1.096, loss_att=0.466, loss_ctc=1.725, acc=0.975, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.080e-04, train_time=0.108 -[v016] 2022-01-31 08:07:40,234 (trainer:653) INFO: 157epoch:train:406-432batch: iter_time=1.141e-04, forward_time=0.033, loss=1.182, loss_att=0.506, loss_ctc=1.858, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.080e-04, train_time=0.095 -[v016] 2022-01-31 08:07:42,697 (trainer:653) INFO: 157epoch:train:433-459batch: iter_time=8.403e-05, forward_time=0.032, loss=1.177, loss_att=0.544, loss_ctc=1.811, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.080e-04, train_time=0.091 -[v016] 2022-01-31 08:07:45,247 (trainer:653) INFO: 157epoch:train:460-486batch: iter_time=7.836e-05, forward_time=0.033, loss=1.204, loss_att=0.484, loss_ctc=1.925, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.080e-04, train_time=0.094 -[v016] 2022-01-31 08:07:47,779 (trainer:653) INFO: 157epoch:train:487-513batch: iter_time=7.720e-05, forward_time=0.032, loss=1.410, loss_att=0.560, loss_ctc=2.260, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.079e-04, train_time=0.094 -[v016] 2022-01-31 08:07:50,287 (trainer:653) INFO: 157epoch:train:514-540batch: iter_time=7.819e-05, forward_time=0.032, loss=1.278, loss_att=0.511, loss_ctc=2.045, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.079e-04, train_time=0.093 -[v016] 2022-01-31 08:08:24,258 (trainer:328) INFO: 157epoch results: [train] iter_time=0.001, forward_time=0.033, loss=1.166, loss_att=0.500, loss_ctc=1.832, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.081e-04, train_time=0.094, time=51.57 seconds, total_count=85879, gpu_max_cached_mem_GB=5.824, [valid] loss=7.804, loss_att=6.422, loss_ctc=9.187, acc=0.906, cer=0.097, wer=0.390, cer_ctc=0.141, time=5.62 seconds, total_count=27946, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.61 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:08:26,747 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 08:08:26,789 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/132epoch.pth -[v016] 2022-01-31 08:08:26,789 (trainer:261) INFO: 158/200epoch started. Estimated time to finish: 1 hour, 15 minutes and 24.1 seconds -[v016] 2022-01-31 08:08:29,485 (trainer:653) INFO: 158epoch:train:1-27batch: iter_time=0.004, forward_time=0.034, loss=1.219, loss_att=0.543, loss_ctc=1.895, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.079e-04, train_time=0.099 -[v016] 2022-01-31 08:08:32,040 (trainer:653) INFO: 158epoch:train:28-54batch: iter_time=9.838e-05, forward_time=0.033, loss=1.117, loss_att=0.456, loss_ctc=1.777, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.079e-04, train_time=0.094 -[v016] 2022-01-31 08:08:34,529 (trainer:653) INFO: 158epoch:train:55-81batch: iter_time=8.852e-05, forward_time=0.032, loss=1.082, loss_att=0.450, loss_ctc=1.715, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.079e-04, train_time=0.092 -[v016] 2022-01-31 08:08:37,018 (trainer:653) INFO: 158epoch:train:82-108batch: iter_time=7.638e-05, forward_time=0.032, loss=1.132, loss_att=0.504, loss_ctc=1.759, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.078e-04, train_time=0.092 -[v016] 2022-01-31 08:08:39,508 (trainer:653) INFO: 158epoch:train:109-135batch: iter_time=1.767e-04, forward_time=0.032, loss=1.116, loss_att=0.497, loss_ctc=1.734, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.078e-04, train_time=0.092 -[v016] 2022-01-31 08:08:41,991 (trainer:653) INFO: 158epoch:train:136-162batch: iter_time=8.286e-05, forward_time=0.032, loss=1.139, loss_att=0.515, loss_ctc=1.763, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.078e-04, train_time=0.092 -[v016] 2022-01-31 08:08:44,434 (trainer:653) INFO: 158epoch:train:163-189batch: iter_time=9.728e-05, forward_time=0.031, loss=1.215, loss_att=0.528, loss_ctc=1.902, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.078e-04, train_time=0.090 -[v016] 2022-01-31 08:08:46,928 (trainer:653) INFO: 158epoch:train:190-216batch: iter_time=7.723e-05, forward_time=0.032, loss=1.251, loss_att=0.540, loss_ctc=1.961, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.078e-04, train_time=0.092 -[v016] 2022-01-31 08:08:49,456 (trainer:653) INFO: 158epoch:train:217-243batch: iter_time=8.731e-05, forward_time=0.033, loss=1.219, loss_att=0.529, loss_ctc=1.910, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.078e-04, train_time=0.093 -[v016] 2022-01-31 08:08:51,966 (trainer:653) INFO: 158epoch:train:244-270batch: iter_time=7.890e-05, forward_time=0.032, loss=1.134, loss_att=0.448, loss_ctc=1.820, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.077e-04, train_time=0.093 -[v016] 2022-01-31 08:08:54,455 (trainer:653) INFO: 158epoch:train:271-297batch: iter_time=7.611e-05, forward_time=0.032, loss=1.104, loss_att=0.433, loss_ctc=1.775, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.077e-04, train_time=0.092 -[v016] 2022-01-31 08:08:56,918 (trainer:653) INFO: 158epoch:train:298-324batch: iter_time=8.145e-05, forward_time=0.032, loss=0.996, loss_att=0.456, loss_ctc=1.537, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.077e-04, train_time=0.091 -[v016] 2022-01-31 08:08:59,351 (trainer:653) INFO: 158epoch:train:325-351batch: iter_time=7.692e-05, forward_time=0.031, loss=1.092, loss_att=0.523, loss_ctc=1.662, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.077e-04, train_time=0.090 -[v016] 2022-01-31 08:09:01,811 (trainer:653) INFO: 158epoch:train:352-378batch: iter_time=7.600e-05, forward_time=0.032, loss=1.126, loss_att=0.455, loss_ctc=1.798, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.077e-04, train_time=0.091 -[v016] 2022-01-31 08:09:04,356 (trainer:653) INFO: 158epoch:train:379-405batch: iter_time=7.745e-05, forward_time=0.033, loss=1.199, loss_att=0.533, loss_ctc=1.864, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.077e-04, train_time=0.094 -[v016] 2022-01-31 08:09:06,831 (trainer:653) INFO: 158epoch:train:406-432batch: iter_time=7.529e-05, forward_time=0.032, loss=0.979, loss_att=0.428, loss_ctc=1.530, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.076e-04, train_time=0.091 -[v016] 2022-01-31 08:09:09,314 (trainer:653) INFO: 158epoch:train:433-459batch: iter_time=7.629e-05, forward_time=0.032, loss=1.175, loss_att=0.524, loss_ctc=1.826, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.076e-04, train_time=0.092 -[v016] 2022-01-31 08:09:12,391 (trainer:653) INFO: 158epoch:train:460-486batch: iter_time=0.019, forward_time=0.033, loss=1.218, loss_att=0.491, loss_ctc=1.946, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.076e-04, train_time=0.114 -[v016] 2022-01-31 08:09:14,926 (trainer:653) INFO: 158epoch:train:487-513batch: iter_time=8.116e-05, forward_time=0.033, loss=1.136, loss_att=0.482, loss_ctc=1.790, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.076e-04, train_time=0.094 -[v016] 2022-01-31 08:09:17,385 (trainer:653) INFO: 158epoch:train:514-540batch: iter_time=7.619e-05, forward_time=0.032, loss=1.273, loss_att=0.598, loss_ctc=1.949, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.076e-04, train_time=0.091 -[v016] 2022-01-31 08:09:51,060 (trainer:328) INFO: 158epoch results: [train] iter_time=0.001, forward_time=0.032, loss=1.145, loss_att=0.496, loss_ctc=1.793, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.077e-04, train_time=0.093, time=51.29 seconds, total_count=86426, gpu_max_cached_mem_GB=5.824, [valid] loss=7.780, loss_att=6.375, loss_ctc=9.186, acc=0.906, cer=0.099, wer=0.399, cer_ctc=0.145, time=5.72 seconds, total_count=28124, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.25 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:09:53,310 (trainer:375) INFO: The best model has been updated: train.acc -[v016] 2022-01-31 08:09:53,344 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/151epoch.pth -[v016] 2022-01-31 08:09:53,344 (trainer:261) INFO: 159/200epoch started. Estimated time to finish: 1 hour, 13 minutes and 33.21 seconds -[v016] 2022-01-31 08:09:55,950 (trainer:653) INFO: 159epoch:train:1-27batch: iter_time=0.003, forward_time=0.032, loss=1.013, loss_att=0.396, loss_ctc=1.630, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.076e-04, train_time=0.096 -[v016] 2022-01-31 08:09:58,527 (trainer:653) INFO: 159epoch:train:28-54batch: iter_time=0.003, forward_time=0.032, loss=1.133, loss_att=0.483, loss_ctc=1.783, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.075e-04, train_time=0.095 -[v016] 2022-01-31 08:10:01,054 (trainer:653) INFO: 159epoch:train:55-81batch: iter_time=7.677e-05, forward_time=0.032, loss=1.272, loss_att=0.523, loss_ctc=2.021, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.075e-04, train_time=0.093 -[v016] 2022-01-31 08:10:03,510 (trainer:653) INFO: 159epoch:train:82-108batch: iter_time=8.390e-05, forward_time=0.032, loss=0.944, loss_att=0.422, loss_ctc=1.467, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.075e-04, train_time=0.091 -[v016] 2022-01-31 08:10:06,571 (trainer:653) INFO: 159epoch:train:109-135batch: iter_time=8.202e-05, forward_time=0.037, loss=1.035, loss_att=0.521, loss_ctc=1.549, acc=0.967, backward_time=0.031, optim_step_time=0.022, optim0_lr0=1.075e-04, train_time=0.113 -[v016] 2022-01-31 08:10:09,043 (trainer:653) INFO: 159epoch:train:136-162batch: iter_time=9.753e-05, forward_time=0.032, loss=1.182, loss_att=0.599, loss_ctc=1.764, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.075e-04, train_time=0.091 -[v016] 2022-01-31 08:10:11,573 (trainer:653) INFO: 159epoch:train:163-189batch: iter_time=9.101e-05, forward_time=0.033, loss=1.157, loss_att=0.462, loss_ctc=1.852, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.075e-04, train_time=0.093 -[v016] 2022-01-31 08:10:14,331 (trainer:653) INFO: 159epoch:train:190-216batch: iter_time=0.008, forward_time=0.033, loss=1.067, loss_att=0.453, loss_ctc=1.680, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.074e-04, train_time=0.102 -[v016] 2022-01-31 08:10:16,877 (trainer:653) INFO: 159epoch:train:217-243batch: iter_time=1.037e-04, forward_time=0.033, loss=1.102, loss_att=0.463, loss_ctc=1.742, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.074e-04, train_time=0.094 -[v016] 2022-01-31 08:10:19,422 (trainer:653) INFO: 159epoch:train:244-270batch: iter_time=9.216e-05, forward_time=0.033, loss=1.165, loss_att=0.518, loss_ctc=1.812, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.074e-04, train_time=0.094 -[v016] 2022-01-31 08:10:21,887 (trainer:653) INFO: 159epoch:train:271-297batch: iter_time=7.614e-05, forward_time=0.032, loss=0.975, loss_att=0.436, loss_ctc=1.513, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.074e-04, train_time=0.091 -[v016] 2022-01-31 08:10:24,498 (trainer:653) INFO: 159epoch:train:298-324batch: iter_time=8.050e-05, forward_time=0.034, loss=1.194, loss_att=0.464, loss_ctc=1.923, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.074e-04, train_time=0.096 -[v016] 2022-01-31 08:10:27,004 (trainer:653) INFO: 159epoch:train:325-351batch: iter_time=7.715e-05, forward_time=0.033, loss=1.067, loss_att=0.471, loss_ctc=1.662, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.074e-04, train_time=0.093 -[v016] 2022-01-31 08:10:29,531 (trainer:653) INFO: 159epoch:train:352-378batch: iter_time=7.828e-05, forward_time=0.033, loss=0.977, loss_att=0.426, loss_ctc=1.528, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.073e-04, train_time=0.093 -[v016] 2022-01-31 08:10:32,051 (trainer:653) INFO: 159epoch:train:379-405batch: iter_time=7.807e-05, forward_time=0.032, loss=1.053, loss_att=0.463, loss_ctc=1.643, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.073e-04, train_time=0.093 -[v016] 2022-01-31 08:10:34,548 (trainer:653) INFO: 159epoch:train:406-432batch: iter_time=8.006e-05, forward_time=0.032, loss=1.179, loss_att=0.491, loss_ctc=1.867, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.073e-04, train_time=0.092 -[v016] 2022-01-31 08:10:37,036 (trainer:653) INFO: 159epoch:train:433-459batch: iter_time=8.233e-05, forward_time=0.032, loss=1.038, loss_att=0.455, loss_ctc=1.621, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.073e-04, train_time=0.092 -[v016] 2022-01-31 08:10:39,684 (trainer:653) INFO: 159epoch:train:460-486batch: iter_time=0.005, forward_time=0.032, loss=1.123, loss_att=0.476, loss_ctc=1.770, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.073e-04, train_time=0.098 -[v016] 2022-01-31 08:10:42,080 (trainer:653) INFO: 159epoch:train:487-513batch: iter_time=7.470e-05, forward_time=0.031, loss=0.970, loss_att=0.421, loss_ctc=1.518, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.073e-04, train_time=0.089 -[v016] 2022-01-31 08:10:44,541 (trainer:653) INFO: 159epoch:train:514-540batch: iter_time=7.673e-05, forward_time=0.032, loss=1.127, loss_att=0.506, loss_ctc=1.748, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.072e-04, train_time=0.091 -[v016] 2022-01-31 08:11:19,037 (trainer:328) INFO: 159epoch results: [train] iter_time=0.001, forward_time=0.033, loss=1.084, loss_att=0.472, loss_ctc=1.696, acc=0.977, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.074e-04, train_time=0.095, time=52.1 seconds, total_count=86973, gpu_max_cached_mem_GB=5.824, [valid] loss=7.853, loss_att=6.433, loss_ctc=9.272, acc=0.906, cer=0.098, wer=0.398, cer_ctc=0.140, time=5.82 seconds, total_count=28302, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.77 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:11:21,162 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 08:11:21,194 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/150epoch.pth -[v016] 2022-01-31 08:11:21,194 (trainer:261) INFO: 160/200epoch started. Estimated time to finish: 1 hour, 11 minutes and 43.05 seconds -[v016] 2022-01-31 08:11:23,932 (trainer:653) INFO: 160epoch:train:1-27batch: iter_time=0.006, forward_time=0.033, loss=1.027, loss_att=0.444, loss_ctc=1.610, acc=0.980, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.072e-04, train_time=0.101 -[v016] 2022-01-31 08:11:26,432 (trainer:653) INFO: 160epoch:train:28-54batch: iter_time=8.167e-05, forward_time=0.032, loss=0.931, loss_att=0.374, loss_ctc=1.488, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.072e-04, train_time=0.092 -[v016] 2022-01-31 08:11:28,900 (trainer:653) INFO: 160epoch:train:55-81batch: iter_time=7.648e-05, forward_time=0.032, loss=1.171, loss_att=0.531, loss_ctc=1.811, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.072e-04, train_time=0.091 -[v016] 2022-01-31 08:11:31,579 (trainer:653) INFO: 160epoch:train:82-108batch: iter_time=0.008, forward_time=0.032, loss=1.092, loss_att=0.499, loss_ctc=1.686, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.072e-04, train_time=0.099 -[v016] 2022-01-31 08:11:34,110 (trainer:653) INFO: 160epoch:train:109-135batch: iter_time=7.879e-05, forward_time=0.032, loss=1.038, loss_att=0.476, loss_ctc=1.600, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.072e-04, train_time=0.094 -[v016] 2022-01-31 08:11:36,580 (trainer:653) INFO: 160epoch:train:136-162batch: iter_time=7.672e-05, forward_time=0.032, loss=1.036, loss_att=0.503, loss_ctc=1.568, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.071e-04, train_time=0.091 -[v016] 2022-01-31 08:11:39,091 (trainer:653) INFO: 160epoch:train:163-189batch: iter_time=1.026e-04, forward_time=0.032, loss=1.078, loss_att=0.465, loss_ctc=1.691, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.071e-04, train_time=0.093 -[v016] 2022-01-31 08:11:41,566 (trainer:653) INFO: 160epoch:train:190-216batch: iter_time=7.591e-05, forward_time=0.032, loss=1.171, loss_att=0.550, loss_ctc=1.792, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.071e-04, train_time=0.091 -[v016] 2022-01-31 08:11:44,065 (trainer:653) INFO: 160epoch:train:217-243batch: iter_time=7.483e-05, forward_time=0.032, loss=1.112, loss_att=0.486, loss_ctc=1.737, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.071e-04, train_time=0.092 -[v016] 2022-01-31 08:11:46,508 (trainer:653) INFO: 160epoch:train:244-270batch: iter_time=7.726e-05, forward_time=0.031, loss=1.071, loss_att=0.456, loss_ctc=1.686, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.071e-04, train_time=0.090 -[v016] 2022-01-31 08:11:49,268 (trainer:653) INFO: 160epoch:train:271-297batch: iter_time=0.008, forward_time=0.032, loss=1.180, loss_att=0.524, loss_ctc=1.836, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.071e-04, train_time=0.102 -[v016] 2022-01-31 08:11:51,725 (trainer:653) INFO: 160epoch:train:298-324batch: iter_time=7.668e-05, forward_time=0.032, loss=0.976, loss_att=0.390, loss_ctc=1.562, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.070e-04, train_time=0.091 -[v016] 2022-01-31 08:11:54,290 (trainer:653) INFO: 160epoch:train:325-351batch: iter_time=8.015e-05, forward_time=0.033, loss=1.062, loss_att=0.456, loss_ctc=1.669, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.070e-04, train_time=0.095 -[v016] 2022-01-31 08:11:56,806 (trainer:653) INFO: 160epoch:train:352-378batch: iter_time=8.435e-05, forward_time=0.033, loss=1.137, loss_att=0.484, loss_ctc=1.789, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.070e-04, train_time=0.093 -[v016] 2022-01-31 08:11:59,717 (trainer:653) INFO: 160epoch:train:379-405batch: iter_time=0.016, forward_time=0.032, loss=1.170, loss_att=0.524, loss_ctc=1.816, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.070e-04, train_time=0.108 -[v016] 2022-01-31 08:12:02,218 (trainer:653) INFO: 160epoch:train:406-432batch: iter_time=7.604e-05, forward_time=0.032, loss=1.219, loss_att=0.501, loss_ctc=1.936, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.070e-04, train_time=0.092 -[v016] 2022-01-31 08:12:04,771 (trainer:653) INFO: 160epoch:train:433-459batch: iter_time=8.066e-05, forward_time=0.033, loss=1.350, loss_att=0.538, loss_ctc=2.162, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.070e-04, train_time=0.094 -[v016] 2022-01-31 08:12:07,309 (trainer:653) INFO: 160epoch:train:460-486batch: iter_time=7.720e-05, forward_time=0.032, loss=1.140, loss_att=0.577, loss_ctc=1.704, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.069e-04, train_time=0.094 -[v016] 2022-01-31 08:12:09,834 (trainer:653) INFO: 160epoch:train:487-513batch: iter_time=7.610e-05, forward_time=0.033, loss=1.120, loss_att=0.469, loss_ctc=1.771, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.069e-04, train_time=0.093 -[v016] 2022-01-31 08:12:12,351 (trainer:653) INFO: 160epoch:train:514-540batch: iter_time=8.651e-05, forward_time=0.033, loss=1.051, loss_att=0.464, loss_ctc=1.638, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.069e-04, train_time=0.093 -[v016] 2022-01-31 08:12:47,163 (trainer:328) INFO: 160epoch results: [train] iter_time=0.002, forward_time=0.032, loss=1.105, loss_att=0.485, loss_ctc=1.726, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.071e-04, train_time=0.094, time=51.85 seconds, total_count=87520, gpu_max_cached_mem_GB=5.824, [valid] loss=7.823, loss_att=6.409, loss_ctc=9.238, acc=0.903, cer=0.104, wer=0.411, cer_ctc=0.148, time=6.62 seconds, total_count=28480, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.5 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:12:49,508 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 08:12:49,725 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/152epoch.pth -[v016] 2022-01-31 08:12:49,725 (trainer:261) INFO: 161/200epoch started. Estimated time to finish: 1 hour, 9 minutes and 53.41 seconds -[v016] 2022-01-31 08:12:52,695 (trainer:653) INFO: 161epoch:train:1-27batch: iter_time=0.015, forward_time=0.033, loss=1.062, loss_att=0.457, loss_ctc=1.667, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.069e-04, train_time=0.110 -[v016] 2022-01-31 08:12:55,171 (trainer:653) INFO: 161epoch:train:28-54batch: iter_time=8.362e-05, forward_time=0.032, loss=0.946, loss_att=0.466, loss_ctc=1.426, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.069e-04, train_time=0.092 -[v016] 2022-01-31 08:12:57,673 (trainer:653) INFO: 161epoch:train:55-81batch: iter_time=7.662e-05, forward_time=0.033, loss=0.947, loss_att=0.422, loss_ctc=1.472, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.069e-04, train_time=0.092 -[v016] 2022-01-31 08:13:00,355 (trainer:653) INFO: 161epoch:train:82-108batch: iter_time=1.042e-04, forward_time=0.035, loss=1.100, loss_att=0.447, loss_ctc=1.752, acc=0.981, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.068e-04, train_time=0.099 -[v016] 2022-01-31 08:13:03,102 (trainer:653) INFO: 161epoch:train:109-135batch: iter_time=1.325e-04, forward_time=0.035, loss=1.118, loss_att=0.518, loss_ctc=1.718, acc=0.974, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.068e-04, train_time=0.101 -[v016] 2022-01-31 08:13:05,796 (trainer:653) INFO: 161epoch:train:136-162batch: iter_time=1.049e-04, forward_time=0.034, loss=0.844, loss_att=0.384, loss_ctc=1.303, acc=0.982, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.068e-04, train_time=0.100 -[v016] 2022-01-31 08:13:08,522 (trainer:653) INFO: 161epoch:train:163-189batch: iter_time=1.755e-04, forward_time=0.034, loss=1.180, loss_att=0.500, loss_ctc=1.859, acc=0.977, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.068e-04, train_time=0.101 -[v016] 2022-01-31 08:13:11,284 (trainer:653) INFO: 161epoch:train:190-216batch: iter_time=1.071e-04, forward_time=0.036, loss=1.031, loss_att=0.479, loss_ctc=1.583, acc=0.973, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.068e-04, train_time=0.102 -[v016] 2022-01-31 08:13:13,990 (trainer:653) INFO: 161epoch:train:217-243batch: iter_time=1.206e-04, forward_time=0.034, loss=1.152, loss_att=0.531, loss_ctc=1.773, acc=0.976, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.068e-04, train_time=0.100 -[v016] 2022-01-31 08:13:16,619 (trainer:653) INFO: 161epoch:train:244-270batch: iter_time=1.619e-04, forward_time=0.033, loss=1.042, loss_att=0.485, loss_ctc=1.600, acc=0.973, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.067e-04, train_time=0.097 -[v016] 2022-01-31 08:13:19,543 (trainer:653) INFO: 161epoch:train:271-297batch: iter_time=0.006, forward_time=0.035, loss=1.134, loss_att=0.400, loss_ctc=1.868, acc=0.983, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.067e-04, train_time=0.108 -[v016] 2022-01-31 08:13:22,471 (trainer:653) INFO: 161epoch:train:298-324batch: iter_time=0.010, forward_time=0.033, loss=1.135, loss_att=0.485, loss_ctc=1.785, acc=0.974, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.067e-04, train_time=0.108 -[v016] 2022-01-31 08:13:25,199 (trainer:653) INFO: 161epoch:train:325-351batch: iter_time=1.298e-04, forward_time=0.035, loss=1.206, loss_att=0.549, loss_ctc=1.863, acc=0.977, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.067e-04, train_time=0.101 -[v016] 2022-01-31 08:13:28,076 (trainer:653) INFO: 161epoch:train:352-378batch: iter_time=0.009, forward_time=0.033, loss=1.016, loss_att=0.484, loss_ctc=1.549, acc=0.975, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.067e-04, train_time=0.106 -[v016] 2022-01-31 08:13:30,689 (trainer:653) INFO: 161epoch:train:379-405batch: iter_time=1.039e-04, forward_time=0.033, loss=0.954, loss_att=0.416, loss_ctc=1.491, acc=0.982, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.067e-04, train_time=0.097 -[v016] 2022-01-31 08:13:35,571 (trainer:653) INFO: 161epoch:train:406-432batch: iter_time=9.808e-05, forward_time=0.058, loss=0.966, loss_att=0.445, loss_ctc=1.488, acc=0.976, backward_time=0.073, optim_step_time=0.024, optim0_lr0=1.066e-04, train_time=0.181 -[v016] 2022-01-31 08:13:38,080 (trainer:653) INFO: 161epoch:train:433-459batch: iter_time=8.267e-05, forward_time=0.031, loss=1.221, loss_att=0.562, loss_ctc=1.880, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.066e-04, train_time=0.093 -[v016] 2022-01-31 08:13:40,648 (trainer:653) INFO: 161epoch:train:460-486batch: iter_time=8.180e-05, forward_time=0.032, loss=1.011, loss_att=0.449, loss_ctc=1.574, acc=0.979, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.066e-04, train_time=0.095 -[v016] 2022-01-31 08:13:45,192 (trainer:653) INFO: 161epoch:train:487-513batch: iter_time=0.005, forward_time=0.053, loss=1.112, loss_att=0.434, loss_ctc=1.790, acc=0.979, backward_time=0.045, optim_step_time=0.026, optim0_lr0=1.066e-04, train_time=0.168 -[v016] 2022-01-31 08:13:48,270 (trainer:653) INFO: 161epoch:train:514-540batch: iter_time=0.013, forward_time=0.035, loss=1.058, loss_att=0.554, loss_ctc=1.562, acc=0.973, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.066e-04, train_time=0.114 -[v016] 2022-01-31 08:14:29,763 (trainer:328) INFO: 161epoch results: [train] iter_time=0.003, forward_time=0.036, loss=1.060, loss_att=0.471, loss_ctc=1.648, acc=0.977, backward_time=0.026, optim_step_time=0.022, optim0_lr0=1.067e-04, train_time=0.108, time=59.33 seconds, total_count=88067, gpu_max_cached_mem_GB=5.824, [valid] loss=7.728, loss_att=6.397, loss_ctc=9.058, acc=0.905, cer=0.100, wer=0.400, cer_ctc=0.141, time=9.24 seconds, total_count=28658, gpu_max_cached_mem_GB=5.824, [att_plot] time=31.45 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:14:32,105 (trainer:375) INFO: The best model has been updated: train.loss -[v016] 2022-01-31 08:14:32,116 (trainer:261) INFO: 162/200epoch started. Estimated time to finish: 1 hour, 8 minutes and 7.9 seconds -[v016] 2022-01-31 08:14:35,056 (trainer:653) INFO: 162epoch:train:1-27batch: iter_time=0.011, forward_time=0.033, loss=1.197, loss_att=0.520, loss_ctc=1.874, acc=0.975, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.066e-04, train_time=0.108 -[v016] 2022-01-31 08:14:37,699 (trainer:653) INFO: 162epoch:train:28-54batch: iter_time=1.028e-04, forward_time=0.033, loss=1.120, loss_att=0.430, loss_ctc=1.811, acc=0.981, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.065e-04, train_time=0.098 -[v016] 2022-01-31 08:14:40,684 (trainer:653) INFO: 162epoch:train:55-81batch: iter_time=0.013, forward_time=0.033, loss=1.068, loss_att=0.439, loss_ctc=1.697, acc=0.975, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.065e-04, train_time=0.110 -[v016] 2022-01-31 08:14:43,650 (trainer:653) INFO: 162epoch:train:82-108batch: iter_time=0.013, forward_time=0.032, loss=1.122, loss_att=0.448, loss_ctc=1.796, acc=0.976, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.065e-04, train_time=0.110 -[v016] 2022-01-31 08:14:46,702 (trainer:653) INFO: 162epoch:train:109-135batch: iter_time=0.013, forward_time=0.034, loss=1.037, loss_att=0.431, loss_ctc=1.644, acc=0.981, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.065e-04, train_time=0.113 -[v016] 2022-01-31 08:14:49,514 (trainer:653) INFO: 162epoch:train:136-162batch: iter_time=0.005, forward_time=0.034, loss=1.144, loss_att=0.477, loss_ctc=1.811, acc=0.976, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.065e-04, train_time=0.104 -[v016] 2022-01-31 08:14:52,166 (trainer:653) INFO: 162epoch:train:163-189batch: iter_time=7.071e-04, forward_time=0.033, loss=1.055, loss_att=0.515, loss_ctc=1.595, acc=0.973, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.065e-04, train_time=0.098 -[v016] 2022-01-31 08:14:54,798 (trainer:653) INFO: 162epoch:train:190-216batch: iter_time=8.562e-05, forward_time=0.032, loss=0.940, loss_att=0.422, loss_ctc=1.457, acc=0.979, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.064e-04, train_time=0.097 -[v016] 2022-01-31 08:14:58,072 (trainer:653) INFO: 162epoch:train:217-243batch: iter_time=0.024, forward_time=0.033, loss=1.265, loss_att=0.515, loss_ctc=2.015, acc=0.979, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.064e-04, train_time=0.121 -[v016] 2022-01-31 08:15:00,745 (trainer:653) INFO: 162epoch:train:244-270batch: iter_time=0.003, forward_time=0.033, loss=1.224, loss_att=0.527, loss_ctc=1.921, acc=0.978, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.064e-04, train_time=0.099 -[v016] 2022-01-31 08:15:03,387 (trainer:653) INFO: 162epoch:train:271-297batch: iter_time=9.764e-05, forward_time=0.033, loss=0.991, loss_att=0.440, loss_ctc=1.543, acc=0.980, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.064e-04, train_time=0.098 -[v016] 2022-01-31 08:15:06,052 (trainer:653) INFO: 162epoch:train:298-324batch: iter_time=1.069e-04, forward_time=0.033, loss=1.140, loss_att=0.447, loss_ctc=1.834, acc=0.980, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.064e-04, train_time=0.098 -[v016] 2022-01-31 08:15:09,478 (trainer:653) INFO: 162epoch:train:325-351batch: iter_time=0.032, forward_time=0.033, loss=1.137, loss_att=0.494, loss_ctc=1.779, acc=0.974, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.064e-04, train_time=0.127 -[v016] 2022-01-31 08:15:12,384 (trainer:653) INFO: 162epoch:train:352-378batch: iter_time=0.009, forward_time=0.033, loss=1.114, loss_att=0.560, loss_ctc=1.669, acc=0.968, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.063e-04, train_time=0.107 -[v016] 2022-01-31 08:15:15,058 (trainer:653) INFO: 162epoch:train:379-405batch: iter_time=1.173e-04, forward_time=0.033, loss=0.821, loss_att=0.419, loss_ctc=1.222, acc=0.978, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.063e-04, train_time=0.099 -[v016] 2022-01-31 08:15:17,752 (trainer:653) INFO: 162epoch:train:406-432batch: iter_time=1.191e-04, forward_time=0.034, loss=1.147, loss_att=0.580, loss_ctc=1.715, acc=0.971, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.063e-04, train_time=0.100 -[v016] 2022-01-31 08:15:20,693 (trainer:653) INFO: 162epoch:train:433-459batch: iter_time=0.008, forward_time=0.034, loss=1.037, loss_att=0.423, loss_ctc=1.650, acc=0.978, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.063e-04, train_time=0.109 -[v016] 2022-01-31 08:15:23,797 (trainer:653) INFO: 162epoch:train:460-486batch: iter_time=0.015, forward_time=0.034, loss=0.885, loss_att=0.383, loss_ctc=1.387, acc=0.983, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.063e-04, train_time=0.115 -[v016] 2022-01-31 08:15:28,003 (trainer:653) INFO: 162epoch:train:487-513batch: iter_time=0.057, forward_time=0.033, loss=1.103, loss_att=0.472, loss_ctc=1.733, acc=0.978, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.063e-04, train_time=0.156 -[v016] 2022-01-31 08:15:31,645 (trainer:653) INFO: 162epoch:train:514-540batch: iter_time=0.035, forward_time=0.033, loss=1.013, loss_att=0.444, loss_ctc=1.582, acc=0.977, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.062e-04, train_time=0.135 -[v016] 2022-01-31 08:16:12,117 (trainer:328) INFO: 162epoch results: [train] iter_time=0.012, forward_time=0.033, loss=1.073, loss_att=0.467, loss_ctc=1.678, acc=0.977, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.064e-04, train_time=0.110, time=1 minute and 0.42 seconds, total_count=88614, gpu_max_cached_mem_GB=5.824, [valid] loss=7.796, loss_att=6.476, loss_ctc=9.116, acc=0.906, cer=0.100, wer=0.396, cer_ctc=0.140, time=7.87 seconds, total_count=28836, gpu_max_cached_mem_GB=5.824, [att_plot] time=31.64 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:16:14,843 (trainer:375) INFO: The best model has been updated: train.acc -[v016] 2022-01-31 08:16:14,854 (trainer:261) INFO: 163/200epoch started. Estimated time to finish: 1 hour, 6 minutes and 22.52 seconds -[v016] 2022-01-31 08:16:20,175 (trainer:653) INFO: 163epoch:train:1-27batch: iter_time=0.048, forward_time=0.062, loss=0.861, loss_att=0.395, loss_ctc=1.328, acc=0.980, backward_time=0.036, optim_step_time=0.025, optim0_lr0=1.062e-04, train_time=0.195 -[v016] 2022-01-31 08:16:23,730 (trainer:653) INFO: 163epoch:train:28-54batch: iter_time=0.026, forward_time=0.036, loss=1.055, loss_att=0.395, loss_ctc=1.715, acc=0.984, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.062e-04, train_time=0.132 -[v016] 2022-01-31 08:16:28,174 (trainer:653) INFO: 163epoch:train:55-81batch: iter_time=0.062, forward_time=0.034, loss=1.083, loss_att=0.392, loss_ctc=1.774, acc=0.985, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.062e-04, train_time=0.164 -[v016] 2022-01-31 08:16:31,900 (trainer:653) INFO: 163epoch:train:82-108batch: iter_time=0.040, forward_time=0.034, loss=1.008, loss_att=0.478, loss_ctc=1.539, acc=0.977, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.062e-04, train_time=0.138 -[v016] 2022-01-31 08:16:34,884 (trainer:653) INFO: 163epoch:train:109-135batch: iter_time=0.020, forward_time=0.030, loss=1.102, loss_att=0.533, loss_ctc=1.671, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.062e-04, train_time=0.110 -[v016] 2022-01-31 08:16:38,356 (trainer:653) INFO: 163epoch:train:136-162batch: iter_time=0.031, forward_time=0.033, loss=0.972, loss_att=0.387, loss_ctc=1.557, acc=0.983, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.061e-04, train_time=0.128 -[v016] 2022-01-31 08:16:41,534 (trainer:653) INFO: 163epoch:train:163-189batch: iter_time=0.017, forward_time=0.034, loss=1.139, loss_att=0.564, loss_ctc=1.715, acc=0.973, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.061e-04, train_time=0.117 -[v016] 2022-01-31 08:16:44,801 (trainer:653) INFO: 163epoch:train:190-216batch: iter_time=0.020, forward_time=0.034, loss=1.266, loss_att=0.531, loss_ctc=2.001, acc=0.974, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.061e-04, train_time=0.121 -[v016] 2022-01-31 08:16:48,195 (trainer:653) INFO: 163epoch:train:217-243batch: iter_time=0.021, forward_time=0.038, loss=1.131, loss_att=0.438, loss_ctc=1.824, acc=0.979, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.061e-04, train_time=0.125 -[v016] 2022-01-31 08:16:51,194 (trainer:653) INFO: 163epoch:train:244-270batch: iter_time=0.007, forward_time=0.035, loss=1.191, loss_att=0.529, loss_ctc=1.852, acc=0.973, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.061e-04, train_time=0.111 -[v016] 2022-01-31 08:16:57,640 (trainer:653) INFO: 163epoch:train:271-297batch: iter_time=0.139, forward_time=0.034, loss=0.973, loss_att=0.432, loss_ctc=1.513, acc=0.982, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.061e-04, train_time=0.239 -[v016] 2022-01-31 08:17:01,386 (trainer:653) INFO: 163epoch:train:298-324batch: iter_time=0.039, forward_time=0.034, loss=1.107, loss_att=0.531, loss_ctc=1.683, acc=0.970, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.060e-04, train_time=0.138 -[v016] 2022-01-31 08:17:04,977 (trainer:653) INFO: 163epoch:train:325-351batch: iter_time=0.029, forward_time=0.035, loss=1.200, loss_att=0.463, loss_ctc=1.938, acc=0.980, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.060e-04, train_time=0.133 -[v016] 2022-01-31 08:17:08,878 (trainer:653) INFO: 163epoch:train:352-378batch: iter_time=0.049, forward_time=0.032, loss=1.214, loss_att=0.550, loss_ctc=1.878, acc=0.975, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.060e-04, train_time=0.144 -[v016] 2022-01-31 08:17:11,899 (trainer:653) INFO: 163epoch:train:379-405batch: iter_time=0.015, forward_time=0.032, loss=1.106, loss_att=0.483, loss_ctc=1.729, acc=0.979, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.060e-04, train_time=0.112 -[v016] 2022-01-31 08:17:15,540 (trainer:653) INFO: 163epoch:train:406-432batch: iter_time=0.033, forward_time=0.034, loss=0.959, loss_att=0.428, loss_ctc=1.490, acc=0.981, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.060e-04, train_time=0.135 -[v016] 2022-01-31 08:17:20,525 (trainer:653) INFO: 163epoch:train:433-459batch: iter_time=0.086, forward_time=0.033, loss=0.964, loss_att=0.457, loss_ctc=1.470, acc=0.978, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.060e-04, train_time=0.184 -[v016] 2022-01-31 08:17:23,372 (trainer:653) INFO: 163epoch:train:460-486batch: iter_time=0.017, forward_time=0.030, loss=1.169, loss_att=0.547, loss_ctc=1.791, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.059e-04, train_time=0.105 -[v016] 2022-01-31 08:17:28,040 (trainer:653) INFO: 163epoch:train:487-513batch: iter_time=0.079, forward_time=0.032, loss=1.213, loss_att=0.531, loss_ctc=1.895, acc=0.974, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.059e-04, train_time=0.173 -[v016] 2022-01-31 08:17:36,120 (trainer:653) INFO: 163epoch:train:514-540batch: iter_time=0.188, forward_time=0.043, loss=1.124, loss_att=0.464, loss_ctc=1.783, acc=0.979, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.059e-04, train_time=0.299 -[v016] 2022-01-31 08:18:30,155 (trainer:328) INFO: 163epoch results: [train] iter_time=0.048, forward_time=0.035, loss=1.086, loss_att=0.475, loss_ctc=1.698, acc=0.978, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.061e-04, train_time=0.150, time=1 minute and 22.14 seconds, total_count=89161, gpu_max_cached_mem_GB=5.824, [valid] loss=7.717, loss_att=6.374, loss_ctc=9.059, acc=0.906, cer=0.098, wer=0.398, cer_ctc=0.137, time=19.3 seconds, total_count=29014, gpu_max_cached_mem_GB=5.824, [att_plot] time=33.81 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:18:32,733 (trainer:375) INFO: The best model has been updated: train.acc -[v016] 2022-01-31 08:18:32,812 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/156epoch.pth, exp/asr_train_asr_raw_en_word/158epoch.pth -[v016] 2022-01-31 08:18:32,813 (trainer:261) INFO: 164/200epoch started. Estimated time to finish: 1 hour, 4 minutes and 46.3 seconds -[v016] 2022-01-31 08:18:37,588 (trainer:653) INFO: 164epoch:train:1-27batch: iter_time=0.029, forward_time=0.050, loss=1.057, loss_att=0.379, loss_ctc=1.735, acc=0.982, backward_time=0.040, optim_step_time=0.023, optim0_lr0=1.059e-04, train_time=0.174 -[v016] 2022-01-31 08:18:41,418 (trainer:653) INFO: 164epoch:train:28-54batch: iter_time=0.050, forward_time=0.031, loss=0.849, loss_att=0.339, loss_ctc=1.360, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.059e-04, train_time=0.142 -[v016] 2022-01-31 08:18:44,178 (trainer:653) INFO: 164epoch:train:55-81batch: iter_time=0.011, forward_time=0.031, loss=1.089, loss_att=0.468, loss_ctc=1.711, acc=0.976, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.059e-04, train_time=0.102 -[v016] 2022-01-31 08:18:47,042 (trainer:653) INFO: 164epoch:train:82-108batch: iter_time=0.014, forward_time=0.031, loss=1.171, loss_att=0.461, loss_ctc=1.881, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.058e-04, train_time=0.106 -[v016] 2022-01-31 08:18:50,045 (trainer:653) INFO: 164epoch:train:109-135batch: iter_time=0.020, forward_time=0.030, loss=1.084, loss_att=0.423, loss_ctc=1.745, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.058e-04, train_time=0.111 -[v016] 2022-01-31 08:18:53,079 (trainer:653) INFO: 164epoch:train:136-162batch: iter_time=0.022, forward_time=0.031, loss=1.047, loss_att=0.451, loss_ctc=1.642, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.058e-04, train_time=0.112 -[v016] 2022-01-31 08:18:55,541 (trainer:653) INFO: 164epoch:train:163-189batch: iter_time=7.785e-04, forward_time=0.031, loss=1.108, loss_att=0.491, loss_ctc=1.725, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.058e-04, train_time=0.091 -[v016] 2022-01-31 08:18:58,126 (trainer:653) INFO: 164epoch:train:190-216batch: iter_time=0.002, forward_time=0.032, loss=1.149, loss_att=0.451, loss_ctc=1.847, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.058e-04, train_time=0.096 -[v016] 2022-01-31 08:19:01,214 (trainer:653) INFO: 164epoch:train:217-243batch: iter_time=0.020, forward_time=0.032, loss=1.021, loss_att=0.409, loss_ctc=1.634, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.058e-04, train_time=0.114 -[v016] 2022-01-31 08:19:04,243 (trainer:653) INFO: 164epoch:train:244-270batch: iter_time=0.021, forward_time=0.031, loss=1.029, loss_att=0.421, loss_ctc=1.638, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.058e-04, train_time=0.112 -[v016] 2022-01-31 08:19:07,192 (trainer:653) INFO: 164epoch:train:271-297batch: iter_time=0.018, forward_time=0.031, loss=1.062, loss_att=0.458, loss_ctc=1.667, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.057e-04, train_time=0.109 -[v016] 2022-01-31 08:19:09,953 (trainer:653) INFO: 164epoch:train:298-324batch: iter_time=0.010, forward_time=0.031, loss=1.185, loss_att=0.540, loss_ctc=1.831, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.057e-04, train_time=0.102 -[v016] 2022-01-31 08:19:12,470 (trainer:653) INFO: 164epoch:train:325-351batch: iter_time=0.002, forward_time=0.031, loss=1.029, loss_att=0.467, loss_ctc=1.592, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.057e-04, train_time=0.093 -[v016] 2022-01-31 08:19:15,059 (trainer:653) INFO: 164epoch:train:352-378batch: iter_time=0.004, forward_time=0.031, loss=1.245, loss_att=0.584, loss_ctc=1.906, acc=0.969, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.057e-04, train_time=0.096 -[v016] 2022-01-31 08:19:17,837 (trainer:653) INFO: 164epoch:train:379-405batch: iter_time=0.010, forward_time=0.031, loss=1.274, loss_att=0.559, loss_ctc=1.989, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.057e-04, train_time=0.103 -[v016] 2022-01-31 08:19:21,211 (trainer:653) INFO: 164epoch:train:406-432batch: iter_time=0.032, forward_time=0.031, loss=1.100, loss_att=0.512, loss_ctc=1.688, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.057e-04, train_time=0.125 -[v016] 2022-01-31 08:19:23,649 (trainer:653) INFO: 164epoch:train:433-459batch: iter_time=8.939e-05, forward_time=0.030, loss=0.960, loss_att=0.456, loss_ctc=1.465, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.056e-04, train_time=0.090 -[v016] 2022-01-31 08:19:26,064 (trainer:653) INFO: 164epoch:train:460-486batch: iter_time=8.524e-05, forward_time=0.030, loss=1.114, loss_att=0.535, loss_ctc=1.693, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.056e-04, train_time=0.089 -[v016] 2022-01-31 08:19:29,050 (trainer:653) INFO: 164epoch:train:487-513batch: iter_time=0.016, forward_time=0.032, loss=1.274, loss_att=0.502, loss_ctc=2.046, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.056e-04, train_time=0.110 -[v016] 2022-01-31 08:19:32,268 (trainer:653) INFO: 164epoch:train:514-540batch: iter_time=0.024, forward_time=0.032, loss=1.270, loss_att=0.549, loss_ctc=1.992, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.056e-04, train_time=0.119 -[v016] 2022-01-31 08:20:08,547 (trainer:328) INFO: 164epoch results: [train] iter_time=0.015, forward_time=0.032, loss=1.105, loss_att=0.472, loss_ctc=1.737, acc=0.977, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.057e-04, train_time=0.110, time=1 minute and 0.17 seconds, total_count=89708, gpu_max_cached_mem_GB=5.824, [valid] loss=7.816, loss_att=6.376, loss_ctc=9.255, acc=0.904, cer=0.100, wer=0.400, cer_ctc=0.143, time=7.84 seconds, total_count=29192, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.71 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:20:10,970 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 08:20:11,003 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/160epoch.pth -[v016] 2022-01-31 08:20:11,003 (trainer:261) INFO: 165/200epoch started. Estimated time to finish: 1 hour, 2 minutes and 59.55 seconds -[v016] 2022-01-31 08:20:13,669 (trainer:653) INFO: 165epoch:train:1-27batch: iter_time=0.003, forward_time=0.032, loss=0.902, loss_att=0.412, loss_ctc=1.391, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.056e-04, train_time=0.097 -[v016] 2022-01-31 08:20:16,182 (trainer:653) INFO: 165epoch:train:28-54batch: iter_time=7.951e-05, forward_time=0.032, loss=0.966, loss_att=0.438, loss_ctc=1.493, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.056e-04, train_time=0.093 -[v016] 2022-01-31 08:20:18,642 (trainer:653) INFO: 165epoch:train:55-81batch: iter_time=8.081e-05, forward_time=0.032, loss=0.915, loss_att=0.433, loss_ctc=1.396, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.055e-04, train_time=0.091 -[v016] 2022-01-31 08:20:21,113 (trainer:653) INFO: 165epoch:train:82-108batch: iter_time=7.905e-05, forward_time=0.032, loss=1.014, loss_att=0.413, loss_ctc=1.615, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.055e-04, train_time=0.091 -[v016] 2022-01-31 08:20:23,563 (trainer:653) INFO: 165epoch:train:109-135batch: iter_time=7.511e-05, forward_time=0.031, loss=1.166, loss_att=0.573, loss_ctc=1.760, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.055e-04, train_time=0.091 -[v016] 2022-01-31 08:20:26,105 (trainer:653) INFO: 165epoch:train:136-162batch: iter_time=7.747e-05, forward_time=0.033, loss=1.032, loss_att=0.363, loss_ctc=1.702, acc=0.985, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.055e-04, train_time=0.094 -[v016] 2022-01-31 08:20:28,502 (trainer:653) INFO: 165epoch:train:163-189batch: iter_time=7.795e-05, forward_time=0.031, loss=1.005, loss_att=0.494, loss_ctc=1.517, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.055e-04, train_time=0.089 -[v016] 2022-01-31 08:20:31,048 (trainer:653) INFO: 165epoch:train:190-216batch: iter_time=7.883e-05, forward_time=0.033, loss=1.084, loss_att=0.467, loss_ctc=1.701, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.055e-04, train_time=0.094 -[v016] 2022-01-31 08:20:33,469 (trainer:653) INFO: 165epoch:train:217-243batch: iter_time=7.627e-05, forward_time=0.031, loss=0.951, loss_att=0.442, loss_ctc=1.461, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.054e-04, train_time=0.089 -[v016] 2022-01-31 08:20:36,071 (trainer:653) INFO: 165epoch:train:244-270batch: iter_time=0.004, forward_time=0.032, loss=1.169, loss_att=0.531, loss_ctc=1.806, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.054e-04, train_time=0.096 -[v016] 2022-01-31 08:20:38,515 (trainer:653) INFO: 165epoch:train:271-297batch: iter_time=7.819e-05, forward_time=0.031, loss=1.142, loss_att=0.508, loss_ctc=1.776, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.054e-04, train_time=0.090 -[v016] 2022-01-31 08:20:41,237 (trainer:653) INFO: 165epoch:train:298-324batch: iter_time=0.009, forward_time=0.031, loss=1.259, loss_att=0.490, loss_ctc=2.028, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.054e-04, train_time=0.101 -[v016] 2022-01-31 08:20:43,803 (trainer:653) INFO: 165epoch:train:325-351batch: iter_time=7.840e-05, forward_time=0.033, loss=1.195, loss_att=0.513, loss_ctc=1.877, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.054e-04, train_time=0.095 -[v016] 2022-01-31 08:20:46,313 (trainer:653) INFO: 165epoch:train:352-378batch: iter_time=8.636e-05, forward_time=0.032, loss=1.220, loss_att=0.545, loss_ctc=1.895, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.054e-04, train_time=0.093 -[v016] 2022-01-31 08:20:48,757 (trainer:653) INFO: 165epoch:train:379-405batch: iter_time=7.993e-05, forward_time=0.031, loss=1.076, loss_att=0.517, loss_ctc=1.635, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.054e-04, train_time=0.090 -[v016] 2022-01-31 08:20:51,303 (trainer:653) INFO: 165epoch:train:406-432batch: iter_time=9.128e-05, forward_time=0.033, loss=1.132, loss_att=0.467, loss_ctc=1.796, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.053e-04, train_time=0.094 -[v016] 2022-01-31 08:20:53,691 (trainer:653) INFO: 165epoch:train:433-459batch: iter_time=7.726e-05, forward_time=0.031, loss=1.057, loss_att=0.536, loss_ctc=1.578, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.053e-04, train_time=0.088 -[v016] 2022-01-31 08:20:56,262 (trainer:653) INFO: 165epoch:train:460-486batch: iter_time=7.947e-05, forward_time=0.033, loss=1.386, loss_att=0.608, loss_ctc=2.163, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.053e-04, train_time=0.095 -[v016] 2022-01-31 08:20:58,739 (trainer:653) INFO: 165epoch:train:487-513batch: iter_time=8.177e-05, forward_time=0.032, loss=1.089, loss_att=0.493, loss_ctc=1.684, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.053e-04, train_time=0.092 -[v016] 2022-01-31 08:21:01,216 (trainer:653) INFO: 165epoch:train:514-540batch: iter_time=8.097e-05, forward_time=0.032, loss=1.079, loss_att=0.447, loss_ctc=1.711, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.053e-04, train_time=0.092 -[v016] 2022-01-31 08:21:35,706 (trainer:328) INFO: 165epoch results: [train] iter_time=9.250e-04, forward_time=0.032, loss=1.091, loss_att=0.482, loss_ctc=1.700, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.054e-04, train_time=0.093, time=50.94 seconds, total_count=90255, gpu_max_cached_mem_GB=5.824, [valid] loss=7.969, loss_att=6.553, loss_ctc=9.384, acc=0.904, cer=0.102, wer=0.404, cer_ctc=0.144, time=5.87 seconds, total_count=29370, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.87 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:21:37,861 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 08:21:37,873 (trainer:261) INFO: 166/200epoch started. Estimated time to finish: 1 hour, 1 minute and 10.19 seconds -[v016] 2022-01-31 08:21:40,557 (trainer:653) INFO: 166epoch:train:1-27batch: iter_time=0.003, forward_time=0.033, loss=1.030, loss_att=0.439, loss_ctc=1.621, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.053e-04, train_time=0.099 -[v016] 2022-01-31 08:21:43,869 (trainer:653) INFO: 166epoch:train:28-54batch: iter_time=0.030, forward_time=0.032, loss=0.838, loss_att=0.377, loss_ctc=1.300, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.052e-04, train_time=0.122 -[v016] 2022-01-31 08:21:46,295 (trainer:653) INFO: 166epoch:train:55-81batch: iter_time=7.531e-05, forward_time=0.031, loss=1.175, loss_att=0.572, loss_ctc=1.778, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.052e-04, train_time=0.090 -[v016] 2022-01-31 08:21:48,827 (trainer:653) INFO: 166epoch:train:82-108batch: iter_time=7.538e-05, forward_time=0.033, loss=1.158, loss_att=0.496, loss_ctc=1.820, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.052e-04, train_time=0.094 -[v016] 2022-01-31 08:21:51,311 (trainer:653) INFO: 166epoch:train:109-135batch: iter_time=7.705e-05, forward_time=0.032, loss=1.097, loss_att=0.520, loss_ctc=1.674, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.052e-04, train_time=0.092 -[v016] 2022-01-31 08:21:54,574 (trainer:653) INFO: 166epoch:train:136-162batch: iter_time=0.029, forward_time=0.032, loss=0.938, loss_att=0.406, loss_ctc=1.471, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.052e-04, train_time=0.121 -[v016] 2022-01-31 08:21:57,153 (trainer:653) INFO: 166epoch:train:163-189batch: iter_time=8.964e-05, forward_time=0.034, loss=0.994, loss_att=0.388, loss_ctc=1.600, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.052e-04, train_time=0.095 -[v016] 2022-01-31 08:21:59,641 (trainer:653) INFO: 166epoch:train:190-216batch: iter_time=8.082e-05, forward_time=0.032, loss=0.971, loss_att=0.409, loss_ctc=1.532, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.051e-04, train_time=0.092 -[v016] 2022-01-31 08:22:02,119 (trainer:653) INFO: 166epoch:train:217-243batch: iter_time=8.005e-05, forward_time=0.032, loss=1.292, loss_att=0.599, loss_ctc=1.986, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.051e-04, train_time=0.092 -[v016] 2022-01-31 08:22:04,602 (trainer:653) INFO: 166epoch:train:244-270batch: iter_time=9.274e-05, forward_time=0.033, loss=0.899, loss_att=0.407, loss_ctc=1.390, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.051e-04, train_time=0.092 -[v016] 2022-01-31 08:22:07,173 (trainer:653) INFO: 166epoch:train:271-297batch: iter_time=7.922e-05, forward_time=0.033, loss=1.014, loss_att=0.422, loss_ctc=1.606, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.051e-04, train_time=0.095 -[v016] 2022-01-31 08:22:09,715 (trainer:653) INFO: 166epoch:train:298-324batch: iter_time=0.002, forward_time=0.033, loss=1.034, loss_att=0.441, loss_ctc=1.628, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.051e-04, train_time=0.094 -[v016] 2022-01-31 08:22:12,212 (trainer:653) INFO: 166epoch:train:325-351batch: iter_time=8.342e-05, forward_time=0.033, loss=0.936, loss_att=0.382, loss_ctc=1.489, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.051e-04, train_time=0.092 -[v016] 2022-01-31 08:22:14,933 (trainer:653) INFO: 166epoch:train:352-378batch: iter_time=0.009, forward_time=0.032, loss=1.064, loss_att=0.459, loss_ctc=1.668, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.050e-04, train_time=0.101 -[v016] 2022-01-31 08:22:17,440 (trainer:653) INFO: 166epoch:train:379-405batch: iter_time=7.974e-05, forward_time=0.033, loss=1.099, loss_att=0.418, loss_ctc=1.780, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.050e-04, train_time=0.093 -[v016] 2022-01-31 08:22:20,014 (trainer:653) INFO: 166epoch:train:406-432batch: iter_time=8.024e-05, forward_time=0.034, loss=1.033, loss_att=0.437, loss_ctc=1.629, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.050e-04, train_time=0.095 -[v016] 2022-01-31 08:22:22,457 (trainer:653) INFO: 166epoch:train:433-459batch: iter_time=7.630e-05, forward_time=0.032, loss=1.093, loss_att=0.469, loss_ctc=1.717, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.050e-04, train_time=0.090 -[v016] 2022-01-31 08:22:24,902 (trainer:653) INFO: 166epoch:train:460-486batch: iter_time=7.896e-05, forward_time=0.032, loss=0.947, loss_att=0.447, loss_ctc=1.447, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.050e-04, train_time=0.090 -[v016] 2022-01-31 08:22:27,386 (trainer:653) INFO: 166epoch:train:487-513batch: iter_time=8.845e-05, forward_time=0.032, loss=0.979, loss_att=0.438, loss_ctc=1.520, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.050e-04, train_time=0.092 -[v016] 2022-01-31 08:22:29,945 (trainer:653) INFO: 166epoch:train:514-540batch: iter_time=9.505e-05, forward_time=0.033, loss=0.965, loss_att=0.463, loss_ctc=1.467, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.050e-04, train_time=0.095 -[v016] 2022-01-31 08:23:04,141 (trainer:328) INFO: 166epoch results: [train] iter_time=0.004, forward_time=0.033, loss=1.033, loss_att=0.450, loss_ctc=1.616, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.051e-04, train_time=0.096, time=52.83 seconds, total_count=90802, gpu_max_cached_mem_GB=5.824, [valid] loss=7.968, loss_att=6.575, loss_ctc=9.362, acc=0.905, cer=0.100, wer=0.399, cer_ctc=0.144, time=5.83 seconds, total_count=29548, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.61 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:23:06,266 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 08:23:06,278 (trainer:261) INFO: 167/200epoch started. Estimated time to finish: 59 minutes and 21.49 seconds -[v016] 2022-01-31 08:23:08,940 (trainer:653) INFO: 167epoch:train:1-27batch: iter_time=0.003, forward_time=0.033, loss=0.945, loss_att=0.452, loss_ctc=1.439, acc=0.973, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.049e-04, train_time=0.098 -[v016] 2022-01-31 08:23:11,510 (trainer:653) INFO: 167epoch:train:28-54batch: iter_time=9.093e-05, forward_time=0.033, loss=0.899, loss_att=0.351, loss_ctc=1.448, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.049e-04, train_time=0.095 -[v016] 2022-01-31 08:23:13,982 (trainer:653) INFO: 167epoch:train:55-81batch: iter_time=8.611e-05, forward_time=0.032, loss=0.903, loss_att=0.481, loss_ctc=1.325, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.049e-04, train_time=0.091 -[v016] 2022-01-31 08:23:16,886 (trainer:653) INFO: 167epoch:train:82-108batch: iter_time=0.016, forward_time=0.032, loss=0.927, loss_att=0.444, loss_ctc=1.409, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.049e-04, train_time=0.107 -[v016] 2022-01-31 08:23:19,334 (trainer:653) INFO: 167epoch:train:109-135batch: iter_time=0.002, forward_time=0.031, loss=1.087, loss_att=0.475, loss_ctc=1.698, acc=0.977, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.049e-04, train_time=0.090 -[v016] 2022-01-31 08:23:21,741 (trainer:653) INFO: 167epoch:train:136-162batch: iter_time=7.600e-05, forward_time=0.031, loss=1.080, loss_att=0.447, loss_ctc=1.714, acc=0.979, backward_time=0.021, optim_step_time=0.020, optim0_lr0=1.049e-04, train_time=0.089 -[v016] 2022-01-31 08:23:24,212 (trainer:653) INFO: 167epoch:train:163-189batch: iter_time=7.591e-05, forward_time=0.031, loss=1.007, loss_att=0.438, loss_ctc=1.576, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.048e-04, train_time=0.091 -[v016] 2022-01-31 08:23:26,652 (trainer:653) INFO: 167epoch:train:190-216batch: iter_time=7.581e-05, forward_time=0.031, loss=0.971, loss_att=0.431, loss_ctc=1.510, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.048e-04, train_time=0.090 -[v016] 2022-01-31 08:23:29,175 (trainer:653) INFO: 167epoch:train:217-243batch: iter_time=7.781e-05, forward_time=0.032, loss=1.285, loss_att=0.559, loss_ctc=2.011, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.048e-04, train_time=0.093 -[v016] 2022-01-31 08:23:31,630 (trainer:653) INFO: 167epoch:train:244-270batch: iter_time=7.984e-05, forward_time=0.031, loss=1.074, loss_att=0.524, loss_ctc=1.624, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.048e-04, train_time=0.091 -[v016] 2022-01-31 08:23:34,133 (trainer:653) INFO: 167epoch:train:271-297batch: iter_time=8.086e-05, forward_time=0.032, loss=1.206, loss_att=0.456, loss_ctc=1.957, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.048e-04, train_time=0.092 -[v016] 2022-01-31 08:23:36,640 (trainer:653) INFO: 167epoch:train:298-324batch: iter_time=7.727e-05, forward_time=0.032, loss=1.055, loss_att=0.493, loss_ctc=1.616, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.048e-04, train_time=0.093 -[v016] 2022-01-31 08:23:39,155 (trainer:653) INFO: 167epoch:train:325-351batch: iter_time=8.071e-05, forward_time=0.033, loss=1.142, loss_att=0.434, loss_ctc=1.850, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.047e-04, train_time=0.093 -[v016] 2022-01-31 08:23:41,660 (trainer:653) INFO: 167epoch:train:352-378batch: iter_time=7.661e-05, forward_time=0.032, loss=0.943, loss_att=0.390, loss_ctc=1.497, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.047e-04, train_time=0.093 -[v016] 2022-01-31 08:23:44,134 (trainer:653) INFO: 167epoch:train:379-405batch: iter_time=7.552e-05, forward_time=0.031, loss=0.917, loss_att=0.361, loss_ctc=1.473, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.047e-04, train_time=0.091 -[v016] 2022-01-31 08:23:46,998 (trainer:653) INFO: 167epoch:train:406-432batch: iter_time=0.009, forward_time=0.033, loss=1.253, loss_att=0.492, loss_ctc=2.014, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.047e-04, train_time=0.106 -[v016] 2022-01-31 08:23:49,950 (trainer:653) INFO: 167epoch:train:433-459batch: iter_time=0.017, forward_time=0.032, loss=1.137, loss_att=0.447, loss_ctc=1.828, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.047e-04, train_time=0.109 -[v016] 2022-01-31 08:23:52,345 (trainer:653) INFO: 167epoch:train:460-486batch: iter_time=7.568e-05, forward_time=0.031, loss=0.935, loss_att=0.409, loss_ctc=1.461, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.047e-04, train_time=0.088 -[v016] 2022-01-31 08:23:54,814 (trainer:653) INFO: 167epoch:train:487-513batch: iter_time=7.752e-05, forward_time=0.032, loss=1.036, loss_att=0.476, loss_ctc=1.596, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.047e-04, train_time=0.091 -[v016] 2022-01-31 08:23:57,338 (trainer:653) INFO: 167epoch:train:514-540batch: iter_time=8.017e-05, forward_time=0.033, loss=1.220, loss_att=0.472, loss_ctc=1.967, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.046e-04, train_time=0.093 -[v016] 2022-01-31 08:24:31,924 (trainer:328) INFO: 167epoch results: [train] iter_time=0.002, forward_time=0.032, loss=1.045, loss_att=0.450, loss_ctc=1.640, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.048e-04, train_time=0.094, time=51.76 seconds, total_count=91349, gpu_max_cached_mem_GB=5.824, [valid] loss=7.883, loss_att=6.516, loss_ctc=9.251, acc=0.906, cer=0.098, wer=0.398, cer_ctc=0.141, time=6.11 seconds, total_count=29726, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.78 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:24:34,036 (trainer:375) INFO: The best model has been updated: train.acc -[v016] 2022-01-31 08:24:34,087 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/165epoch.pth -[v016] 2022-01-31 08:24:34,087 (trainer:261) INFO: 168/200epoch started. Estimated time to finish: 57 minutes and 32.94 seconds -[v016] 2022-01-31 08:24:36,732 (trainer:653) INFO: 168epoch:train:1-27batch: iter_time=0.003, forward_time=0.033, loss=0.848, loss_att=0.370, loss_ctc=1.326, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.046e-04, train_time=0.098 -[v016] 2022-01-31 08:24:39,286 (trainer:653) INFO: 168epoch:train:28-54batch: iter_time=8.827e-05, forward_time=0.033, loss=1.058, loss_att=0.473, loss_ctc=1.643, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.046e-04, train_time=0.094 -[v016] 2022-01-31 08:24:41,840 (trainer:653) INFO: 168epoch:train:55-81batch: iter_time=7.952e-05, forward_time=0.033, loss=1.023, loss_att=0.410, loss_ctc=1.636, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.046e-04, train_time=0.094 -[v016] 2022-01-31 08:24:44,263 (trainer:653) INFO: 168epoch:train:82-108batch: iter_time=7.378e-05, forward_time=0.031, loss=0.906, loss_att=0.416, loss_ctc=1.396, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.046e-04, train_time=0.090 -[v016] 2022-01-31 08:24:46,700 (trainer:653) INFO: 168epoch:train:109-135batch: iter_time=7.387e-05, forward_time=0.032, loss=1.070, loss_att=0.519, loss_ctc=1.622, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.046e-04, train_time=0.090 -[v016] 2022-01-31 08:24:49,204 (trainer:653) INFO: 168epoch:train:136-162batch: iter_time=7.311e-05, forward_time=0.032, loss=1.096, loss_att=0.437, loss_ctc=1.754, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.045e-04, train_time=0.093 -[v016] 2022-01-31 08:24:52,289 (trainer:653) INFO: 168epoch:train:163-189batch: iter_time=0.021, forward_time=0.033, loss=1.151, loss_att=0.461, loss_ctc=1.840, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.045e-04, train_time=0.114 -[v016] 2022-01-31 08:24:54,784 (trainer:653) INFO: 168epoch:train:190-216batch: iter_time=7.947e-05, forward_time=0.032, loss=1.158, loss_att=0.512, loss_ctc=1.805, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.045e-04, train_time=0.092 -[v016] 2022-01-31 08:24:57,249 (trainer:653) INFO: 168epoch:train:217-243batch: iter_time=7.778e-05, forward_time=0.032, loss=0.990, loss_att=0.451, loss_ctc=1.529, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.045e-04, train_time=0.091 -[v016] 2022-01-31 08:24:59,706 (trainer:653) INFO: 168epoch:train:244-270batch: iter_time=7.796e-05, forward_time=0.032, loss=1.044, loss_att=0.432, loss_ctc=1.656, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.045e-04, train_time=0.091 -[v016] 2022-01-31 08:25:02,186 (trainer:653) INFO: 168epoch:train:271-297batch: iter_time=7.693e-05, forward_time=0.032, loss=0.964, loss_att=0.401, loss_ctc=1.527, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.045e-04, train_time=0.092 -[v016] 2022-01-31 08:25:04,626 (trainer:653) INFO: 168epoch:train:298-324batch: iter_time=7.694e-05, forward_time=0.032, loss=1.046, loss_att=0.468, loss_ctc=1.624, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.044e-04, train_time=0.090 -[v016] 2022-01-31 08:25:07,083 (trainer:653) INFO: 168epoch:train:325-351batch: iter_time=7.820e-05, forward_time=0.032, loss=1.083, loss_att=0.512, loss_ctc=1.654, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.044e-04, train_time=0.091 -[v016] 2022-01-31 08:25:09,511 (trainer:653) INFO: 168epoch:train:352-378batch: iter_time=8.361e-05, forward_time=0.032, loss=1.103, loss_att=0.578, loss_ctc=1.629, acc=0.968, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.044e-04, train_time=0.090 -[v016] 2022-01-31 08:25:11,987 (trainer:653) INFO: 168epoch:train:379-405batch: iter_time=7.783e-05, forward_time=0.032, loss=1.225, loss_att=0.534, loss_ctc=1.916, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.044e-04, train_time=0.092 -[v016] 2022-01-31 08:25:14,573 (trainer:653) INFO: 168epoch:train:406-432batch: iter_time=8.626e-05, forward_time=0.034, loss=1.084, loss_att=0.458, loss_ctc=1.710, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.044e-04, train_time=0.096 -[v016] 2022-01-31 08:25:17,097 (trainer:653) INFO: 168epoch:train:433-459batch: iter_time=8.144e-05, forward_time=0.032, loss=1.011, loss_att=0.421, loss_ctc=1.602, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.044e-04, train_time=0.093 -[v016] 2022-01-31 08:25:19,601 (trainer:653) INFO: 168epoch:train:460-486batch: iter_time=7.972e-05, forward_time=0.032, loss=1.117, loss_att=0.509, loss_ctc=1.725, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.044e-04, train_time=0.093 -[v016] 2022-01-31 08:25:22,586 (trainer:653) INFO: 168epoch:train:487-513batch: iter_time=0.015, forward_time=0.033, loss=1.114, loss_att=0.491, loss_ctc=1.736, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.043e-04, train_time=0.110 -[v016] 2022-01-31 08:25:25,116 (trainer:653) INFO: 168epoch:train:514-540batch: iter_time=8.042e-05, forward_time=0.033, loss=1.083, loss_att=0.475, loss_ctc=1.691, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.043e-04, train_time=0.093 -[v016] 2022-01-31 08:25:58,946 (trainer:328) INFO: 168epoch results: [train] iter_time=0.002, forward_time=0.032, loss=1.054, loss_att=0.465, loss_ctc=1.643, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.045e-04, train_time=0.094, time=51.72 seconds, total_count=91896, gpu_max_cached_mem_GB=5.824, [valid] loss=7.996, loss_att=6.586, loss_ctc=9.405, acc=0.904, cer=0.100, wer=0.404, cer_ctc=0.144, time=5.45 seconds, total_count=29904, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.69 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:26:01,047 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 08:26:01,060 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/159epoch.pth -[v016] 2022-01-31 08:26:01,060 (trainer:261) INFO: 169/200epoch started. Estimated time to finish: 55 minutes and 44.49 seconds -[v016] 2022-01-31 08:26:03,755 (trainer:653) INFO: 169epoch:train:1-27batch: iter_time=0.003, forward_time=0.034, loss=1.128, loss_att=0.484, loss_ctc=1.772, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.043e-04, train_time=0.099 -[v016] 2022-01-31 08:26:06,237 (trainer:653) INFO: 169epoch:train:28-54batch: iter_time=8.443e-05, forward_time=0.032, loss=0.914, loss_att=0.397, loss_ctc=1.432, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.043e-04, train_time=0.092 -[v016] 2022-01-31 08:26:08,719 (trainer:653) INFO: 169epoch:train:55-81batch: iter_time=7.665e-05, forward_time=0.032, loss=0.866, loss_att=0.350, loss_ctc=1.383, acc=0.985, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.043e-04, train_time=0.092 -[v016] 2022-01-31 08:26:11,173 (trainer:653) INFO: 169epoch:train:82-108batch: iter_time=7.800e-05, forward_time=0.032, loss=0.990, loss_att=0.444, loss_ctc=1.535, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.043e-04, train_time=0.091 -[v016] 2022-01-31 08:26:13,690 (trainer:653) INFO: 169epoch:train:109-135batch: iter_time=8.102e-05, forward_time=0.033, loss=0.935, loss_att=0.394, loss_ctc=1.477, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.042e-04, train_time=0.093 -[v016] 2022-01-31 08:26:16,183 (trainer:653) INFO: 169epoch:train:136-162batch: iter_time=7.482e-05, forward_time=0.032, loss=1.065, loss_att=0.479, loss_ctc=1.651, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.042e-04, train_time=0.092 -[v016] 2022-01-31 08:26:18,697 (trainer:653) INFO: 169epoch:train:163-189batch: iter_time=7.461e-05, forward_time=0.033, loss=1.012, loss_att=0.422, loss_ctc=1.603, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.042e-04, train_time=0.093 -[v016] 2022-01-31 08:26:21,202 (trainer:653) INFO: 169epoch:train:190-216batch: iter_time=7.689e-05, forward_time=0.032, loss=0.970, loss_att=0.481, loss_ctc=1.460, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.042e-04, train_time=0.093 -[v016] 2022-01-31 08:26:23,675 (trainer:653) INFO: 169epoch:train:217-243batch: iter_time=7.880e-05, forward_time=0.032, loss=0.860, loss_att=0.374, loss_ctc=1.345, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.042e-04, train_time=0.091 -[v016] 2022-01-31 08:26:26,071 (trainer:653) INFO: 169epoch:train:244-270batch: iter_time=7.840e-05, forward_time=0.031, loss=0.892, loss_att=0.463, loss_ctc=1.320, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.042e-04, train_time=0.089 -[v016] 2022-01-31 08:26:28,550 (trainer:653) INFO: 169epoch:train:271-297batch: iter_time=7.919e-05, forward_time=0.032, loss=0.963, loss_att=0.488, loss_ctc=1.438, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.042e-04, train_time=0.092 -[v016] 2022-01-31 08:26:31,032 (trainer:653) INFO: 169epoch:train:298-324batch: iter_time=8.364e-05, forward_time=0.032, loss=1.035, loss_att=0.421, loss_ctc=1.649, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.041e-04, train_time=0.092 -[v016] 2022-01-31 08:26:33,538 (trainer:653) INFO: 169epoch:train:325-351batch: iter_time=7.887e-05, forward_time=0.032, loss=1.085, loss_att=0.486, loss_ctc=1.684, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.041e-04, train_time=0.093 -[v016] 2022-01-31 08:26:35,976 (trainer:653) INFO: 169epoch:train:352-378batch: iter_time=8.089e-05, forward_time=0.032, loss=1.022, loss_att=0.466, loss_ctc=1.577, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.041e-04, train_time=0.090 -[v016] 2022-01-31 08:26:38,500 (trainer:653) INFO: 169epoch:train:379-405batch: iter_time=9.686e-05, forward_time=0.032, loss=1.099, loss_att=0.480, loss_ctc=1.718, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.041e-04, train_time=0.093 -[v016] 2022-01-31 08:26:40,962 (trainer:653) INFO: 169epoch:train:406-432batch: iter_time=7.660e-05, forward_time=0.032, loss=0.996, loss_att=0.429, loss_ctc=1.562, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.041e-04, train_time=0.091 -[v016] 2022-01-31 08:26:43,473 (trainer:653) INFO: 169epoch:train:433-459batch: iter_time=7.681e-05, forward_time=0.032, loss=1.129, loss_att=0.499, loss_ctc=1.760, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.041e-04, train_time=0.093 -[v016] 2022-01-31 08:26:46,085 (trainer:653) INFO: 169epoch:train:460-486batch: iter_time=0.002, forward_time=0.033, loss=0.982, loss_att=0.367, loss_ctc=1.596, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.040e-04, train_time=0.097 -[v016] 2022-01-31 08:26:48,731 (trainer:653) INFO: 169epoch:train:487-513batch: iter_time=0.005, forward_time=0.032, loss=1.120, loss_att=0.422, loss_ctc=1.817, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.040e-04, train_time=0.098 -[v016] 2022-01-31 08:26:51,218 (trainer:653) INFO: 169epoch:train:514-540batch: iter_time=8.073e-05, forward_time=0.032, loss=1.089, loss_att=0.417, loss_ctc=1.761, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.040e-04, train_time=0.092 -[v016] 2022-01-31 08:27:25,603 (trainer:328) INFO: 169epoch results: [train] iter_time=5.880e-04, forward_time=0.032, loss=1.010, loss_att=0.440, loss_ctc=1.580, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.042e-04, train_time=0.093, time=50.86 seconds, total_count=92443, gpu_max_cached_mem_GB=5.824, [valid] loss=7.876, loss_att=6.480, loss_ctc=9.272, acc=0.905, cer=0.101, wer=0.400, cer_ctc=0.144, time=5.91 seconds, total_count=30082, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.77 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:27:27,762 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 08:27:27,813 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/162epoch.pth, exp/asr_train_asr_raw_en_word/164epoch.pth -[v016] 2022-01-31 08:27:27,813 (trainer:261) INFO: 170/200epoch started. Estimated time to finish: 53 minutes and 56.28 seconds -[v016] 2022-01-31 08:27:30,561 (trainer:653) INFO: 170epoch:train:1-27batch: iter_time=0.003, forward_time=0.034, loss=0.968, loss_att=0.358, loss_ctc=1.577, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.040e-04, train_time=0.101 -[v016] 2022-01-31 08:27:33,060 (trainer:653) INFO: 170epoch:train:28-54batch: iter_time=9.212e-05, forward_time=0.033, loss=0.979, loss_att=0.445, loss_ctc=1.514, acc=0.979, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.040e-04, train_time=0.092 -[v016] 2022-01-31 08:27:35,565 (trainer:653) INFO: 170epoch:train:55-81batch: iter_time=8.270e-05, forward_time=0.032, loss=1.045, loss_att=0.429, loss_ctc=1.661, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.040e-04, train_time=0.093 -[v016] 2022-01-31 08:27:38,035 (trainer:653) INFO: 170epoch:train:82-108batch: iter_time=8.025e-05, forward_time=0.032, loss=0.969, loss_att=0.445, loss_ctc=1.493, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.040e-04, train_time=0.091 -[v016] 2022-01-31 08:27:40,557 (trainer:653) INFO: 170epoch:train:109-135batch: iter_time=7.916e-05, forward_time=0.033, loss=1.097, loss_att=0.485, loss_ctc=1.709, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.039e-04, train_time=0.093 -[v016] 2022-01-31 08:27:43,084 (trainer:653) INFO: 170epoch:train:136-162batch: iter_time=0.001, forward_time=0.032, loss=1.142, loss_att=0.500, loss_ctc=1.784, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.039e-04, train_time=0.093 -[v016] 2022-01-31 08:27:45,568 (trainer:653) INFO: 170epoch:train:163-189batch: iter_time=7.539e-05, forward_time=0.032, loss=1.040, loss_att=0.474, loss_ctc=1.607, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.039e-04, train_time=0.092 -[v016] 2022-01-31 08:27:48,087 (trainer:653) INFO: 170epoch:train:190-216batch: iter_time=7.808e-05, forward_time=0.032, loss=1.012, loss_att=0.471, loss_ctc=1.553, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.039e-04, train_time=0.093 -[v016] 2022-01-31 08:27:50,954 (trainer:653) INFO: 170epoch:train:217-243batch: iter_time=0.016, forward_time=0.031, loss=0.957, loss_att=0.477, loss_ctc=1.437, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.039e-04, train_time=0.106 -[v016] 2022-01-31 08:27:53,447 (trainer:653) INFO: 170epoch:train:244-270batch: iter_time=7.928e-05, forward_time=0.032, loss=1.265, loss_att=0.521, loss_ctc=2.010, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.039e-04, train_time=0.092 -[v016] 2022-01-31 08:27:56,020 (trainer:653) INFO: 170epoch:train:271-297batch: iter_time=8.458e-05, forward_time=0.032, loss=1.198, loss_att=0.452, loss_ctc=1.943, acc=0.980, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.038e-04, train_time=0.095 -[v016] 2022-01-31 08:27:58,565 (trainer:653) INFO: 170epoch:train:298-324batch: iter_time=8.729e-05, forward_time=0.032, loss=1.044, loss_att=0.465, loss_ctc=1.624, acc=0.977, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.038e-04, train_time=0.094 -[v016] 2022-01-31 08:28:01,097 (trainer:653) INFO: 170epoch:train:325-351batch: iter_time=9.033e-05, forward_time=0.032, loss=0.803, loss_att=0.369, loss_ctc=1.238, acc=0.980, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.038e-04, train_time=0.094 -[v016] 2022-01-31 08:28:03,608 (trainer:653) INFO: 170epoch:train:352-378batch: iter_time=9.013e-05, forward_time=0.032, loss=0.985, loss_att=0.416, loss_ctc=1.555, acc=0.978, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.038e-04, train_time=0.093 -[v016] 2022-01-31 08:28:06,226 (trainer:653) INFO: 170epoch:train:379-405batch: iter_time=9.258e-05, forward_time=0.033, loss=1.161, loss_att=0.476, loss_ctc=1.845, acc=0.978, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.038e-04, train_time=0.097 -[v016] 2022-01-31 08:28:08,902 (trainer:653) INFO: 170epoch:train:406-432batch: iter_time=9.480e-05, forward_time=0.035, loss=1.298, loss_att=0.487, loss_ctc=2.108, acc=0.980, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.038e-04, train_time=0.099 -[v016] 2022-01-31 08:28:11,525 (trainer:653) INFO: 170epoch:train:433-459batch: iter_time=8.992e-05, forward_time=0.034, loss=1.037, loss_att=0.437, loss_ctc=1.638, acc=0.981, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.038e-04, train_time=0.097 -[v016] 2022-01-31 08:28:14,075 (trainer:653) INFO: 170epoch:train:460-486batch: iter_time=9.371e-05, forward_time=0.033, loss=0.873, loss_att=0.390, loss_ctc=1.356, acc=0.982, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.037e-04, train_time=0.094 -[v016] 2022-01-31 08:28:16,573 (trainer:653) INFO: 170epoch:train:487-513batch: iter_time=8.769e-05, forward_time=0.032, loss=0.809, loss_att=0.372, loss_ctc=1.246, acc=0.978, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.037e-04, train_time=0.092 -[v016] 2022-01-31 08:28:19,148 (trainer:653) INFO: 170epoch:train:514-540batch: iter_time=8.323e-05, forward_time=0.032, loss=1.118, loss_att=0.509, loss_ctc=1.726, acc=0.975, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.037e-04, train_time=0.095 -[v016] 2022-01-31 08:28:55,498 (trainer:328) INFO: 170epoch results: [train] iter_time=0.001, forward_time=0.032, loss=1.042, loss_att=0.449, loss_ctc=1.634, acc=0.978, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.039e-04, train_time=0.095, time=52.07 seconds, total_count=92990, gpu_max_cached_mem_GB=5.824, [valid] loss=7.870, loss_att=6.488, loss_ctc=9.253, acc=0.904, cer=0.100, wer=0.404, cer_ctc=0.146, time=7.44 seconds, total_count=30260, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.18 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:28:57,775 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 08:28:57,818 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/161epoch.pth -[v016] 2022-01-31 08:28:57,818 (trainer:261) INFO: 171/200epoch started. Estimated time to finish: 52 minutes and 9 seconds -[v016] 2022-01-31 08:29:00,578 (trainer:653) INFO: 171epoch:train:1-27batch: iter_time=0.004, forward_time=0.034, loss=1.097, loss_att=0.359, loss_ctc=1.836, acc=0.984, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.037e-04, train_time=0.102 -[v016] 2022-01-31 08:29:03,101 (trainer:653) INFO: 171epoch:train:28-54batch: iter_time=8.544e-05, forward_time=0.032, loss=0.945, loss_att=0.398, loss_ctc=1.492, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.037e-04, train_time=0.093 -[v016] 2022-01-31 08:29:05,514 (trainer:653) INFO: 171epoch:train:55-81batch: iter_time=8.370e-05, forward_time=0.031, loss=0.791, loss_att=0.367, loss_ctc=1.215, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.037e-04, train_time=0.089 -[v016] 2022-01-31 08:29:07,932 (trainer:653) INFO: 171epoch:train:82-108batch: iter_time=7.520e-05, forward_time=0.031, loss=0.912, loss_att=0.434, loss_ctc=1.390, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.036e-04, train_time=0.089 -[v016] 2022-01-31 08:29:10,416 (trainer:653) INFO: 171epoch:train:109-135batch: iter_time=8.944e-05, forward_time=0.031, loss=1.029, loss_att=0.451, loss_ctc=1.606, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.036e-04, train_time=0.092 -[v016] 2022-01-31 08:29:13,631 (trainer:653) INFO: 171epoch:train:136-162batch: iter_time=0.022, forward_time=0.033, loss=1.155, loss_att=0.490, loss_ctc=1.820, acc=0.976, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.036e-04, train_time=0.119 -[v016] 2022-01-31 08:29:16,068 (trainer:653) INFO: 171epoch:train:163-189batch: iter_time=7.985e-05, forward_time=0.031, loss=1.107, loss_att=0.485, loss_ctc=1.730, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.036e-04, train_time=0.090 -[v016] 2022-01-31 08:29:18,567 (trainer:653) INFO: 171epoch:train:190-216batch: iter_time=7.733e-05, forward_time=0.031, loss=1.231, loss_att=0.538, loss_ctc=1.925, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.036e-04, train_time=0.092 -[v016] 2022-01-31 08:29:21,033 (trainer:653) INFO: 171epoch:train:217-243batch: iter_time=8.214e-05, forward_time=0.031, loss=1.006, loss_att=0.449, loss_ctc=1.562, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.036e-04, train_time=0.091 -[v016] 2022-01-31 08:29:23,785 (trainer:653) INFO: 171epoch:train:244-270batch: iter_time=0.008, forward_time=0.032, loss=0.882, loss_att=0.420, loss_ctc=1.344, acc=0.980, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.036e-04, train_time=0.102 -[v016] 2022-01-31 08:29:26,392 (trainer:653) INFO: 171epoch:train:271-297batch: iter_time=2.237e-04, forward_time=0.033, loss=1.167, loss_att=0.481, loss_ctc=1.853, acc=0.978, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.035e-04, train_time=0.096 -[v016] 2022-01-31 08:29:29,216 (trainer:653) INFO: 171epoch:train:298-324batch: iter_time=1.251e-04, forward_time=0.036, loss=1.003, loss_att=0.393, loss_ctc=1.613, acc=0.983, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.035e-04, train_time=0.104 -[v016] 2022-01-31 08:29:32,078 (trainer:653) INFO: 171epoch:train:325-351batch: iter_time=0.009, forward_time=0.033, loss=1.060, loss_att=0.486, loss_ctc=1.633, acc=0.975, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.035e-04, train_time=0.106 -[v016] 2022-01-31 08:29:34,736 (trainer:653) INFO: 171epoch:train:352-378batch: iter_time=1.200e-04, forward_time=0.033, loss=0.870, loss_att=0.384, loss_ctc=1.356, acc=0.982, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.035e-04, train_time=0.098 -[v016] 2022-01-31 08:29:37,396 (trainer:653) INFO: 171epoch:train:379-405batch: iter_time=9.204e-05, forward_time=0.034, loss=1.119, loss_att=0.471, loss_ctc=1.767, acc=0.977, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.035e-04, train_time=0.098 -[v016] 2022-01-31 08:29:40,446 (trainer:653) INFO: 171epoch:train:406-432batch: iter_time=0.013, forward_time=0.034, loss=1.022, loss_att=0.451, loss_ctc=1.593, acc=0.980, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.035e-04, train_time=0.113 -[v016] 2022-01-31 08:29:43,248 (trainer:653) INFO: 171epoch:train:433-459batch: iter_time=1.102e-04, forward_time=0.036, loss=1.023, loss_att=0.417, loss_ctc=1.629, acc=0.979, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.035e-04, train_time=0.104 -[v016] 2022-01-31 08:29:46,044 (trainer:653) INFO: 171epoch:train:460-486batch: iter_time=9.706e-05, forward_time=0.036, loss=1.199, loss_att=0.491, loss_ctc=1.907, acc=0.979, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.034e-04, train_time=0.103 -[v016] 2022-01-31 08:29:48,787 (trainer:653) INFO: 171epoch:train:487-513batch: iter_time=9.644e-05, forward_time=0.035, loss=1.165, loss_att=0.552, loss_ctc=1.779, acc=0.970, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.034e-04, train_time=0.101 -[v016] 2022-01-31 08:29:51,416 (trainer:653) INFO: 171epoch:train:514-540batch: iter_time=9.535e-05, forward_time=0.033, loss=1.011, loss_att=0.473, loss_ctc=1.550, acc=0.977, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.034e-04, train_time=0.097 -[v016] 2022-01-31 08:30:31,241 (trainer:328) INFO: 171epoch results: [train] iter_time=0.003, forward_time=0.033, loss=1.041, loss_att=0.450, loss_ctc=1.633, acc=0.978, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.035e-04, train_time=0.099, time=54.38 seconds, total_count=93537, gpu_max_cached_mem_GB=5.824, [valid] loss=7.981, loss_att=6.510, loss_ctc=9.452, acc=0.901, cer=0.104, wer=0.411, cer_ctc=0.150, time=6.46 seconds, total_count=30438, gpu_max_cached_mem_GB=5.824, [att_plot] time=32.56 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:30:33,607 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 08:30:33,619 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/168epoch.pth -[v016] 2022-01-31 08:30:33,619 (trainer:261) INFO: 172/200epoch started. Estimated time to finish: 50 minutes and 23.07 seconds -[v016] 2022-01-31 08:30:37,994 (trainer:653) INFO: 172epoch:train:1-27batch: iter_time=0.011, forward_time=0.059, loss=1.035, loss_att=0.404, loss_ctc=1.665, acc=0.983, backward_time=0.038, optim_step_time=0.025, optim0_lr0=1.034e-04, train_time=0.158 -[v016] 2022-01-31 08:30:40,696 (trainer:653) INFO: 172epoch:train:28-54batch: iter_time=0.005, forward_time=0.032, loss=1.272, loss_att=0.468, loss_ctc=2.077, acc=0.982, backward_time=0.021, optim_step_time=0.022, optim0_lr0=1.034e-04, train_time=0.100 -[v016] 2022-01-31 08:30:43,987 (trainer:653) INFO: 172epoch:train:55-81batch: iter_time=0.002, forward_time=0.040, loss=0.878, loss_att=0.391, loss_ctc=1.366, acc=0.979, backward_time=0.023, optim_step_time=0.026, optim0_lr0=1.034e-04, train_time=0.122 -[v016] 2022-01-31 08:30:46,738 (trainer:653) INFO: 172epoch:train:82-108batch: iter_time=1.265e-04, forward_time=0.034, loss=0.872, loss_att=0.415, loss_ctc=1.329, acc=0.975, backward_time=0.025, optim_step_time=0.024, optim0_lr0=1.033e-04, train_time=0.102 -[v016] 2022-01-31 08:30:50,151 (trainer:653) INFO: 172epoch:train:109-135batch: iter_time=0.027, forward_time=0.034, loss=1.000, loss_att=0.374, loss_ctc=1.626, acc=0.982, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.033e-04, train_time=0.126 -[v016] 2022-01-31 08:30:52,838 (trainer:653) INFO: 172epoch:train:136-162batch: iter_time=1.162e-04, forward_time=0.034, loss=0.920, loss_att=0.385, loss_ctc=1.455, acc=0.983, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.033e-04, train_time=0.099 -[v016] 2022-01-31 08:30:56,717 (trainer:653) INFO: 172epoch:train:163-189batch: iter_time=0.038, forward_time=0.035, loss=1.211, loss_att=0.549, loss_ctc=1.873, acc=0.976, backward_time=0.023, optim_step_time=0.024, optim0_lr0=1.033e-04, train_time=0.143 -[v016] 2022-01-31 08:30:59,641 (trainer:653) INFO: 172epoch:train:190-216batch: iter_time=0.009, forward_time=0.033, loss=0.924, loss_att=0.352, loss_ctc=1.496, acc=0.982, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.033e-04, train_time=0.108 -[v016] 2022-01-31 08:31:03,198 (trainer:653) INFO: 172epoch:train:217-243batch: iter_time=0.032, forward_time=0.033, loss=1.013, loss_att=0.442, loss_ctc=1.584, acc=0.979, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.033e-04, train_time=0.132 -[v016] 2022-01-31 08:31:07,818 (trainer:653) INFO: 172epoch:train:244-270batch: iter_time=0.070, forward_time=0.034, loss=0.875, loss_att=0.367, loss_ctc=1.382, acc=0.981, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.033e-04, train_time=0.170 -[v016] 2022-01-31 08:31:10,751 (trainer:653) INFO: 172epoch:train:271-297batch: iter_time=0.006, forward_time=0.034, loss=0.841, loss_att=0.356, loss_ctc=1.326, acc=0.983, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.032e-04, train_time=0.109 -[v016] 2022-01-31 08:31:16,243 (trainer:653) INFO: 172epoch:train:298-324batch: iter_time=0.016, forward_time=0.066, loss=1.039, loss_att=0.444, loss_ctc=1.634, acc=0.979, backward_time=0.072, optim_step_time=0.025, optim0_lr0=1.032e-04, train_time=0.203 -[v016] 2022-01-31 08:31:19,456 (trainer:653) INFO: 172epoch:train:325-351batch: iter_time=0.018, forward_time=0.034, loss=1.154, loss_att=0.489, loss_ctc=1.820, acc=0.978, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.032e-04, train_time=0.119 -[v016] 2022-01-31 08:31:23,818 (trainer:653) INFO: 172epoch:train:352-378batch: iter_time=0.064, forward_time=0.033, loss=1.073, loss_att=0.551, loss_ctc=1.594, acc=0.970, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.032e-04, train_time=0.161 -[v016] 2022-01-31 08:31:27,671 (trainer:653) INFO: 172epoch:train:379-405batch: iter_time=0.047, forward_time=0.032, loss=1.117, loss_att=0.528, loss_ctc=1.706, acc=0.974, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.032e-04, train_time=0.142 -[v016] 2022-01-31 08:31:30,989 (trainer:653) INFO: 172epoch:train:406-432batch: iter_time=0.006, forward_time=0.048, loss=1.069, loss_att=0.439, loss_ctc=1.699, acc=0.978, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.032e-04, train_time=0.123 -[v016] 2022-01-31 08:31:33,918 (trainer:653) INFO: 172epoch:train:433-459batch: iter_time=0.011, forward_time=0.033, loss=0.902, loss_att=0.424, loss_ctc=1.379, acc=0.977, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.032e-04, train_time=0.108 -[v016] 2022-01-31 08:31:40,607 (trainer:653) INFO: 172epoch:train:460-486batch: iter_time=0.086, forward_time=0.052, loss=1.019, loss_att=0.401, loss_ctc=1.637, acc=0.981, backward_time=0.054, optim_step_time=0.028, optim0_lr0=1.031e-04, train_time=0.248 -[v016] 2022-01-31 08:31:43,640 (trainer:653) INFO: 172epoch:train:487-513batch: iter_time=0.013, forward_time=0.033, loss=1.166, loss_att=0.434, loss_ctc=1.897, acc=0.980, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.031e-04, train_time=0.112 -[v016] 2022-01-31 08:31:49,155 (trainer:653) INFO: 172epoch:train:514-540batch: iter_time=0.068, forward_time=0.049, loss=1.033, loss_att=0.401, loss_ctc=1.664, acc=0.981, backward_time=0.023, optim_step_time=0.026, optim0_lr0=1.031e-04, train_time=0.203 -[v016] 2022-01-31 08:33:03,766 (trainer:328) INFO: 172epoch results: [train] iter_time=0.027, forward_time=0.040, loss=1.017, loss_att=0.430, loss_ctc=1.604, acc=0.979, backward_time=0.028, optim_step_time=0.024, optim0_lr0=1.032e-04, train_time=0.141, time=1 minute and 17.76 seconds, total_count=94084, gpu_max_cached_mem_GB=5.824, [valid] loss=7.876, loss_att=6.404, loss_ctc=9.349, acc=0.905, cer=0.097, wer=0.398, cer_ctc=0.140, time=30.4 seconds, total_count=30616, gpu_max_cached_mem_GB=5.824, [att_plot] time=41.86 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:33:06,991 (trainer:375) INFO: The best model has been updated: train.acc -[v016] 2022-01-31 08:33:07,005 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/163epoch.pth -[v016] 2022-01-31 08:33:07,008 (trainer:261) INFO: 173/200epoch started. Estimated time to finish: 48 minutes and 47.88 seconds -[v016] 2022-01-31 08:33:22,058 (trainer:653) INFO: 173epoch:train:1-27batch: iter_time=0.387, forward_time=0.057, loss=1.269, loss_att=0.436, loss_ctc=2.102, acc=0.984, backward_time=0.041, optim_step_time=0.030, optim0_lr0=1.031e-04, train_time=0.550 -[v016] 2022-01-31 08:33:35,972 (trainer:653) INFO: 173epoch:train:28-54batch: iter_time=0.402, forward_time=0.038, loss=0.978, loss_att=0.451, loss_ctc=1.504, acc=0.977, backward_time=0.024, optim_step_time=0.026, optim0_lr0=1.031e-04, train_time=0.515 -[v016] 2022-01-31 08:33:50,018 (trainer:653) INFO: 173epoch:train:55-81batch: iter_time=0.327, forward_time=0.106, loss=0.958, loss_att=0.377, loss_ctc=1.539, acc=0.983, backward_time=0.032, optim_step_time=0.029, optim0_lr0=1.031e-04, train_time=0.520 -[v016] 2022-01-31 08:34:05,496 (trainer:653) INFO: 173epoch:train:82-108batch: iter_time=0.366, forward_time=0.115, loss=1.139, loss_att=0.462, loss_ctc=1.817, acc=0.980, backward_time=0.025, optim_step_time=0.030, optim0_lr0=1.030e-04, train_time=0.572 -[v016] 2022-01-31 08:34:16,572 (trainer:653) INFO: 173epoch:train:109-135batch: iter_time=0.314, forward_time=0.033, loss=0.958, loss_att=0.380, loss_ctc=1.537, acc=0.983, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.030e-04, train_time=0.410 -[v016] 2022-01-31 08:34:28,171 (trainer:653) INFO: 173epoch:train:136-162batch: iter_time=0.328, forward_time=0.034, loss=1.092, loss_att=0.491, loss_ctc=1.693, acc=0.977, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.030e-04, train_time=0.429 -[v016] 2022-01-31 08:34:39,762 (trainer:653) INFO: 173epoch:train:163-189batch: iter_time=0.330, forward_time=0.034, loss=0.887, loss_att=0.467, loss_ctc=1.307, acc=0.976, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.030e-04, train_time=0.429 -[v016] 2022-01-31 08:34:49,543 (trainer:653) INFO: 173epoch:train:190-216batch: iter_time=0.260, forward_time=0.034, loss=0.737, loss_att=0.290, loss_ctc=1.183, acc=0.986, backward_time=0.023, optim_step_time=0.024, optim0_lr0=1.030e-04, train_time=0.362 -[v016] 2022-01-31 08:34:58,949 (trainer:653) INFO: 173epoch:train:217-243batch: iter_time=0.252, forward_time=0.033, loss=0.829, loss_att=0.386, loss_ctc=1.273, acc=0.978, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.030e-04, train_time=0.348 -[v016] 2022-01-31 08:35:13,135 (trainer:653) INFO: 173epoch:train:244-270batch: iter_time=0.424, forward_time=0.035, loss=0.893, loss_att=0.327, loss_ctc=1.460, acc=0.987, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.030e-04, train_time=0.525 -[v016] 2022-01-31 08:35:23,129 (trainer:653) INFO: 173epoch:train:271-297batch: iter_time=0.265, forward_time=0.034, loss=1.118, loss_att=0.489, loss_ctc=1.746, acc=0.972, backward_time=0.023, optim_step_time=0.026, optim0_lr0=1.029e-04, train_time=0.370 -[v016] 2022-01-31 08:35:33,342 (trainer:653) INFO: 173epoch:train:298-324batch: iter_time=0.279, forward_time=0.034, loss=1.256, loss_att=0.488, loss_ctc=2.024, acc=0.978, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.029e-04, train_time=0.378 -[v016] 2022-01-31 08:35:45,201 (trainer:653) INFO: 173epoch:train:325-351batch: iter_time=0.336, forward_time=0.035, loss=1.095, loss_att=0.477, loss_ctc=1.713, acc=0.978, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.029e-04, train_time=0.439 -[v016] 2022-01-31 08:35:53,681 (trainer:653) INFO: 173epoch:train:352-378batch: iter_time=0.216, forward_time=0.033, loss=0.914, loss_att=0.447, loss_ctc=1.382, acc=0.976, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.029e-04, train_time=0.314 -[v016] 2022-01-31 08:36:04,497 (trainer:653) INFO: 173epoch:train:379-405batch: iter_time=0.237, forward_time=0.062, loss=1.016, loss_att=0.447, loss_ctc=1.584, acc=0.978, backward_time=0.027, optim_step_time=0.046, optim0_lr0=1.029e-04, train_time=0.400 -[v016] 2022-01-31 08:36:16,060 (trainer:653) INFO: 173epoch:train:406-432batch: iter_time=0.333, forward_time=0.032, loss=1.001, loss_att=0.443, loss_ctc=1.559, acc=0.980, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.029e-04, train_time=0.428 -[v016] 2022-01-31 08:36:24,069 (trainer:653) INFO: 173epoch:train:433-459batch: iter_time=0.201, forward_time=0.032, loss=1.035, loss_att=0.472, loss_ctc=1.597, acc=0.976, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.029e-04, train_time=0.296 -[v016] 2022-01-31 08:36:34,125 (trainer:653) INFO: 173epoch:train:460-486batch: iter_time=0.273, forward_time=0.034, loss=1.025, loss_att=0.454, loss_ctc=1.596, acc=0.982, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.028e-04, train_time=0.372 -[v016] 2022-01-31 08:36:43,741 (trainer:653) INFO: 173epoch:train:487-513batch: iter_time=0.257, forward_time=0.034, loss=1.114, loss_att=0.500, loss_ctc=1.729, acc=0.976, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.028e-04, train_time=0.356 -[v016] 2022-01-31 08:36:52,525 (trainer:653) INFO: 173epoch:train:514-540batch: iter_time=0.229, forward_time=0.033, loss=1.146, loss_att=0.507, loss_ctc=1.786, acc=0.977, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.028e-04, train_time=0.325 -[v016] 2022-01-31 08:38:19,658 (trainer:328) INFO: 173epoch results: [train] iter_time=0.301, forward_time=0.044, loss=1.016, loss_att=0.438, loss_ctc=1.595, acc=0.979, backward_time=0.025, optim_step_time=0.025, optim0_lr0=1.029e-04, train_time=0.416, time=3 minutes and 48.17 seconds, total_count=94631, gpu_max_cached_mem_GB=5.824, [valid] loss=7.952, loss_att=6.467, loss_ctc=9.436, acc=0.904, cer=0.100, wer=0.400, cer_ctc=0.146, time=54.91 seconds, total_count=30794, gpu_max_cached_mem_GB=5.824, [att_plot] time=29.51 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:38:23,103 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 08:38:23,115 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/170epoch.pth -[v016] 2022-01-31 08:38:23,115 (trainer:261) INFO: 174/200epoch started. Estimated time to finish: 47 minutes and 40.64 seconds -[v016] 2022-01-31 08:38:26,282 (trainer:653) INFO: 174epoch:train:1-27batch: iter_time=0.016, forward_time=0.031, loss=0.891, loss_att=0.348, loss_ctc=1.434, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.028e-04, train_time=0.109 -[v016] 2022-01-31 08:38:28,777 (trainer:653) INFO: 174epoch:train:28-54batch: iter_time=0.002, forward_time=0.031, loss=1.012, loss_att=0.426, loss_ctc=1.598, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.028e-04, train_time=0.093 -[v016] 2022-01-31 08:38:31,421 (trainer:653) INFO: 174epoch:train:55-81batch: iter_time=8.448e-04, forward_time=0.036, loss=1.102, loss_att=0.511, loss_ctc=1.693, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.028e-04, train_time=0.098 -[v016] 2022-01-31 08:38:34,235 (trainer:653) INFO: 174epoch:train:82-108batch: iter_time=0.009, forward_time=0.033, loss=1.099, loss_att=0.390, loss_ctc=1.807, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.027e-04, train_time=0.104 -[v016] 2022-01-31 08:38:36,631 (trainer:653) INFO: 174epoch:train:109-135batch: iter_time=7.513e-05, forward_time=0.030, loss=1.024, loss_att=0.520, loss_ctc=1.528, acc=0.970, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.027e-04, train_time=0.089 -[v016] 2022-01-31 08:38:39,393 (trainer:653) INFO: 174epoch:train:136-162batch: iter_time=0.009, forward_time=0.032, loss=1.166, loss_att=0.487, loss_ctc=1.845, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.027e-04, train_time=0.102 -[v016] 2022-01-31 08:38:41,865 (trainer:653) INFO: 174epoch:train:163-189batch: iter_time=7.734e-05, forward_time=0.032, loss=0.924, loss_att=0.443, loss_ctc=1.405, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.027e-04, train_time=0.091 -[v016] 2022-01-31 08:38:44,496 (trainer:653) INFO: 174epoch:train:190-216batch: iter_time=0.005, forward_time=0.032, loss=1.080, loss_att=0.473, loss_ctc=1.687, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.027e-04, train_time=0.097 -[v016] 2022-01-31 08:38:47,141 (trainer:653) INFO: 174epoch:train:217-243batch: iter_time=8.889e-05, forward_time=0.034, loss=1.032, loss_att=0.398, loss_ctc=1.666, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.027e-04, train_time=0.098 -[v016] 2022-01-31 08:38:49,638 (trainer:653) INFO: 174epoch:train:244-270batch: iter_time=7.791e-05, forward_time=0.032, loss=1.119, loss_att=0.467, loss_ctc=1.772, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.027e-04, train_time=0.092 -[v016] 2022-01-31 08:38:52,080 (trainer:653) INFO: 174epoch:train:271-297batch: iter_time=7.952e-05, forward_time=0.031, loss=1.088, loss_att=0.450, loss_ctc=1.726, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.026e-04, train_time=0.090 -[v016] 2022-01-31 08:38:54,490 (trainer:653) INFO: 174epoch:train:298-324batch: iter_time=7.486e-05, forward_time=0.030, loss=0.980, loss_att=0.435, loss_ctc=1.525, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.026e-04, train_time=0.089 -[v016] 2022-01-31 08:38:57,357 (trainer:653) INFO: 174epoch:train:325-351batch: iter_time=7.716e-05, forward_time=0.045, loss=1.050, loss_att=0.408, loss_ctc=1.693, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.026e-04, train_time=0.106 -[v016] 2022-01-31 08:38:59,826 (trainer:653) INFO: 174epoch:train:352-378batch: iter_time=7.756e-05, forward_time=0.031, loss=0.932, loss_att=0.426, loss_ctc=1.437, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.026e-04, train_time=0.091 -[v016] 2022-01-31 08:39:02,437 (trainer:653) INFO: 174epoch:train:379-405batch: iter_time=0.001, forward_time=0.033, loss=1.044, loss_att=0.390, loss_ctc=1.697, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.026e-04, train_time=0.097 -[v016] 2022-01-31 08:39:04,891 (trainer:653) INFO: 174epoch:train:406-432batch: iter_time=7.656e-05, forward_time=0.031, loss=0.974, loss_att=0.432, loss_ctc=1.516, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.026e-04, train_time=0.091 -[v016] 2022-01-31 08:39:07,328 (trainer:653) INFO: 174epoch:train:433-459batch: iter_time=8.304e-05, forward_time=0.031, loss=0.881, loss_att=0.395, loss_ctc=1.367, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.026e-04, train_time=0.090 -[v016] 2022-01-31 08:39:10,083 (trainer:653) INFO: 174epoch:train:460-486batch: iter_time=0.011, forward_time=0.032, loss=1.016, loss_att=0.484, loss_ctc=1.547, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.025e-04, train_time=0.102 -[v016] 2022-01-31 08:39:12,572 (trainer:653) INFO: 174epoch:train:487-513batch: iter_time=7.733e-05, forward_time=0.032, loss=1.005, loss_att=0.494, loss_ctc=1.515, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.025e-04, train_time=0.092 -[v016] 2022-01-31 08:39:15,187 (trainer:653) INFO: 174epoch:train:514-540batch: iter_time=0.006, forward_time=0.031, loss=0.952, loss_att=0.399, loss_ctc=1.505, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.025e-04, train_time=0.097 -[v016] 2022-01-31 08:39:50,808 (trainer:328) INFO: 174epoch results: [train] iter_time=0.003, forward_time=0.033, loss=1.021, loss_att=0.439, loss_ctc=1.603, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.026e-04, train_time=0.096, time=52.93 seconds, total_count=95178, gpu_max_cached_mem_GB=5.824, [valid] loss=7.884, loss_att=6.509, loss_ctc=9.258, acc=0.907, cer=0.098, wer=0.394, cer_ctc=0.140, time=6.83 seconds, total_count=30972, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.89 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:39:52,817 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 08:39:52,830 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/142epoch.pth, exp/asr_train_asr_raw_en_word/171epoch.pth -[v016] 2022-01-31 08:39:52,830 (trainer:261) INFO: 175/200epoch started. Estimated time to finish: 45 minutes and 51.95 seconds -[v016] 2022-01-31 08:39:55,501 (trainer:653) INFO: 175epoch:train:1-27batch: iter_time=0.003, forward_time=0.033, loss=0.967, loss_att=0.429, loss_ctc=1.505, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.025e-04, train_time=0.099 -[v016] 2022-01-31 08:39:58,055 (trainer:653) INFO: 175epoch:train:28-54batch: iter_time=8.132e-05, forward_time=0.034, loss=1.099, loss_att=0.400, loss_ctc=1.798, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.025e-04, train_time=0.094 -[v016] 2022-01-31 08:40:00,541 (trainer:653) INFO: 175epoch:train:55-81batch: iter_time=8.181e-05, forward_time=0.032, loss=0.826, loss_att=0.386, loss_ctc=1.266, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.025e-04, train_time=0.092 -[v016] 2022-01-31 08:40:03,027 (trainer:653) INFO: 175epoch:train:82-108batch: iter_time=8.047e-05, forward_time=0.032, loss=1.056, loss_att=0.454, loss_ctc=1.658, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.025e-04, train_time=0.092 -[v016] 2022-01-31 08:40:05,497 (trainer:653) INFO: 175epoch:train:109-135batch: iter_time=7.880e-05, forward_time=0.032, loss=1.060, loss_att=0.543, loss_ctc=1.578, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.024e-04, train_time=0.091 -[v016] 2022-01-31 08:40:08,015 (trainer:653) INFO: 175epoch:train:136-162batch: iter_time=8.267e-05, forward_time=0.033, loss=1.035, loss_att=0.502, loss_ctc=1.569, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.024e-04, train_time=0.093 -[v016] 2022-01-31 08:40:10,537 (trainer:653) INFO: 175epoch:train:163-189batch: iter_time=7.650e-05, forward_time=0.033, loss=1.047, loss_att=0.459, loss_ctc=1.636, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.024e-04, train_time=0.093 -[v016] 2022-01-31 08:40:13,036 (trainer:653) INFO: 175epoch:train:190-216batch: iter_time=7.665e-05, forward_time=0.033, loss=0.939, loss_att=0.356, loss_ctc=1.521, acc=0.985, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.024e-04, train_time=0.092 -[v016] 2022-01-31 08:40:15,533 (trainer:653) INFO: 175epoch:train:217-243batch: iter_time=7.729e-05, forward_time=0.033, loss=1.005, loss_att=0.416, loss_ctc=1.594, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.024e-04, train_time=0.092 -[v016] 2022-01-31 08:40:18,076 (trainer:653) INFO: 175epoch:train:244-270batch: iter_time=0.003, forward_time=0.032, loss=0.971, loss_att=0.445, loss_ctc=1.497, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.024e-04, train_time=0.094 -[v016] 2022-01-31 08:40:20,544 (trainer:653) INFO: 175epoch:train:271-297batch: iter_time=7.992e-05, forward_time=0.032, loss=0.969, loss_att=0.395, loss_ctc=1.542, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.023e-04, train_time=0.091 -[v016] 2022-01-31 08:40:22,993 (trainer:653) INFO: 175epoch:train:298-324batch: iter_time=8.335e-05, forward_time=0.032, loss=0.960, loss_att=0.436, loss_ctc=1.484, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.023e-04, train_time=0.090 -[v016] 2022-01-31 08:40:25,413 (trainer:653) INFO: 175epoch:train:325-351batch: iter_time=7.654e-05, forward_time=0.032, loss=0.960, loss_att=0.435, loss_ctc=1.485, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.023e-04, train_time=0.089 -[v016] 2022-01-31 08:40:27,904 (trainer:653) INFO: 175epoch:train:352-378batch: iter_time=7.798e-05, forward_time=0.032, loss=0.976, loss_att=0.442, loss_ctc=1.509, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.023e-04, train_time=0.092 -[v016] 2022-01-31 08:40:30,469 (trainer:653) INFO: 175epoch:train:379-405batch: iter_time=7.805e-05, forward_time=0.033, loss=1.106, loss_att=0.460, loss_ctc=1.753, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.023e-04, train_time=0.095 -[v016] 2022-01-31 08:40:32,971 (trainer:653) INFO: 175epoch:train:406-432batch: iter_time=7.705e-05, forward_time=0.033, loss=1.015, loss_att=0.437, loss_ctc=1.593, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.023e-04, train_time=0.092 -[v016] 2022-01-31 08:40:35,590 (trainer:653) INFO: 175epoch:train:433-459batch: iter_time=7.767e-05, forward_time=0.034, loss=0.991, loss_att=0.371, loss_ctc=1.611, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.023e-04, train_time=0.097 -[v016] 2022-01-31 08:40:38,113 (trainer:653) INFO: 175epoch:train:460-486batch: iter_time=8.077e-05, forward_time=0.033, loss=0.964, loss_att=0.405, loss_ctc=1.523, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.022e-04, train_time=0.093 -[v016] 2022-01-31 08:40:40,586 (trainer:653) INFO: 175epoch:train:487-513batch: iter_time=7.900e-05, forward_time=0.032, loss=0.923, loss_att=0.438, loss_ctc=1.408, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.022e-04, train_time=0.091 -[v016] 2022-01-31 08:40:43,043 (trainer:653) INFO: 175epoch:train:514-540batch: iter_time=7.780e-05, forward_time=0.032, loss=1.094, loss_att=0.495, loss_ctc=1.692, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.022e-04, train_time=0.091 -[v016] 2022-01-31 08:41:16,878 (trainer:328) INFO: 175epoch results: [train] iter_time=4.050e-04, forward_time=0.033, loss=1.004, loss_att=0.437, loss_ctc=1.570, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.024e-04, train_time=0.093, time=50.98 seconds, total_count=95725, gpu_max_cached_mem_GB=5.824, [valid] loss=8.033, loss_att=6.626, loss_ctc=9.441, acc=0.904, cer=0.101, wer=0.403, cer_ctc=0.144, time=5.8 seconds, total_count=31150, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.27 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:41:19,650 (trainer:375) INFO: The best model has been updated: train.loss -[v016] 2022-01-31 08:41:19,662 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/166epoch.pth -[v016] 2022-01-31 08:41:19,662 (trainer:261) INFO: 176/200epoch started. Estimated time to finish: 44 minutes and 3.04 seconds -[v016] 2022-01-31 08:41:22,447 (trainer:653) INFO: 176epoch:train:1-27batch: iter_time=0.003, forward_time=0.035, loss=1.087, loss_att=0.393, loss_ctc=1.782, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.022e-04, train_time=0.103 -[v016] 2022-01-31 08:41:25,044 (trainer:653) INFO: 176epoch:train:28-54batch: iter_time=8.532e-05, forward_time=0.034, loss=1.085, loss_att=0.438, loss_ctc=1.732, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.022e-04, train_time=0.096 -[v016] 2022-01-31 08:41:27,520 (trainer:653) INFO: 176epoch:train:55-81batch: iter_time=8.403e-05, forward_time=0.033, loss=1.026, loss_att=0.463, loss_ctc=1.589, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.022e-04, train_time=0.091 -[v016] 2022-01-31 08:41:29,933 (trainer:653) INFO: 176epoch:train:82-108batch: iter_time=7.788e-05, forward_time=0.031, loss=0.941, loss_att=0.445, loss_ctc=1.437, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.022e-04, train_time=0.089 -[v016] 2022-01-31 08:41:32,469 (trainer:653) INFO: 176epoch:train:109-135batch: iter_time=7.580e-05, forward_time=0.033, loss=0.998, loss_att=0.423, loss_ctc=1.573, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.021e-04, train_time=0.094 -[v016] 2022-01-31 08:41:34,936 (trainer:653) INFO: 176epoch:train:136-162batch: iter_time=7.491e-05, forward_time=0.032, loss=0.833, loss_att=0.351, loss_ctc=1.315, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.021e-04, train_time=0.091 -[v016] 2022-01-31 08:41:37,469 (trainer:653) INFO: 176epoch:train:163-189batch: iter_time=7.446e-05, forward_time=0.033, loss=0.932, loss_att=0.444, loss_ctc=1.420, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.021e-04, train_time=0.094 -[v016] 2022-01-31 08:41:39,969 (trainer:653) INFO: 176epoch:train:190-216batch: iter_time=7.550e-05, forward_time=0.032, loss=1.062, loss_att=0.476, loss_ctc=1.648, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.021e-04, train_time=0.092 -[v016] 2022-01-31 08:41:42,469 (trainer:653) INFO: 176epoch:train:217-243batch: iter_time=7.827e-05, forward_time=0.032, loss=1.094, loss_att=0.452, loss_ctc=1.736, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.021e-04, train_time=0.092 -[v016] 2022-01-31 08:41:44,968 (trainer:653) INFO: 176epoch:train:244-270batch: iter_time=8.327e-05, forward_time=0.033, loss=1.074, loss_att=0.448, loss_ctc=1.700, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.021e-04, train_time=0.092 -[v016] 2022-01-31 08:41:47,470 (trainer:653) INFO: 176epoch:train:271-297batch: iter_time=0.002, forward_time=0.032, loss=1.163, loss_att=0.488, loss_ctc=1.838, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.021e-04, train_time=0.092 -[v016] 2022-01-31 08:41:49,953 (trainer:653) INFO: 176epoch:train:298-324batch: iter_time=7.692e-05, forward_time=0.032, loss=1.004, loss_att=0.402, loss_ctc=1.606, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.020e-04, train_time=0.092 -[v016] 2022-01-31 08:41:52,455 (trainer:653) INFO: 176epoch:train:325-351batch: iter_time=7.652e-05, forward_time=0.032, loss=0.954, loss_att=0.385, loss_ctc=1.523, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.020e-04, train_time=0.092 -[v016] 2022-01-31 08:41:54,862 (trainer:653) INFO: 176epoch:train:352-378batch: iter_time=7.601e-05, forward_time=0.031, loss=0.892, loss_att=0.409, loss_ctc=1.375, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.020e-04, train_time=0.089 -[v016] 2022-01-31 08:41:57,303 (trainer:653) INFO: 176epoch:train:379-405batch: iter_time=7.678e-05, forward_time=0.031, loss=0.976, loss_att=0.393, loss_ctc=1.559, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.020e-04, train_time=0.090 -[v016] 2022-01-31 08:41:59,950 (trainer:653) INFO: 176epoch:train:406-432batch: iter_time=0.006, forward_time=0.032, loss=1.039, loss_att=0.448, loss_ctc=1.629, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.020e-04, train_time=0.098 -[v016] 2022-01-31 08:42:02,348 (trainer:653) INFO: 176epoch:train:433-459batch: iter_time=7.479e-05, forward_time=0.031, loss=1.080, loss_att=0.572, loss_ctc=1.588, acc=0.969, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.020e-04, train_time=0.089 -[v016] 2022-01-31 08:42:04,840 (trainer:653) INFO: 176epoch:train:460-486batch: iter_time=7.612e-05, forward_time=0.032, loss=1.078, loss_att=0.466, loss_ctc=1.689, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.020e-04, train_time=0.092 -[v016] 2022-01-31 08:42:07,359 (trainer:653) INFO: 176epoch:train:487-513batch: iter_time=7.962e-05, forward_time=0.033, loss=1.002, loss_att=0.471, loss_ctc=1.532, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.019e-04, train_time=0.093 -[v016] 2022-01-31 08:42:09,790 (trainer:653) INFO: 176epoch:train:514-540batch: iter_time=9.594e-05, forward_time=0.031, loss=1.034, loss_att=0.465, loss_ctc=1.603, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.019e-04, train_time=0.090 -[v016] 2022-01-31 08:42:43,759 (trainer:328) INFO: 176epoch results: [train] iter_time=6.206e-04, forward_time=0.032, loss=1.018, loss_att=0.442, loss_ctc=1.593, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.021e-04, train_time=0.093, time=50.82 seconds, total_count=96272, gpu_max_cached_mem_GB=5.824, [valid] loss=7.925, loss_att=6.481, loss_ctc=9.368, acc=0.905, cer=0.098, wer=0.398, cer_ctc=0.144, time=5.69 seconds, total_count=31328, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.59 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:42:45,903 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 08:42:45,917 (trainer:261) INFO: 177/200epoch started. Estimated time to finish: 42 minutes and 14.33 seconds -[v016] 2022-01-31 08:42:48,667 (trainer:653) INFO: 177epoch:train:1-27batch: iter_time=0.006, forward_time=0.033, loss=1.094, loss_att=0.449, loss_ctc=1.739, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.019e-04, train_time=0.101 -[v016] 2022-01-31 08:42:51,222 (trainer:653) INFO: 177epoch:train:28-54batch: iter_time=8.185e-05, forward_time=0.033, loss=0.896, loss_att=0.353, loss_ctc=1.439, acc=0.986, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.019e-04, train_time=0.094 -[v016] 2022-01-31 08:42:53,827 (trainer:653) INFO: 177epoch:train:55-81batch: iter_time=0.003, forward_time=0.033, loss=0.948, loss_att=0.410, loss_ctc=1.486, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.019e-04, train_time=0.096 -[v016] 2022-01-31 08:42:56,233 (trainer:653) INFO: 177epoch:train:82-108batch: iter_time=7.557e-05, forward_time=0.031, loss=0.776, loss_att=0.366, loss_ctc=1.187, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.019e-04, train_time=0.089 -[v016] 2022-01-31 08:42:58,730 (trainer:653) INFO: 177epoch:train:109-135batch: iter_time=7.790e-05, forward_time=0.032, loss=0.819, loss_att=0.354, loss_ctc=1.285, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.019e-04, train_time=0.092 -[v016] 2022-01-31 08:43:01,213 (trainer:653) INFO: 177epoch:train:136-162batch: iter_time=7.827e-05, forward_time=0.032, loss=0.985, loss_att=0.385, loss_ctc=1.586, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.018e-04, train_time=0.092 -[v016] 2022-01-31 08:43:03,738 (trainer:653) INFO: 177epoch:train:163-189batch: iter_time=8.354e-05, forward_time=0.033, loss=1.029, loss_att=0.434, loss_ctc=1.624, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.018e-04, train_time=0.093 -[v016] 2022-01-31 08:43:06,261 (trainer:653) INFO: 177epoch:train:190-216batch: iter_time=8.194e-05, forward_time=0.033, loss=0.986, loss_att=0.407, loss_ctc=1.565, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.018e-04, train_time=0.093 -[v016] 2022-01-31 08:43:08,804 (trainer:653) INFO: 177epoch:train:217-243batch: iter_time=8.803e-05, forward_time=0.033, loss=0.892, loss_att=0.402, loss_ctc=1.381, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.018e-04, train_time=0.094 -[v016] 2022-01-31 08:43:11,386 (trainer:653) INFO: 177epoch:train:244-270batch: iter_time=1.091e-04, forward_time=0.034, loss=1.148, loss_att=0.433, loss_ctc=1.862, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.018e-04, train_time=0.095 -[v016] 2022-01-31 08:43:13,923 (trainer:653) INFO: 177epoch:train:271-297batch: iter_time=8.872e-05, forward_time=0.033, loss=1.046, loss_att=0.499, loss_ctc=1.593, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.018e-04, train_time=0.094 -[v016] 2022-01-31 08:43:16,497 (trainer:653) INFO: 177epoch:train:298-324batch: iter_time=8.364e-05, forward_time=0.034, loss=1.176, loss_att=0.504, loss_ctc=1.848, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.018e-04, train_time=0.095 -[v016] 2022-01-31 08:43:19,011 (trainer:653) INFO: 177epoch:train:325-351batch: iter_time=8.454e-05, forward_time=0.033, loss=1.070, loss_att=0.481, loss_ctc=1.660, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.017e-04, train_time=0.093 -[v016] 2022-01-31 08:43:21,488 (trainer:653) INFO: 177epoch:train:352-378batch: iter_time=8.398e-05, forward_time=0.032, loss=0.820, loss_att=0.392, loss_ctc=1.248, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.017e-04, train_time=0.091 -[v016] 2022-01-31 08:43:24,034 (trainer:653) INFO: 177epoch:train:379-405batch: iter_time=8.216e-05, forward_time=0.033, loss=0.861, loss_att=0.397, loss_ctc=1.325, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.017e-04, train_time=0.094 -[v016] 2022-01-31 08:43:26,766 (trainer:653) INFO: 177epoch:train:406-432batch: iter_time=0.008, forward_time=0.032, loss=1.004, loss_att=0.444, loss_ctc=1.564, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.017e-04, train_time=0.101 -[v016] 2022-01-31 08:43:29,294 (trainer:653) INFO: 177epoch:train:433-459batch: iter_time=7.788e-05, forward_time=0.033, loss=1.115, loss_att=0.481, loss_ctc=1.748, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.017e-04, train_time=0.093 -[v016] 2022-01-31 08:43:31,704 (trainer:653) INFO: 177epoch:train:460-486batch: iter_time=7.678e-05, forward_time=0.032, loss=0.818, loss_att=0.427, loss_ctc=1.208, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.017e-04, train_time=0.089 -[v016] 2022-01-31 08:43:34,148 (trainer:653) INFO: 177epoch:train:487-513batch: iter_time=7.733e-05, forward_time=0.032, loss=0.844, loss_att=0.372, loss_ctc=1.316, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.017e-04, train_time=0.090 -[v016] 2022-01-31 08:43:36,629 (trainer:653) INFO: 177epoch:train:514-540batch: iter_time=8.346e-05, forward_time=0.032, loss=0.985, loss_att=0.489, loss_ctc=1.481, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.016e-04, train_time=0.092 -[v016] 2022-01-31 08:44:10,379 (trainer:328) INFO: 177epoch results: [train] iter_time=8.797e-04, forward_time=0.033, loss=0.965, loss_att=0.423, loss_ctc=1.506, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.018e-04, train_time=0.094, time=51.41 seconds, total_count=96819, gpu_max_cached_mem_GB=5.824, [valid] loss=8.082, loss_att=6.577, loss_ctc=9.587, acc=0.903, cer=0.102, wer=0.408, cer_ctc=0.145, time=5.55 seconds, total_count=31506, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.51 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:44:12,517 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 08:44:12,550 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/167epoch.pth, exp/asr_train_asr_raw_en_word/176epoch.pth -[v016] 2022-01-31 08:44:12,550 (trainer:261) INFO: 178/200epoch started. Estimated time to finish: 40 minutes and 25.95 seconds -[v016] 2022-01-31 08:44:15,234 (trainer:653) INFO: 178epoch:train:1-27batch: iter_time=0.003, forward_time=0.033, loss=0.950, loss_att=0.351, loss_ctc=1.549, acc=0.985, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.016e-04, train_time=0.099 -[v016] 2022-01-31 08:44:17,661 (trainer:653) INFO: 178epoch:train:28-54batch: iter_time=7.764e-05, forward_time=0.031, loss=0.853, loss_att=0.368, loss_ctc=1.339, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.016e-04, train_time=0.090 -[v016] 2022-01-31 08:44:20,184 (trainer:653) INFO: 178epoch:train:55-81batch: iter_time=7.675e-05, forward_time=0.032, loss=0.883, loss_att=0.347, loss_ctc=1.418, acc=0.986, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.016e-04, train_time=0.093 -[v016] 2022-01-31 08:44:22,711 (trainer:653) INFO: 178epoch:train:82-108batch: iter_time=7.636e-05, forward_time=0.032, loss=0.824, loss_att=0.321, loss_ctc=1.327, acc=0.986, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.016e-04, train_time=0.093 -[v016] 2022-01-31 08:44:25,156 (trainer:653) INFO: 178epoch:train:109-135batch: iter_time=7.878e-05, forward_time=0.032, loss=0.995, loss_att=0.475, loss_ctc=1.515, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.016e-04, train_time=0.090 -[v016] 2022-01-31 08:44:27,734 (trainer:653) INFO: 178epoch:train:136-162batch: iter_time=0.007, forward_time=0.030, loss=0.935, loss_att=0.463, loss_ctc=1.407, acc=0.979, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.016e-04, train_time=0.095 -[v016] 2022-01-31 08:44:30,104 (trainer:653) INFO: 178epoch:train:163-189batch: iter_time=7.362e-05, forward_time=0.030, loss=0.841, loss_att=0.403, loss_ctc=1.280, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.015e-04, train_time=0.088 -[v016] 2022-01-31 08:44:32,562 (trainer:653) INFO: 178epoch:train:190-216batch: iter_time=7.481e-05, forward_time=0.032, loss=0.906, loss_att=0.401, loss_ctc=1.410, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.015e-04, train_time=0.091 -[v016] 2022-01-31 08:44:35,044 (trainer:653) INFO: 178epoch:train:217-243batch: iter_time=7.747e-05, forward_time=0.032, loss=1.011, loss_att=0.453, loss_ctc=1.568, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.015e-04, train_time=0.092 -[v016] 2022-01-31 08:44:37,483 (trainer:653) INFO: 178epoch:train:244-270batch: iter_time=7.580e-05, forward_time=0.031, loss=0.993, loss_att=0.406, loss_ctc=1.580, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.015e-04, train_time=0.090 -[v016] 2022-01-31 08:44:39,925 (trainer:653) INFO: 178epoch:train:271-297batch: iter_time=7.717e-05, forward_time=0.032, loss=0.937, loss_att=0.471, loss_ctc=1.404, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.015e-04, train_time=0.090 -[v016] 2022-01-31 08:44:42,444 (trainer:653) INFO: 178epoch:train:298-324batch: iter_time=7.854e-05, forward_time=0.033, loss=0.874, loss_att=0.404, loss_ctc=1.344, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.015e-04, train_time=0.093 -[v016] 2022-01-31 08:44:45,067 (trainer:653) INFO: 178epoch:train:325-351batch: iter_time=7.610e-05, forward_time=0.033, loss=1.207, loss_att=0.484, loss_ctc=1.930, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.015e-04, train_time=0.097 -[v016] 2022-01-31 08:44:47,647 (trainer:653) INFO: 178epoch:train:352-378batch: iter_time=7.901e-05, forward_time=0.033, loss=1.091, loss_att=0.421, loss_ctc=1.760, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.014e-04, train_time=0.095 -[v016] 2022-01-31 08:44:50,108 (trainer:653) INFO: 178epoch:train:379-405batch: iter_time=7.424e-05, forward_time=0.032, loss=1.037, loss_att=0.505, loss_ctc=1.568, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.014e-04, train_time=0.091 -[v016] 2022-01-31 08:44:52,555 (trainer:653) INFO: 178epoch:train:406-432batch: iter_time=7.459e-05, forward_time=0.031, loss=1.019, loss_att=0.506, loss_ctc=1.532, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.014e-04, train_time=0.090 -[v016] 2022-01-31 08:44:55,031 (trainer:653) INFO: 178epoch:train:433-459batch: iter_time=7.707e-05, forward_time=0.032, loss=0.993, loss_att=0.433, loss_ctc=1.554, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.014e-04, train_time=0.091 -[v016] 2022-01-31 08:44:57,542 (trainer:653) INFO: 178epoch:train:460-486batch: iter_time=8.444e-05, forward_time=0.032, loss=1.008, loss_att=0.400, loss_ctc=1.617, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.014e-04, train_time=0.093 -[v016] 2022-01-31 08:45:00,397 (trainer:653) INFO: 178epoch:train:487-513batch: iter_time=0.012, forward_time=0.033, loss=1.004, loss_att=0.441, loss_ctc=1.566, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.014e-04, train_time=0.106 -[v016] 2022-01-31 08:45:02,955 (trainer:653) INFO: 178epoch:train:514-540batch: iter_time=7.564e-05, forward_time=0.033, loss=1.073, loss_att=0.407, loss_ctc=1.739, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.014e-04, train_time=0.095 -[v016] 2022-01-31 08:45:37,033 (trainer:328) INFO: 178epoch results: [train] iter_time=0.001, forward_time=0.032, loss=0.968, loss_att=0.423, loss_ctc=1.513, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.015e-04, train_time=0.093, time=51.1 seconds, total_count=97366, gpu_max_cached_mem_GB=5.824, [valid] loss=8.190, loss_att=6.650, loss_ctc=9.730, acc=0.903, cer=0.103, wer=0.398, cer_ctc=0.150, time=5.92 seconds, total_count=31684, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.46 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:45:39,273 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 08:45:39,287 (trainer:261) INFO: 179/200epoch started. Estimated time to finish: 38 minutes and 37.87 seconds -[v016] 2022-01-31 08:45:41,945 (trainer:653) INFO: 179epoch:train:1-27batch: iter_time=0.003, forward_time=0.033, loss=0.987, loss_att=0.380, loss_ctc=1.593, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.013e-04, train_time=0.098 -[v016] 2022-01-31 08:45:44,431 (trainer:653) INFO: 179epoch:train:28-54batch: iter_time=8.337e-05, forward_time=0.032, loss=0.836, loss_att=0.292, loss_ctc=1.380, acc=0.987, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.013e-04, train_time=0.092 -[v016] 2022-01-31 08:45:46,897 (trainer:653) INFO: 179epoch:train:55-81batch: iter_time=7.643e-05, forward_time=0.032, loss=0.871, loss_att=0.418, loss_ctc=1.325, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.013e-04, train_time=0.091 -[v016] 2022-01-31 08:45:49,321 (trainer:653) INFO: 179epoch:train:82-108batch: iter_time=7.434e-05, forward_time=0.031, loss=1.054, loss_att=0.439, loss_ctc=1.669, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.013e-04, train_time=0.090 -[v016] 2022-01-31 08:45:51,829 (trainer:653) INFO: 179epoch:train:109-135batch: iter_time=7.706e-05, forward_time=0.032, loss=0.943, loss_att=0.375, loss_ctc=1.512, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.013e-04, train_time=0.093 -[v016] 2022-01-31 08:45:54,302 (trainer:653) INFO: 179epoch:train:136-162batch: iter_time=7.606e-05, forward_time=0.032, loss=0.854, loss_att=0.380, loss_ctc=1.329, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.013e-04, train_time=0.091 -[v016] 2022-01-31 08:45:56,772 (trainer:653) INFO: 179epoch:train:163-189batch: iter_time=7.598e-05, forward_time=0.031, loss=1.016, loss_att=0.388, loss_ctc=1.644, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.013e-04, train_time=0.091 -[v016] 2022-01-31 08:45:59,268 (trainer:653) INFO: 179epoch:train:190-216batch: iter_time=7.993e-05, forward_time=0.031, loss=0.948, loss_att=0.413, loss_ctc=1.483, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.012e-04, train_time=0.092 -[v016] 2022-01-31 08:46:01,998 (trainer:653) INFO: 179epoch:train:217-243batch: iter_time=0.008, forward_time=0.033, loss=0.999, loss_att=0.465, loss_ctc=1.532, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.012e-04, train_time=0.101 -[v016] 2022-01-31 08:46:04,448 (trainer:653) INFO: 179epoch:train:244-270batch: iter_time=7.808e-05, forward_time=0.032, loss=0.938, loss_att=0.450, loss_ctc=1.427, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.012e-04, train_time=0.091 -[v016] 2022-01-31 08:46:06,977 (trainer:653) INFO: 179epoch:train:271-297batch: iter_time=8.173e-05, forward_time=0.033, loss=1.239, loss_att=0.545, loss_ctc=1.933, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.012e-04, train_time=0.093 -[v016] 2022-01-31 08:46:09,602 (trainer:653) INFO: 179epoch:train:298-324batch: iter_time=0.005, forward_time=0.033, loss=0.821, loss_att=0.357, loss_ctc=1.284, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.012e-04, train_time=0.097 -[v016] 2022-01-31 08:46:12,146 (trainer:653) INFO: 179epoch:train:325-351batch: iter_time=7.882e-05, forward_time=0.033, loss=0.944, loss_att=0.404, loss_ctc=1.483, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.012e-04, train_time=0.094 -[v016] 2022-01-31 08:46:14,621 (trainer:653) INFO: 179epoch:train:352-378batch: iter_time=7.865e-05, forward_time=0.032, loss=0.936, loss_att=0.396, loss_ctc=1.477, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.012e-04, train_time=0.091 -[v016] 2022-01-31 08:46:17,094 (trainer:653) INFO: 179epoch:train:379-405batch: iter_time=9.014e-05, forward_time=0.033, loss=1.224, loss_att=0.535, loss_ctc=1.914, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.011e-04, train_time=0.091 -[v016] 2022-01-31 08:46:19,620 (trainer:653) INFO: 179epoch:train:406-432batch: iter_time=7.784e-05, forward_time=0.033, loss=1.082, loss_att=0.404, loss_ctc=1.759, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.011e-04, train_time=0.093 -[v016] 2022-01-31 08:46:22,199 (trainer:653) INFO: 179epoch:train:433-459batch: iter_time=7.786e-05, forward_time=0.034, loss=0.988, loss_att=0.334, loss_ctc=1.641, acc=0.986, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.011e-04, train_time=0.095 -[v016] 2022-01-31 08:46:24,749 (trainer:653) INFO: 179epoch:train:460-486batch: iter_time=7.931e-05, forward_time=0.033, loss=0.980, loss_att=0.403, loss_ctc=1.557, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.011e-04, train_time=0.094 -[v016] 2022-01-31 08:46:27,199 (trainer:653) INFO: 179epoch:train:487-513batch: iter_time=7.763e-05, forward_time=0.032, loss=1.022, loss_att=0.497, loss_ctc=1.548, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.011e-04, train_time=0.091 -[v016] 2022-01-31 08:46:29,637 (trainer:653) INFO: 179epoch:train:514-540batch: iter_time=7.588e-05, forward_time=0.032, loss=0.976, loss_att=0.433, loss_ctc=1.519, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.011e-04, train_time=0.090 -[v016] 2022-01-31 08:47:05,964 (trainer:328) INFO: 179epoch results: [train] iter_time=8.401e-04, forward_time=0.032, loss=0.989, loss_att=0.417, loss_ctc=1.560, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.012e-04, train_time=0.093, time=51.08 seconds, total_count=97913, gpu_max_cached_mem_GB=5.824, [valid] loss=8.068, loss_att=6.588, loss_ctc=9.549, acc=0.905, cer=0.099, wer=0.397, cer_ctc=0.143, time=6.09 seconds, total_count=31862, gpu_max_cached_mem_GB=5.824, [att_plot] time=29.42 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:47:08,303 (trainer:375) INFO: The best model has been updated: train.acc -[v016] 2022-01-31 08:47:08,357 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/173epoch.pth -[v016] 2022-01-31 08:47:08,357 (trainer:261) INFO: 180/200epoch started. Estimated time to finish: 36 minutes and 50.36 seconds -[v016] 2022-01-31 08:47:12,132 (trainer:653) INFO: 180epoch:train:1-27batch: iter_time=0.005, forward_time=0.048, loss=1.030, loss_att=0.486, loss_ctc=1.574, acc=0.975, backward_time=0.041, optim_step_time=0.022, optim0_lr0=1.011e-04, train_time=0.138 -[v016] 2022-01-31 08:47:14,550 (trainer:653) INFO: 180epoch:train:28-54batch: iter_time=0.001, forward_time=0.030, loss=0.835, loss_att=0.420, loss_ctc=1.250, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.010e-04, train_time=0.089 -[v016] 2022-01-31 08:47:17,167 (trainer:653) INFO: 180epoch:train:55-81batch: iter_time=0.003, forward_time=0.032, loss=1.036, loss_att=0.421, loss_ctc=1.651, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.010e-04, train_time=0.097 -[v016] 2022-01-31 08:47:19,763 (trainer:653) INFO: 180epoch:train:82-108batch: iter_time=8.192e-05, forward_time=0.033, loss=1.381, loss_att=0.476, loss_ctc=2.285, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.010e-04, train_time=0.096 -[v016] 2022-01-31 08:47:22,248 (trainer:653) INFO: 180epoch:train:109-135batch: iter_time=8.481e-05, forward_time=0.032, loss=0.938, loss_att=0.410, loss_ctc=1.466, acc=0.977, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.010e-04, train_time=0.092 -[v016] 2022-01-31 08:47:24,893 (trainer:653) INFO: 180epoch:train:136-162batch: iter_time=1.060e-04, forward_time=0.034, loss=1.058, loss_att=0.424, loss_ctc=1.692, acc=0.981, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.010e-04, train_time=0.098 -[v016] 2022-01-31 08:47:27,540 (trainer:653) INFO: 180epoch:train:163-189batch: iter_time=7.735e-04, forward_time=0.033, loss=0.864, loss_att=0.370, loss_ctc=1.359, acc=0.982, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.010e-04, train_time=0.098 -[v016] 2022-01-31 08:47:30,164 (trainer:653) INFO: 180epoch:train:190-216batch: iter_time=1.117e-04, forward_time=0.033, loss=1.089, loss_att=0.450, loss_ctc=1.728, acc=0.977, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.010e-04, train_time=0.097 -[v016] 2022-01-31 08:47:34,704 (trainer:653) INFO: 180epoch:train:217-243batch: iter_time=1.021e-04, forward_time=0.076, loss=1.120, loss_att=0.475, loss_ctc=1.766, acc=0.976, backward_time=0.022, optim_step_time=0.031, optim0_lr0=1.009e-04, train_time=0.168 -[v016] 2022-01-31 08:47:37,257 (trainer:653) INFO: 180epoch:train:244-270batch: iter_time=8.552e-05, forward_time=0.032, loss=0.860, loss_att=0.379, loss_ctc=1.341, acc=0.982, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.009e-04, train_time=0.094 -[v016] 2022-01-31 08:47:40,867 (trainer:653) INFO: 180epoch:train:271-297batch: iter_time=0.019, forward_time=0.053, loss=0.974, loss_att=0.436, loss_ctc=1.511, acc=0.980, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.009e-04, train_time=0.134 -[v016] 2022-01-31 08:47:43,374 (trainer:653) INFO: 180epoch:train:298-324batch: iter_time=8.271e-05, forward_time=0.031, loss=0.970, loss_att=0.445, loss_ctc=1.495, acc=0.974, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.009e-04, train_time=0.093 -[v016] 2022-01-31 08:47:45,996 (trainer:653) INFO: 180epoch:train:325-351batch: iter_time=0.002, forward_time=0.032, loss=0.962, loss_att=0.414, loss_ctc=1.510, acc=0.981, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.009e-04, train_time=0.097 -[v016] 2022-01-31 08:47:48,894 (trainer:653) INFO: 180epoch:train:352-378batch: iter_time=0.002, forward_time=0.032, loss=0.859, loss_att=0.430, loss_ctc=1.288, acc=0.977, backward_time=0.035, optim_step_time=0.021, optim0_lr0=1.009e-04, train_time=0.107 -[v016] 2022-01-31 08:47:51,409 (trainer:653) INFO: 180epoch:train:379-405batch: iter_time=8.177e-05, forward_time=0.032, loss=0.795, loss_att=0.367, loss_ctc=1.223, acc=0.980, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.009e-04, train_time=0.093 -[v016] 2022-01-31 08:47:54,010 (trainer:653) INFO: 180epoch:train:406-432batch: iter_time=0.004, forward_time=0.032, loss=0.957, loss_att=0.411, loss_ctc=1.502, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.008e-04, train_time=0.096 -[v016] 2022-01-31 08:47:56,489 (trainer:653) INFO: 180epoch:train:433-459batch: iter_time=4.601e-04, forward_time=0.031, loss=0.886, loss_att=0.355, loss_ctc=1.417, acc=0.986, backward_time=0.021, optim_step_time=0.021, optim0_lr0=1.008e-04, train_time=0.092 -[v016] 2022-01-31 08:47:59,130 (trainer:653) INFO: 180epoch:train:460-486batch: iter_time=9.554e-05, forward_time=0.033, loss=0.894, loss_att=0.358, loss_ctc=1.430, acc=0.984, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.008e-04, train_time=0.098 -[v016] 2022-01-31 08:48:02,406 (trainer:653) INFO: 180epoch:train:487-513batch: iter_time=0.026, forward_time=0.033, loss=0.975, loss_att=0.439, loss_ctc=1.511, acc=0.980, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.008e-04, train_time=0.121 -[v016] 2022-01-31 08:48:05,492 (trainer:653) INFO: 180epoch:train:514-540batch: iter_time=0.020, forward_time=0.032, loss=1.016, loss_att=0.445, loss_ctc=1.586, acc=0.979, backward_time=0.022, optim_step_time=0.021, optim0_lr0=1.008e-04, train_time=0.114 -[v016] 2022-01-31 08:48:56,154 (trainer:328) INFO: 180epoch results: [train] iter_time=0.004, forward_time=0.036, loss=0.976, loss_att=0.421, loss_ctc=1.530, acc=0.980, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.009e-04, train_time=0.105, time=57.89 seconds, total_count=98460, gpu_max_cached_mem_GB=5.824, [valid] loss=8.155, loss_att=6.654, loss_ctc=9.655, acc=0.904, cer=0.102, wer=0.400, cer_ctc=0.148, time=11.55 seconds, total_count=32040, gpu_max_cached_mem_GB=5.824, [att_plot] time=38.22 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:48:59,788 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 08:48:59,855 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/169epoch.pth -[v016] 2022-01-31 08:48:59,865 (trainer:261) INFO: 181/200epoch started. Estimated time to finish: 35 minutes and 5.88 seconds -[v016] 2022-01-31 08:49:06,600 (trainer:653) INFO: 181epoch:train:1-27batch: iter_time=0.032, forward_time=0.078, loss=0.929, loss_att=0.387, loss_ctc=1.471, acc=0.978, backward_time=0.038, optim_step_time=0.043, optim0_lr0=1.008e-04, train_time=0.244 -[v016] 2022-01-31 08:49:12,192 (trainer:653) INFO: 181epoch:train:28-54batch: iter_time=0.075, forward_time=0.042, loss=1.003, loss_att=0.372, loss_ctc=1.633, acc=0.983, backward_time=0.025, optim_step_time=0.029, optim0_lr0=1.008e-04, train_time=0.207 -[v016] 2022-01-31 08:49:17,088 (trainer:653) INFO: 181epoch:train:55-81batch: iter_time=0.042, forward_time=0.045, loss=1.022, loss_att=0.398, loss_ctc=1.646, acc=0.982, backward_time=0.025, optim_step_time=0.028, optim0_lr0=1.007e-04, train_time=0.176 -[v016] 2022-01-31 08:49:21,122 (trainer:653) INFO: 181epoch:train:82-108batch: iter_time=0.009, forward_time=0.042, loss=0.948, loss_att=0.448, loss_ctc=1.447, acc=0.977, backward_time=0.029, optim_step_time=0.036, optim0_lr0=1.007e-04, train_time=0.149 -[v016] 2022-01-31 08:49:25,508 (trainer:653) INFO: 181epoch:train:109-135batch: iter_time=0.029, forward_time=0.044, loss=0.918, loss_att=0.397, loss_ctc=1.439, acc=0.982, backward_time=0.026, optim_step_time=0.032, optim0_lr0=1.007e-04, train_time=0.162 -[v016] 2022-01-31 08:49:33,022 (trainer:653) INFO: 181epoch:train:136-162batch: iter_time=0.143, forward_time=0.044, loss=0.836, loss_att=0.308, loss_ctc=1.364, acc=0.986, backward_time=0.024, optim_step_time=0.029, optim0_lr0=1.007e-04, train_time=0.274 -[v016] 2022-01-31 08:49:47,096 (trainer:653) INFO: 181epoch:train:163-189batch: iter_time=0.245, forward_time=0.163, loss=0.997, loss_att=0.423, loss_ctc=1.571, acc=0.980, backward_time=0.031, optim_step_time=0.032, optim0_lr0=1.007e-04, train_time=0.524 -[v016] 2022-01-31 08:49:59,404 (trainer:653) INFO: 181epoch:train:190-216batch: iter_time=0.338, forward_time=0.040, loss=0.905, loss_att=0.392, loss_ctc=1.418, acc=0.981, backward_time=0.025, optim_step_time=0.026, optim0_lr0=1.007e-04, train_time=0.456 -[v016] 2022-01-31 08:50:08,544 (trainer:653) INFO: 181epoch:train:217-243batch: iter_time=0.230, forward_time=0.038, loss=0.958, loss_att=0.362, loss_ctc=1.553, acc=0.984, backward_time=0.023, optim_step_time=0.024, optim0_lr0=1.007e-04, train_time=0.338 -[v016] 2022-01-31 08:50:21,981 (trainer:653) INFO: 181epoch:train:244-270batch: iter_time=0.352, forward_time=0.057, loss=0.904, loss_att=0.405, loss_ctc=1.403, acc=0.978, backward_time=0.029, optim_step_time=0.030, optim0_lr0=1.006e-04, train_time=0.497 -[v016] 2022-01-31 08:50:32,320 (trainer:653) INFO: 181epoch:train:271-297batch: iter_time=0.280, forward_time=0.035, loss=0.928, loss_att=0.382, loss_ctc=1.475, acc=0.980, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.006e-04, train_time=0.383 -[v016] 2022-01-31 08:50:42,141 (trainer:653) INFO: 181epoch:train:298-324batch: iter_time=0.262, forward_time=0.035, loss=0.982, loss_att=0.404, loss_ctc=1.560, acc=0.982, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.006e-04, train_time=0.364 -[v016] 2022-01-31 08:50:53,057 (trainer:653) INFO: 181epoch:train:325-351batch: iter_time=0.290, forward_time=0.044, loss=1.097, loss_att=0.449, loss_ctc=1.744, acc=0.978, backward_time=0.023, optim_step_time=0.024, optim0_lr0=1.006e-04, train_time=0.404 -[v016] 2022-01-31 08:51:07,579 (trainer:653) INFO: 181epoch:train:352-378batch: iter_time=0.406, forward_time=0.048, loss=0.800, loss_att=0.385, loss_ctc=1.216, acc=0.982, backward_time=0.026, optim_step_time=0.029, optim0_lr0=1.006e-04, train_time=0.537 -[v016] 2022-01-31 08:51:22,560 (trainer:653) INFO: 181epoch:train:379-405batch: iter_time=0.418, forward_time=0.046, loss=1.050, loss_att=0.433, loss_ctc=1.667, acc=0.980, backward_time=0.026, optim_step_time=0.031, optim0_lr0=1.006e-04, train_time=0.553 -[v016] 2022-01-31 08:51:39,687 (trainer:653) INFO: 181epoch:train:406-432batch: iter_time=0.327, forward_time=0.204, loss=1.062, loss_att=0.371, loss_ctc=1.754, acc=0.982, backward_time=0.033, optim_step_time=0.031, optim0_lr0=1.006e-04, train_time=0.635 -[v016] 2022-01-31 08:51:53,514 (trainer:653) INFO: 181epoch:train:433-459batch: iter_time=0.309, forward_time=0.083, loss=0.926, loss_att=0.484, loss_ctc=1.368, acc=0.976, backward_time=0.028, optim_step_time=0.029, optim0_lr0=1.006e-04, train_time=0.511 -[v016] 2022-01-31 08:52:10,977 (trainer:653) INFO: 181epoch:train:460-486batch: iter_time=0.526, forward_time=0.041, loss=1.066, loss_att=0.444, loss_ctc=1.688, acc=0.980, backward_time=0.024, optim_step_time=0.027, optim0_lr0=1.005e-04, train_time=0.647 -[v016] 2022-01-31 08:52:22,710 (trainer:653) INFO: 181epoch:train:487-513batch: iter_time=0.321, forward_time=0.036, loss=1.006, loss_att=0.429, loss_ctc=1.584, acc=0.980, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.005e-04, train_time=0.434 -[v016] 2022-01-31 08:52:36,013 (trainer:653) INFO: 181epoch:train:514-540batch: iter_time=0.389, forward_time=0.035, loss=1.257, loss_att=0.552, loss_ctc=1.962, acc=0.974, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.005e-04, train_time=0.493 -[v016] 2022-01-31 08:54:02,231 (trainer:328) INFO: 181epoch results: [train] iter_time=0.250, forward_time=0.060, loss=0.976, loss_att=0.411, loss_ctc=1.541, acc=0.980, backward_time=0.026, optim_step_time=0.028, optim0_lr0=1.006e-04, train_time=0.398, time=3 minutes and 38.37 seconds, total_count=99007, gpu_max_cached_mem_GB=5.824, [valid] loss=7.976, loss_att=6.634, loss_ctc=9.319, acc=0.906, cer=0.098, wer=0.393, cer_ctc=0.139, time=49.93 seconds, total_count=32218, gpu_max_cached_mem_GB=5.824, [att_plot] time=33.99 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:54:04,965 (trainer:375) INFO: The best model has been updated: train.acc -[v016] 2022-01-31 08:54:04,979 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/172epoch.pth, exp/asr_train_asr_raw_en_word/175epoch.pth -[v016] 2022-01-31 08:54:04,979 (trainer:261) INFO: 182/200epoch started. Estimated time to finish: 33 minutes and 44.17 seconds -[v016] 2022-01-31 08:54:18,279 (trainer:653) INFO: 182epoch:train:1-27batch: iter_time=0.379, forward_time=0.036, loss=0.950, loss_att=0.422, loss_ctc=1.479, acc=0.980, backward_time=0.025, optim_step_time=0.023, optim0_lr0=1.005e-04, train_time=0.486 -[v016] 2022-01-31 08:54:27,566 (trainer:653) INFO: 182epoch:train:28-54batch: iter_time=0.243, forward_time=0.034, loss=0.840, loss_att=0.349, loss_ctc=1.331, acc=0.983, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.005e-04, train_time=0.344 -[v016] 2022-01-31 08:54:38,207 (trainer:653) INFO: 182epoch:train:55-81batch: iter_time=0.295, forward_time=0.034, loss=0.821, loss_att=0.361, loss_ctc=1.280, acc=0.981, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.005e-04, train_time=0.394 -[v016] 2022-01-31 08:54:53,897 (trainer:653) INFO: 182epoch:train:82-108batch: iter_time=0.474, forward_time=0.037, loss=0.994, loss_att=0.412, loss_ctc=1.577, acc=0.980, backward_time=0.023, optim_step_time=0.025, optim0_lr0=1.005e-04, train_time=0.581 -[v016] 2022-01-31 08:55:07,069 (trainer:653) INFO: 182epoch:train:109-135batch: iter_time=0.380, forward_time=0.036, loss=0.878, loss_att=0.398, loss_ctc=1.358, acc=0.979, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.004e-04, train_time=0.486 -[v016] 2022-01-31 08:55:15,684 (trainer:653) INFO: 182epoch:train:136-162batch: iter_time=0.218, forward_time=0.035, loss=0.923, loss_att=0.418, loss_ctc=1.428, acc=0.977, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.004e-04, train_time=0.319 -[v016] 2022-01-31 08:55:27,213 (trainer:653) INFO: 182epoch:train:163-189batch: iter_time=0.315, forward_time=0.035, loss=0.786, loss_att=0.347, loss_ctc=1.226, acc=0.983, backward_time=0.025, optim_step_time=0.028, optim0_lr0=1.004e-04, train_time=0.427 -[v016] 2022-01-31 08:55:50,592 (trainer:653) INFO: 182epoch:train:190-216batch: iter_time=0.494, forward_time=0.211, loss=0.982, loss_att=0.446, loss_ctc=1.519, acc=0.980, backward_time=0.039, optim_step_time=0.029, optim0_lr0=1.004e-04, train_time=0.856 -[v016] 2022-01-31 08:56:05,188 (trainer:653) INFO: 182epoch:train:217-243batch: iter_time=0.415, forward_time=0.047, loss=0.970, loss_att=0.351, loss_ctc=1.589, acc=0.984, backward_time=0.024, optim_step_time=0.025, optim0_lr0=1.004e-04, train_time=0.550 -[v016] 2022-01-31 08:56:15,258 (trainer:653) INFO: 182epoch:train:244-270batch: iter_time=0.273, forward_time=0.034, loss=0.941, loss_att=0.406, loss_ctc=1.477, acc=0.981, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.004e-04, train_time=0.373 -[v016] 2022-01-31 08:56:25,846 (trainer:653) INFO: 182epoch:train:271-297batch: iter_time=0.295, forward_time=0.033, loss=0.822, loss_att=0.333, loss_ctc=1.311, acc=0.985, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.004e-04, train_time=0.392 -[v016] 2022-01-31 08:56:35,860 (trainer:653) INFO: 182epoch:train:298-324batch: iter_time=0.269, forward_time=0.035, loss=1.075, loss_att=0.426, loss_ctc=1.723, acc=0.979, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.003e-04, train_time=0.371 -[v016] 2022-01-31 08:56:43,887 (trainer:653) INFO: 182epoch:train:325-351batch: iter_time=0.201, forward_time=0.033, loss=0.921, loss_att=0.314, loss_ctc=1.528, acc=0.985, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.003e-04, train_time=0.297 -[v016] 2022-01-31 08:56:58,802 (trainer:653) INFO: 182epoch:train:352-378batch: iter_time=0.453, forward_time=0.034, loss=0.972, loss_att=0.443, loss_ctc=1.502, acc=0.978, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.003e-04, train_time=0.552 -[v016] 2022-01-31 08:57:09,389 (trainer:653) INFO: 182epoch:train:379-405batch: iter_time=0.293, forward_time=0.034, loss=0.954, loss_att=0.404, loss_ctc=1.505, acc=0.979, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.003e-04, train_time=0.392 -[v016] 2022-01-31 08:57:20,527 (trainer:653) INFO: 182epoch:train:406-432batch: iter_time=0.311, forward_time=0.035, loss=1.145, loss_att=0.496, loss_ctc=1.794, acc=0.980, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.003e-04, train_time=0.412 -[v016] 2022-01-31 08:57:30,706 (trainer:653) INFO: 182epoch:train:433-459batch: iter_time=0.279, forward_time=0.034, loss=0.943, loss_att=0.370, loss_ctc=1.516, acc=0.983, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.003e-04, train_time=0.377 -[v016] 2022-01-31 08:57:39,325 (trainer:653) INFO: 182epoch:train:460-486batch: iter_time=0.222, forward_time=0.033, loss=1.070, loss_att=0.455, loss_ctc=1.686, acc=0.980, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.003e-04, train_time=0.319 -[v016] 2022-01-31 08:57:49,824 (trainer:653) INFO: 182epoch:train:487-513batch: iter_time=0.286, forward_time=0.036, loss=1.203, loss_att=0.490, loss_ctc=1.915, acc=0.979, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.002e-04, train_time=0.389 -[v016] 2022-01-31 08:58:00,283 (trainer:653) INFO: 182epoch:train:514-540batch: iter_time=0.291, forward_time=0.033, loss=1.051, loss_att=0.504, loss_ctc=1.598, acc=0.973, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.002e-04, train_time=0.387 -[v016] 2022-01-31 08:59:23,580 (trainer:328) INFO: 182epoch results: [train] iter_time=0.318, forward_time=0.044, loss=0.956, loss_att=0.405, loss_ctc=1.507, acc=0.981, backward_time=0.024, optim_step_time=0.024, optim0_lr0=1.004e-04, train_time=0.433, time=3 minutes and 57.29 seconds, total_count=99554, gpu_max_cached_mem_GB=5.824, [valid] loss=8.093, loss_att=6.635, loss_ctc=9.551, acc=0.905, cer=0.099, wer=0.401, cer_ctc=0.146, time=48.72 seconds, total_count=32396, gpu_max_cached_mem_GB=5.824, [att_plot] time=32.4 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 08:59:26,246 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 08:59:26,261 (trainer:261) INFO: 183/200epoch started. Estimated time to finish: 32 minutes and 21.5 seconds -[v016] 2022-01-31 08:59:29,964 (trainer:653) INFO: 183epoch:train:1-27batch: iter_time=0.032, forward_time=0.032, loss=1.046, loss_att=0.387, loss_ctc=1.704, acc=0.982, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.002e-04, train_time=0.128 -[v016] 2022-01-31 08:59:33,356 (trainer:653) INFO: 183epoch:train:28-54batch: iter_time=0.029, forward_time=0.033, loss=0.845, loss_att=0.365, loss_ctc=1.326, acc=0.983, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.002e-04, train_time=0.125 -[v016] 2022-01-31 08:59:40,818 (trainer:653) INFO: 183epoch:train:55-81batch: iter_time=0.171, forward_time=0.036, loss=1.151, loss_att=0.472, loss_ctc=1.831, acc=0.977, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.002e-04, train_time=0.276 -[v016] 2022-01-31 08:59:45,987 (trainer:653) INFO: 183epoch:train:82-108batch: iter_time=0.091, forward_time=0.035, loss=0.883, loss_att=0.376, loss_ctc=1.390, acc=0.979, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.002e-04, train_time=0.191 -[v016] 2022-01-31 08:59:51,805 (trainer:653) INFO: 183epoch:train:109-135batch: iter_time=0.120, forward_time=0.033, loss=1.011, loss_att=0.439, loss_ctc=1.584, acc=0.982, backward_time=0.022, optim_step_time=0.022, optim0_lr0=1.002e-04, train_time=0.215 -[v016] 2022-01-31 08:59:59,259 (trainer:653) INFO: 183epoch:train:136-162batch: iter_time=0.084, forward_time=0.114, loss=1.021, loss_att=0.419, loss_ctc=1.622, acc=0.980, backward_time=0.027, optim_step_time=0.025, optim0_lr0=1.001e-04, train_time=0.276 -[v016] 2022-01-31 09:00:03,771 (trainer:653) INFO: 183epoch:train:163-189batch: iter_time=0.068, forward_time=0.034, loss=1.049, loss_att=0.400, loss_ctc=1.698, acc=0.981, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.001e-04, train_time=0.167 -[v016] 2022-01-31 09:00:08,459 (trainer:653) INFO: 183epoch:train:190-216batch: iter_time=0.074, forward_time=0.034, loss=0.832, loss_att=0.326, loss_ctc=1.339, acc=0.982, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.001e-04, train_time=0.173 -[v016] 2022-01-31 09:00:13,932 (trainer:653) INFO: 183epoch:train:217-243batch: iter_time=0.104, forward_time=0.034, loss=0.931, loss_att=0.385, loss_ctc=1.478, acc=0.982, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.001e-04, train_time=0.202 -[v016] 2022-01-31 09:00:17,345 (trainer:653) INFO: 183epoch:train:244-270batch: iter_time=0.029, forward_time=0.034, loss=0.870, loss_att=0.352, loss_ctc=1.388, acc=0.984, backward_time=0.023, optim_step_time=0.022, optim0_lr0=1.001e-04, train_time=0.126 -[v016] 2022-01-31 09:00:20,975 (trainer:653) INFO: 183epoch:train:271-297batch: iter_time=0.041, forward_time=0.032, loss=1.034, loss_att=0.429, loss_ctc=1.638, acc=0.980, backward_time=0.021, optim_step_time=0.022, optim0_lr0=1.001e-04, train_time=0.134 -[v016] 2022-01-31 09:00:29,750 (trainer:653) INFO: 183epoch:train:298-324batch: iter_time=0.132, forward_time=0.099, loss=0.986, loss_att=0.437, loss_ctc=1.536, acc=0.977, backward_time=0.029, optim_step_time=0.043, optim0_lr0=1.001e-04, train_time=0.325 -[v016] 2022-01-31 09:00:34,814 (trainer:653) INFO: 183epoch:train:325-351batch: iter_time=0.083, forward_time=0.038, loss=1.106, loss_att=0.517, loss_ctc=1.695, acc=0.976, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.001e-04, train_time=0.187 -[v016] 2022-01-31 09:00:39,065 (trainer:653) INFO: 183epoch:train:352-378batch: iter_time=0.056, forward_time=0.035, loss=1.085, loss_att=0.395, loss_ctc=1.775, acc=0.983, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.000e-04, train_time=0.157 -[v016] 2022-01-31 09:00:42,024 (trainer:653) INFO: 183epoch:train:379-405batch: iter_time=0.008, forward_time=0.034, loss=0.915, loss_att=0.446, loss_ctc=1.384, acc=0.973, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.000e-04, train_time=0.109 -[v016] 2022-01-31 09:00:45,362 (trainer:653) INFO: 183epoch:train:406-432batch: iter_time=0.024, forward_time=0.033, loss=0.978, loss_att=0.449, loss_ctc=1.506, acc=0.974, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.000e-04, train_time=0.123 -[v016] 2022-01-31 09:00:49,778 (trainer:653) INFO: 183epoch:train:433-459batch: iter_time=0.062, forward_time=0.035, loss=1.023, loss_att=0.397, loss_ctc=1.648, acc=0.982, backward_time=0.024, optim_step_time=0.023, optim0_lr0=1.000e-04, train_time=0.163 -[v016] 2022-01-31 09:00:54,434 (trainer:653) INFO: 183epoch:train:460-486batch: iter_time=0.077, forward_time=0.032, loss=0.762, loss_att=0.337, loss_ctc=1.186, acc=0.982, backward_time=0.023, optim_step_time=0.022, optim0_lr0=9.999e-05, train_time=0.172 -[v016] 2022-01-31 09:00:57,533 (trainer:653) INFO: 183epoch:train:487-513batch: iter_time=0.021, forward_time=0.032, loss=1.093, loss_att=0.508, loss_ctc=1.678, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.997e-05, train_time=0.115 -[v016] 2022-01-31 09:01:00,470 (trainer:653) INFO: 183epoch:train:514-540batch: iter_time=0.016, forward_time=0.032, loss=1.019, loss_att=0.398, loss_ctc=1.640, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.996e-05, train_time=0.109 -[v016] 2022-01-31 09:01:36,284 (trainer:328) INFO: 183epoch results: [train] iter_time=0.065, forward_time=0.041, loss=0.978, loss_att=0.410, loss_ctc=1.545, acc=0.980, backward_time=0.023, optim_step_time=0.023, optim0_lr0=1.001e-04, train_time=0.173, time=1 minute and 34.83 seconds, total_count=100101, gpu_max_cached_mem_GB=5.824, [valid] loss=8.060, loss_att=6.610, loss_ctc=9.509, acc=0.904, cer=0.101, wer=0.404, cer_ctc=0.146, time=7.3 seconds, total_count=32574, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.81 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 09:01:38,227 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 09:01:38,240 (trainer:261) INFO: 184/200epoch started. Estimated time to finish: 30 minutes and 36.15 seconds -[v016] 2022-01-31 09:01:40,963 (trainer:653) INFO: 184epoch:train:1-27batch: iter_time=0.007, forward_time=0.032, loss=1.119, loss_att=0.475, loss_ctc=1.763, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.994e-05, train_time=0.100 -[v016] 2022-01-31 09:01:43,398 (trainer:653) INFO: 184epoch:train:28-54batch: iter_time=8.234e-05, forward_time=0.031, loss=1.075, loss_att=0.451, loss_ctc=1.700, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.993e-05, train_time=0.090 -[v016] 2022-01-31 09:01:46,030 (trainer:653) INFO: 184epoch:train:55-81batch: iter_time=0.002, forward_time=0.033, loss=1.075, loss_att=0.463, loss_ctc=1.687, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.992e-05, train_time=0.097 -[v016] 2022-01-31 09:01:48,829 (trainer:653) INFO: 184epoch:train:82-108batch: iter_time=0.011, forward_time=0.032, loss=0.836, loss_att=0.294, loss_ctc=1.378, acc=0.986, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.990e-05, train_time=0.103 -[v016] 2022-01-31 09:01:51,584 (trainer:653) INFO: 184epoch:train:109-135batch: iter_time=0.005, forward_time=0.034, loss=1.190, loss_att=0.450, loss_ctc=1.929, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.989e-05, train_time=0.102 -[v016] 2022-01-31 09:01:54,089 (trainer:653) INFO: 184epoch:train:136-162batch: iter_time=0.002, forward_time=0.031, loss=0.861, loss_att=0.363, loss_ctc=1.359, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.987e-05, train_time=0.093 -[v016] 2022-01-31 09:01:56,562 (trainer:653) INFO: 184epoch:train:163-189batch: iter_time=7.787e-05, forward_time=0.032, loss=0.857, loss_att=0.315, loss_ctc=1.399, acc=0.987, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.986e-05, train_time=0.091 -[v016] 2022-01-31 09:01:59,052 (trainer:653) INFO: 184epoch:train:190-216batch: iter_time=7.843e-05, forward_time=0.032, loss=0.936, loss_att=0.393, loss_ctc=1.480, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.985e-05, train_time=0.092 -[v016] 2022-01-31 09:02:01,558 (trainer:653) INFO: 184epoch:train:217-243batch: iter_time=0.002, forward_time=0.032, loss=0.939, loss_att=0.392, loss_ctc=1.486, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.983e-05, train_time=0.093 -[v016] 2022-01-31 09:02:04,195 (trainer:653) INFO: 184epoch:train:244-270batch: iter_time=0.005, forward_time=0.032, loss=1.007, loss_att=0.426, loss_ctc=1.588, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.982e-05, train_time=0.097 -[v016] 2022-01-31 09:02:06,927 (trainer:653) INFO: 184epoch:train:271-297batch: iter_time=0.010, forward_time=0.031, loss=1.052, loss_att=0.473, loss_ctc=1.631, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.981e-05, train_time=0.101 -[v016] 2022-01-31 09:02:09,370 (trainer:653) INFO: 184epoch:train:298-324batch: iter_time=7.631e-05, forward_time=0.031, loss=0.920, loss_att=0.427, loss_ctc=1.413, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.979e-05, train_time=0.090 -[v016] 2022-01-31 09:02:11,804 (trainer:653) INFO: 184epoch:train:325-351batch: iter_time=7.572e-05, forward_time=0.031, loss=0.848, loss_att=0.384, loss_ctc=1.313, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.978e-05, train_time=0.090 -[v016] 2022-01-31 09:02:14,284 (trainer:653) INFO: 184epoch:train:352-378batch: iter_time=7.876e-05, forward_time=0.032, loss=0.921, loss_att=0.368, loss_ctc=1.475, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.977e-05, train_time=0.092 -[v016] 2022-01-31 09:02:16,764 (trainer:653) INFO: 184epoch:train:379-405batch: iter_time=7.786e-05, forward_time=0.032, loss=0.940, loss_att=0.354, loss_ctc=1.527, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.975e-05, train_time=0.092 -[v016] 2022-01-31 09:02:20,898 (trainer:653) INFO: 184epoch:train:406-432batch: iter_time=0.059, forward_time=0.033, loss=1.132, loss_att=0.500, loss_ctc=1.764, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.974e-05, train_time=0.153 -[v016] 2022-01-31 09:02:23,375 (trainer:653) INFO: 184epoch:train:433-459batch: iter_time=7.817e-05, forward_time=0.032, loss=1.047, loss_att=0.528, loss_ctc=1.566, acc=0.972, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.973e-05, train_time=0.092 -[v016] 2022-01-31 09:02:25,938 (trainer:653) INFO: 184epoch:train:460-486batch: iter_time=8.125e-05, forward_time=0.033, loss=0.914, loss_att=0.371, loss_ctc=1.458, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.971e-05, train_time=0.095 -[v016] 2022-01-31 09:02:28,501 (trainer:653) INFO: 184epoch:train:487-513batch: iter_time=0.002, forward_time=0.032, loss=0.786, loss_att=0.377, loss_ctc=1.196, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.970e-05, train_time=0.095 -[v016] 2022-01-31 09:02:31,047 (trainer:653) INFO: 184epoch:train:514-540batch: iter_time=8.287e-05, forward_time=0.033, loss=0.957, loss_att=0.409, loss_ctc=1.506, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.969e-05, train_time=0.094 -[v016] 2022-01-31 09:03:05,256 (trainer:328) INFO: 184epoch results: [train] iter_time=0.005, forward_time=0.032, loss=0.972, loss_att=0.413, loss_ctc=1.532, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.981e-05, train_time=0.097, time=53.5 seconds, total_count=100648, gpu_max_cached_mem_GB=5.824, [valid] loss=7.965, loss_att=6.541, loss_ctc=9.390, acc=0.905, cer=0.100, wer=0.401, cer_ctc=0.141, time=6.01 seconds, total_count=32752, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.5 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 09:03:08,098 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 09:03:08,111 (trainer:261) INFO: 185/200epoch started. Estimated time to finish: 28 minutes and 46.37 seconds -[v016] 2022-01-31 09:03:10,842 (trainer:653) INFO: 185epoch:train:1-27batch: iter_time=0.004, forward_time=0.034, loss=0.856, loss_att=0.350, loss_ctc=1.362, acc=0.986, backward_time=0.022, optim_step_time=0.021, optim0_lr0=9.967e-05, train_time=0.101 -[v016] 2022-01-31 09:03:13,418 (trainer:653) INFO: 185epoch:train:28-54batch: iter_time=8.983e-05, forward_time=0.034, loss=1.081, loss_att=0.412, loss_ctc=1.750, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.966e-05, train_time=0.095 -[v016] 2022-01-31 09:03:15,898 (trainer:653) INFO: 185epoch:train:55-81batch: iter_time=8.360e-05, forward_time=0.032, loss=0.768, loss_att=0.338, loss_ctc=1.198, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.964e-05, train_time=0.092 -[v016] 2022-01-31 09:03:18,328 (trainer:653) INFO: 185epoch:train:82-108batch: iter_time=8.138e-05, forward_time=0.032, loss=0.966, loss_att=0.463, loss_ctc=1.469, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.963e-05, train_time=0.090 -[v016] 2022-01-31 09:03:20,852 (trainer:653) INFO: 185epoch:train:109-135batch: iter_time=8.014e-05, forward_time=0.032, loss=1.069, loss_att=0.440, loss_ctc=1.699, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.962e-05, train_time=0.093 -[v016] 2022-01-31 09:03:23,293 (trainer:653) INFO: 185epoch:train:136-162batch: iter_time=8.168e-05, forward_time=0.032, loss=0.854, loss_att=0.358, loss_ctc=1.351, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.960e-05, train_time=0.090 -[v016] 2022-01-31 09:03:25,735 (trainer:653) INFO: 185epoch:train:163-189batch: iter_time=7.943e-05, forward_time=0.031, loss=0.893, loss_att=0.452, loss_ctc=1.334, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.959e-05, train_time=0.090 -[v016] 2022-01-31 09:03:28,283 (trainer:653) INFO: 185epoch:train:190-216batch: iter_time=7.879e-05, forward_time=0.033, loss=1.071, loss_att=0.428, loss_ctc=1.714, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.958e-05, train_time=0.094 -[v016] 2022-01-31 09:03:30,749 (trainer:653) INFO: 185epoch:train:217-243batch: iter_time=7.777e-05, forward_time=0.032, loss=1.005, loss_att=0.385, loss_ctc=1.624, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.956e-05, train_time=0.091 -[v016] 2022-01-31 09:03:33,324 (trainer:653) INFO: 185epoch:train:244-270batch: iter_time=7.626e-05, forward_time=0.034, loss=1.103, loss_att=0.397, loss_ctc=1.810, acc=0.985, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.955e-05, train_time=0.095 -[v016] 2022-01-31 09:03:35,760 (trainer:653) INFO: 185epoch:train:271-297batch: iter_time=7.736e-05, forward_time=0.032, loss=0.778, loss_att=0.383, loss_ctc=1.173, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.954e-05, train_time=0.090 -[v016] 2022-01-31 09:03:38,331 (trainer:653) INFO: 185epoch:train:298-324batch: iter_time=8.459e-05, forward_time=0.034, loss=1.108, loss_att=0.523, loss_ctc=1.693, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.952e-05, train_time=0.095 -[v016] 2022-01-31 09:03:40,982 (trainer:653) INFO: 185epoch:train:325-351batch: iter_time=0.006, forward_time=0.033, loss=0.944, loss_att=0.380, loss_ctc=1.507, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.951e-05, train_time=0.098 -[v016] 2022-01-31 09:03:43,494 (trainer:653) INFO: 185epoch:train:352-378batch: iter_time=7.810e-05, forward_time=0.033, loss=0.805, loss_att=0.367, loss_ctc=1.243, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.950e-05, train_time=0.093 -[v016] 2022-01-31 09:03:45,960 (trainer:653) INFO: 185epoch:train:379-405batch: iter_time=8.063e-05, forward_time=0.032, loss=0.989, loss_att=0.427, loss_ctc=1.551, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.948e-05, train_time=0.091 -[v016] 2022-01-31 09:03:48,519 (trainer:653) INFO: 185epoch:train:406-432batch: iter_time=7.880e-05, forward_time=0.033, loss=1.018, loss_att=0.367, loss_ctc=1.669, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.947e-05, train_time=0.095 -[v016] 2022-01-31 09:03:50,982 (trainer:653) INFO: 185epoch:train:433-459batch: iter_time=7.734e-05, forward_time=0.032, loss=0.919, loss_att=0.335, loss_ctc=1.503, acc=0.985, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.946e-05, train_time=0.091 -[v016] 2022-01-31 09:03:53,465 (trainer:653) INFO: 185epoch:train:460-486batch: iter_time=8.033e-05, forward_time=0.033, loss=0.933, loss_att=0.435, loss_ctc=1.432, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.944e-05, train_time=0.092 -[v016] 2022-01-31 09:03:56,066 (trainer:653) INFO: 185epoch:train:487-513batch: iter_time=8.154e-05, forward_time=0.034, loss=1.072, loss_att=0.446, loss_ctc=1.698, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.943e-05, train_time=0.096 -[v016] 2022-01-31 09:03:58,614 (trainer:653) INFO: 185epoch:train:514-540batch: iter_time=7.898e-05, forward_time=0.033, loss=0.895, loss_att=0.344, loss_ctc=1.447, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.942e-05, train_time=0.094 -[v016] 2022-01-31 09:04:32,755 (trainer:328) INFO: 185epoch results: [train] iter_time=5.451e-04, forward_time=0.033, loss=0.955, loss_att=0.402, loss_ctc=1.508, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.954e-05, train_time=0.093, time=51.21 seconds, total_count=101195, gpu_max_cached_mem_GB=5.824, [valid] loss=8.089, loss_att=6.707, loss_ctc=9.471, acc=0.903, cer=0.104, wer=0.407, cer_ctc=0.147, time=5.62 seconds, total_count=32930, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.82 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 09:04:34,827 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 09:04:34,840 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/180epoch.pth -[v016] 2022-01-31 09:04:34,840 (trainer:261) INFO: 186/200epoch started. Estimated time to finish: 26 minutes and 56.55 seconds -[v016] 2022-01-31 09:04:37,463 (trainer:653) INFO: 186epoch:train:1-27batch: iter_time=0.003, forward_time=0.032, loss=1.038, loss_att=0.452, loss_ctc=1.625, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.940e-05, train_time=0.097 -[v016] 2022-01-31 09:04:39,944 (trainer:653) INFO: 186epoch:train:28-54batch: iter_time=8.744e-05, forward_time=0.032, loss=0.883, loss_att=0.388, loss_ctc=1.377, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.939e-05, train_time=0.092 -[v016] 2022-01-31 09:04:42,500 (trainer:653) INFO: 186epoch:train:55-81batch: iter_time=8.755e-05, forward_time=0.033, loss=0.998, loss_att=0.431, loss_ctc=1.564, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.937e-05, train_time=0.094 -[v016] 2022-01-31 09:04:44,906 (trainer:653) INFO: 186epoch:train:82-108batch: iter_time=7.633e-05, forward_time=0.031, loss=0.927, loss_att=0.424, loss_ctc=1.429, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.936e-05, train_time=0.089 -[v016] 2022-01-31 09:04:47,381 (trainer:653) INFO: 186epoch:train:109-135batch: iter_time=7.455e-05, forward_time=0.032, loss=0.894, loss_att=0.400, loss_ctc=1.388, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.935e-05, train_time=0.091 -[v016] 2022-01-31 09:04:49,877 (trainer:653) INFO: 186epoch:train:136-162batch: iter_time=7.796e-05, forward_time=0.032, loss=0.920, loss_att=0.396, loss_ctc=1.445, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.933e-05, train_time=0.092 -[v016] 2022-01-31 09:04:52,373 (trainer:653) INFO: 186epoch:train:163-189batch: iter_time=7.640e-05, forward_time=0.032, loss=0.972, loss_att=0.438, loss_ctc=1.507, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.932e-05, train_time=0.092 -[v016] 2022-01-31 09:04:54,890 (trainer:653) INFO: 186epoch:train:190-216batch: iter_time=7.696e-05, forward_time=0.033, loss=0.976, loss_att=0.454, loss_ctc=1.498, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.931e-05, train_time=0.093 -[v016] 2022-01-31 09:04:57,362 (trainer:653) INFO: 186epoch:train:217-243batch: iter_time=8.192e-05, forward_time=0.032, loss=1.017, loss_att=0.441, loss_ctc=1.592, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.929e-05, train_time=0.091 -[v016] 2022-01-31 09:04:59,910 (trainer:653) INFO: 186epoch:train:244-270batch: iter_time=8.457e-05, forward_time=0.033, loss=1.058, loss_att=0.427, loss_ctc=1.689, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.928e-05, train_time=0.094 -[v016] 2022-01-31 09:05:02,404 (trainer:653) INFO: 186epoch:train:271-297batch: iter_time=7.843e-05, forward_time=0.033, loss=0.987, loss_att=0.435, loss_ctc=1.539, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.927e-05, train_time=0.092 -[v016] 2022-01-31 09:05:04,857 (trainer:653) INFO: 186epoch:train:298-324batch: iter_time=7.690e-05, forward_time=0.032, loss=0.957, loss_att=0.421, loss_ctc=1.492, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.925e-05, train_time=0.091 -[v016] 2022-01-31 09:05:07,291 (trainer:653) INFO: 186epoch:train:325-351batch: iter_time=7.672e-05, forward_time=0.032, loss=0.883, loss_att=0.359, loss_ctc=1.408, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.924e-05, train_time=0.090 -[v016] 2022-01-31 09:05:09,908 (trainer:653) INFO: 186epoch:train:352-378batch: iter_time=8.322e-05, forward_time=0.034, loss=1.051, loss_att=0.398, loss_ctc=1.704, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.923e-05, train_time=0.097 -[v016] 2022-01-31 09:05:12,484 (trainer:653) INFO: 186epoch:train:379-405batch: iter_time=8.242e-05, forward_time=0.033, loss=0.945, loss_att=0.381, loss_ctc=1.508, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.922e-05, train_time=0.095 -[v016] 2022-01-31 09:05:15,061 (trainer:653) INFO: 186epoch:train:406-432batch: iter_time=0.004, forward_time=0.032, loss=0.976, loss_att=0.456, loss_ctc=1.497, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.920e-05, train_time=0.095 -[v016] 2022-01-31 09:05:17,816 (trainer:653) INFO: 186epoch:train:433-459batch: iter_time=0.010, forward_time=0.032, loss=1.031, loss_att=0.435, loss_ctc=1.628, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.919e-05, train_time=0.102 -[v016] 2022-01-31 09:05:20,376 (trainer:653) INFO: 186epoch:train:460-486batch: iter_time=8.060e-05, forward_time=0.033, loss=1.097, loss_att=0.465, loss_ctc=1.730, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.918e-05, train_time=0.095 -[v016] 2022-01-31 09:05:22,934 (trainer:653) INFO: 186epoch:train:487-513batch: iter_time=8.104e-05, forward_time=0.033, loss=0.877, loss_att=0.358, loss_ctc=1.397, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.916e-05, train_time=0.095 -[v016] 2022-01-31 09:05:25,431 (trainer:653) INFO: 186epoch:train:514-540batch: iter_time=7.785e-05, forward_time=0.032, loss=0.803, loss_att=0.299, loss_ctc=1.306, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.915e-05, train_time=0.092 -[v016] 2022-01-31 09:05:59,171 (trainer:328) INFO: 186epoch results: [train] iter_time=9.246e-04, forward_time=0.032, loss=0.962, loss_att=0.412, loss_ctc=1.513, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.927e-05, train_time=0.093, time=51.29 seconds, total_count=101742, gpu_max_cached_mem_GB=5.824, [valid] loss=8.084, loss_att=6.635, loss_ctc=9.533, acc=0.904, cer=0.101, wer=0.402, cer_ctc=0.145, time=5.67 seconds, total_count=33108, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.37 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 09:06:01,234 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 09:06:01,273 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/184epoch.pth -[v016] 2022-01-31 09:06:01,273 (trainer:261) INFO: 187/200epoch started. Estimated time to finish: 25 minutes and 6.98 seconds -[v016] 2022-01-31 09:06:03,893 (trainer:653) INFO: 187epoch:train:1-27batch: iter_time=0.003, forward_time=0.033, loss=0.938, loss_att=0.439, loss_ctc=1.437, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.913e-05, train_time=0.097 -[v016] 2022-01-31 09:06:06,318 (trainer:653) INFO: 187epoch:train:28-54batch: iter_time=8.230e-05, forward_time=0.032, loss=0.955, loss_att=0.431, loss_ctc=1.479, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.912e-05, train_time=0.090 -[v016] 2022-01-31 09:06:08,816 (trainer:653) INFO: 187epoch:train:55-81batch: iter_time=8.133e-05, forward_time=0.032, loss=0.835, loss_att=0.306, loss_ctc=1.364, acc=0.987, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.911e-05, train_time=0.092 -[v016] 2022-01-31 09:06:11,332 (trainer:653) INFO: 187epoch:train:82-108batch: iter_time=0.001, forward_time=0.032, loss=0.902, loss_att=0.354, loss_ctc=1.451, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.909e-05, train_time=0.093 -[v016] 2022-01-31 09:06:13,829 (trainer:653) INFO: 187epoch:train:109-135batch: iter_time=7.627e-05, forward_time=0.032, loss=0.968, loss_att=0.392, loss_ctc=1.543, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.908e-05, train_time=0.092 -[v016] 2022-01-31 09:06:16,390 (trainer:653) INFO: 187epoch:train:136-162batch: iter_time=7.780e-05, forward_time=0.032, loss=0.794, loss_att=0.358, loss_ctc=1.230, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.907e-05, train_time=0.095 -[v016] 2022-01-31 09:06:18,878 (trainer:653) INFO: 187epoch:train:163-189batch: iter_time=8.032e-05, forward_time=0.032, loss=0.942, loss_att=0.363, loss_ctc=1.521, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.905e-05, train_time=0.092 -[v016] 2022-01-31 09:06:21,370 (trainer:653) INFO: 187epoch:train:190-216batch: iter_time=8.372e-05, forward_time=0.032, loss=0.955, loss_att=0.375, loss_ctc=1.534, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.904e-05, train_time=0.092 -[v016] 2022-01-31 09:06:24,024 (trainer:653) INFO: 187epoch:train:217-243batch: iter_time=0.007, forward_time=0.031, loss=0.854, loss_att=0.328, loss_ctc=1.381, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.903e-05, train_time=0.098 -[v016] 2022-01-31 09:06:26,541 (trainer:653) INFO: 187epoch:train:244-270batch: iter_time=7.710e-05, forward_time=0.032, loss=0.875, loss_att=0.343, loss_ctc=1.407, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.901e-05, train_time=0.093 -[v016] 2022-01-31 09:06:29,006 (trainer:653) INFO: 187epoch:train:271-297batch: iter_time=7.766e-05, forward_time=0.032, loss=0.884, loss_att=0.415, loss_ctc=1.353, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.900e-05, train_time=0.091 -[v016] 2022-01-31 09:06:31,464 (trainer:653) INFO: 187epoch:train:298-324batch: iter_time=7.576e-05, forward_time=0.031, loss=0.881, loss_att=0.321, loss_ctc=1.440, acc=0.985, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.899e-05, train_time=0.091 -[v016] 2022-01-31 09:06:33,918 (trainer:653) INFO: 187epoch:train:325-351batch: iter_time=7.512e-05, forward_time=0.031, loss=1.048, loss_att=0.458, loss_ctc=1.638, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.898e-05, train_time=0.091 -[v016] 2022-01-31 09:06:36,425 (trainer:653) INFO: 187epoch:train:352-378batch: iter_time=8.580e-05, forward_time=0.033, loss=1.139, loss_att=0.484, loss_ctc=1.795, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.896e-05, train_time=0.093 -[v016] 2022-01-31 09:06:38,913 (trainer:653) INFO: 187epoch:train:379-405batch: iter_time=7.680e-05, forward_time=0.032, loss=0.915, loss_att=0.335, loss_ctc=1.495, acc=0.984, backward_time=0.021, optim_step_time=0.020, optim0_lr0=9.895e-05, train_time=0.092 -[v016] 2022-01-31 09:06:41,424 (trainer:653) INFO: 187epoch:train:406-432batch: iter_time=7.523e-05, forward_time=0.032, loss=0.984, loss_att=0.433, loss_ctc=1.534, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.894e-05, train_time=0.093 -[v016] 2022-01-31 09:06:43,919 (trainer:653) INFO: 187epoch:train:433-459batch: iter_time=7.733e-05, forward_time=0.032, loss=1.043, loss_att=0.467, loss_ctc=1.619, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.892e-05, train_time=0.092 -[v016] 2022-01-31 09:06:46,510 (trainer:653) INFO: 187epoch:train:460-486batch: iter_time=0.006, forward_time=0.031, loss=1.049, loss_att=0.495, loss_ctc=1.603, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.891e-05, train_time=0.096 -[v016] 2022-01-31 09:06:49,067 (trainer:653) INFO: 187epoch:train:487-513batch: iter_time=1.078e-04, forward_time=0.032, loss=1.054, loss_att=0.424, loss_ctc=1.684, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.890e-05, train_time=0.095 -[v016] 2022-01-31 09:06:51,657 (trainer:653) INFO: 187epoch:train:514-540batch: iter_time=9.599e-05, forward_time=0.034, loss=0.977, loss_att=0.389, loss_ctc=1.565, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.888e-05, train_time=0.096 -[v016] 2022-01-31 09:07:25,523 (trainer:328) INFO: 187epoch results: [train] iter_time=9.492e-04, forward_time=0.032, loss=0.951, loss_att=0.395, loss_ctc=1.507, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.901e-05, train_time=0.093, time=51.13 seconds, total_count=102289, gpu_max_cached_mem_GB=5.824, [valid] loss=8.074, loss_att=6.636, loss_ctc=9.511, acc=0.904, cer=0.101, wer=0.398, cer_ctc=0.144, time=5.52 seconds, total_count=33286, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.6 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 09:07:27,546 (trainer:375) INFO: The best model has been updated: train.loss -[v016] 2022-01-31 09:07:27,560 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/178epoch.pth, exp/asr_train_asr_raw_en_word/179epoch.pth -[v016] 2022-01-31 09:07:27,560 (trainer:261) INFO: 188/200epoch started. Estimated time to finish: 23 minutes and 17.68 seconds -[v016] 2022-01-31 09:07:30,278 (trainer:653) INFO: 188epoch:train:1-27batch: iter_time=0.004, forward_time=0.034, loss=0.903, loss_att=0.349, loss_ctc=1.457, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.887e-05, train_time=0.100 -[v016] 2022-01-31 09:07:32,750 (trainer:653) INFO: 188epoch:train:28-54batch: iter_time=9.268e-05, forward_time=0.032, loss=1.012, loss_att=0.496, loss_ctc=1.529, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.885e-05, train_time=0.091 -[v016] 2022-01-31 09:07:35,265 (trainer:653) INFO: 188epoch:train:55-81batch: iter_time=8.432e-05, forward_time=0.033, loss=0.891, loss_att=0.410, loss_ctc=1.372, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.884e-05, train_time=0.093 -[v016] 2022-01-31 09:07:37,840 (trainer:653) INFO: 188epoch:train:82-108batch: iter_time=1.044e-04, forward_time=0.034, loss=1.151, loss_att=0.439, loss_ctc=1.864, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.883e-05, train_time=0.095 -[v016] 2022-01-31 09:07:40,386 (trainer:653) INFO: 188epoch:train:109-135batch: iter_time=8.659e-05, forward_time=0.033, loss=1.111, loss_att=0.521, loss_ctc=1.701, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.882e-05, train_time=0.094 -[v016] 2022-01-31 09:07:43,008 (trainer:653) INFO: 188epoch:train:136-162batch: iter_time=0.008, forward_time=0.031, loss=0.858, loss_att=0.414, loss_ctc=1.301, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.880e-05, train_time=0.097 -[v016] 2022-01-31 09:07:45,544 (trainer:653) INFO: 188epoch:train:163-189batch: iter_time=7.820e-05, forward_time=0.033, loss=0.893, loss_att=0.332, loss_ctc=1.453, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.879e-05, train_time=0.094 -[v016] 2022-01-31 09:07:47,980 (trainer:653) INFO: 188epoch:train:190-216batch: iter_time=7.803e-05, forward_time=0.031, loss=0.802, loss_att=0.352, loss_ctc=1.252, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.878e-05, train_time=0.090 -[v016] 2022-01-31 09:07:50,506 (trainer:653) INFO: 188epoch:train:217-243batch: iter_time=8.098e-05, forward_time=0.033, loss=1.043, loss_att=0.486, loss_ctc=1.600, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.876e-05, train_time=0.093 -[v016] 2022-01-31 09:07:52,979 (trainer:653) INFO: 188epoch:train:244-270batch: iter_time=7.805e-05, forward_time=0.032, loss=0.909, loss_att=0.427, loss_ctc=1.391, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.875e-05, train_time=0.091 -[v016] 2022-01-31 09:07:55,593 (trainer:653) INFO: 188epoch:train:271-297batch: iter_time=8.620e-05, forward_time=0.034, loss=1.152, loss_att=0.411, loss_ctc=1.892, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.874e-05, train_time=0.097 -[v016] 2022-01-31 09:07:58,050 (trainer:653) INFO: 188epoch:train:298-324batch: iter_time=7.902e-05, forward_time=0.032, loss=0.936, loss_att=0.390, loss_ctc=1.482, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.872e-05, train_time=0.091 -[v016] 2022-01-31 09:08:00,551 (trainer:653) INFO: 188epoch:train:325-351batch: iter_time=7.792e-05, forward_time=0.032, loss=0.911, loss_att=0.338, loss_ctc=1.483, acc=0.985, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.871e-05, train_time=0.092 -[v016] 2022-01-31 09:08:03,022 (trainer:653) INFO: 188epoch:train:352-378batch: iter_time=7.853e-05, forward_time=0.032, loss=0.942, loss_att=0.347, loss_ctc=1.537, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.870e-05, train_time=0.091 -[v016] 2022-01-31 09:08:05,524 (trainer:653) INFO: 188epoch:train:379-405batch: iter_time=7.985e-05, forward_time=0.032, loss=0.928, loss_att=0.385, loss_ctc=1.471, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.869e-05, train_time=0.092 -[v016] 2022-01-31 09:08:07,964 (trainer:653) INFO: 188epoch:train:406-432batch: iter_time=8.822e-05, forward_time=0.032, loss=0.855, loss_att=0.431, loss_ctc=1.279, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.867e-05, train_time=0.090 -[v016] 2022-01-31 09:08:10,524 (trainer:653) INFO: 188epoch:train:433-459batch: iter_time=8.795e-05, forward_time=0.033, loss=0.974, loss_att=0.420, loss_ctc=1.528, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.866e-05, train_time=0.095 -[v016] 2022-01-31 09:08:13,072 (trainer:653) INFO: 188epoch:train:460-486batch: iter_time=9.108e-05, forward_time=0.033, loss=0.877, loss_att=0.362, loss_ctc=1.392, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.865e-05, train_time=0.094 -[v016] 2022-01-31 09:08:15,503 (trainer:653) INFO: 188epoch:train:487-513batch: iter_time=8.044e-05, forward_time=0.032, loss=0.906, loss_att=0.386, loss_ctc=1.425, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.863e-05, train_time=0.090 -[v016] 2022-01-31 09:08:18,079 (trainer:653) INFO: 188epoch:train:514-540batch: iter_time=7.956e-05, forward_time=0.033, loss=0.937, loss_att=0.399, loss_ctc=1.475, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.862e-05, train_time=0.095 -[v016] 2022-01-31 09:08:52,065 (trainer:328) INFO: 188epoch results: [train] iter_time=9.834e-04, forward_time=0.033, loss=0.948, loss_att=0.403, loss_ctc=1.492, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.874e-05, train_time=0.094, time=51.42 seconds, total_count=102836, gpu_max_cached_mem_GB=5.824, [valid] loss=8.138, loss_att=6.695, loss_ctc=9.581, acc=0.902, cer=0.104, wer=0.407, cer_ctc=0.149, time=5.48 seconds, total_count=33464, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.61 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 09:08:54,018 (trainer:375) INFO: The best model has been updated: train.loss -[v016] 2022-01-31 09:08:54,056 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/177epoch.pth, exp/asr_train_asr_raw_en_word/183epoch.pth -[v016] 2022-01-31 09:08:54,056 (trainer:261) INFO: 189/200epoch started. Estimated time to finish: 21 minutes and 28.66 seconds -[v016] 2022-01-31 09:08:56,738 (trainer:653) INFO: 189epoch:train:1-27batch: iter_time=0.004, forward_time=0.033, loss=1.014, loss_att=0.385, loss_ctc=1.643, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.860e-05, train_time=0.099 -[v016] 2022-01-31 09:08:59,255 (trainer:653) INFO: 189epoch:train:28-54batch: iter_time=8.615e-05, forward_time=0.033, loss=0.914, loss_att=0.367, loss_ctc=1.460, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.859e-05, train_time=0.093 -[v016] 2022-01-31 09:09:01,778 (trainer:653) INFO: 189epoch:train:55-81batch: iter_time=7.987e-05, forward_time=0.033, loss=0.966, loss_att=0.418, loss_ctc=1.515, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.858e-05, train_time=0.093 -[v016] 2022-01-31 09:09:04,306 (trainer:653) INFO: 189epoch:train:82-108batch: iter_time=7.650e-05, forward_time=0.032, loss=0.877, loss_att=0.360, loss_ctc=1.393, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.857e-05, train_time=0.093 -[v016] 2022-01-31 09:09:06,920 (trainer:653) INFO: 189epoch:train:109-135batch: iter_time=8.036e-05, forward_time=0.033, loss=1.061, loss_att=0.443, loss_ctc=1.678, acc=0.981, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.855e-05, train_time=0.097 -[v016] 2022-01-31 09:09:09,471 (trainer:653) INFO: 189epoch:train:136-162batch: iter_time=8.653e-05, forward_time=0.032, loss=1.135, loss_att=0.445, loss_ctc=1.825, acc=0.980, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.854e-05, train_time=0.094 -[v016] 2022-01-31 09:09:12,181 (trainer:653) INFO: 189epoch:train:163-189batch: iter_time=0.008, forward_time=0.032, loss=0.803, loss_att=0.364, loss_ctc=1.241, acc=0.979, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.853e-05, train_time=0.100 -[v016] 2022-01-31 09:09:14,692 (trainer:653) INFO: 189epoch:train:190-216batch: iter_time=7.956e-05, forward_time=0.032, loss=0.978, loss_att=0.443, loss_ctc=1.513, acc=0.976, backward_time=0.022, optim_step_time=0.021, optim0_lr0=9.851e-05, train_time=0.093 -[v016] 2022-01-31 09:09:17,463 (trainer:653) INFO: 189epoch:train:217-243batch: iter_time=0.007, forward_time=0.033, loss=0.909, loss_att=0.347, loss_ctc=1.471, acc=0.983, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.850e-05, train_time=0.102 -[v016] 2022-01-31 09:09:20,124 (trainer:653) INFO: 189epoch:train:244-270batch: iter_time=0.005, forward_time=0.032, loss=0.848, loss_att=0.365, loss_ctc=1.332, acc=0.983, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.849e-05, train_time=0.098 -[v016] 2022-01-31 09:09:22,763 (trainer:653) INFO: 189epoch:train:271-297batch: iter_time=0.006, forward_time=0.031, loss=0.943, loss_att=0.410, loss_ctc=1.475, acc=0.980, backward_time=0.022, optim_step_time=0.021, optim0_lr0=9.848e-05, train_time=0.098 -[v016] 2022-01-31 09:09:25,280 (trainer:653) INFO: 189epoch:train:298-324batch: iter_time=7.994e-05, forward_time=0.032, loss=0.958, loss_att=0.452, loss_ctc=1.463, acc=0.979, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.846e-05, train_time=0.093 -[v016] 2022-01-31 09:09:31,172 (trainer:653) INFO: 189epoch:train:325-351batch: iter_time=0.028, forward_time=0.095, loss=0.923, loss_att=0.474, loss_ctc=1.371, acc=0.973, backward_time=0.028, optim_step_time=0.047, optim0_lr0=9.845e-05, train_time=0.218 -[v016] 2022-01-31 09:09:33,786 (trainer:653) INFO: 189epoch:train:352-378batch: iter_time=0.003, forward_time=0.032, loss=0.860, loss_att=0.436, loss_ctc=1.284, acc=0.976, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.844e-05, train_time=0.097 -[v016] 2022-01-31 09:09:36,355 (trainer:653) INFO: 189epoch:train:379-405batch: iter_time=8.122e-05, forward_time=0.033, loss=1.120, loss_att=0.436, loss_ctc=1.803, acc=0.980, backward_time=0.022, optim_step_time=0.021, optim0_lr0=9.842e-05, train_time=0.095 -[v016] 2022-01-31 09:09:39,264 (trainer:653) INFO: 189epoch:train:406-432batch: iter_time=0.018, forward_time=0.030, loss=0.994, loss_att=0.474, loss_ctc=1.514, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.841e-05, train_time=0.108 -[v016] 2022-01-31 09:09:41,659 (trainer:653) INFO: 189epoch:train:433-459batch: iter_time=7.920e-05, forward_time=0.030, loss=1.006, loss_att=0.467, loss_ctc=1.545, acc=0.973, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.840e-05, train_time=0.088 -[v016] 2022-01-31 09:09:44,572 (trainer:653) INFO: 189epoch:train:460-486batch: iter_time=0.016, forward_time=0.031, loss=0.849, loss_att=0.308, loss_ctc=1.390, acc=0.986, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.838e-05, train_time=0.108 -[v016] 2022-01-31 09:09:47,389 (trainer:653) INFO: 189epoch:train:487-513batch: iter_time=0.006, forward_time=0.033, loss=1.112, loss_att=0.393, loss_ctc=1.830, acc=0.983, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.837e-05, train_time=0.104 -[v016] 2022-01-31 09:09:49,974 (trainer:653) INFO: 189epoch:train:514-540batch: iter_time=1.115e-04, forward_time=0.033, loss=0.964, loss_att=0.407, loss_ctc=1.521, acc=0.983, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.836e-05, train_time=0.096 -[v016] 2022-01-31 09:10:25,118 (trainer:328) INFO: 189epoch results: [train] iter_time=0.005, forward_time=0.035, loss=0.958, loss_att=0.408, loss_ctc=1.508, acc=0.980, backward_time=0.022, optim_step_time=0.023, optim0_lr0=9.848e-05, train_time=0.103, time=56.66 seconds, total_count=103383, gpu_max_cached_mem_GB=5.824, [valid] loss=8.153, loss_att=6.711, loss_ctc=9.595, acc=0.903, cer=0.104, wer=0.403, cer_ctc=0.145, time=5.93 seconds, total_count=33642, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.48 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 09:10:27,255 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 09:10:27,314 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/186epoch.pth -[v016] 2022-01-31 09:10:27,314 (trainer:261) INFO: 190/200epoch started. Estimated time to finish: 19 minutes and 40.35 seconds -[v016] 2022-01-31 09:10:29,939 (trainer:653) INFO: 190epoch:train:1-27batch: iter_time=0.004, forward_time=0.031, loss=0.888, loss_att=0.386, loss_ctc=1.390, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.834e-05, train_time=0.097 -[v016] 2022-01-31 09:10:34,255 (trainer:653) INFO: 190epoch:train:28-54batch: iter_time=8.982e-05, forward_time=0.091, loss=0.901, loss_att=0.291, loss_ctc=1.511, acc=0.986, backward_time=0.026, optim_step_time=0.022, optim0_lr0=9.833e-05, train_time=0.160 -[v016] 2022-01-31 09:10:36,802 (trainer:653) INFO: 190epoch:train:55-81batch: iter_time=0.002, forward_time=0.032, loss=0.806, loss_att=0.332, loss_ctc=1.280, acc=0.983, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.832e-05, train_time=0.094 -[v016] 2022-01-31 09:10:40,363 (trainer:653) INFO: 190epoch:train:82-108batch: iter_time=0.035, forward_time=0.033, loss=1.130, loss_att=0.531, loss_ctc=1.728, acc=0.978, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.830e-05, train_time=0.132 -[v016] 2022-01-31 09:10:42,949 (trainer:653) INFO: 190epoch:train:109-135batch: iter_time=8.658e-05, forward_time=0.032, loss=1.007, loss_att=0.405, loss_ctc=1.608, acc=0.978, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.829e-05, train_time=0.096 -[v016] 2022-01-31 09:10:45,773 (trainer:653) INFO: 190epoch:train:136-162batch: iter_time=0.008, forward_time=0.033, loss=0.993, loss_att=0.439, loss_ctc=1.547, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.828e-05, train_time=0.104 -[v016] 2022-01-31 09:10:48,438 (trainer:653) INFO: 190epoch:train:163-189batch: iter_time=0.005, forward_time=0.032, loss=0.895, loss_att=0.357, loss_ctc=1.432, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.827e-05, train_time=0.099 -[v016] 2022-01-31 09:10:51,342 (trainer:653) INFO: 190epoch:train:190-216batch: iter_time=0.016, forward_time=0.031, loss=0.873, loss_att=0.424, loss_ctc=1.322, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.825e-05, train_time=0.107 -[v016] 2022-01-31 09:10:54,643 (trainer:653) INFO: 190epoch:train:217-243batch: iter_time=0.028, forward_time=0.032, loss=1.005, loss_att=0.388, loss_ctc=1.622, acc=0.984, backward_time=0.022, optim_step_time=0.021, optim0_lr0=9.824e-05, train_time=0.122 -[v016] 2022-01-31 09:10:57,184 (trainer:653) INFO: 190epoch:train:244-270batch: iter_time=4.708e-04, forward_time=0.031, loss=0.939, loss_att=0.350, loss_ctc=1.527, acc=0.983, backward_time=0.022, optim_step_time=0.021, optim0_lr0=9.823e-05, train_time=0.094 -[v016] 2022-01-31 09:10:59,935 (trainer:653) INFO: 190epoch:train:271-297batch: iter_time=0.007, forward_time=0.032, loss=1.033, loss_att=0.421, loss_ctc=1.645, acc=0.981, backward_time=0.022, optim_step_time=0.021, optim0_lr0=9.821e-05, train_time=0.102 -[v016] 2022-01-31 09:11:02,828 (trainer:653) INFO: 190epoch:train:298-324batch: iter_time=0.012, forward_time=0.032, loss=1.030, loss_att=0.389, loss_ctc=1.670, acc=0.981, backward_time=0.022, optim_step_time=0.021, optim0_lr0=9.820e-05, train_time=0.107 -[v016] 2022-01-31 09:11:05,309 (trainer:653) INFO: 190epoch:train:325-351batch: iter_time=8.185e-04, forward_time=0.031, loss=0.947, loss_att=0.437, loss_ctc=1.456, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.819e-05, train_time=0.092 -[v016] 2022-01-31 09:11:07,956 (trainer:653) INFO: 190epoch:train:352-378batch: iter_time=0.005, forward_time=0.032, loss=0.995, loss_att=0.492, loss_ctc=1.499, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.818e-05, train_time=0.098 -[v016] 2022-01-31 09:11:10,514 (trainer:653) INFO: 190epoch:train:379-405batch: iter_time=9.030e-05, forward_time=0.032, loss=0.877, loss_att=0.371, loss_ctc=1.383, acc=0.980, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.816e-05, train_time=0.094 -[v016] 2022-01-31 09:11:13,333 (trainer:653) INFO: 190epoch:train:406-432batch: iter_time=0.009, forward_time=0.033, loss=0.943, loss_att=0.371, loss_ctc=1.516, acc=0.982, backward_time=0.022, optim_step_time=0.021, optim0_lr0=9.815e-05, train_time=0.104 -[v016] 2022-01-31 09:11:16,385 (trainer:653) INFO: 190epoch:train:433-459batch: iter_time=0.022, forward_time=0.030, loss=0.877, loss_att=0.394, loss_ctc=1.360, acc=0.976, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.814e-05, train_time=0.113 -[v016] 2022-01-31 09:11:19,103 (trainer:653) INFO: 190epoch:train:460-486batch: iter_time=0.005, forward_time=0.033, loss=0.919, loss_att=0.388, loss_ctc=1.450, acc=0.981, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.813e-05, train_time=0.100 -[v016] 2022-01-31 09:11:21,898 (trainer:653) INFO: 190epoch:train:487-513batch: iter_time=0.012, forward_time=0.031, loss=0.990, loss_att=0.396, loss_ctc=1.583, acc=0.979, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.811e-05, train_time=0.103 -[v016] 2022-01-31 09:11:26,201 (trainer:653) INFO: 190epoch:train:514-540batch: iter_time=0.046, forward_time=0.036, loss=0.869, loss_att=0.415, loss_ctc=1.324, acc=0.981, backward_time=0.027, optim_step_time=0.023, optim0_lr0=9.810e-05, train_time=0.159 -[v016] 2022-01-31 09:12:21,768 (trainer:328) INFO: 190epoch results: [train] iter_time=0.011, forward_time=0.035, loss=0.951, loss_att=0.401, loss_ctc=1.502, acc=0.980, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.822e-05, train_time=0.110, time=1 minute and 0.39 seconds, total_count=103930, gpu_max_cached_mem_GB=5.824, [valid] loss=8.051, loss_att=6.731, loss_ctc=9.371, acc=0.904, cer=0.102, wer=0.404, cer_ctc=0.146, time=13.74 seconds, total_count=33820, gpu_max_cached_mem_GB=5.824, [att_plot] time=40.28 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 09:12:24,346 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 09:12:24,395 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/189epoch.pth -[v016] 2022-01-31 09:12:24,396 (trainer:261) INFO: 191/200epoch started. Estimated time to finish: 17 minutes and 53.62 seconds -[v016] 2022-01-31 09:12:29,976 (trainer:653) INFO: 191epoch:train:1-27batch: iter_time=0.092, forward_time=0.036, loss=0.875, loss_att=0.304, loss_ctc=1.446, acc=0.985, backward_time=0.025, optim_step_time=0.023, optim0_lr0=9.808e-05, train_time=0.199 -[v016] 2022-01-31 09:12:34,047 (trainer:653) INFO: 191epoch:train:28-54batch: iter_time=0.057, forward_time=0.032, loss=0.974, loss_att=0.462, loss_ctc=1.486, acc=0.972, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.807e-05, train_time=0.151 -[v016] 2022-01-31 09:12:37,654 (trainer:653) INFO: 191epoch:train:55-81batch: iter_time=0.036, forward_time=0.034, loss=0.879, loss_att=0.357, loss_ctc=1.402, acc=0.984, backward_time=0.023, optim_step_time=0.022, optim0_lr0=9.806e-05, train_time=0.133 -[v016] 2022-01-31 09:12:41,166 (trainer:653) INFO: 191epoch:train:82-108batch: iter_time=0.027, forward_time=0.035, loss=0.847, loss_att=0.382, loss_ctc=1.311, acc=0.984, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.805e-05, train_time=0.130 -[v016] 2022-01-31 09:12:45,927 (trainer:653) INFO: 191epoch:train:109-135batch: iter_time=0.076, forward_time=0.034, loss=0.903, loss_att=0.314, loss_ctc=1.492, acc=0.983, backward_time=0.023, optim_step_time=0.022, optim0_lr0=9.803e-05, train_time=0.176 -[v016] 2022-01-31 09:12:51,030 (trainer:653) INFO: 191epoch:train:136-162batch: iter_time=0.061, forward_time=0.037, loss=0.940, loss_att=0.404, loss_ctc=1.477, acc=0.979, backward_time=0.024, optim_step_time=0.031, optim0_lr0=9.802e-05, train_time=0.188 -[v016] 2022-01-31 09:13:02,984 (trainer:653) INFO: 191epoch:train:163-189batch: iter_time=0.314, forward_time=0.046, loss=0.947, loss_att=0.429, loss_ctc=1.465, acc=0.980, backward_time=0.025, optim_step_time=0.027, optim0_lr0=9.801e-05, train_time=0.440 -[v016] 2022-01-31 09:13:16,721 (trainer:653) INFO: 191epoch:train:190-216batch: iter_time=0.387, forward_time=0.039, loss=0.767, loss_att=0.356, loss_ctc=1.178, acc=0.983, backward_time=0.026, optim_step_time=0.029, optim0_lr0=9.799e-05, train_time=0.508 -[v016] 2022-01-31 09:13:36,719 (trainer:653) INFO: 191epoch:train:217-243batch: iter_time=0.594, forward_time=0.055, loss=0.829, loss_att=0.310, loss_ctc=1.348, acc=0.987, backward_time=0.026, optim_step_time=0.030, optim0_lr0=9.798e-05, train_time=0.741 -[v016] 2022-01-31 09:13:47,193 (trainer:653) INFO: 191epoch:train:244-270batch: iter_time=0.280, forward_time=0.035, loss=0.928, loss_att=0.370, loss_ctc=1.486, acc=0.982, backward_time=0.024, optim_step_time=0.024, optim0_lr0=9.797e-05, train_time=0.388 -[v016] 2022-01-31 09:14:02,341 (trainer:653) INFO: 191epoch:train:271-297batch: iter_time=0.446, forward_time=0.041, loss=1.075, loss_att=0.448, loss_ctc=1.702, acc=0.976, backward_time=0.026, optim_step_time=0.024, optim0_lr0=9.796e-05, train_time=0.561 -[v016] 2022-01-31 09:14:19,146 (trainer:653) INFO: 191epoch:train:298-324batch: iter_time=0.383, forward_time=0.152, loss=0.922, loss_att=0.363, loss_ctc=1.481, acc=0.984, backward_time=0.034, optim_step_time=0.024, optim0_lr0=9.794e-05, train_time=0.622 -[v016] 2022-01-31 09:14:35,427 (trainer:653) INFO: 191epoch:train:325-351batch: iter_time=0.503, forward_time=0.035, loss=0.877, loss_att=0.403, loss_ctc=1.350, acc=0.977, backward_time=0.023, optim_step_time=0.023, optim0_lr0=9.793e-05, train_time=0.603 -[v016] 2022-01-31 09:14:46,380 (trainer:653) INFO: 191epoch:train:352-378batch: iter_time=0.304, forward_time=0.034, loss=0.892, loss_att=0.474, loss_ctc=1.310, acc=0.975, backward_time=0.023, optim_step_time=0.023, optim0_lr0=9.792e-05, train_time=0.405 -[v016] 2022-01-31 09:14:56,142 (trainer:653) INFO: 191epoch:train:379-405batch: iter_time=0.263, forward_time=0.034, loss=0.951, loss_att=0.431, loss_ctc=1.472, acc=0.977, backward_time=0.023, optim_step_time=0.022, optim0_lr0=9.791e-05, train_time=0.362 -[v016] 2022-01-31 09:15:07,920 (trainer:653) INFO: 191epoch:train:406-432batch: iter_time=0.332, forward_time=0.034, loss=1.122, loss_att=0.452, loss_ctc=1.793, acc=0.980, backward_time=0.023, optim_step_time=0.023, optim0_lr0=9.789e-05, train_time=0.436 -[v016] 2022-01-31 09:15:26,113 (trainer:653) INFO: 191epoch:train:433-459batch: iter_time=0.564, forward_time=0.036, loss=1.113, loss_att=0.455, loss_ctc=1.770, acc=0.982, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.788e-05, train_time=0.674 -[v016] 2022-01-31 09:15:35,457 (trainer:653) INFO: 191epoch:train:460-486batch: iter_time=0.244, forward_time=0.035, loss=0.868, loss_att=0.341, loss_ctc=1.396, acc=0.985, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.787e-05, train_time=0.346 -[v016] 2022-01-31 09:15:44,155 (trainer:653) INFO: 191epoch:train:487-513batch: iter_time=0.224, forward_time=0.034, loss=0.917, loss_att=0.443, loss_ctc=1.392, acc=0.976, backward_time=0.023, optim_step_time=0.023, optim0_lr0=9.786e-05, train_time=0.322 -[v016] 2022-01-31 09:15:53,593 (trainer:653) INFO: 191epoch:train:514-540batch: iter_time=0.251, forward_time=0.034, loss=1.084, loss_att=0.456, loss_ctc=1.711, acc=0.978, backward_time=0.023, optim_step_time=0.023, optim0_lr0=9.784e-05, train_time=0.349 -[v016] 2022-01-31 09:17:32,000 (trainer:328) INFO: 191epoch results: [train] iter_time=0.270, forward_time=0.043, loss=0.935, loss_att=0.398, loss_ctc=1.472, acc=0.980, backward_time=0.024, optim_step_time=0.024, optim0_lr0=9.796e-05, train_time=0.385, time=3 minutes and 30.91 seconds, total_count=104477, gpu_max_cached_mem_GB=5.824, [valid] loss=8.045, loss_att=6.665, loss_ctc=9.425, acc=0.904, cer=0.100, wer=0.404, cer_ctc=0.145, time=1 minute and 4.52 seconds, total_count=33998, gpu_max_cached_mem_GB=5.824, [att_plot] time=31.97 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 09:17:36,521 (trainer:375) INFO: The best model has been updated: train.loss -[v016] 2022-01-31 09:17:36,537 (trainer:261) INFO: 192/200epoch started. Estimated time to finish: 16 minutes and 17.04 seconds -[v016] 2022-01-31 09:17:42,392 (trainer:653) INFO: 192epoch:train:1-27batch: iter_time=0.105, forward_time=0.035, loss=0.869, loss_att=0.358, loss_ctc=1.380, acc=0.986, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.783e-05, train_time=0.208 -[v016] 2022-01-31 09:17:48,554 (trainer:653) INFO: 192epoch:train:28-54batch: iter_time=0.133, forward_time=0.033, loss=0.882, loss_att=0.334, loss_ctc=1.430, acc=0.983, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.781e-05, train_time=0.228 -[v016] 2022-01-31 09:17:56,375 (trainer:653) INFO: 192epoch:train:55-81batch: iter_time=0.189, forward_time=0.034, loss=0.729, loss_att=0.366, loss_ctc=1.092, acc=0.980, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.780e-05, train_time=0.289 -[v016] 2022-01-31 09:18:02,319 (trainer:653) INFO: 192epoch:train:82-108batch: iter_time=0.118, forward_time=0.035, loss=0.930, loss_att=0.280, loss_ctc=1.580, acc=0.989, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.779e-05, train_time=0.220 -[v016] 2022-01-31 09:18:09,162 (trainer:653) INFO: 192epoch:train:109-135batch: iter_time=0.156, forward_time=0.034, loss=0.796, loss_att=0.339, loss_ctc=1.253, acc=0.984, backward_time=0.023, optim_step_time=0.023, optim0_lr0=9.778e-05, train_time=0.253 -[v016] 2022-01-31 09:18:14,301 (trainer:653) INFO: 192epoch:train:136-162batch: iter_time=0.088, forward_time=0.034, loss=0.916, loss_att=0.396, loss_ctc=1.437, acc=0.982, backward_time=0.024, optim_step_time=0.024, optim0_lr0=9.776e-05, train_time=0.190 -[v016] 2022-01-31 09:18:22,031 (trainer:653) INFO: 192epoch:train:163-189batch: iter_time=0.186, forward_time=0.034, loss=0.932, loss_att=0.369, loss_ctc=1.494, acc=0.978, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.775e-05, train_time=0.286 -[v016] 2022-01-31 09:18:27,189 (trainer:653) INFO: 192epoch:train:190-216batch: iter_time=0.091, forward_time=0.034, loss=0.806, loss_att=0.321, loss_ctc=1.291, acc=0.986, backward_time=0.023, optim_step_time=0.023, optim0_lr0=9.774e-05, train_time=0.191 -[v016] 2022-01-31 09:18:31,181 (trainer:653) INFO: 192epoch:train:217-243batch: iter_time=0.051, forward_time=0.033, loss=0.931, loss_att=0.391, loss_ctc=1.471, acc=0.981, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.773e-05, train_time=0.148 -[v016] 2022-01-31 09:18:39,428 (trainer:653) INFO: 192epoch:train:244-270batch: iter_time=0.110, forward_time=0.119, loss=1.002, loss_att=0.440, loss_ctc=1.564, acc=0.979, backward_time=0.028, optim_step_time=0.024, optim0_lr0=9.771e-05, train_time=0.305 -[v016] 2022-01-31 09:18:45,453 (trainer:653) INFO: 192epoch:train:271-297batch: iter_time=0.100, forward_time=0.038, loss=0.935, loss_att=0.385, loss_ctc=1.485, acc=0.984, backward_time=0.035, optim_step_time=0.023, optim0_lr0=9.770e-05, train_time=0.222 -[v016] 2022-01-31 09:18:53,993 (trainer:653) INFO: 192epoch:train:298-324batch: iter_time=0.210, forward_time=0.038, loss=0.999, loss_att=0.394, loss_ctc=1.604, acc=0.984, backward_time=0.025, optim_step_time=0.023, optim0_lr0=9.769e-05, train_time=0.317 -[v016] 2022-01-31 09:19:00,604 (trainer:653) INFO: 192epoch:train:325-351batch: iter_time=0.144, forward_time=0.034, loss=0.903, loss_att=0.393, loss_ctc=1.413, acc=0.977, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.768e-05, train_time=0.245 -[v016] 2022-01-31 09:19:07,104 (trainer:653) INFO: 192epoch:train:352-378batch: iter_time=0.143, forward_time=0.033, loss=0.992, loss_att=0.415, loss_ctc=1.569, acc=0.982, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.766e-05, train_time=0.241 -[v016] 2022-01-31 09:19:16,110 (trainer:653) INFO: 192epoch:train:379-405batch: iter_time=0.228, forward_time=0.036, loss=1.011, loss_att=0.396, loss_ctc=1.626, acc=0.983, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.765e-05, train_time=0.333 -[v016] 2022-01-31 09:19:23,775 (trainer:653) INFO: 192epoch:train:406-432batch: iter_time=0.183, forward_time=0.035, loss=1.076, loss_att=0.496, loss_ctc=1.656, acc=0.978, backward_time=0.023, optim_step_time=0.023, optim0_lr0=9.764e-05, train_time=0.284 -[v016] 2022-01-31 09:19:29,946 (trainer:653) INFO: 192epoch:train:433-459batch: iter_time=0.128, forward_time=0.034, loss=0.948, loss_att=0.456, loss_ctc=1.440, acc=0.975, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.763e-05, train_time=0.228 -[v016] 2022-01-31 09:19:39,229 (trainer:653) INFO: 192epoch:train:460-486batch: iter_time=0.242, forward_time=0.035, loss=0.904, loss_att=0.396, loss_ctc=1.413, acc=0.981, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.761e-05, train_time=0.344 -[v016] 2022-01-31 09:19:49,497 (trainer:653) INFO: 192epoch:train:487-513batch: iter_time=0.281, forward_time=0.034, loss=0.889, loss_att=0.402, loss_ctc=1.375, acc=0.980, backward_time=0.023, optim_step_time=0.023, optim0_lr0=9.760e-05, train_time=0.380 -[v016] 2022-01-31 09:19:54,815 (trainer:653) INFO: 192epoch:train:514-540batch: iter_time=0.095, forward_time=0.034, loss=0.967, loss_att=0.460, loss_ctc=1.473, acc=0.975, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.759e-05, train_time=0.197 -[v016] 2022-01-31 09:21:08,316 (trainer:328) INFO: 192epoch results: [train] iter_time=0.149, forward_time=0.039, loss=0.921, loss_att=0.390, loss_ctc=1.451, acc=0.981, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.771e-05, train_time=0.255, time=2 minutes and 20.04 seconds, total_count=105024, gpu_max_cached_mem_GB=5.824, [valid] loss=8.052, loss_att=6.658, loss_ctc=9.445, acc=0.905, cer=0.100, wer=0.397, cer_ctc=0.143, time=37.53 seconds, total_count=34176, gpu_max_cached_mem_GB=5.824, [att_plot] time=34.06 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 09:21:11,867 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 09:21:11,881 (trainer:261) INFO: 193/200epoch started. Estimated time to finish: 14 minutes and 33.45 seconds -[v016] 2022-01-31 09:21:22,935 (trainer:653) INFO: 193epoch:train:1-27batch: iter_time=0.221, forward_time=0.078, loss=0.888, loss_att=0.415, loss_ctc=1.360, acc=0.980, backward_time=0.054, optim_step_time=0.025, optim0_lr0=9.757e-05, train_time=0.407 -[v016] 2022-01-31 09:21:31,588 (trainer:653) INFO: 193epoch:train:28-54batch: iter_time=0.209, forward_time=0.042, loss=1.071, loss_att=0.461, loss_ctc=1.680, acc=0.978, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.756e-05, train_time=0.320 -[v016] 2022-01-31 09:21:36,938 (trainer:653) INFO: 193epoch:train:55-81batch: iter_time=0.101, forward_time=0.033, loss=1.009, loss_att=0.472, loss_ctc=1.546, acc=0.974, backward_time=0.023, optim_step_time=0.023, optim0_lr0=9.755e-05, train_time=0.198 -[v016] 2022-01-31 09:21:42,229 (trainer:653) INFO: 193epoch:train:82-108batch: iter_time=0.096, forward_time=0.034, loss=0.970, loss_att=0.415, loss_ctc=1.526, acc=0.978, backward_time=0.023, optim_step_time=0.023, optim0_lr0=9.753e-05, train_time=0.196 -[v016] 2022-01-31 09:21:49,099 (trainer:653) INFO: 193epoch:train:109-135batch: iter_time=0.158, forward_time=0.033, loss=0.873, loss_att=0.352, loss_ctc=1.394, acc=0.982, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.752e-05, train_time=0.254 -[v016] 2022-01-31 09:21:56,786 (trainer:653) INFO: 193epoch:train:136-162batch: iter_time=0.187, forward_time=0.033, loss=0.991, loss_att=0.500, loss_ctc=1.482, acc=0.974, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.751e-05, train_time=0.284 -[v016] 2022-01-31 09:22:02,249 (trainer:653) INFO: 193epoch:train:163-189batch: iter_time=0.099, forward_time=0.035, loss=0.996, loss_att=0.371, loss_ctc=1.621, acc=0.985, backward_time=0.024, optim_step_time=0.022, optim0_lr0=9.750e-05, train_time=0.202 -[v016] 2022-01-31 09:22:09,241 (trainer:653) INFO: 193epoch:train:190-216batch: iter_time=0.158, forward_time=0.035, loss=1.032, loss_att=0.388, loss_ctc=1.676, acc=0.983, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.748e-05, train_time=0.259 -[v016] 2022-01-31 09:22:18,483 (trainer:653) INFO: 193epoch:train:217-243batch: iter_time=0.241, forward_time=0.035, loss=1.040, loss_att=0.476, loss_ctc=1.605, acc=0.976, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.747e-05, train_time=0.342 -[v016] 2022-01-31 09:22:24,413 (trainer:653) INFO: 193epoch:train:244-270batch: iter_time=0.120, forward_time=0.034, loss=0.984, loss_att=0.407, loss_ctc=1.561, acc=0.980, backward_time=0.023, optim_step_time=0.023, optim0_lr0=9.746e-05, train_time=0.219 -[v016] 2022-01-31 09:22:30,237 (trainer:653) INFO: 193epoch:train:271-297batch: iter_time=0.111, forward_time=0.036, loss=1.044, loss_att=0.417, loss_ctc=1.671, acc=0.983, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.745e-05, train_time=0.215 -[v016] 2022-01-31 09:22:37,355 (trainer:653) INFO: 193epoch:train:298-324batch: iter_time=0.163, forward_time=0.034, loss=0.910, loss_att=0.372, loss_ctc=1.448, acc=0.982, backward_time=0.023, optim_step_time=0.023, optim0_lr0=9.743e-05, train_time=0.263 -[v016] 2022-01-31 09:22:46,063 (trainer:653) INFO: 193epoch:train:325-351batch: iter_time=0.222, forward_time=0.035, loss=0.950, loss_att=0.385, loss_ctc=1.516, acc=0.982, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.742e-05, train_time=0.322 -[v016] 2022-01-31 09:22:54,036 (trainer:653) INFO: 193epoch:train:352-378batch: iter_time=0.197, forward_time=0.033, loss=0.899, loss_att=0.361, loss_ctc=1.437, acc=0.981, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.741e-05, train_time=0.295 -[v016] 2022-01-31 09:23:03,617 (trainer:653) INFO: 193epoch:train:379-405batch: iter_time=0.254, forward_time=0.034, loss=0.786, loss_att=0.400, loss_ctc=1.171, acc=0.979, backward_time=0.023, optim_step_time=0.023, optim0_lr0=9.740e-05, train_time=0.355 -[v016] 2022-01-31 09:23:10,861 (trainer:653) INFO: 193epoch:train:406-432batch: iter_time=0.174, forward_time=0.032, loss=0.932, loss_att=0.462, loss_ctc=1.402, acc=0.974, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.738e-05, train_time=0.268 -[v016] 2022-01-31 09:23:19,344 (trainer:653) INFO: 193epoch:train:433-459batch: iter_time=0.165, forward_time=0.046, loss=0.803, loss_att=0.371, loss_ctc=1.234, acc=0.980, backward_time=0.059, optim_step_time=0.023, optim0_lr0=9.737e-05, train_time=0.314 -[v016] 2022-01-31 09:23:27,591 (trainer:653) INFO: 193epoch:train:460-486batch: iter_time=0.211, forward_time=0.032, loss=1.003, loss_att=0.384, loss_ctc=1.622, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.736e-05, train_time=0.305 -[v016] 2022-01-31 09:23:35,092 (trainer:653) INFO: 193epoch:train:487-513batch: iter_time=0.184, forward_time=0.032, loss=0.812, loss_att=0.298, loss_ctc=1.326, acc=0.988, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.735e-05, train_time=0.278 -[v016] 2022-01-31 09:23:41,533 (trainer:653) INFO: 193epoch:train:514-540batch: iter_time=0.148, forward_time=0.031, loss=0.909, loss_att=0.463, loss_ctc=1.354, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.733e-05, train_time=0.238 -[v016] 2022-01-31 09:24:43,736 (trainer:328) INFO: 193epoch results: [train] iter_time=0.170, forward_time=0.037, loss=0.941, loss_att=0.407, loss_ctc=1.475, acc=0.980, backward_time=0.026, optim_step_time=0.022, optim0_lr0=9.745e-05, train_time=0.276, time=2 minutes and 31.09 seconds, total_count=105571, gpu_max_cached_mem_GB=5.824, [valid] loss=8.188, loss_att=6.675, loss_ctc=9.700, acc=0.904, cer=0.102, wer=0.406, cer_ctc=0.148, time=33 seconds, total_count=34354, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.75 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 09:24:45,854 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 09:24:45,867 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/190epoch.pth -[v016] 2022-01-31 09:24:45,867 (trainer:261) INFO: 194/200epoch started. Estimated time to finish: 12 minutes and 48.51 seconds -[v016] 2022-01-31 09:24:48,847 (trainer:653) INFO: 194epoch:train:1-27batch: iter_time=0.015, forward_time=0.032, loss=0.858, loss_att=0.386, loss_ctc=1.331, acc=0.977, backward_time=0.022, optim_step_time=0.021, optim0_lr0=9.732e-05, train_time=0.110 -[v016] 2022-01-31 09:24:51,852 (trainer:653) INFO: 194epoch:train:28-54batch: iter_time=0.019, forward_time=0.032, loss=1.072, loss_att=0.415, loss_ctc=1.729, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.731e-05, train_time=0.111 -[v016] 2022-01-31 09:24:54,761 (trainer:653) INFO: 194epoch:train:55-81batch: iter_time=0.014, forward_time=0.032, loss=1.212, loss_att=0.469, loss_ctc=1.955, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.729e-05, train_time=0.108 -[v016] 2022-01-31 09:24:58,510 (trainer:653) INFO: 194epoch:train:82-108batch: iter_time=0.046, forward_time=0.032, loss=1.129, loss_att=0.502, loss_ctc=1.757, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.728e-05, train_time=0.139 -[v016] 2022-01-31 09:25:01,752 (trainer:653) INFO: 194epoch:train:109-135batch: iter_time=0.028, forward_time=0.031, loss=0.853, loss_att=0.377, loss_ctc=1.330, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.727e-05, train_time=0.120 -[v016] 2022-01-31 09:25:04,239 (trainer:653) INFO: 194epoch:train:136-162batch: iter_time=8.472e-05, forward_time=0.032, loss=0.848, loss_att=0.371, loss_ctc=1.324, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.726e-05, train_time=0.092 -[v016] 2022-01-31 09:25:07,533 (trainer:653) INFO: 194epoch:train:163-189batch: iter_time=0.030, forward_time=0.031, loss=0.844, loss_att=0.329, loss_ctc=1.359, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.724e-05, train_time=0.122 -[v016] 2022-01-31 09:25:10,239 (trainer:653) INFO: 194epoch:train:190-216batch: iter_time=0.009, forward_time=0.031, loss=1.053, loss_att=0.458, loss_ctc=1.647, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.723e-05, train_time=0.100 -[v016] 2022-01-31 09:25:13,907 (trainer:653) INFO: 194epoch:train:217-243batch: iter_time=0.045, forward_time=0.031, loss=1.106, loss_att=0.565, loss_ctc=1.647, acc=0.971, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.722e-05, train_time=0.136 -[v016] 2022-01-31 09:25:16,409 (trainer:653) INFO: 194epoch:train:244-270batch: iter_time=4.682e-04, forward_time=0.031, loss=0.951, loss_att=0.331, loss_ctc=1.570, acc=0.985, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.721e-05, train_time=0.092 -[v016] 2022-01-31 09:25:19,045 (trainer:653) INFO: 194epoch:train:271-297batch: iter_time=0.004, forward_time=0.032, loss=0.817, loss_att=0.366, loss_ctc=1.267, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.719e-05, train_time=0.097 -[v016] 2022-01-31 09:25:23,528 (trainer:653) INFO: 194epoch:train:298-324batch: iter_time=0.073, forward_time=0.032, loss=0.801, loss_att=0.336, loss_ctc=1.265, acc=0.986, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.718e-05, train_time=0.166 -[v016] 2022-01-31 09:25:26,049 (trainer:653) INFO: 194epoch:train:325-351batch: iter_time=8.859e-04, forward_time=0.032, loss=0.971, loss_att=0.440, loss_ctc=1.502, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.717e-05, train_time=0.093 -[v016] 2022-01-31 09:25:28,584 (trainer:653) INFO: 194epoch:train:352-378batch: iter_time=0.001, forward_time=0.032, loss=0.851, loss_att=0.337, loss_ctc=1.364, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.716e-05, train_time=0.094 -[v016] 2022-01-31 09:25:31,632 (trainer:653) INFO: 194epoch:train:379-405batch: iter_time=0.019, forward_time=0.032, loss=0.893, loss_att=0.380, loss_ctc=1.405, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.715e-05, train_time=0.113 -[v016] 2022-01-31 09:25:34,166 (trainer:653) INFO: 194epoch:train:406-432batch: iter_time=7.823e-05, forward_time=0.032, loss=1.047, loss_att=0.471, loss_ctc=1.623, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.713e-05, train_time=0.094 -[v016] 2022-01-31 09:25:37,292 (trainer:653) INFO: 194epoch:train:433-459batch: iter_time=0.022, forward_time=0.032, loss=0.982, loss_att=0.410, loss_ctc=1.554, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.712e-05, train_time=0.116 -[v016] 2022-01-31 09:25:40,245 (trainer:653) INFO: 194epoch:train:460-486batch: iter_time=0.019, forward_time=0.031, loss=0.941, loss_att=0.450, loss_ctc=1.433, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.711e-05, train_time=0.109 -[v016] 2022-01-31 09:25:42,845 (trainer:653) INFO: 194epoch:train:487-513batch: iter_time=0.001, forward_time=0.032, loss=1.084, loss_att=0.408, loss_ctc=1.760, acc=0.982, backward_time=0.022, optim_step_time=0.021, optim0_lr0=9.710e-05, train_time=0.096 -[v016] 2022-01-31 09:25:45,650 (trainer:653) INFO: 194epoch:train:514-540batch: iter_time=0.010, forward_time=0.032, loss=0.872, loss_att=0.353, loss_ctc=1.391, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.708e-05, train_time=0.104 -[v016] 2022-01-31 09:26:19,934 (trainer:328) INFO: 194epoch results: [train] iter_time=0.018, forward_time=0.032, loss=0.957, loss_att=0.408, loss_ctc=1.506, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.720e-05, train_time=0.110, time=1 minute and 0.46 seconds, total_count=106118, gpu_max_cached_mem_GB=5.824, [valid] loss=8.227, loss_att=6.683, loss_ctc=9.770, acc=0.904, cer=0.102, wer=0.400, cer_ctc=0.144, time=6.17 seconds, total_count=34532, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.44 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 09:26:21,851 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 09:26:21,874 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/181epoch.pth -[v016] 2022-01-31 09:26:21,874 (trainer:261) INFO: 195/200epoch started. Estimated time to finish: 10 minutes and 58.24 seconds -[v016] 2022-01-31 09:26:25,951 (trainer:653) INFO: 195epoch:train:1-27batch: iter_time=0.056, forward_time=0.033, loss=0.787, loss_att=0.348, loss_ctc=1.226, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.707e-05, train_time=0.151 -[v016] 2022-01-31 09:26:28,411 (trainer:653) INFO: 195epoch:train:28-54batch: iter_time=8.263e-05, forward_time=0.032, loss=0.684, loss_att=0.307, loss_ctc=1.060, acc=0.987, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.706e-05, train_time=0.091 -[v016] 2022-01-31 09:26:30,856 (trainer:653) INFO: 195epoch:train:55-81batch: iter_time=7.545e-05, forward_time=0.032, loss=0.986, loss_att=0.429, loss_ctc=1.542, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.704e-05, train_time=0.090 -[v016] 2022-01-31 09:26:33,318 (trainer:653) INFO: 195epoch:train:82-108batch: iter_time=7.654e-05, forward_time=0.032, loss=0.816, loss_att=0.343, loss_ctc=1.290, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.703e-05, train_time=0.091 -[v016] 2022-01-31 09:26:35,828 (trainer:653) INFO: 195epoch:train:109-135batch: iter_time=7.731e-05, forward_time=0.032, loss=0.830, loss_att=0.364, loss_ctc=1.296, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.702e-05, train_time=0.093 -[v016] 2022-01-31 09:26:38,350 (trainer:653) INFO: 195epoch:train:136-162batch: iter_time=7.538e-05, forward_time=0.032, loss=1.017, loss_att=0.376, loss_ctc=1.658, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.701e-05, train_time=0.093 -[v016] 2022-01-31 09:26:40,894 (trainer:653) INFO: 195epoch:train:163-189batch: iter_time=8.111e-05, forward_time=0.033, loss=0.901, loss_att=0.326, loss_ctc=1.476, acc=0.985, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.699e-05, train_time=0.094 -[v016] 2022-01-31 09:26:43,684 (trainer:653) INFO: 195epoch:train:190-216batch: iter_time=0.010, forward_time=0.032, loss=1.074, loss_att=0.470, loss_ctc=1.678, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.698e-05, train_time=0.103 -[v016] 2022-01-31 09:26:46,181 (trainer:653) INFO: 195epoch:train:217-243batch: iter_time=7.661e-05, forward_time=0.032, loss=0.908, loss_att=0.352, loss_ctc=1.465, acc=0.985, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.697e-05, train_time=0.092 -[v016] 2022-01-31 09:26:48,614 (trainer:653) INFO: 195epoch:train:244-270batch: iter_time=7.600e-05, forward_time=0.031, loss=0.768, loss_att=0.287, loss_ctc=1.249, acc=0.989, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.696e-05, train_time=0.090 -[v016] 2022-01-31 09:26:51,267 (trainer:653) INFO: 195epoch:train:271-297batch: iter_time=0.005, forward_time=0.032, loss=0.937, loss_att=0.379, loss_ctc=1.495, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.694e-05, train_time=0.098 -[v016] 2022-01-31 09:26:53,717 (trainer:653) INFO: 195epoch:train:298-324batch: iter_time=7.538e-05, forward_time=0.032, loss=0.833, loss_att=0.403, loss_ctc=1.263, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.693e-05, train_time=0.091 -[v016] 2022-01-31 09:26:56,214 (trainer:653) INFO: 195epoch:train:325-351batch: iter_time=7.752e-05, forward_time=0.032, loss=0.947, loss_att=0.390, loss_ctc=1.504, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.692e-05, train_time=0.092 -[v016] 2022-01-31 09:27:01,275 (trainer:653) INFO: 195epoch:train:352-378batch: iter_time=0.015, forward_time=0.082, loss=0.955, loss_att=0.356, loss_ctc=1.554, acc=0.983, backward_time=0.022, optim_step_time=0.032, optim0_lr0=9.691e-05, train_time=0.187 -[v016] 2022-01-31 09:27:04,339 (trainer:653) INFO: 195epoch:train:379-405batch: iter_time=8.139e-05, forward_time=0.047, loss=0.807, loss_att=0.339, loss_ctc=1.275, acc=0.982, backward_time=0.029, optim_step_time=0.021, optim0_lr0=9.690e-05, train_time=0.113 -[v016] 2022-01-31 09:27:06,865 (trainer:653) INFO: 195epoch:train:406-432batch: iter_time=7.923e-05, forward_time=0.033, loss=0.911, loss_att=0.413, loss_ctc=1.409, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.688e-05, train_time=0.093 -[v016] 2022-01-31 09:27:09,928 (trainer:653) INFO: 195epoch:train:433-459batch: iter_time=0.021, forward_time=0.032, loss=0.931, loss_att=0.439, loss_ctc=1.424, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.687e-05, train_time=0.113 -[v016] 2022-01-31 09:27:12,441 (trainer:653) INFO: 195epoch:train:460-486batch: iter_time=9.832e-05, forward_time=0.032, loss=0.948, loss_att=0.351, loss_ctc=1.544, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.686e-05, train_time=0.093 -[v016] 2022-01-31 09:27:14,896 (trainer:653) INFO: 195epoch:train:487-513batch: iter_time=9.239e-05, forward_time=0.031, loss=0.786, loss_att=0.345, loss_ctc=1.228, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.685e-05, train_time=0.091 -[v016] 2022-01-31 09:27:17,330 (trainer:653) INFO: 195epoch:train:514-540batch: iter_time=7.753e-05, forward_time=0.031, loss=1.002, loss_att=0.465, loss_ctc=1.540, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.683e-05, train_time=0.090 -[v016] 2022-01-31 09:27:51,723 (trainer:328) INFO: 195epoch results: [train] iter_time=0.005, forward_time=0.035, loss=0.890, loss_att=0.373, loss_ctc=1.407, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.695e-05, train_time=0.102, time=56.19 seconds, total_count=106665, gpu_max_cached_mem_GB=5.824, [valid] loss=8.169, loss_att=6.680, loss_ctc=9.658, acc=0.904, cer=0.102, wer=0.407, cer_ctc=0.143, time=5.65 seconds, total_count=34710, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.01 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 09:27:53,736 (trainer:375) INFO: The best model has been updated: train.loss, train.acc -[v016] 2022-01-31 09:27:53,773 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/194epoch.pth -[v016] 2022-01-31 09:27:53,773 (trainer:261) INFO: 196/200epoch started. Estimated time to finish: 9 minutes and 8.03 seconds -[v016] 2022-01-31 09:27:56,456 (trainer:653) INFO: 196epoch:train:1-27batch: iter_time=0.003, forward_time=0.033, loss=0.971, loss_att=0.337, loss_ctc=1.604, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.682e-05, train_time=0.099 -[v016] 2022-01-31 09:27:58,960 (trainer:653) INFO: 196epoch:train:28-54batch: iter_time=8.424e-05, forward_time=0.032, loss=1.082, loss_att=0.507, loss_ctc=1.658, acc=0.975, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.681e-05, train_time=0.093 -[v016] 2022-01-31 09:28:01,686 (trainer:653) INFO: 196epoch:train:55-81batch: iter_time=0.005, forward_time=0.034, loss=0.911, loss_att=0.375, loss_ctc=1.448, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.679e-05, train_time=0.101 -[v016] 2022-01-31 09:28:04,165 (trainer:653) INFO: 196epoch:train:82-108batch: iter_time=8.323e-05, forward_time=0.033, loss=0.946, loss_att=0.436, loss_ctc=1.456, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.678e-05, train_time=0.092 -[v016] 2022-01-31 09:28:06,746 (trainer:653) INFO: 196epoch:train:109-135batch: iter_time=0.003, forward_time=0.033, loss=0.816, loss_att=0.334, loss_ctc=1.298, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.677e-05, train_time=0.095 -[v016] 2022-01-31 09:28:09,275 (trainer:653) INFO: 196epoch:train:136-162batch: iter_time=8.907e-05, forward_time=0.034, loss=0.921, loss_att=0.383, loss_ctc=1.458, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.676e-05, train_time=0.093 -[v016] 2022-01-31 09:28:11,864 (trainer:653) INFO: 196epoch:train:163-189batch: iter_time=8.689e-05, forward_time=0.034, loss=0.802, loss_att=0.291, loss_ctc=1.314, acc=0.986, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.675e-05, train_time=0.096 -[v016] 2022-01-31 09:28:14,394 (trainer:653) INFO: 196epoch:train:190-216batch: iter_time=8.664e-05, forward_time=0.033, loss=0.869, loss_att=0.377, loss_ctc=1.362, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.673e-05, train_time=0.093 -[v016] 2022-01-31 09:28:16,881 (trainer:653) INFO: 196epoch:train:217-243batch: iter_time=8.455e-05, forward_time=0.032, loss=0.853, loss_att=0.376, loss_ctc=1.330, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.672e-05, train_time=0.092 -[v016] 2022-01-31 09:28:19,365 (trainer:653) INFO: 196epoch:train:244-270batch: iter_time=8.412e-05, forward_time=0.032, loss=0.946, loss_att=0.405, loss_ctc=1.487, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.671e-05, train_time=0.092 -[v016] 2022-01-31 09:28:21,894 (trainer:653) INFO: 196epoch:train:271-297batch: iter_time=9.464e-04, forward_time=0.032, loss=0.928, loss_att=0.377, loss_ctc=1.479, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.670e-05, train_time=0.093 -[v016] 2022-01-31 09:28:24,472 (trainer:653) INFO: 196epoch:train:298-324batch: iter_time=8.663e-05, forward_time=0.033, loss=0.883, loss_att=0.392, loss_ctc=1.374, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.668e-05, train_time=0.095 -[v016] 2022-01-31 09:28:26,977 (trainer:653) INFO: 196epoch:train:325-351batch: iter_time=8.221e-05, forward_time=0.032, loss=1.061, loss_att=0.489, loss_ctc=1.634, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.667e-05, train_time=0.093 -[v016] 2022-01-31 09:28:29,406 (trainer:653) INFO: 196epoch:train:352-378batch: iter_time=8.004e-05, forward_time=0.031, loss=0.807, loss_att=0.366, loss_ctc=1.247, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.666e-05, train_time=0.090 -[v016] 2022-01-31 09:28:32,047 (trainer:653) INFO: 196epoch:train:379-405batch: iter_time=0.003, forward_time=0.033, loss=0.996, loss_att=0.433, loss_ctc=1.559, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.665e-05, train_time=0.098 -[v016] 2022-01-31 09:28:34,535 (trainer:653) INFO: 196epoch:train:406-432batch: iter_time=8.377e-05, forward_time=0.032, loss=0.994, loss_att=0.402, loss_ctc=1.586, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.664e-05, train_time=0.092 -[v016] 2022-01-31 09:28:37,386 (trainer:653) INFO: 196epoch:train:433-459batch: iter_time=0.013, forward_time=0.032, loss=1.155, loss_att=0.442, loss_ctc=1.868, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.662e-05, train_time=0.105 -[v016] 2022-01-31 09:28:39,816 (trainer:653) INFO: 196epoch:train:460-486batch: iter_time=7.730e-05, forward_time=0.031, loss=0.914, loss_att=0.394, loss_ctc=1.434, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.661e-05, train_time=0.090 -[v016] 2022-01-31 09:28:42,242 (trainer:653) INFO: 196epoch:train:487-513batch: iter_time=7.893e-05, forward_time=0.031, loss=0.996, loss_att=0.435, loss_ctc=1.557, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.660e-05, train_time=0.090 -[v016] 2022-01-31 09:28:44,693 (trainer:653) INFO: 196epoch:train:514-540batch: iter_time=7.647e-05, forward_time=0.031, loss=0.966, loss_att=0.408, loss_ctc=1.524, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.659e-05, train_time=0.091 -[v016] 2022-01-31 09:29:19,487 (trainer:328) INFO: 196epoch results: [train] iter_time=0.001, forward_time=0.032, loss=0.942, loss_att=0.400, loss_ctc=1.483, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.670e-05, train_time=0.094, time=51.6 seconds, total_count=107212, gpu_max_cached_mem_GB=5.824, [valid] loss=8.220, loss_att=6.705, loss_ctc=9.734, acc=0.903, cer=0.102, wer=0.401, cer_ctc=0.143, time=5.82 seconds, total_count=34888, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.29 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 09:29:21,486 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 09:29:21,508 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/188epoch.pth -[v016] 2022-01-31 09:29:21,508 (trainer:261) INFO: 197/200epoch started. Estimated time to finish: 7 minutes and 17.93 seconds -[v016] 2022-01-31 09:29:24,162 (trainer:653) INFO: 197epoch:train:1-27batch: iter_time=0.004, forward_time=0.032, loss=0.820, loss_att=0.369, loss_ctc=1.271, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.657e-05, train_time=0.098 -[v016] 2022-01-31 09:29:26,586 (trainer:653) INFO: 197epoch:train:28-54batch: iter_time=7.933e-05, forward_time=0.031, loss=0.841, loss_att=0.406, loss_ctc=1.276, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.656e-05, train_time=0.090 -[v016] 2022-01-31 09:29:29,071 (trainer:653) INFO: 197epoch:train:55-81batch: iter_time=7.780e-05, forward_time=0.032, loss=0.740, loss_att=0.320, loss_ctc=1.160, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.655e-05, train_time=0.092 -[v016] 2022-01-31 09:29:31,530 (trainer:653) INFO: 197epoch:train:82-108batch: iter_time=7.753e-05, forward_time=0.032, loss=0.929, loss_att=0.337, loss_ctc=1.522, acc=0.987, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.653e-05, train_time=0.091 -[v016] 2022-01-31 09:29:34,241 (trainer:653) INFO: 197epoch:train:109-135batch: iter_time=0.009, forward_time=0.032, loss=0.814, loss_att=0.364, loss_ctc=1.264, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.652e-05, train_time=0.100 -[v016] 2022-01-31 09:29:36,843 (trainer:653) INFO: 197epoch:train:136-162batch: iter_time=0.004, forward_time=0.032, loss=0.807, loss_att=0.350, loss_ctc=1.263, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.651e-05, train_time=0.096 -[v016] 2022-01-31 09:29:39,268 (trainer:653) INFO: 197epoch:train:163-189batch: iter_time=8.148e-05, forward_time=0.031, loss=0.809, loss_att=0.386, loss_ctc=1.232, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.650e-05, train_time=0.090 -[v016] 2022-01-31 09:29:41,797 (trainer:653) INFO: 197epoch:train:190-216batch: iter_time=7.925e-05, forward_time=0.032, loss=0.895, loss_att=0.365, loss_ctc=1.425, acc=0.985, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.649e-05, train_time=0.093 -[v016] 2022-01-31 09:29:44,320 (trainer:653) INFO: 197epoch:train:217-243batch: iter_time=7.748e-05, forward_time=0.032, loss=0.993, loss_att=0.403, loss_ctc=1.583, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.647e-05, train_time=0.093 -[v016] 2022-01-31 09:29:46,814 (trainer:653) INFO: 197epoch:train:244-270batch: iter_time=7.766e-05, forward_time=0.032, loss=1.029, loss_att=0.451, loss_ctc=1.607, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.646e-05, train_time=0.092 -[v016] 2022-01-31 09:29:49,321 (trainer:653) INFO: 197epoch:train:271-297batch: iter_time=7.762e-05, forward_time=0.032, loss=1.044, loss_att=0.442, loss_ctc=1.647, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.645e-05, train_time=0.093 -[v016] 2022-01-31 09:29:52,078 (trainer:653) INFO: 197epoch:train:298-324batch: iter_time=0.013, forward_time=0.031, loss=0.894, loss_att=0.394, loss_ctc=1.394, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.644e-05, train_time=0.102 -[v016] 2022-01-31 09:29:55,628 (trainer:653) INFO: 197epoch:train:325-351batch: iter_time=0.043, forward_time=0.031, loss=0.799, loss_att=0.411, loss_ctc=1.186, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.643e-05, train_time=0.131 -[v016] 2022-01-31 09:29:58,175 (trainer:653) INFO: 197epoch:train:352-378batch: iter_time=7.796e-05, forward_time=0.032, loss=0.829, loss_att=0.304, loss_ctc=1.355, acc=0.988, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.641e-05, train_time=0.094 -[v016] 2022-01-31 09:30:00,655 (trainer:653) INFO: 197epoch:train:379-405batch: iter_time=7.929e-05, forward_time=0.032, loss=1.001, loss_att=0.440, loss_ctc=1.562, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.640e-05, train_time=0.092 -[v016] 2022-01-31 09:30:03,127 (trainer:653) INFO: 197epoch:train:406-432batch: iter_time=7.704e-05, forward_time=0.032, loss=0.886, loss_att=0.381, loss_ctc=1.391, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.639e-05, train_time=0.091 -[v016] 2022-01-31 09:30:05,690 (trainer:653) INFO: 197epoch:train:433-459batch: iter_time=7.820e-05, forward_time=0.033, loss=0.977, loss_att=0.428, loss_ctc=1.526, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.638e-05, train_time=0.095 -[v016] 2022-01-31 09:30:08,122 (trainer:653) INFO: 197epoch:train:460-486batch: iter_time=8.346e-05, forward_time=0.031, loss=0.906, loss_att=0.410, loss_ctc=1.402, acc=0.976, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.637e-05, train_time=0.090 -[v016] 2022-01-31 09:30:10,677 (trainer:653) INFO: 197epoch:train:487-513batch: iter_time=8.526e-05, forward_time=0.033, loss=1.115, loss_att=0.493, loss_ctc=1.737, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.635e-05, train_time=0.094 -[v016] 2022-01-31 09:30:13,241 (trainer:653) INFO: 197epoch:train:514-540batch: iter_time=0.005, forward_time=0.031, loss=0.885, loss_att=0.413, loss_ctc=1.357, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.634e-05, train_time=0.095 -[v016] 2022-01-31 09:30:47,187 (trainer:328) INFO: 197epoch results: [train] iter_time=0.004, forward_time=0.032, loss=0.900, loss_att=0.393, loss_ctc=1.407, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.645e-05, train_time=0.096, time=52.48 seconds, total_count=107759, gpu_max_cached_mem_GB=5.824, [valid] loss=8.223, loss_att=6.717, loss_ctc=9.730, acc=0.903, cer=0.100, wer=0.408, cer_ctc=0.147, time=5.51 seconds, total_count=35066, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.69 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 09:30:49,182 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 09:30:49,234 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/182epoch.pth, exp/asr_train_asr_raw_en_word/196epoch.pth -[v016] 2022-01-31 09:30:49,234 (trainer:261) INFO: 198/200epoch started. Estimated time to finish: 5 minutes and 28.08 seconds -[v016] 2022-01-31 09:30:51,839 (trainer:653) INFO: 198epoch:train:1-27batch: iter_time=0.004, forward_time=0.032, loss=0.853, loss_att=0.366, loss_ctc=1.341, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.633e-05, train_time=0.096 -[v016] 2022-01-31 09:30:54,343 (trainer:653) INFO: 198epoch:train:28-54batch: iter_time=8.099e-05, forward_time=0.033, loss=1.050, loss_att=0.403, loss_ctc=1.697, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.631e-05, train_time=0.093 -[v016] 2022-01-31 09:30:56,873 (trainer:653) INFO: 198epoch:train:55-81batch: iter_time=7.713e-05, forward_time=0.033, loss=0.721, loss_att=0.246, loss_ctc=1.195, acc=0.986, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.630e-05, train_time=0.094 -[v016] 2022-01-31 09:30:59,445 (trainer:653) INFO: 198epoch:train:82-108batch: iter_time=9.639e-05, forward_time=0.034, loss=0.874, loss_att=0.394, loss_ctc=1.353, acc=0.983, backward_time=0.022, optim_step_time=0.021, optim0_lr0=9.629e-05, train_time=0.095 -[v016] 2022-01-31 09:31:01,967 (trainer:653) INFO: 198epoch:train:109-135batch: iter_time=9.343e-05, forward_time=0.033, loss=0.893, loss_att=0.379, loss_ctc=1.406, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.628e-05, train_time=0.093 -[v016] 2022-01-31 09:31:04,405 (trainer:653) INFO: 198epoch:train:136-162batch: iter_time=8.194e-05, forward_time=0.031, loss=0.656, loss_att=0.297, loss_ctc=1.016, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.627e-05, train_time=0.090 -[v016] 2022-01-31 09:31:07,106 (trainer:653) INFO: 198epoch:train:163-189batch: iter_time=0.007, forward_time=0.033, loss=0.855, loss_att=0.417, loss_ctc=1.293, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.625e-05, train_time=0.100 -[v016] 2022-01-31 09:31:09,663 (trainer:653) INFO: 198epoch:train:190-216batch: iter_time=9.527e-05, forward_time=0.033, loss=0.872, loss_att=0.332, loss_ctc=1.411, acc=0.985, backward_time=0.022, optim_step_time=0.021, optim0_lr0=9.624e-05, train_time=0.094 -[v016] 2022-01-31 09:31:12,163 (trainer:653) INFO: 198epoch:train:217-243batch: iter_time=8.875e-05, forward_time=0.033, loss=1.129, loss_att=0.460, loss_ctc=1.798, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.623e-05, train_time=0.092 -[v016] 2022-01-31 09:31:14,738 (trainer:653) INFO: 198epoch:train:244-270batch: iter_time=9.399e-05, forward_time=0.033, loss=0.913, loss_att=0.386, loss_ctc=1.440, acc=0.985, backward_time=0.022, optim_step_time=0.021, optim0_lr0=9.622e-05, train_time=0.095 -[v016] 2022-01-31 09:31:17,207 (trainer:653) INFO: 198epoch:train:271-297batch: iter_time=8.880e-05, forward_time=0.032, loss=0.873, loss_att=0.418, loss_ctc=1.328, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.621e-05, train_time=0.091 -[v016] 2022-01-31 09:31:19,834 (trainer:653) INFO: 198epoch:train:298-324batch: iter_time=9.472e-05, forward_time=0.033, loss=0.965, loss_att=0.378, loss_ctc=1.553, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.619e-05, train_time=0.097 -[v016] 2022-01-31 09:31:22,343 (trainer:653) INFO: 198epoch:train:325-351batch: iter_time=8.339e-05, forward_time=0.032, loss=0.965, loss_att=0.411, loss_ctc=1.520, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.618e-05, train_time=0.093 -[v016] 2022-01-31 09:31:24,815 (trainer:653) INFO: 198epoch:train:352-378batch: iter_time=8.207e-05, forward_time=0.031, loss=0.923, loss_att=0.389, loss_ctc=1.458, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.617e-05, train_time=0.091 -[v016] 2022-01-31 09:31:27,235 (trainer:653) INFO: 198epoch:train:379-405batch: iter_time=7.787e-05, forward_time=0.031, loss=0.949, loss_att=0.418, loss_ctc=1.480, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.616e-05, train_time=0.089 -[v016] 2022-01-31 09:31:29,697 (trainer:653) INFO: 198epoch:train:406-432batch: iter_time=7.605e-05, forward_time=0.031, loss=0.871, loss_att=0.375, loss_ctc=1.367, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.615e-05, train_time=0.091 -[v016] 2022-01-31 09:31:32,132 (trainer:653) INFO: 198epoch:train:433-459batch: iter_time=8.582e-05, forward_time=0.031, loss=0.866, loss_att=0.383, loss_ctc=1.348, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.613e-05, train_time=0.090 -[v016] 2022-01-31 09:31:34,626 (trainer:653) INFO: 198epoch:train:460-486batch: iter_time=7.854e-05, forward_time=0.032, loss=0.834, loss_att=0.372, loss_ctc=1.295, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.612e-05, train_time=0.092 -[v016] 2022-01-31 09:31:37,137 (trainer:653) INFO: 198epoch:train:487-513batch: iter_time=1.148e-04, forward_time=0.032, loss=0.937, loss_att=0.456, loss_ctc=1.418, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.611e-05, train_time=0.093 -[v016] 2022-01-31 09:31:39,615 (trainer:653) INFO: 198epoch:train:514-540batch: iter_time=7.897e-05, forward_time=0.032, loss=0.994, loss_att=0.397, loss_ctc=1.590, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.610e-05, train_time=0.092 -[v016] 2022-01-31 09:32:13,902 (trainer:328) INFO: 198epoch results: [train] iter_time=6.018e-04, forward_time=0.032, loss=0.901, loss_att=0.383, loss_ctc=1.419, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.621e-05, train_time=0.093, time=51.14 seconds, total_count=108306, gpu_max_cached_mem_GB=5.824, [valid] loss=8.114, loss_att=6.701, loss_ctc=9.527, acc=0.903, cer=0.102, wer=0.401, cer_ctc=0.144, time=5.94 seconds, total_count=35244, gpu_max_cached_mem_GB=5.824, [att_plot] time=27.58 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 09:32:16,063 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 09:32:16,081 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/187epoch.pth, exp/asr_train_asr_raw_en_word/193epoch.pth -[v016] 2022-01-31 09:32:16,082 (trainer:261) INFO: 199/200epoch started. Estimated time to finish: 3 minutes and 38.46 seconds -[v016] 2022-01-31 09:32:18,747 (trainer:653) INFO: 199epoch:train:1-27batch: iter_time=0.004, forward_time=0.033, loss=0.884, loss_att=0.357, loss_ctc=1.412, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.608e-05, train_time=0.098 -[v016] 2022-01-31 09:32:21,239 (trainer:653) INFO: 199epoch:train:28-54batch: iter_time=8.520e-05, forward_time=0.032, loss=0.796, loss_att=0.328, loss_ctc=1.264, acc=0.988, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.607e-05, train_time=0.092 -[v016] 2022-01-31 09:32:23,839 (trainer:653) INFO: 199epoch:train:55-81batch: iter_time=7.884e-05, forward_time=0.033, loss=0.929, loss_att=0.345, loss_ctc=1.513, acc=0.986, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.606e-05, train_time=0.096 -[v016] 2022-01-31 09:32:26,404 (trainer:653) INFO: 199epoch:train:82-108batch: iter_time=8.128e-05, forward_time=0.034, loss=0.957, loss_att=0.380, loss_ctc=1.534, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.605e-05, train_time=0.095 -[v016] 2022-01-31 09:32:29,262 (trainer:653) INFO: 199epoch:train:109-135batch: iter_time=0.011, forward_time=0.033, loss=0.903, loss_att=0.375, loss_ctc=1.432, acc=0.979, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.603e-05, train_time=0.106 -[v016] 2022-01-31 09:32:31,765 (trainer:653) INFO: 199epoch:train:136-162batch: iter_time=8.701e-05, forward_time=0.032, loss=0.926, loss_att=0.397, loss_ctc=1.456, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.602e-05, train_time=0.093 -[v016] 2022-01-31 09:32:34,244 (trainer:653) INFO: 199epoch:train:163-189batch: iter_time=8.479e-05, forward_time=0.032, loss=0.941, loss_att=0.354, loss_ctc=1.528, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.601e-05, train_time=0.092 -[v016] 2022-01-31 09:32:36,790 (trainer:653) INFO: 199epoch:train:190-216batch: iter_time=8.854e-05, forward_time=0.033, loss=0.767, loss_att=0.283, loss_ctc=1.252, acc=0.988, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.600e-05, train_time=0.094 -[v016] 2022-01-31 09:32:39,250 (trainer:653) INFO: 199epoch:train:217-243batch: iter_time=0.001, forward_time=0.031, loss=0.907, loss_att=0.398, loss_ctc=1.416, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.599e-05, train_time=0.091 -[v016] 2022-01-31 09:32:41,693 (trainer:653) INFO: 199epoch:train:244-270batch: iter_time=7.885e-05, forward_time=0.031, loss=0.835, loss_att=0.341, loss_ctc=1.329, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.597e-05, train_time=0.090 -[v016] 2022-01-31 09:32:44,124 (trainer:653) INFO: 199epoch:train:271-297batch: iter_time=8.000e-05, forward_time=0.031, loss=1.061, loss_att=0.423, loss_ctc=1.700, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.596e-05, train_time=0.090 -[v016] 2022-01-31 09:32:46,583 (trainer:653) INFO: 199epoch:train:298-324batch: iter_time=8.173e-05, forward_time=0.032, loss=0.999, loss_att=0.439, loss_ctc=1.559, acc=0.978, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.595e-05, train_time=0.091 -[v016] 2022-01-31 09:32:49,172 (trainer:653) INFO: 199epoch:train:325-351batch: iter_time=0.005, forward_time=0.031, loss=1.073, loss_att=0.480, loss_ctc=1.667, acc=0.974, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.594e-05, train_time=0.096 -[v016] 2022-01-31 09:32:51,682 (trainer:653) INFO: 199epoch:train:352-378batch: iter_time=8.532e-05, forward_time=0.032, loss=0.878, loss_att=0.398, loss_ctc=1.358, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.593e-05, train_time=0.093 -[v016] 2022-01-31 09:32:54,173 (trainer:653) INFO: 199epoch:train:379-405batch: iter_time=8.226e-05, forward_time=0.032, loss=0.903, loss_att=0.397, loss_ctc=1.410, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.592e-05, train_time=0.092 -[v016] 2022-01-31 09:32:56,646 (trainer:653) INFO: 199epoch:train:406-432batch: iter_time=7.947e-05, forward_time=0.031, loss=0.773, loss_att=0.312, loss_ctc=1.235, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.590e-05, train_time=0.091 -[v016] 2022-01-31 09:32:59,203 (trainer:653) INFO: 199epoch:train:433-459batch: iter_time=7.933e-05, forward_time=0.032, loss=1.009, loss_att=0.343, loss_ctc=1.674, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.589e-05, train_time=0.094 -[v016] 2022-01-31 09:33:01,675 (trainer:653) INFO: 199epoch:train:460-486batch: iter_time=7.938e-05, forward_time=0.032, loss=0.934, loss_att=0.387, loss_ctc=1.481, acc=0.983, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.588e-05, train_time=0.091 -[v016] 2022-01-31 09:33:04,114 (trainer:653) INFO: 199epoch:train:487-513batch: iter_time=7.931e-05, forward_time=0.032, loss=0.929, loss_att=0.371, loss_ctc=1.488, acc=0.980, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.587e-05, train_time=0.090 -[v016] 2022-01-31 09:33:06,698 (trainer:653) INFO: 199epoch:train:514-540batch: iter_time=0.003, forward_time=0.032, loss=1.156, loss_att=0.452, loss_ctc=1.859, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.586e-05, train_time=0.095 -[v016] 2022-01-31 09:33:42,494 (trainer:328) INFO: 199epoch results: [train] iter_time=0.001, forward_time=0.032, loss=0.928, loss_att=0.379, loss_ctc=1.478, acc=0.982, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.597e-05, train_time=0.093, time=51.33 seconds, total_count=108853, gpu_max_cached_mem_GB=5.824, [valid] loss=8.117, loss_att=6.745, loss_ctc=9.489, acc=0.907, cer=0.098, wer=0.398, cer_ctc=0.138, time=6.31 seconds, total_count=35422, gpu_max_cached_mem_GB=5.824, [att_plot] time=28.77 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 09:33:45,046 (trainer:373) INFO: There are no improvements in this epoch -[v016] 2022-01-31 09:33:45,061 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/157epoch.pth, exp/asr_train_asr_raw_en_word/191epoch.pth -[v016] 2022-01-31 09:33:45,061 (trainer:261) INFO: 200/200epoch started. Estimated time to finish: 1 minute and 49.12 seconds -[v016] 2022-01-31 09:33:47,766 (trainer:653) INFO: 200epoch:train:1-27batch: iter_time=0.004, forward_time=0.033, loss=0.716, loss_att=0.313, loss_ctc=1.119, acc=0.984, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.584e-05, train_time=0.100 -[v016] 2022-01-31 09:33:50,376 (trainer:653) INFO: 200epoch:train:28-54batch: iter_time=0.006, forward_time=0.031, loss=0.935, loss_att=0.422, loss_ctc=1.448, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.583e-05, train_time=0.096 -[v016] 2022-01-31 09:33:52,784 (trainer:653) INFO: 200epoch:train:55-81batch: iter_time=7.918e-05, forward_time=0.030, loss=0.861, loss_att=0.408, loss_ctc=1.315, acc=0.977, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.582e-05, train_time=0.089 -[v016] 2022-01-31 09:33:55,433 (trainer:653) INFO: 200epoch:train:82-108batch: iter_time=0.007, forward_time=0.031, loss=0.826, loss_att=0.326, loss_ctc=1.325, acc=0.981, backward_time=0.021, optim_step_time=0.021, optim0_lr0=9.581e-05, train_time=0.098 -[v016] 2022-01-31 09:33:58,139 (trainer:653) INFO: 200epoch:train:109-135batch: iter_time=0.002, forward_time=0.034, loss=0.802, loss_att=0.329, loss_ctc=1.276, acc=0.984, backward_time=0.023, optim_step_time=0.022, optim0_lr0=9.579e-05, train_time=0.100 -[v016] 2022-01-31 09:34:00,872 (trainer:653) INFO: 200epoch:train:136-162batch: iter_time=1.250e-04, forward_time=0.035, loss=0.842, loss_att=0.342, loss_ctc=1.341, acc=0.982, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.578e-05, train_time=0.101 -[v016] 2022-01-31 09:34:03,639 (trainer:653) INFO: 200epoch:train:163-189batch: iter_time=1.124e-04, forward_time=0.035, loss=0.861, loss_att=0.347, loss_ctc=1.376, acc=0.984, backward_time=0.024, optim_step_time=0.023, optim0_lr0=9.577e-05, train_time=0.102 -[v016] 2022-01-31 09:34:06,308 (trainer:653) INFO: 200epoch:train:190-216batch: iter_time=1.508e-04, forward_time=0.034, loss=0.983, loss_att=0.388, loss_ctc=1.579, acc=0.981, backward_time=0.023, optim_step_time=0.022, optim0_lr0=9.576e-05, train_time=0.099 -[v016] 2022-01-31 09:34:09,499 (trainer:653) INFO: 200epoch:train:217-243batch: iter_time=0.019, forward_time=0.034, loss=0.935, loss_att=0.403, loss_ctc=1.467, acc=0.980, backward_time=0.023, optim_step_time=0.023, optim0_lr0=9.575e-05, train_time=0.118 -[v016] 2022-01-31 09:34:12,309 (trainer:653) INFO: 200epoch:train:244-270batch: iter_time=0.005, forward_time=0.034, loss=0.858, loss_att=0.336, loss_ctc=1.381, acc=0.986, backward_time=0.023, optim_step_time=0.022, optim0_lr0=9.573e-05, train_time=0.104 -[v016] 2022-01-31 09:34:15,961 (trainer:653) INFO: 200epoch:train:271-297batch: iter_time=0.039, forward_time=0.033, loss=0.887, loss_att=0.375, loss_ctc=1.398, acc=0.982, backward_time=0.023, optim_step_time=0.022, optim0_lr0=9.572e-05, train_time=0.135 -[v016] 2022-01-31 09:34:20,018 (trainer:653) INFO: 200epoch:train:298-324batch: iter_time=0.017, forward_time=0.051, loss=0.937, loss_att=0.316, loss_ctc=1.559, acc=0.984, backward_time=0.033, optim_step_time=0.023, optim0_lr0=9.571e-05, train_time=0.150 -[v016] 2022-01-31 09:34:22,740 (trainer:653) INFO: 200epoch:train:325-351batch: iter_time=1.205e-04, forward_time=0.034, loss=0.881, loss_att=0.364, loss_ctc=1.398, acc=0.984, backward_time=0.023, optim_step_time=0.023, optim0_lr0=9.570e-05, train_time=0.101 -[v016] 2022-01-31 09:34:25,469 (trainer:653) INFO: 200epoch:train:352-378batch: iter_time=1.119e-04, forward_time=0.034, loss=0.916, loss_att=0.399, loss_ctc=1.433, acc=0.982, backward_time=0.023, optim_step_time=0.023, optim0_lr0=9.569e-05, train_time=0.101 -[v016] 2022-01-31 09:34:27,941 (trainer:653) INFO: 200epoch:train:379-405batch: iter_time=8.177e-05, forward_time=0.031, loss=0.858, loss_att=0.414, loss_ctc=1.301, acc=0.978, backward_time=0.022, optim_step_time=0.022, optim0_lr0=9.567e-05, train_time=0.091 -[v016] 2022-01-31 09:34:31,434 (trainer:653) INFO: 200epoch:train:406-432batch: iter_time=0.035, forward_time=0.032, loss=0.781, loss_att=0.300, loss_ctc=1.261, acc=0.986, backward_time=0.022, optim_step_time=0.021, optim0_lr0=9.566e-05, train_time=0.129 -[v016] 2022-01-31 09:34:34,045 (trainer:653) INFO: 200epoch:train:433-459batch: iter_time=9.182e-05, forward_time=0.034, loss=0.950, loss_att=0.390, loss_ctc=1.510, acc=0.982, backward_time=0.023, optim_step_time=0.022, optim0_lr0=9.565e-05, train_time=0.096 -[v016] 2022-01-31 09:34:36,765 (trainer:653) INFO: 200epoch:train:460-486batch: iter_time=1.153e-04, forward_time=0.035, loss=0.830, loss_att=0.402, loss_ctc=1.258, acc=0.978, backward_time=0.023, optim_step_time=0.023, optim0_lr0=9.564e-05, train_time=0.100 -[v016] 2022-01-31 09:34:40,698 (trainer:653) INFO: 200epoch:train:487-513batch: iter_time=0.003, forward_time=0.062, loss=1.044, loss_att=0.482, loss_ctc=1.606, acc=0.975, backward_time=0.035, optim_step_time=0.024, optim0_lr0=9.563e-05, train_time=0.145 -[v016] 2022-01-31 09:34:44,153 (trainer:653) INFO: 200epoch:train:514-540batch: iter_time=0.004, forward_time=0.059, loss=0.851, loss_att=0.408, loss_ctc=1.295, acc=0.983, backward_time=0.023, optim_step_time=0.023, optim0_lr0=9.562e-05, train_time=0.128 -[v016] 2022-01-31 09:35:24,097 (trainer:328) INFO: 200epoch results: [train] iter_time=0.007, forward_time=0.037, loss=0.876, loss_att=0.372, loss_ctc=1.380, acc=0.982, backward_time=0.024, optim_step_time=0.022, optim0_lr0=9.573e-05, train_time=0.109, time=59.9 seconds, total_count=109400, gpu_max_cached_mem_GB=5.824, [valid] loss=8.380, loss_att=6.880, loss_ctc=9.879, acc=0.902, cer=0.104, wer=0.408, cer_ctc=0.147, time=6.85 seconds, total_count=35600, gpu_max_cached_mem_GB=5.824, [att_plot] time=32.29 seconds, total_count=0, gpu_max_cached_mem_GB=5.824 -[v016] 2022-01-31 09:35:28,377 (trainer:375) INFO: The best model has been updated: train.loss -[v016] 2022-01-31 09:35:28,398 (trainer:413) INFO: The model files were removed: exp/asr_train_asr_raw_en_word/185epoch.pth -[v016] 2022-01-31 09:35:28,398 (trainer:431) INFO: The training was finished at 200 epochs -[v016] 2022-01-31 09:35:28,417 (average_nbest_models:64) INFO: Averaging 5best models: criterion="train.loss": exp/asr_train_asr_raw_en_word/train.loss.ave_5best.pth -[v016] 2022-01-31 09:35:31,585 (average_nbest_models:64) INFO: Averaging 5best models: criterion="valid.loss": exp/asr_train_asr_raw_en_word/valid.loss.ave_5best.pth -[v016] 2022-01-31 09:35:40,583 (average_nbest_models:64) INFO: Averaging 5best models: criterion="train.acc": exp/asr_train_asr_raw_en_word/train.acc.ave_5best.pth -[v016] 2022-01-31 09:35:41,104 (average_nbest_models:64) INFO: Averaging 5best models: criterion="valid.acc": exp/asr_train_asr_raw_en_word/valid.acc.ave_5best.pth -# Accounting: begin_time=1643620020 -# Accounting: end_time=1643639772 -# Accounting: time=19752 threads=1 -# Finished at Mon Jan 31 09:36:12 EST 2022 with status 0