JustPaste.it

Transformer 16 layers

epoch:        1 | nupdates:          402 | lr: 0.006700 | lrcriterion: 0.006700 | runtime: 00:07:41 | bch(ms): 1148.24 | smp(ms): 3.35 | fwd(ms): 433.08 | crit-fwd(ms): 22.23 | bwd(ms): 637.68 | optim(ms): 61.02 | loss:   79.62127 | train-TER: 184.04 | train-WER: 155.98 | lists/dev.lst-loss:   36.50141 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 761.38
epoch:        2 | nupdates:          804 | lr: 0.013400 | lrcriterion: 0.013400 | runtime: 00:07:32 | bch(ms): 1126.31 | smp(ms): 7.81 | fwd(ms): 421.71 | crit-fwd(ms): 21.37 | bwd(ms): 642.40 | optim(ms): 57.33 | loss:   34.09406 | train-TER: 100.00 | train-WER: 100.00 | lists/dev.lst-loss:   31.94590 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 776.20
epoch:        3 | nupdates:         1206 | lr: 0.020100 | lrcriterion: 0.020100 | runtime: 00:07:37 | bch(ms): 1137.09 | smp(ms): 6.89 | fwd(ms): 421.21 | crit-fwd(ms): 21.01 | bwd(ms): 653.89 | optim(ms): 57.32 | loss:   31.66174 | train-TER: 100.00 | train-WER: 100.00 | lists/dev.lst-loss:   30.70076 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 768.85
epoch:        4 | nupdates:         1608 | lr: 0.026800 | lrcriterion: 0.026800 | runtime: 00:07:36 | bch(ms): 1134.58 | smp(ms): 7.41 | fwd(ms): 422.17 | crit-fwd(ms): 21.11 | bwd(ms): 649.80 | optim(ms): 57.39 | loss:   30.66355 | train-TER: 100.00 | train-WER: 100.00 | lists/dev.lst-loss:   30.00350 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 770.55
epoch:        5 | nupdates:         2010 | lr: 0.033500 | lrcriterion: 0.033500 | runtime: 00:07:35 | bch(ms): 1134.09 | smp(ms): 6.93 | fwd(ms): 423.48 | crit-fwd(ms): 21.15 | bwd(ms): 648.60 | optim(ms): 57.42 | loss:   30.05698 | train-TER: 100.00 | train-WER: 100.00 | lists/dev.lst-loss:   29.69616 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 770.88
epoch:        6 | nupdates:         2412 | lr: 0.040200 | lrcriterion: 0.040200 | runtime: 00:07:35 | bch(ms): 1132.80 | smp(ms): 6.23 | fwd(ms): 421.72 | crit-fwd(ms): 20.82 | bwd(ms): 648.32 | optim(ms): 57.40 | loss:   29.64941 | train-TER: 99.99 | train-WER: 100.00 | lists/dev.lst-loss:   29.19304 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 771.76
epoch:        7 | nupdates:         2814 | lr: 0.046900 | lrcriterion: 0.046900 | runtime: 00:07:33 | bch(ms): 1127.89 | smp(ms): 6.59 | fwd(ms): 420.74 | crit-fwd(ms): 21.16 | bwd(ms): 644.62 | optim(ms): 57.47 | loss:   29.34847 | train-TER: 99.99 | train-WER: 100.00 | lists/dev.lst-loss:   29.54366 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 775.12
epoch:        8 | nupdates:         3216 | lr: 0.053600 | lrcriterion: 0.053600 | runtime: 00:07:35 | bch(ms): 1133.11 | smp(ms): 6.81 | fwd(ms): 421.49 | crit-fwd(ms): 21.36 | bwd(ms): 649.40 | optim(ms): 57.41 | loss:   29.17970 | train-TER: 99.99 | train-WER: 100.00 | lists/dev.lst-loss:   29.02254 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 771.55
epoch:        9 | nupdates:         3618 | lr: 0.060300 | lrcriterion: 0.060300 | runtime: 00:07:34 | bch(ms): 1131.26 | smp(ms): 8.04 | fwd(ms): 420.30 | crit-fwd(ms): 21.14 | bwd(ms): 648.43 | optim(ms): 57.41 | loss:   29.04865 | train-TER: 99.97 | train-WER: 99.99 | lists/dev.lst-loss:   28.78550 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 772.81
epoch:       10 | nupdates:         4020 | lr: 0.067000 | lrcriterion: 0.067000 | runtime: 00:07:32 | bch(ms): 1125.92 | smp(ms): 6.84 | fwd(ms): 419.38 | crit-fwd(ms): 21.22 | bwd(ms): 644.47 | optim(ms): 57.41 | loss:   28.90197 | train-TER: 99.99 | train-WER: 100.00 | lists/dev.lst-loss:   28.52354 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 776.48
epoch:       11 | nupdates:         4422 | lr: 0.073700 | lrcriterion: 0.073700 | runtime: 00:07:34 | bch(ms): 1131.37 | smp(ms): 7.69 | fwd(ms): 420.70 | crit-fwd(ms): 21.03 | bwd(ms): 648.66 | optim(ms): 57.35 | loss:   28.79002 | train-TER: 99.94 | train-WER: 100.00 | lists/dev.lst-loss:   28.63813 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 772.74
epoch:       12 | nupdates:         4824 | lr: 0.080400 | lrcriterion: 0.080400 | runtime: 00:07:35 | bch(ms): 1132.57 | smp(ms): 6.71 | fwd(ms): 421.69 | crit-fwd(ms): 21.23 | bwd(ms): 648.70 | optim(ms): 57.33 | loss:   28.71151 | train-TER: 99.75 | train-WER: 99.94 | lists/dev.lst-loss:   28.78160 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 771.92
epoch:       13 | nupdates:         5226 | lr: 0.087100 | lrcriterion: 0.087100 | runtime: 00:07:35 | bch(ms): 1132.22 | smp(ms): 7.09 | fwd(ms): 421.24 | crit-fwd(ms): 20.96 | bwd(ms): 648.54 | optim(ms): 57.30 | loss:   28.55661 | train-TER: 99.79 | train-WER: 100.00 | lists/dev.lst-loss:   28.21670 | lists/dev.lst-TER: 99.73 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 772.16
epoch:       14 | nupdates:         5628 | lr: 0.093800 | lrcriterion: 0.093800 | runtime: 00:07:40 | bch(ms): 1144.84 | smp(ms): 6.44 | fwd(ms): 422.38 | crit-fwd(ms): 21.09 | bwd(ms): 660.54 | optim(ms): 57.30 | loss:   28.44571 | train-TER: 99.75 | train-WER: 99.91 | lists/dev.lst-loss:   28.02138 | lists/dev.lst-TER: 99.35 | lists/dev.lst-WER: 99.87 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 763.64
epoch:       15 | nupdates:         6030 | lr: 0.100500 | lrcriterion: 0.100500 | runtime: 00:07:40 | bch(ms): 1145.86 | smp(ms): 8.44 | fwd(ms): 420.19 | crit-fwd(ms): 21.05 | bwd(ms): 663.58 | optim(ms): 57.29 | loss:   28.31598 | train-TER: 99.60 | train-WER: 99.82 | lists/dev.lst-loss:   28.49923 | lists/dev.lst-TER: 99.84 | lists/dev.lst-WER: 99.82 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 762.96
epoch:       16 | nupdates:         6432 | lr: 0.107200 | lrcriterion: 0.107200 | runtime: 00:07:40 | bch(ms): 1144.95 | smp(ms): 5.84 | fwd(ms): 422.15 | crit-fwd(ms): 20.92 | bwd(ms): 660.73 | optim(ms): 57.28 | loss:   28.13958 | train-TER: 99.46 | train-WER: 99.69 | lists/dev.lst-loss:   27.89934 | lists/dev.lst-TER: 97.08 | lists/dev.lst-WER: 98.78 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 763.57
epoch:       17 | nupdates:         6834 | lr: 0.113900 | lrcriterion: 0.113900 | runtime: 00:07:42 | bch(ms): 1151.12 | smp(ms): 7.27 | fwd(ms): 422.82 | crit-fwd(ms): 20.99 | bwd(ms): 666.03 | optim(ms): 57.25 | loss:   27.90646 | train-TER: 99.19 | train-WER: 99.50 | lists/dev.lst-loss:   27.97491 | lists/dev.lst-TER: 94.38 | lists/dev.lst-WER: 97.69 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 759.47
epoch:       18 | nupdates:         7236 | lr: 0.120600 | lrcriterion: 0.120600 | runtime: 00:07:41 | bch(ms): 1147.21 | smp(ms): 7.50 | fwd(ms): 422.58 | crit-fwd(ms): 20.92 | bwd(ms): 662.31 | optim(ms): 57.27 | loss:   27.66473 | train-TER: 99.54 | train-WER: 99.57 | lists/dev.lst-loss:   27.13344 | lists/dev.lst-TER: 96.15 | lists/dev.lst-WER: 97.84 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 762.07
epoch:       19 | nupdates:         7638 | lr: 0.127300 | lrcriterion: 0.127300 | runtime: 00:07:35 | bch(ms): 1132.63 | smp(ms): 6.93 | fwd(ms): 422.31 | crit-fwd(ms): 21.09 | bwd(ms): 647.89 | optim(ms): 57.26 | loss:   27.37545 | train-TER: 98.89 | train-WER: 98.97 | lists/dev.lst-loss:   26.81882 | lists/dev.lst-TER: 93.12 | lists/dev.lst-WER: 96.76 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 771.88
epoch:       20 | nupdates:         8040 | lr: 0.134000 | lrcriterion: 0.134000 | runtime: 00:07:39 | bch(ms): 1144.09 | smp(ms): 6.70 | fwd(ms): 421.11 | crit-fwd(ms): 20.88 | bwd(ms): 660.73 | optim(ms): 57.25 | loss:   27.08303 | train-TER: 97.37 | train-WER: 98.48 | lists/dev.lst-loss:   26.36108 | lists/dev.lst-TER: 96.25 | lists/dev.lst-WER: 97.52 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 764.14
epoch:       21 | nupdates:         8442 | lr: 0.140700 | lrcriterion: 0.140700 | runtime: 00:07:35 | bch(ms): 1133.09 | smp(ms): 6.55 | fwd(ms): 422.54 | crit-fwd(ms): 20.99 | bwd(ms): 648.53 | optim(ms): 57.25 | loss:   26.74288 | train-TER: 97.55 | train-WER: 98.28 | lists/dev.lst-loss:   25.92736 | lists/dev.lst-TER: 93.99 | lists/dev.lst-WER: 96.29 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 771.56
epoch:       22 | nupdates:         8844 | lr: 0.147400 | lrcriterion: 0.147400 | runtime: 00:07:39 | bch(ms): 1143.29 | smp(ms): 7.71 | fwd(ms): 420.74 | crit-fwd(ms): 20.98 | bwd(ms): 659.74 | optim(ms): 57.27 | loss:   26.44379 | train-TER: 96.80 | train-WER: 97.86 | lists/dev.lst-loss:   25.62425 | lists/dev.lst-TER: 90.80 | lists/dev.lst-WER: 95.16 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 764.68
epoch:       23 | nupdates:         9246 | lr: 0.154100 | lrcriterion: 0.154100 | runtime: 00:07:40 | bch(ms): 1144.41 | smp(ms): 6.14 | fwd(ms): 422.02 | crit-fwd(ms): 20.95 | bwd(ms): 660.24 | optim(ms): 57.26 | loss:   26.14073 | train-TER: 94.92 | train-WER: 97.05 | lists/dev.lst-loss:   25.54093 | lists/dev.lst-TER: 96.45 | lists/dev.lst-WER: 97.09 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 763.93
epoch:       24 | nupdates:         9648 | lr: 0.160800 | lrcriterion: 0.160800 | runtime: 00:07:36 | bch(ms): 1135.44 | smp(ms): 6.84 | fwd(ms): 421.56 | crit-fwd(ms): 20.99 | bwd(ms): 651.30 | optim(ms): 57.25 | loss:   25.76430 | train-TER: 95.55 | train-WER: 97.08 | lists/dev.lst-loss:   24.96298 | lists/dev.lst-TER: 85.65 | lists/dev.lst-WER: 92.35 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 769.96
epoch:       25 | nupdates:        10050 | lr: 0.167500 | lrcriterion: 0.167500 | runtime: 00:07:40 | bch(ms): 1145.72 | smp(ms): 7.84 | fwd(ms): 421.36 | crit-fwd(ms): 21.14 | bwd(ms): 661.91 | optim(ms): 57.24 | loss:   25.44469 | train-TER: 93.56 | train-WER: 96.13 | lists/dev.lst-loss:   24.83387 | lists/dev.lst-TER: 95.02 | lists/dev.lst-WER: 96.31 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 763.05
epoch:       26 | nupdates:        10452 | lr: 0.174200 | lrcriterion: 0.174200 | runtime: 00:07:36 | bch(ms): 1134.99 | smp(ms): 7.48 | fwd(ms): 422.21 | crit-fwd(ms): 21.05 | bwd(ms): 649.59 | optim(ms): 57.25 | loss:   25.11919 | train-TER: 92.50 | train-WER: 95.46 | lists/dev.lst-loss:   24.26034 | lists/dev.lst-TER: 91.94 | lists/dev.lst-WER: 94.44 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 770.27
epoch:       27 | nupdates:        10854 | lr: 0.180900 | lrcriterion: 0.180900 | runtime: 00:07:36 | bch(ms): 1136.29 | smp(ms): 4.03 | fwd(ms): 420.85 | crit-fwd(ms): 20.82 | bwd(ms): 652.13 | optim(ms): 57.25 | loss:   24.77388 | train-TER: 90.07 | train-WER: 94.50 | lists/dev.lst-loss:   23.71284 | lists/dev.lst-TER: 85.51 | lists/dev.lst-WER: 92.01 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 769.39
epoch:       28 | nupdates:        11256 | lr: 0.187600 | lrcriterion: 0.187600 | runtime: 00:07:41 | bch(ms): 1148.20 | smp(ms): 7.24 | fwd(ms): 424.22 | crit-fwd(ms): 21.29 | bwd(ms): 661.97 | optim(ms): 57.26 | loss:   24.41542 | train-TER: 89.43 | train-WER: 94.19 | lists/dev.lst-loss:   23.46172 | lists/dev.lst-TER: 83.32 | lists/dev.lst-WER: 92.65 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 761.41
epoch:       29 | nupdates:        11658 | lr: 0.194300 | lrcriterion: 0.194300 | runtime: 00:07:37 | bch(ms): 1139.27 | smp(ms): 7.38 | fwd(ms): 423.15 | crit-fwd(ms): 21.20 | bwd(ms): 654.07 | optim(ms): 57.24 | loss:   24.05792 | train-TER: 88.41 | train-WER: 93.59 | lists/dev.lst-loss:   23.07679 | lists/dev.lst-TER: 80.20 | lists/dev.lst-WER: 88.83 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 767.37
epoch:       30 | nupdates:        12060 | lr: 0.201000 | lrcriterion: 0.201000 | runtime: 00:07:40 | bch(ms): 1146.24 | smp(ms): 5.74 | fwd(ms): 422.23 | crit-fwd(ms): 20.94 | bwd(ms): 661.27 | optim(ms): 57.26 | loss:   23.72896 | train-TER: 87.26 | train-WER: 92.82 | lists/dev.lst-loss:   22.68104 | lists/dev.lst-TER: 79.57 | lists/dev.lst-WER: 89.73 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 762.71
epoch:       31 | nupdates:        12462 | lr: 0.207700 | lrcriterion: 0.207700 | runtime: 00:07:35 | bch(ms): 1134.16 | smp(ms): 7.41 | fwd(ms): 421.47 | crit-fwd(ms): 20.97 | bwd(ms): 650.63 | optim(ms): 57.25 | loss:   23.36377 | train-TER: 85.41 | train-WER: 92.92 | lists/dev.lst-loss:   22.25256 | lists/dev.lst-TER: 85.17 | lists/dev.lst-WER: 91.22 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 770.83
epoch:       32 | nupdates:        12864 | lr: 0.214400 | lrcriterion: 0.214400 | runtime: 00:07:34 | bch(ms): 1130.29 | smp(ms): 6.98 | fwd(ms): 419.55 | crit-fwd(ms): 20.89 | bwd(ms): 648.30 | optim(ms): 57.24 | loss:   23.05476 | train-TER: 83.63 | train-WER: 91.63 | lists/dev.lst-loss:   22.02975 | lists/dev.lst-TER: 77.81 | lists/dev.lst-WER: 88.27 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 773.47
epoch:       33 | nupdates:        13266 | lr: 0.221100 | lrcriterion: 0.221100 | runtime: 00:07:39 | bch(ms): 1143.79 | smp(ms): 7.93 | fwd(ms): 421.71 | crit-fwd(ms): 21.19 | bwd(ms): 659.89 | optim(ms): 57.28 | loss:   22.74303 | train-TER: 84.53 | train-WER: 91.64 | lists/dev.lst-loss:   21.54951 | lists/dev.lst-TER: 83.62 | lists/dev.lst-WER: 90.48 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 764.34
epoch:       34 | nupdates:        13668 | lr: 0.227800 | lrcriterion: 0.227800 | runtime: 00:07:34 | bch(ms): 1130.16 | smp(ms): 6.86 | fwd(ms): 422.02 | crit-fwd(ms): 20.98 | bwd(ms): 646.11 | optim(ms): 57.25 | loss:   22.44189 | train-TER: 84.06 | train-WER: 91.63 | lists/dev.lst-loss:   21.30642 | lists/dev.lst-TER: 83.39 | lists/dev.lst-WER: 90.38 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 773.56
epoch:       35 | nupdates:        14070 | lr: 0.234500 | lrcriterion: 0.234500 | runtime: 00:07:35 | bch(ms): 1133.66 | smp(ms): 6.15 | fwd(ms): 422.27 | crit-fwd(ms): 21.41 | bwd(ms): 649.64 | optim(ms): 57.24 | loss:   22.12480 | train-TER: 81.17 | train-WER: 90.52 | lists/dev.lst-loss:   21.02684 | lists/dev.lst-TER: 79.89 | lists/dev.lst-WER: 88.21 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 771.17
epoch:       36 | nupdates:        14472 | lr: 0.241200 | lrcriterion: 0.241200 | runtime: 00:07:41 | bch(ms): 1148.84 | smp(ms): 7.76 | fwd(ms): 422.67 | crit-fwd(ms): 21.23 | bwd(ms): 663.88 | optim(ms): 57.24 | loss:   21.81555 | train-TER: 82.22 | train-WER: 90.66 | lists/dev.lst-loss:   21.11835 | lists/dev.lst-TER: 87.32 | lists/dev.lst-WER: 91.67 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 760.98
epoch:       37 | nupdates:        14874 | lr: 0.247900 | lrcriterion: 0.247900 | runtime: 00:07:35 | bch(ms): 1133.09 | smp(ms): 6.44 | fwd(ms): 424.03 | crit-fwd(ms): 20.94 | bwd(ms): 647.02 | optim(ms): 57.27 | loss:   21.55370 | train-TER: 83.25 | train-WER: 90.94 | lists/dev.lst-loss:   20.36272 | lists/dev.lst-TER: 73.52 | lists/dev.lst-WER: 86.09 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 771.56
epoch:       38 | nupdates:        15276 | lr: 0.254600 | lrcriterion: 0.254600 | runtime: 00:07:40 | bch(ms): 1145.25 | smp(ms): 5.53 | fwd(ms): 422.56 | crit-fwd(ms): 21.01 | bwd(ms): 660.47 | optim(ms): 57.26 | loss:   21.29312 | train-TER: 77.29 | train-WER: 88.79 | lists/dev.lst-loss:   20.38654 | lists/dev.lst-TER: 80.81 | lists/dev.lst-WER: 89.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 763.37
epoch:       39 | nupdates:        15678 | lr: 0.261300 | lrcriterion: 0.261300 | runtime: 00:07:36 | bch(ms): 1136.41 | smp(ms): 5.52 | fwd(ms): 423.50 | crit-fwd(ms): 21.09 | bwd(ms): 650.86 | optim(ms): 57.24 | loss:   21.02385 | train-TER: 78.98 | train-WER: 89.40 | lists/dev.lst-loss:   19.79664 | lists/dev.lst-TER: 73.98 | lists/dev.lst-WER: 86.68 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 769.31
epoch:       40 | nupdates:        16080 | lr: 0.268000 | lrcriterion: 0.268000 | runtime: 00:07:35 | bch(ms): 1133.78 | smp(ms): 5.99 | fwd(ms): 422.21 | crit-fwd(ms): 21.01 | bwd(ms): 649.54 | optim(ms): 57.24 | loss:   20.73723 | train-TER: 78.32 | train-WER: 89.33 | lists/dev.lst-loss:   19.84775 | lists/dev.lst-TER: 80.65 | lists/dev.lst-WER: 88.40 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 771.09
epoch:       41 | nupdates:        16482 | lr: 0.274700 | lrcriterion: 0.274700 | runtime: 00:07:36 | bch(ms): 1135.47 | smp(ms): 7.55 | fwd(ms): 422.66 | crit-fwd(ms): 21.11 | bwd(ms): 650.73 | optim(ms): 57.25 | loss:   20.50850 | train-TER: 78.49 | train-WER: 88.83 | lists/dev.lst-loss:   19.27892 | lists/dev.lst-TER: 76.16 | lists/dev.lst-WER: 85.96 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 769.95
epoch:       42 | nupdates:        16884 | lr: 0.281400 | lrcriterion: 0.281400 | runtime: 00:07:40 | bch(ms): 1144.84 | smp(ms): 7.08 | fwd(ms): 422.66 | crit-fwd(ms): 21.39 | bwd(ms): 660.14 | optim(ms): 57.25 | loss:   20.24121 | train-TER: 73.76 | train-WER: 87.45 | lists/dev.lst-loss:   19.32172 | lists/dev.lst-TER: 77.82 | lists/dev.lst-WER: 86.85 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 763.64
epoch:       43 | nupdates:        17286 | lr: 0.288100 | lrcriterion: 0.288100 | runtime: 00:07:37 | bch(ms): 1137.63 | smp(ms): 6.74 | fwd(ms): 421.10 | crit-fwd(ms): 21.22 | bwd(ms): 654.51 | optim(ms): 57.29 | loss:   19.99094 | train-TER: 75.62 | train-WER: 87.67 | lists/dev.lst-loss:   18.68604 | lists/dev.lst-TER: 70.70 | lists/dev.lst-WER: 84.20 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 768.48
epoch:       44 | nupdates:        17688 | lr: 0.294800 | lrcriterion: 0.294800 | runtime: 00:07:41 | bch(ms): 1149.25 | smp(ms): 7.17 | fwd(ms): 423.18 | crit-fwd(ms): 21.00 | bwd(ms): 663.77 | optim(ms): 57.37 | loss:   19.70648 | train-TER: 73.36 | train-WER: 86.51 | lists/dev.lst-loss:   18.57847 | lists/dev.lst-TER: 75.76 | lists/dev.lst-WER: 85.68 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 760.71
epoch:       45 | nupdates:        18090 | lr: 0.301500 | lrcriterion: 0.301500 | runtime: 00:07:34 | bch(ms): 1131.64 | smp(ms): 6.11 | fwd(ms): 421.76 | crit-fwd(ms): 20.98 | bwd(ms): 647.01 | optim(ms): 57.36 | loss:   19.43742 | train-TER: 73.22 | train-WER: 86.27 | lists/dev.lst-loss:   18.34961 | lists/dev.lst-TER: 74.32 | lists/dev.lst-WER: 85.13 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 772.55
epoch:       46 | nupdates:        18492 | lr: 0.308200 | lrcriterion: 0.308200 | runtime: 00:07:33 | bch(ms): 1128.48 | smp(ms): 5.51 | fwd(ms): 419.93 | crit-fwd(ms): 20.83 | bwd(ms): 646.09 | optim(ms): 57.25 | loss:   19.05118 | train-TER: 74.11 | train-WER: 85.84 | lists/dev.lst-loss:   17.58894 | lists/dev.lst-TER: 64.14 | lists/dev.lst-WER: 80.34 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 774.71
epoch:       47 | nupdates:        18894 | lr: 0.314900 | lrcriterion: 0.314900 | runtime: 00:07:41 | bch(ms): 1146.95 | smp(ms): 7.46 | fwd(ms): 422.25 | crit-fwd(ms): 21.00 | bwd(ms): 662.48 | optim(ms): 57.24 | loss:   18.66011 | train-TER: 73.10 | train-WER: 85.56 | lists/dev.lst-loss:   17.66062 | lists/dev.lst-TER: 74.50 | lists/dev.lst-WER: 84.44 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 762.24
epoch:       48 | nupdates:        19296 | lr: 0.321600 | lrcriterion: 0.321600 | runtime: 00:07:34 | bch(ms): 1130.11 | smp(ms): 4.35 | fwd(ms): 420.30 | crit-fwd(ms): 21.03 | bwd(ms): 646.78 | optim(ms): 57.23 | loss:   18.27108 | train-TER: 71.31 | train-WER: 84.50 | lists/dev.lst-loss:   16.95911 | lists/dev.lst-TER: 60.44 | lists/dev.lst-WER: 79.16 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 773.60
epoch:       49 | nupdates:        19698 | lr: 0.328300 | lrcriterion: 0.328300 | runtime: 00:07:41 | bch(ms): 1147.74 | smp(ms): 7.97 | fwd(ms): 421.57 | crit-fwd(ms): 21.26 | bwd(ms): 663.84 | optim(ms): 57.24 | loss:   17.92903 | train-TER: 67.56 | train-WER: 82.58 | lists/dev.lst-loss:   16.82782 | lists/dev.lst-TER: 68.85 | lists/dev.lst-WER: 81.41 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 761.71
epoch:       50 | nupdates:        20100 | lr: 0.335000 | lrcriterion: 0.335000 | runtime: 00:07:35 | bch(ms): 1134.06 | smp(ms): 8.06 | fwd(ms): 422.51 | crit-fwd(ms): 21.11 | bwd(ms): 649.76 | optim(ms): 57.25 | loss:   17.54452 | train-TER: 66.47 | train-WER: 81.19 | lists/dev.lst-loss:   16.13805 | lists/dev.lst-TER: 61.37 | lists/dev.lst-WER: 76.87 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 770.90
epoch:       51 | nupdates:        20502 | lr: 0.341700 | lrcriterion: 0.341700 | runtime: 00:07:40 | bch(ms): 1145.50 | smp(ms): 6.64 | fwd(ms): 423.10 | crit-fwd(ms): 21.18 | bwd(ms): 660.40 | optim(ms): 57.25 | loss:   17.13757 | train-TER: 67.73 | train-WER: 81.21 | lists/dev.lst-loss:   15.61902 | lists/dev.lst-TER: 59.84 | lists/dev.lst-WER: 75.38 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 763.20
epoch:       52 | nupdates:        20904 | lr: 0.348400 | lrcriterion: 0.348400 | runtime: 00:07:39 | bch(ms): 1143.70 | smp(ms): 6.74 | fwd(ms): 421.51 | crit-fwd(ms): 21.00 | bwd(ms): 660.00 | optim(ms): 57.26 | loss:   16.81060 | train-TER: 63.35 | train-WER: 79.55 | lists/dev.lst-loss:   15.24510 | lists/dev.lst-TER: 62.60 | lists/dev.lst-WER: 76.81 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 764.40
epoch:       53 | nupdates:        21306 | lr: 0.355100 | lrcriterion: 0.355100 | runtime: 00:07:36 | bch(ms): 1134.64 | smp(ms): 6.45 | fwd(ms): 422.00 | crit-fwd(ms): 21.01 | bwd(ms): 650.10 | optim(ms): 57.24 | loss:   16.43567 | train-TER: 59.04 | train-WER: 77.53 | lists/dev.lst-loss:   14.91175 | lists/dev.lst-TER: 56.93 | lists/dev.lst-WER: 73.56 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 770.51
epoch:       54 | nupdates:        21708 | lr: 0.361800 | lrcriterion: 0.361800 | runtime: 00:07:40 | bch(ms): 1145.43 | smp(ms): 3.26 | fwd(ms): 421.35 | crit-fwd(ms): 20.96 | bwd(ms): 660.83 | optim(ms): 57.19 | loss:   16.11873 | train-TER: 60.63 | train-WER: 77.64 | lists/dev.lst-loss:   14.38565 | lists/dev.lst-TER: 52.80 | lists/dev.lst-WER: 70.24 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 763.25
epoch:       55 | nupdates:        22110 | lr: 0.368500 | lrcriterion: 0.368500 | runtime: 00:07:41 | bch(ms): 1148.49 | smp(ms): 8.92 | fwd(ms): 422.61 | crit-fwd(ms): 21.27 | bwd(ms): 663.87 | optim(ms): 57.20 | loss:   15.75892 | train-TER: 60.39 | train-WER: 77.63 | lists/dev.lst-loss:   14.29904 | lists/dev.lst-TER: 48.81 | lists/dev.lst-WER: 68.70 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 761.21
epoch:       56 | nupdates:        22512 | lr: 0.375200 | lrcriterion: 0.375200 | runtime: 00:07:39 | bch(ms): 1141.89 | smp(ms): 6.19 | fwd(ms): 422.49 | crit-fwd(ms): 20.97 | bwd(ms): 657.11 | optim(ms): 57.23 | loss:   15.45886 | train-TER: 60.37 | train-WER: 77.06 | lists/dev.lst-loss:   13.65482 | lists/dev.lst-TER: 47.63 | lists/dev.lst-WER: 67.54 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 765.61
epoch:       57 | nupdates:        22914 | lr: 0.381900 | lrcriterion: 0.381900 | runtime: 00:07:40 | bch(ms): 1145.51 | smp(ms): 7.15 | fwd(ms): 421.78 | crit-fwd(ms): 21.01 | bwd(ms): 661.45 | optim(ms): 57.22 | loss:   15.17435 | train-TER: 59.77 | train-WER: 76.54 | lists/dev.lst-loss:   13.44365 | lists/dev.lst-TER: 44.45 | lists/dev.lst-WER: 65.13 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 122 | hrs:   97.62 | thrpt(sec/sec): 763.20
epoch:       58 | nupdates:        23316 | lr: 0.388600 | lrcriterion: 0.388600 | runtime: 00:07:40 | bch(ms): 1145.86 | smp(ms): 6.04 | fwd(ms): 421.68 | crit-fwd(ms): 21.06 | bwd(ms): 662.17 | optim(ms): 57.19 | loss:   14.84819 | train-TER: 60.43 | train-WER: 76.06 | lists/dev.lst-loss:   13.51374 | lists/dev.lst-TER: 49.12 | lists/dev.lst-WER: 67.48 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 762.96
epoch:       59 | nupdates:        23718 | lr: 0.395300 | lrcriterion: 0.395300 | runtime: 00:07:36 | bch(ms): 1134.66 | smp(ms): 8.54 | fwd(ms): 422.14 | crit-fwd(ms): 21.04 | bwd(ms): 650.54 | optim(ms): 57.20 | loss:   14.56374 | train-TER: 54.85 | train-WER: 73.34 | lists/dev.lst-loss:   13.13301 | lists/dev.lst-TER: 48.60 | lists/dev.lst-WER: 66.28 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 770.49
epoch:       60 | nupdates:        24120 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:33 | bch(ms): 1129.16 | smp(ms): 6.76 | fwd(ms): 421.10 | crit-fwd(ms): 21.06 | bwd(ms): 645.35 | optim(ms): 57.22 | loss:   16.87386 | train-TER: 67.22 | train-WER: 81.42 | lists/dev.lst-loss:   13.63964 | lists/dev.lst-TER: 42.41 | lists/dev.lst-WER: 65.45 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 774.25
epoch:       61 | nupdates:        24522 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:32 | bch(ms): 1125.10 | smp(ms): 8.86 | fwd(ms): 418.07 | crit-fwd(ms): 21.04 | bwd(ms): 645.10 | optim(ms): 57.23 | loss:   21.45547 | train-TER: 77.48 | train-WER: 90.32 | lists/dev.lst-loss:   13.55002 | lists/dev.lst-TER: 47.99 | lists/dev.lst-WER: 67.93 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 777.04
epoch:       62 | nupdates:        24924 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.91 | smp(ms): 5.11 | fwd(ms): 418.81 | crit-fwd(ms): 21.12 | bwd(ms): 639.95 | optim(ms): 57.26 | loss:   20.71633 | train-TER: 76.02 | train-WER: 88.70 | lists/dev.lst-loss:   13.30020 | lists/dev.lst-TER: 46.06 | lists/dev.lst-WER: 65.99 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 779.94
epoch:       63 | nupdates:        25326 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:29 | bch(ms): 1119.37 | smp(ms): 5.89 | fwd(ms): 418.99 | crit-fwd(ms): 20.97 | bwd(ms): 637.86 | optim(ms): 57.25 | loss:   20.17442 | train-TER: 69.40 | train-WER: 84.32 | lists/dev.lst-loss:   13.28457 | lists/dev.lst-TER: 44.68 | lists/dev.lst-WER: 66.18 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.02
epoch:       64 | nupdates:        25728 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:29 | bch(ms): 1119.02 | smp(ms): 6.42 | fwd(ms): 419.43 | crit-fwd(ms): 21.06 | bwd(ms): 637.73 | optim(ms): 57.26 | loss:   20.08063 | train-TER: 75.05 | train-WER: 88.59 | lists/dev.lst-loss:   13.02198 | lists/dev.lst-TER: 46.80 | lists/dev.lst-WER: 65.84 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 781.26
epoch:       65 | nupdates:        26130 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1119.49 | smp(ms): 6.99 | fwd(ms): 418.26 | crit-fwd(ms): 21.55 | bwd(ms): 639.27 | optim(ms): 57.25 | loss:   19.58498 | train-TER: 68.09 | train-WER: 83.71 | lists/dev.lst-loss:   12.71989 | lists/dev.lst-TER: 44.05 | lists/dev.lst-WER: 64.32 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.93
epoch:       66 | nupdates:        26532 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1133.26 | smp(ms): 6.72 | fwd(ms): 418.77 | crit-fwd(ms): 20.96 | bwd(ms): 651.84 | optim(ms): 57.24 | loss:   19.72613 | train-TER: 72.76 | train-WER: 88.07 | lists/dev.lst-loss:   12.66421 | lists/dev.lst-TER: 43.31 | lists/dev.lst-WER: 63.68 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 771.45
epoch:       67 | nupdates:        26934 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1130.62 | smp(ms): 7.50 | fwd(ms): 416.98 | crit-fwd(ms): 21.20 | bwd(ms): 651.13 | optim(ms): 57.25 | loss:   19.40530 | train-TER: 75.97 | train-WER: 88.02 | lists/dev.lst-loss:   12.70186 | lists/dev.lst-TER: 48.45 | lists/dev.lst-WER: 66.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 773.25
epoch:       68 | nupdates:        27336 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1123.95 | smp(ms): 7.58 | fwd(ms): 418.23 | crit-fwd(ms): 21.26 | bwd(ms): 643.42 | optim(ms): 57.26 | loss:   19.21337 | train-TER: 73.86 | train-WER: 86.98 | lists/dev.lst-loss:   12.63130 | lists/dev.lst-TER: 46.08 | lists/dev.lst-WER: 66.07 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 777.84
epoch:       69 | nupdates:        27738 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:32 | bch(ms): 1125.62 | smp(ms): 7.27 | fwd(ms): 418.83 | crit-fwd(ms): 21.04 | bwd(ms): 644.53 | optim(ms): 57.20 | loss:   18.99999 | train-TER: 60.46 | train-WER: 79.11 | lists/dev.lst-loss:   12.46292 | lists/dev.lst-TER: 41.57 | lists/dev.lst-WER: 61.95 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 776.68
epoch:       70 | nupdates:        28140 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:37 | bch(ms): 1137.23 | smp(ms): 6.42 | fwd(ms): 419.49 | crit-fwd(ms): 21.29 | bwd(ms): 655.77 | optim(ms): 57.23 | loss:   18.98772 | train-TER: 76.27 | train-WER: 87.71 | lists/dev.lst-loss:   12.18081 | lists/dev.lst-TER: 45.37 | lists/dev.lst-WER: 64.05 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 768.75
epoch:       71 | nupdates:        28542 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1123.40 | smp(ms): 7.20 | fwd(ms): 417.76 | crit-fwd(ms): 21.23 | bwd(ms): 643.34 | optim(ms): 57.24 | loss:   18.84176 | train-TER: 73.31 | train-WER: 86.87 | lists/dev.lst-loss:   12.14791 | lists/dev.lst-TER: 45.42 | lists/dev.lst-WER: 63.44 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 778.22
epoch:       72 | nupdates:        28944 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1124.11 | smp(ms): 6.66 | fwd(ms): 418.96 | crit-fwd(ms): 21.20 | bwd(ms): 643.23 | optim(ms): 57.24 | loss:   18.80567 | train-TER: 73.30 | train-WER: 86.68 | lists/dev.lst-loss:   12.02671 | lists/dev.lst-TER: 42.09 | lists/dev.lst-WER: 61.90 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 777.72
epoch:       73 | nupdates:        29346 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1131.13 | smp(ms): 7.75 | fwd(ms): 418.28 | crit-fwd(ms): 21.02 | bwd(ms): 650.23 | optim(ms): 57.27 | loss:   18.77794 | train-TER: 72.03 | train-WER: 86.25 | lists/dev.lst-loss:   12.01790 | lists/dev.lst-TER: 40.61 | lists/dev.lst-WER: 61.44 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 772.90
epoch:       74 | nupdates:        29748 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1134.32 | smp(ms): 7.54 | fwd(ms): 418.35 | crit-fwd(ms): 21.14 | bwd(ms): 653.94 | optim(ms): 57.23 | loss:   18.32982 | train-TER: 62.36 | train-WER: 78.98 | lists/dev.lst-loss:   11.77249 | lists/dev.lst-TER: 40.03 | lists/dev.lst-WER: 60.40 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 770.72
epoch:       75 | nupdates:        30150 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1132.74 | smp(ms): 7.07 | fwd(ms): 417.21 | crit-fwd(ms): 21.14 | bwd(ms): 653.29 | optim(ms): 57.25 | loss:   18.10331 | train-TER: 67.54 | train-WER: 83.25 | lists/dev.lst-loss:   11.88006 | lists/dev.lst-TER: 44.97 | lists/dev.lst-WER: 63.48 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 771.80
epoch:       76 | nupdates:        30552 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1123.24 | smp(ms): 7.33 | fwd(ms): 418.31 | crit-fwd(ms): 21.06 | bwd(ms): 642.41 | optim(ms): 57.23 | loss:   18.19987 | train-TER: 66.21 | train-WER: 81.83 | lists/dev.lst-loss:   11.64802 | lists/dev.lst-TER: 38.08 | lists/dev.lst-WER: 59.33 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 778.33
epoch:       77 | nupdates:        30954 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1134.16 | smp(ms): 6.83 | fwd(ms): 418.81 | crit-fwd(ms): 21.14 | bwd(ms): 652.94 | optim(ms): 57.22 | loss:   17.87337 | train-TER: 65.52 | train-WER: 81.45 | lists/dev.lst-loss:   11.49395 | lists/dev.lst-TER: 43.04 | lists/dev.lst-WER: 61.59 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 770.83
epoch:       78 | nupdates:        31356 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.47 | smp(ms): 7.16 | fwd(ms): 418.49 | crit-fwd(ms): 20.92 | bwd(ms): 641.50 | optim(ms): 57.23 | loss:   17.93354 | train-TER: 66.74 | train-WER: 82.42 | lists/dev.lst-loss:   11.53457 | lists/dev.lst-TER: 44.62 | lists/dev.lst-WER: 62.73 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 778.86
epoch:       79 | nupdates:        31758 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1121.90 | smp(ms): 7.80 | fwd(ms): 418.90 | crit-fwd(ms): 21.27 | bwd(ms): 640.79 | optim(ms): 57.24 | loss:   17.75793 | train-TER: 61.36 | train-WER: 79.35 | lists/dev.lst-loss:   11.33377 | lists/dev.lst-TER: 40.68 | lists/dev.lst-WER: 59.84 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 779.26
epoch:       80 | nupdates:        32160 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.48 | smp(ms): 7.78 | fwd(ms): 418.51 | crit-fwd(ms): 21.31 | bwd(ms): 641.91 | optim(ms): 57.22 | loss:   17.75346 | train-TER: 63.90 | train-WER: 81.03 | lists/dev.lst-loss:   11.22176 | lists/dev.lst-TER: 40.38 | lists/dev.lst-WER: 59.44 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 778.86
epoch:       81 | nupdates:        32562 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1123.61 | smp(ms): 7.85 | fwd(ms): 418.22 | crit-fwd(ms): 21.18 | bwd(ms): 643.19 | optim(ms): 57.22 | loss:   17.48617 | train-TER: 69.01 | train-WER: 83.84 | lists/dev.lst-loss:   11.07498 | lists/dev.lst-TER: 35.81 | lists/dev.lst-WER: 56.74 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 778.07
epoch:       82 | nupdates:        32964 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:37 | bch(ms): 1137.38 | smp(ms): 7.23 | fwd(ms): 418.50 | crit-fwd(ms): 21.13 | bwd(ms): 656.16 | optim(ms): 57.23 | loss:   17.39745 | train-TER: 63.26 | train-WER: 79.87 | lists/dev.lst-loss:   10.84792 | lists/dev.lst-TER: 36.81 | lists/dev.lst-WER: 56.35 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 768.65
epoch:       83 | nupdates:        33366 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:36 | bch(ms): 1134.75 | smp(ms): 7.89 | fwd(ms): 417.85 | crit-fwd(ms): 21.14 | bwd(ms): 654.77 | optim(ms): 57.23 | loss:   17.28212 | train-TER: 65.13 | train-WER: 81.28 | lists/dev.lst-loss:   11.26261 | lists/dev.lst-TER: 42.08 | lists/dev.lst-WER: 60.51 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 770.43
epoch:       84 | nupdates:        33768 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.63 | smp(ms): 7.56 | fwd(ms): 418.39 | crit-fwd(ms): 21.14 | bwd(ms): 640.19 | optim(ms): 57.25 | loss:   17.15141 | train-TER: 64.19 | train-WER: 81.78 | lists/dev.lst-loss:   10.67227 | lists/dev.lst-TER: 35.93 | lists/dev.lst-WER: 56.14 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.14
epoch:       85 | nupdates:        34170 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1130.12 | smp(ms): 5.89 | fwd(ms): 418.70 | crit-fwd(ms): 20.91 | bwd(ms): 649.21 | optim(ms): 57.25 | loss:   17.23015 | train-TER: 59.35 | train-WER: 77.02 | lists/dev.lst-loss:   10.85940 | lists/dev.lst-TER: 40.46 | lists/dev.lst-WER: 58.30 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 773.59
epoch:       86 | nupdates:        34572 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1119.93 | smp(ms): 6.37 | fwd(ms): 419.06 | crit-fwd(ms): 21.07 | bwd(ms): 638.80 | optim(ms): 57.24 | loss:   16.96564 | train-TER: 59.62 | train-WER: 77.21 | lists/dev.lst-loss:   10.54389 | lists/dev.lst-TER: 33.87 | lists/dev.lst-WER: 54.50 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.63
epoch:       87 | nupdates:        34974 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:36 | bch(ms): 1136.42 | smp(ms): 6.93 | fwd(ms): 419.02 | crit-fwd(ms): 21.06 | bwd(ms): 655.43 | optim(ms): 57.21 | loss:   16.96073 | train-TER: 68.13 | train-WER: 84.00 | lists/dev.lst-loss:   10.39644 | lists/dev.lst-TER: 33.70 | lists/dev.lst-WER: 54.05 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 769.30
epoch:       88 | nupdates:        35376 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1129.80 | smp(ms): 6.66 | fwd(ms): 417.09 | crit-fwd(ms): 21.29 | bwd(ms): 650.51 | optim(ms): 57.28 | loss:   16.97702 | train-TER: 61.65 | train-WER: 78.93 | lists/dev.lst-loss:   10.37635 | lists/dev.lst-TER: 34.83 | lists/dev.lst-WER: 54.44 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 773.81
epoch:       89 | nupdates:        35778 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.01 | smp(ms): 6.28 | fwd(ms): 419.88 | crit-fwd(ms): 21.10 | bwd(ms): 639.82 | optim(ms): 57.26 | loss:   16.70030 | train-TER: 61.79 | train-WER: 79.76 | lists/dev.lst-loss:   10.30520 | lists/dev.lst-TER: 35.69 | lists/dev.lst-WER: 54.87 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 779.18
epoch:       90 | nupdates:        36180 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1119.76 | smp(ms): 7.48 | fwd(ms): 417.94 | crit-fwd(ms): 20.95 | bwd(ms): 639.86 | optim(ms): 57.25 | loss:   16.57162 | train-TER: 64.12 | train-WER: 80.89 | lists/dev.lst-loss:   10.44773 | lists/dev.lst-TER: 37.63 | lists/dev.lst-WER: 56.15 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.74
epoch:       91 | nupdates:        36582 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1121.21 | smp(ms): 5.99 | fwd(ms): 417.96 | crit-fwd(ms): 21.07 | bwd(ms): 641.30 | optim(ms): 57.23 | loss:   16.66347 | train-TER: 72.31 | train-WER: 86.37 | lists/dev.lst-loss:   10.27144 | lists/dev.lst-TER: 36.66 | lists/dev.lst-WER: 55.65 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 779.73
epoch:       92 | nupdates:        36984 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.99 | smp(ms): 7.79 | fwd(ms): 416.70 | crit-fwd(ms): 21.11 | bwd(ms): 644.19 | optim(ms): 57.24 | loss:   16.51025 | train-TER: 62.98 | train-WER: 80.44 | lists/dev.lst-loss:   10.24336 | lists/dev.lst-TER: 37.91 | lists/dev.lst-WER: 55.91 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 778.50
epoch:       93 | nupdates:        37386 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1119.46 | smp(ms): 7.91 | fwd(ms): 418.74 | crit-fwd(ms): 21.16 | bwd(ms): 638.47 | optim(ms): 57.23 | loss:   16.45285 | train-TER: 58.88 | train-WER: 76.47 | lists/dev.lst-loss:   10.05003 | lists/dev.lst-TER: 36.03 | lists/dev.lst-WER: 54.24 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.96
epoch:       94 | nupdates:        37788 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1123.92 | smp(ms): 7.03 | fwd(ms): 419.59 | crit-fwd(ms): 21.21 | bwd(ms): 642.18 | optim(ms): 57.23 | loss:   16.21421 | train-TER: 55.38 | train-WER: 74.05 | lists/dev.lst-loss:   10.35817 | lists/dev.lst-TER: 39.70 | lists/dev.lst-WER: 57.53 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 777.86
epoch:       95 | nupdates:        38190 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:29 | bch(ms): 1118.96 | smp(ms): 6.40 | fwd(ms): 418.07 | crit-fwd(ms): 21.08 | bwd(ms): 638.74 | optim(ms): 57.26 | loss:   16.16825 | train-TER: 60.08 | train-WER: 78.45 | lists/dev.lst-loss:    9.88431 | lists/dev.lst-TER: 32.12 | lists/dev.lst-WER: 51.58 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.31
epoch:       96 | nupdates:        38592 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1130.12 | smp(ms): 6.94 | fwd(ms): 417.99 | crit-fwd(ms): 21.18 | bwd(ms): 650.34 | optim(ms): 57.25 | loss:   16.20026 | train-TER: 63.33 | train-WER: 79.86 | lists/dev.lst-loss:    9.79642 | lists/dev.lst-TER: 33.20 | lists/dev.lst-WER: 52.22 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 773.59
epoch:       97 | nupdates:        38994 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:32 | bch(ms): 1124.70 | smp(ms): 7.61 | fwd(ms): 418.32 | crit-fwd(ms): 21.22 | bwd(ms): 644.16 | optim(ms): 57.24 | loss:   16.09557 | train-TER: 58.97 | train-WER: 76.51 | lists/dev.lst-loss:    9.88127 | lists/dev.lst-TER: 34.17 | lists/dev.lst-WER: 52.93 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 777.32
epoch:       98 | nupdates:        39396 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:29 | bch(ms): 1118.37 | smp(ms): 4.69 | fwd(ms): 417.67 | crit-fwd(ms): 20.97 | bwd(ms): 637.75 | optim(ms): 57.24 | loss:   15.98377 | train-TER: 61.28 | train-WER: 78.19 | lists/dev.lst-loss:    9.94061 | lists/dev.lst-TER: 33.23 | lists/dev.lst-WER: 52.73 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.72
epoch:       99 | nupdates:        39798 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.48 | smp(ms): 7.05 | fwd(ms): 419.57 | crit-fwd(ms): 21.06 | bwd(ms): 640.84 | optim(ms): 57.23 | loss:   15.81249 | train-TER: 57.55 | train-WER: 74.73 | lists/dev.lst-loss:    9.96920 | lists/dev.lst-TER: 36.11 | lists/dev.lst-WER: 53.77 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 778.85
epoch:      100 | nupdates:        40200 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1123.62 | smp(ms): 7.26 | fwd(ms): 418.33 | crit-fwd(ms): 21.10 | bwd(ms): 643.28 | optim(ms): 57.22 | loss:   15.76856 | train-TER: 59.21 | train-WER: 77.85 | lists/dev.lst-loss:    9.51413 | lists/dev.lst-TER: 30.03 | lists/dev.lst-WER: 49.86 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 778.07
epoch:      101 | nupdates:        40602 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1131.74 | smp(ms): 6.39 | fwd(ms): 417.90 | crit-fwd(ms): 21.04 | bwd(ms): 651.28 | optim(ms): 57.24 | loss:   15.81209 | train-TER: 61.84 | train-WER: 79.23 | lists/dev.lst-loss:    9.53090 | lists/dev.lst-TER: 30.82 | lists/dev.lst-WER: 50.05 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 772.48
epoch:      102 | nupdates:        41004 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.38 | smp(ms): 3.82 | fwd(ms): 418.55 | crit-fwd(ms): 21.18 | bwd(ms): 641.00 | optim(ms): 57.25 | loss:   15.74271 | train-TER: 53.49 | train-WER: 72.16 | lists/dev.lst-loss:    9.50530 | lists/dev.lst-TER: 32.22 | lists/dev.lst-WER: 50.62 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 778.93
epoch:      103 | nupdates:        41406 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1123.01 | smp(ms): 8.31 | fwd(ms): 418.96 | crit-fwd(ms): 21.07 | bwd(ms): 641.75 | optim(ms): 57.25 | loss:   15.66112 | train-TER: 57.97 | train-WER: 74.97 | lists/dev.lst-loss:    9.41947 | lists/dev.lst-TER: 32.10 | lists/dev.lst-WER: 50.81 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 778.49
epoch:      104 | nupdates:        41808 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.88 | smp(ms): 7.73 | fwd(ms): 417.89 | crit-fwd(ms): 21.45 | bwd(ms): 640.54 | optim(ms): 57.23 | loss:   15.52963 | train-TER: 55.11 | train-WER: 73.25 | lists/dev.lst-loss:    9.42631 | lists/dev.lst-TER: 29.26 | lists/dev.lst-WER: 48.94 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 779.97
epoch:      105 | nupdates:        42210 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1134.11 | smp(ms): 7.14 | fwd(ms): 419.47 | crit-fwd(ms): 21.01 | bwd(ms): 652.28 | optim(ms): 57.24 | loss:   15.51499 | train-TER: 59.74 | train-WER: 77.59 | lists/dev.lst-loss:    9.35540 | lists/dev.lst-TER: 31.02 | lists/dev.lst-WER: 49.82 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 770.87
epoch:      106 | nupdates:        42612 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1124.01 | smp(ms): 7.68 | fwd(ms): 418.97 | crit-fwd(ms): 21.25 | bwd(ms): 642.72 | optim(ms): 57.25 | loss:   15.45425 | train-TER: 57.54 | train-WER: 75.21 | lists/dev.lst-loss:    9.14207 | lists/dev.lst-TER: 29.30 | lists/dev.lst-WER: 48.06 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 777.79
epoch:      107 | nupdates:        43014 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1132.45 | smp(ms): 7.03 | fwd(ms): 417.94 | crit-fwd(ms): 20.93 | bwd(ms): 652.00 | optim(ms): 57.24 | loss:   15.57122 | train-TER: 61.49 | train-WER: 77.95 | lists/dev.lst-loss:    9.31035 | lists/dev.lst-TER: 30.57 | lists/dev.lst-WER: 49.64 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 772.00
epoch:      108 | nupdates:        43416 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:28 | bch(ms): 1116.64 | smp(ms): 6.87 | fwd(ms): 418.93 | crit-fwd(ms): 21.18 | bwd(ms): 635.80 | optim(ms): 57.24 | loss:   15.27094 | train-TER: 58.17 | train-WER: 76.04 | lists/dev.lst-loss:    9.14575 | lists/dev.lst-TER: 31.28 | lists/dev.lst-WER: 49.39 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 782.92
epoch:      109 | nupdates:        43818 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.61 | smp(ms): 7.85 | fwd(ms): 417.61 | crit-fwd(ms): 21.15 | bwd(ms): 640.69 | optim(ms): 57.23 | loss:   15.31628 | train-TER: 55.99 | train-WER: 73.51 | lists/dev.lst-loss:    9.24124 | lists/dev.lst-TER: 31.79 | lists/dev.lst-WER: 50.12 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.16
epoch:      110 | nupdates:        44220 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1121.60 | smp(ms): 7.31 | fwd(ms): 417.53 | crit-fwd(ms): 21.18 | bwd(ms): 641.78 | optim(ms): 57.22 | loss:   15.14866 | train-TER: 52.46 | train-WER: 71.79 | lists/dev.lst-loss:    9.46158 | lists/dev.lst-TER: 33.22 | lists/dev.lst-WER: 51.26 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 779.47
epoch:      111 | nupdates:        44622 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.36 | smp(ms): 6.25 | fwd(ms): 417.26 | crit-fwd(ms): 21.06 | bwd(ms): 641.07 | optim(ms): 57.29 | loss:   15.13038 | train-TER: 63.11 | train-WER: 79.56 | lists/dev.lst-loss:    9.24710 | lists/dev.lst-TER: 32.18 | lists/dev.lst-WER: 50.31 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 780.33
epoch:      112 | nupdates:        45024 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.70 | smp(ms): 8.38 | fwd(ms): 418.81 | crit-fwd(ms): 21.05 | bwd(ms): 641.54 | optim(ms): 57.25 | loss:   14.79451 | train-TER: 55.67 | train-WER: 73.78 | lists/dev.lst-loss:    9.48923 | lists/dev.lst-TER: 34.71 | lists/dev.lst-WER: 51.76 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 778.70
epoch:      113 | nupdates:        45426 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1124.32 | smp(ms): 7.22 | fwd(ms): 419.14 | crit-fwd(ms): 21.21 | bwd(ms): 643.22 | optim(ms): 57.22 | loss:   15.04601 | train-TER: 57.83 | train-WER: 77.00 | lists/dev.lst-loss:    8.84531 | lists/dev.lst-TER: 28.22 | lists/dev.lst-WER: 47.08 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 118 | hrs:   97.62 | thrpt(sec/sec): 777.58
epoch:      114 | nupdates:        45828 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1132.75 | smp(ms): 6.37 | fwd(ms): 417.87 | crit-fwd(ms): 20.90 | bwd(ms): 652.50 | optim(ms): 57.22 | loss:   14.98419 | train-TER: 54.90 | train-WER: 73.11 | lists/dev.lst-loss:    8.84740 | lists/dev.lst-TER: 28.65 | lists/dev.lst-WER: 46.94 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 771.79
epoch:      115 | nupdates:        46230 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1132.20 | smp(ms): 6.90 | fwd(ms): 417.62 | crit-fwd(ms): 21.23 | bwd(ms): 652.60 | optim(ms): 57.22 | loss:   14.90790 | train-TER: 54.74 | train-WER: 72.87 | lists/dev.lst-loss:    9.17924 | lists/dev.lst-TER: 34.00 | lists/dev.lst-WER: 50.81 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 772.16
epoch:      116 | nupdates:        46632 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:28 | bch(ms): 1116.33 | smp(ms): 6.13 | fwd(ms): 417.84 | crit-fwd(ms): 21.07 | bwd(ms): 636.08 | optim(ms): 57.26 | loss:   14.75618 | train-TER: 54.01 | train-WER: 72.20 | lists/dev.lst-loss:    9.03953 | lists/dev.lst-TER: 32.32 | lists/dev.lst-WER: 49.94 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 118 | hrs:   97.62 | thrpt(sec/sec): 783.14
epoch:      117 | nupdates:        47034 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.72 | smp(ms): 7.69 | fwd(ms): 417.78 | crit-fwd(ms): 21.17 | bwd(ms): 640.88 | optim(ms): 57.22 | loss:   14.70447 | train-TER: 56.60 | train-WER: 74.05 | lists/dev.lst-loss:    8.68354 | lists/dev.lst-TER: 28.65 | lists/dev.lst-WER: 46.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.08
epoch:      118 | nupdates:        47436 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1133.00 | smp(ms): 6.40 | fwd(ms): 419.00 | crit-fwd(ms): 21.18 | bwd(ms): 651.91 | optim(ms): 57.25 | loss:   14.44669 | train-TER: 60.53 | train-WER: 77.53 | lists/dev.lst-loss:    8.61744 | lists/dev.lst-TER: 28.26 | lists/dev.lst-WER: 46.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 771.62
epoch:      119 | nupdates:        47838 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1130.27 | smp(ms): 4.22 | fwd(ms): 418.88 | crit-fwd(ms): 21.04 | bwd(ms): 648.67 | optim(ms): 57.32 | loss:   14.79736 | train-TER: 57.66 | train-WER: 74.98 | lists/dev.lst-loss:    8.73393 | lists/dev.lst-TER: 29.20 | lists/dev.lst-WER: 47.10 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 773.49
epoch:      120 | nupdates:        48240 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.77 | smp(ms): 6.86 | fwd(ms): 419.23 | crit-fwd(ms): 21.22 | bwd(ms): 639.35 | optim(ms): 57.24 | loss:   14.56824 | train-TER: 55.75 | train-WER: 73.51 | lists/dev.lst-loss:    8.78212 | lists/dev.lst-TER: 30.67 | lists/dev.lst-WER: 47.94 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 780.04
epoch:      121 | nupdates:        48642 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.75 | smp(ms): 6.83 | fwd(ms): 418.89 | crit-fwd(ms): 21.04 | bwd(ms): 639.34 | optim(ms): 57.23 | loss:   14.55233 | train-TER: 51.83 | train-WER: 70.12 | lists/dev.lst-loss:    8.54195 | lists/dev.lst-TER: 28.51 | lists/dev.lst-WER: 46.58 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.06
epoch:      122 | nupdates:        49044 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.38 | smp(ms): 6.72 | fwd(ms): 417.57 | crit-fwd(ms): 21.09 | bwd(ms): 641.02 | optim(ms): 57.22 | loss:   14.63787 | train-TER: 52.36 | train-WER: 71.13 | lists/dev.lst-loss:    8.48944 | lists/dev.lst-TER: 28.34 | lists/dev.lst-WER: 45.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.31
epoch:      123 | nupdates:        49446 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1129.46 | smp(ms): 6.02 | fwd(ms): 418.48 | crit-fwd(ms): 21.30 | bwd(ms): 648.68 | optim(ms): 57.26 | loss:   14.38288 | train-TER: 56.75 | train-WER: 74.53 | lists/dev.lst-loss:    8.54591 | lists/dev.lst-TER: 28.70 | lists/dev.lst-WER: 46.51 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 774.04
epoch:      124 | nupdates:        49848 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1123.11 | smp(ms): 7.97 | fwd(ms): 418.06 | crit-fwd(ms): 21.13 | bwd(ms): 642.75 | optim(ms): 57.22 | loss:   14.52782 | train-TER: 63.02 | train-WER: 80.15 | lists/dev.lst-loss:    8.46953 | lists/dev.lst-TER: 26.28 | lists/dev.lst-WER: 44.44 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 778.41
epoch:      125 | nupdates:        50250 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1131.36 | smp(ms): 6.24 | fwd(ms): 417.97 | crit-fwd(ms): 21.13 | bwd(ms): 651.07 | optim(ms): 57.23 | loss:   14.28490 | train-TER: 55.92 | train-WER: 73.66 | lists/dev.lst-loss:    8.39460 | lists/dev.lst-TER: 26.71 | lists/dev.lst-WER: 44.47 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 772.74
epoch:      126 | nupdates:        50652 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.37 | smp(ms): 7.22 | fwd(ms): 418.08 | crit-fwd(ms): 21.16 | bwd(ms): 640.12 | optim(ms): 57.22 | loss:   14.30071 | train-TER: 51.42 | train-WER: 69.99 | lists/dev.lst-loss:    8.45202 | lists/dev.lst-TER: 28.54 | lists/dev.lst-WER: 45.85 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 780.32
epoch:      127 | nupdates:        51054 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1121.50 | smp(ms): 6.19 | fwd(ms): 418.02 | crit-fwd(ms): 21.01 | bwd(ms): 641.46 | optim(ms): 57.24 | loss:   14.16151 | train-TER: 58.02 | train-WER: 75.33 | lists/dev.lst-loss:    8.34970 | lists/dev.lst-TER: 26.30 | lists/dev.lst-WER: 44.20 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 779.53
epoch:      128 | nupdates:        51456 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1132.72 | smp(ms): 7.15 | fwd(ms): 419.47 | crit-fwd(ms): 21.15 | bwd(ms): 651.32 | optim(ms): 57.21 | loss:   14.27378 | train-TER: 54.79 | train-WER: 73.47 | lists/dev.lst-loss:    8.38338 | lists/dev.lst-TER: 26.80 | lists/dev.lst-WER: 44.70 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 771.81
epoch:      129 | nupdates:        51858 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:29 | bch(ms): 1118.82 | smp(ms): 6.32 | fwd(ms): 418.65 | crit-fwd(ms): 20.99 | bwd(ms): 638.10 | optim(ms): 57.22 | loss:   14.27120 | train-TER: 47.64 | train-WER: 67.11 | lists/dev.lst-loss:    8.61761 | lists/dev.lst-TER: 30.06 | lists/dev.lst-WER: 46.98 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 781.40
epoch:      130 | nupdates:        52260 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1119.54 | smp(ms): 6.17 | fwd(ms): 418.09 | crit-fwd(ms): 20.92 | bwd(ms): 639.05 | optim(ms): 57.25 | loss:   14.22493 | train-TER: 56.97 | train-WER: 75.34 | lists/dev.lst-loss:    8.38831 | lists/dev.lst-TER: 27.07 | lists/dev.lst-WER: 44.18 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.90
epoch:      131 | nupdates:        52662 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:36 | bch(ms): 1135.17 | smp(ms): 7.17 | fwd(ms): 419.02 | crit-fwd(ms): 21.01 | bwd(ms): 653.97 | optim(ms): 57.21 | loss:   14.15012 | train-TER: 48.26 | train-WER: 66.47 | lists/dev.lst-loss:    8.24389 | lists/dev.lst-TER: 26.25 | lists/dev.lst-WER: 43.79 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 770.15
epoch:      132 | nupdates:        53064 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1132.02 | smp(ms): 8.45 | fwd(ms): 416.94 | crit-fwd(ms): 21.20 | bwd(ms): 653.04 | optim(ms): 57.25 | loss:   14.06675 | train-TER: 49.62 | train-WER: 68.83 | lists/dev.lst-loss:    8.20475 | lists/dev.lst-TER: 25.15 | lists/dev.lst-WER: 43.01 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 772.29
epoch:      133 | nupdates:        53466 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:33 | bch(ms): 1129.34 | smp(ms): 5.51 | fwd(ms): 417.24 | crit-fwd(ms): 21.23 | bwd(ms): 650.27 | optim(ms): 57.24 | loss:   14.13045 | train-TER: 53.23 | train-WER: 70.71 | lists/dev.lst-loss:    8.45529 | lists/dev.lst-TER: 30.17 | lists/dev.lst-WER: 46.61 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 774.12
epoch:      134 | nupdates:        53868 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.69 | smp(ms): 5.10 | fwd(ms): 418.72 | crit-fwd(ms): 20.96 | bwd(ms): 640.99 | optim(ms): 57.25 | loss:   13.92196 | train-TER: 53.81 | train-WER: 73.25 | lists/dev.lst-loss:    8.14939 | lists/dev.lst-TER: 25.41 | lists/dev.lst-WER: 43.17 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 778.71
epoch:      135 | nupdates:        54270 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:32 | bch(ms): 1126.56 | smp(ms): 7.44 | fwd(ms): 418.16 | crit-fwd(ms): 21.08 | bwd(ms): 645.95 | optim(ms): 57.22 | loss:   13.85039 | train-TER: 55.79 | train-WER: 74.12 | lists/dev.lst-loss:    8.05329 | lists/dev.lst-TER: 24.56 | lists/dev.lst-WER: 42.45 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 776.03
epoch:      136 | nupdates:        54672 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:37 | bch(ms): 1137.13 | smp(ms): 6.73 | fwd(ms): 420.51 | crit-fwd(ms): 21.10 | bwd(ms): 654.46 | optim(ms): 57.23 | loss:   13.76668 | train-TER: 42.65 | train-WER: 62.36 | lists/dev.lst-loss:    8.38886 | lists/dev.lst-TER: 27.73 | lists/dev.lst-WER: 45.10 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 768.82
epoch:      137 | nupdates:        55074 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1121.51 | smp(ms): 6.49 | fwd(ms): 418.75 | crit-fwd(ms): 21.01 | bwd(ms): 640.40 | optim(ms): 57.26 | loss:   13.59661 | train-TER: 51.50 | train-WER: 69.32 | lists/dev.lst-loss:    8.15681 | lists/dev.lst-TER: 26.36 | lists/dev.lst-WER: 43.67 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 779.53
epoch:      138 | nupdates:        55476 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:29 | bch(ms): 1119.27 | smp(ms): 6.58 | fwd(ms): 418.45 | crit-fwd(ms): 20.97 | bwd(ms): 638.65 | optim(ms): 57.25 | loss:   13.81801 | train-TER: 54.59 | train-WER: 72.60 | lists/dev.lst-loss:    7.96134 | lists/dev.lst-TER: 24.83 | lists/dev.lst-WER: 42.46 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.09
epoch:      139 | nupdates:        55878 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:29 | bch(ms): 1118.52 | smp(ms): 6.20 | fwd(ms): 417.46 | crit-fwd(ms): 20.99 | bwd(ms): 638.32 | optim(ms): 57.26 | loss:   13.70655 | train-TER: 47.13 | train-WER: 66.18 | lists/dev.lst-loss:    8.01994 | lists/dev.lst-TER: 26.69 | lists/dev.lst-WER: 43.72 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.61
epoch:      140 | nupdates:        56280 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1119.82 | smp(ms): 7.56 | fwd(ms): 417.32 | crit-fwd(ms): 21.02 | bwd(ms): 640.10 | optim(ms): 57.26 | loss:   13.70011 | train-TER: 53.84 | train-WER: 72.36 | lists/dev.lst-loss:    8.19977 | lists/dev.lst-TER: 27.70 | lists/dev.lst-WER: 44.28 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.70
epoch:      141 | nupdates:        56682 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1121.92 | smp(ms): 6.89 | fwd(ms): 418.91 | crit-fwd(ms): 21.00 | bwd(ms): 640.59 | optim(ms): 57.24 | loss:   13.63012 | train-TER: 48.99 | train-WER: 68.01 | lists/dev.lst-loss:    7.94642 | lists/dev.lst-TER: 24.27 | lists/dev.lst-WER: 41.87 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 779.25
epoch:      142 | nupdates:        57084 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1130.39 | smp(ms): 6.96 | fwd(ms): 418.33 | crit-fwd(ms): 21.33 | bwd(ms): 650.13 | optim(ms): 57.26 | loss:   13.45313 | train-TER: 58.71 | train-WER: 75.33 | lists/dev.lst-loss:    8.08680 | lists/dev.lst-TER: 26.78 | lists/dev.lst-WER: 43.58 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 773.41
epoch:      143 | nupdates:        57486 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.77 | smp(ms): 5.94 | fwd(ms): 419.40 | crit-fwd(ms): 21.08 | bwd(ms): 639.17 | optim(ms): 57.23 | loss:   13.41076 | train-TER: 52.01 | train-WER: 70.68 | lists/dev.lst-loss:    7.79057 | lists/dev.lst-TER: 24.24 | lists/dev.lst-WER: 41.24 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.04
epoch:      144 | nupdates:        57888 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:36 | bch(ms): 1134.61 | smp(ms): 7.52 | fwd(ms): 417.67 | crit-fwd(ms): 21.29 | bwd(ms): 654.73 | optim(ms): 57.23 | loss:   13.50784 | train-TER: 49.80 | train-WER: 67.70 | lists/dev.lst-loss:    7.82797 | lists/dev.lst-TER: 24.47 | lists/dev.lst-WER: 41.63 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 770.53
epoch:      145 | nupdates:        58290 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.62 | smp(ms): 8.08 | fwd(ms): 418.27 | crit-fwd(ms): 21.01 | bwd(ms): 642.08 | optim(ms): 57.22 | loss:   13.60574 | train-TER: 53.65 | train-WER: 71.02 | lists/dev.lst-loss:    7.89450 | lists/dev.lst-TER: 24.69 | lists/dev.lst-WER: 41.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 778.76
epoch:      146 | nupdates:        58692 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1119.67 | smp(ms): 4.76 | fwd(ms): 418.44 | crit-fwd(ms): 21.08 | bwd(ms): 639.10 | optim(ms): 57.25 | loss:   13.35476 | train-TER: 43.18 | train-WER: 63.36 | lists/dev.lst-loss:    8.20162 | lists/dev.lst-TER: 28.46 | lists/dev.lst-WER: 44.73 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.81
epoch:      147 | nupdates:        59094 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1119.45 | smp(ms): 7.45 | fwd(ms): 417.46 | crit-fwd(ms): 21.00 | bwd(ms): 639.82 | optim(ms): 57.23 | loss:   13.47927 | train-TER: 52.87 | train-WER: 72.35 | lists/dev.lst-loss:    7.85984 | lists/dev.lst-TER: 25.10 | lists/dev.lst-WER: 41.75 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 780.96
epoch:      148 | nupdates:        59496 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.02 | smp(ms): 6.66 | fwd(ms): 416.54 | crit-fwd(ms): 21.18 | bwd(ms): 641.34 | optim(ms): 57.22 | loss:   13.18582 | train-TER: 46.08 | train-WER: 65.95 | lists/dev.lst-loss:    7.93400 | lists/dev.lst-TER: 25.89 | lists/dev.lst-WER: 42.28 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.56
epoch:      149 | nupdates:        59898 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1119.89 | smp(ms): 4.96 | fwd(ms): 418.69 | crit-fwd(ms): 21.08 | bwd(ms): 639.19 | optim(ms): 57.24 | loss:   13.08399 | train-TER: 49.58 | train-WER: 68.11 | lists/dev.lst-loss:    7.71010 | lists/dev.lst-TER: 24.09 | lists/dev.lst-WER: 41.10 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.66
epoch:      150 | nupdates:        60300 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:36 | bch(ms): 1134.66 | smp(ms): 6.52 | fwd(ms): 418.09 | crit-fwd(ms): 21.12 | bwd(ms): 654.55 | optim(ms): 57.20 | loss:   13.22116 | train-TER: 52.56 | train-WER: 69.53 | lists/dev.lst-loss:    7.74704 | lists/dev.lst-TER: 25.23 | lists/dev.lst-WER: 41.60 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 770.49
epoch:      151 | nupdates:        60702 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1124.24 | smp(ms): 6.89 | fwd(ms): 417.76 | crit-fwd(ms): 20.98 | bwd(ms): 644.57 | optim(ms): 57.21 | loss:   13.38768 | train-TER: 53.51 | train-WER: 71.08 | lists/dev.lst-loss:    7.78949 | lists/dev.lst-TER: 25.18 | lists/dev.lst-WER: 41.53 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 777.64
epoch:      152 | nupdates:        61104 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1121.62 | smp(ms): 8.88 | fwd(ms): 417.45 | crit-fwd(ms): 21.04 | bwd(ms): 642.11 | optim(ms): 57.19 | loss:   13.26836 | train-TER: 44.32 | train-WER: 63.81 | lists/dev.lst-loss:    7.86794 | lists/dev.lst-TER: 25.89 | lists/dev.lst-WER: 42.13 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 779.45
epoch:      153 | nupdates:        61506 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.38 | smp(ms): 7.34 | fwd(ms): 419.23 | crit-fwd(ms): 21.01 | bwd(ms): 640.85 | optim(ms): 57.23 | loss:   13.18466 | train-TER: 47.50 | train-WER: 65.92 | lists/dev.lst-loss:    7.70928 | lists/dev.lst-TER: 24.17 | lists/dev.lst-WER: 41.06 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 778.93
epoch:      154 | nupdates:        61908 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1131.31 | smp(ms): 6.48 | fwd(ms): 418.28 | crit-fwd(ms): 21.08 | bwd(ms): 650.27 | optim(ms): 57.23 | loss:   13.10210 | train-TER: 45.53 | train-WER: 65.00 | lists/dev.lst-loss:    7.77708 | lists/dev.lst-TER: 24.79 | lists/dev.lst-WER: 41.15 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 772.77
epoch:      155 | nupdates:        62310 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.83 | smp(ms): 6.22 | fwd(ms): 418.51 | crit-fwd(ms): 20.98 | bwd(ms): 640.07 | optim(ms): 57.22 | loss:   13.12608 | train-TER: 44.62 | train-WER: 63.28 | lists/dev.lst-loss:    7.59663 | lists/dev.lst-TER: 22.21 | lists/dev.lst-WER: 39.60 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.00
epoch:      156 | nupdates:        62712 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1130.43 | smp(ms): 6.76 | fwd(ms): 418.89 | crit-fwd(ms): 21.03 | bwd(ms): 649.43 | optim(ms): 57.24 | loss:   13.05531 | train-TER: 45.62 | train-WER: 63.95 | lists/dev.lst-loss:    7.70725 | lists/dev.lst-TER: 24.76 | lists/dev.lst-WER: 41.06 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 773.38
epoch:      157 | nupdates:        63114 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1123.45 | smp(ms): 6.78 | fwd(ms): 419.30 | crit-fwd(ms): 21.02 | bwd(ms): 642.16 | optim(ms): 57.21 | loss:   12.89740 | train-TER: 46.18 | train-WER: 64.81 | lists/dev.lst-loss:    7.59010 | lists/dev.lst-TER: 22.50 | lists/dev.lst-WER: 39.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 778.18
epoch:      158 | nupdates:        63516 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1121.07 | smp(ms): 7.00 | fwd(ms): 418.13 | crit-fwd(ms): 21.22 | bwd(ms): 640.84 | optim(ms): 57.22 | loss:   12.96884 | train-TER: 52.76 | train-WER: 71.60 | lists/dev.lst-loss:    7.63837 | lists/dev.lst-TER: 24.35 | lists/dev.lst-WER: 40.40 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 779.83
epoch:      159 | nupdates:        63918 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1121.10 | smp(ms): 7.45 | fwd(ms): 417.91 | crit-fwd(ms): 21.14 | bwd(ms): 641.20 | optim(ms): 57.22 | loss:   12.94717 | train-TER: 50.14 | train-WER: 69.38 | lists/dev.lst-loss:    7.63473 | lists/dev.lst-TER: 23.67 | lists/dev.lst-WER: 40.25 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 118 | hrs:   97.62 | thrpt(sec/sec): 779.81
epoch:      160 | nupdates:        64320 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1123.46 | smp(ms): 8.16 | fwd(ms): 419.25 | crit-fwd(ms): 21.10 | bwd(ms): 641.92 | optim(ms): 57.23 | loss:   13.01450 | train-TER: 51.79 | train-WER: 70.33 | lists/dev.lst-loss:    7.53934 | lists/dev.lst-TER: 24.36 | lists/dev.lst-WER: 40.37 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 778.17
epoch:      161 | nupdates:        64722 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:32 | bch(ms): 1125.51 | smp(ms): 6.54 | fwd(ms): 420.62 | crit-fwd(ms): 21.13 | bwd(ms): 642.59 | optim(ms): 57.21 | loss:   12.94276 | train-TER: 52.15 | train-WER: 70.01 | lists/dev.lst-loss:    7.44481 | lists/dev.lst-TER: 23.17 | lists/dev.lst-WER: 39.60 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 776.76
epoch:      162 | nupdates:        65124 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:29 | bch(ms): 1119.15 | smp(ms): 6.49 | fwd(ms): 419.42 | crit-fwd(ms): 21.15 | bwd(ms): 637.86 | optim(ms): 57.25 | loss:   12.85309 | train-TER: 48.45 | train-WER: 66.35 | lists/dev.lst-loss:    7.52816 | lists/dev.lst-TER: 22.57 | lists/dev.lst-WER: 39.24 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 781.17
epoch:      163 | nupdates:        65526 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1132.16 | smp(ms): 7.12 | fwd(ms): 418.06 | crit-fwd(ms): 21.06 | bwd(ms): 651.79 | optim(ms): 57.23 | loss:   12.88853 | train-TER: 46.10 | train-WER: 64.72 | lists/dev.lst-loss:    7.46618 | lists/dev.lst-TER: 22.31 | lists/dev.lst-WER: 39.04 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 772.20
epoch:      164 | nupdates:        65928 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1130.98 | smp(ms): 7.31 | fwd(ms): 417.12 | crit-fwd(ms): 21.17 | bwd(ms): 651.93 | optim(ms): 57.21 | loss:   12.89770 | train-TER: 49.42 | train-WER: 66.45 | lists/dev.lst-loss:    7.44288 | lists/dev.lst-TER: 23.12 | lists/dev.lst-WER: 39.54 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 773.00
epoch:      165 | nupdates:        66330 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1121.13 | smp(ms): 6.31 | fwd(ms): 418.44 | crit-fwd(ms): 21.02 | bwd(ms): 640.59 | optim(ms): 57.21 | loss:   12.82855 | train-TER: 44.71 | train-WER: 62.38 | lists/dev.lst-loss:    7.53362 | lists/dev.lst-TER: 23.73 | lists/dev.lst-WER: 39.77 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 779.79
epoch:      166 | nupdates:        66732 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1123.58 | smp(ms): 7.46 | fwd(ms): 419.10 | crit-fwd(ms): 21.07 | bwd(ms): 642.36 | optim(ms): 57.21 | loss:   12.69368 | train-TER: 50.51 | train-WER: 67.88 | lists/dev.lst-loss:    7.61495 | lists/dev.lst-TER: 24.11 | lists/dev.lst-WER: 40.03 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 778.09
epoch:      167 | nupdates:        67134 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:29 | bch(ms): 1118.02 | smp(ms): 6.36 | fwd(ms): 418.00 | crit-fwd(ms): 21.08 | bwd(ms): 638.25 | optim(ms): 57.24 | loss:   12.65514 | train-TER: 45.95 | train-WER: 63.24 | lists/dev.lst-loss:    7.33882 | lists/dev.lst-TER: 21.88 | lists/dev.lst-WER: 38.47 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.96
epoch:      168 | nupdates:        67536 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:33 | bch(ms): 1127.67 | smp(ms): 6.83 | fwd(ms): 418.23 | crit-fwd(ms): 21.08 | bwd(ms): 647.42 | optim(ms): 57.25 | loss:   12.83542 | train-TER: 44.58 | train-WER: 63.24 | lists/dev.lst-loss:    7.41125 | lists/dev.lst-TER: 22.21 | lists/dev.lst-WER: 38.56 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 775.27
epoch:      169 | nupdates:        67938 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.20 | smp(ms): 7.57 | fwd(ms): 418.63 | crit-fwd(ms): 20.93 | bwd(ms): 641.24 | optim(ms): 57.21 | loss:   12.70959 | train-TER: 47.70 | train-WER: 66.45 | lists/dev.lst-loss:    7.30663 | lists/dev.lst-TER: 21.59 | lists/dev.lst-WER: 38.34 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 779.05
epoch:      170 | nupdates:        68340 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1133.94 | smp(ms): 6.95 | fwd(ms): 419.36 | crit-fwd(ms): 21.02 | bwd(ms): 652.48 | optim(ms): 57.21 | loss:   12.56968 | train-TER: 48.72 | train-WER: 67.40 | lists/dev.lst-loss:    7.30601 | lists/dev.lst-TER: 21.41 | lists/dev.lst-WER: 38.10 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 770.99
epoch:      171 | nupdates:        68742 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1129.99 | smp(ms): 5.98 | fwd(ms): 418.80 | crit-fwd(ms): 21.00 | bwd(ms): 648.57 | optim(ms): 57.26 | loss:   12.83445 | train-TER: 47.83 | train-WER: 66.34 | lists/dev.lst-loss:    7.29749 | lists/dev.lst-TER: 21.47 | lists/dev.lst-WER: 38.04 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 773.68
epoch:      172 | nupdates:        69144 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1129.70 | smp(ms): 6.54 | fwd(ms): 417.44 | crit-fwd(ms): 20.99 | bwd(ms): 650.20 | optim(ms): 57.21 | loss:   12.52775 | train-TER: 43.22 | train-WER: 62.62 | lists/dev.lst-loss:    7.33210 | lists/dev.lst-TER: 22.74 | lists/dev.lst-WER: 38.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 773.88
epoch:      173 | nupdates:        69546 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:29 | bch(ms): 1117.31 | smp(ms): 6.84 | fwd(ms): 418.11 | crit-fwd(ms): 21.06 | bwd(ms): 637.34 | optim(ms): 57.22 | loss:   12.65324 | train-TER: 45.97 | train-WER: 63.40 | lists/dev.lst-loss:    7.28360 | lists/dev.lst-TER: 21.46 | lists/dev.lst-WER: 37.85 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 782.46
epoch:      174 | nupdates:        69948 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1133.42 | smp(ms): 7.87 | fwd(ms): 419.40 | crit-fwd(ms): 21.11 | bwd(ms): 651.48 | optim(ms): 57.23 | loss:   12.54826 | train-TER: 47.45 | train-WER: 65.42 | lists/dev.lst-loss:    7.56915 | lists/dev.lst-TER: 24.63 | lists/dev.lst-WER: 40.47 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 771.33
epoch:      175 | nupdates:        70350 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.94 | smp(ms): 6.74 | fwd(ms): 419.25 | crit-fwd(ms): 21.28 | bwd(ms): 641.94 | optim(ms): 57.24 | loss:   12.55889 | train-TER: 51.52 | train-WER: 69.10 | lists/dev.lst-loss:    7.35429 | lists/dev.lst-TER: 22.77 | lists/dev.lst-WER: 38.64 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 778.54
epoch:      176 | nupdates:        70752 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:29 | bch(ms): 1118.57 | smp(ms): 6.11 | fwd(ms): 419.06 | crit-fwd(ms): 21.06 | bwd(ms): 636.95 | optim(ms): 57.25 | loss:   12.51755 | train-TER: 48.08 | train-WER: 65.64 | lists/dev.lst-loss:    7.58862 | lists/dev.lst-TER: 25.15 | lists/dev.lst-WER: 40.62 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.58
epoch:      177 | nupdates:        71154 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.85 | smp(ms): 7.96 | fwd(ms): 418.59 | crit-fwd(ms): 21.19 | bwd(ms): 640.02 | optim(ms): 57.23 | loss:   12.38473 | train-TER: 46.26 | train-WER: 64.17 | lists/dev.lst-loss:    7.27269 | lists/dev.lst-TER: 22.15 | lists/dev.lst-WER: 38.23 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 779.98
epoch:      178 | nupdates:        71556 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1119.99 | smp(ms): 6.47 | fwd(ms): 418.52 | crit-fwd(ms): 21.04 | bwd(ms): 639.09 | optim(ms): 57.22 | loss:   12.35725 | train-TER: 47.20 | train-WER: 65.81 | lists/dev.lst-loss:    7.11603 | lists/dev.lst-TER: 20.92 | lists/dev.lst-WER: 37.28 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.59
epoch:      179 | nupdates:        71958 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1129.61 | smp(ms): 6.48 | fwd(ms): 417.94 | crit-fwd(ms): 21.08 | bwd(ms): 649.59 | optim(ms): 57.25 | loss:   12.20913 | train-TER: 50.72 | train-WER: 68.27 | lists/dev.lst-loss:    7.19737 | lists/dev.lst-TER: 21.30 | lists/dev.lst-WER: 37.40 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 773.94
epoch:      180 | nupdates:        72360 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:31 | bch(ms): 1122.28 | smp(ms): 7.30 | fwd(ms): 418.29 | crit-fwd(ms): 21.39 | bwd(ms): 641.99 | optim(ms): 57.21 | loss:   12.12032 | train-TER: 51.38 | train-WER: 68.51 | lists/dev.lst-loss:    7.21357 | lists/dev.lst-TER: 22.31 | lists/dev.lst-WER: 37.91 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 779.00
epoch:      181 | nupdates:        72762 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:30 | bch(ms): 1119.96 | smp(ms): 8.03 | fwd(ms): 418.35 | crit-fwd(ms): 21.09 | bwd(ms): 639.64 | optim(ms): 57.22 | loss:   12.24439 | train-TER: 54.08 | train-WER: 72.33 | lists/dev.lst-loss:    7.33857 | lists/dev.lst-TER: 22.95 | lists/dev.lst-WER: 38.40 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.61
epoch:      182 | nupdates:        73164 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1118.16 | smp(ms): 6.62 | fwd(ms): 417.44 | crit-fwd(ms): 21.18 | bwd(ms): 638.53 | optim(ms): 57.23 | loss:   12.00566 | train-TER: 42.76 | train-WER: 60.91 | lists/dev.lst-loss:    7.16530 | lists/dev.lst-TER: 22.56 | lists/dev.lst-WER: 38.09 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.86
epoch:      183 | nupdates:        73566 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1117.27 | smp(ms): 5.40 | fwd(ms): 418.21 | crit-fwd(ms): 20.97 | bwd(ms): 637.05 | optim(ms): 57.24 | loss:   12.17233 | train-TER: 47.49 | train-WER: 66.26 | lists/dev.lst-loss:    7.11299 | lists/dev.lst-TER: 21.56 | lists/dev.lst-WER: 37.37 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 782.49
epoch:      184 | nupdates:        73968 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1118.39 | smp(ms): 5.92 | fwd(ms): 419.01 | crit-fwd(ms): 21.00 | bwd(ms): 637.66 | optim(ms): 57.25 | loss:   12.02063 | train-TER: 46.95 | train-WER: 64.83 | lists/dev.lst-loss:    7.14865 | lists/dev.lst-TER: 21.92 | lists/dev.lst-WER: 37.46 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.70
epoch:      185 | nupdates:        74370 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1119.38 | smp(ms): 7.09 | fwd(ms): 418.20 | crit-fwd(ms): 21.00 | bwd(ms): 639.12 | optim(ms): 57.22 | loss:   12.04784 | train-TER: 46.15 | train-WER: 64.90 | lists/dev.lst-loss:    7.18734 | lists/dev.lst-TER: 22.26 | lists/dev.lst-WER: 37.73 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 781.01
epoch:      186 | nupdates:        74772 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1118.32 | smp(ms): 5.64 | fwd(ms): 418.47 | crit-fwd(ms): 21.13 | bwd(ms): 637.26 | optim(ms): 57.24 | loss:   11.96989 | train-TER: 48.49 | train-WER: 66.87 | lists/dev.lst-loss:    7.15873 | lists/dev.lst-TER: 21.69 | lists/dev.lst-WER: 37.14 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.75
epoch:      187 | nupdates:        75174 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:33 | bch(ms): 1127.48 | smp(ms): 4.51 | fwd(ms): 417.08 | crit-fwd(ms): 21.02 | bwd(ms): 648.04 | optim(ms): 57.28 | loss:   11.85950 | train-TER: 47.92 | train-WER: 66.06 | lists/dev.lst-loss:    7.07227 | lists/dev.lst-TER: 21.04 | lists/dev.lst-WER: 36.61 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 775.40
epoch:      188 | nupdates:        75576 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:34 | bch(ms): 1131.71 | smp(ms): 6.96 | fwd(ms): 419.13 | crit-fwd(ms): 21.10 | bwd(ms): 650.50 | optim(ms): 57.22 | loss:   12.02631 | train-TER: 44.41 | train-WER: 63.74 | lists/dev.lst-loss:    7.10498 | lists/dev.lst-TER: 21.35 | lists/dev.lst-WER: 36.84 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 772.50
epoch:      189 | nupdates:        75978 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1119.01 | smp(ms): 5.98 | fwd(ms): 418.85 | crit-fwd(ms): 21.10 | bwd(ms): 638.06 | optim(ms): 57.22 | loss:   11.90251 | train-TER: 46.85 | train-WER: 64.79 | lists/dev.lst-loss:    7.07784 | lists/dev.lst-TER: 21.86 | lists/dev.lst-WER: 37.31 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.27
epoch:      190 | nupdates:        76380 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1117.69 | smp(ms): 7.24 | fwd(ms): 417.62 | crit-fwd(ms): 21.07 | bwd(ms): 637.58 | optim(ms): 57.23 | loss:   11.90915 | train-TER: 45.61 | train-WER: 64.17 | lists/dev.lst-loss:    7.03675 | lists/dev.lst-TER: 21.47 | lists/dev.lst-WER: 36.84 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 782.19
epoch:      191 | nupdates:        76782 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1119.02 | smp(ms): 6.63 | fwd(ms): 419.15 | crit-fwd(ms): 21.14 | bwd(ms): 637.88 | optim(ms): 57.21 | loss:   11.79472 | train-TER: 46.92 | train-WER: 64.50 | lists/dev.lst-loss:    7.10484 | lists/dev.lst-TER: 21.51 | lists/dev.lst-WER: 36.88 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 118 | hrs:   97.62 | thrpt(sec/sec): 781.26
epoch:      192 | nupdates:        77184 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:30 | bch(ms): 1120.31 | smp(ms): 8.42 | fwd(ms): 417.18 | crit-fwd(ms): 21.21 | bwd(ms): 641.02 | optim(ms): 57.22 | loss:   11.80307 | train-TER: 46.62 | train-WER: 65.40 | lists/dev.lst-loss:    7.07330 | lists/dev.lst-TER: 21.57 | lists/dev.lst-WER: 37.02 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.36
epoch:      193 | nupdates:        77586 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:30 | bch(ms): 1121.22 | smp(ms): 6.69 | fwd(ms): 418.93 | crit-fwd(ms): 21.21 | bwd(ms): 640.22 | optim(ms): 57.23 | loss:   12.06413 | train-TER: 48.57 | train-WER: 66.70 | lists/dev.lst-loss:    7.03203 | lists/dev.lst-TER: 21.37 | lists/dev.lst-WER: 36.73 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 779.73
epoch:      194 | nupdates:        77988 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:30 | bch(ms): 1119.58 | smp(ms): 5.37 | fwd(ms): 418.36 | crit-fwd(ms): 21.02 | bwd(ms): 639.06 | optim(ms): 57.27 | loss:   11.67942 | train-TER: 46.09 | train-WER: 64.49 | lists/dev.lst-loss:    7.03581 | lists/dev.lst-TER: 20.56 | lists/dev.lst-WER: 36.11 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 780.87
epoch:      195 | nupdates:        78390 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:35 | bch(ms): 1132.91 | smp(ms): 6.36 | fwd(ms): 420.04 | crit-fwd(ms): 20.94 | bwd(ms): 650.78 | optim(ms): 57.24 | loss:   11.70607 | train-TER: 44.72 | train-WER: 62.43 | lists/dev.lst-loss:    7.00646 | lists/dev.lst-TER: 21.22 | lists/dev.lst-WER: 36.67 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 771.69
epoch:      196 | nupdates:        78792 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:32 | bch(ms): 1125.15 | smp(ms): 5.98 | fwd(ms): 420.07 | crit-fwd(ms): 21.16 | bwd(ms): 643.05 | optim(ms): 57.21 | loss:   11.80809 | train-TER: 46.86 | train-WER: 64.91 | lists/dev.lst-loss:    7.12295 | lists/dev.lst-TER: 21.52 | lists/dev.lst-WER: 36.71 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 777.01
epoch:      197 | nupdates:        79194 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:30 | bch(ms): 1119.63 | smp(ms): 6.19 | fwd(ms): 417.83 | crit-fwd(ms): 20.97 | bwd(ms): 639.53 | optim(ms): 57.21 | loss:   11.69644 | train-TER: 43.32 | train-WER: 61.62 | lists/dev.lst-loss:    6.96446 | lists/dev.lst-TER: 20.75 | lists/dev.lst-WER: 36.15 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.83
epoch:      198 | nupdates:        79596 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1119.16 | smp(ms): 6.39 | fwd(ms): 418.16 | crit-fwd(ms): 21.00 | bwd(ms): 638.59 | optim(ms): 57.22 | loss:   11.79784 | train-TER: 38.89 | train-WER: 56.61 | lists/dev.lst-loss:    6.97371 | lists/dev.lst-TER: 20.12 | lists/dev.lst-WER: 35.78 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 118 | hrs:   97.62 | thrpt(sec/sec): 781.16
epoch:      199 | nupdates:        79998 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:34 | bch(ms): 1131.15 | smp(ms): 4.49 | fwd(ms): 419.28 | crit-fwd(ms): 21.14 | bwd(ms): 650.09 | optim(ms): 57.24 | loss:   11.79763 | train-TER: 48.71 | train-WER: 66.80 | lists/dev.lst-loss:    6.99532 | lists/dev.lst-TER: 20.75 | lists/dev.lst-WER: 36.05 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 772.88
epoch:      200 | nupdates:        80400 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:31 | bch(ms): 1123.05 | smp(ms): 7.03 | fwd(ms): 419.44 | crit-fwd(ms): 21.00 | bwd(ms): 641.49 | optim(ms): 57.23 | loss:   11.90821 | train-TER: 37.77 | train-WER: 55.31 | lists/dev.lst-loss:    7.09134 | lists/dev.lst-TER: 21.99 | lists/dev.lst-WER: 36.92 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 778.46
epoch:      201 | nupdates:        80802 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:31 | bch(ms): 1122.10 | smp(ms): 8.10 | fwd(ms): 416.96 | crit-fwd(ms): 20.99 | bwd(ms): 643.15 | optim(ms): 57.21 | loss:   11.59235 | train-TER: 44.88 | train-WER: 62.62 | lists/dev.lst-loss:    6.95186 | lists/dev.lst-TER: 20.59 | lists/dev.lst-WER: 36.05 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 779.12
epoch:      202 | nupdates:        81204 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:28 | bch(ms): 1116.54 | smp(ms): 6.82 | fwd(ms): 417.27 | crit-fwd(ms): 21.03 | bwd(ms): 637.02 | optim(ms): 57.29 | loss:   11.71110 | train-TER: 48.04 | train-WER: 66.29 | lists/dev.lst-loss:    7.03448 | lists/dev.lst-TER: 20.88 | lists/dev.lst-WER: 36.18 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 783.00
epoch:      203 | nupdates:        81606 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1117.32 | smp(ms): 6.36 | fwd(ms): 417.40 | crit-fwd(ms): 21.09 | bwd(ms): 637.67 | optim(ms): 57.27 | loss:   11.54316 | train-TER: 41.60 | train-WER: 59.75 | lists/dev.lst-loss:    7.01641 | lists/dev.lst-TER: 20.97 | lists/dev.lst-WER: 36.23 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 782.45
epoch:      204 | nupdates:        82008 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1118.91 | smp(ms): 3.54 | fwd(ms): 418.10 | crit-fwd(ms): 20.96 | bwd(ms): 637.51 | optim(ms): 57.24 | loss:   11.44882 | train-TER: 42.26 | train-WER: 60.62 | lists/dev.lst-loss:    7.09944 | lists/dev.lst-TER: 22.50 | lists/dev.lst-WER: 37.40 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.34
epoch:      205 | nupdates:        82410 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:28 | bch(ms): 1116.35 | smp(ms): 4.79 | fwd(ms): 416.43 | crit-fwd(ms): 20.94 | bwd(ms): 637.69 | optim(ms): 57.26 | loss:   11.52040 | train-TER: 38.64 | train-WER: 58.98 | lists/dev.lst-loss:    6.98894 | lists/dev.lst-TER: 21.54 | lists/dev.lst-WER: 36.68 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 783.13
epoch:      206 | nupdates:        82812 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:30 | bch(ms): 1121.36 | smp(ms): 7.46 | fwd(ms): 419.81 | crit-fwd(ms): 21.13 | bwd(ms): 639.34 | optim(ms): 57.24 | loss:   11.45530 | train-TER: 43.13 | train-WER: 60.77 | lists/dev.lst-loss:    7.04795 | lists/dev.lst-TER: 21.64 | lists/dev.lst-WER: 36.82 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 122 | hrs:   97.62 | thrpt(sec/sec): 779.63
epoch:      207 | nupdates:        83214 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:31 | bch(ms): 1122.08 | smp(ms): 6.95 | fwd(ms): 419.82 | crit-fwd(ms): 21.27 | bwd(ms): 640.21 | optim(ms): 57.23 | loss:   11.75678 | train-TER: 47.76 | train-WER: 64.76 | lists/dev.lst-loss:    6.97346 | lists/dev.lst-TER: 20.85 | lists/dev.lst-WER: 35.99 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 779.13
epoch:      208 | nupdates:        83616 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1118.89 | smp(ms): 8.04 | fwd(ms): 417.32 | crit-fwd(ms): 21.20 | bwd(ms): 637.75 | optim(ms): 57.27 | loss:   11.60338 | train-TER: 43.14 | train-WER: 61.07 | lists/dev.lst-loss:    6.88011 | lists/dev.lst-TER: 20.62 | lists/dev.lst-WER: 35.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 781.36
epoch:      209 | nupdates:        84018 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:31 | bch(ms): 1124.03 | smp(ms): 5.33 | fwd(ms): 418.75 | crit-fwd(ms): 21.10 | bwd(ms): 642.51 | optim(ms): 57.25 | loss:   11.48685 | train-TER: 47.57 | train-WER: 65.82 | lists/dev.lst-loss:    7.02744 | lists/dev.lst-TER: 21.79 | lists/dev.lst-WER: 36.71 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 777.78
epoch:      210 | nupdates:        84420 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:30 | bch(ms): 1121.57 | smp(ms): 7.56 | fwd(ms): 418.89 | crit-fwd(ms): 21.34 | bwd(ms): 640.49 | optim(ms): 57.22 | loss:   11.59111 | train-TER: 49.94 | train-WER: 67.48 | lists/dev.lst-loss:    6.92240 | lists/dev.lst-TER: 20.96 | lists/dev.lst-WER: 35.99 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 779.48
epoch:      211 | nupdates:        84822 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1118.97 | smp(ms): 6.16 | fwd(ms): 418.66 | crit-fwd(ms): 20.97 | bwd(ms): 638.47 | optim(ms): 57.24 | loss:   11.45393 | train-TER: 40.08 | train-WER: 57.28 | lists/dev.lst-loss:    6.85382 | lists/dev.lst-TER: 21.27 | lists/dev.lst-WER: 36.16 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 781.30
epoch:      212 | nupdates:        85224 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:31 | bch(ms): 1123.87 | smp(ms): 7.47 | fwd(ms): 418.89 | crit-fwd(ms): 21.27 | bwd(ms): 642.56 | optim(ms): 57.23 | loss:   11.52129 | train-TER: 48.04 | train-WER: 64.44 | lists/dev.lst-loss:    6.85867 | lists/dev.lst-TER: 20.19 | lists/dev.lst-WER: 35.43 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 777.89
epoch:      213 | nupdates:        85626 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:35 | bch(ms): 1132.40 | smp(ms): 6.40 | fwd(ms): 419.14 | crit-fwd(ms): 21.13 | bwd(ms): 651.43 | optim(ms): 57.23 | loss:   11.37089 | train-TER: 46.13 | train-WER: 64.66 | lists/dev.lst-loss:    6.84399 | lists/dev.lst-TER: 20.05 | lists/dev.lst-WER: 35.31 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 772.03
epoch:      214 | nupdates:        86028 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:37 | bch(ms): 1138.37 | smp(ms): 8.17 | fwd(ms): 419.76 | crit-fwd(ms): 21.15 | bwd(ms): 656.30 | optim(ms): 57.22 | loss:   11.55306 | train-TER: 48.10 | train-WER: 66.27 | lists/dev.lst-loss:    6.91602 | lists/dev.lst-TER: 19.99 | lists/dev.lst-WER: 35.41 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 767.98
epoch:      215 | nupdates:        86430 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:30 | bch(ms): 1120.38 | smp(ms): 6.77 | fwd(ms): 417.81 | crit-fwd(ms): 21.21 | bwd(ms): 640.56 | optim(ms): 57.22 | loss:   11.43209 | train-TER: 48.28 | train-WER: 64.79 | lists/dev.lst-loss:    6.98994 | lists/dev.lst-TER: 21.60 | lists/dev.lst-WER: 36.50 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.31
epoch:      216 | nupdates:        86832 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:30 | bch(ms): 1120.26 | smp(ms): 7.02 | fwd(ms): 418.27 | crit-fwd(ms): 20.95 | bwd(ms): 639.75 | optim(ms): 57.24 | loss:   11.50092 | train-TER: 40.00 | train-WER: 56.62 | lists/dev.lst-loss:    7.02892 | lists/dev.lst-TER: 21.76 | lists/dev.lst-WER: 36.52 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.40
epoch:      217 | nupdates:        87234 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:28 | bch(ms): 1115.78 | smp(ms): 7.42 | fwd(ms): 417.25 | crit-fwd(ms): 21.05 | bwd(ms): 636.36 | optim(ms): 57.26 | loss:   11.42197 | train-TER: 50.97 | train-WER: 68.04 | lists/dev.lst-loss:    7.06908 | lists/dev.lst-TER: 22.15 | lists/dev.lst-WER: 36.61 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 783.53
epoch:      218 | nupdates:        87636 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:30 | bch(ms): 1120.70 | smp(ms): 7.17 | fwd(ms): 418.37 | crit-fwd(ms): 21.04 | bwd(ms): 639.85 | optim(ms): 57.25 | loss:   11.40922 | train-TER: 47.70 | train-WER: 65.62 | lists/dev.lst-loss:    6.86247 | lists/dev.lst-TER: 20.82 | lists/dev.lst-WER: 35.83 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.09
epoch:      219 | nupdates:        88038 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:31 | bch(ms): 1124.29 | smp(ms): 8.33 | fwd(ms): 417.72 | crit-fwd(ms): 21.17 | bwd(ms): 644.72 | optim(ms): 57.21 | loss:   11.31004 | train-TER: 37.47 | train-WER: 56.57 | lists/dev.lst-loss:    6.88911 | lists/dev.lst-TER: 20.36 | lists/dev.lst-WER: 35.38 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 777.60
epoch:      220 | nupdates:        88440 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:31 | bch(ms): 1121.99 | smp(ms): 6.85 | fwd(ms): 418.45 | crit-fwd(ms): 21.01 | bwd(ms): 641.33 | optim(ms): 57.24 | loss:   11.33801 | train-TER: 41.46 | train-WER: 59.99 | lists/dev.lst-loss:    6.75162 | lists/dev.lst-TER: 19.94 | lists/dev.lst-WER: 35.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 779.20
epoch:      221 | nupdates:        88842 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:35 | bch(ms): 1134.03 | smp(ms): 6.71 | fwd(ms): 419.69 | crit-fwd(ms): 20.99 | bwd(ms): 652.11 | optim(ms): 57.23 | loss:   11.38815 | train-TER: 42.83 | train-WER: 60.08 | lists/dev.lst-loss:    6.81624 | lists/dev.lst-TER: 20.55 | lists/dev.lst-WER: 35.37 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 770.92
epoch:      222 | nupdates:        89244 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:31 | bch(ms): 1123.90 | smp(ms): 7.13 | fwd(ms): 418.55 | crit-fwd(ms): 21.05 | bwd(ms): 643.21 | optim(ms): 57.24 | loss:   11.41717 | train-TER: 43.01 | train-WER: 61.60 | lists/dev.lst-loss:    6.86301 | lists/dev.lst-TER: 21.13 | lists/dev.lst-WER: 35.67 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 777.87
epoch:      223 | nupdates:        89646 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:29 | bch(ms): 1118.42 | smp(ms): 6.04 | fwd(ms): 417.75 | crit-fwd(ms): 21.16 | bwd(ms): 638.55 | optim(ms): 57.23 | loss:   11.30616 | train-TER: 42.63 | train-WER: 61.00 | lists/dev.lst-loss:    6.79989 | lists/dev.lst-TER: 20.41 | lists/dev.lst-WER: 35.24 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 781.68
epoch:      224 | nupdates:        90048 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:27 | bch(ms): 1113.07 | smp(ms): 4.46 | fwd(ms): 418.06 | crit-fwd(ms): 21.01 | bwd(ms): 633.15 | optim(ms): 57.31 | loss:   11.35378 | train-TER: 45.34 | train-WER: 62.81 | lists/dev.lst-loss:    6.98529 | lists/dev.lst-TER: 21.46 | lists/dev.lst-WER: 35.93 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 785.44
epoch:      225 | nupdates:        90450 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:30 | bch(ms): 1120.32 | smp(ms): 7.27 | fwd(ms): 419.52 | crit-fwd(ms): 21.15 | bwd(ms): 638.87 | optim(ms): 57.23 | loss:   11.37245 | train-TER: 45.70 | train-WER: 63.60 | lists/dev.lst-loss:    6.90978 | lists/dev.lst-TER: 21.21 | lists/dev.lst-WER: 36.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.35
epoch:      226 | nupdates:        90852 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:30 | bch(ms): 1121.51 | smp(ms): 6.56 | fwd(ms): 418.06 | crit-fwd(ms): 20.99 | bwd(ms): 641.05 | optim(ms): 57.22 | loss:   11.17685 | train-TER: 45.52 | train-WER: 64.04 | lists/dev.lst-loss:    6.79407 | lists/dev.lst-TER: 20.05 | lists/dev.lst-WER: 34.89 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 779.53
epoch:      227 | nupdates:        91254 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:36 | bch(ms): 1134.82 | smp(ms): 8.27 | fwd(ms): 417.47 | crit-fwd(ms): 21.13 | bwd(ms): 654.90 | optim(ms): 57.23 | loss:   11.31527 | train-TER: 40.23 | train-WER: 57.57 | lists/dev.lst-loss:    6.76190 | lists/dev.lst-TER: 19.93 | lists/dev.lst-WER: 34.87 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 770.38
epoch:      228 | nupdates:        91656 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:35 | bch(ms): 1134.21 | smp(ms): 6.39 | fwd(ms): 419.50 | crit-fwd(ms): 21.01 | bwd(ms): 652.53 | optim(ms): 57.22 | loss:   11.28642 | train-TER: 43.90 | train-WER: 61.89 | lists/dev.lst-loss:    6.92776 | lists/dev.lst-TER: 21.05 | lists/dev.lst-WER: 35.61 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 770.80
epoch:      229 | nupdates:        92058 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:29 | bch(ms): 1118.49 | smp(ms): 4.92 | fwd(ms): 418.72 | crit-fwd(ms): 21.08 | bwd(ms): 637.59 | optim(ms): 57.27 | loss:   11.27643 | train-TER: 46.77 | train-WER: 64.95 | lists/dev.lst-loss:    6.83402 | lists/dev.lst-TER: 20.42 | lists/dev.lst-WER: 35.21 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 781.63
epoch:      230 | nupdates:        92460 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:30 | bch(ms): 1120.39 | smp(ms): 7.38 | fwd(ms): 417.09 | crit-fwd(ms): 21.14 | bwd(ms): 641.19 | optim(ms): 57.23 | loss:   11.35871 | train-TER: 42.95 | train-WER: 61.34 | lists/dev.lst-loss:    6.82054 | lists/dev.lst-TER: 20.53 | lists/dev.lst-WER: 35.19 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.31
epoch:      231 | nupdates:        92862 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:30 | bch(ms): 1120.48 | smp(ms): 7.49 | fwd(ms): 418.10 | crit-fwd(ms): 21.08 | bwd(ms): 640.24 | optim(ms): 57.24 | loss:   11.56612 | train-TER: 49.68 | train-WER: 66.69 | lists/dev.lst-loss:    6.91017 | lists/dev.lst-TER: 21.23 | lists/dev.lst-WER: 35.68 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.25
epoch:      232 | nupdates:        93264 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:31 | bch(ms): 1123.74 | smp(ms): 8.22 | fwd(ms): 418.32 | crit-fwd(ms): 21.16 | bwd(ms): 643.02 | optim(ms): 57.21 | loss:   11.34977 | train-TER: 40.18 | train-WER: 58.00 | lists/dev.lst-loss:    6.70046 | lists/dev.lst-TER: 20.08 | lists/dev.lst-WER: 34.84 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 777.98
epoch:      233 | nupdates:        93666 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:34 | bch(ms): 1131.26 | smp(ms): 7.24 | fwd(ms): 418.40 | crit-fwd(ms): 20.99 | bwd(ms): 650.61 | optim(ms): 57.22 | loss:   11.22591 | train-TER: 41.61 | train-WER: 60.07 | lists/dev.lst-loss:    6.75398 | lists/dev.lst-TER: 19.89 | lists/dev.lst-WER: 34.82 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 772.81
epoch:      234 | nupdates:        94068 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:35 | bch(ms): 1132.11 | smp(ms): 6.94 | fwd(ms): 418.88 | crit-fwd(ms): 21.11 | bwd(ms): 650.90 | optim(ms): 57.24 | loss:   11.00878 | train-TER: 42.84 | train-WER: 60.60 | lists/dev.lst-loss:    6.84965 | lists/dev.lst-TER: 20.49 | lists/dev.lst-WER: 35.04 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 772.23
epoch:      235 | nupdates:        94470 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:29 | bch(ms): 1118.91 | smp(ms): 7.42 | fwd(ms): 417.00 | crit-fwd(ms): 21.15 | bwd(ms): 639.56 | optim(ms): 57.23 | loss:   11.32189 | train-TER: 38.02 | train-WER: 56.16 | lists/dev.lst-loss:    6.81756 | lists/dev.lst-TER: 20.86 | lists/dev.lst-WER: 35.29 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 781.34
epoch:      236 | nupdates:        94872 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:31 | bch(ms): 1123.14 | smp(ms): 7.24 | fwd(ms): 419.31 | crit-fwd(ms): 21.36 | bwd(ms): 641.70 | optim(ms): 57.21 | loss:   11.12376 | train-TER: 39.15 | train-WER: 57.22 | lists/dev.lst-loss:    6.85788 | lists/dev.lst-TER: 20.71 | lists/dev.lst-WER: 35.23 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 778.40
epoch:      237 | nupdates:        95274 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:30 | bch(ms): 1120.51 | smp(ms): 5.76 | fwd(ms): 418.50 | crit-fwd(ms): 20.98 | bwd(ms): 640.05 | optim(ms): 57.20 | loss:   11.04973 | train-TER: 43.80 | train-WER: 60.77 | lists/dev.lst-loss:    6.80430 | lists/dev.lst-TER: 20.59 | lists/dev.lst-WER: 35.09 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.23
epoch:      238 | nupdates:        95676 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:28 | bch(ms): 1115.83 | smp(ms): 6.42 | fwd(ms): 417.66 | crit-fwd(ms): 20.89 | bwd(ms): 636.04 | optim(ms): 57.24 | loss:   10.98742 | train-TER: 45.40 | train-WER: 61.95 | lists/dev.lst-loss:    6.83968 | lists/dev.lst-TER: 20.04 | lists/dev.lst-WER: 34.73 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 783.50
epoch:      239 | nupdates:        96078 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:36 | bch(ms): 1135.97 | smp(ms): 6.94 | fwd(ms): 419.49 | crit-fwd(ms): 21.11 | bwd(ms): 654.20 | optim(ms): 57.22 | loss:   11.19168 | train-TER: 46.59 | train-WER: 63.54 | lists/dev.lst-loss:    6.95753 | lists/dev.lst-TER: 21.54 | lists/dev.lst-WER: 35.90 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 769.61
epoch:      240 | nupdates:        96480 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:30 | bch(ms): 1120.58 | smp(ms): 5.98 | fwd(ms): 418.13 | crit-fwd(ms): 20.89 | bwd(ms): 640.13 | optim(ms): 57.23 | loss:   11.11112 | train-TER: 45.69 | train-WER: 63.95 | lists/dev.lst-loss:    6.71408 | lists/dev.lst-TER: 19.61 | lists/dev.lst-WER: 34.54 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.18
epoch:      241 | nupdates:        96882 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:35 | bch(ms): 1132.10 | smp(ms): 7.62 | fwd(ms): 418.14 | crit-fwd(ms): 21.06 | bwd(ms): 651.71 | optim(ms): 57.24 | loss:   11.23949 | train-TER: 43.75 | train-WER: 62.11 | lists/dev.lst-loss:    6.64316 | lists/dev.lst-TER: 19.81 | lists/dev.lst-WER: 34.49 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 772.24
epoch:      242 | nupdates:        97284 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:35 | bch(ms): 1132.39 | smp(ms): 4.26 | fwd(ms): 418.71 | crit-fwd(ms): 21.32 | bwd(ms): 651.51 | optim(ms): 57.25 | loss:   11.18350 | train-TER: 42.52 | train-WER: 60.17 | lists/dev.lst-loss:    6.76315 | lists/dev.lst-TER: 20.53 | lists/dev.lst-WER: 35.04 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 772.04
epoch:      243 | nupdates:        97686 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:29 | bch(ms): 1117.32 | smp(ms): 6.08 | fwd(ms): 418.90 | crit-fwd(ms): 21.02 | bwd(ms): 636.55 | optim(ms): 57.27 | loss:   11.22291 | train-TER: 45.10 | train-WER: 62.08 | lists/dev.lst-loss:    6.80712 | lists/dev.lst-TER: 20.70 | lists/dev.lst-WER: 35.11 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 782.45
epoch:      244 | nupdates:        98088 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:30 | bch(ms): 1121.87 | smp(ms): 7.04 | fwd(ms): 418.33 | crit-fwd(ms): 21.11 | bwd(ms): 641.29 | optim(ms): 57.21 | loss:   11.18604 | train-TER: 40.21 | train-WER: 57.68 | lists/dev.lst-loss:    6.79022 | lists/dev.lst-TER: 20.35 | lists/dev.lst-WER: 34.76 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 779.28
epoch:      245 | nupdates:        98490 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:29 | bch(ms): 1119.09 | smp(ms): 6.54 | fwd(ms): 418.17 | crit-fwd(ms): 21.22 | bwd(ms): 638.78 | optim(ms): 57.24 | loss:   11.07367 | train-TER: 41.98 | train-WER: 59.97 | lists/dev.lst-loss:    6.84947 | lists/dev.lst-TER: 20.99 | lists/dev.lst-WER: 35.35 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 781.21
epoch:      246 | nupdates:        98892 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:31 | bch(ms): 1123.90 | smp(ms): 6.66 | fwd(ms): 419.24 | crit-fwd(ms): 21.00 | bwd(ms): 642.09 | optim(ms): 57.21 | loss:   11.04590 | train-TER: 45.50 | train-WER: 63.13 | lists/dev.lst-loss:    6.79369 | lists/dev.lst-TER: 20.47 | lists/dev.lst-WER: 34.95 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 777.87
epoch:      247 | nupdates:        99294 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:30 | bch(ms): 1120.00 | smp(ms): 7.35 | fwd(ms): 418.30 | crit-fwd(ms): 20.99 | bwd(ms): 639.64 | optim(ms): 57.22 | loss:   11.00134 | train-TER: 41.46 | train-WER: 59.29 | lists/dev.lst-loss:    6.85750 | lists/dev.lst-TER: 20.40 | lists/dev.lst-WER: 34.94 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.58
epoch:      248 | nupdates:        99696 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:31 | bch(ms): 1122.13 | smp(ms): 7.12 | fwd(ms): 418.69 | crit-fwd(ms): 21.17 | bwd(ms): 641.34 | optim(ms): 57.22 | loss:   11.27691 | train-TER: 43.79 | train-WER: 60.88 | lists/dev.lst-loss:    6.72764 | lists/dev.lst-TER: 19.96 | lists/dev.lst-WER: 34.58 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 779.10
epoch:      249 | nupdates:       100098 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:30 | bch(ms): 1121.45 | smp(ms): 7.58 | fwd(ms): 418.00 | crit-fwd(ms): 21.31 | bwd(ms): 641.27 | optim(ms): 57.22 | loss:   10.83702 | train-TER: 42.93 | train-WER: 60.01 | lists/dev.lst-loss:    6.83052 | lists/dev.lst-TER: 20.44 | lists/dev.lst-WER: 34.92 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 779.57
epoch:      250 | nupdates:       100500 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:31 | bch(ms): 1122.41 | smp(ms): 7.24 | fwd(ms): 417.67 | crit-fwd(ms): 21.05 | bwd(ms): 642.77 | optim(ms): 57.22 | loss:   11.11319 | train-TER: 43.88 | train-WER: 62.51 | lists/dev.lst-loss:    6.77070 | lists/dev.lst-TER: 20.47 | lists/dev.lst-WER: 34.90 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 778.90
epoch:      251 | nupdates:       100902 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:31 | bch(ms): 1122.82 | smp(ms): 7.18 | fwd(ms): 418.80 | crit-fwd(ms): 21.01 | bwd(ms): 642.03 | optim(ms): 57.21 | loss:   11.04168 | train-TER: 44.84 | train-WER: 63.76 | lists/dev.lst-loss:    6.69973 | lists/dev.lst-TER: 19.36 | lists/dev.lst-WER: 34.19 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 778.62
epoch:      252 | nupdates:       101304 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:35 | bch(ms): 1133.04 | smp(ms): 7.78 | fwd(ms): 419.10 | crit-fwd(ms): 21.38 | bwd(ms): 651.87 | optim(ms): 57.25 | loss:   11.08078 | train-TER: 44.58 | train-WER: 61.91 | lists/dev.lst-loss:    6.76998 | lists/dev.lst-TER: 19.82 | lists/dev.lst-WER: 34.39 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 771.59
epoch:      253 | nupdates:       101706 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:28 | bch(ms): 1115.26 | smp(ms): 5.35 | fwd(ms): 417.59 | crit-fwd(ms): 21.01 | bwd(ms): 635.27 | optim(ms): 57.26 | loss:   11.24814 | train-TER: 38.11 | train-WER: 56.34 | lists/dev.lst-loss:    6.78449 | lists/dev.lst-TER: 20.79 | lists/dev.lst-WER: 35.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 783.90
epoch:      254 | nupdates:       102108 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:28 | bch(ms): 1115.00 | smp(ms): 6.07 | fwd(ms): 417.59 | crit-fwd(ms): 21.08 | bwd(ms): 635.41 | optim(ms): 57.24 | loss:   11.06087 | train-TER: 41.26 | train-WER: 59.08 | lists/dev.lst-loss:    6.90967 | lists/dev.lst-TER: 21.13 | lists/dev.lst-WER: 35.64 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 784.08
epoch:      255 | nupdates:       102510 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:29 | bch(ms): 1118.92 | smp(ms): 5.45 | fwd(ms): 419.11 | crit-fwd(ms): 20.99 | bwd(ms): 637.59 | optim(ms): 57.28 | loss:   11.10428 | train-TER: 42.38 | train-WER: 60.94 | lists/dev.lst-loss:    6.83471 | lists/dev.lst-TER: 20.47 | lists/dev.lst-WER: 34.83 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 781.34
epoch:      256 | nupdates:       102912 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:30 | bch(ms): 1119.90 | smp(ms): 5.78 | fwd(ms): 418.65 | crit-fwd(ms): 20.97 | bwd(ms): 639.20 | optim(ms): 57.24 | loss:   11.01318 | train-TER: 48.53 | train-WER: 67.12 | lists/dev.lst-loss:    6.69787 | lists/dev.lst-TER: 19.96 | lists/dev.lst-WER: 34.38 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.65
epoch:      257 | nupdates:       103314 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:32 | bch(ms): 1124.40 | smp(ms): 7.39 | fwd(ms): 418.11 | crit-fwd(ms): 21.08 | bwd(ms): 643.84 | optim(ms): 57.19 | loss:   11.09951 | train-TER: 42.85 | train-WER: 60.55 | lists/dev.lst-loss:    6.75729 | lists/dev.lst-TER: 20.51 | lists/dev.lst-WER: 34.79 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 777.53
epoch:      258 | nupdates:       103716 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:31 | bch(ms): 1123.63 | smp(ms): 7.41 | fwd(ms): 419.20 | crit-fwd(ms): 21.06 | bwd(ms): 642.51 | optim(ms): 57.22 | loss:   11.07322 | train-TER: 39.44 | train-WER: 57.80 | lists/dev.lst-loss:    6.73136 | lists/dev.lst-TER: 20.08 | lists/dev.lst-WER: 34.62 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 778.06
epoch:      259 | nupdates:       104118 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:30 | bch(ms): 1119.56 | smp(ms): 4.98 | fwd(ms): 418.44 | crit-fwd(ms): 20.80 | bwd(ms): 638.01 | optim(ms): 57.23 | loss:   11.11710 | train-TER: 37.77 | train-WER: 55.48 | lists/dev.lst-loss:    6.74001 | lists/dev.lst-TER: 20.68 | lists/dev.lst-WER: 35.07 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.88
epoch:      260 | nupdates:       104520 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1121.68 | smp(ms): 6.34 | fwd(ms): 419.24 | crit-fwd(ms): 21.05 | bwd(ms): 640.53 | optim(ms): 57.22 | loss:   11.03792 | train-TER: 45.23 | train-WER: 63.77 | lists/dev.lst-loss:    6.85008 | lists/dev.lst-TER: 20.61 | lists/dev.lst-WER: 34.95 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 118 | hrs:   97.62 | thrpt(sec/sec): 779.41
epoch:      261 | nupdates:       104922 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1120.75 | smp(ms): 6.28 | fwd(ms): 419.29 | crit-fwd(ms): 21.34 | bwd(ms): 639.37 | optim(ms): 57.24 | loss:   10.83485 | train-TER: 41.45 | train-WER: 59.86 | lists/dev.lst-loss:    6.70959 | lists/dev.lst-TER: 20.10 | lists/dev.lst-WER: 34.57 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.05
epoch:      262 | nupdates:       105324 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:29 | bch(ms): 1118.72 | smp(ms): 5.99 | fwd(ms): 417.15 | crit-fwd(ms): 20.94 | bwd(ms): 639.49 | optim(ms): 57.22 | loss:   11.04013 | train-TER: 49.24 | train-WER: 67.48 | lists/dev.lst-loss:    6.66456 | lists/dev.lst-TER: 20.04 | lists/dev.lst-WER: 34.44 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 781.47
epoch:      263 | nupdates:       105726 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1120.00 | smp(ms): 6.30 | fwd(ms): 419.03 | crit-fwd(ms): 21.12 | bwd(ms): 638.98 | optim(ms): 57.24 | loss:   10.96142 | train-TER: 43.78 | train-WER: 61.61 | lists/dev.lst-loss:    6.72319 | lists/dev.lst-TER: 20.19 | lists/dev.lst-WER: 34.60 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.58
epoch:      264 | nupdates:       106128 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:29 | bch(ms): 1119.28 | smp(ms): 8.23 | fwd(ms): 418.56 | crit-fwd(ms): 21.09 | bwd(ms): 638.49 | optim(ms): 57.26 | loss:   11.09634 | train-TER: 40.15 | train-WER: 57.50 | lists/dev.lst-loss:    6.70202 | lists/dev.lst-TER: 20.06 | lists/dev.lst-WER: 34.53 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 781.08
epoch:      265 | nupdates:       106530 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1121.43 | smp(ms): 6.62 | fwd(ms): 419.79 | crit-fwd(ms): 21.00 | bwd(ms): 639.61 | optim(ms): 57.23 | loss:   11.13880 | train-TER: 45.62 | train-WER: 63.36 | lists/dev.lst-loss:    6.71379 | lists/dev.lst-TER: 19.85 | lists/dev.lst-WER: 34.32 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 779.58
epoch:      266 | nupdates:       106932 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:32 | bch(ms): 1124.40 | smp(ms): 6.82 | fwd(ms): 418.56 | crit-fwd(ms): 20.97 | bwd(ms): 643.30 | optim(ms): 57.22 | loss:   10.88673 | train-TER: 42.52 | train-WER: 61.18 | lists/dev.lst-loss:    6.65110 | lists/dev.lst-TER: 19.89 | lists/dev.lst-WER: 34.37 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 777.52
epoch:      267 | nupdates:       107334 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:31 | bch(ms): 1123.42 | smp(ms): 6.28 | fwd(ms): 421.13 | crit-fwd(ms): 21.31 | bwd(ms): 640.06 | optim(ms): 57.23 | loss:   10.95675 | train-TER: 39.80 | train-WER: 58.01 | lists/dev.lst-loss:    6.72858 | lists/dev.lst-TER: 20.40 | lists/dev.lst-WER: 34.68 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 778.20
epoch:      268 | nupdates:       107736 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:31 | bch(ms): 1124.18 | smp(ms): 8.59 | fwd(ms): 419.11 | crit-fwd(ms): 21.19 | bwd(ms): 642.87 | optim(ms): 57.23 | loss:   11.17714 | train-TER: 48.56 | train-WER: 66.28 | lists/dev.lst-loss:    6.67676 | lists/dev.lst-TER: 20.03 | lists/dev.lst-WER: 34.48 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 777.68
epoch:      269 | nupdates:       108138 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1119.81 | smp(ms): 6.28 | fwd(ms): 420.07 | crit-fwd(ms): 21.05 | bwd(ms): 637.69 | optim(ms): 57.25 | loss:   10.78095 | train-TER: 47.56 | train-WER: 66.00 | lists/dev.lst-loss:    6.71272 | lists/dev.lst-TER: 20.10 | lists/dev.lst-WER: 34.53 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.71
epoch:      270 | nupdates:       108540 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:28 | bch(ms): 1116.39 | smp(ms): 6.95 | fwd(ms): 417.47 | crit-fwd(ms): 21.09 | bwd(ms): 636.94 | optim(ms): 57.24 | loss:   11.03590 | train-TER: 46.37 | train-WER: 64.37 | lists/dev.lst-loss:    6.73831 | lists/dev.lst-TER: 20.14 | lists/dev.lst-WER: 34.44 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 783.10
epoch:      271 | nupdates:       108942 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1121.00 | smp(ms): 6.99 | fwd(ms): 418.83 | crit-fwd(ms): 21.24 | bwd(ms): 639.76 | optim(ms): 57.28 | loss:   10.93185 | train-TER: 45.13 | train-WER: 63.25 | lists/dev.lst-loss:    6.76600 | lists/dev.lst-TER: 20.28 | lists/dev.lst-WER: 34.57 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 779.88
epoch:      272 | nupdates:       109344 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:31 | bch(ms): 1122.13 | smp(ms): 7.83 | fwd(ms): 417.76 | crit-fwd(ms): 21.00 | bwd(ms): 642.48 | optim(ms): 57.23 | loss:   10.85380 | train-TER: 41.66 | train-WER: 60.17 | lists/dev.lst-loss:    6.65032 | lists/dev.lst-TER: 19.56 | lists/dev.lst-WER: 34.06 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 779.10
epoch:      273 | nupdates:       109746 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:34 | bch(ms): 1131.82 | smp(ms): 5.96 | fwd(ms): 418.44 | crit-fwd(ms): 20.95 | bwd(ms): 651.34 | optim(ms): 57.24 | loss:   10.94733 | train-TER: 45.17 | train-WER: 62.96 | lists/dev.lst-loss:    6.74055 | lists/dev.lst-TER: 20.05 | lists/dev.lst-WER: 34.41 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 772.42
epoch:      274 | nupdates:       110148 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1120.80 | smp(ms): 7.06 | fwd(ms): 417.97 | crit-fwd(ms): 21.06 | bwd(ms): 640.52 | optim(ms): 57.24 | loss:   11.00493 | train-TER: 49.53 | train-WER: 66.56 | lists/dev.lst-loss:    6.74047 | lists/dev.lst-TER: 19.95 | lists/dev.lst-WER: 34.32 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.02
epoch:      275 | nupdates:       110550 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:32 | bch(ms): 1125.21 | smp(ms): 6.50 | fwd(ms): 419.94 | crit-fwd(ms): 21.05 | bwd(ms): 643.25 | optim(ms): 57.22 | loss:   10.80539 | train-TER: 43.48 | train-WER: 61.44 | lists/dev.lst-loss:    6.75868 | lists/dev.lst-TER: 20.36 | lists/dev.lst-WER: 34.69 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 776.96
epoch:      276 | nupdates:       110952 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:29 | bch(ms): 1118.59 | smp(ms): 8.57 | fwd(ms): 418.32 | crit-fwd(ms): 21.04 | bwd(ms): 638.16 | optim(ms): 57.21 | loss:   11.12784 | train-TER: 42.98 | train-WER: 60.52 | lists/dev.lst-loss:    6.71512 | lists/dev.lst-TER: 20.46 | lists/dev.lst-WER: 34.68 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 781.56
epoch:      277 | nupdates:       111354 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1119.59 | smp(ms): 6.90 | fwd(ms): 417.83 | crit-fwd(ms): 21.05 | bwd(ms): 639.44 | optim(ms): 57.21 | loss:   10.87850 | train-TER: 41.97 | train-WER: 60.31 | lists/dev.lst-loss:    6.68581 | lists/dev.lst-TER: 19.65 | lists/dev.lst-WER: 34.08 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.87
epoch:      278 | nupdates:       111756 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:31 | bch(ms): 1121.92 | smp(ms): 7.11 | fwd(ms): 418.23 | crit-fwd(ms): 21.00 | bwd(ms): 641.45 | optim(ms): 57.21 | loss:   11.03103 | train-TER: 51.17 | train-WER: 68.92 | lists/dev.lst-loss:    6.74854 | lists/dev.lst-TER: 19.91 | lists/dev.lst-WER: 34.30 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 779.24
epoch:      279 | nupdates:       112158 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:29 | bch(ms): 1118.44 | smp(ms): 7.12 | fwd(ms): 417.95 | crit-fwd(ms): 20.96 | bwd(ms): 638.54 | optim(ms): 57.26 | loss:   10.86679 | train-TER: 42.17 | train-WER: 60.41 | lists/dev.lst-loss:    6.67381 | lists/dev.lst-TER: 19.68 | lists/dev.lst-WER: 34.11 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 781.67
epoch:      280 | nupdates:       112560 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:29 | bch(ms): 1117.98 | smp(ms): 6.25 | fwd(ms): 418.75 | crit-fwd(ms): 21.21 | bwd(ms): 637.21 | optim(ms): 57.25 | loss:   11.15947 | train-TER: 44.50 | train-WER: 63.00 | lists/dev.lst-loss:    6.68154 | lists/dev.lst-TER: 19.84 | lists/dev.lst-WER: 34.22 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.99
epoch:      281 | nupdates:       112962 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1120.49 | smp(ms): 4.78 | fwd(ms): 419.11 | crit-fwd(ms): 20.95 | bwd(ms): 638.88 | optim(ms): 57.23 | loss:   10.88759 | train-TER: 42.82 | train-WER: 59.89 | lists/dev.lst-loss:    6.73656 | lists/dev.lst-TER: 20.24 | lists/dev.lst-WER: 34.40 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.24
epoch:      282 | nupdates:       113364 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:31 | bch(ms): 1123.92 | smp(ms): 6.08 | fwd(ms): 419.17 | crit-fwd(ms): 21.08 | bwd(ms): 642.55 | optim(ms): 57.23 | loss:   10.83481 | train-TER: 36.57 | train-WER: 53.01 | lists/dev.lst-loss:    6.68294 | lists/dev.lst-TER: 20.16 | lists/dev.lst-WER: 34.37 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 777.86
epoch:      283 | nupdates:       113766 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:29 | bch(ms): 1118.65 | smp(ms): 7.74 | fwd(ms): 417.82 | crit-fwd(ms): 21.46 | bwd(ms): 638.43 | optim(ms): 57.23 | loss:   10.79162 | train-TER: 42.49 | train-WER: 60.67 | lists/dev.lst-loss:    6.64335 | lists/dev.lst-TER: 19.98 | lists/dev.lst-WER: 34.25 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 781.52
epoch:      284 | nupdates:       114168 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:29 | bch(ms): 1118.74 | smp(ms): 6.28 | fwd(ms): 418.41 | crit-fwd(ms): 21.20 | bwd(ms): 638.25 | optim(ms): 57.24 | loss:   11.00945 | train-TER: 41.27 | train-WER: 59.70 | lists/dev.lst-loss:    6.71452 | lists/dev.lst-TER: 19.82 | lists/dev.lst-WER: 34.16 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.46
epoch:      285 | nupdates:       114570 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1120.92 | smp(ms): 8.06 | fwd(ms): 417.63 | crit-fwd(ms): 20.98 | bwd(ms): 640.99 | optim(ms): 57.26 | loss:   10.71856 | train-TER: 38.88 | train-WER: 56.04 | lists/dev.lst-loss:    6.69798 | lists/dev.lst-TER: 20.33 | lists/dev.lst-WER: 34.56 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 779.94
epoch:      286 | nupdates:       114972 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:31 | bch(ms): 1123.79 | smp(ms): 6.23 | fwd(ms): 420.08 | crit-fwd(ms): 21.22 | bwd(ms): 641.90 | optim(ms): 57.22 | loss:   10.65459 | train-TER: 34.91 | train-WER: 53.93 | lists/dev.lst-loss:    6.71353 | lists/dev.lst-TER: 20.19 | lists/dev.lst-WER: 34.47 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 777.95
epoch:      287 | nupdates:       115374 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1120.05 | smp(ms): 7.07 | fwd(ms): 417.90 | crit-fwd(ms): 21.16 | bwd(ms): 640.21 | optim(ms): 57.23 | loss:   10.84945 | train-TER: 40.57 | train-WER: 58.15 | lists/dev.lst-loss:    6.72145 | lists/dev.lst-TER: 20.18 | lists/dev.lst-WER: 34.44 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.54
epoch:      288 | nupdates:       115776 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:31 | bch(ms): 1123.59 | smp(ms): 7.89 | fwd(ms): 419.67 | crit-fwd(ms): 21.07 | bwd(ms): 641.55 | optim(ms): 57.25 | loss:   10.99489 | train-TER: 44.54 | train-WER: 63.27 | lists/dev.lst-loss:    6.75089 | lists/dev.lst-TER: 20.29 | lists/dev.lst-WER: 34.47 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 778.09
epoch:      289 | nupdates:       116178 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:28 | bch(ms): 1115.77 | smp(ms): 6.60 | fwd(ms): 417.77 | crit-fwd(ms): 21.13 | bwd(ms): 635.72 | optim(ms): 57.25 | loss:   10.75101 | train-TER: 47.20 | train-WER: 65.20 | lists/dev.lst-loss:    6.71355 | lists/dev.lst-TER: 19.99 | lists/dev.lst-WER: 34.26 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 783.54
epoch:      290 | nupdates:       116580 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:28 | bch(ms): 1116.17 | smp(ms): 5.01 | fwd(ms): 417.35 | crit-fwd(ms): 21.22 | bwd(ms): 636.82 | optim(ms): 57.31 | loss:   10.87084 | train-TER: 42.11 | train-WER: 61.14 | lists/dev.lst-loss:    6.62369 | lists/dev.lst-TER: 19.82 | lists/dev.lst-WER: 34.05 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 783.26
epoch:      291 | nupdates:       116982 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:35 | bch(ms): 1133.74 | smp(ms): 6.64 | fwd(ms): 420.00 | crit-fwd(ms): 21.20 | bwd(ms): 651.73 | optim(ms): 57.22 | loss:   10.79659 | train-TER: 43.60 | train-WER: 61.68 | lists/dev.lst-loss:    6.74688 | lists/dev.lst-TER: 20.03 | lists/dev.lst-WER: 34.39 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 771.12
epoch:      292 | nupdates:       117384 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:31 | bch(ms): 1121.99 | smp(ms): 7.09 | fwd(ms): 418.69 | crit-fwd(ms): 21.24 | bwd(ms): 639.50 | optim(ms): 57.25 | loss:   11.02203 | train-TER: 45.46 | train-WER: 62.18 | lists/dev.lst-loss:    6.72946 | lists/dev.lst-TER: 19.99 | lists/dev.lst-WER: 34.24 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 779.20
epoch:      293 | nupdates:       117786 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1119.59 | smp(ms): 5.23 | fwd(ms): 419.82 | crit-fwd(ms): 20.98 | bwd(ms): 637.83 | optim(ms): 57.24 | loss:   10.71788 | train-TER: 45.93 | train-WER: 62.56 | lists/dev.lst-loss:    6.67587 | lists/dev.lst-TER: 19.74 | lists/dev.lst-WER: 34.05 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.86
epoch:      294 | nupdates:       118188 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:34 | bch(ms): 1131.09 | smp(ms): 6.03 | fwd(ms): 418.64 | crit-fwd(ms): 21.14 | bwd(ms): 650.45 | optim(ms): 57.29 | loss:   10.81870 | train-TER: 42.28 | train-WER: 60.43 | lists/dev.lst-loss:    6.71912 | lists/dev.lst-TER: 20.19 | lists/dev.lst-WER: 34.37 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 772.92
epoch:      295 | nupdates:       118590 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1121.12 | smp(ms): 5.62 | fwd(ms): 418.59 | crit-fwd(ms): 20.94 | bwd(ms): 639.79 | optim(ms): 57.21 | loss:   10.74011 | train-TER: 33.24 | train-WER: 50.45 | lists/dev.lst-loss:    6.68437 | lists/dev.lst-TER: 20.42 | lists/dev.lst-WER: 34.58 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 779.80
epoch:      296 | nupdates:       118992 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:31 | bch(ms): 1122.63 | smp(ms): 6.35 | fwd(ms): 419.74 | crit-fwd(ms): 21.44 | bwd(ms): 640.33 | optim(ms): 57.22 | loss:   10.97935 | train-TER: 40.88 | train-WER: 58.69 | lists/dev.lst-loss:    6.69050 | lists/dev.lst-TER: 20.36 | lists/dev.lst-WER: 34.54 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 118 | hrs:   97.62 | thrpt(sec/sec): 778.75
epoch:      297 | nupdates:       119394 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:31 | bch(ms): 1122.56 | smp(ms): 6.09 | fwd(ms): 419.98 | crit-fwd(ms): 21.03 | bwd(ms): 640.21 | optim(ms): 57.23 | loss:   10.78796 | train-TER: 39.46 | train-WER: 56.49 | lists/dev.lst-loss:    6.62739 | lists/dev.lst-TER: 19.48 | lists/dev.lst-WER: 33.75 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 778.80
epoch:      298 | nupdates:       119796 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:34 | bch(ms): 1130.05 | smp(ms): 5.78 | fwd(ms): 417.43 | crit-fwd(ms): 21.06 | bwd(ms): 650.62 | optim(ms): 57.25 | loss:   10.89956 | train-TER: 41.28 | train-WER: 59.25 | lists/dev.lst-loss:    6.69034 | lists/dev.lst-TER: 19.87 | lists/dev.lst-WER: 34.14 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 118 | hrs:   97.62 | thrpt(sec/sec): 773.64
epoch:      299 | nupdates:       120198 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:31 | bch(ms): 1122.57 | smp(ms): 7.73 | fwd(ms): 418.21 | crit-fwd(ms): 21.10 | bwd(ms): 642.34 | optim(ms): 57.23 | loss:   10.77005 | train-TER: 39.67 | train-WER: 56.60 | lists/dev.lst-loss:    6.67104 | lists/dev.lst-TER: 20.02 | lists/dev.lst-WER: 34.18 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 778.79
epoch:      300 | nupdates:       120600 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1120.34 | smp(ms): 6.57 | fwd(ms): 417.52 | crit-fwd(ms): 20.98 | bwd(ms): 640.47 | optim(ms): 57.22 | loss:   10.81043 | train-TER: 32.92 | train-WER: 50.34 | lists/dev.lst-loss:    6.65966 | lists/dev.lst-TER: 19.93 | lists/dev.lst-WER: 34.11 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.34
epoch:      301 | nupdates:       121002 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:32 | bch(ms): 1124.99 | smp(ms): 8.63 | fwd(ms): 418.01 | crit-fwd(ms): 21.24 | bwd(ms): 644.50 | optim(ms): 57.20 | loss:   10.77536 | train-TER: 40.79 | train-WER: 59.21 | lists/dev.lst-loss:    6.66066 | lists/dev.lst-TER: 19.78 | lists/dev.lst-WER: 34.04 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 777.12
epoch:      302 | nupdates:       121404 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1119.83 | smp(ms): 6.81 | fwd(ms): 418.93 | crit-fwd(ms): 21.06 | bwd(ms): 638.90 | optim(ms): 57.25 | loss:   10.70175 | train-TER: 39.35 | train-WER: 57.08 | lists/dev.lst-loss:    6.77147 | lists/dev.lst-TER: 20.12 | lists/dev.lst-WER: 34.33 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.69
epoch:      303 | nupdates:       121806 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:31 | bch(ms): 1122.50 | smp(ms): 7.28 | fwd(ms): 417.64 | crit-fwd(ms): 21.13 | bwd(ms): 642.63 | optim(ms): 57.23 | loss:   10.68096 | train-TER: 43.08 | train-WER: 60.83 | lists/dev.lst-loss:    6.63917 | lists/dev.lst-TER: 19.94 | lists/dev.lst-WER: 34.14 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 778.84
epoch:      304 | nupdates:       122208 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:32 | bch(ms): 1125.04 | smp(ms): 8.38 | fwd(ms): 419.41 | crit-fwd(ms): 20.99 | bwd(ms): 643.42 | optim(ms): 57.22 | loss:   10.79036 | train-TER: 41.55 | train-WER: 59.67 | lists/dev.lst-loss:    6.69519 | lists/dev.lst-TER: 19.95 | lists/dev.lst-WER: 34.19 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 777.09
epoch:      305 | nupdates:       122610 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:31 | bch(ms): 1122.74 | smp(ms): 8.37 | fwd(ms): 417.39 | crit-fwd(ms): 21.45 | bwd(ms): 642.71 | optim(ms): 57.24 | loss:   10.74811 | train-TER: 43.41 | train-WER: 62.10 | lists/dev.lst-loss:    6.68067 | lists/dev.lst-TER: 19.86 | lists/dev.lst-WER: 34.04 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 778.67
epoch:      306 | nupdates:       123012 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1121.50 | smp(ms): 7.21 | fwd(ms): 418.78 | crit-fwd(ms): 20.91 | bwd(ms): 640.54 | optim(ms): 57.23 | loss:   10.82780 | train-TER: 39.32 | train-WER: 56.80 | lists/dev.lst-loss:    6.68922 | lists/dev.lst-TER: 19.96 | lists/dev.lst-WER: 34.10 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 779.53
epoch:      307 | nupdates:       123414 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1121.33 | smp(ms): 5.98 | fwd(ms): 418.25 | crit-fwd(ms): 21.02 | bwd(ms): 640.78 | optim(ms): 57.23 | loss:   10.77024 | train-TER: 42.98 | train-WER: 60.80 | lists/dev.lst-loss:    6.69091 | lists/dev.lst-TER: 19.76 | lists/dev.lst-WER: 34.01 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 779.65
epoch:      308 | nupdates:       123816 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:31 | bch(ms): 1123.24 | smp(ms): 7.75 | fwd(ms): 418.50 | crit-fwd(ms): 21.28 | bwd(ms): 642.70 | optim(ms): 57.22 | loss:   10.79831 | train-TER: 47.42 | train-WER: 65.42 | lists/dev.lst-loss:    6.73109 | lists/dev.lst-TER: 20.12 | lists/dev.lst-WER: 34.32 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 778.33
epoch:      309 | nupdates:       124218 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1121.42 | smp(ms): 6.56 | fwd(ms): 418.40 | crit-fwd(ms): 21.13 | bwd(ms): 641.11 | optim(ms): 57.22 | loss:   10.83720 | train-TER: 47.26 | train-WER: 64.28 | lists/dev.lst-loss:    6.59614 | lists/dev.lst-TER: 19.55 | lists/dev.lst-WER: 33.85 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 779.59
epoch:      310 | nupdates:       124620 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:32 | bch(ms): 1124.64 | smp(ms): 6.50 | fwd(ms): 418.93 | crit-fwd(ms): 21.01 | bwd(ms): 643.30 | optim(ms): 57.22 | loss:   10.66964 | train-TER: 45.04 | train-WER: 61.98 | lists/dev.lst-loss:    6.65539 | lists/dev.lst-TER: 19.75 | lists/dev.lst-WER: 33.97 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 777.36
epoch:      311 | nupdates:       125022 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:31 | bch(ms): 1122.89 | smp(ms): 7.20 | fwd(ms): 419.49 | crit-fwd(ms): 21.05 | bwd(ms): 641.41 | optim(ms): 57.23 | loss:   10.77329 | train-TER: 44.26 | train-WER: 61.64 | lists/dev.lst-loss:    6.66448 | lists/dev.lst-TER: 20.25 | lists/dev.lst-WER: 34.39 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 778.57
epoch:      312 | nupdates:       125424 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1121.31 | smp(ms): 8.00 | fwd(ms): 417.83 | crit-fwd(ms): 21.16 | bwd(ms): 641.28 | optim(ms): 57.24 | loss:   10.75939 | train-TER: 36.91 | train-WER: 54.57 | lists/dev.lst-loss:    6.65007 | lists/dev.lst-TER: 19.75 | lists/dev.lst-WER: 33.99 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 779.66
epoch:      313 | nupdates:       125826 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1120.29 | smp(ms): 8.35 | fwd(ms): 418.65 | crit-fwd(ms): 21.17 | bwd(ms): 639.55 | optim(ms): 57.23 | loss:   10.73199 | train-TER: 42.92 | train-WER: 60.65 | lists/dev.lst-loss:    6.68610 | lists/dev.lst-TER: 19.93 | lists/dev.lst-WER: 34.14 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.38
epoch:      314 | nupdates:       126228 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:32 | bch(ms): 1124.67 | smp(ms): 5.97 | fwd(ms): 419.82 | crit-fwd(ms): 20.91 | bwd(ms): 642.55 | optim(ms): 57.22 | loss:   10.88882 | train-TER: 43.85 | train-WER: 61.34 | lists/dev.lst-loss:    6.73855 | lists/dev.lst-TER: 19.95 | lists/dev.lst-WER: 34.07 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 777.34
epoch:      315 | nupdates:       126630 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1120.69 | smp(ms): 6.35 | fwd(ms): 418.62 | crit-fwd(ms): 21.18 | bwd(ms): 639.94 | optim(ms): 57.22 | loss:   10.61482 | train-TER: 37.20 | train-WER: 55.39 | lists/dev.lst-loss:    6.70637 | lists/dev.lst-TER: 19.56 | lists/dev.lst-WER: 33.85 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.10
epoch:      316 | nupdates:       127032 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:29 | bch(ms): 1118.74 | smp(ms): 7.50 | fwd(ms): 417.94 | crit-fwd(ms): 21.16 | bwd(ms): 638.72 | optim(ms): 57.25 | loss:   10.90136 | train-TER: 42.60 | train-WER: 61.17 | lists/dev.lst-loss:    6.65119 | lists/dev.lst-TER: 19.82 | lists/dev.lst-WER: 34.01 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.46
epoch:      317 | nupdates:       127434 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1120.30 | smp(ms): 6.25 | fwd(ms): 418.80 | crit-fwd(ms): 21.12 | bwd(ms): 639.20 | optim(ms): 57.24 | loss:   10.88599 | train-TER: 40.91 | train-WER: 59.08 | lists/dev.lst-loss:    6.73520 | lists/dev.lst-TER: 19.86 | lists/dev.lst-WER: 34.06 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.37
epoch:      318 | nupdates:       127836 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1119.89 | smp(ms): 8.39 | fwd(ms): 417.60 | crit-fwd(ms): 21.16 | bwd(ms): 640.08 | optim(ms): 57.27 | loss:   10.65374 | train-TER: 37.64 | train-WER: 55.30 | lists/dev.lst-loss:    6.62736 | lists/dev.lst-TER: 19.48 | lists/dev.lst-WER: 33.75 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.66
epoch:      319 | nupdates:       128238 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:35 | bch(ms): 1132.73 | smp(ms): 7.64 | fwd(ms): 417.82 | crit-fwd(ms): 21.12 | bwd(ms): 653.03 | optim(ms): 57.24 | loss:   10.60002 | train-TER: 41.01 | train-WER: 58.90 | lists/dev.lst-loss:    6.71207 | lists/dev.lst-TER: 19.66 | lists/dev.lst-WER: 33.92 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 771.81
epoch:      320 | nupdates:       128640 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:31 | bch(ms): 1124.00 | smp(ms): 7.56 | fwd(ms): 419.28 | crit-fwd(ms): 21.06 | bwd(ms): 642.56 | optim(ms): 57.25 | loss:   10.76944 | train-TER: 46.30 | train-WER: 63.90 | lists/dev.lst-loss:    6.69706 | lists/dev.lst-TER: 19.84 | lists/dev.lst-WER: 33.99 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 777.80
epoch:      321 | nupdates:       129042 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:29 | bch(ms): 1118.98 | smp(ms): 5.75 | fwd(ms): 419.26 | crit-fwd(ms): 21.06 | bwd(ms): 637.64 | optim(ms): 57.25 | loss:   10.73401 | train-TER: 53.35 | train-WER: 70.94 | lists/dev.lst-loss:    6.66058 | lists/dev.lst-TER: 19.50 | lists/dev.lst-WER: 33.79 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 781.29
epoch:      322 | nupdates:       129444 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:31 | bch(ms): 1122.78 | smp(ms): 6.89 | fwd(ms): 418.60 | crit-fwd(ms): 21.12 | bwd(ms): 641.97 | optim(ms): 57.23 | loss:   10.62311 | train-TER: 38.92 | train-WER: 57.53 | lists/dev.lst-loss:    6.66115 | lists/dev.lst-TER: 19.57 | lists/dev.lst-WER: 33.85 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 778.65
epoch:      323 | nupdates:       129846 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1119.84 | smp(ms): 5.79 | fwd(ms): 417.97 | crit-fwd(ms): 21.07 | bwd(ms): 639.58 | optim(ms): 57.21 | loss:   10.70284 | train-TER: 46.31 | train-WER: 64.30 | lists/dev.lst-loss:    6.67914 | lists/dev.lst-TER: 19.77 | lists/dev.lst-WER: 33.91 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.69
epoch:      324 | nupdates:       130248 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1121.68 | smp(ms): 6.62 | fwd(ms): 420.21 | crit-fwd(ms): 21.11 | bwd(ms): 639.13 | optim(ms): 57.23 | loss:   10.76655 | train-TER: 39.30 | train-WER: 57.20 | lists/dev.lst-loss:    6.65189 | lists/dev.lst-TER: 19.78 | lists/dev.lst-WER: 33.94 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 779.41
epoch:      325 | nupdates:       130650 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:29 | bch(ms): 1118.14 | smp(ms): 7.86 | fwd(ms): 416.98 | crit-fwd(ms): 21.08 | bwd(ms): 638.64 | optim(ms): 57.25 | loss:   10.88024 | train-TER: 44.67 | train-WER: 62.40 | lists/dev.lst-loss:    6.69408 | lists/dev.lst-TER: 19.90 | lists/dev.lst-WER: 34.03 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.88
epoch:      326 | nupdates:       131052 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:31 | bch(ms): 1123.36 | smp(ms): 8.33 | fwd(ms): 418.92 | crit-fwd(ms): 21.02 | bwd(ms): 642.17 | optim(ms): 57.22 | loss:   10.78969 | train-TER: 46.04 | train-WER: 63.21 | lists/dev.lst-loss:    6.67542 | lists/dev.lst-TER: 19.99 | lists/dev.lst-WER: 34.17 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 778.24
epoch:      327 | nupdates:       131454 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1119.61 | smp(ms): 6.71 | fwd(ms): 418.87 | crit-fwd(ms): 21.13 | bwd(ms): 638.55 | optim(ms): 57.26 | loss:   10.70045 | train-TER: 45.91 | train-WER: 62.29 | lists/dev.lst-loss:    6.70422 | lists/dev.lst-TER: 20.17 | lists/dev.lst-WER: 34.28 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.85
epoch:      328 | nupdates:       131856 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1120.68 | smp(ms): 7.01 | fwd(ms): 419.48 | crit-fwd(ms): 21.02 | bwd(ms): 639.24 | optim(ms): 57.26 | loss:   10.83294 | train-TER: 39.03 | train-WER: 57.63 | lists/dev.lst-loss:    6.67976 | lists/dev.lst-TER: 19.60 | lists/dev.lst-WER: 33.87 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.10
epoch:      329 | nupdates:       132258 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:31 | bch(ms): 1124.21 | smp(ms): 7.42 | fwd(ms): 418.58 | crit-fwd(ms): 21.16 | bwd(ms): 643.45 | optim(ms): 57.23 | loss:   10.69132 | train-TER: 41.46 | train-WER: 58.36 | lists/dev.lst-loss:    6.70156 | lists/dev.lst-TER: 19.48 | lists/dev.lst-WER: 33.78 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 777.66
epoch:      330 | nupdates:       132660 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1121.06 | smp(ms): 7.23 | fwd(ms): 417.86 | crit-fwd(ms): 21.15 | bwd(ms): 640.94 | optim(ms): 57.23 | loss:   10.85531 | train-TER: 41.36 | train-WER: 58.88 | lists/dev.lst-loss:    6.67632 | lists/dev.lst-TER: 20.09 | lists/dev.lst-WER: 34.17 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 779.84
epoch:      331 | nupdates:       133062 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1120.99 | smp(ms): 5.75 | fwd(ms): 419.02 | crit-fwd(ms): 20.90 | bwd(ms): 639.73 | optim(ms): 57.24 | loss:   10.80438 | train-TER: 41.58 | train-WER: 58.68 | lists/dev.lst-loss:    6.67867 | lists/dev.lst-TER: 19.74 | lists/dev.lst-WER: 33.88 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 779.89
epoch:      332 | nupdates:       133464 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:33 | bch(ms): 1129.12 | smp(ms): 6.69 | fwd(ms): 420.57 | crit-fwd(ms): 21.19 | bwd(ms): 646.30 | optim(ms): 57.23 | loss:   10.82993 | train-TER: 41.24 | train-WER: 58.64 | lists/dev.lst-loss:    6.57723 | lists/dev.lst-TER: 19.50 | lists/dev.lst-WER: 33.73 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 774.27
epoch:      333 | nupdates:       133866 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:36 | bch(ms): 1134.89 | smp(ms): 7.13 | fwd(ms): 418.16 | crit-fwd(ms): 21.05 | bwd(ms): 654.69 | optim(ms): 57.23 | loss:   10.78275 | train-TER: 41.07 | train-WER: 59.83 | lists/dev.lst-loss:    6.75549 | lists/dev.lst-TER: 20.17 | lists/dev.lst-WER: 34.31 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 770.34
epoch:      334 | nupdates:       134268 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:32 | bch(ms): 1125.25 | smp(ms): 6.91 | fwd(ms): 418.37 | crit-fwd(ms): 21.16 | bwd(ms): 644.84 | optim(ms): 57.20 | loss:   10.77315 | train-TER: 43.41 | train-WER: 60.68 | lists/dev.lst-loss:    6.69076 | lists/dev.lst-TER: 20.25 | lists/dev.lst-WER: 34.29 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 776.93
epoch:      335 | nupdates:       134670 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1120.88 | smp(ms): 7.32 | fwd(ms): 418.66 | crit-fwd(ms): 21.15 | bwd(ms): 640.25 | optim(ms): 57.23 | loss:   10.73087 | train-TER: 39.07 | train-WER: 57.27 | lists/dev.lst-loss:    6.73155 | lists/dev.lst-TER: 19.92 | lists/dev.lst-WER: 34.07 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 779.97
epoch:      336 | nupdates:       135072 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:29 | bch(ms): 1117.05 | smp(ms): 7.42 | fwd(ms): 417.77 | crit-fwd(ms): 21.40 | bwd(ms): 637.09 | optim(ms): 57.25 | loss:   10.89123 | train-TER: 37.99 | train-WER: 54.81 | lists/dev.lst-loss:    6.75205 | lists/dev.lst-TER: 20.05 | lists/dev.lst-WER: 34.14 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 782.64
epoch:      337 | nupdates:       135474 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:29 | bch(ms): 1119.21 | smp(ms): 6.95 | fwd(ms): 417.85 | crit-fwd(ms): 21.09 | bwd(ms): 639.37 | optim(ms): 57.24 | loss:   11.02013 | train-TER: 44.59 | train-WER: 61.33 | lists/dev.lst-loss:    6.73084 | lists/dev.lst-TER: 19.73 | lists/dev.lst-WER: 33.92 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.13
epoch:      338 | nupdates:       135876 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1119.79 | smp(ms): 8.22 | fwd(ms): 417.09 | crit-fwd(ms): 21.01 | bwd(ms): 640.96 | optim(ms): 57.23 | loss:   10.85372 | train-TER: 45.72 | train-WER: 63.84 | lists/dev.lst-loss:    6.65583 | lists/dev.lst-TER: 19.74 | lists/dev.lst-WER: 33.94 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.73
epoch:      339 | nupdates:       136278 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1121.27 | smp(ms): 5.73 | fwd(ms): 419.20 | crit-fwd(ms): 21.09 | bwd(ms): 639.03 | optim(ms): 57.23 | loss:   10.95398 | train-TER: 41.21 | train-WER: 59.35 | lists/dev.lst-loss:    6.67316 | lists/dev.lst-TER: 19.77 | lists/dev.lst-WER: 33.91 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 779.69
epoch:      340 | nupdates:       136680 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1121.39 | smp(ms): 7.26 | fwd(ms): 417.62 | crit-fwd(ms): 21.01 | bwd(ms): 641.43 | optim(ms): 57.21 | loss:   10.87525 | train-TER: 44.39 | train-WER: 61.18 | lists/dev.lst-loss:    6.69762 | lists/dev.lst-TER: 20.05 | lists/dev.lst-WER: 34.18 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 779.61
epoch:      341 | nupdates:       137082 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1121.64 | smp(ms): 8.20 | fwd(ms): 418.02 | crit-fwd(ms): 20.93 | bwd(ms): 641.33 | optim(ms): 57.24 | loss:   10.92946 | train-TER: 47.92 | train-WER: 64.85 | lists/dev.lst-loss:    6.60496 | lists/dev.lst-TER: 19.74 | lists/dev.lst-WER: 33.86 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 779.44
epoch:      342 | nupdates:       137484 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1120.08 | smp(ms): 4.54 | fwd(ms): 418.69 | crit-fwd(ms): 20.98 | bwd(ms): 639.44 | optim(ms): 57.21 | loss:   10.55190 | train-TER: 40.16 | train-WER: 58.84 | lists/dev.lst-loss:    6.62945 | lists/dev.lst-TER: 19.47 | lists/dev.lst-WER: 33.70 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.52
epoch:      343 | nupdates:       137886 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:34 | bch(ms): 1131.34 | smp(ms): 7.58 | fwd(ms): 417.90 | crit-fwd(ms): 20.98 | bwd(ms): 651.43 | optim(ms): 57.21 | loss:   10.77964 | train-TER: 38.16 | train-WER: 54.80 | lists/dev.lst-loss:    6.69175 | lists/dev.lst-TER: 19.65 | lists/dev.lst-WER: 33.87 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 772.76
epoch:      344 | nupdates:       138288 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:28 | bch(ms): 1116.61 | smp(ms): 5.33 | fwd(ms): 418.18 | crit-fwd(ms): 20.97 | bwd(ms): 635.78 | optim(ms): 57.23 | loss:   10.92030 | train-TER: 44.31 | train-WER: 61.06 | lists/dev.lst-loss:    6.68560 | lists/dev.lst-TER: 19.76 | lists/dev.lst-WER: 33.93 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 782.95
epoch:      345 | nupdates:       138690 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1119.88 | smp(ms): 8.06 | fwd(ms): 416.78 | crit-fwd(ms): 21.07 | bwd(ms): 640.89 | optim(ms): 57.19 | loss:   10.72552 | train-TER: 35.15 | train-WER: 54.80 | lists/dev.lst-loss:    6.67925 | lists/dev.lst-TER: 19.73 | lists/dev.lst-WER: 33.86 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.66
epoch:      346 | nupdates:       139092 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:32 | bch(ms): 1125.22 | smp(ms): 6.33 | fwd(ms): 418.75 | crit-fwd(ms): 20.92 | bwd(ms): 644.24 | optim(ms): 57.18 | loss:   10.66137 | train-TER: 42.73 | train-WER: 60.39 | lists/dev.lst-loss:    6.71087 | lists/dev.lst-TER: 19.84 | lists/dev.lst-WER: 33.98 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 776.96
epoch:      347 | nupdates:       139494 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1120.56 | smp(ms): 7.02 | fwd(ms): 418.85 | crit-fwd(ms): 21.05 | bwd(ms): 639.60 | optim(ms): 57.22 | loss:   10.87768 | train-TER: 40.39 | train-WER: 58.12 | lists/dev.lst-loss:    6.65764 | lists/dev.lst-TER: 19.67 | lists/dev.lst-WER: 33.87 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.19
epoch:      348 | nupdates:       139896 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1120.68 | smp(ms): 6.53 | fwd(ms): 417.16 | crit-fwd(ms): 21.00 | bwd(ms): 641.09 | optim(ms): 57.23 | loss:   10.93024 | train-TER: 48.29 | train-WER: 65.10 | lists/dev.lst-loss:    6.64501 | lists/dev.lst-TER: 19.92 | lists/dev.lst-WER: 34.01 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.11
epoch:      349 | nupdates:       140298 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:31 | bch(ms): 1122.77 | smp(ms): 6.65 | fwd(ms): 419.90 | crit-fwd(ms): 21.05 | bwd(ms): 640.52 | optim(ms): 57.22 | loss:   10.83907 | train-TER: 41.24 | train-WER: 59.29 | lists/dev.lst-loss:    6.71243 | lists/dev.lst-TER: 19.69 | lists/dev.lst-WER: 33.89 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 778.66
epoch:      350 | nupdates:       140700 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1120.40 | smp(ms): 7.12 | fwd(ms): 418.32 | crit-fwd(ms): 20.95 | bwd(ms): 640.06 | optim(ms): 57.24 | loss:   10.64456 | train-TER: 47.36 | train-WER: 64.98 | lists/dev.lst-loss:    6.60474 | lists/dev.lst-TER: 19.55 | lists/dev.lst-WER: 33.74 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.30
epoch:      351 | nupdates:       141102 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:31 | bch(ms): 1123.63 | smp(ms): 6.93 | fwd(ms): 418.48 | crit-fwd(ms): 21.39 | bwd(ms): 643.42 | optim(ms): 57.21 | loss:   10.56230 | train-TER: 42.91 | train-WER: 61.16 | lists/dev.lst-loss:    6.59990 | lists/dev.lst-TER: 19.55 | lists/dev.lst-WER: 33.73 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 778.06
epoch:      352 | nupdates:       141504 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1120.26 | smp(ms): 5.71 | fwd(ms): 419.46 | crit-fwd(ms): 20.99 | bwd(ms): 638.94 | optim(ms): 57.25 | loss:   10.67672 | train-TER: 35.06 | train-WER: 51.89 | lists/dev.lst-loss:    6.59618 | lists/dev.lst-TER: 19.66 | lists/dev.lst-WER: 33.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 780.40
epoch:      353 | nupdates:       141906 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1121.20 | smp(ms): 8.04 | fwd(ms): 418.37 | crit-fwd(ms): 20.98 | bwd(ms): 640.77 | optim(ms): 57.22 | loss:   10.99347 | train-TER: 40.91 | train-WER: 57.35 | lists/dev.lst-loss:    6.66943 | lists/dev.lst-TER: 19.64 | lists/dev.lst-WER: 33.79 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 779.74
epoch:      354 | nupdates:       142308 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1119.88 | smp(ms): 7.20 | fwd(ms): 418.56 | crit-fwd(ms): 21.02 | bwd(ms): 639.07 | optim(ms): 57.23 | loss:   10.61850 | train-TER: 36.69 | train-WER: 54.70 | lists/dev.lst-loss:    6.66907 | lists/dev.lst-TER: 19.86 | lists/dev.lst-WER: 33.88 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.66
epoch:      355 | nupdates:       142710 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:31 | bch(ms): 1121.94 | smp(ms): 7.51 | fwd(ms): 418.77 | crit-fwd(ms): 21.09 | bwd(ms): 640.83 | optim(ms): 57.21 | loss:   10.72346 | train-TER: 41.79 | train-WER: 59.93 | lists/dev.lst-loss:    6.65510 | lists/dev.lst-TER: 19.60 | lists/dev.lst-WER: 33.74 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 118 | hrs:   97.62 | thrpt(sec/sec): 779.23
epoch:      356 | nupdates:       143112 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1120.20 | smp(ms): 7.40 | fwd(ms): 418.91 | crit-fwd(ms): 21.13 | bwd(ms): 639.00 | optim(ms): 57.22 | loss:   10.80536 | train-TER: 48.13 | train-WER: 65.24 | lists/dev.lst-loss:    6.66143 | lists/dev.lst-TER: 19.68 | lists/dev.lst-WER: 33.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.44
epoch:      357 | nupdates:       143514 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1119.68 | smp(ms): 6.11 | fwd(ms): 417.78 | crit-fwd(ms): 21.02 | bwd(ms): 639.69 | optim(ms): 57.22 | loss:   10.57769 | train-TER: 38.02 | train-WER: 56.00 | lists/dev.lst-loss:    6.73684 | lists/dev.lst-TER: 19.88 | lists/dev.lst-WER: 33.92 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.80
epoch:      358 | nupdates:       143916 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:29 | bch(ms): 1118.92 | smp(ms): 5.47 | fwd(ms): 417.57 | crit-fwd(ms): 21.04 | bwd(ms): 639.12 | optim(ms): 57.24 | loss:   10.63500 | train-TER: 40.68 | train-WER: 58.58 | lists/dev.lst-loss:    6.71481 | lists/dev.lst-TER: 19.90 | lists/dev.lst-WER: 33.99 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.33
epoch:      359 | nupdates:       144318 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:29 | bch(ms): 1118.19 | smp(ms): 6.65 | fwd(ms): 418.51 | crit-fwd(ms): 21.00 | bwd(ms): 637.75 | optim(ms): 57.22 | loss:   10.94275 | train-TER: 43.29 | train-WER: 61.43 | lists/dev.lst-loss:    6.62894 | lists/dev.lst-TER: 19.76 | lists/dev.lst-WER: 33.86 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 781.84
epoch:      360 | nupdates:       144720 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:29 | bch(ms): 1119.19 | smp(ms): 5.86 | fwd(ms): 417.40 | crit-fwd(ms): 21.04 | bwd(ms): 639.65 | optim(ms): 57.22 | loss:   10.70565 | train-TER: 44.41 | train-WER: 62.68 | lists/dev.lst-loss:    6.73623 | lists/dev.lst-TER: 19.81 | lists/dev.lst-WER: 33.91 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.15
epoch:      361 | nupdates:       145122 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:29 | bch(ms): 1119.25 | smp(ms): 5.72 | fwd(ms): 417.23 | crit-fwd(ms): 20.92 | bwd(ms): 639.30 | optim(ms): 57.24 | loss:   10.80538 | train-TER: 44.84 | train-WER: 62.61 | lists/dev.lst-loss:    6.65564 | lists/dev.lst-TER: 19.54 | lists/dev.lst-WER: 33.70 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.10
epoch:      362 | nupdates:       145524 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:29 | bch(ms): 1118.93 | smp(ms): 6.25 | fwd(ms): 417.72 | crit-fwd(ms): 21.02 | bwd(ms): 638.63 | optim(ms): 57.25 | loss:   10.60469 | train-TER: 44.62 | train-WER: 61.79 | lists/dev.lst-loss:    6.67576 | lists/dev.lst-TER: 19.63 | lists/dev.lst-WER: 33.72 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.32
epoch:      363 | nupdates:       145926 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:31 | bch(ms): 1122.65 | smp(ms): 6.99 | fwd(ms): 418.94 | crit-fwd(ms): 21.01 | bwd(ms): 641.12 | optim(ms): 57.20 | loss:   10.81291 | train-TER: 47.05 | train-WER: 64.34 | lists/dev.lst-loss:    6.63599 | lists/dev.lst-TER: 19.77 | lists/dev.lst-WER: 33.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 778.74
epoch:      364 | nupdates:       146328 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:29 | bch(ms): 1118.51 | smp(ms): 6.31 | fwd(ms): 417.10 | crit-fwd(ms): 21.09 | bwd(ms): 639.50 | optim(ms): 57.22 | loss:   10.82430 | train-TER: 42.32 | train-WER: 60.30 | lists/dev.lst-loss:    6.66549 | lists/dev.lst-TER: 19.76 | lists/dev.lst-WER: 33.82 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.62
epoch:      365 | nupdates:       146730 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:31 | bch(ms): 1122.79 | smp(ms): 6.72 | fwd(ms): 418.29 | crit-fwd(ms): 20.95 | bwd(ms): 642.36 | optim(ms): 57.19 | loss:   10.68717 | train-TER: 47.24 | train-WER: 65.46 | lists/dev.lst-loss:    6.70168 | lists/dev.lst-TER: 19.87 | lists/dev.lst-WER: 33.91 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 778.64
epoch:      366 | nupdates:       147132 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:31 | bch(ms): 1123.72 | smp(ms): 7.98 | fwd(ms): 419.31 | crit-fwd(ms): 21.11 | bwd(ms): 642.50 | optim(ms): 57.23 | loss:   10.70517 | train-TER: 41.96 | train-WER: 59.62 | lists/dev.lst-loss:    6.70760 | lists/dev.lst-TER: 19.68 | lists/dev.lst-WER: 33.76 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 777.99
epoch:      367 | nupdates:       147534 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:33 | bch(ms): 1128.79 | smp(ms): 8.14 | fwd(ms): 419.81 | crit-fwd(ms): 21.25 | bwd(ms): 646.95 | optim(ms): 57.19 | loss:   10.73120 | train-TER: 31.01 | train-WER: 48.88 | lists/dev.lst-loss:    6.69520 | lists/dev.lst-TER: 19.87 | lists/dev.lst-WER: 33.93 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 774.50
epoch:      368 | nupdates:       147936 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1121.24 | smp(ms): 6.52 | fwd(ms): 417.76 | crit-fwd(ms): 21.05 | bwd(ms): 641.21 | optim(ms): 57.21 | loss:   10.68916 | train-TER: 42.01 | train-WER: 59.07 | lists/dev.lst-loss:    6.74897 | lists/dev.lst-TER: 19.92 | lists/dev.lst-WER: 33.92 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 779.71
epoch:      369 | nupdates:       148338 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:29 | bch(ms): 1117.61 | smp(ms): 6.13 | fwd(ms): 418.39 | crit-fwd(ms): 21.26 | bwd(ms): 636.24 | optim(ms): 57.24 | loss:   10.69075 | train-TER: 43.12 | train-WER: 60.67 | lists/dev.lst-loss:    6.58688 | lists/dev.lst-TER: 19.76 | lists/dev.lst-WER: 33.89 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 782.25
epoch:      370 | nupdates:       148740 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:31 | bch(ms): 1122.40 | smp(ms): 7.72 | fwd(ms): 417.65 | crit-fwd(ms): 21.28 | bwd(ms): 642.40 | optim(ms): 57.21 | loss:   10.87215 | train-TER: 40.21 | train-WER: 58.63 | lists/dev.lst-loss:    6.61945 | lists/dev.lst-TER: 19.95 | lists/dev.lst-WER: 34.01 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 778.91
epoch:      371 | nupdates:       149142 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1120.24 | smp(ms): 6.42 | fwd(ms): 418.67 | crit-fwd(ms): 20.97 | bwd(ms): 639.23 | optim(ms): 57.22 | loss:   10.61025 | train-TER: 46.16 | train-WER: 62.50 | lists/dev.lst-loss:    6.68208 | lists/dev.lst-TER: 19.93 | lists/dev.lst-WER: 33.94 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.41
epoch:      372 | nupdates:       149544 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1119.79 | smp(ms): 5.11 | fwd(ms): 418.69 | crit-fwd(ms): 21.00 | bwd(ms): 638.65 | optim(ms): 57.21 | loss:   10.74536 | train-TER: 40.76 | train-WER: 57.79 | lists/dev.lst-loss:    6.68823 | lists/dev.lst-TER: 19.94 | lists/dev.lst-WER: 34.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.73
epoch:      373 | nupdates:       149946 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:28 | bch(ms): 1116.46 | smp(ms): 7.35 | fwd(ms): 416.65 | crit-fwd(ms): 21.16 | bwd(ms): 637.79 | optim(ms): 57.21 | loss:   10.89943 | train-TER: 38.84 | train-WER: 57.21 | lists/dev.lst-loss:    6.69341 | lists/dev.lst-TER: 19.76 | lists/dev.lst-WER: 33.83 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 783.06
epoch:      374 | nupdates:       150348 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1119.50 | smp(ms): 7.09 | fwd(ms): 417.02 | crit-fwd(ms): 21.20 | bwd(ms): 640.63 | optim(ms): 57.23 | loss:   10.71602 | train-TER: 37.35 | train-WER: 55.89 | lists/dev.lst-loss:    6.63854 | lists/dev.lst-TER: 19.59 | lists/dev.lst-WER: 33.71 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 780.93
epoch:      375 | nupdates:       150750 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:28 | bch(ms): 1115.36 | smp(ms): 6.82 | fwd(ms): 417.23 | crit-fwd(ms): 21.07 | bwd(ms): 635.92 | optim(ms): 57.25 | loss:   10.74817 | train-TER: 38.59 | train-WER: 55.37 | lists/dev.lst-loss:    6.68849 | lists/dev.lst-TER: 20.18 | lists/dev.lst-WER: 34.18 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 783.83
epoch:      376 | nupdates:       151152 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:31 | bch(ms): 1122.78 | smp(ms): 8.22 | fwd(ms): 417.07 | crit-fwd(ms): 21.21 | bwd(ms): 643.75 | optim(ms): 57.21 | loss:   10.77428 | train-TER: 41.59 | train-WER: 60.24 | lists/dev.lst-loss:    6.61870 | lists/dev.lst-TER: 19.82 | lists/dev.lst-WER: 33.89 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 778.65
epoch:      377 | nupdates:       151554 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1121.40 | smp(ms): 6.81 | fwd(ms): 420.51 | crit-fwd(ms): 21.18 | bwd(ms): 638.97 | optim(ms): 57.22 | loss:   10.63653 | train-TER: 40.69 | train-WER: 58.46 | lists/dev.lst-loss:    6.64540 | lists/dev.lst-TER: 19.85 | lists/dev.lst-WER: 33.91 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 779.61
epoch:      378 | nupdates:       151956 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:29 | bch(ms): 1118.65 | smp(ms): 6.22 | fwd(ms): 418.68 | crit-fwd(ms): 21.26 | bwd(ms): 637.80 | optim(ms): 57.24 | loss:   10.87476 | train-TER: 44.23 | train-WER: 61.85 | lists/dev.lst-loss:    6.63541 | lists/dev.lst-TER: 19.71 | lists/dev.lst-WER: 33.86 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 781.52
epoch:      379 | nupdates:       152358 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1121.86 | smp(ms): 6.84 | fwd(ms): 418.92 | crit-fwd(ms): 20.91 | bwd(ms): 640.92 | optim(ms): 57.21 | loss:   10.59453 | train-TER: 42.60 | train-WER: 60.01 | lists/dev.lst-loss:    6.57962 | lists/dev.lst-TER: 19.56 | lists/dev.lst-WER: 33.68 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 779.28
epoch:      380 | nupdates:       152760 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:32 | bch(ms): 1126.29 | smp(ms): 6.61 | fwd(ms): 418.76 | crit-fwd(ms): 21.23 | bwd(ms): 645.36 | optim(ms): 57.26 | loss:   10.74273 | train-TER: 48.93 | train-WER: 65.37 | lists/dev.lst-loss:    6.69067 | lists/dev.lst-TER: 19.63 | lists/dev.lst-WER: 33.73 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 776.22
epoch:      381 | nupdates:       153162 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:30 | bch(ms): 1120.88 | smp(ms): 6.71 | fwd(ms): 418.56 | crit-fwd(ms): 20.99 | bwd(ms): 639.91 | optim(ms): 57.22 | loss:   10.73482 | train-TER: 44.53 | train-WER: 62.77 | lists/dev.lst-loss:    6.72419 | lists/dev.lst-TER: 19.69 | lists/dev.lst-WER: 33.78 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 779.97
epoch:      382 | nupdates:       153564 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:31 | bch(ms): 1123.83 | smp(ms): 6.43 | fwd(ms): 418.62 | crit-fwd(ms): 21.02 | bwd(ms): 643.12 | optim(ms): 57.23 | loss:   10.73894 | train-TER: 34.70 | train-WER: 52.31 | lists/dev.lst-loss:    6.66490 | lists/dev.lst-TER: 19.79 | lists/dev.lst-WER: 33.82 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 777.92
epoch:      383 | nupdates:       153966 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:32 | bch(ms): 1124.83 | smp(ms): 7.19 | fwd(ms): 418.61 | crit-fwd(ms): 21.11 | bwd(ms): 644.22 | optim(ms): 57.22 | loss:   10.84190 | train-TER: 47.90 | train-WER: 65.20 | lists/dev.lst-loss:    6.64215 | lists/dev.lst-TER: 19.62 | lists/dev.lst-WER: 33.78 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 777.23
epoch:      384 | nupdates:       154368 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:29 | bch(ms): 1118.47 | smp(ms): 7.17 | fwd(ms): 418.47 | crit-fwd(ms): 21.06 | bwd(ms): 637.92 | optim(ms): 57.24 | loss:   10.76920 | train-TER: 42.60 | train-WER: 60.00 | lists/dev.lst-loss:    6.61777 | lists/dev.lst-TER: 19.57 | lists/dev.lst-WER: 33.70 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.65
epoch:      385 | nupdates:       154770 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:32 | bch(ms): 1124.39 | smp(ms): 7.13 | fwd(ms): 419.08 | crit-fwd(ms): 21.07 | bwd(ms): 643.21 | optim(ms): 57.22 | loss:   10.84138 | train-TER: 44.53 | train-WER: 62.33 | lists/dev.lst-loss:    6.65517 | lists/dev.lst-TER: 19.81 | lists/dev.lst-WER: 33.88 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 777.53
epoch:      386 | nupdates:       155172 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:29 | bch(ms): 1119.36 | smp(ms): 6.84 | fwd(ms): 417.83 | crit-fwd(ms): 21.14 | bwd(ms): 639.66 | optim(ms): 57.25 | loss:   10.75169 | train-TER: 43.95 | train-WER: 62.08 | lists/dev.lst-loss:    6.60215 | lists/dev.lst-TER: 19.78 | lists/dev.lst-WER: 33.88 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 781.02
epoch:      387 | nupdates:       155574 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:32 | bch(ms): 1126.64 | smp(ms): 7.29 | fwd(ms): 419.80 | crit-fwd(ms): 21.05 | bwd(ms): 644.80 | optim(ms): 57.21 | loss:   10.65912 | train-TER: 34.57 | train-WER: 51.59 | lists/dev.lst-loss:    6.66376 | lists/dev.lst-TER: 19.74 | lists/dev.lst-WER: 33.83 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 775.98
epoch:      388 | nupdates:       155976 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:31 | bch(ms): 1122.30 | smp(ms): 7.31 | fwd(ms): 418.33 | crit-fwd(ms): 21.31 | bwd(ms): 641.73 | optim(ms): 57.21 | loss:   10.62669 | train-TER: 46.35 | train-WER: 63.95 | lists/dev.lst-loss:    6.67349 | lists/dev.lst-TER: 19.61 | lists/dev.lst-WER: 33.71 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 778.98
epoch:      389 | nupdates:       156378 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:31 | bch(ms): 1124.34 | smp(ms): 7.23 | fwd(ms): 418.26 | crit-fwd(ms): 21.16 | bwd(ms): 643.89 | optim(ms): 57.20 | loss:   10.75452 | train-TER: 45.12 | train-WER: 62.49 | lists/dev.lst-loss:    6.67610 | lists/dev.lst-TER: 19.77 | lists/dev.lst-WER: 33.82 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 777.56
epoch:      390 | nupdates:       156780 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:31 | bch(ms): 1123.01 | smp(ms): 7.92 | fwd(ms): 418.60 | crit-fwd(ms): 21.23 | bwd(ms): 642.24 | optim(ms): 57.22 | loss:   10.73723 | train-TER: 50.22 | train-WER: 68.62 | lists/dev.lst-loss:    6.64329 | lists/dev.lst-TER: 19.71 | lists/dev.lst-WER: 33.75 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 778.49
epoch:      391 | nupdates:       157182 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:31 | bch(ms): 1122.19 | smp(ms): 8.26 | fwd(ms): 418.19 | crit-fwd(ms): 21.11 | bwd(ms): 641.52 | optim(ms): 57.25 | loss:   10.75576 | train-TER: 42.55 | train-WER: 60.68 | lists/dev.lst-loss:    6.64239 | lists/dev.lst-TER: 19.68 | lists/dev.lst-WER: 33.72 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 779.05
epoch:      392 | nupdates:       157584 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:31 | bch(ms): 1124.35 | smp(ms): 7.34 | fwd(ms): 418.32 | crit-fwd(ms): 21.10 | bwd(ms): 643.46 | optim(ms): 57.24 | loss:   10.64738 | train-TER: 41.47 | train-WER: 59.60 | lists/dev.lst-loss:    6.61881 | lists/dev.lst-TER: 19.76 | lists/dev.lst-WER: 33.82 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 777.56
epoch:      393 | nupdates:       157986 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:28 | bch(ms): 1116.80 | smp(ms): 6.79 | fwd(ms): 417.06 | crit-fwd(ms): 21.20 | bwd(ms): 637.89 | optim(ms): 57.26 | loss:   10.47069 | train-TER: 41.11 | train-WER: 57.11 | lists/dev.lst-loss:    6.59647 | lists/dev.lst-TER: 19.54 | lists/dev.lst-WER: 33.68 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 782.82
epoch:      394 | nupdates:       158388 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:30 | bch(ms): 1119.47 | smp(ms): 4.96 | fwd(ms): 417.22 | crit-fwd(ms): 20.93 | bwd(ms): 638.43 | optim(ms): 57.23 | loss:   10.66487 | train-TER: 43.43 | train-WER: 60.14 | lists/dev.lst-loss:    6.64685 | lists/dev.lst-TER: 19.73 | lists/dev.lst-WER: 33.83 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 780.95
epoch:      395 | nupdates:       158790 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:32 | bch(ms): 1125.30 | smp(ms): 7.04 | fwd(ms): 419.28 | crit-fwd(ms): 21.30 | bwd(ms): 643.98 | optim(ms): 57.23 | loss:   10.68931 | train-TER: 44.86 | train-WER: 62.54 | lists/dev.lst-loss:    6.60740 | lists/dev.lst-TER: 19.61 | lists/dev.lst-WER: 33.75 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 776.91
epoch:      396 | nupdates:       159192 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:31 | bch(ms): 1124.13 | smp(ms): 6.57 | fwd(ms): 419.13 | crit-fwd(ms): 21.08 | bwd(ms): 642.24 | optim(ms): 57.23 | loss:   10.60523 | train-TER: 38.68 | train-WER: 56.60 | lists/dev.lst-loss:    6.57608 | lists/dev.lst-TER: 19.54 | lists/dev.lst-WER: 33.72 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 777.71
epoch:      397 | nupdates:       159594 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:31 | bch(ms): 1122.64 | smp(ms): 7.56 | fwd(ms): 418.76 | crit-fwd(ms): 20.96 | bwd(ms): 642.06 | optim(ms): 57.23 | loss:   10.74693 | train-TER: 40.34 | train-WER: 57.30 | lists/dev.lst-loss:    6.60898 | lists/dev.lst-TER: 19.69 | lists/dev.lst-WER: 33.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs:   97.62 | thrpt(sec/sec): 778.74
epoch:      398 | nupdates:       159996 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:28 | bch(ms): 1116.67 | smp(ms): 5.10 | fwd(ms): 417.85 | crit-fwd(ms): 21.01 | bwd(ms): 636.57 | optim(ms): 57.25 | loss:   10.58123 | train-TER: 44.81 | train-WER: 61.63 | lists/dev.lst-loss:    6.59653 | lists/dev.lst-TER: 19.82 | lists/dev.lst-WER: 33.88 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 782.90
epoch:      399 | nupdates:       160398 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:31 | bch(ms): 1123.11 | smp(ms): 8.13 | fwd(ms): 418.90 | crit-fwd(ms): 21.12 | bwd(ms): 642.17 | optim(ms): 57.25 | loss:   10.53012 | train-TER: 40.06 | train-WER: 56.77 | lists/dev.lst-loss:    6.62226 | lists/dev.lst-TER: 19.82 | lists/dev.lst-WER: 33.87 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 778.42
epoch:      400 | nupdates:       160800 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:31 | bch(ms): 1122.56 | smp(ms): 7.06 | fwd(ms): 418.75 | crit-fwd(ms): 21.09 | bwd(ms): 641.36 | optim(ms): 57.24 | loss:   10.64156 | train-TER: 52.41 | train-WER: 68.82 | lists/dev.lst-loss:    6.67411 | lists/dev.lst-TER: 19.79 | lists/dev.lst-WER: 33.87 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 778.80
epoch:      401 | nupdates:       161202 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:29 | bch(ms): 1118.23 | smp(ms): 3.67 | fwd(ms): 417.46 | crit-fwd(ms): 20.88 | bwd(ms): 637.65 | optim(ms): 57.31 | loss:   10.64980 | train-TER: 42.47 | train-WER: 60.65 | lists/dev.lst-loss:    6.61162 | lists/dev.lst-TER: 19.59 | lists/dev.lst-WER: 33.74 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 781.81
epoch:      402 | nupdates:       161604 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:32 | bch(ms): 1124.50 | smp(ms): 4.92 | fwd(ms): 420.02 | crit-fwd(ms): 20.92 | bwd(ms): 642.55 | optim(ms): 57.33 | loss:   10.77812 | train-TER: 48.15 | train-WER: 65.94 | lists/dev.lst-loss:    6.58243 | lists/dev.lst-TER: 19.69 | lists/dev.lst-WER: 33.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 777.45
epoch:      403 | nupdates:       162006 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:31 | bch(ms): 1122.55 | smp(ms): 6.38 | fwd(ms): 419.54 | crit-fwd(ms): 20.96 | bwd(ms): 640.69 | optim(ms): 57.22 | loss:   10.65866 | train-TER: 41.94 | train-WER: 60.21 | lists/dev.lst-loss:    6.61306 | lists/dev.lst-TER: 19.68 | lists/dev.lst-WER: 33.77 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs:   97.62 | thrpt(sec/sec): 778.81
epoch:      404 | nupdates:       162408 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:32 | bch(ms): 1125.92 | smp(ms): 7.74 | fwd(ms): 418.89 | crit-fwd(ms): 21.13 | bwd(ms): 644.72 | optim(ms): 57.24 | loss:   10.54506 | train-TER: 43.04 | train-WER: 60.40 | lists/dev.lst-loss:    6.61504 | lists/dev.lst-TER: 19.71 | lists/dev.lst-WER: 33.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs:   97.62 | thrpt(sec/sec): 776.48