epoch: 1 | nupdates: 402 | lr: 0.006700 | lrcriterion: 0.006700 | runtime: 00:07:41 | bch(ms): 1148.24 | smp(ms): 3.35 | fwd(ms): 433.08 | crit-fwd(ms): 22.23 | bwd(ms): 637.68 | optim(ms): 61.02 | loss: 79.62127 | train-TER: 184.04 | train-WER: 155.98 | lists/dev.lst-loss: 36.50141 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 761.38
epoch: 2 | nupdates: 804 | lr: 0.013400 | lrcriterion: 0.013400 | runtime: 00:07:32 | bch(ms): 1126.31 | smp(ms): 7.81 | fwd(ms): 421.71 | crit-fwd(ms): 21.37 | bwd(ms): 642.40 | optim(ms): 57.33 | loss: 34.09406 | train-TER: 100.00 | train-WER: 100.00 | lists/dev.lst-loss: 31.94590 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 776.20
epoch: 3 | nupdates: 1206 | lr: 0.020100 | lrcriterion: 0.020100 | runtime: 00:07:37 | bch(ms): 1137.09 | smp(ms): 6.89 | fwd(ms): 421.21 | crit-fwd(ms): 21.01 | bwd(ms): 653.89 | optim(ms): 57.32 | loss: 31.66174 | train-TER: 100.00 | train-WER: 100.00 | lists/dev.lst-loss: 30.70076 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 768.85
epoch: 4 | nupdates: 1608 | lr: 0.026800 | lrcriterion: 0.026800 | runtime: 00:07:36 | bch(ms): 1134.58 | smp(ms): 7.41 | fwd(ms): 422.17 | crit-fwd(ms): 21.11 | bwd(ms): 649.80 | optim(ms): 57.39 | loss: 30.66355 | train-TER: 100.00 | train-WER: 100.00 | lists/dev.lst-loss: 30.00350 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 770.55
epoch: 5 | nupdates: 2010 | lr: 0.033500 | lrcriterion: 0.033500 | runtime: 00:07:35 | bch(ms): 1134.09 | smp(ms): 6.93 | fwd(ms): 423.48 | crit-fwd(ms): 21.15 | bwd(ms): 648.60 | optim(ms): 57.42 | loss: 30.05698 | train-TER: 100.00 | train-WER: 100.00 | lists/dev.lst-loss: 29.69616 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 770.88
epoch: 6 | nupdates: 2412 | lr: 0.040200 | lrcriterion: 0.040200 | runtime: 00:07:35 | bch(ms): 1132.80 | smp(ms): 6.23 | fwd(ms): 421.72 | crit-fwd(ms): 20.82 | bwd(ms): 648.32 | optim(ms): 57.40 | loss: 29.64941 | train-TER: 99.99 | train-WER: 100.00 | lists/dev.lst-loss: 29.19304 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 771.76
epoch: 7 | nupdates: 2814 | lr: 0.046900 | lrcriterion: 0.046900 | runtime: 00:07:33 | bch(ms): 1127.89 | smp(ms): 6.59 | fwd(ms): 420.74 | crit-fwd(ms): 21.16 | bwd(ms): 644.62 | optim(ms): 57.47 | loss: 29.34847 | train-TER: 99.99 | train-WER: 100.00 | lists/dev.lst-loss: 29.54366 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 775.12
epoch: 8 | nupdates: 3216 | lr: 0.053600 | lrcriterion: 0.053600 | runtime: 00:07:35 | bch(ms): 1133.11 | smp(ms): 6.81 | fwd(ms): 421.49 | crit-fwd(ms): 21.36 | bwd(ms): 649.40 | optim(ms): 57.41 | loss: 29.17970 | train-TER: 99.99 | train-WER: 100.00 | lists/dev.lst-loss: 29.02254 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 771.55
epoch: 9 | nupdates: 3618 | lr: 0.060300 | lrcriterion: 0.060300 | runtime: 00:07:34 | bch(ms): 1131.26 | smp(ms): 8.04 | fwd(ms): 420.30 | crit-fwd(ms): 21.14 | bwd(ms): 648.43 | optim(ms): 57.41 | loss: 29.04865 | train-TER: 99.97 | train-WER: 99.99 | lists/dev.lst-loss: 28.78550 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 772.81
epoch: 10 | nupdates: 4020 | lr: 0.067000 | lrcriterion: 0.067000 | runtime: 00:07:32 | bch(ms): 1125.92 | smp(ms): 6.84 | fwd(ms): 419.38 | crit-fwd(ms): 21.22 | bwd(ms): 644.47 | optim(ms): 57.41 | loss: 28.90197 | train-TER: 99.99 | train-WER: 100.00 | lists/dev.lst-loss: 28.52354 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 776.48
epoch: 11 | nupdates: 4422 | lr: 0.073700 | lrcriterion: 0.073700 | runtime: 00:07:34 | bch(ms): 1131.37 | smp(ms): 7.69 | fwd(ms): 420.70 | crit-fwd(ms): 21.03 | bwd(ms): 648.66 | optim(ms): 57.35 | loss: 28.79002 | train-TER: 99.94 | train-WER: 100.00 | lists/dev.lst-loss: 28.63813 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 772.74
epoch: 12 | nupdates: 4824 | lr: 0.080400 | lrcriterion: 0.080400 | runtime: 00:07:35 | bch(ms): 1132.57 | smp(ms): 6.71 | fwd(ms): 421.69 | crit-fwd(ms): 21.23 | bwd(ms): 648.70 | optim(ms): 57.33 | loss: 28.71151 | train-TER: 99.75 | train-WER: 99.94 | lists/dev.lst-loss: 28.78160 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 771.92
epoch: 13 | nupdates: 5226 | lr: 0.087100 | lrcriterion: 0.087100 | runtime: 00:07:35 | bch(ms): 1132.22 | smp(ms): 7.09 | fwd(ms): 421.24 | crit-fwd(ms): 20.96 | bwd(ms): 648.54 | optim(ms): 57.30 | loss: 28.55661 | train-TER: 99.79 | train-WER: 100.00 | lists/dev.lst-loss: 28.21670 | lists/dev.lst-TER: 99.73 | lists/dev.lst-WER: 100.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 772.16
epoch: 14 | nupdates: 5628 | lr: 0.093800 | lrcriterion: 0.093800 | runtime: 00:07:40 | bch(ms): 1144.84 | smp(ms): 6.44 | fwd(ms): 422.38 | crit-fwd(ms): 21.09 | bwd(ms): 660.54 | optim(ms): 57.30 | loss: 28.44571 | train-TER: 99.75 | train-WER: 99.91 | lists/dev.lst-loss: 28.02138 | lists/dev.lst-TER: 99.35 | lists/dev.lst-WER: 99.87 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 763.64
epoch: 15 | nupdates: 6030 | lr: 0.100500 | lrcriterion: 0.100500 | runtime: 00:07:40 | bch(ms): 1145.86 | smp(ms): 8.44 | fwd(ms): 420.19 | crit-fwd(ms): 21.05 | bwd(ms): 663.58 | optim(ms): 57.29 | loss: 28.31598 | train-TER: 99.60 | train-WER: 99.82 | lists/dev.lst-loss: 28.49923 | lists/dev.lst-TER: 99.84 | lists/dev.lst-WER: 99.82 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 762.96
epoch: 16 | nupdates: 6432 | lr: 0.107200 | lrcriterion: 0.107200 | runtime: 00:07:40 | bch(ms): 1144.95 | smp(ms): 5.84 | fwd(ms): 422.15 | crit-fwd(ms): 20.92 | bwd(ms): 660.73 | optim(ms): 57.28 | loss: 28.13958 | train-TER: 99.46 | train-WER: 99.69 | lists/dev.lst-loss: 27.89934 | lists/dev.lst-TER: 97.08 | lists/dev.lst-WER: 98.78 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 763.57
epoch: 17 | nupdates: 6834 | lr: 0.113900 | lrcriterion: 0.113900 | runtime: 00:07:42 | bch(ms): 1151.12 | smp(ms): 7.27 | fwd(ms): 422.82 | crit-fwd(ms): 20.99 | bwd(ms): 666.03 | optim(ms): 57.25 | loss: 27.90646 | train-TER: 99.19 | train-WER: 99.50 | lists/dev.lst-loss: 27.97491 | lists/dev.lst-TER: 94.38 | lists/dev.lst-WER: 97.69 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 759.47
epoch: 18 | nupdates: 7236 | lr: 0.120600 | lrcriterion: 0.120600 | runtime: 00:07:41 | bch(ms): 1147.21 | smp(ms): 7.50 | fwd(ms): 422.58 | crit-fwd(ms): 20.92 | bwd(ms): 662.31 | optim(ms): 57.27 | loss: 27.66473 | train-TER: 99.54 | train-WER: 99.57 | lists/dev.lst-loss: 27.13344 | lists/dev.lst-TER: 96.15 | lists/dev.lst-WER: 97.84 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 762.07
epoch: 19 | nupdates: 7638 | lr: 0.127300 | lrcriterion: 0.127300 | runtime: 00:07:35 | bch(ms): 1132.63 | smp(ms): 6.93 | fwd(ms): 422.31 | crit-fwd(ms): 21.09 | bwd(ms): 647.89 | optim(ms): 57.26 | loss: 27.37545 | train-TER: 98.89 | train-WER: 98.97 | lists/dev.lst-loss: 26.81882 | lists/dev.lst-TER: 93.12 | lists/dev.lst-WER: 96.76 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 771.88
epoch: 20 | nupdates: 8040 | lr: 0.134000 | lrcriterion: 0.134000 | runtime: 00:07:39 | bch(ms): 1144.09 | smp(ms): 6.70 | fwd(ms): 421.11 | crit-fwd(ms): 20.88 | bwd(ms): 660.73 | optim(ms): 57.25 | loss: 27.08303 | train-TER: 97.37 | train-WER: 98.48 | lists/dev.lst-loss: 26.36108 | lists/dev.lst-TER: 96.25 | lists/dev.lst-WER: 97.52 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 764.14
epoch: 21 | nupdates: 8442 | lr: 0.140700 | lrcriterion: 0.140700 | runtime: 00:07:35 | bch(ms): 1133.09 | smp(ms): 6.55 | fwd(ms): 422.54 | crit-fwd(ms): 20.99 | bwd(ms): 648.53 | optim(ms): 57.25 | loss: 26.74288 | train-TER: 97.55 | train-WER: 98.28 | lists/dev.lst-loss: 25.92736 | lists/dev.lst-TER: 93.99 | lists/dev.lst-WER: 96.29 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 771.56
epoch: 22 | nupdates: 8844 | lr: 0.147400 | lrcriterion: 0.147400 | runtime: 00:07:39 | bch(ms): 1143.29 | smp(ms): 7.71 | fwd(ms): 420.74 | crit-fwd(ms): 20.98 | bwd(ms): 659.74 | optim(ms): 57.27 | loss: 26.44379 | train-TER: 96.80 | train-WER: 97.86 | lists/dev.lst-loss: 25.62425 | lists/dev.lst-TER: 90.80 | lists/dev.lst-WER: 95.16 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 764.68
epoch: 23 | nupdates: 9246 | lr: 0.154100 | lrcriterion: 0.154100 | runtime: 00:07:40 | bch(ms): 1144.41 | smp(ms): 6.14 | fwd(ms): 422.02 | crit-fwd(ms): 20.95 | bwd(ms): 660.24 | optim(ms): 57.26 | loss: 26.14073 | train-TER: 94.92 | train-WER: 97.05 | lists/dev.lst-loss: 25.54093 | lists/dev.lst-TER: 96.45 | lists/dev.lst-WER: 97.09 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 763.93
epoch: 24 | nupdates: 9648 | lr: 0.160800 | lrcriterion: 0.160800 | runtime: 00:07:36 | bch(ms): 1135.44 | smp(ms): 6.84 | fwd(ms): 421.56 | crit-fwd(ms): 20.99 | bwd(ms): 651.30 | optim(ms): 57.25 | loss: 25.76430 | train-TER: 95.55 | train-WER: 97.08 | lists/dev.lst-loss: 24.96298 | lists/dev.lst-TER: 85.65 | lists/dev.lst-WER: 92.35 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 769.96
epoch: 25 | nupdates: 10050 | lr: 0.167500 | lrcriterion: 0.167500 | runtime: 00:07:40 | bch(ms): 1145.72 | smp(ms): 7.84 | fwd(ms): 421.36 | crit-fwd(ms): 21.14 | bwd(ms): 661.91 | optim(ms): 57.24 | loss: 25.44469 | train-TER: 93.56 | train-WER: 96.13 | lists/dev.lst-loss: 24.83387 | lists/dev.lst-TER: 95.02 | lists/dev.lst-WER: 96.31 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 763.05
epoch: 26 | nupdates: 10452 | lr: 0.174200 | lrcriterion: 0.174200 | runtime: 00:07:36 | bch(ms): 1134.99 | smp(ms): 7.48 | fwd(ms): 422.21 | crit-fwd(ms): 21.05 | bwd(ms): 649.59 | optim(ms): 57.25 | loss: 25.11919 | train-TER: 92.50 | train-WER: 95.46 | lists/dev.lst-loss: 24.26034 | lists/dev.lst-TER: 91.94 | lists/dev.lst-WER: 94.44 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 770.27
epoch: 27 | nupdates: 10854 | lr: 0.180900 | lrcriterion: 0.180900 | runtime: 00:07:36 | bch(ms): 1136.29 | smp(ms): 4.03 | fwd(ms): 420.85 | crit-fwd(ms): 20.82 | bwd(ms): 652.13 | optim(ms): 57.25 | loss: 24.77388 | train-TER: 90.07 | train-WER: 94.50 | lists/dev.lst-loss: 23.71284 | lists/dev.lst-TER: 85.51 | lists/dev.lst-WER: 92.01 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 769.39
epoch: 28 | nupdates: 11256 | lr: 0.187600 | lrcriterion: 0.187600 | runtime: 00:07:41 | bch(ms): 1148.20 | smp(ms): 7.24 | fwd(ms): 424.22 | crit-fwd(ms): 21.29 | bwd(ms): 661.97 | optim(ms): 57.26 | loss: 24.41542 | train-TER: 89.43 | train-WER: 94.19 | lists/dev.lst-loss: 23.46172 | lists/dev.lst-TER: 83.32 | lists/dev.lst-WER: 92.65 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 761.41
epoch: 29 | nupdates: 11658 | lr: 0.194300 | lrcriterion: 0.194300 | runtime: 00:07:37 | bch(ms): 1139.27 | smp(ms): 7.38 | fwd(ms): 423.15 | crit-fwd(ms): 21.20 | bwd(ms): 654.07 | optim(ms): 57.24 | loss: 24.05792 | train-TER: 88.41 | train-WER: 93.59 | lists/dev.lst-loss: 23.07679 | lists/dev.lst-TER: 80.20 | lists/dev.lst-WER: 88.83 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 767.37
epoch: 30 | nupdates: 12060 | lr: 0.201000 | lrcriterion: 0.201000 | runtime: 00:07:40 | bch(ms): 1146.24 | smp(ms): 5.74 | fwd(ms): 422.23 | crit-fwd(ms): 20.94 | bwd(ms): 661.27 | optim(ms): 57.26 | loss: 23.72896 | train-TER: 87.26 | train-WER: 92.82 | lists/dev.lst-loss: 22.68104 | lists/dev.lst-TER: 79.57 | lists/dev.lst-WER: 89.73 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 762.71
epoch: 31 | nupdates: 12462 | lr: 0.207700 | lrcriterion: 0.207700 | runtime: 00:07:35 | bch(ms): 1134.16 | smp(ms): 7.41 | fwd(ms): 421.47 | crit-fwd(ms): 20.97 | bwd(ms): 650.63 | optim(ms): 57.25 | loss: 23.36377 | train-TER: 85.41 | train-WER: 92.92 | lists/dev.lst-loss: 22.25256 | lists/dev.lst-TER: 85.17 | lists/dev.lst-WER: 91.22 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 770.83
epoch: 32 | nupdates: 12864 | lr: 0.214400 | lrcriterion: 0.214400 | runtime: 00:07:34 | bch(ms): 1130.29 | smp(ms): 6.98 | fwd(ms): 419.55 | crit-fwd(ms): 20.89 | bwd(ms): 648.30 | optim(ms): 57.24 | loss: 23.05476 | train-TER: 83.63 | train-WER: 91.63 | lists/dev.lst-loss: 22.02975 | lists/dev.lst-TER: 77.81 | lists/dev.lst-WER: 88.27 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 773.47
epoch: 33 | nupdates: 13266 | lr: 0.221100 | lrcriterion: 0.221100 | runtime: 00:07:39 | bch(ms): 1143.79 | smp(ms): 7.93 | fwd(ms): 421.71 | crit-fwd(ms): 21.19 | bwd(ms): 659.89 | optim(ms): 57.28 | loss: 22.74303 | train-TER: 84.53 | train-WER: 91.64 | lists/dev.lst-loss: 21.54951 | lists/dev.lst-TER: 83.62 | lists/dev.lst-WER: 90.48 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 764.34
epoch: 34 | nupdates: 13668 | lr: 0.227800 | lrcriterion: 0.227800 | runtime: 00:07:34 | bch(ms): 1130.16 | smp(ms): 6.86 | fwd(ms): 422.02 | crit-fwd(ms): 20.98 | bwd(ms): 646.11 | optim(ms): 57.25 | loss: 22.44189 | train-TER: 84.06 | train-WER: 91.63 | lists/dev.lst-loss: 21.30642 | lists/dev.lst-TER: 83.39 | lists/dev.lst-WER: 90.38 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 773.56
epoch: 35 | nupdates: 14070 | lr: 0.234500 | lrcriterion: 0.234500 | runtime: 00:07:35 | bch(ms): 1133.66 | smp(ms): 6.15 | fwd(ms): 422.27 | crit-fwd(ms): 21.41 | bwd(ms): 649.64 | optim(ms): 57.24 | loss: 22.12480 | train-TER: 81.17 | train-WER: 90.52 | lists/dev.lst-loss: 21.02684 | lists/dev.lst-TER: 79.89 | lists/dev.lst-WER: 88.21 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 771.17
epoch: 36 | nupdates: 14472 | lr: 0.241200 | lrcriterion: 0.241200 | runtime: 00:07:41 | bch(ms): 1148.84 | smp(ms): 7.76 | fwd(ms): 422.67 | crit-fwd(ms): 21.23 | bwd(ms): 663.88 | optim(ms): 57.24 | loss: 21.81555 | train-TER: 82.22 | train-WER: 90.66 | lists/dev.lst-loss: 21.11835 | lists/dev.lst-TER: 87.32 | lists/dev.lst-WER: 91.67 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 760.98
epoch: 37 | nupdates: 14874 | lr: 0.247900 | lrcriterion: 0.247900 | runtime: 00:07:35 | bch(ms): 1133.09 | smp(ms): 6.44 | fwd(ms): 424.03 | crit-fwd(ms): 20.94 | bwd(ms): 647.02 | optim(ms): 57.27 | loss: 21.55370 | train-TER: 83.25 | train-WER: 90.94 | lists/dev.lst-loss: 20.36272 | lists/dev.lst-TER: 73.52 | lists/dev.lst-WER: 86.09 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 771.56
epoch: 38 | nupdates: 15276 | lr: 0.254600 | lrcriterion: 0.254600 | runtime: 00:07:40 | bch(ms): 1145.25 | smp(ms): 5.53 | fwd(ms): 422.56 | crit-fwd(ms): 21.01 | bwd(ms): 660.47 | optim(ms): 57.26 | loss: 21.29312 | train-TER: 77.29 | train-WER: 88.79 | lists/dev.lst-loss: 20.38654 | lists/dev.lst-TER: 80.81 | lists/dev.lst-WER: 89.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 763.37
epoch: 39 | nupdates: 15678 | lr: 0.261300 | lrcriterion: 0.261300 | runtime: 00:07:36 | bch(ms): 1136.41 | smp(ms): 5.52 | fwd(ms): 423.50 | crit-fwd(ms): 21.09 | bwd(ms): 650.86 | optim(ms): 57.24 | loss: 21.02385 | train-TER: 78.98 | train-WER: 89.40 | lists/dev.lst-loss: 19.79664 | lists/dev.lst-TER: 73.98 | lists/dev.lst-WER: 86.68 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 769.31
epoch: 40 | nupdates: 16080 | lr: 0.268000 | lrcriterion: 0.268000 | runtime: 00:07:35 | bch(ms): 1133.78 | smp(ms): 5.99 | fwd(ms): 422.21 | crit-fwd(ms): 21.01 | bwd(ms): 649.54 | optim(ms): 57.24 | loss: 20.73723 | train-TER: 78.32 | train-WER: 89.33 | lists/dev.lst-loss: 19.84775 | lists/dev.lst-TER: 80.65 | lists/dev.lst-WER: 88.40 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 771.09
epoch: 41 | nupdates: 16482 | lr: 0.274700 | lrcriterion: 0.274700 | runtime: 00:07:36 | bch(ms): 1135.47 | smp(ms): 7.55 | fwd(ms): 422.66 | crit-fwd(ms): 21.11 | bwd(ms): 650.73 | optim(ms): 57.25 | loss: 20.50850 | train-TER: 78.49 | train-WER: 88.83 | lists/dev.lst-loss: 19.27892 | lists/dev.lst-TER: 76.16 | lists/dev.lst-WER: 85.96 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 769.95
epoch: 42 | nupdates: 16884 | lr: 0.281400 | lrcriterion: 0.281400 | runtime: 00:07:40 | bch(ms): 1144.84 | smp(ms): 7.08 | fwd(ms): 422.66 | crit-fwd(ms): 21.39 | bwd(ms): 660.14 | optim(ms): 57.25 | loss: 20.24121 | train-TER: 73.76 | train-WER: 87.45 | lists/dev.lst-loss: 19.32172 | lists/dev.lst-TER: 77.82 | lists/dev.lst-WER: 86.85 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 763.64
epoch: 43 | nupdates: 17286 | lr: 0.288100 | lrcriterion: 0.288100 | runtime: 00:07:37 | bch(ms): 1137.63 | smp(ms): 6.74 | fwd(ms): 421.10 | crit-fwd(ms): 21.22 | bwd(ms): 654.51 | optim(ms): 57.29 | loss: 19.99094 | train-TER: 75.62 | train-WER: 87.67 | lists/dev.lst-loss: 18.68604 | lists/dev.lst-TER: 70.70 | lists/dev.lst-WER: 84.20 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 768.48
epoch: 44 | nupdates: 17688 | lr: 0.294800 | lrcriterion: 0.294800 | runtime: 00:07:41 | bch(ms): 1149.25 | smp(ms): 7.17 | fwd(ms): 423.18 | crit-fwd(ms): 21.00 | bwd(ms): 663.77 | optim(ms): 57.37 | loss: 19.70648 | train-TER: 73.36 | train-WER: 86.51 | lists/dev.lst-loss: 18.57847 | lists/dev.lst-TER: 75.76 | lists/dev.lst-WER: 85.68 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 760.71
epoch: 45 | nupdates: 18090 | lr: 0.301500 | lrcriterion: 0.301500 | runtime: 00:07:34 | bch(ms): 1131.64 | smp(ms): 6.11 | fwd(ms): 421.76 | crit-fwd(ms): 20.98 | bwd(ms): 647.01 | optim(ms): 57.36 | loss: 19.43742 | train-TER: 73.22 | train-WER: 86.27 | lists/dev.lst-loss: 18.34961 | lists/dev.lst-TER: 74.32 | lists/dev.lst-WER: 85.13 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 772.55
epoch: 46 | nupdates: 18492 | lr: 0.308200 | lrcriterion: 0.308200 | runtime: 00:07:33 | bch(ms): 1128.48 | smp(ms): 5.51 | fwd(ms): 419.93 | crit-fwd(ms): 20.83 | bwd(ms): 646.09 | optim(ms): 57.25 | loss: 19.05118 | train-TER: 74.11 | train-WER: 85.84 | lists/dev.lst-loss: 17.58894 | lists/dev.lst-TER: 64.14 | lists/dev.lst-WER: 80.34 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 774.71
epoch: 47 | nupdates: 18894 | lr: 0.314900 | lrcriterion: 0.314900 | runtime: 00:07:41 | bch(ms): 1146.95 | smp(ms): 7.46 | fwd(ms): 422.25 | crit-fwd(ms): 21.00 | bwd(ms): 662.48 | optim(ms): 57.24 | loss: 18.66011 | train-TER: 73.10 | train-WER: 85.56 | lists/dev.lst-loss: 17.66062 | lists/dev.lst-TER: 74.50 | lists/dev.lst-WER: 84.44 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 762.24
epoch: 48 | nupdates: 19296 | lr: 0.321600 | lrcriterion: 0.321600 | runtime: 00:07:34 | bch(ms): 1130.11 | smp(ms): 4.35 | fwd(ms): 420.30 | crit-fwd(ms): 21.03 | bwd(ms): 646.78 | optim(ms): 57.23 | loss: 18.27108 | train-TER: 71.31 | train-WER: 84.50 | lists/dev.lst-loss: 16.95911 | lists/dev.lst-TER: 60.44 | lists/dev.lst-WER: 79.16 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 773.60
epoch: 49 | nupdates: 19698 | lr: 0.328300 | lrcriterion: 0.328300 | runtime: 00:07:41 | bch(ms): 1147.74 | smp(ms): 7.97 | fwd(ms): 421.57 | crit-fwd(ms): 21.26 | bwd(ms): 663.84 | optim(ms): 57.24 | loss: 17.92903 | train-TER: 67.56 | train-WER: 82.58 | lists/dev.lst-loss: 16.82782 | lists/dev.lst-TER: 68.85 | lists/dev.lst-WER: 81.41 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 761.71
epoch: 50 | nupdates: 20100 | lr: 0.335000 | lrcriterion: 0.335000 | runtime: 00:07:35 | bch(ms): 1134.06 | smp(ms): 8.06 | fwd(ms): 422.51 | crit-fwd(ms): 21.11 | bwd(ms): 649.76 | optim(ms): 57.25 | loss: 17.54452 | train-TER: 66.47 | train-WER: 81.19 | lists/dev.lst-loss: 16.13805 | lists/dev.lst-TER: 61.37 | lists/dev.lst-WER: 76.87 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 770.90
epoch: 51 | nupdates: 20502 | lr: 0.341700 | lrcriterion: 0.341700 | runtime: 00:07:40 | bch(ms): 1145.50 | smp(ms): 6.64 | fwd(ms): 423.10 | crit-fwd(ms): 21.18 | bwd(ms): 660.40 | optim(ms): 57.25 | loss: 17.13757 | train-TER: 67.73 | train-WER: 81.21 | lists/dev.lst-loss: 15.61902 | lists/dev.lst-TER: 59.84 | lists/dev.lst-WER: 75.38 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 763.20
epoch: 52 | nupdates: 20904 | lr: 0.348400 | lrcriterion: 0.348400 | runtime: 00:07:39 | bch(ms): 1143.70 | smp(ms): 6.74 | fwd(ms): 421.51 | crit-fwd(ms): 21.00 | bwd(ms): 660.00 | optim(ms): 57.26 | loss: 16.81060 | train-TER: 63.35 | train-WER: 79.55 | lists/dev.lst-loss: 15.24510 | lists/dev.lst-TER: 62.60 | lists/dev.lst-WER: 76.81 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 764.40
epoch: 53 | nupdates: 21306 | lr: 0.355100 | lrcriterion: 0.355100 | runtime: 00:07:36 | bch(ms): 1134.64 | smp(ms): 6.45 | fwd(ms): 422.00 | crit-fwd(ms): 21.01 | bwd(ms): 650.10 | optim(ms): 57.24 | loss: 16.43567 | train-TER: 59.04 | train-WER: 77.53 | lists/dev.lst-loss: 14.91175 | lists/dev.lst-TER: 56.93 | lists/dev.lst-WER: 73.56 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 770.51
epoch: 54 | nupdates: 21708 | lr: 0.361800 | lrcriterion: 0.361800 | runtime: 00:07:40 | bch(ms): 1145.43 | smp(ms): 3.26 | fwd(ms): 421.35 | crit-fwd(ms): 20.96 | bwd(ms): 660.83 | optim(ms): 57.19 | loss: 16.11873 | train-TER: 60.63 | train-WER: 77.64 | lists/dev.lst-loss: 14.38565 | lists/dev.lst-TER: 52.80 | lists/dev.lst-WER: 70.24 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 763.25
epoch: 55 | nupdates: 22110 | lr: 0.368500 | lrcriterion: 0.368500 | runtime: 00:07:41 | bch(ms): 1148.49 | smp(ms): 8.92 | fwd(ms): 422.61 | crit-fwd(ms): 21.27 | bwd(ms): 663.87 | optim(ms): 57.20 | loss: 15.75892 | train-TER: 60.39 | train-WER: 77.63 | lists/dev.lst-loss: 14.29904 | lists/dev.lst-TER: 48.81 | lists/dev.lst-WER: 68.70 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 761.21
epoch: 56 | nupdates: 22512 | lr: 0.375200 | lrcriterion: 0.375200 | runtime: 00:07:39 | bch(ms): 1141.89 | smp(ms): 6.19 | fwd(ms): 422.49 | crit-fwd(ms): 20.97 | bwd(ms): 657.11 | optim(ms): 57.23 | loss: 15.45886 | train-TER: 60.37 | train-WER: 77.06 | lists/dev.lst-loss: 13.65482 | lists/dev.lst-TER: 47.63 | lists/dev.lst-WER: 67.54 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 765.61
epoch: 57 | nupdates: 22914 | lr: 0.381900 | lrcriterion: 0.381900 | runtime: 00:07:40 | bch(ms): 1145.51 | smp(ms): 7.15 | fwd(ms): 421.78 | crit-fwd(ms): 21.01 | bwd(ms): 661.45 | optim(ms): 57.22 | loss: 15.17435 | train-TER: 59.77 | train-WER: 76.54 | lists/dev.lst-loss: 13.44365 | lists/dev.lst-TER: 44.45 | lists/dev.lst-WER: 65.13 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 122 | hrs: 97.62 | thrpt(sec/sec): 763.20
epoch: 58 | nupdates: 23316 | lr: 0.388600 | lrcriterion: 0.388600 | runtime: 00:07:40 | bch(ms): 1145.86 | smp(ms): 6.04 | fwd(ms): 421.68 | crit-fwd(ms): 21.06 | bwd(ms): 662.17 | optim(ms): 57.19 | loss: 14.84819 | train-TER: 60.43 | train-WER: 76.06 | lists/dev.lst-loss: 13.51374 | lists/dev.lst-TER: 49.12 | lists/dev.lst-WER: 67.48 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 762.96
epoch: 59 | nupdates: 23718 | lr: 0.395300 | lrcriterion: 0.395300 | runtime: 00:07:36 | bch(ms): 1134.66 | smp(ms): 8.54 | fwd(ms): 422.14 | crit-fwd(ms): 21.04 | bwd(ms): 650.54 | optim(ms): 57.20 | loss: 14.56374 | train-TER: 54.85 | train-WER: 73.34 | lists/dev.lst-loss: 13.13301 | lists/dev.lst-TER: 48.60 | lists/dev.lst-WER: 66.28 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 770.49
epoch: 60 | nupdates: 24120 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:33 | bch(ms): 1129.16 | smp(ms): 6.76 | fwd(ms): 421.10 | crit-fwd(ms): 21.06 | bwd(ms): 645.35 | optim(ms): 57.22 | loss: 16.87386 | train-TER: 67.22 | train-WER: 81.42 | lists/dev.lst-loss: 13.63964 | lists/dev.lst-TER: 42.41 | lists/dev.lst-WER: 65.45 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 774.25
epoch: 61 | nupdates: 24522 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:32 | bch(ms): 1125.10 | smp(ms): 8.86 | fwd(ms): 418.07 | crit-fwd(ms): 21.04 | bwd(ms): 645.10 | optim(ms): 57.23 | loss: 21.45547 | train-TER: 77.48 | train-WER: 90.32 | lists/dev.lst-loss: 13.55002 | lists/dev.lst-TER: 47.99 | lists/dev.lst-WER: 67.93 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 777.04
epoch: 62 | nupdates: 24924 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.91 | smp(ms): 5.11 | fwd(ms): 418.81 | crit-fwd(ms): 21.12 | bwd(ms): 639.95 | optim(ms): 57.26 | loss: 20.71633 | train-TER: 76.02 | train-WER: 88.70 | lists/dev.lst-loss: 13.30020 | lists/dev.lst-TER: 46.06 | lists/dev.lst-WER: 65.99 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 779.94
epoch: 63 | nupdates: 25326 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:29 | bch(ms): 1119.37 | smp(ms): 5.89 | fwd(ms): 418.99 | crit-fwd(ms): 20.97 | bwd(ms): 637.86 | optim(ms): 57.25 | loss: 20.17442 | train-TER: 69.40 | train-WER: 84.32 | lists/dev.lst-loss: 13.28457 | lists/dev.lst-TER: 44.68 | lists/dev.lst-WER: 66.18 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.02
epoch: 64 | nupdates: 25728 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:29 | bch(ms): 1119.02 | smp(ms): 6.42 | fwd(ms): 419.43 | crit-fwd(ms): 21.06 | bwd(ms): 637.73 | optim(ms): 57.26 | loss: 20.08063 | train-TER: 75.05 | train-WER: 88.59 | lists/dev.lst-loss: 13.02198 | lists/dev.lst-TER: 46.80 | lists/dev.lst-WER: 65.84 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 781.26
epoch: 65 | nupdates: 26130 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1119.49 | smp(ms): 6.99 | fwd(ms): 418.26 | crit-fwd(ms): 21.55 | bwd(ms): 639.27 | optim(ms): 57.25 | loss: 19.58498 | train-TER: 68.09 | train-WER: 83.71 | lists/dev.lst-loss: 12.71989 | lists/dev.lst-TER: 44.05 | lists/dev.lst-WER: 64.32 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.93
epoch: 66 | nupdates: 26532 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1133.26 | smp(ms): 6.72 | fwd(ms): 418.77 | crit-fwd(ms): 20.96 | bwd(ms): 651.84 | optim(ms): 57.24 | loss: 19.72613 | train-TER: 72.76 | train-WER: 88.07 | lists/dev.lst-loss: 12.66421 | lists/dev.lst-TER: 43.31 | lists/dev.lst-WER: 63.68 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 771.45
epoch: 67 | nupdates: 26934 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1130.62 | smp(ms): 7.50 | fwd(ms): 416.98 | crit-fwd(ms): 21.20 | bwd(ms): 651.13 | optim(ms): 57.25 | loss: 19.40530 | train-TER: 75.97 | train-WER: 88.02 | lists/dev.lst-loss: 12.70186 | lists/dev.lst-TER: 48.45 | lists/dev.lst-WER: 66.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 773.25
epoch: 68 | nupdates: 27336 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1123.95 | smp(ms): 7.58 | fwd(ms): 418.23 | crit-fwd(ms): 21.26 | bwd(ms): 643.42 | optim(ms): 57.26 | loss: 19.21337 | train-TER: 73.86 | train-WER: 86.98 | lists/dev.lst-loss: 12.63130 | lists/dev.lst-TER: 46.08 | lists/dev.lst-WER: 66.07 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 777.84
epoch: 69 | nupdates: 27738 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:32 | bch(ms): 1125.62 | smp(ms): 7.27 | fwd(ms): 418.83 | crit-fwd(ms): 21.04 | bwd(ms): 644.53 | optim(ms): 57.20 | loss: 18.99999 | train-TER: 60.46 | train-WER: 79.11 | lists/dev.lst-loss: 12.46292 | lists/dev.lst-TER: 41.57 | lists/dev.lst-WER: 61.95 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 776.68
epoch: 70 | nupdates: 28140 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:37 | bch(ms): 1137.23 | smp(ms): 6.42 | fwd(ms): 419.49 | crit-fwd(ms): 21.29 | bwd(ms): 655.77 | optim(ms): 57.23 | loss: 18.98772 | train-TER: 76.27 | train-WER: 87.71 | lists/dev.lst-loss: 12.18081 | lists/dev.lst-TER: 45.37 | lists/dev.lst-WER: 64.05 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 768.75
epoch: 71 | nupdates: 28542 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1123.40 | smp(ms): 7.20 | fwd(ms): 417.76 | crit-fwd(ms): 21.23 | bwd(ms): 643.34 | optim(ms): 57.24 | loss: 18.84176 | train-TER: 73.31 | train-WER: 86.87 | lists/dev.lst-loss: 12.14791 | lists/dev.lst-TER: 45.42 | lists/dev.lst-WER: 63.44 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 778.22
epoch: 72 | nupdates: 28944 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1124.11 | smp(ms): 6.66 | fwd(ms): 418.96 | crit-fwd(ms): 21.20 | bwd(ms): 643.23 | optim(ms): 57.24 | loss: 18.80567 | train-TER: 73.30 | train-WER: 86.68 | lists/dev.lst-loss: 12.02671 | lists/dev.lst-TER: 42.09 | lists/dev.lst-WER: 61.90 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 777.72
epoch: 73 | nupdates: 29346 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1131.13 | smp(ms): 7.75 | fwd(ms): 418.28 | crit-fwd(ms): 21.02 | bwd(ms): 650.23 | optim(ms): 57.27 | loss: 18.77794 | train-TER: 72.03 | train-WER: 86.25 | lists/dev.lst-loss: 12.01790 | lists/dev.lst-TER: 40.61 | lists/dev.lst-WER: 61.44 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 772.90
epoch: 74 | nupdates: 29748 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1134.32 | smp(ms): 7.54 | fwd(ms): 418.35 | crit-fwd(ms): 21.14 | bwd(ms): 653.94 | optim(ms): 57.23 | loss: 18.32982 | train-TER: 62.36 | train-WER: 78.98 | lists/dev.lst-loss: 11.77249 | lists/dev.lst-TER: 40.03 | lists/dev.lst-WER: 60.40 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 770.72
epoch: 75 | nupdates: 30150 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1132.74 | smp(ms): 7.07 | fwd(ms): 417.21 | crit-fwd(ms): 21.14 | bwd(ms): 653.29 | optim(ms): 57.25 | loss: 18.10331 | train-TER: 67.54 | train-WER: 83.25 | lists/dev.lst-loss: 11.88006 | lists/dev.lst-TER: 44.97 | lists/dev.lst-WER: 63.48 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 771.80
epoch: 76 | nupdates: 30552 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1123.24 | smp(ms): 7.33 | fwd(ms): 418.31 | crit-fwd(ms): 21.06 | bwd(ms): 642.41 | optim(ms): 57.23 | loss: 18.19987 | train-TER: 66.21 | train-WER: 81.83 | lists/dev.lst-loss: 11.64802 | lists/dev.lst-TER: 38.08 | lists/dev.lst-WER: 59.33 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 778.33
epoch: 77 | nupdates: 30954 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1134.16 | smp(ms): 6.83 | fwd(ms): 418.81 | crit-fwd(ms): 21.14 | bwd(ms): 652.94 | optim(ms): 57.22 | loss: 17.87337 | train-TER: 65.52 | train-WER: 81.45 | lists/dev.lst-loss: 11.49395 | lists/dev.lst-TER: 43.04 | lists/dev.lst-WER: 61.59 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 770.83
epoch: 78 | nupdates: 31356 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.47 | smp(ms): 7.16 | fwd(ms): 418.49 | crit-fwd(ms): 20.92 | bwd(ms): 641.50 | optim(ms): 57.23 | loss: 17.93354 | train-TER: 66.74 | train-WER: 82.42 | lists/dev.lst-loss: 11.53457 | lists/dev.lst-TER: 44.62 | lists/dev.lst-WER: 62.73 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 778.86
epoch: 79 | nupdates: 31758 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1121.90 | smp(ms): 7.80 | fwd(ms): 418.90 | crit-fwd(ms): 21.27 | bwd(ms): 640.79 | optim(ms): 57.24 | loss: 17.75793 | train-TER: 61.36 | train-WER: 79.35 | lists/dev.lst-loss: 11.33377 | lists/dev.lst-TER: 40.68 | lists/dev.lst-WER: 59.84 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 779.26
epoch: 80 | nupdates: 32160 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.48 | smp(ms): 7.78 | fwd(ms): 418.51 | crit-fwd(ms): 21.31 | bwd(ms): 641.91 | optim(ms): 57.22 | loss: 17.75346 | train-TER: 63.90 | train-WER: 81.03 | lists/dev.lst-loss: 11.22176 | lists/dev.lst-TER: 40.38 | lists/dev.lst-WER: 59.44 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 778.86
epoch: 81 | nupdates: 32562 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1123.61 | smp(ms): 7.85 | fwd(ms): 418.22 | crit-fwd(ms): 21.18 | bwd(ms): 643.19 | optim(ms): 57.22 | loss: 17.48617 | train-TER: 69.01 | train-WER: 83.84 | lists/dev.lst-loss: 11.07498 | lists/dev.lst-TER: 35.81 | lists/dev.lst-WER: 56.74 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 778.07
epoch: 82 | nupdates: 32964 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:37 | bch(ms): 1137.38 | smp(ms): 7.23 | fwd(ms): 418.50 | crit-fwd(ms): 21.13 | bwd(ms): 656.16 | optim(ms): 57.23 | loss: 17.39745 | train-TER: 63.26 | train-WER: 79.87 | lists/dev.lst-loss: 10.84792 | lists/dev.lst-TER: 36.81 | lists/dev.lst-WER: 56.35 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 768.65
epoch: 83 | nupdates: 33366 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:36 | bch(ms): 1134.75 | smp(ms): 7.89 | fwd(ms): 417.85 | crit-fwd(ms): 21.14 | bwd(ms): 654.77 | optim(ms): 57.23 | loss: 17.28212 | train-TER: 65.13 | train-WER: 81.28 | lists/dev.lst-loss: 11.26261 | lists/dev.lst-TER: 42.08 | lists/dev.lst-WER: 60.51 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 770.43
epoch: 84 | nupdates: 33768 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.63 | smp(ms): 7.56 | fwd(ms): 418.39 | crit-fwd(ms): 21.14 | bwd(ms): 640.19 | optim(ms): 57.25 | loss: 17.15141 | train-TER: 64.19 | train-WER: 81.78 | lists/dev.lst-loss: 10.67227 | lists/dev.lst-TER: 35.93 | lists/dev.lst-WER: 56.14 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.14
epoch: 85 | nupdates: 34170 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1130.12 | smp(ms): 5.89 | fwd(ms): 418.70 | crit-fwd(ms): 20.91 | bwd(ms): 649.21 | optim(ms): 57.25 | loss: 17.23015 | train-TER: 59.35 | train-WER: 77.02 | lists/dev.lst-loss: 10.85940 | lists/dev.lst-TER: 40.46 | lists/dev.lst-WER: 58.30 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 773.59
epoch: 86 | nupdates: 34572 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1119.93 | smp(ms): 6.37 | fwd(ms): 419.06 | crit-fwd(ms): 21.07 | bwd(ms): 638.80 | optim(ms): 57.24 | loss: 16.96564 | train-TER: 59.62 | train-WER: 77.21 | lists/dev.lst-loss: 10.54389 | lists/dev.lst-TER: 33.87 | lists/dev.lst-WER: 54.50 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.63
epoch: 87 | nupdates: 34974 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:36 | bch(ms): 1136.42 | smp(ms): 6.93 | fwd(ms): 419.02 | crit-fwd(ms): 21.06 | bwd(ms): 655.43 | optim(ms): 57.21 | loss: 16.96073 | train-TER: 68.13 | train-WER: 84.00 | lists/dev.lst-loss: 10.39644 | lists/dev.lst-TER: 33.70 | lists/dev.lst-WER: 54.05 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 769.30
epoch: 88 | nupdates: 35376 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1129.80 | smp(ms): 6.66 | fwd(ms): 417.09 | crit-fwd(ms): 21.29 | bwd(ms): 650.51 | optim(ms): 57.28 | loss: 16.97702 | train-TER: 61.65 | train-WER: 78.93 | lists/dev.lst-loss: 10.37635 | lists/dev.lst-TER: 34.83 | lists/dev.lst-WER: 54.44 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 773.81
epoch: 89 | nupdates: 35778 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.01 | smp(ms): 6.28 | fwd(ms): 419.88 | crit-fwd(ms): 21.10 | bwd(ms): 639.82 | optim(ms): 57.26 | loss: 16.70030 | train-TER: 61.79 | train-WER: 79.76 | lists/dev.lst-loss: 10.30520 | lists/dev.lst-TER: 35.69 | lists/dev.lst-WER: 54.87 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 779.18
epoch: 90 | nupdates: 36180 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1119.76 | smp(ms): 7.48 | fwd(ms): 417.94 | crit-fwd(ms): 20.95 | bwd(ms): 639.86 | optim(ms): 57.25 | loss: 16.57162 | train-TER: 64.12 | train-WER: 80.89 | lists/dev.lst-loss: 10.44773 | lists/dev.lst-TER: 37.63 | lists/dev.lst-WER: 56.15 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.74
epoch: 91 | nupdates: 36582 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1121.21 | smp(ms): 5.99 | fwd(ms): 417.96 | crit-fwd(ms): 21.07 | bwd(ms): 641.30 | optim(ms): 57.23 | loss: 16.66347 | train-TER: 72.31 | train-WER: 86.37 | lists/dev.lst-loss: 10.27144 | lists/dev.lst-TER: 36.66 | lists/dev.lst-WER: 55.65 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 779.73
epoch: 92 | nupdates: 36984 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.99 | smp(ms): 7.79 | fwd(ms): 416.70 | crit-fwd(ms): 21.11 | bwd(ms): 644.19 | optim(ms): 57.24 | loss: 16.51025 | train-TER: 62.98 | train-WER: 80.44 | lists/dev.lst-loss: 10.24336 | lists/dev.lst-TER: 37.91 | lists/dev.lst-WER: 55.91 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 778.50
epoch: 93 | nupdates: 37386 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1119.46 | smp(ms): 7.91 | fwd(ms): 418.74 | crit-fwd(ms): 21.16 | bwd(ms): 638.47 | optim(ms): 57.23 | loss: 16.45285 | train-TER: 58.88 | train-WER: 76.47 | lists/dev.lst-loss: 10.05003 | lists/dev.lst-TER: 36.03 | lists/dev.lst-WER: 54.24 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.96
epoch: 94 | nupdates: 37788 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1123.92 | smp(ms): 7.03 | fwd(ms): 419.59 | crit-fwd(ms): 21.21 | bwd(ms): 642.18 | optim(ms): 57.23 | loss: 16.21421 | train-TER: 55.38 | train-WER: 74.05 | lists/dev.lst-loss: 10.35817 | lists/dev.lst-TER: 39.70 | lists/dev.lst-WER: 57.53 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 777.86
epoch: 95 | nupdates: 38190 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:29 | bch(ms): 1118.96 | smp(ms): 6.40 | fwd(ms): 418.07 | crit-fwd(ms): 21.08 | bwd(ms): 638.74 | optim(ms): 57.26 | loss: 16.16825 | train-TER: 60.08 | train-WER: 78.45 | lists/dev.lst-loss: 9.88431 | lists/dev.lst-TER: 32.12 | lists/dev.lst-WER: 51.58 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.31
epoch: 96 | nupdates: 38592 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1130.12 | smp(ms): 6.94 | fwd(ms): 417.99 | crit-fwd(ms): 21.18 | bwd(ms): 650.34 | optim(ms): 57.25 | loss: 16.20026 | train-TER: 63.33 | train-WER: 79.86 | lists/dev.lst-loss: 9.79642 | lists/dev.lst-TER: 33.20 | lists/dev.lst-WER: 52.22 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 773.59
epoch: 97 | nupdates: 38994 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:32 | bch(ms): 1124.70 | smp(ms): 7.61 | fwd(ms): 418.32 | crit-fwd(ms): 21.22 | bwd(ms): 644.16 | optim(ms): 57.24 | loss: 16.09557 | train-TER: 58.97 | train-WER: 76.51 | lists/dev.lst-loss: 9.88127 | lists/dev.lst-TER: 34.17 | lists/dev.lst-WER: 52.93 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 777.32
epoch: 98 | nupdates: 39396 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:29 | bch(ms): 1118.37 | smp(ms): 4.69 | fwd(ms): 417.67 | crit-fwd(ms): 20.97 | bwd(ms): 637.75 | optim(ms): 57.24 | loss: 15.98377 | train-TER: 61.28 | train-WER: 78.19 | lists/dev.lst-loss: 9.94061 | lists/dev.lst-TER: 33.23 | lists/dev.lst-WER: 52.73 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.72
epoch: 99 | nupdates: 39798 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.48 | smp(ms): 7.05 | fwd(ms): 419.57 | crit-fwd(ms): 21.06 | bwd(ms): 640.84 | optim(ms): 57.23 | loss: 15.81249 | train-TER: 57.55 | train-WER: 74.73 | lists/dev.lst-loss: 9.96920 | lists/dev.lst-TER: 36.11 | lists/dev.lst-WER: 53.77 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 778.85
epoch: 100 | nupdates: 40200 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1123.62 | smp(ms): 7.26 | fwd(ms): 418.33 | crit-fwd(ms): 21.10 | bwd(ms): 643.28 | optim(ms): 57.22 | loss: 15.76856 | train-TER: 59.21 | train-WER: 77.85 | lists/dev.lst-loss: 9.51413 | lists/dev.lst-TER: 30.03 | lists/dev.lst-WER: 49.86 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 778.07
epoch: 101 | nupdates: 40602 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1131.74 | smp(ms): 6.39 | fwd(ms): 417.90 | crit-fwd(ms): 21.04 | bwd(ms): 651.28 | optim(ms): 57.24 | loss: 15.81209 | train-TER: 61.84 | train-WER: 79.23 | lists/dev.lst-loss: 9.53090 | lists/dev.lst-TER: 30.82 | lists/dev.lst-WER: 50.05 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 772.48
epoch: 102 | nupdates: 41004 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.38 | smp(ms): 3.82 | fwd(ms): 418.55 | crit-fwd(ms): 21.18 | bwd(ms): 641.00 | optim(ms): 57.25 | loss: 15.74271 | train-TER: 53.49 | train-WER: 72.16 | lists/dev.lst-loss: 9.50530 | lists/dev.lst-TER: 32.22 | lists/dev.lst-WER: 50.62 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 778.93
epoch: 103 | nupdates: 41406 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1123.01 | smp(ms): 8.31 | fwd(ms): 418.96 | crit-fwd(ms): 21.07 | bwd(ms): 641.75 | optim(ms): 57.25 | loss: 15.66112 | train-TER: 57.97 | train-WER: 74.97 | lists/dev.lst-loss: 9.41947 | lists/dev.lst-TER: 32.10 | lists/dev.lst-WER: 50.81 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 778.49
epoch: 104 | nupdates: 41808 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.88 | smp(ms): 7.73 | fwd(ms): 417.89 | crit-fwd(ms): 21.45 | bwd(ms): 640.54 | optim(ms): 57.23 | loss: 15.52963 | train-TER: 55.11 | train-WER: 73.25 | lists/dev.lst-loss: 9.42631 | lists/dev.lst-TER: 29.26 | lists/dev.lst-WER: 48.94 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 779.97
epoch: 105 | nupdates: 42210 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1134.11 | smp(ms): 7.14 | fwd(ms): 419.47 | crit-fwd(ms): 21.01 | bwd(ms): 652.28 | optim(ms): 57.24 | loss: 15.51499 | train-TER: 59.74 | train-WER: 77.59 | lists/dev.lst-loss: 9.35540 | lists/dev.lst-TER: 31.02 | lists/dev.lst-WER: 49.82 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 770.87
epoch: 106 | nupdates: 42612 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1124.01 | smp(ms): 7.68 | fwd(ms): 418.97 | crit-fwd(ms): 21.25 | bwd(ms): 642.72 | optim(ms): 57.25 | loss: 15.45425 | train-TER: 57.54 | train-WER: 75.21 | lists/dev.lst-loss: 9.14207 | lists/dev.lst-TER: 29.30 | lists/dev.lst-WER: 48.06 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 777.79
epoch: 107 | nupdates: 43014 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1132.45 | smp(ms): 7.03 | fwd(ms): 417.94 | crit-fwd(ms): 20.93 | bwd(ms): 652.00 | optim(ms): 57.24 | loss: 15.57122 | train-TER: 61.49 | train-WER: 77.95 | lists/dev.lst-loss: 9.31035 | lists/dev.lst-TER: 30.57 | lists/dev.lst-WER: 49.64 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 772.00
epoch: 108 | nupdates: 43416 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:28 | bch(ms): 1116.64 | smp(ms): 6.87 | fwd(ms): 418.93 | crit-fwd(ms): 21.18 | bwd(ms): 635.80 | optim(ms): 57.24 | loss: 15.27094 | train-TER: 58.17 | train-WER: 76.04 | lists/dev.lst-loss: 9.14575 | lists/dev.lst-TER: 31.28 | lists/dev.lst-WER: 49.39 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 782.92
epoch: 109 | nupdates: 43818 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.61 | smp(ms): 7.85 | fwd(ms): 417.61 | crit-fwd(ms): 21.15 | bwd(ms): 640.69 | optim(ms): 57.23 | loss: 15.31628 | train-TER: 55.99 | train-WER: 73.51 | lists/dev.lst-loss: 9.24124 | lists/dev.lst-TER: 31.79 | lists/dev.lst-WER: 50.12 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.16
epoch: 110 | nupdates: 44220 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1121.60 | smp(ms): 7.31 | fwd(ms): 417.53 | crit-fwd(ms): 21.18 | bwd(ms): 641.78 | optim(ms): 57.22 | loss: 15.14866 | train-TER: 52.46 | train-WER: 71.79 | lists/dev.lst-loss: 9.46158 | lists/dev.lst-TER: 33.22 | lists/dev.lst-WER: 51.26 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 779.47
epoch: 111 | nupdates: 44622 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.36 | smp(ms): 6.25 | fwd(ms): 417.26 | crit-fwd(ms): 21.06 | bwd(ms): 641.07 | optim(ms): 57.29 | loss: 15.13038 | train-TER: 63.11 | train-WER: 79.56 | lists/dev.lst-loss: 9.24710 | lists/dev.lst-TER: 32.18 | lists/dev.lst-WER: 50.31 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 780.33
epoch: 112 | nupdates: 45024 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.70 | smp(ms): 8.38 | fwd(ms): 418.81 | crit-fwd(ms): 21.05 | bwd(ms): 641.54 | optim(ms): 57.25 | loss: 14.79451 | train-TER: 55.67 | train-WER: 73.78 | lists/dev.lst-loss: 9.48923 | lists/dev.lst-TER: 34.71 | lists/dev.lst-WER: 51.76 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 778.70
epoch: 113 | nupdates: 45426 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1124.32 | smp(ms): 7.22 | fwd(ms): 419.14 | crit-fwd(ms): 21.21 | bwd(ms): 643.22 | optim(ms): 57.22 | loss: 15.04601 | train-TER: 57.83 | train-WER: 77.00 | lists/dev.lst-loss: 8.84531 | lists/dev.lst-TER: 28.22 | lists/dev.lst-WER: 47.08 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 118 | hrs: 97.62 | thrpt(sec/sec): 777.58
epoch: 114 | nupdates: 45828 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1132.75 | smp(ms): 6.37 | fwd(ms): 417.87 | crit-fwd(ms): 20.90 | bwd(ms): 652.50 | optim(ms): 57.22 | loss: 14.98419 | train-TER: 54.90 | train-WER: 73.11 | lists/dev.lst-loss: 8.84740 | lists/dev.lst-TER: 28.65 | lists/dev.lst-WER: 46.94 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 771.79
epoch: 115 | nupdates: 46230 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1132.20 | smp(ms): 6.90 | fwd(ms): 417.62 | crit-fwd(ms): 21.23 | bwd(ms): 652.60 | optim(ms): 57.22 | loss: 14.90790 | train-TER: 54.74 | train-WER: 72.87 | lists/dev.lst-loss: 9.17924 | lists/dev.lst-TER: 34.00 | lists/dev.lst-WER: 50.81 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 772.16
epoch: 116 | nupdates: 46632 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:28 | bch(ms): 1116.33 | smp(ms): 6.13 | fwd(ms): 417.84 | crit-fwd(ms): 21.07 | bwd(ms): 636.08 | optim(ms): 57.26 | loss: 14.75618 | train-TER: 54.01 | train-WER: 72.20 | lists/dev.lst-loss: 9.03953 | lists/dev.lst-TER: 32.32 | lists/dev.lst-WER: 49.94 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 118 | hrs: 97.62 | thrpt(sec/sec): 783.14
epoch: 117 | nupdates: 47034 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.72 | smp(ms): 7.69 | fwd(ms): 417.78 | crit-fwd(ms): 21.17 | bwd(ms): 640.88 | optim(ms): 57.22 | loss: 14.70447 | train-TER: 56.60 | train-WER: 74.05 | lists/dev.lst-loss: 8.68354 | lists/dev.lst-TER: 28.65 | lists/dev.lst-WER: 46.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.08
epoch: 118 | nupdates: 47436 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1133.00 | smp(ms): 6.40 | fwd(ms): 419.00 | crit-fwd(ms): 21.18 | bwd(ms): 651.91 | optim(ms): 57.25 | loss: 14.44669 | train-TER: 60.53 | train-WER: 77.53 | lists/dev.lst-loss: 8.61744 | lists/dev.lst-TER: 28.26 | lists/dev.lst-WER: 46.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 771.62
epoch: 119 | nupdates: 47838 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1130.27 | smp(ms): 4.22 | fwd(ms): 418.88 | crit-fwd(ms): 21.04 | bwd(ms): 648.67 | optim(ms): 57.32 | loss: 14.79736 | train-TER: 57.66 | train-WER: 74.98 | lists/dev.lst-loss: 8.73393 | lists/dev.lst-TER: 29.20 | lists/dev.lst-WER: 47.10 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 773.49
epoch: 120 | nupdates: 48240 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.77 | smp(ms): 6.86 | fwd(ms): 419.23 | crit-fwd(ms): 21.22 | bwd(ms): 639.35 | optim(ms): 57.24 | loss: 14.56824 | train-TER: 55.75 | train-WER: 73.51 | lists/dev.lst-loss: 8.78212 | lists/dev.lst-TER: 30.67 | lists/dev.lst-WER: 47.94 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 780.04
epoch: 121 | nupdates: 48642 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.75 | smp(ms): 6.83 | fwd(ms): 418.89 | crit-fwd(ms): 21.04 | bwd(ms): 639.34 | optim(ms): 57.23 | loss: 14.55233 | train-TER: 51.83 | train-WER: 70.12 | lists/dev.lst-loss: 8.54195 | lists/dev.lst-TER: 28.51 | lists/dev.lst-WER: 46.58 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.06
epoch: 122 | nupdates: 49044 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.38 | smp(ms): 6.72 | fwd(ms): 417.57 | crit-fwd(ms): 21.09 | bwd(ms): 641.02 | optim(ms): 57.22 | loss: 14.63787 | train-TER: 52.36 | train-WER: 71.13 | lists/dev.lst-loss: 8.48944 | lists/dev.lst-TER: 28.34 | lists/dev.lst-WER: 45.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.31
epoch: 123 | nupdates: 49446 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1129.46 | smp(ms): 6.02 | fwd(ms): 418.48 | crit-fwd(ms): 21.30 | bwd(ms): 648.68 | optim(ms): 57.26 | loss: 14.38288 | train-TER: 56.75 | train-WER: 74.53 | lists/dev.lst-loss: 8.54591 | lists/dev.lst-TER: 28.70 | lists/dev.lst-WER: 46.51 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 774.04
epoch: 124 | nupdates: 49848 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1123.11 | smp(ms): 7.97 | fwd(ms): 418.06 | crit-fwd(ms): 21.13 | bwd(ms): 642.75 | optim(ms): 57.22 | loss: 14.52782 | train-TER: 63.02 | train-WER: 80.15 | lists/dev.lst-loss: 8.46953 | lists/dev.lst-TER: 26.28 | lists/dev.lst-WER: 44.44 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 778.41
epoch: 125 | nupdates: 50250 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1131.36 | smp(ms): 6.24 | fwd(ms): 417.97 | crit-fwd(ms): 21.13 | bwd(ms): 651.07 | optim(ms): 57.23 | loss: 14.28490 | train-TER: 55.92 | train-WER: 73.66 | lists/dev.lst-loss: 8.39460 | lists/dev.lst-TER: 26.71 | lists/dev.lst-WER: 44.47 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 772.74
epoch: 126 | nupdates: 50652 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.37 | smp(ms): 7.22 | fwd(ms): 418.08 | crit-fwd(ms): 21.16 | bwd(ms): 640.12 | optim(ms): 57.22 | loss: 14.30071 | train-TER: 51.42 | train-WER: 69.99 | lists/dev.lst-loss: 8.45202 | lists/dev.lst-TER: 28.54 | lists/dev.lst-WER: 45.85 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 780.32
epoch: 127 | nupdates: 51054 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1121.50 | smp(ms): 6.19 | fwd(ms): 418.02 | crit-fwd(ms): 21.01 | bwd(ms): 641.46 | optim(ms): 57.24 | loss: 14.16151 | train-TER: 58.02 | train-WER: 75.33 | lists/dev.lst-loss: 8.34970 | lists/dev.lst-TER: 26.30 | lists/dev.lst-WER: 44.20 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 779.53
epoch: 128 | nupdates: 51456 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1132.72 | smp(ms): 7.15 | fwd(ms): 419.47 | crit-fwd(ms): 21.15 | bwd(ms): 651.32 | optim(ms): 57.21 | loss: 14.27378 | train-TER: 54.79 | train-WER: 73.47 | lists/dev.lst-loss: 8.38338 | lists/dev.lst-TER: 26.80 | lists/dev.lst-WER: 44.70 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 771.81
epoch: 129 | nupdates: 51858 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:29 | bch(ms): 1118.82 | smp(ms): 6.32 | fwd(ms): 418.65 | crit-fwd(ms): 20.99 | bwd(ms): 638.10 | optim(ms): 57.22 | loss: 14.27120 | train-TER: 47.64 | train-WER: 67.11 | lists/dev.lst-loss: 8.61761 | lists/dev.lst-TER: 30.06 | lists/dev.lst-WER: 46.98 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 781.40
epoch: 130 | nupdates: 52260 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1119.54 | smp(ms): 6.17 | fwd(ms): 418.09 | crit-fwd(ms): 20.92 | bwd(ms): 639.05 | optim(ms): 57.25 | loss: 14.22493 | train-TER: 56.97 | train-WER: 75.34 | lists/dev.lst-loss: 8.38831 | lists/dev.lst-TER: 27.07 | lists/dev.lst-WER: 44.18 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.90
epoch: 131 | nupdates: 52662 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:36 | bch(ms): 1135.17 | smp(ms): 7.17 | fwd(ms): 419.02 | crit-fwd(ms): 21.01 | bwd(ms): 653.97 | optim(ms): 57.21 | loss: 14.15012 | train-TER: 48.26 | train-WER: 66.47 | lists/dev.lst-loss: 8.24389 | lists/dev.lst-TER: 26.25 | lists/dev.lst-WER: 43.79 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 770.15
epoch: 132 | nupdates: 53064 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1132.02 | smp(ms): 8.45 | fwd(ms): 416.94 | crit-fwd(ms): 21.20 | bwd(ms): 653.04 | optim(ms): 57.25 | loss: 14.06675 | train-TER: 49.62 | train-WER: 68.83 | lists/dev.lst-loss: 8.20475 | lists/dev.lst-TER: 25.15 | lists/dev.lst-WER: 43.01 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 772.29
epoch: 133 | nupdates: 53466 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:33 | bch(ms): 1129.34 | smp(ms): 5.51 | fwd(ms): 417.24 | crit-fwd(ms): 21.23 | bwd(ms): 650.27 | optim(ms): 57.24 | loss: 14.13045 | train-TER: 53.23 | train-WER: 70.71 | lists/dev.lst-loss: 8.45529 | lists/dev.lst-TER: 30.17 | lists/dev.lst-WER: 46.61 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 774.12
epoch: 134 | nupdates: 53868 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.69 | smp(ms): 5.10 | fwd(ms): 418.72 | crit-fwd(ms): 20.96 | bwd(ms): 640.99 | optim(ms): 57.25 | loss: 13.92196 | train-TER: 53.81 | train-WER: 73.25 | lists/dev.lst-loss: 8.14939 | lists/dev.lst-TER: 25.41 | lists/dev.lst-WER: 43.17 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 778.71
epoch: 135 | nupdates: 54270 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:32 | bch(ms): 1126.56 | smp(ms): 7.44 | fwd(ms): 418.16 | crit-fwd(ms): 21.08 | bwd(ms): 645.95 | optim(ms): 57.22 | loss: 13.85039 | train-TER: 55.79 | train-WER: 74.12 | lists/dev.lst-loss: 8.05329 | lists/dev.lst-TER: 24.56 | lists/dev.lst-WER: 42.45 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 776.03
epoch: 136 | nupdates: 54672 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:37 | bch(ms): 1137.13 | smp(ms): 6.73 | fwd(ms): 420.51 | crit-fwd(ms): 21.10 | bwd(ms): 654.46 | optim(ms): 57.23 | loss: 13.76668 | train-TER: 42.65 | train-WER: 62.36 | lists/dev.lst-loss: 8.38886 | lists/dev.lst-TER: 27.73 | lists/dev.lst-WER: 45.10 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 768.82
epoch: 137 | nupdates: 55074 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1121.51 | smp(ms): 6.49 | fwd(ms): 418.75 | crit-fwd(ms): 21.01 | bwd(ms): 640.40 | optim(ms): 57.26 | loss: 13.59661 | train-TER: 51.50 | train-WER: 69.32 | lists/dev.lst-loss: 8.15681 | lists/dev.lst-TER: 26.36 | lists/dev.lst-WER: 43.67 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 779.53
epoch: 138 | nupdates: 55476 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:29 | bch(ms): 1119.27 | smp(ms): 6.58 | fwd(ms): 418.45 | crit-fwd(ms): 20.97 | bwd(ms): 638.65 | optim(ms): 57.25 | loss: 13.81801 | train-TER: 54.59 | train-WER: 72.60 | lists/dev.lst-loss: 7.96134 | lists/dev.lst-TER: 24.83 | lists/dev.lst-WER: 42.46 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.09
epoch: 139 | nupdates: 55878 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:29 | bch(ms): 1118.52 | smp(ms): 6.20 | fwd(ms): 417.46 | crit-fwd(ms): 20.99 | bwd(ms): 638.32 | optim(ms): 57.26 | loss: 13.70655 | train-TER: 47.13 | train-WER: 66.18 | lists/dev.lst-loss: 8.01994 | lists/dev.lst-TER: 26.69 | lists/dev.lst-WER: 43.72 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.61
epoch: 140 | nupdates: 56280 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1119.82 | smp(ms): 7.56 | fwd(ms): 417.32 | crit-fwd(ms): 21.02 | bwd(ms): 640.10 | optim(ms): 57.26 | loss: 13.70011 | train-TER: 53.84 | train-WER: 72.36 | lists/dev.lst-loss: 8.19977 | lists/dev.lst-TER: 27.70 | lists/dev.lst-WER: 44.28 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.70
epoch: 141 | nupdates: 56682 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1121.92 | smp(ms): 6.89 | fwd(ms): 418.91 | crit-fwd(ms): 21.00 | bwd(ms): 640.59 | optim(ms): 57.24 | loss: 13.63012 | train-TER: 48.99 | train-WER: 68.01 | lists/dev.lst-loss: 7.94642 | lists/dev.lst-TER: 24.27 | lists/dev.lst-WER: 41.87 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 779.25
epoch: 142 | nupdates: 57084 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1130.39 | smp(ms): 6.96 | fwd(ms): 418.33 | crit-fwd(ms): 21.33 | bwd(ms): 650.13 | optim(ms): 57.26 | loss: 13.45313 | train-TER: 58.71 | train-WER: 75.33 | lists/dev.lst-loss: 8.08680 | lists/dev.lst-TER: 26.78 | lists/dev.lst-WER: 43.58 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 773.41
epoch: 143 | nupdates: 57486 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.77 | smp(ms): 5.94 | fwd(ms): 419.40 | crit-fwd(ms): 21.08 | bwd(ms): 639.17 | optim(ms): 57.23 | loss: 13.41076 | train-TER: 52.01 | train-WER: 70.68 | lists/dev.lst-loss: 7.79057 | lists/dev.lst-TER: 24.24 | lists/dev.lst-WER: 41.24 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.04
epoch: 144 | nupdates: 57888 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:36 | bch(ms): 1134.61 | smp(ms): 7.52 | fwd(ms): 417.67 | crit-fwd(ms): 21.29 | bwd(ms): 654.73 | optim(ms): 57.23 | loss: 13.50784 | train-TER: 49.80 | train-WER: 67.70 | lists/dev.lst-loss: 7.82797 | lists/dev.lst-TER: 24.47 | lists/dev.lst-WER: 41.63 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 770.53
epoch: 145 | nupdates: 58290 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.62 | smp(ms): 8.08 | fwd(ms): 418.27 | crit-fwd(ms): 21.01 | bwd(ms): 642.08 | optim(ms): 57.22 | loss: 13.60574 | train-TER: 53.65 | train-WER: 71.02 | lists/dev.lst-loss: 7.89450 | lists/dev.lst-TER: 24.69 | lists/dev.lst-WER: 41.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 778.76
epoch: 146 | nupdates: 58692 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1119.67 | smp(ms): 4.76 | fwd(ms): 418.44 | crit-fwd(ms): 21.08 | bwd(ms): 639.10 | optim(ms): 57.25 | loss: 13.35476 | train-TER: 43.18 | train-WER: 63.36 | lists/dev.lst-loss: 8.20162 | lists/dev.lst-TER: 28.46 | lists/dev.lst-WER: 44.73 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.81
epoch: 147 | nupdates: 59094 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1119.45 | smp(ms): 7.45 | fwd(ms): 417.46 | crit-fwd(ms): 21.00 | bwd(ms): 639.82 | optim(ms): 57.23 | loss: 13.47927 | train-TER: 52.87 | train-WER: 72.35 | lists/dev.lst-loss: 7.85984 | lists/dev.lst-TER: 25.10 | lists/dev.lst-WER: 41.75 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 780.96
epoch: 148 | nupdates: 59496 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.02 | smp(ms): 6.66 | fwd(ms): 416.54 | crit-fwd(ms): 21.18 | bwd(ms): 641.34 | optim(ms): 57.22 | loss: 13.18582 | train-TER: 46.08 | train-WER: 65.95 | lists/dev.lst-loss: 7.93400 | lists/dev.lst-TER: 25.89 | lists/dev.lst-WER: 42.28 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.56
epoch: 149 | nupdates: 59898 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1119.89 | smp(ms): 4.96 | fwd(ms): 418.69 | crit-fwd(ms): 21.08 | bwd(ms): 639.19 | optim(ms): 57.24 | loss: 13.08399 | train-TER: 49.58 | train-WER: 68.11 | lists/dev.lst-loss: 7.71010 | lists/dev.lst-TER: 24.09 | lists/dev.lst-WER: 41.10 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.66
epoch: 150 | nupdates: 60300 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:36 | bch(ms): 1134.66 | smp(ms): 6.52 | fwd(ms): 418.09 | crit-fwd(ms): 21.12 | bwd(ms): 654.55 | optim(ms): 57.20 | loss: 13.22116 | train-TER: 52.56 | train-WER: 69.53 | lists/dev.lst-loss: 7.74704 | lists/dev.lst-TER: 25.23 | lists/dev.lst-WER: 41.60 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 770.49
epoch: 151 | nupdates: 60702 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1124.24 | smp(ms): 6.89 | fwd(ms): 417.76 | crit-fwd(ms): 20.98 | bwd(ms): 644.57 | optim(ms): 57.21 | loss: 13.38768 | train-TER: 53.51 | train-WER: 71.08 | lists/dev.lst-loss: 7.78949 | lists/dev.lst-TER: 25.18 | lists/dev.lst-WER: 41.53 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 777.64
epoch: 152 | nupdates: 61104 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1121.62 | smp(ms): 8.88 | fwd(ms): 417.45 | crit-fwd(ms): 21.04 | bwd(ms): 642.11 | optim(ms): 57.19 | loss: 13.26836 | train-TER: 44.32 | train-WER: 63.81 | lists/dev.lst-loss: 7.86794 | lists/dev.lst-TER: 25.89 | lists/dev.lst-WER: 42.13 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 779.45
epoch: 153 | nupdates: 61506 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.38 | smp(ms): 7.34 | fwd(ms): 419.23 | crit-fwd(ms): 21.01 | bwd(ms): 640.85 | optim(ms): 57.23 | loss: 13.18466 | train-TER: 47.50 | train-WER: 65.92 | lists/dev.lst-loss: 7.70928 | lists/dev.lst-TER: 24.17 | lists/dev.lst-WER: 41.06 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 778.93
epoch: 154 | nupdates: 61908 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1131.31 | smp(ms): 6.48 | fwd(ms): 418.28 | crit-fwd(ms): 21.08 | bwd(ms): 650.27 | optim(ms): 57.23 | loss: 13.10210 | train-TER: 45.53 | train-WER: 65.00 | lists/dev.lst-loss: 7.77708 | lists/dev.lst-TER: 24.79 | lists/dev.lst-WER: 41.15 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 772.77
epoch: 155 | nupdates: 62310 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.83 | smp(ms): 6.22 | fwd(ms): 418.51 | crit-fwd(ms): 20.98 | bwd(ms): 640.07 | optim(ms): 57.22 | loss: 13.12608 | train-TER: 44.62 | train-WER: 63.28 | lists/dev.lst-loss: 7.59663 | lists/dev.lst-TER: 22.21 | lists/dev.lst-WER: 39.60 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.00
epoch: 156 | nupdates: 62712 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1130.43 | smp(ms): 6.76 | fwd(ms): 418.89 | crit-fwd(ms): 21.03 | bwd(ms): 649.43 | optim(ms): 57.24 | loss: 13.05531 | train-TER: 45.62 | train-WER: 63.95 | lists/dev.lst-loss: 7.70725 | lists/dev.lst-TER: 24.76 | lists/dev.lst-WER: 41.06 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 773.38
epoch: 157 | nupdates: 63114 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1123.45 | smp(ms): 6.78 | fwd(ms): 419.30 | crit-fwd(ms): 21.02 | bwd(ms): 642.16 | optim(ms): 57.21 | loss: 12.89740 | train-TER: 46.18 | train-WER: 64.81 | lists/dev.lst-loss: 7.59010 | lists/dev.lst-TER: 22.50 | lists/dev.lst-WER: 39.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 778.18
epoch: 158 | nupdates: 63516 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1121.07 | smp(ms): 7.00 | fwd(ms): 418.13 | crit-fwd(ms): 21.22 | bwd(ms): 640.84 | optim(ms): 57.22 | loss: 12.96884 | train-TER: 52.76 | train-WER: 71.60 | lists/dev.lst-loss: 7.63837 | lists/dev.lst-TER: 24.35 | lists/dev.lst-WER: 40.40 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 779.83
epoch: 159 | nupdates: 63918 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1121.10 | smp(ms): 7.45 | fwd(ms): 417.91 | crit-fwd(ms): 21.14 | bwd(ms): 641.20 | optim(ms): 57.22 | loss: 12.94717 | train-TER: 50.14 | train-WER: 69.38 | lists/dev.lst-loss: 7.63473 | lists/dev.lst-TER: 23.67 | lists/dev.lst-WER: 40.25 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 118 | hrs: 97.62 | thrpt(sec/sec): 779.81
epoch: 160 | nupdates: 64320 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1123.46 | smp(ms): 8.16 | fwd(ms): 419.25 | crit-fwd(ms): 21.10 | bwd(ms): 641.92 | optim(ms): 57.23 | loss: 13.01450 | train-TER: 51.79 | train-WER: 70.33 | lists/dev.lst-loss: 7.53934 | lists/dev.lst-TER: 24.36 | lists/dev.lst-WER: 40.37 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 778.17
epoch: 161 | nupdates: 64722 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:32 | bch(ms): 1125.51 | smp(ms): 6.54 | fwd(ms): 420.62 | crit-fwd(ms): 21.13 | bwd(ms): 642.59 | optim(ms): 57.21 | loss: 12.94276 | train-TER: 52.15 | train-WER: 70.01 | lists/dev.lst-loss: 7.44481 | lists/dev.lst-TER: 23.17 | lists/dev.lst-WER: 39.60 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 776.76
epoch: 162 | nupdates: 65124 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:29 | bch(ms): 1119.15 | smp(ms): 6.49 | fwd(ms): 419.42 | crit-fwd(ms): 21.15 | bwd(ms): 637.86 | optim(ms): 57.25 | loss: 12.85309 | train-TER: 48.45 | train-WER: 66.35 | lists/dev.lst-loss: 7.52816 | lists/dev.lst-TER: 22.57 | lists/dev.lst-WER: 39.24 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 781.17
epoch: 163 | nupdates: 65526 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1132.16 | smp(ms): 7.12 | fwd(ms): 418.06 | crit-fwd(ms): 21.06 | bwd(ms): 651.79 | optim(ms): 57.23 | loss: 12.88853 | train-TER: 46.10 | train-WER: 64.72 | lists/dev.lst-loss: 7.46618 | lists/dev.lst-TER: 22.31 | lists/dev.lst-WER: 39.04 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 772.20
epoch: 164 | nupdates: 65928 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1130.98 | smp(ms): 7.31 | fwd(ms): 417.12 | crit-fwd(ms): 21.17 | bwd(ms): 651.93 | optim(ms): 57.21 | loss: 12.89770 | train-TER: 49.42 | train-WER: 66.45 | lists/dev.lst-loss: 7.44288 | lists/dev.lst-TER: 23.12 | lists/dev.lst-WER: 39.54 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 773.00
epoch: 165 | nupdates: 66330 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1121.13 | smp(ms): 6.31 | fwd(ms): 418.44 | crit-fwd(ms): 21.02 | bwd(ms): 640.59 | optim(ms): 57.21 | loss: 12.82855 | train-TER: 44.71 | train-WER: 62.38 | lists/dev.lst-loss: 7.53362 | lists/dev.lst-TER: 23.73 | lists/dev.lst-WER: 39.77 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 779.79
epoch: 166 | nupdates: 66732 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1123.58 | smp(ms): 7.46 | fwd(ms): 419.10 | crit-fwd(ms): 21.07 | bwd(ms): 642.36 | optim(ms): 57.21 | loss: 12.69368 | train-TER: 50.51 | train-WER: 67.88 | lists/dev.lst-loss: 7.61495 | lists/dev.lst-TER: 24.11 | lists/dev.lst-WER: 40.03 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 778.09
epoch: 167 | nupdates: 67134 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:29 | bch(ms): 1118.02 | smp(ms): 6.36 | fwd(ms): 418.00 | crit-fwd(ms): 21.08 | bwd(ms): 638.25 | optim(ms): 57.24 | loss: 12.65514 | train-TER: 45.95 | train-WER: 63.24 | lists/dev.lst-loss: 7.33882 | lists/dev.lst-TER: 21.88 | lists/dev.lst-WER: 38.47 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.96
epoch: 168 | nupdates: 67536 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:33 | bch(ms): 1127.67 | smp(ms): 6.83 | fwd(ms): 418.23 | crit-fwd(ms): 21.08 | bwd(ms): 647.42 | optim(ms): 57.25 | loss: 12.83542 | train-TER: 44.58 | train-WER: 63.24 | lists/dev.lst-loss: 7.41125 | lists/dev.lst-TER: 22.21 | lists/dev.lst-WER: 38.56 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 775.27
epoch: 169 | nupdates: 67938 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.20 | smp(ms): 7.57 | fwd(ms): 418.63 | crit-fwd(ms): 20.93 | bwd(ms): 641.24 | optim(ms): 57.21 | loss: 12.70959 | train-TER: 47.70 | train-WER: 66.45 | lists/dev.lst-loss: 7.30663 | lists/dev.lst-TER: 21.59 | lists/dev.lst-WER: 38.34 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 779.05
epoch: 170 | nupdates: 68340 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1133.94 | smp(ms): 6.95 | fwd(ms): 419.36 | crit-fwd(ms): 21.02 | bwd(ms): 652.48 | optim(ms): 57.21 | loss: 12.56968 | train-TER: 48.72 | train-WER: 67.40 | lists/dev.lst-loss: 7.30601 | lists/dev.lst-TER: 21.41 | lists/dev.lst-WER: 38.10 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 770.99
epoch: 171 | nupdates: 68742 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1129.99 | smp(ms): 5.98 | fwd(ms): 418.80 | crit-fwd(ms): 21.00 | bwd(ms): 648.57 | optim(ms): 57.26 | loss: 12.83445 | train-TER: 47.83 | train-WER: 66.34 | lists/dev.lst-loss: 7.29749 | lists/dev.lst-TER: 21.47 | lists/dev.lst-WER: 38.04 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 773.68
epoch: 172 | nupdates: 69144 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1129.70 | smp(ms): 6.54 | fwd(ms): 417.44 | crit-fwd(ms): 20.99 | bwd(ms): 650.20 | optim(ms): 57.21 | loss: 12.52775 | train-TER: 43.22 | train-WER: 62.62 | lists/dev.lst-loss: 7.33210 | lists/dev.lst-TER: 22.74 | lists/dev.lst-WER: 38.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 773.88
epoch: 173 | nupdates: 69546 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:29 | bch(ms): 1117.31 | smp(ms): 6.84 | fwd(ms): 418.11 | crit-fwd(ms): 21.06 | bwd(ms): 637.34 | optim(ms): 57.22 | loss: 12.65324 | train-TER: 45.97 | train-WER: 63.40 | lists/dev.lst-loss: 7.28360 | lists/dev.lst-TER: 21.46 | lists/dev.lst-WER: 37.85 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 782.46
epoch: 174 | nupdates: 69948 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:35 | bch(ms): 1133.42 | smp(ms): 7.87 | fwd(ms): 419.40 | crit-fwd(ms): 21.11 | bwd(ms): 651.48 | optim(ms): 57.23 | loss: 12.54826 | train-TER: 47.45 | train-WER: 65.42 | lists/dev.lst-loss: 7.56915 | lists/dev.lst-TER: 24.63 | lists/dev.lst-WER: 40.47 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 771.33
epoch: 175 | nupdates: 70350 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:31 | bch(ms): 1122.94 | smp(ms): 6.74 | fwd(ms): 419.25 | crit-fwd(ms): 21.28 | bwd(ms): 641.94 | optim(ms): 57.24 | loss: 12.55889 | train-TER: 51.52 | train-WER: 69.10 | lists/dev.lst-loss: 7.35429 | lists/dev.lst-TER: 22.77 | lists/dev.lst-WER: 38.64 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 778.54
epoch: 176 | nupdates: 70752 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:29 | bch(ms): 1118.57 | smp(ms): 6.11 | fwd(ms): 419.06 | crit-fwd(ms): 21.06 | bwd(ms): 636.95 | optim(ms): 57.25 | loss: 12.51755 | train-TER: 48.08 | train-WER: 65.64 | lists/dev.lst-loss: 7.58862 | lists/dev.lst-TER: 25.15 | lists/dev.lst-WER: 40.62 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.58
epoch: 177 | nupdates: 71154 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1120.85 | smp(ms): 7.96 | fwd(ms): 418.59 | crit-fwd(ms): 21.19 | bwd(ms): 640.02 | optim(ms): 57.23 | loss: 12.38473 | train-TER: 46.26 | train-WER: 64.17 | lists/dev.lst-loss: 7.27269 | lists/dev.lst-TER: 22.15 | lists/dev.lst-WER: 38.23 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 779.98
epoch: 178 | nupdates: 71556 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:30 | bch(ms): 1119.99 | smp(ms): 6.47 | fwd(ms): 418.52 | crit-fwd(ms): 21.04 | bwd(ms): 639.09 | optim(ms): 57.22 | loss: 12.35725 | train-TER: 47.20 | train-WER: 65.81 | lists/dev.lst-loss: 7.11603 | lists/dev.lst-TER: 20.92 | lists/dev.lst-WER: 37.28 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.59
epoch: 179 | nupdates: 71958 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:07:34 | bch(ms): 1129.61 | smp(ms): 6.48 | fwd(ms): 417.94 | crit-fwd(ms): 21.08 | bwd(ms): 649.59 | optim(ms): 57.25 | loss: 12.20913 | train-TER: 50.72 | train-WER: 68.27 | lists/dev.lst-loss: 7.19737 | lists/dev.lst-TER: 21.30 | lists/dev.lst-WER: 37.40 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 773.94
epoch: 180 | nupdates: 72360 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:31 | bch(ms): 1122.28 | smp(ms): 7.30 | fwd(ms): 418.29 | crit-fwd(ms): 21.39 | bwd(ms): 641.99 | optim(ms): 57.21 | loss: 12.12032 | train-TER: 51.38 | train-WER: 68.51 | lists/dev.lst-loss: 7.21357 | lists/dev.lst-TER: 22.31 | lists/dev.lst-WER: 37.91 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 779.00
epoch: 181 | nupdates: 72762 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:30 | bch(ms): 1119.96 | smp(ms): 8.03 | fwd(ms): 418.35 | crit-fwd(ms): 21.09 | bwd(ms): 639.64 | optim(ms): 57.22 | loss: 12.24439 | train-TER: 54.08 | train-WER: 72.33 | lists/dev.lst-loss: 7.33857 | lists/dev.lst-TER: 22.95 | lists/dev.lst-WER: 38.40 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.61
epoch: 182 | nupdates: 73164 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1118.16 | smp(ms): 6.62 | fwd(ms): 417.44 | crit-fwd(ms): 21.18 | bwd(ms): 638.53 | optim(ms): 57.23 | loss: 12.00566 | train-TER: 42.76 | train-WER: 60.91 | lists/dev.lst-loss: 7.16530 | lists/dev.lst-TER: 22.56 | lists/dev.lst-WER: 38.09 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.86
epoch: 183 | nupdates: 73566 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1117.27 | smp(ms): 5.40 | fwd(ms): 418.21 | crit-fwd(ms): 20.97 | bwd(ms): 637.05 | optim(ms): 57.24 | loss: 12.17233 | train-TER: 47.49 | train-WER: 66.26 | lists/dev.lst-loss: 7.11299 | lists/dev.lst-TER: 21.56 | lists/dev.lst-WER: 37.37 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 782.49
epoch: 184 | nupdates: 73968 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1118.39 | smp(ms): 5.92 | fwd(ms): 419.01 | crit-fwd(ms): 21.00 | bwd(ms): 637.66 | optim(ms): 57.25 | loss: 12.02063 | train-TER: 46.95 | train-WER: 64.83 | lists/dev.lst-loss: 7.14865 | lists/dev.lst-TER: 21.92 | lists/dev.lst-WER: 37.46 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.70
epoch: 185 | nupdates: 74370 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1119.38 | smp(ms): 7.09 | fwd(ms): 418.20 | crit-fwd(ms): 21.00 | bwd(ms): 639.12 | optim(ms): 57.22 | loss: 12.04784 | train-TER: 46.15 | train-WER: 64.90 | lists/dev.lst-loss: 7.18734 | lists/dev.lst-TER: 22.26 | lists/dev.lst-WER: 37.73 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 781.01
epoch: 186 | nupdates: 74772 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1118.32 | smp(ms): 5.64 | fwd(ms): 418.47 | crit-fwd(ms): 21.13 | bwd(ms): 637.26 | optim(ms): 57.24 | loss: 11.96989 | train-TER: 48.49 | train-WER: 66.87 | lists/dev.lst-loss: 7.15873 | lists/dev.lst-TER: 21.69 | lists/dev.lst-WER: 37.14 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.75
epoch: 187 | nupdates: 75174 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:33 | bch(ms): 1127.48 | smp(ms): 4.51 | fwd(ms): 417.08 | crit-fwd(ms): 21.02 | bwd(ms): 648.04 | optim(ms): 57.28 | loss: 11.85950 | train-TER: 47.92 | train-WER: 66.06 | lists/dev.lst-loss: 7.07227 | lists/dev.lst-TER: 21.04 | lists/dev.lst-WER: 36.61 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 775.40
epoch: 188 | nupdates: 75576 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:34 | bch(ms): 1131.71 | smp(ms): 6.96 | fwd(ms): 419.13 | crit-fwd(ms): 21.10 | bwd(ms): 650.50 | optim(ms): 57.22 | loss: 12.02631 | train-TER: 44.41 | train-WER: 63.74 | lists/dev.lst-loss: 7.10498 | lists/dev.lst-TER: 21.35 | lists/dev.lst-WER: 36.84 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 772.50
epoch: 189 | nupdates: 75978 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1119.01 | smp(ms): 5.98 | fwd(ms): 418.85 | crit-fwd(ms): 21.10 | bwd(ms): 638.06 | optim(ms): 57.22 | loss: 11.90251 | train-TER: 46.85 | train-WER: 64.79 | lists/dev.lst-loss: 7.07784 | lists/dev.lst-TER: 21.86 | lists/dev.lst-WER: 37.31 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.27
epoch: 190 | nupdates: 76380 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1117.69 | smp(ms): 7.24 | fwd(ms): 417.62 | crit-fwd(ms): 21.07 | bwd(ms): 637.58 | optim(ms): 57.23 | loss: 11.90915 | train-TER: 45.61 | train-WER: 64.17 | lists/dev.lst-loss: 7.03675 | lists/dev.lst-TER: 21.47 | lists/dev.lst-WER: 36.84 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 782.19
epoch: 191 | nupdates: 76782 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1119.02 | smp(ms): 6.63 | fwd(ms): 419.15 | crit-fwd(ms): 21.14 | bwd(ms): 637.88 | optim(ms): 57.21 | loss: 11.79472 | train-TER: 46.92 | train-WER: 64.50 | lists/dev.lst-loss: 7.10484 | lists/dev.lst-TER: 21.51 | lists/dev.lst-WER: 36.88 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 118 | hrs: 97.62 | thrpt(sec/sec): 781.26
epoch: 192 | nupdates: 77184 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:30 | bch(ms): 1120.31 | smp(ms): 8.42 | fwd(ms): 417.18 | crit-fwd(ms): 21.21 | bwd(ms): 641.02 | optim(ms): 57.22 | loss: 11.80307 | train-TER: 46.62 | train-WER: 65.40 | lists/dev.lst-loss: 7.07330 | lists/dev.lst-TER: 21.57 | lists/dev.lst-WER: 37.02 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.36
epoch: 193 | nupdates: 77586 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:30 | bch(ms): 1121.22 | smp(ms): 6.69 | fwd(ms): 418.93 | crit-fwd(ms): 21.21 | bwd(ms): 640.22 | optim(ms): 57.23 | loss: 12.06413 | train-TER: 48.57 | train-WER: 66.70 | lists/dev.lst-loss: 7.03203 | lists/dev.lst-TER: 21.37 | lists/dev.lst-WER: 36.73 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 779.73
epoch: 194 | nupdates: 77988 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:30 | bch(ms): 1119.58 | smp(ms): 5.37 | fwd(ms): 418.36 | crit-fwd(ms): 21.02 | bwd(ms): 639.06 | optim(ms): 57.27 | loss: 11.67942 | train-TER: 46.09 | train-WER: 64.49 | lists/dev.lst-loss: 7.03581 | lists/dev.lst-TER: 20.56 | lists/dev.lst-WER: 36.11 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 780.87
epoch: 195 | nupdates: 78390 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:35 | bch(ms): 1132.91 | smp(ms): 6.36 | fwd(ms): 420.04 | crit-fwd(ms): 20.94 | bwd(ms): 650.78 | optim(ms): 57.24 | loss: 11.70607 | train-TER: 44.72 | train-WER: 62.43 | lists/dev.lst-loss: 7.00646 | lists/dev.lst-TER: 21.22 | lists/dev.lst-WER: 36.67 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 771.69
epoch: 196 | nupdates: 78792 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:32 | bch(ms): 1125.15 | smp(ms): 5.98 | fwd(ms): 420.07 | crit-fwd(ms): 21.16 | bwd(ms): 643.05 | optim(ms): 57.21 | loss: 11.80809 | train-TER: 46.86 | train-WER: 64.91 | lists/dev.lst-loss: 7.12295 | lists/dev.lst-TER: 21.52 | lists/dev.lst-WER: 36.71 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 777.01
epoch: 197 | nupdates: 79194 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:30 | bch(ms): 1119.63 | smp(ms): 6.19 | fwd(ms): 417.83 | crit-fwd(ms): 20.97 | bwd(ms): 639.53 | optim(ms): 57.21 | loss: 11.69644 | train-TER: 43.32 | train-WER: 61.62 | lists/dev.lst-loss: 6.96446 | lists/dev.lst-TER: 20.75 | lists/dev.lst-WER: 36.15 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.83
epoch: 198 | nupdates: 79596 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1119.16 | smp(ms): 6.39 | fwd(ms): 418.16 | crit-fwd(ms): 21.00 | bwd(ms): 638.59 | optim(ms): 57.22 | loss: 11.79784 | train-TER: 38.89 | train-WER: 56.61 | lists/dev.lst-loss: 6.97371 | lists/dev.lst-TER: 20.12 | lists/dev.lst-WER: 35.78 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 118 | hrs: 97.62 | thrpt(sec/sec): 781.16
epoch: 199 | nupdates: 79998 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:34 | bch(ms): 1131.15 | smp(ms): 4.49 | fwd(ms): 419.28 | crit-fwd(ms): 21.14 | bwd(ms): 650.09 | optim(ms): 57.24 | loss: 11.79763 | train-TER: 48.71 | train-WER: 66.80 | lists/dev.lst-loss: 6.99532 | lists/dev.lst-TER: 20.75 | lists/dev.lst-WER: 36.05 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 772.88
epoch: 200 | nupdates: 80400 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:31 | bch(ms): 1123.05 | smp(ms): 7.03 | fwd(ms): 419.44 | crit-fwd(ms): 21.00 | bwd(ms): 641.49 | optim(ms): 57.23 | loss: 11.90821 | train-TER: 37.77 | train-WER: 55.31 | lists/dev.lst-loss: 7.09134 | lists/dev.lst-TER: 21.99 | lists/dev.lst-WER: 36.92 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 778.46
epoch: 201 | nupdates: 80802 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:31 | bch(ms): 1122.10 | smp(ms): 8.10 | fwd(ms): 416.96 | crit-fwd(ms): 20.99 | bwd(ms): 643.15 | optim(ms): 57.21 | loss: 11.59235 | train-TER: 44.88 | train-WER: 62.62 | lists/dev.lst-loss: 6.95186 | lists/dev.lst-TER: 20.59 | lists/dev.lst-WER: 36.05 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 779.12
epoch: 202 | nupdates: 81204 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:28 | bch(ms): 1116.54 | smp(ms): 6.82 | fwd(ms): 417.27 | crit-fwd(ms): 21.03 | bwd(ms): 637.02 | optim(ms): 57.29 | loss: 11.71110 | train-TER: 48.04 | train-WER: 66.29 | lists/dev.lst-loss: 7.03448 | lists/dev.lst-TER: 20.88 | lists/dev.lst-WER: 36.18 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 783.00
epoch: 203 | nupdates: 81606 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1117.32 | smp(ms): 6.36 | fwd(ms): 417.40 | crit-fwd(ms): 21.09 | bwd(ms): 637.67 | optim(ms): 57.27 | loss: 11.54316 | train-TER: 41.60 | train-WER: 59.75 | lists/dev.lst-loss: 7.01641 | lists/dev.lst-TER: 20.97 | lists/dev.lst-WER: 36.23 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 782.45
epoch: 204 | nupdates: 82008 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1118.91 | smp(ms): 3.54 | fwd(ms): 418.10 | crit-fwd(ms): 20.96 | bwd(ms): 637.51 | optim(ms): 57.24 | loss: 11.44882 | train-TER: 42.26 | train-WER: 60.62 | lists/dev.lst-loss: 7.09944 | lists/dev.lst-TER: 22.50 | lists/dev.lst-WER: 37.40 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.34
epoch: 205 | nupdates: 82410 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:28 | bch(ms): 1116.35 | smp(ms): 4.79 | fwd(ms): 416.43 | crit-fwd(ms): 20.94 | bwd(ms): 637.69 | optim(ms): 57.26 | loss: 11.52040 | train-TER: 38.64 | train-WER: 58.98 | lists/dev.lst-loss: 6.98894 | lists/dev.lst-TER: 21.54 | lists/dev.lst-WER: 36.68 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 783.13
epoch: 206 | nupdates: 82812 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:30 | bch(ms): 1121.36 | smp(ms): 7.46 | fwd(ms): 419.81 | crit-fwd(ms): 21.13 | bwd(ms): 639.34 | optim(ms): 57.24 | loss: 11.45530 | train-TER: 43.13 | train-WER: 60.77 | lists/dev.lst-loss: 7.04795 | lists/dev.lst-TER: 21.64 | lists/dev.lst-WER: 36.82 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 122 | hrs: 97.62 | thrpt(sec/sec): 779.63
epoch: 207 | nupdates: 83214 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:31 | bch(ms): 1122.08 | smp(ms): 6.95 | fwd(ms): 419.82 | crit-fwd(ms): 21.27 | bwd(ms): 640.21 | optim(ms): 57.23 | loss: 11.75678 | train-TER: 47.76 | train-WER: 64.76 | lists/dev.lst-loss: 6.97346 | lists/dev.lst-TER: 20.85 | lists/dev.lst-WER: 35.99 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 779.13
epoch: 208 | nupdates: 83616 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1118.89 | smp(ms): 8.04 | fwd(ms): 417.32 | crit-fwd(ms): 21.20 | bwd(ms): 637.75 | optim(ms): 57.27 | loss: 11.60338 | train-TER: 43.14 | train-WER: 61.07 | lists/dev.lst-loss: 6.88011 | lists/dev.lst-TER: 20.62 | lists/dev.lst-WER: 35.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 781.36
epoch: 209 | nupdates: 84018 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:31 | bch(ms): 1124.03 | smp(ms): 5.33 | fwd(ms): 418.75 | crit-fwd(ms): 21.10 | bwd(ms): 642.51 | optim(ms): 57.25 | loss: 11.48685 | train-TER: 47.57 | train-WER: 65.82 | lists/dev.lst-loss: 7.02744 | lists/dev.lst-TER: 21.79 | lists/dev.lst-WER: 36.71 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 777.78
epoch: 210 | nupdates: 84420 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:30 | bch(ms): 1121.57 | smp(ms): 7.56 | fwd(ms): 418.89 | crit-fwd(ms): 21.34 | bwd(ms): 640.49 | optim(ms): 57.22 | loss: 11.59111 | train-TER: 49.94 | train-WER: 67.48 | lists/dev.lst-loss: 6.92240 | lists/dev.lst-TER: 20.96 | lists/dev.lst-WER: 35.99 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 779.48
epoch: 211 | nupdates: 84822 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:29 | bch(ms): 1118.97 | smp(ms): 6.16 | fwd(ms): 418.66 | crit-fwd(ms): 20.97 | bwd(ms): 638.47 | optim(ms): 57.24 | loss: 11.45393 | train-TER: 40.08 | train-WER: 57.28 | lists/dev.lst-loss: 6.85382 | lists/dev.lst-TER: 21.27 | lists/dev.lst-WER: 36.16 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 781.30
epoch: 212 | nupdates: 85224 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:31 | bch(ms): 1123.87 | smp(ms): 7.47 | fwd(ms): 418.89 | crit-fwd(ms): 21.27 | bwd(ms): 642.56 | optim(ms): 57.23 | loss: 11.52129 | train-TER: 48.04 | train-WER: 64.44 | lists/dev.lst-loss: 6.85867 | lists/dev.lst-TER: 20.19 | lists/dev.lst-WER: 35.43 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 777.89
epoch: 213 | nupdates: 85626 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:35 | bch(ms): 1132.40 | smp(ms): 6.40 | fwd(ms): 419.14 | crit-fwd(ms): 21.13 | bwd(ms): 651.43 | optim(ms): 57.23 | loss: 11.37089 | train-TER: 46.13 | train-WER: 64.66 | lists/dev.lst-loss: 6.84399 | lists/dev.lst-TER: 20.05 | lists/dev.lst-WER: 35.31 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 772.03
epoch: 214 | nupdates: 86028 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:37 | bch(ms): 1138.37 | smp(ms): 8.17 | fwd(ms): 419.76 | crit-fwd(ms): 21.15 | bwd(ms): 656.30 | optim(ms): 57.22 | loss: 11.55306 | train-TER: 48.10 | train-WER: 66.27 | lists/dev.lst-loss: 6.91602 | lists/dev.lst-TER: 19.99 | lists/dev.lst-WER: 35.41 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 767.98
epoch: 215 | nupdates: 86430 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:30 | bch(ms): 1120.38 | smp(ms): 6.77 | fwd(ms): 417.81 | crit-fwd(ms): 21.21 | bwd(ms): 640.56 | optim(ms): 57.22 | loss: 11.43209 | train-TER: 48.28 | train-WER: 64.79 | lists/dev.lst-loss: 6.98994 | lists/dev.lst-TER: 21.60 | lists/dev.lst-WER: 36.50 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.31
epoch: 216 | nupdates: 86832 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:30 | bch(ms): 1120.26 | smp(ms): 7.02 | fwd(ms): 418.27 | crit-fwd(ms): 20.95 | bwd(ms): 639.75 | optim(ms): 57.24 | loss: 11.50092 | train-TER: 40.00 | train-WER: 56.62 | lists/dev.lst-loss: 7.02892 | lists/dev.lst-TER: 21.76 | lists/dev.lst-WER: 36.52 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.40
epoch: 217 | nupdates: 87234 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:28 | bch(ms): 1115.78 | smp(ms): 7.42 | fwd(ms): 417.25 | crit-fwd(ms): 21.05 | bwd(ms): 636.36 | optim(ms): 57.26 | loss: 11.42197 | train-TER: 50.97 | train-WER: 68.04 | lists/dev.lst-loss: 7.06908 | lists/dev.lst-TER: 22.15 | lists/dev.lst-WER: 36.61 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 783.53
epoch: 218 | nupdates: 87636 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:30 | bch(ms): 1120.70 | smp(ms): 7.17 | fwd(ms): 418.37 | crit-fwd(ms): 21.04 | bwd(ms): 639.85 | optim(ms): 57.25 | loss: 11.40922 | train-TER: 47.70 | train-WER: 65.62 | lists/dev.lst-loss: 6.86247 | lists/dev.lst-TER: 20.82 | lists/dev.lst-WER: 35.83 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.09
epoch: 219 | nupdates: 88038 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:07:31 | bch(ms): 1124.29 | smp(ms): 8.33 | fwd(ms): 417.72 | crit-fwd(ms): 21.17 | bwd(ms): 644.72 | optim(ms): 57.21 | loss: 11.31004 | train-TER: 37.47 | train-WER: 56.57 | lists/dev.lst-loss: 6.88911 | lists/dev.lst-TER: 20.36 | lists/dev.lst-WER: 35.38 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 777.60
epoch: 220 | nupdates: 88440 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:31 | bch(ms): 1121.99 | smp(ms): 6.85 | fwd(ms): 418.45 | crit-fwd(ms): 21.01 | bwd(ms): 641.33 | optim(ms): 57.24 | loss: 11.33801 | train-TER: 41.46 | train-WER: 59.99 | lists/dev.lst-loss: 6.75162 | lists/dev.lst-TER: 19.94 | lists/dev.lst-WER: 35.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 779.20
epoch: 221 | nupdates: 88842 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:35 | bch(ms): 1134.03 | smp(ms): 6.71 | fwd(ms): 419.69 | crit-fwd(ms): 20.99 | bwd(ms): 652.11 | optim(ms): 57.23 | loss: 11.38815 | train-TER: 42.83 | train-WER: 60.08 | lists/dev.lst-loss: 6.81624 | lists/dev.lst-TER: 20.55 | lists/dev.lst-WER: 35.37 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 770.92
epoch: 222 | nupdates: 89244 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:31 | bch(ms): 1123.90 | smp(ms): 7.13 | fwd(ms): 418.55 | crit-fwd(ms): 21.05 | bwd(ms): 643.21 | optim(ms): 57.24 | loss: 11.41717 | train-TER: 43.01 | train-WER: 61.60 | lists/dev.lst-loss: 6.86301 | lists/dev.lst-TER: 21.13 | lists/dev.lst-WER: 35.67 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 777.87
epoch: 223 | nupdates: 89646 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:29 | bch(ms): 1118.42 | smp(ms): 6.04 | fwd(ms): 417.75 | crit-fwd(ms): 21.16 | bwd(ms): 638.55 | optim(ms): 57.23 | loss: 11.30616 | train-TER: 42.63 | train-WER: 61.00 | lists/dev.lst-loss: 6.79989 | lists/dev.lst-TER: 20.41 | lists/dev.lst-WER: 35.24 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 781.68
epoch: 224 | nupdates: 90048 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:27 | bch(ms): 1113.07 | smp(ms): 4.46 | fwd(ms): 418.06 | crit-fwd(ms): 21.01 | bwd(ms): 633.15 | optim(ms): 57.31 | loss: 11.35378 | train-TER: 45.34 | train-WER: 62.81 | lists/dev.lst-loss: 6.98529 | lists/dev.lst-TER: 21.46 | lists/dev.lst-WER: 35.93 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 785.44
epoch: 225 | nupdates: 90450 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:30 | bch(ms): 1120.32 | smp(ms): 7.27 | fwd(ms): 419.52 | crit-fwd(ms): 21.15 | bwd(ms): 638.87 | optim(ms): 57.23 | loss: 11.37245 | train-TER: 45.70 | train-WER: 63.60 | lists/dev.lst-loss: 6.90978 | lists/dev.lst-TER: 21.21 | lists/dev.lst-WER: 36.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.35
epoch: 226 | nupdates: 90852 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:30 | bch(ms): 1121.51 | smp(ms): 6.56 | fwd(ms): 418.06 | crit-fwd(ms): 20.99 | bwd(ms): 641.05 | optim(ms): 57.22 | loss: 11.17685 | train-TER: 45.52 | train-WER: 64.04 | lists/dev.lst-loss: 6.79407 | lists/dev.lst-TER: 20.05 | lists/dev.lst-WER: 34.89 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 779.53
epoch: 227 | nupdates: 91254 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:36 | bch(ms): 1134.82 | smp(ms): 8.27 | fwd(ms): 417.47 | crit-fwd(ms): 21.13 | bwd(ms): 654.90 | optim(ms): 57.23 | loss: 11.31527 | train-TER: 40.23 | train-WER: 57.57 | lists/dev.lst-loss: 6.76190 | lists/dev.lst-TER: 19.93 | lists/dev.lst-WER: 34.87 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 770.38
epoch: 228 | nupdates: 91656 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:35 | bch(ms): 1134.21 | smp(ms): 6.39 | fwd(ms): 419.50 | crit-fwd(ms): 21.01 | bwd(ms): 652.53 | optim(ms): 57.22 | loss: 11.28642 | train-TER: 43.90 | train-WER: 61.89 | lists/dev.lst-loss: 6.92776 | lists/dev.lst-TER: 21.05 | lists/dev.lst-WER: 35.61 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 770.80
epoch: 229 | nupdates: 92058 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:29 | bch(ms): 1118.49 | smp(ms): 4.92 | fwd(ms): 418.72 | crit-fwd(ms): 21.08 | bwd(ms): 637.59 | optim(ms): 57.27 | loss: 11.27643 | train-TER: 46.77 | train-WER: 64.95 | lists/dev.lst-loss: 6.83402 | lists/dev.lst-TER: 20.42 | lists/dev.lst-WER: 35.21 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 781.63
epoch: 230 | nupdates: 92460 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:30 | bch(ms): 1120.39 | smp(ms): 7.38 | fwd(ms): 417.09 | crit-fwd(ms): 21.14 | bwd(ms): 641.19 | optim(ms): 57.23 | loss: 11.35871 | train-TER: 42.95 | train-WER: 61.34 | lists/dev.lst-loss: 6.82054 | lists/dev.lst-TER: 20.53 | lists/dev.lst-WER: 35.19 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.31
epoch: 231 | nupdates: 92862 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:30 | bch(ms): 1120.48 | smp(ms): 7.49 | fwd(ms): 418.10 | crit-fwd(ms): 21.08 | bwd(ms): 640.24 | optim(ms): 57.24 | loss: 11.56612 | train-TER: 49.68 | train-WER: 66.69 | lists/dev.lst-loss: 6.91017 | lists/dev.lst-TER: 21.23 | lists/dev.lst-WER: 35.68 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.25
epoch: 232 | nupdates: 93264 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:31 | bch(ms): 1123.74 | smp(ms): 8.22 | fwd(ms): 418.32 | crit-fwd(ms): 21.16 | bwd(ms): 643.02 | optim(ms): 57.21 | loss: 11.34977 | train-TER: 40.18 | train-WER: 58.00 | lists/dev.lst-loss: 6.70046 | lists/dev.lst-TER: 20.08 | lists/dev.lst-WER: 34.84 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 777.98
epoch: 233 | nupdates: 93666 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:34 | bch(ms): 1131.26 | smp(ms): 7.24 | fwd(ms): 418.40 | crit-fwd(ms): 20.99 | bwd(ms): 650.61 | optim(ms): 57.22 | loss: 11.22591 | train-TER: 41.61 | train-WER: 60.07 | lists/dev.lst-loss: 6.75398 | lists/dev.lst-TER: 19.89 | lists/dev.lst-WER: 34.82 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 772.81
epoch: 234 | nupdates: 94068 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:35 | bch(ms): 1132.11 | smp(ms): 6.94 | fwd(ms): 418.88 | crit-fwd(ms): 21.11 | bwd(ms): 650.90 | optim(ms): 57.24 | loss: 11.00878 | train-TER: 42.84 | train-WER: 60.60 | lists/dev.lst-loss: 6.84965 | lists/dev.lst-TER: 20.49 | lists/dev.lst-WER: 35.04 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 772.23
epoch: 235 | nupdates: 94470 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:29 | bch(ms): 1118.91 | smp(ms): 7.42 | fwd(ms): 417.00 | crit-fwd(ms): 21.15 | bwd(ms): 639.56 | optim(ms): 57.23 | loss: 11.32189 | train-TER: 38.02 | train-WER: 56.16 | lists/dev.lst-loss: 6.81756 | lists/dev.lst-TER: 20.86 | lists/dev.lst-WER: 35.29 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 781.34
epoch: 236 | nupdates: 94872 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:31 | bch(ms): 1123.14 | smp(ms): 7.24 | fwd(ms): 419.31 | crit-fwd(ms): 21.36 | bwd(ms): 641.70 | optim(ms): 57.21 | loss: 11.12376 | train-TER: 39.15 | train-WER: 57.22 | lists/dev.lst-loss: 6.85788 | lists/dev.lst-TER: 20.71 | lists/dev.lst-WER: 35.23 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 778.40
epoch: 237 | nupdates: 95274 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:30 | bch(ms): 1120.51 | smp(ms): 5.76 | fwd(ms): 418.50 | crit-fwd(ms): 20.98 | bwd(ms): 640.05 | optim(ms): 57.20 | loss: 11.04973 | train-TER: 43.80 | train-WER: 60.77 | lists/dev.lst-loss: 6.80430 | lists/dev.lst-TER: 20.59 | lists/dev.lst-WER: 35.09 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.23
epoch: 238 | nupdates: 95676 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:28 | bch(ms): 1115.83 | smp(ms): 6.42 | fwd(ms): 417.66 | crit-fwd(ms): 20.89 | bwd(ms): 636.04 | optim(ms): 57.24 | loss: 10.98742 | train-TER: 45.40 | train-WER: 61.95 | lists/dev.lst-loss: 6.83968 | lists/dev.lst-TER: 20.04 | lists/dev.lst-WER: 34.73 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 783.50
epoch: 239 | nupdates: 96078 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:36 | bch(ms): 1135.97 | smp(ms): 6.94 | fwd(ms): 419.49 | crit-fwd(ms): 21.11 | bwd(ms): 654.20 | optim(ms): 57.22 | loss: 11.19168 | train-TER: 46.59 | train-WER: 63.54 | lists/dev.lst-loss: 6.95753 | lists/dev.lst-TER: 21.54 | lists/dev.lst-WER: 35.90 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 769.61
epoch: 240 | nupdates: 96480 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:30 | bch(ms): 1120.58 | smp(ms): 5.98 | fwd(ms): 418.13 | crit-fwd(ms): 20.89 | bwd(ms): 640.13 | optim(ms): 57.23 | loss: 11.11112 | train-TER: 45.69 | train-WER: 63.95 | lists/dev.lst-loss: 6.71408 | lists/dev.lst-TER: 19.61 | lists/dev.lst-WER: 34.54 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.18
epoch: 241 | nupdates: 96882 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:35 | bch(ms): 1132.10 | smp(ms): 7.62 | fwd(ms): 418.14 | crit-fwd(ms): 21.06 | bwd(ms): 651.71 | optim(ms): 57.24 | loss: 11.23949 | train-TER: 43.75 | train-WER: 62.11 | lists/dev.lst-loss: 6.64316 | lists/dev.lst-TER: 19.81 | lists/dev.lst-WER: 34.49 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 772.24
epoch: 242 | nupdates: 97284 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:35 | bch(ms): 1132.39 | smp(ms): 4.26 | fwd(ms): 418.71 | crit-fwd(ms): 21.32 | bwd(ms): 651.51 | optim(ms): 57.25 | loss: 11.18350 | train-TER: 42.52 | train-WER: 60.17 | lists/dev.lst-loss: 6.76315 | lists/dev.lst-TER: 20.53 | lists/dev.lst-WER: 35.04 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 772.04
epoch: 243 | nupdates: 97686 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:29 | bch(ms): 1117.32 | smp(ms): 6.08 | fwd(ms): 418.90 | crit-fwd(ms): 21.02 | bwd(ms): 636.55 | optim(ms): 57.27 | loss: 11.22291 | train-TER: 45.10 | train-WER: 62.08 | lists/dev.lst-loss: 6.80712 | lists/dev.lst-TER: 20.70 | lists/dev.lst-WER: 35.11 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 782.45
epoch: 244 | nupdates: 98088 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:30 | bch(ms): 1121.87 | smp(ms): 7.04 | fwd(ms): 418.33 | crit-fwd(ms): 21.11 | bwd(ms): 641.29 | optim(ms): 57.21 | loss: 11.18604 | train-TER: 40.21 | train-WER: 57.68 | lists/dev.lst-loss: 6.79022 | lists/dev.lst-TER: 20.35 | lists/dev.lst-WER: 34.76 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 779.28
epoch: 245 | nupdates: 98490 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:29 | bch(ms): 1119.09 | smp(ms): 6.54 | fwd(ms): 418.17 | crit-fwd(ms): 21.22 | bwd(ms): 638.78 | optim(ms): 57.24 | loss: 11.07367 | train-TER: 41.98 | train-WER: 59.97 | lists/dev.lst-loss: 6.84947 | lists/dev.lst-TER: 20.99 | lists/dev.lst-WER: 35.35 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 781.21
epoch: 246 | nupdates: 98892 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:31 | bch(ms): 1123.90 | smp(ms): 6.66 | fwd(ms): 419.24 | crit-fwd(ms): 21.00 | bwd(ms): 642.09 | optim(ms): 57.21 | loss: 11.04590 | train-TER: 45.50 | train-WER: 63.13 | lists/dev.lst-loss: 6.79369 | lists/dev.lst-TER: 20.47 | lists/dev.lst-WER: 34.95 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 777.87
epoch: 247 | nupdates: 99294 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:30 | bch(ms): 1120.00 | smp(ms): 7.35 | fwd(ms): 418.30 | crit-fwd(ms): 20.99 | bwd(ms): 639.64 | optim(ms): 57.22 | loss: 11.00134 | train-TER: 41.46 | train-WER: 59.29 | lists/dev.lst-loss: 6.85750 | lists/dev.lst-TER: 20.40 | lists/dev.lst-WER: 34.94 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.58
epoch: 248 | nupdates: 99696 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:31 | bch(ms): 1122.13 | smp(ms): 7.12 | fwd(ms): 418.69 | crit-fwd(ms): 21.17 | bwd(ms): 641.34 | optim(ms): 57.22 | loss: 11.27691 | train-TER: 43.79 | train-WER: 60.88 | lists/dev.lst-loss: 6.72764 | lists/dev.lst-TER: 19.96 | lists/dev.lst-WER: 34.58 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 779.10
epoch: 249 | nupdates: 100098 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:30 | bch(ms): 1121.45 | smp(ms): 7.58 | fwd(ms): 418.00 | crit-fwd(ms): 21.31 | bwd(ms): 641.27 | optim(ms): 57.22 | loss: 10.83702 | train-TER: 42.93 | train-WER: 60.01 | lists/dev.lst-loss: 6.83052 | lists/dev.lst-TER: 20.44 | lists/dev.lst-WER: 34.92 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 779.57
epoch: 250 | nupdates: 100500 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:31 | bch(ms): 1122.41 | smp(ms): 7.24 | fwd(ms): 417.67 | crit-fwd(ms): 21.05 | bwd(ms): 642.77 | optim(ms): 57.22 | loss: 11.11319 | train-TER: 43.88 | train-WER: 62.51 | lists/dev.lst-loss: 6.77070 | lists/dev.lst-TER: 20.47 | lists/dev.lst-WER: 34.90 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 778.90
epoch: 251 | nupdates: 100902 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:31 | bch(ms): 1122.82 | smp(ms): 7.18 | fwd(ms): 418.80 | crit-fwd(ms): 21.01 | bwd(ms): 642.03 | optim(ms): 57.21 | loss: 11.04168 | train-TER: 44.84 | train-WER: 63.76 | lists/dev.lst-loss: 6.69973 | lists/dev.lst-TER: 19.36 | lists/dev.lst-WER: 34.19 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 778.62
epoch: 252 | nupdates: 101304 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:35 | bch(ms): 1133.04 | smp(ms): 7.78 | fwd(ms): 419.10 | crit-fwd(ms): 21.38 | bwd(ms): 651.87 | optim(ms): 57.25 | loss: 11.08078 | train-TER: 44.58 | train-WER: 61.91 | lists/dev.lst-loss: 6.76998 | lists/dev.lst-TER: 19.82 | lists/dev.lst-WER: 34.39 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 771.59
epoch: 253 | nupdates: 101706 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:28 | bch(ms): 1115.26 | smp(ms): 5.35 | fwd(ms): 417.59 | crit-fwd(ms): 21.01 | bwd(ms): 635.27 | optim(ms): 57.26 | loss: 11.24814 | train-TER: 38.11 | train-WER: 56.34 | lists/dev.lst-loss: 6.78449 | lists/dev.lst-TER: 20.79 | lists/dev.lst-WER: 35.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 783.90
epoch: 254 | nupdates: 102108 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:28 | bch(ms): 1115.00 | smp(ms): 6.07 | fwd(ms): 417.59 | crit-fwd(ms): 21.08 | bwd(ms): 635.41 | optim(ms): 57.24 | loss: 11.06087 | train-TER: 41.26 | train-WER: 59.08 | lists/dev.lst-loss: 6.90967 | lists/dev.lst-TER: 21.13 | lists/dev.lst-WER: 35.64 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 784.08
epoch: 255 | nupdates: 102510 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:29 | bch(ms): 1118.92 | smp(ms): 5.45 | fwd(ms): 419.11 | crit-fwd(ms): 20.99 | bwd(ms): 637.59 | optim(ms): 57.28 | loss: 11.10428 | train-TER: 42.38 | train-WER: 60.94 | lists/dev.lst-loss: 6.83471 | lists/dev.lst-TER: 20.47 | lists/dev.lst-WER: 34.83 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 781.34
epoch: 256 | nupdates: 102912 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:30 | bch(ms): 1119.90 | smp(ms): 5.78 | fwd(ms): 418.65 | crit-fwd(ms): 20.97 | bwd(ms): 639.20 | optim(ms): 57.24 | loss: 11.01318 | train-TER: 48.53 | train-WER: 67.12 | lists/dev.lst-loss: 6.69787 | lists/dev.lst-TER: 19.96 | lists/dev.lst-WER: 34.38 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.65
epoch: 257 | nupdates: 103314 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:32 | bch(ms): 1124.40 | smp(ms): 7.39 | fwd(ms): 418.11 | crit-fwd(ms): 21.08 | bwd(ms): 643.84 | optim(ms): 57.19 | loss: 11.09951 | train-TER: 42.85 | train-WER: 60.55 | lists/dev.lst-loss: 6.75729 | lists/dev.lst-TER: 20.51 | lists/dev.lst-WER: 34.79 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 777.53
epoch: 258 | nupdates: 103716 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:31 | bch(ms): 1123.63 | smp(ms): 7.41 | fwd(ms): 419.20 | crit-fwd(ms): 21.06 | bwd(ms): 642.51 | optim(ms): 57.22 | loss: 11.07322 | train-TER: 39.44 | train-WER: 57.80 | lists/dev.lst-loss: 6.73136 | lists/dev.lst-TER: 20.08 | lists/dev.lst-WER: 34.62 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 778.06
epoch: 259 | nupdates: 104118 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:07:30 | bch(ms): 1119.56 | smp(ms): 4.98 | fwd(ms): 418.44 | crit-fwd(ms): 20.80 | bwd(ms): 638.01 | optim(ms): 57.23 | loss: 11.11710 | train-TER: 37.77 | train-WER: 55.48 | lists/dev.lst-loss: 6.74001 | lists/dev.lst-TER: 20.68 | lists/dev.lst-WER: 35.07 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.88
epoch: 260 | nupdates: 104520 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1121.68 | smp(ms): 6.34 | fwd(ms): 419.24 | crit-fwd(ms): 21.05 | bwd(ms): 640.53 | optim(ms): 57.22 | loss: 11.03792 | train-TER: 45.23 | train-WER: 63.77 | lists/dev.lst-loss: 6.85008 | lists/dev.lst-TER: 20.61 | lists/dev.lst-WER: 34.95 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 118 | hrs: 97.62 | thrpt(sec/sec): 779.41
epoch: 261 | nupdates: 104922 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1120.75 | smp(ms): 6.28 | fwd(ms): 419.29 | crit-fwd(ms): 21.34 | bwd(ms): 639.37 | optim(ms): 57.24 | loss: 10.83485 | train-TER: 41.45 | train-WER: 59.86 | lists/dev.lst-loss: 6.70959 | lists/dev.lst-TER: 20.10 | lists/dev.lst-WER: 34.57 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.05
epoch: 262 | nupdates: 105324 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:29 | bch(ms): 1118.72 | smp(ms): 5.99 | fwd(ms): 417.15 | crit-fwd(ms): 20.94 | bwd(ms): 639.49 | optim(ms): 57.22 | loss: 11.04013 | train-TER: 49.24 | train-WER: 67.48 | lists/dev.lst-loss: 6.66456 | lists/dev.lst-TER: 20.04 | lists/dev.lst-WER: 34.44 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 781.47
epoch: 263 | nupdates: 105726 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1120.00 | smp(ms): 6.30 | fwd(ms): 419.03 | crit-fwd(ms): 21.12 | bwd(ms): 638.98 | optim(ms): 57.24 | loss: 10.96142 | train-TER: 43.78 | train-WER: 61.61 | lists/dev.lst-loss: 6.72319 | lists/dev.lst-TER: 20.19 | lists/dev.lst-WER: 34.60 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.58
epoch: 264 | nupdates: 106128 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:29 | bch(ms): 1119.28 | smp(ms): 8.23 | fwd(ms): 418.56 | crit-fwd(ms): 21.09 | bwd(ms): 638.49 | optim(ms): 57.26 | loss: 11.09634 | train-TER: 40.15 | train-WER: 57.50 | lists/dev.lst-loss: 6.70202 | lists/dev.lst-TER: 20.06 | lists/dev.lst-WER: 34.53 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 781.08
epoch: 265 | nupdates: 106530 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1121.43 | smp(ms): 6.62 | fwd(ms): 419.79 | crit-fwd(ms): 21.00 | bwd(ms): 639.61 | optim(ms): 57.23 | loss: 11.13880 | train-TER: 45.62 | train-WER: 63.36 | lists/dev.lst-loss: 6.71379 | lists/dev.lst-TER: 19.85 | lists/dev.lst-WER: 34.32 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 779.58
epoch: 266 | nupdates: 106932 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:32 | bch(ms): 1124.40 | smp(ms): 6.82 | fwd(ms): 418.56 | crit-fwd(ms): 20.97 | bwd(ms): 643.30 | optim(ms): 57.22 | loss: 10.88673 | train-TER: 42.52 | train-WER: 61.18 | lists/dev.lst-loss: 6.65110 | lists/dev.lst-TER: 19.89 | lists/dev.lst-WER: 34.37 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 777.52
epoch: 267 | nupdates: 107334 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:31 | bch(ms): 1123.42 | smp(ms): 6.28 | fwd(ms): 421.13 | crit-fwd(ms): 21.31 | bwd(ms): 640.06 | optim(ms): 57.23 | loss: 10.95675 | train-TER: 39.80 | train-WER: 58.01 | lists/dev.lst-loss: 6.72858 | lists/dev.lst-TER: 20.40 | lists/dev.lst-WER: 34.68 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 778.20
epoch: 268 | nupdates: 107736 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:31 | bch(ms): 1124.18 | smp(ms): 8.59 | fwd(ms): 419.11 | crit-fwd(ms): 21.19 | bwd(ms): 642.87 | optim(ms): 57.23 | loss: 11.17714 | train-TER: 48.56 | train-WER: 66.28 | lists/dev.lst-loss: 6.67676 | lists/dev.lst-TER: 20.03 | lists/dev.lst-WER: 34.48 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 777.68
epoch: 269 | nupdates: 108138 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1119.81 | smp(ms): 6.28 | fwd(ms): 420.07 | crit-fwd(ms): 21.05 | bwd(ms): 637.69 | optim(ms): 57.25 | loss: 10.78095 | train-TER: 47.56 | train-WER: 66.00 | lists/dev.lst-loss: 6.71272 | lists/dev.lst-TER: 20.10 | lists/dev.lst-WER: 34.53 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.71
epoch: 270 | nupdates: 108540 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:28 | bch(ms): 1116.39 | smp(ms): 6.95 | fwd(ms): 417.47 | crit-fwd(ms): 21.09 | bwd(ms): 636.94 | optim(ms): 57.24 | loss: 11.03590 | train-TER: 46.37 | train-WER: 64.37 | lists/dev.lst-loss: 6.73831 | lists/dev.lst-TER: 20.14 | lists/dev.lst-WER: 34.44 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 783.10
epoch: 271 | nupdates: 108942 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1121.00 | smp(ms): 6.99 | fwd(ms): 418.83 | crit-fwd(ms): 21.24 | bwd(ms): 639.76 | optim(ms): 57.28 | loss: 10.93185 | train-TER: 45.13 | train-WER: 63.25 | lists/dev.lst-loss: 6.76600 | lists/dev.lst-TER: 20.28 | lists/dev.lst-WER: 34.57 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 779.88
epoch: 272 | nupdates: 109344 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:31 | bch(ms): 1122.13 | smp(ms): 7.83 | fwd(ms): 417.76 | crit-fwd(ms): 21.00 | bwd(ms): 642.48 | optim(ms): 57.23 | loss: 10.85380 | train-TER: 41.66 | train-WER: 60.17 | lists/dev.lst-loss: 6.65032 | lists/dev.lst-TER: 19.56 | lists/dev.lst-WER: 34.06 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 779.10
epoch: 273 | nupdates: 109746 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:34 | bch(ms): 1131.82 | smp(ms): 5.96 | fwd(ms): 418.44 | crit-fwd(ms): 20.95 | bwd(ms): 651.34 | optim(ms): 57.24 | loss: 10.94733 | train-TER: 45.17 | train-WER: 62.96 | lists/dev.lst-loss: 6.74055 | lists/dev.lst-TER: 20.05 | lists/dev.lst-WER: 34.41 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 772.42
epoch: 274 | nupdates: 110148 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1120.80 | smp(ms): 7.06 | fwd(ms): 417.97 | crit-fwd(ms): 21.06 | bwd(ms): 640.52 | optim(ms): 57.24 | loss: 11.00493 | train-TER: 49.53 | train-WER: 66.56 | lists/dev.lst-loss: 6.74047 | lists/dev.lst-TER: 19.95 | lists/dev.lst-WER: 34.32 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.02
epoch: 275 | nupdates: 110550 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:32 | bch(ms): 1125.21 | smp(ms): 6.50 | fwd(ms): 419.94 | crit-fwd(ms): 21.05 | bwd(ms): 643.25 | optim(ms): 57.22 | loss: 10.80539 | train-TER: 43.48 | train-WER: 61.44 | lists/dev.lst-loss: 6.75868 | lists/dev.lst-TER: 20.36 | lists/dev.lst-WER: 34.69 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 776.96
epoch: 276 | nupdates: 110952 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:29 | bch(ms): 1118.59 | smp(ms): 8.57 | fwd(ms): 418.32 | crit-fwd(ms): 21.04 | bwd(ms): 638.16 | optim(ms): 57.21 | loss: 11.12784 | train-TER: 42.98 | train-WER: 60.52 | lists/dev.lst-loss: 6.71512 | lists/dev.lst-TER: 20.46 | lists/dev.lst-WER: 34.68 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 781.56
epoch: 277 | nupdates: 111354 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1119.59 | smp(ms): 6.90 | fwd(ms): 417.83 | crit-fwd(ms): 21.05 | bwd(ms): 639.44 | optim(ms): 57.21 | loss: 10.87850 | train-TER: 41.97 | train-WER: 60.31 | lists/dev.lst-loss: 6.68581 | lists/dev.lst-TER: 19.65 | lists/dev.lst-WER: 34.08 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.87
epoch: 278 | nupdates: 111756 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:31 | bch(ms): 1121.92 | smp(ms): 7.11 | fwd(ms): 418.23 | crit-fwd(ms): 21.00 | bwd(ms): 641.45 | optim(ms): 57.21 | loss: 11.03103 | train-TER: 51.17 | train-WER: 68.92 | lists/dev.lst-loss: 6.74854 | lists/dev.lst-TER: 19.91 | lists/dev.lst-WER: 34.30 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 779.24
epoch: 279 | nupdates: 112158 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:29 | bch(ms): 1118.44 | smp(ms): 7.12 | fwd(ms): 417.95 | crit-fwd(ms): 20.96 | bwd(ms): 638.54 | optim(ms): 57.26 | loss: 10.86679 | train-TER: 42.17 | train-WER: 60.41 | lists/dev.lst-loss: 6.67381 | lists/dev.lst-TER: 19.68 | lists/dev.lst-WER: 34.11 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 781.67
epoch: 280 | nupdates: 112560 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:29 | bch(ms): 1117.98 | smp(ms): 6.25 | fwd(ms): 418.75 | crit-fwd(ms): 21.21 | bwd(ms): 637.21 | optim(ms): 57.25 | loss: 11.15947 | train-TER: 44.50 | train-WER: 63.00 | lists/dev.lst-loss: 6.68154 | lists/dev.lst-TER: 19.84 | lists/dev.lst-WER: 34.22 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.99
epoch: 281 | nupdates: 112962 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1120.49 | smp(ms): 4.78 | fwd(ms): 419.11 | crit-fwd(ms): 20.95 | bwd(ms): 638.88 | optim(ms): 57.23 | loss: 10.88759 | train-TER: 42.82 | train-WER: 59.89 | lists/dev.lst-loss: 6.73656 | lists/dev.lst-TER: 20.24 | lists/dev.lst-WER: 34.40 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.24
epoch: 282 | nupdates: 113364 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:31 | bch(ms): 1123.92 | smp(ms): 6.08 | fwd(ms): 419.17 | crit-fwd(ms): 21.08 | bwd(ms): 642.55 | optim(ms): 57.23 | loss: 10.83481 | train-TER: 36.57 | train-WER: 53.01 | lists/dev.lst-loss: 6.68294 | lists/dev.lst-TER: 20.16 | lists/dev.lst-WER: 34.37 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 777.86
epoch: 283 | nupdates: 113766 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:29 | bch(ms): 1118.65 | smp(ms): 7.74 | fwd(ms): 417.82 | crit-fwd(ms): 21.46 | bwd(ms): 638.43 | optim(ms): 57.23 | loss: 10.79162 | train-TER: 42.49 | train-WER: 60.67 | lists/dev.lst-loss: 6.64335 | lists/dev.lst-TER: 19.98 | lists/dev.lst-WER: 34.25 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 781.52
epoch: 284 | nupdates: 114168 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:29 | bch(ms): 1118.74 | smp(ms): 6.28 | fwd(ms): 418.41 | crit-fwd(ms): 21.20 | bwd(ms): 638.25 | optim(ms): 57.24 | loss: 11.00945 | train-TER: 41.27 | train-WER: 59.70 | lists/dev.lst-loss: 6.71452 | lists/dev.lst-TER: 19.82 | lists/dev.lst-WER: 34.16 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.46
epoch: 285 | nupdates: 114570 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1120.92 | smp(ms): 8.06 | fwd(ms): 417.63 | crit-fwd(ms): 20.98 | bwd(ms): 640.99 | optim(ms): 57.26 | loss: 10.71856 | train-TER: 38.88 | train-WER: 56.04 | lists/dev.lst-loss: 6.69798 | lists/dev.lst-TER: 20.33 | lists/dev.lst-WER: 34.56 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 779.94
epoch: 286 | nupdates: 114972 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:31 | bch(ms): 1123.79 | smp(ms): 6.23 | fwd(ms): 420.08 | crit-fwd(ms): 21.22 | bwd(ms): 641.90 | optim(ms): 57.22 | loss: 10.65459 | train-TER: 34.91 | train-WER: 53.93 | lists/dev.lst-loss: 6.71353 | lists/dev.lst-TER: 20.19 | lists/dev.lst-WER: 34.47 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 777.95
epoch: 287 | nupdates: 115374 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1120.05 | smp(ms): 7.07 | fwd(ms): 417.90 | crit-fwd(ms): 21.16 | bwd(ms): 640.21 | optim(ms): 57.23 | loss: 10.84945 | train-TER: 40.57 | train-WER: 58.15 | lists/dev.lst-loss: 6.72145 | lists/dev.lst-TER: 20.18 | lists/dev.lst-WER: 34.44 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.54
epoch: 288 | nupdates: 115776 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:31 | bch(ms): 1123.59 | smp(ms): 7.89 | fwd(ms): 419.67 | crit-fwd(ms): 21.07 | bwd(ms): 641.55 | optim(ms): 57.25 | loss: 10.99489 | train-TER: 44.54 | train-WER: 63.27 | lists/dev.lst-loss: 6.75089 | lists/dev.lst-TER: 20.29 | lists/dev.lst-WER: 34.47 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 778.09
epoch: 289 | nupdates: 116178 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:28 | bch(ms): 1115.77 | smp(ms): 6.60 | fwd(ms): 417.77 | crit-fwd(ms): 21.13 | bwd(ms): 635.72 | optim(ms): 57.25 | loss: 10.75101 | train-TER: 47.20 | train-WER: 65.20 | lists/dev.lst-loss: 6.71355 | lists/dev.lst-TER: 19.99 | lists/dev.lst-WER: 34.26 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 783.54
epoch: 290 | nupdates: 116580 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:28 | bch(ms): 1116.17 | smp(ms): 5.01 | fwd(ms): 417.35 | crit-fwd(ms): 21.22 | bwd(ms): 636.82 | optim(ms): 57.31 | loss: 10.87084 | train-TER: 42.11 | train-WER: 61.14 | lists/dev.lst-loss: 6.62369 | lists/dev.lst-TER: 19.82 | lists/dev.lst-WER: 34.05 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 783.26
epoch: 291 | nupdates: 116982 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:35 | bch(ms): 1133.74 | smp(ms): 6.64 | fwd(ms): 420.00 | crit-fwd(ms): 21.20 | bwd(ms): 651.73 | optim(ms): 57.22 | loss: 10.79659 | train-TER: 43.60 | train-WER: 61.68 | lists/dev.lst-loss: 6.74688 | lists/dev.lst-TER: 20.03 | lists/dev.lst-WER: 34.39 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 771.12
epoch: 292 | nupdates: 117384 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:31 | bch(ms): 1121.99 | smp(ms): 7.09 | fwd(ms): 418.69 | crit-fwd(ms): 21.24 | bwd(ms): 639.50 | optim(ms): 57.25 | loss: 11.02203 | train-TER: 45.46 | train-WER: 62.18 | lists/dev.lst-loss: 6.72946 | lists/dev.lst-TER: 19.99 | lists/dev.lst-WER: 34.24 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 779.20
epoch: 293 | nupdates: 117786 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1119.59 | smp(ms): 5.23 | fwd(ms): 419.82 | crit-fwd(ms): 20.98 | bwd(ms): 637.83 | optim(ms): 57.24 | loss: 10.71788 | train-TER: 45.93 | train-WER: 62.56 | lists/dev.lst-loss: 6.67587 | lists/dev.lst-TER: 19.74 | lists/dev.lst-WER: 34.05 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.86
epoch: 294 | nupdates: 118188 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:34 | bch(ms): 1131.09 | smp(ms): 6.03 | fwd(ms): 418.64 | crit-fwd(ms): 21.14 | bwd(ms): 650.45 | optim(ms): 57.29 | loss: 10.81870 | train-TER: 42.28 | train-WER: 60.43 | lists/dev.lst-loss: 6.71912 | lists/dev.lst-TER: 20.19 | lists/dev.lst-WER: 34.37 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 772.92
epoch: 295 | nupdates: 118590 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:30 | bch(ms): 1121.12 | smp(ms): 5.62 | fwd(ms): 418.59 | crit-fwd(ms): 20.94 | bwd(ms): 639.79 | optim(ms): 57.21 | loss: 10.74011 | train-TER: 33.24 | train-WER: 50.45 | lists/dev.lst-loss: 6.68437 | lists/dev.lst-TER: 20.42 | lists/dev.lst-WER: 34.58 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 779.80
epoch: 296 | nupdates: 118992 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:31 | bch(ms): 1122.63 | smp(ms): 6.35 | fwd(ms): 419.74 | crit-fwd(ms): 21.44 | bwd(ms): 640.33 | optim(ms): 57.22 | loss: 10.97935 | train-TER: 40.88 | train-WER: 58.69 | lists/dev.lst-loss: 6.69050 | lists/dev.lst-TER: 20.36 | lists/dev.lst-WER: 34.54 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 118 | hrs: 97.62 | thrpt(sec/sec): 778.75
epoch: 297 | nupdates: 119394 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:31 | bch(ms): 1122.56 | smp(ms): 6.09 | fwd(ms): 419.98 | crit-fwd(ms): 21.03 | bwd(ms): 640.21 | optim(ms): 57.23 | loss: 10.78796 | train-TER: 39.46 | train-WER: 56.49 | lists/dev.lst-loss: 6.62739 | lists/dev.lst-TER: 19.48 | lists/dev.lst-WER: 33.75 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 778.80
epoch: 298 | nupdates: 119796 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:34 | bch(ms): 1130.05 | smp(ms): 5.78 | fwd(ms): 417.43 | crit-fwd(ms): 21.06 | bwd(ms): 650.62 | optim(ms): 57.25 | loss: 10.89956 | train-TER: 41.28 | train-WER: 59.25 | lists/dev.lst-loss: 6.69034 | lists/dev.lst-TER: 19.87 | lists/dev.lst-WER: 34.14 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 118 | hrs: 97.62 | thrpt(sec/sec): 773.64
epoch: 299 | nupdates: 120198 | lr: 0.050000 | lrcriterion: 0.050000 | runtime: 00:07:31 | bch(ms): 1122.57 | smp(ms): 7.73 | fwd(ms): 418.21 | crit-fwd(ms): 21.10 | bwd(ms): 642.34 | optim(ms): 57.23 | loss: 10.77005 | train-TER: 39.67 | train-WER: 56.60 | lists/dev.lst-loss: 6.67104 | lists/dev.lst-TER: 20.02 | lists/dev.lst-WER: 34.18 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 778.79
epoch: 300 | nupdates: 120600 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1120.34 | smp(ms): 6.57 | fwd(ms): 417.52 | crit-fwd(ms): 20.98 | bwd(ms): 640.47 | optim(ms): 57.22 | loss: 10.81043 | train-TER: 32.92 | train-WER: 50.34 | lists/dev.lst-loss: 6.65966 | lists/dev.lst-TER: 19.93 | lists/dev.lst-WER: 34.11 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.34
epoch: 301 | nupdates: 121002 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:32 | bch(ms): 1124.99 | smp(ms): 8.63 | fwd(ms): 418.01 | crit-fwd(ms): 21.24 | bwd(ms): 644.50 | optim(ms): 57.20 | loss: 10.77536 | train-TER: 40.79 | train-WER: 59.21 | lists/dev.lst-loss: 6.66066 | lists/dev.lst-TER: 19.78 | lists/dev.lst-WER: 34.04 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 777.12
epoch: 302 | nupdates: 121404 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1119.83 | smp(ms): 6.81 | fwd(ms): 418.93 | crit-fwd(ms): 21.06 | bwd(ms): 638.90 | optim(ms): 57.25 | loss: 10.70175 | train-TER: 39.35 | train-WER: 57.08 | lists/dev.lst-loss: 6.77147 | lists/dev.lst-TER: 20.12 | lists/dev.lst-WER: 34.33 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.69
epoch: 303 | nupdates: 121806 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:31 | bch(ms): 1122.50 | smp(ms): 7.28 | fwd(ms): 417.64 | crit-fwd(ms): 21.13 | bwd(ms): 642.63 | optim(ms): 57.23 | loss: 10.68096 | train-TER: 43.08 | train-WER: 60.83 | lists/dev.lst-loss: 6.63917 | lists/dev.lst-TER: 19.94 | lists/dev.lst-WER: 34.14 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 778.84
epoch: 304 | nupdates: 122208 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:32 | bch(ms): 1125.04 | smp(ms): 8.38 | fwd(ms): 419.41 | crit-fwd(ms): 20.99 | bwd(ms): 643.42 | optim(ms): 57.22 | loss: 10.79036 | train-TER: 41.55 | train-WER: 59.67 | lists/dev.lst-loss: 6.69519 | lists/dev.lst-TER: 19.95 | lists/dev.lst-WER: 34.19 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 777.09
epoch: 305 | nupdates: 122610 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:31 | bch(ms): 1122.74 | smp(ms): 8.37 | fwd(ms): 417.39 | crit-fwd(ms): 21.45 | bwd(ms): 642.71 | optim(ms): 57.24 | loss: 10.74811 | train-TER: 43.41 | train-WER: 62.10 | lists/dev.lst-loss: 6.68067 | lists/dev.lst-TER: 19.86 | lists/dev.lst-WER: 34.04 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 778.67
epoch: 306 | nupdates: 123012 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1121.50 | smp(ms): 7.21 | fwd(ms): 418.78 | crit-fwd(ms): 20.91 | bwd(ms): 640.54 | optim(ms): 57.23 | loss: 10.82780 | train-TER: 39.32 | train-WER: 56.80 | lists/dev.lst-loss: 6.68922 | lists/dev.lst-TER: 19.96 | lists/dev.lst-WER: 34.10 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 779.53
epoch: 307 | nupdates: 123414 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1121.33 | smp(ms): 5.98 | fwd(ms): 418.25 | crit-fwd(ms): 21.02 | bwd(ms): 640.78 | optim(ms): 57.23 | loss: 10.77024 | train-TER: 42.98 | train-WER: 60.80 | lists/dev.lst-loss: 6.69091 | lists/dev.lst-TER: 19.76 | lists/dev.lst-WER: 34.01 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 779.65
epoch: 308 | nupdates: 123816 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:31 | bch(ms): 1123.24 | smp(ms): 7.75 | fwd(ms): 418.50 | crit-fwd(ms): 21.28 | bwd(ms): 642.70 | optim(ms): 57.22 | loss: 10.79831 | train-TER: 47.42 | train-WER: 65.42 | lists/dev.lst-loss: 6.73109 | lists/dev.lst-TER: 20.12 | lists/dev.lst-WER: 34.32 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 778.33
epoch: 309 | nupdates: 124218 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1121.42 | smp(ms): 6.56 | fwd(ms): 418.40 | crit-fwd(ms): 21.13 | bwd(ms): 641.11 | optim(ms): 57.22 | loss: 10.83720 | train-TER: 47.26 | train-WER: 64.28 | lists/dev.lst-loss: 6.59614 | lists/dev.lst-TER: 19.55 | lists/dev.lst-WER: 33.85 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 779.59
epoch: 310 | nupdates: 124620 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:32 | bch(ms): 1124.64 | smp(ms): 6.50 | fwd(ms): 418.93 | crit-fwd(ms): 21.01 | bwd(ms): 643.30 | optim(ms): 57.22 | loss: 10.66964 | train-TER: 45.04 | train-WER: 61.98 | lists/dev.lst-loss: 6.65539 | lists/dev.lst-TER: 19.75 | lists/dev.lst-WER: 33.97 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 777.36
epoch: 311 | nupdates: 125022 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:31 | bch(ms): 1122.89 | smp(ms): 7.20 | fwd(ms): 419.49 | crit-fwd(ms): 21.05 | bwd(ms): 641.41 | optim(ms): 57.23 | loss: 10.77329 | train-TER: 44.26 | train-WER: 61.64 | lists/dev.lst-loss: 6.66448 | lists/dev.lst-TER: 20.25 | lists/dev.lst-WER: 34.39 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 778.57
epoch: 312 | nupdates: 125424 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1121.31 | smp(ms): 8.00 | fwd(ms): 417.83 | crit-fwd(ms): 21.16 | bwd(ms): 641.28 | optim(ms): 57.24 | loss: 10.75939 | train-TER: 36.91 | train-WER: 54.57 | lists/dev.lst-loss: 6.65007 | lists/dev.lst-TER: 19.75 | lists/dev.lst-WER: 33.99 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 779.66
epoch: 313 | nupdates: 125826 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1120.29 | smp(ms): 8.35 | fwd(ms): 418.65 | crit-fwd(ms): 21.17 | bwd(ms): 639.55 | optim(ms): 57.23 | loss: 10.73199 | train-TER: 42.92 | train-WER: 60.65 | lists/dev.lst-loss: 6.68610 | lists/dev.lst-TER: 19.93 | lists/dev.lst-WER: 34.14 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.38
epoch: 314 | nupdates: 126228 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:32 | bch(ms): 1124.67 | smp(ms): 5.97 | fwd(ms): 419.82 | crit-fwd(ms): 20.91 | bwd(ms): 642.55 | optim(ms): 57.22 | loss: 10.88882 | train-TER: 43.85 | train-WER: 61.34 | lists/dev.lst-loss: 6.73855 | lists/dev.lst-TER: 19.95 | lists/dev.lst-WER: 34.07 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 777.34
epoch: 315 | nupdates: 126630 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1120.69 | smp(ms): 6.35 | fwd(ms): 418.62 | crit-fwd(ms): 21.18 | bwd(ms): 639.94 | optim(ms): 57.22 | loss: 10.61482 | train-TER: 37.20 | train-WER: 55.39 | lists/dev.lst-loss: 6.70637 | lists/dev.lst-TER: 19.56 | lists/dev.lst-WER: 33.85 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.10
epoch: 316 | nupdates: 127032 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:29 | bch(ms): 1118.74 | smp(ms): 7.50 | fwd(ms): 417.94 | crit-fwd(ms): 21.16 | bwd(ms): 638.72 | optim(ms): 57.25 | loss: 10.90136 | train-TER: 42.60 | train-WER: 61.17 | lists/dev.lst-loss: 6.65119 | lists/dev.lst-TER: 19.82 | lists/dev.lst-WER: 34.01 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.46
epoch: 317 | nupdates: 127434 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1120.30 | smp(ms): 6.25 | fwd(ms): 418.80 | crit-fwd(ms): 21.12 | bwd(ms): 639.20 | optim(ms): 57.24 | loss: 10.88599 | train-TER: 40.91 | train-WER: 59.08 | lists/dev.lst-loss: 6.73520 | lists/dev.lst-TER: 19.86 | lists/dev.lst-WER: 34.06 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.37
epoch: 318 | nupdates: 127836 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1119.89 | smp(ms): 8.39 | fwd(ms): 417.60 | crit-fwd(ms): 21.16 | bwd(ms): 640.08 | optim(ms): 57.27 | loss: 10.65374 | train-TER: 37.64 | train-WER: 55.30 | lists/dev.lst-loss: 6.62736 | lists/dev.lst-TER: 19.48 | lists/dev.lst-WER: 33.75 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.66
epoch: 319 | nupdates: 128238 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:35 | bch(ms): 1132.73 | smp(ms): 7.64 | fwd(ms): 417.82 | crit-fwd(ms): 21.12 | bwd(ms): 653.03 | optim(ms): 57.24 | loss: 10.60002 | train-TER: 41.01 | train-WER: 58.90 | lists/dev.lst-loss: 6.71207 | lists/dev.lst-TER: 19.66 | lists/dev.lst-WER: 33.92 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 771.81
epoch: 320 | nupdates: 128640 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:31 | bch(ms): 1124.00 | smp(ms): 7.56 | fwd(ms): 419.28 | crit-fwd(ms): 21.06 | bwd(ms): 642.56 | optim(ms): 57.25 | loss: 10.76944 | train-TER: 46.30 | train-WER: 63.90 | lists/dev.lst-loss: 6.69706 | lists/dev.lst-TER: 19.84 | lists/dev.lst-WER: 33.99 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 777.80
epoch: 321 | nupdates: 129042 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:29 | bch(ms): 1118.98 | smp(ms): 5.75 | fwd(ms): 419.26 | crit-fwd(ms): 21.06 | bwd(ms): 637.64 | optim(ms): 57.25 | loss: 10.73401 | train-TER: 53.35 | train-WER: 70.94 | lists/dev.lst-loss: 6.66058 | lists/dev.lst-TER: 19.50 | lists/dev.lst-WER: 33.79 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 781.29
epoch: 322 | nupdates: 129444 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:31 | bch(ms): 1122.78 | smp(ms): 6.89 | fwd(ms): 418.60 | crit-fwd(ms): 21.12 | bwd(ms): 641.97 | optim(ms): 57.23 | loss: 10.62311 | train-TER: 38.92 | train-WER: 57.53 | lists/dev.lst-loss: 6.66115 | lists/dev.lst-TER: 19.57 | lists/dev.lst-WER: 33.85 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 778.65
epoch: 323 | nupdates: 129846 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1119.84 | smp(ms): 5.79 | fwd(ms): 417.97 | crit-fwd(ms): 21.07 | bwd(ms): 639.58 | optim(ms): 57.21 | loss: 10.70284 | train-TER: 46.31 | train-WER: 64.30 | lists/dev.lst-loss: 6.67914 | lists/dev.lst-TER: 19.77 | lists/dev.lst-WER: 33.91 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.69
epoch: 324 | nupdates: 130248 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1121.68 | smp(ms): 6.62 | fwd(ms): 420.21 | crit-fwd(ms): 21.11 | bwd(ms): 639.13 | optim(ms): 57.23 | loss: 10.76655 | train-TER: 39.30 | train-WER: 57.20 | lists/dev.lst-loss: 6.65189 | lists/dev.lst-TER: 19.78 | lists/dev.lst-WER: 33.94 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 779.41
epoch: 325 | nupdates: 130650 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:29 | bch(ms): 1118.14 | smp(ms): 7.86 | fwd(ms): 416.98 | crit-fwd(ms): 21.08 | bwd(ms): 638.64 | optim(ms): 57.25 | loss: 10.88024 | train-TER: 44.67 | train-WER: 62.40 | lists/dev.lst-loss: 6.69408 | lists/dev.lst-TER: 19.90 | lists/dev.lst-WER: 34.03 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.88
epoch: 326 | nupdates: 131052 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:31 | bch(ms): 1123.36 | smp(ms): 8.33 | fwd(ms): 418.92 | crit-fwd(ms): 21.02 | bwd(ms): 642.17 | optim(ms): 57.22 | loss: 10.78969 | train-TER: 46.04 | train-WER: 63.21 | lists/dev.lst-loss: 6.67542 | lists/dev.lst-TER: 19.99 | lists/dev.lst-WER: 34.17 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 778.24
epoch: 327 | nupdates: 131454 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1119.61 | smp(ms): 6.71 | fwd(ms): 418.87 | crit-fwd(ms): 21.13 | bwd(ms): 638.55 | optim(ms): 57.26 | loss: 10.70045 | train-TER: 45.91 | train-WER: 62.29 | lists/dev.lst-loss: 6.70422 | lists/dev.lst-TER: 20.17 | lists/dev.lst-WER: 34.28 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.85
epoch: 328 | nupdates: 131856 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1120.68 | smp(ms): 7.01 | fwd(ms): 419.48 | crit-fwd(ms): 21.02 | bwd(ms): 639.24 | optim(ms): 57.26 | loss: 10.83294 | train-TER: 39.03 | train-WER: 57.63 | lists/dev.lst-loss: 6.67976 | lists/dev.lst-TER: 19.60 | lists/dev.lst-WER: 33.87 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.10
epoch: 329 | nupdates: 132258 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:31 | bch(ms): 1124.21 | smp(ms): 7.42 | fwd(ms): 418.58 | crit-fwd(ms): 21.16 | bwd(ms): 643.45 | optim(ms): 57.23 | loss: 10.69132 | train-TER: 41.46 | train-WER: 58.36 | lists/dev.lst-loss: 6.70156 | lists/dev.lst-TER: 19.48 | lists/dev.lst-WER: 33.78 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 777.66
epoch: 330 | nupdates: 132660 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1121.06 | smp(ms): 7.23 | fwd(ms): 417.86 | crit-fwd(ms): 21.15 | bwd(ms): 640.94 | optim(ms): 57.23 | loss: 10.85531 | train-TER: 41.36 | train-WER: 58.88 | lists/dev.lst-loss: 6.67632 | lists/dev.lst-TER: 20.09 | lists/dev.lst-WER: 34.17 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 779.84
epoch: 331 | nupdates: 133062 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1120.99 | smp(ms): 5.75 | fwd(ms): 419.02 | crit-fwd(ms): 20.90 | bwd(ms): 639.73 | optim(ms): 57.24 | loss: 10.80438 | train-TER: 41.58 | train-WER: 58.68 | lists/dev.lst-loss: 6.67867 | lists/dev.lst-TER: 19.74 | lists/dev.lst-WER: 33.88 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 779.89
epoch: 332 | nupdates: 133464 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:33 | bch(ms): 1129.12 | smp(ms): 6.69 | fwd(ms): 420.57 | crit-fwd(ms): 21.19 | bwd(ms): 646.30 | optim(ms): 57.23 | loss: 10.82993 | train-TER: 41.24 | train-WER: 58.64 | lists/dev.lst-loss: 6.57723 | lists/dev.lst-TER: 19.50 | lists/dev.lst-WER: 33.73 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 774.27
epoch: 333 | nupdates: 133866 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:36 | bch(ms): 1134.89 | smp(ms): 7.13 | fwd(ms): 418.16 | crit-fwd(ms): 21.05 | bwd(ms): 654.69 | optim(ms): 57.23 | loss: 10.78275 | train-TER: 41.07 | train-WER: 59.83 | lists/dev.lst-loss: 6.75549 | lists/dev.lst-TER: 20.17 | lists/dev.lst-WER: 34.31 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 770.34
epoch: 334 | nupdates: 134268 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:32 | bch(ms): 1125.25 | smp(ms): 6.91 | fwd(ms): 418.37 | crit-fwd(ms): 21.16 | bwd(ms): 644.84 | optim(ms): 57.20 | loss: 10.77315 | train-TER: 43.41 | train-WER: 60.68 | lists/dev.lst-loss: 6.69076 | lists/dev.lst-TER: 20.25 | lists/dev.lst-WER: 34.29 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 776.93
epoch: 335 | nupdates: 134670 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1120.88 | smp(ms): 7.32 | fwd(ms): 418.66 | crit-fwd(ms): 21.15 | bwd(ms): 640.25 | optim(ms): 57.23 | loss: 10.73087 | train-TER: 39.07 | train-WER: 57.27 | lists/dev.lst-loss: 6.73155 | lists/dev.lst-TER: 19.92 | lists/dev.lst-WER: 34.07 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 779.97
epoch: 336 | nupdates: 135072 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:29 | bch(ms): 1117.05 | smp(ms): 7.42 | fwd(ms): 417.77 | crit-fwd(ms): 21.40 | bwd(ms): 637.09 | optim(ms): 57.25 | loss: 10.89123 | train-TER: 37.99 | train-WER: 54.81 | lists/dev.lst-loss: 6.75205 | lists/dev.lst-TER: 20.05 | lists/dev.lst-WER: 34.14 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 782.64
epoch: 337 | nupdates: 135474 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:29 | bch(ms): 1119.21 | smp(ms): 6.95 | fwd(ms): 417.85 | crit-fwd(ms): 21.09 | bwd(ms): 639.37 | optim(ms): 57.24 | loss: 11.02013 | train-TER: 44.59 | train-WER: 61.33 | lists/dev.lst-loss: 6.73084 | lists/dev.lst-TER: 19.73 | lists/dev.lst-WER: 33.92 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.13
epoch: 338 | nupdates: 135876 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1119.79 | smp(ms): 8.22 | fwd(ms): 417.09 | crit-fwd(ms): 21.01 | bwd(ms): 640.96 | optim(ms): 57.23 | loss: 10.85372 | train-TER: 45.72 | train-WER: 63.84 | lists/dev.lst-loss: 6.65583 | lists/dev.lst-TER: 19.74 | lists/dev.lst-WER: 33.94 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.73
epoch: 339 | nupdates: 136278 | lr: 0.025000 | lrcriterion: 0.025000 | runtime: 00:07:30 | bch(ms): 1121.27 | smp(ms): 5.73 | fwd(ms): 419.20 | crit-fwd(ms): 21.09 | bwd(ms): 639.03 | optim(ms): 57.23 | loss: 10.95398 | train-TER: 41.21 | train-WER: 59.35 | lists/dev.lst-loss: 6.67316 | lists/dev.lst-TER: 19.77 | lists/dev.lst-WER: 33.91 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 779.69
epoch: 340 | nupdates: 136680 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1121.39 | smp(ms): 7.26 | fwd(ms): 417.62 | crit-fwd(ms): 21.01 | bwd(ms): 641.43 | optim(ms): 57.21 | loss: 10.87525 | train-TER: 44.39 | train-WER: 61.18 | lists/dev.lst-loss: 6.69762 | lists/dev.lst-TER: 20.05 | lists/dev.lst-WER: 34.18 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 779.61
epoch: 341 | nupdates: 137082 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1121.64 | smp(ms): 8.20 | fwd(ms): 418.02 | crit-fwd(ms): 20.93 | bwd(ms): 641.33 | optim(ms): 57.24 | loss: 10.92946 | train-TER: 47.92 | train-WER: 64.85 | lists/dev.lst-loss: 6.60496 | lists/dev.lst-TER: 19.74 | lists/dev.lst-WER: 33.86 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 779.44
epoch: 342 | nupdates: 137484 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1120.08 | smp(ms): 4.54 | fwd(ms): 418.69 | crit-fwd(ms): 20.98 | bwd(ms): 639.44 | optim(ms): 57.21 | loss: 10.55190 | train-TER: 40.16 | train-WER: 58.84 | lists/dev.lst-loss: 6.62945 | lists/dev.lst-TER: 19.47 | lists/dev.lst-WER: 33.70 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.52
epoch: 343 | nupdates: 137886 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:34 | bch(ms): 1131.34 | smp(ms): 7.58 | fwd(ms): 417.90 | crit-fwd(ms): 20.98 | bwd(ms): 651.43 | optim(ms): 57.21 | loss: 10.77964 | train-TER: 38.16 | train-WER: 54.80 | lists/dev.lst-loss: 6.69175 | lists/dev.lst-TER: 19.65 | lists/dev.lst-WER: 33.87 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 772.76
epoch: 344 | nupdates: 138288 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:28 | bch(ms): 1116.61 | smp(ms): 5.33 | fwd(ms): 418.18 | crit-fwd(ms): 20.97 | bwd(ms): 635.78 | optim(ms): 57.23 | loss: 10.92030 | train-TER: 44.31 | train-WER: 61.06 | lists/dev.lst-loss: 6.68560 | lists/dev.lst-TER: 19.76 | lists/dev.lst-WER: 33.93 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 782.95
epoch: 345 | nupdates: 138690 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1119.88 | smp(ms): 8.06 | fwd(ms): 416.78 | crit-fwd(ms): 21.07 | bwd(ms): 640.89 | optim(ms): 57.19 | loss: 10.72552 | train-TER: 35.15 | train-WER: 54.80 | lists/dev.lst-loss: 6.67925 | lists/dev.lst-TER: 19.73 | lists/dev.lst-WER: 33.86 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.66
epoch: 346 | nupdates: 139092 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:32 | bch(ms): 1125.22 | smp(ms): 6.33 | fwd(ms): 418.75 | crit-fwd(ms): 20.92 | bwd(ms): 644.24 | optim(ms): 57.18 | loss: 10.66137 | train-TER: 42.73 | train-WER: 60.39 | lists/dev.lst-loss: 6.71087 | lists/dev.lst-TER: 19.84 | lists/dev.lst-WER: 33.98 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 776.96
epoch: 347 | nupdates: 139494 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1120.56 | smp(ms): 7.02 | fwd(ms): 418.85 | crit-fwd(ms): 21.05 | bwd(ms): 639.60 | optim(ms): 57.22 | loss: 10.87768 | train-TER: 40.39 | train-WER: 58.12 | lists/dev.lst-loss: 6.65764 | lists/dev.lst-TER: 19.67 | lists/dev.lst-WER: 33.87 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.19
epoch: 348 | nupdates: 139896 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1120.68 | smp(ms): 6.53 | fwd(ms): 417.16 | crit-fwd(ms): 21.00 | bwd(ms): 641.09 | optim(ms): 57.23 | loss: 10.93024 | train-TER: 48.29 | train-WER: 65.10 | lists/dev.lst-loss: 6.64501 | lists/dev.lst-TER: 19.92 | lists/dev.lst-WER: 34.01 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.11
epoch: 349 | nupdates: 140298 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:31 | bch(ms): 1122.77 | smp(ms): 6.65 | fwd(ms): 419.90 | crit-fwd(ms): 21.05 | bwd(ms): 640.52 | optim(ms): 57.22 | loss: 10.83907 | train-TER: 41.24 | train-WER: 59.29 | lists/dev.lst-loss: 6.71243 | lists/dev.lst-TER: 19.69 | lists/dev.lst-WER: 33.89 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 778.66
epoch: 350 | nupdates: 140700 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1120.40 | smp(ms): 7.12 | fwd(ms): 418.32 | crit-fwd(ms): 20.95 | bwd(ms): 640.06 | optim(ms): 57.24 | loss: 10.64456 | train-TER: 47.36 | train-WER: 64.98 | lists/dev.lst-loss: 6.60474 | lists/dev.lst-TER: 19.55 | lists/dev.lst-WER: 33.74 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.30
epoch: 351 | nupdates: 141102 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:31 | bch(ms): 1123.63 | smp(ms): 6.93 | fwd(ms): 418.48 | crit-fwd(ms): 21.39 | bwd(ms): 643.42 | optim(ms): 57.21 | loss: 10.56230 | train-TER: 42.91 | train-WER: 61.16 | lists/dev.lst-loss: 6.59990 | lists/dev.lst-TER: 19.55 | lists/dev.lst-WER: 33.73 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 778.06
epoch: 352 | nupdates: 141504 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1120.26 | smp(ms): 5.71 | fwd(ms): 419.46 | crit-fwd(ms): 20.99 | bwd(ms): 638.94 | optim(ms): 57.25 | loss: 10.67672 | train-TER: 35.06 | train-WER: 51.89 | lists/dev.lst-loss: 6.59618 | lists/dev.lst-TER: 19.66 | lists/dev.lst-WER: 33.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 780.40
epoch: 353 | nupdates: 141906 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1121.20 | smp(ms): 8.04 | fwd(ms): 418.37 | crit-fwd(ms): 20.98 | bwd(ms): 640.77 | optim(ms): 57.22 | loss: 10.99347 | train-TER: 40.91 | train-WER: 57.35 | lists/dev.lst-loss: 6.66943 | lists/dev.lst-TER: 19.64 | lists/dev.lst-WER: 33.79 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 779.74
epoch: 354 | nupdates: 142308 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1119.88 | smp(ms): 7.20 | fwd(ms): 418.56 | crit-fwd(ms): 21.02 | bwd(ms): 639.07 | optim(ms): 57.23 | loss: 10.61850 | train-TER: 36.69 | train-WER: 54.70 | lists/dev.lst-loss: 6.66907 | lists/dev.lst-TER: 19.86 | lists/dev.lst-WER: 33.88 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.66
epoch: 355 | nupdates: 142710 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:31 | bch(ms): 1121.94 | smp(ms): 7.51 | fwd(ms): 418.77 | crit-fwd(ms): 21.09 | bwd(ms): 640.83 | optim(ms): 57.21 | loss: 10.72346 | train-TER: 41.79 | train-WER: 59.93 | lists/dev.lst-loss: 6.65510 | lists/dev.lst-TER: 19.60 | lists/dev.lst-WER: 33.74 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 118 | hrs: 97.62 | thrpt(sec/sec): 779.23
epoch: 356 | nupdates: 143112 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1120.20 | smp(ms): 7.40 | fwd(ms): 418.91 | crit-fwd(ms): 21.13 | bwd(ms): 639.00 | optim(ms): 57.22 | loss: 10.80536 | train-TER: 48.13 | train-WER: 65.24 | lists/dev.lst-loss: 6.66143 | lists/dev.lst-TER: 19.68 | lists/dev.lst-WER: 33.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.44
epoch: 357 | nupdates: 143514 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1119.68 | smp(ms): 6.11 | fwd(ms): 417.78 | crit-fwd(ms): 21.02 | bwd(ms): 639.69 | optim(ms): 57.22 | loss: 10.57769 | train-TER: 38.02 | train-WER: 56.00 | lists/dev.lst-loss: 6.73684 | lists/dev.lst-TER: 19.88 | lists/dev.lst-WER: 33.92 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.80
epoch: 358 | nupdates: 143916 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:29 | bch(ms): 1118.92 | smp(ms): 5.47 | fwd(ms): 417.57 | crit-fwd(ms): 21.04 | bwd(ms): 639.12 | optim(ms): 57.24 | loss: 10.63500 | train-TER: 40.68 | train-WER: 58.58 | lists/dev.lst-loss: 6.71481 | lists/dev.lst-TER: 19.90 | lists/dev.lst-WER: 33.99 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.33
epoch: 359 | nupdates: 144318 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:29 | bch(ms): 1118.19 | smp(ms): 6.65 | fwd(ms): 418.51 | crit-fwd(ms): 21.00 | bwd(ms): 637.75 | optim(ms): 57.22 | loss: 10.94275 | train-TER: 43.29 | train-WER: 61.43 | lists/dev.lst-loss: 6.62894 | lists/dev.lst-TER: 19.76 | lists/dev.lst-WER: 33.86 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 781.84
epoch: 360 | nupdates: 144720 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:29 | bch(ms): 1119.19 | smp(ms): 5.86 | fwd(ms): 417.40 | crit-fwd(ms): 21.04 | bwd(ms): 639.65 | optim(ms): 57.22 | loss: 10.70565 | train-TER: 44.41 | train-WER: 62.68 | lists/dev.lst-loss: 6.73623 | lists/dev.lst-TER: 19.81 | lists/dev.lst-WER: 33.91 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.15
epoch: 361 | nupdates: 145122 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:29 | bch(ms): 1119.25 | smp(ms): 5.72 | fwd(ms): 417.23 | crit-fwd(ms): 20.92 | bwd(ms): 639.30 | optim(ms): 57.24 | loss: 10.80538 | train-TER: 44.84 | train-WER: 62.61 | lists/dev.lst-loss: 6.65564 | lists/dev.lst-TER: 19.54 | lists/dev.lst-WER: 33.70 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.10
epoch: 362 | nupdates: 145524 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:29 | bch(ms): 1118.93 | smp(ms): 6.25 | fwd(ms): 417.72 | crit-fwd(ms): 21.02 | bwd(ms): 638.63 | optim(ms): 57.25 | loss: 10.60469 | train-TER: 44.62 | train-WER: 61.79 | lists/dev.lst-loss: 6.67576 | lists/dev.lst-TER: 19.63 | lists/dev.lst-WER: 33.72 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.32
epoch: 363 | nupdates: 145926 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:31 | bch(ms): 1122.65 | smp(ms): 6.99 | fwd(ms): 418.94 | crit-fwd(ms): 21.01 | bwd(ms): 641.12 | optim(ms): 57.20 | loss: 10.81291 | train-TER: 47.05 | train-WER: 64.34 | lists/dev.lst-loss: 6.63599 | lists/dev.lst-TER: 19.77 | lists/dev.lst-WER: 33.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 778.74
epoch: 364 | nupdates: 146328 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:29 | bch(ms): 1118.51 | smp(ms): 6.31 | fwd(ms): 417.10 | crit-fwd(ms): 21.09 | bwd(ms): 639.50 | optim(ms): 57.22 | loss: 10.82430 | train-TER: 42.32 | train-WER: 60.30 | lists/dev.lst-loss: 6.66549 | lists/dev.lst-TER: 19.76 | lists/dev.lst-WER: 33.82 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.62
epoch: 365 | nupdates: 146730 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:31 | bch(ms): 1122.79 | smp(ms): 6.72 | fwd(ms): 418.29 | crit-fwd(ms): 20.95 | bwd(ms): 642.36 | optim(ms): 57.19 | loss: 10.68717 | train-TER: 47.24 | train-WER: 65.46 | lists/dev.lst-loss: 6.70168 | lists/dev.lst-TER: 19.87 | lists/dev.lst-WER: 33.91 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 778.64
epoch: 366 | nupdates: 147132 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:31 | bch(ms): 1123.72 | smp(ms): 7.98 | fwd(ms): 419.31 | crit-fwd(ms): 21.11 | bwd(ms): 642.50 | optim(ms): 57.23 | loss: 10.70517 | train-TER: 41.96 | train-WER: 59.62 | lists/dev.lst-loss: 6.70760 | lists/dev.lst-TER: 19.68 | lists/dev.lst-WER: 33.76 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 777.99
epoch: 367 | nupdates: 147534 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:33 | bch(ms): 1128.79 | smp(ms): 8.14 | fwd(ms): 419.81 | crit-fwd(ms): 21.25 | bwd(ms): 646.95 | optim(ms): 57.19 | loss: 10.73120 | train-TER: 31.01 | train-WER: 48.88 | lists/dev.lst-loss: 6.69520 | lists/dev.lst-TER: 19.87 | lists/dev.lst-WER: 33.93 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 774.50
epoch: 368 | nupdates: 147936 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1121.24 | smp(ms): 6.52 | fwd(ms): 417.76 | crit-fwd(ms): 21.05 | bwd(ms): 641.21 | optim(ms): 57.21 | loss: 10.68916 | train-TER: 42.01 | train-WER: 59.07 | lists/dev.lst-loss: 6.74897 | lists/dev.lst-TER: 19.92 | lists/dev.lst-WER: 33.92 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 779.71
epoch: 369 | nupdates: 148338 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:29 | bch(ms): 1117.61 | smp(ms): 6.13 | fwd(ms): 418.39 | crit-fwd(ms): 21.26 | bwd(ms): 636.24 | optim(ms): 57.24 | loss: 10.69075 | train-TER: 43.12 | train-WER: 60.67 | lists/dev.lst-loss: 6.58688 | lists/dev.lst-TER: 19.76 | lists/dev.lst-WER: 33.89 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 782.25
epoch: 370 | nupdates: 148740 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:31 | bch(ms): 1122.40 | smp(ms): 7.72 | fwd(ms): 417.65 | crit-fwd(ms): 21.28 | bwd(ms): 642.40 | optim(ms): 57.21 | loss: 10.87215 | train-TER: 40.21 | train-WER: 58.63 | lists/dev.lst-loss: 6.61945 | lists/dev.lst-TER: 19.95 | lists/dev.lst-WER: 34.01 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 778.91
epoch: 371 | nupdates: 149142 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1120.24 | smp(ms): 6.42 | fwd(ms): 418.67 | crit-fwd(ms): 20.97 | bwd(ms): 639.23 | optim(ms): 57.22 | loss: 10.61025 | train-TER: 46.16 | train-WER: 62.50 | lists/dev.lst-loss: 6.68208 | lists/dev.lst-TER: 19.93 | lists/dev.lst-WER: 33.94 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.41
epoch: 372 | nupdates: 149544 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1119.79 | smp(ms): 5.11 | fwd(ms): 418.69 | crit-fwd(ms): 21.00 | bwd(ms): 638.65 | optim(ms): 57.21 | loss: 10.74536 | train-TER: 40.76 | train-WER: 57.79 | lists/dev.lst-loss: 6.68823 | lists/dev.lst-TER: 19.94 | lists/dev.lst-WER: 34.00 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.73
epoch: 373 | nupdates: 149946 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:28 | bch(ms): 1116.46 | smp(ms): 7.35 | fwd(ms): 416.65 | crit-fwd(ms): 21.16 | bwd(ms): 637.79 | optim(ms): 57.21 | loss: 10.89943 | train-TER: 38.84 | train-WER: 57.21 | lists/dev.lst-loss: 6.69341 | lists/dev.lst-TER: 19.76 | lists/dev.lst-WER: 33.83 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 783.06
epoch: 374 | nupdates: 150348 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1119.50 | smp(ms): 7.09 | fwd(ms): 417.02 | crit-fwd(ms): 21.20 | bwd(ms): 640.63 | optim(ms): 57.23 | loss: 10.71602 | train-TER: 37.35 | train-WER: 55.89 | lists/dev.lst-loss: 6.63854 | lists/dev.lst-TER: 19.59 | lists/dev.lst-WER: 33.71 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 780.93
epoch: 375 | nupdates: 150750 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:28 | bch(ms): 1115.36 | smp(ms): 6.82 | fwd(ms): 417.23 | crit-fwd(ms): 21.07 | bwd(ms): 635.92 | optim(ms): 57.25 | loss: 10.74817 | train-TER: 38.59 | train-WER: 55.37 | lists/dev.lst-loss: 6.68849 | lists/dev.lst-TER: 20.18 | lists/dev.lst-WER: 34.18 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 783.83
epoch: 376 | nupdates: 151152 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:31 | bch(ms): 1122.78 | smp(ms): 8.22 | fwd(ms): 417.07 | crit-fwd(ms): 21.21 | bwd(ms): 643.75 | optim(ms): 57.21 | loss: 10.77428 | train-TER: 41.59 | train-WER: 60.24 | lists/dev.lst-loss: 6.61870 | lists/dev.lst-TER: 19.82 | lists/dev.lst-WER: 33.89 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 778.65
epoch: 377 | nupdates: 151554 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1121.40 | smp(ms): 6.81 | fwd(ms): 420.51 | crit-fwd(ms): 21.18 | bwd(ms): 638.97 | optim(ms): 57.22 | loss: 10.63653 | train-TER: 40.69 | train-WER: 58.46 | lists/dev.lst-loss: 6.64540 | lists/dev.lst-TER: 19.85 | lists/dev.lst-WER: 33.91 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 779.61
epoch: 378 | nupdates: 151956 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:29 | bch(ms): 1118.65 | smp(ms): 6.22 | fwd(ms): 418.68 | crit-fwd(ms): 21.26 | bwd(ms): 637.80 | optim(ms): 57.24 | loss: 10.87476 | train-TER: 44.23 | train-WER: 61.85 | lists/dev.lst-loss: 6.63541 | lists/dev.lst-TER: 19.71 | lists/dev.lst-WER: 33.86 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 781.52
epoch: 379 | nupdates: 152358 | lr: 0.012500 | lrcriterion: 0.012500 | runtime: 00:07:30 | bch(ms): 1121.86 | smp(ms): 6.84 | fwd(ms): 418.92 | crit-fwd(ms): 20.91 | bwd(ms): 640.92 | optim(ms): 57.21 | loss: 10.59453 | train-TER: 42.60 | train-WER: 60.01 | lists/dev.lst-loss: 6.57962 | lists/dev.lst-TER: 19.56 | lists/dev.lst-WER: 33.68 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 779.28
epoch: 380 | nupdates: 152760 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:32 | bch(ms): 1126.29 | smp(ms): 6.61 | fwd(ms): 418.76 | crit-fwd(ms): 21.23 | bwd(ms): 645.36 | optim(ms): 57.26 | loss: 10.74273 | train-TER: 48.93 | train-WER: 65.37 | lists/dev.lst-loss: 6.69067 | lists/dev.lst-TER: 19.63 | lists/dev.lst-WER: 33.73 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 776.22
epoch: 381 | nupdates: 153162 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:30 | bch(ms): 1120.88 | smp(ms): 6.71 | fwd(ms): 418.56 | crit-fwd(ms): 20.99 | bwd(ms): 639.91 | optim(ms): 57.22 | loss: 10.73482 | train-TER: 44.53 | train-WER: 62.77 | lists/dev.lst-loss: 6.72419 | lists/dev.lst-TER: 19.69 | lists/dev.lst-WER: 33.78 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 779.97
epoch: 382 | nupdates: 153564 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:31 | bch(ms): 1123.83 | smp(ms): 6.43 | fwd(ms): 418.62 | crit-fwd(ms): 21.02 | bwd(ms): 643.12 | optim(ms): 57.23 | loss: 10.73894 | train-TER: 34.70 | train-WER: 52.31 | lists/dev.lst-loss: 6.66490 | lists/dev.lst-TER: 19.79 | lists/dev.lst-WER: 33.82 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 777.92
epoch: 383 | nupdates: 153966 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:32 | bch(ms): 1124.83 | smp(ms): 7.19 | fwd(ms): 418.61 | crit-fwd(ms): 21.11 | bwd(ms): 644.22 | optim(ms): 57.22 | loss: 10.84190 | train-TER: 47.90 | train-WER: 65.20 | lists/dev.lst-loss: 6.64215 | lists/dev.lst-TER: 19.62 | lists/dev.lst-WER: 33.78 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 777.23
epoch: 384 | nupdates: 154368 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:29 | bch(ms): 1118.47 | smp(ms): 7.17 | fwd(ms): 418.47 | crit-fwd(ms): 21.06 | bwd(ms): 637.92 | optim(ms): 57.24 | loss: 10.76920 | train-TER: 42.60 | train-WER: 60.00 | lists/dev.lst-loss: 6.61777 | lists/dev.lst-TER: 19.57 | lists/dev.lst-WER: 33.70 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.65
epoch: 385 | nupdates: 154770 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:32 | bch(ms): 1124.39 | smp(ms): 7.13 | fwd(ms): 419.08 | crit-fwd(ms): 21.07 | bwd(ms): 643.21 | optim(ms): 57.22 | loss: 10.84138 | train-TER: 44.53 | train-WER: 62.33 | lists/dev.lst-loss: 6.65517 | lists/dev.lst-TER: 19.81 | lists/dev.lst-WER: 33.88 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 777.53
epoch: 386 | nupdates: 155172 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:29 | bch(ms): 1119.36 | smp(ms): 6.84 | fwd(ms): 417.83 | crit-fwd(ms): 21.14 | bwd(ms): 639.66 | optim(ms): 57.25 | loss: 10.75169 | train-TER: 43.95 | train-WER: 62.08 | lists/dev.lst-loss: 6.60215 | lists/dev.lst-TER: 19.78 | lists/dev.lst-WER: 33.88 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 781.02
epoch: 387 | nupdates: 155574 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:32 | bch(ms): 1126.64 | smp(ms): 7.29 | fwd(ms): 419.80 | crit-fwd(ms): 21.05 | bwd(ms): 644.80 | optim(ms): 57.21 | loss: 10.65912 | train-TER: 34.57 | train-WER: 51.59 | lists/dev.lst-loss: 6.66376 | lists/dev.lst-TER: 19.74 | lists/dev.lst-WER: 33.83 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 775.98
epoch: 388 | nupdates: 155976 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:31 | bch(ms): 1122.30 | smp(ms): 7.31 | fwd(ms): 418.33 | crit-fwd(ms): 21.31 | bwd(ms): 641.73 | optim(ms): 57.21 | loss: 10.62669 | train-TER: 46.35 | train-WER: 63.95 | lists/dev.lst-loss: 6.67349 | lists/dev.lst-TER: 19.61 | lists/dev.lst-WER: 33.71 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 778.98
epoch: 389 | nupdates: 156378 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:31 | bch(ms): 1124.34 | smp(ms): 7.23 | fwd(ms): 418.26 | crit-fwd(ms): 21.16 | bwd(ms): 643.89 | optim(ms): 57.20 | loss: 10.75452 | train-TER: 45.12 | train-WER: 62.49 | lists/dev.lst-loss: 6.67610 | lists/dev.lst-TER: 19.77 | lists/dev.lst-WER: 33.82 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 777.56
epoch: 390 | nupdates: 156780 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:31 | bch(ms): 1123.01 | smp(ms): 7.92 | fwd(ms): 418.60 | crit-fwd(ms): 21.23 | bwd(ms): 642.24 | optim(ms): 57.22 | loss: 10.73723 | train-TER: 50.22 | train-WER: 68.62 | lists/dev.lst-loss: 6.64329 | lists/dev.lst-TER: 19.71 | lists/dev.lst-WER: 33.75 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 778.49
epoch: 391 | nupdates: 157182 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:31 | bch(ms): 1122.19 | smp(ms): 8.26 | fwd(ms): 418.19 | crit-fwd(ms): 21.11 | bwd(ms): 641.52 | optim(ms): 57.25 | loss: 10.75576 | train-TER: 42.55 | train-WER: 60.68 | lists/dev.lst-loss: 6.64239 | lists/dev.lst-TER: 19.68 | lists/dev.lst-WER: 33.72 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 779.05
epoch: 392 | nupdates: 157584 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:31 | bch(ms): 1124.35 | smp(ms): 7.34 | fwd(ms): 418.32 | crit-fwd(ms): 21.10 | bwd(ms): 643.46 | optim(ms): 57.24 | loss: 10.64738 | train-TER: 41.47 | train-WER: 59.60 | lists/dev.lst-loss: 6.61881 | lists/dev.lst-TER: 19.76 | lists/dev.lst-WER: 33.82 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 777.56
epoch: 393 | nupdates: 157986 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:28 | bch(ms): 1116.80 | smp(ms): 6.79 | fwd(ms): 417.06 | crit-fwd(ms): 21.20 | bwd(ms): 637.89 | optim(ms): 57.26 | loss: 10.47069 | train-TER: 41.11 | train-WER: 57.11 | lists/dev.lst-loss: 6.59647 | lists/dev.lst-TER: 19.54 | lists/dev.lst-WER: 33.68 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 782.82
epoch: 394 | nupdates: 158388 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:30 | bch(ms): 1119.47 | smp(ms): 4.96 | fwd(ms): 417.22 | crit-fwd(ms): 20.93 | bwd(ms): 638.43 | optim(ms): 57.23 | loss: 10.66487 | train-TER: 43.43 | train-WER: 60.14 | lists/dev.lst-loss: 6.64685 | lists/dev.lst-TER: 19.73 | lists/dev.lst-WER: 33.83 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 780.95
epoch: 395 | nupdates: 158790 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:32 | bch(ms): 1125.30 | smp(ms): 7.04 | fwd(ms): 419.28 | crit-fwd(ms): 21.30 | bwd(ms): 643.98 | optim(ms): 57.23 | loss: 10.68931 | train-TER: 44.86 | train-WER: 62.54 | lists/dev.lst-loss: 6.60740 | lists/dev.lst-TER: 19.61 | lists/dev.lst-WER: 33.75 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 776.91
epoch: 396 | nupdates: 159192 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:31 | bch(ms): 1124.13 | smp(ms): 6.57 | fwd(ms): 419.13 | crit-fwd(ms): 21.08 | bwd(ms): 642.24 | optim(ms): 57.23 | loss: 10.60523 | train-TER: 38.68 | train-WER: 56.60 | lists/dev.lst-loss: 6.57608 | lists/dev.lst-TER: 19.54 | lists/dev.lst-WER: 33.72 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 777.71
epoch: 397 | nupdates: 159594 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:31 | bch(ms): 1122.64 | smp(ms): 7.56 | fwd(ms): 418.76 | crit-fwd(ms): 20.96 | bwd(ms): 642.06 | optim(ms): 57.23 | loss: 10.74693 | train-TER: 40.34 | train-WER: 57.30 | lists/dev.lst-loss: 6.60898 | lists/dev.lst-TER: 19.69 | lists/dev.lst-WER: 33.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 121 | hrs: 97.62 | thrpt(sec/sec): 778.74
epoch: 398 | nupdates: 159996 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:28 | bch(ms): 1116.67 | smp(ms): 5.10 | fwd(ms): 417.85 | crit-fwd(ms): 21.01 | bwd(ms): 636.57 | optim(ms): 57.25 | loss: 10.58123 | train-TER: 44.81 | train-WER: 61.63 | lists/dev.lst-loss: 6.59653 | lists/dev.lst-TER: 19.82 | lists/dev.lst-WER: 33.88 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 782.90
epoch: 399 | nupdates: 160398 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:31 | bch(ms): 1123.11 | smp(ms): 8.13 | fwd(ms): 418.90 | crit-fwd(ms): 21.12 | bwd(ms): 642.17 | optim(ms): 57.25 | loss: 10.53012 | train-TER: 40.06 | train-WER: 56.77 | lists/dev.lst-loss: 6.62226 | lists/dev.lst-TER: 19.82 | lists/dev.lst-WER: 33.87 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 778.42
epoch: 400 | nupdates: 160800 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:31 | bch(ms): 1122.56 | smp(ms): 7.06 | fwd(ms): 418.75 | crit-fwd(ms): 21.09 | bwd(ms): 641.36 | optim(ms): 57.24 | loss: 10.64156 | train-TER: 52.41 | train-WER: 68.82 | lists/dev.lst-loss: 6.67411 | lists/dev.lst-TER: 19.79 | lists/dev.lst-WER: 33.87 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 778.80
epoch: 401 | nupdates: 161202 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:29 | bch(ms): 1118.23 | smp(ms): 3.67 | fwd(ms): 417.46 | crit-fwd(ms): 20.88 | bwd(ms): 637.65 | optim(ms): 57.31 | loss: 10.64980 | train-TER: 42.47 | train-WER: 60.65 | lists/dev.lst-loss: 6.61162 | lists/dev.lst-TER: 19.59 | lists/dev.lst-WER: 33.74 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 781.81
epoch: 402 | nupdates: 161604 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:32 | bch(ms): 1124.50 | smp(ms): 4.92 | fwd(ms): 420.02 | crit-fwd(ms): 20.92 | bwd(ms): 642.55 | optim(ms): 57.33 | loss: 10.77812 | train-TER: 48.15 | train-WER: 65.94 | lists/dev.lst-loss: 6.58243 | lists/dev.lst-TER: 19.69 | lists/dev.lst-WER: 33.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 777.45
epoch: 403 | nupdates: 162006 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:31 | bch(ms): 1122.55 | smp(ms): 6.38 | fwd(ms): 419.54 | crit-fwd(ms): 20.96 | bwd(ms): 640.69 | optim(ms): 57.22 | loss: 10.65866 | train-TER: 41.94 | train-WER: 60.21 | lists/dev.lst-loss: 6.61306 | lists/dev.lst-TER: 19.68 | lists/dev.lst-WER: 33.77 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 119 | hrs: 97.62 | thrpt(sec/sec): 778.81
epoch: 404 | nupdates: 162408 | lr: 0.006250 | lrcriterion: 0.006250 | runtime: 00:07:32 | bch(ms): 1125.92 | smp(ms): 7.74 | fwd(ms): 418.89 | crit-fwd(ms): 21.13 | bwd(ms): 644.72 | optim(ms): 57.24 | loss: 10.54506 | train-TER: 43.04 | train-WER: 60.40 | lists/dev.lst-loss: 6.61504 | lists/dev.lst-TER: 19.71 | lists/dev.lst-WER: 33.80 | avg-isz: 683 | avg-tsz: 023 | max-tsz: 120 | hrs: 97.62 | thrpt(sec/sec): 776.48