epoch: 6 | nupdates: 3693 | lr: 0.092325 | lrcriterion: 0.092325 | runtime: 00:10:47 | bch(ms): 806.10 | smp(ms): 1.58 | fwd(ms): 281.74 | crit-fwd(ms): 19.56 | bwd(ms): 458.02 | optim(ms): 58.80 | loss: 29.71504 | train-TER: 100.00 | train-WER: 100.00 | lists/dev.lst-loss: 30.62654 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 539.44
epoch: 7 | nupdates: 4496 | lr: 0.112400 | lrcriterion: 0.112400 | runtime: 00:10:39 | bch(ms): 796.35 | smp(ms): 1.71 | fwd(ms): 277.77 | crit-fwd(ms): 18.88 | bwd(ms): 459.27 | optim(ms): 56.95 | loss: 29.14489 | train-TER: 100.00 | train-WER: 100.00 | lists/dev.lst-loss: 28.66800 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 546.04
epoch: 8 | nupdates: 5299 | lr: 0.132475 | lrcriterion: 0.132475 | runtime: 00:10:43 | bch(ms): 801.20 | smp(ms): 2.18 | fwd(ms): 278.16 | crit-fwd(ms): 18.90 | bwd(ms): 463.76 | optim(ms): 56.85 | loss: 28.84527 | train-TER: 99.97 | train-WER: 100.00 | lists/dev.lst-loss: 29.02840 | lists/dev.lst-TER: 100.00 | lists/dev.lst-WER: 100.00 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 542.74
epoch: 9 | nupdates: 6102 | lr: 0.152550 | lrcriterion: 0.152550 | runtime: 00:10:45 | bch(ms): 803.61 | smp(ms): 2.86 | fwd(ms): 277.53 | crit-fwd(ms): 18.92 | bwd(ms): 466.88 | optim(ms): 56.80 | loss: 28.60569 | train-TER: 99.24 | train-WER: 99.80 | lists/dev.lst-loss: 27.97900 | lists/dev.lst-TER: 99.70 | lists/dev.lst-WER: 99.85 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 541.11
epoch: 10 | nupdates: 6905 | lr: 0.172625 | lrcriterion: 0.172625 | runtime: 00:10:46 | bch(ms): 804.84 | smp(ms): 2.25 | fwd(ms): 277.49 | crit-fwd(ms): 18.91 | bwd(ms): 468.28 | optim(ms): 56.76 | loss: 28.21785 | train-TER: 99.30 | train-WER: 99.47 | lists/dev.lst-loss: 27.66185 | lists/dev.lst-TER: 99.38 | lists/dev.lst-WER: 99.46 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 540.28
epoch: 11 | nupdates: 7708 | lr: 0.192700 | lrcriterion: 0.192700 | runtime: 00:10:47 | bch(ms): 806.10 | smp(ms): 1.62 | fwd(ms): 278.00 | crit-fwd(ms): 18.81 | bwd(ms): 468.94 | optim(ms): 56.77 | loss: 27.72629 | train-TER: 98.35 | train-WER: 98.70 | lists/dev.lst-loss: 26.79953 | lists/dev.lst-TER: 95.71 | lists/dev.lst-WER: 97.50 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 539.44
epoch: 12 | nupdates: 8511 | lr: 0.212775 | lrcriterion: 0.212775 | runtime: 00:10:48 | bch(ms): 807.17 | smp(ms): 2.03 | fwd(ms): 278.34 | crit-fwd(ms): 18.96 | bwd(ms): 469.80 | optim(ms): 56.76 | loss: 27.04987 | train-TER: 97.35 | train-WER: 97.97 | lists/dev.lst-loss: 26.03985 | lists/dev.lst-TER: 93.85 | lists/dev.lst-WER: 96.80 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 538.73
epoch: 13 | nupdates: 9314 | lr: 0.232850 | lrcriterion: 0.232850 | runtime: 00:10:47 | bch(ms): 806.22 | smp(ms): 2.04 | fwd(ms): 277.73 | crit-fwd(ms): 18.93 | bwd(ms): 469.40 | optim(ms): 56.73 | loss: 26.35331 | train-TER: 92.61 | train-WER: 95.84 | lists/dev.lst-loss: 25.20862 | lists/dev.lst-TER: 89.18 | lists/dev.lst-WER: 94.41 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 539.36
epoch: 14 | nupdates: 10117 | lr: 0.252925 | lrcriterion: 0.252925 | runtime: 00:10:48 | bch(ms): 808.08 | smp(ms): 2.19 | fwd(ms): 278.11 | crit-fwd(ms): 18.94 | bwd(ms): 470.81 | optim(ms): 56.72 | loss: 25.59886 | train-TER: 92.22 | train-WER: 95.18 | lists/dev.lst-loss: 24.39065 | lists/dev.lst-TER: 88.33 | lists/dev.lst-WER: 92.71 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 538.11
epoch: 15 | nupdates: 10920 | lr: 0.273000 | lrcriterion: 0.273000 | runtime: 00:10:48 | bch(ms): 807.92 | smp(ms): 2.56 | fwd(ms): 278.24 | crit-fwd(ms): 18.97 | bwd(ms): 470.64 | optim(ms): 56.72 | loss: 24.83128 | train-TER: 89.48 | train-WER: 93.93 | lists/dev.lst-loss: 23.62460 | lists/dev.lst-TER: 91.46 | lists/dev.lst-WER: 93.91 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 538.22
epoch: 16 | nupdates: 11723 | lr: 0.293075 | lrcriterion: 0.293075 | runtime: 00:10:42 | bch(ms): 800.53 | smp(ms): 1.44 | fwd(ms): 277.28 | crit-fwd(ms): 18.84 | bwd(ms): 463.74 | optim(ms): 56.73 | loss: 24.10814 | train-TER: 86.15 | train-WER: 92.39 | lists/dev.lst-loss: 22.78769 | lists/dev.lst-TER: 86.12 | lists/dev.lst-WER: 91.00 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 543.19
epoch: 17 | nupdates: 12526 | lr: 0.313150 | lrcriterion: 0.313150 | runtime: 00:10:48 | bch(ms): 807.45 | smp(ms): 2.43 | fwd(ms): 278.20 | crit-fwd(ms): 18.95 | bwd(ms): 470.08 | optim(ms): 56.73 | loss: 23.39149 | train-TER: 81.98 | train-WER: 90.51 | lists/dev.lst-loss: 22.04153 | lists/dev.lst-TER: 77.93 | lists/dev.lst-WER: 88.93 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 538.54
epoch: 18 | nupdates: 13329 | lr: 0.333225 | lrcriterion: 0.333225 | runtime: 00:10:48 | bch(ms): 807.96 | smp(ms): 2.21 | fwd(ms): 278.55 | crit-fwd(ms): 18.96 | bwd(ms): 470.34 | optim(ms): 56.73 | loss: 22.74859 | train-TER: 80.67 | train-WER: 89.68 | lists/dev.lst-loss: 21.45315 | lists/dev.lst-TER: 78.01 | lists/dev.lst-WER: 87.71 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 538.20
epoch: 19 | nupdates: 14132 | lr: 0.353300 | lrcriterion: 0.353300 | runtime: 00:10:47 | bch(ms): 806.83 | smp(ms): 1.55 | fwd(ms): 277.25 | crit-fwd(ms): 18.91 | bwd(ms): 470.52 | optim(ms): 56.71 | loss: 22.17432 | train-TER: 83.02 | train-WER: 90.48 | lists/dev.lst-loss: 21.05041 | lists/dev.lst-TER: 82.57 | lists/dev.lst-WER: 90.55 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 538.95
epoch: 20 | nupdates: 14935 | lr: 0.373375 | lrcriterion: 0.373375 | runtime: 00:10:43 | bch(ms): 801.74 | smp(ms): 2.21 | fwd(ms): 277.05 | crit-fwd(ms): 18.90 | bwd(ms): 465.49 | optim(ms): 56.71 | loss: 21.59827 | train-TER: 78.18 | train-WER: 88.98 | lists/dev.lst-loss: 20.53805 | lists/dev.lst-TER: 72.09 | lists/dev.lst-WER: 85.10 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 542.37
epoch: 21 | nupdates: 15738 | lr: 0.393450 | lrcriterion: 0.393450 | runtime: 00:10:47 | bch(ms): 806.88 | smp(ms): 2.02 | fwd(ms): 277.97 | crit-fwd(ms): 18.91 | bwd(ms): 469.87 | optim(ms): 56.71 | loss: 21.07051 | train-TER: 77.23 | train-WER: 88.04 | lists/dev.lst-loss: 19.76956 | lists/dev.lst-TER: 76.42 | lists/dev.lst-WER: 86.35 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 538.92
epoch: 22 | nupdates: 16541 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:33 | bch(ms): 789.39 | smp(ms): 2.07 | fwd(ms): 274.87 | crit-fwd(ms): 19.18 | bwd(ms): 455.43 | optim(ms): 56.74 | loss: 24.01818 | train-TER: 81.88 | train-WER: 91.60 | lists/dev.lst-loss: 20.42508 | lists/dev.lst-TER: 78.47 | lists/dev.lst-WER: 88.52 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 550.86
epoch: 23 | nupdates: 17344 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:31 | bch(ms): 785.99 | smp(ms): 2.71 | fwd(ms): 274.07 | crit-fwd(ms): 19.35 | bwd(ms): 452.81 | optim(ms): 56.77 | loss: 24.67981 | train-TER: 82.47 | train-WER: 92.73 | lists/dev.lst-loss: 20.08192 | lists/dev.lst-TER: 81.08 | lists/dev.lst-WER: 89.24 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.24
epoch: 24 | nupdates: 18147 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:32 | bch(ms): 787.43 | smp(ms): 1.43 | fwd(ms): 274.29 | crit-fwd(ms): 19.26 | bwd(ms): 453.56 | optim(ms): 56.76 | loss: 24.26502 | train-TER: 86.22 | train-WER: 93.42 | lists/dev.lst-loss: 19.65014 | lists/dev.lst-TER: 74.80 | lists/dev.lst-WER: 86.67 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 552.23
epoch: 25 | nupdates: 18950 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:32 | bch(ms): 788.16 | smp(ms): 2.04 | fwd(ms): 274.05 | crit-fwd(ms): 19.21 | bwd(ms): 454.89 | optim(ms): 56.76 | loss: 24.01530 | train-TER: 87.48 | train-WER: 93.93 | lists/dev.lst-loss: 19.38371 | lists/dev.lst-TER: 77.27 | lists/dev.lst-WER: 87.56 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 124 | hrs: 96.99 | thrpt(sec/sec): 551.71
epoch: 26 | nupdates: 19753 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:31 | bch(ms): 786.68 | smp(ms): 2.00 | fwd(ms): 274.33 | crit-fwd(ms): 19.21 | bwd(ms): 453.14 | optim(ms): 56.77 | loss: 23.58201 | train-TER: 82.88 | train-WER: 92.24 | lists/dev.lst-loss: 18.96313 | lists/dev.lst-TER: 74.08 | lists/dev.lst-WER: 85.77 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 552.75
epoch: 27 | nupdates: 20556 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:31 | bch(ms): 786.32 | smp(ms): 1.97 | fwd(ms): 274.27 | crit-fwd(ms): 19.29 | bwd(ms): 452.99 | optim(ms): 56.77 | loss: 23.26930 | train-TER: 85.13 | train-WER: 93.09 | lists/dev.lst-loss: 18.53279 | lists/dev.lst-TER: 77.32 | lists/dev.lst-WER: 86.91 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.01
epoch: 28 | nupdates: 21359 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:28 | bch(ms): 783.26 | smp(ms): 1.91 | fwd(ms): 273.98 | crit-fwd(ms): 19.22 | bwd(ms): 449.95 | optim(ms): 56.78 | loss: 23.09594 | train-TER: 84.34 | train-WER: 92.56 | lists/dev.lst-loss: 17.70705 | lists/dev.lst-TER: 63.86 | lists/dev.lst-WER: 80.82 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 555.17
epoch: 29 | nupdates: 22162 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:35 | bch(ms): 791.42 | smp(ms): 2.13 | fwd(ms): 274.33 | crit-fwd(ms): 19.25 | bwd(ms): 457.94 | optim(ms): 56.77 | loss: 22.57435 | train-TER: 79.90 | train-WER: 90.32 | lists/dev.lst-loss: 17.26934 | lists/dev.lst-TER: 65.10 | lists/dev.lst-WER: 81.35 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 549.44
epoch: 30 | nupdates: 22965 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:31 | bch(ms): 786.82 | smp(ms): 2.12 | fwd(ms): 273.99 | crit-fwd(ms): 19.24 | bwd(ms): 453.66 | optim(ms): 56.77 | loss: 22.32816 | train-TER: 74.22 | train-WER: 87.75 | lists/dev.lst-loss: 17.00822 | lists/dev.lst-TER: 67.75 | lists/dev.lst-WER: 81.51 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 552.66
epoch: 31 | nupdates: 23768 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:28 | bch(ms): 782.79 | smp(ms): 1.95 | fwd(ms): 273.34 | crit-fwd(ms): 19.25 | bwd(ms): 450.35 | optim(ms): 56.78 | loss: 21.93827 | train-TER: 80.36 | train-WER: 90.58 | lists/dev.lst-loss: 16.31168 | lists/dev.lst-TER: 56.21 | lists/dev.lst-WER: 75.57 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 555.50
epoch: 32 | nupdates: 24571 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:37 | bch(ms): 793.64 | smp(ms): 1.96 | fwd(ms): 274.63 | crit-fwd(ms): 19.12 | bwd(ms): 459.80 | optim(ms): 56.79 | loss: 21.69832 | train-TER: 77.86 | train-WER: 89.60 | lists/dev.lst-loss: 16.19251 | lists/dev.lst-TER: 65.47 | lists/dev.lst-WER: 80.12 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 547.91
epoch: 33 | nupdates: 25374 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:31 | bch(ms): 786.76 | smp(ms): 2.64 | fwd(ms): 274.14 | crit-fwd(ms): 19.36 | bwd(ms): 453.46 | optim(ms): 56.76 | loss: 21.34769 | train-TER: 73.98 | train-WER: 87.59 | lists/dev.lst-loss: 15.55199 | lists/dev.lst-TER: 60.31 | lists/dev.lst-WER: 76.69 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 552.70
epoch: 34 | nupdates: 26177 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 784.84 | smp(ms): 2.16 | fwd(ms): 274.17 | crit-fwd(ms): 19.18 | bwd(ms): 451.52 | optim(ms): 56.77 | loss: 21.17177 | train-TER: 75.08 | train-WER: 87.76 | lists/dev.lst-loss: 15.24785 | lists/dev.lst-TER: 59.58 | lists/dev.lst-WER: 75.89 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 554.05
epoch: 35 | nupdates: 26980 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 784.74 | smp(ms): 2.58 | fwd(ms): 273.64 | crit-fwd(ms): 19.26 | bwd(ms): 451.90 | optim(ms): 56.77 | loss: 20.88110 | train-TER: 69.61 | train-WER: 85.52 | lists/dev.lst-loss: 14.83493 | lists/dev.lst-TER: 52.46 | lists/dev.lst-WER: 72.18 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 554.12
epoch: 36 | nupdates: 27783 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:34 | bch(ms): 790.71 | smp(ms): 1.78 | fwd(ms): 273.96 | crit-fwd(ms): 19.25 | bwd(ms): 457.61 | optim(ms): 56.78 | loss: 20.67697 | train-TER: 76.11 | train-WER: 88.96 | lists/dev.lst-loss: 14.36052 | lists/dev.lst-TER: 50.20 | lists/dev.lst-WER: 69.90 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 549.94
epoch: 37 | nupdates: 28586 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:36 | bch(ms): 792.97 | smp(ms): 2.05 | fwd(ms): 274.34 | crit-fwd(ms): 19.19 | bwd(ms): 459.50 | optim(ms): 56.77 | loss: 20.50031 | train-TER: 72.02 | train-WER: 85.27 | lists/dev.lst-loss: 14.53550 | lists/dev.lst-TER: 54.76 | lists/dev.lst-WER: 72.71 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 124 | hrs: 96.99 | thrpt(sec/sec): 548.37
epoch: 38 | nupdates: 29389 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 784.79 | smp(ms): 2.06 | fwd(ms): 273.56 | crit-fwd(ms): 19.12 | bwd(ms): 452.03 | optim(ms): 56.77 | loss: 20.33790 | train-TER: 69.36 | train-WER: 84.77 | lists/dev.lst-loss: 14.18825 | lists/dev.lst-TER: 55.86 | lists/dev.lst-WER: 72.45 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.09
epoch: 39 | nupdates: 30192 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 785.46 | smp(ms): 2.07 | fwd(ms): 274.04 | crit-fwd(ms): 19.31 | bwd(ms): 452.18 | optim(ms): 56.77 | loss: 20.00354 | train-TER: 74.23 | train-WER: 87.73 | lists/dev.lst-loss: 13.63189 | lists/dev.lst-TER: 48.65 | lists/dev.lst-WER: 67.96 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.62
epoch: 40 | nupdates: 30995 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:35 | bch(ms): 791.66 | smp(ms): 1.81 | fwd(ms): 274.14 | crit-fwd(ms): 19.29 | bwd(ms): 458.44 | optim(ms): 56.76 | loss: 19.86422 | train-TER: 69.83 | train-WER: 85.29 | lists/dev.lst-loss: 13.38313 | lists/dev.lst-TER: 45.91 | lists/dev.lst-WER: 66.60 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 549.28
epoch: 41 | nupdates: 31798 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:34 | bch(ms): 790.24 | smp(ms): 1.97 | fwd(ms): 274.02 | crit-fwd(ms): 19.27 | bwd(ms): 457.11 | optim(ms): 56.75 | loss: 19.59726 | train-TER: 68.86 | train-WER: 84.74 | lists/dev.lst-loss: 13.19527 | lists/dev.lst-TER: 45.17 | lists/dev.lst-WER: 65.39 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 550.26
epoch: 42 | nupdates: 32601 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:34 | bch(ms): 790.57 | smp(ms): 1.18 | fwd(ms): 274.26 | crit-fwd(ms): 19.16 | bwd(ms): 457.16 | optim(ms): 56.76 | loss: 19.46408 | train-TER: 69.42 | train-WER: 84.54 | lists/dev.lst-loss: 13.05933 | lists/dev.lst-TER: 46.49 | lists/dev.lst-WER: 65.97 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 550.04
epoch: 43 | nupdates: 33404 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 785.25 | smp(ms): 1.94 | fwd(ms): 273.95 | crit-fwd(ms): 19.25 | bwd(ms): 452.16 | optim(ms): 56.75 | loss: 19.29657 | train-TER: 64.67 | train-WER: 81.38 | lists/dev.lst-loss: 13.00825 | lists/dev.lst-TER: 49.36 | lists/dev.lst-WER: 67.68 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 553.76
epoch: 44 | nupdates: 34207 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 784.56 | smp(ms): 1.93 | fwd(ms): 273.74 | crit-fwd(ms): 19.17 | bwd(ms): 451.81 | optim(ms): 56.75 | loss: 19.01853 | train-TER: 65.00 | train-WER: 81.97 | lists/dev.lst-loss: 12.53849 | lists/dev.lst-TER: 42.00 | lists/dev.lst-WER: 62.81 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 554.25
epoch: 45 | nupdates: 35010 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:35 | bch(ms): 791.06 | smp(ms): 1.96 | fwd(ms): 274.07 | crit-fwd(ms): 19.38 | bwd(ms): 457.88 | optim(ms): 56.75 | loss: 18.91372 | train-TER: 64.16 | train-WER: 81.83 | lists/dev.lst-loss: 12.41104 | lists/dev.lst-TER: 42.49 | lists/dev.lst-WER: 62.64 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 549.70
epoch: 46 | nupdates: 35813 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:34 | bch(ms): 790.69 | smp(ms): 2.19 | fwd(ms): 274.37 | crit-fwd(ms): 19.15 | bwd(ms): 457.24 | optim(ms): 56.75 | loss: 18.77318 | train-TER: 59.45 | train-WER: 78.18 | lists/dev.lst-loss: 12.15234 | lists/dev.lst-TER: 42.84 | lists/dev.lst-WER: 62.91 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 549.96
epoch: 47 | nupdates: 36616 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 783.36 | smp(ms): 2.25 | fwd(ms): 273.69 | crit-fwd(ms): 19.21 | bwd(ms): 450.36 | optim(ms): 56.75 | loss: 18.46053 | train-TER: 64.68 | train-WER: 81.65 | lists/dev.lst-loss: 11.97453 | lists/dev.lst-TER: 40.67 | lists/dev.lst-WER: 60.72 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 555.10
epoch: 48 | nupdates: 37419 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:34 | bch(ms): 789.95 | smp(ms): 2.33 | fwd(ms): 273.72 | crit-fwd(ms): 19.24 | bwd(ms): 457.00 | optim(ms): 56.75 | loss: 18.34775 | train-TER: 63.50 | train-WER: 81.37 | lists/dev.lst-loss: 11.93229 | lists/dev.lst-TER: 39.97 | lists/dev.lst-WER: 60.05 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 550.47
epoch: 49 | nupdates: 38222 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:36 | bch(ms): 792.06 | smp(ms): 2.57 | fwd(ms): 274.00 | crit-fwd(ms): 19.21 | bwd(ms): 459.05 | optim(ms): 56.75 | loss: 18.21102 | train-TER: 61.20 | train-WER: 79.64 | lists/dev.lst-loss: 11.75162 | lists/dev.lst-TER: 38.93 | lists/dev.lst-WER: 59.56 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 549.00
epoch: 50 | nupdates: 39025 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:33 | bch(ms): 788.38 | smp(ms): 2.19 | fwd(ms): 273.58 | crit-fwd(ms): 19.19 | bwd(ms): 455.63 | optim(ms): 56.75 | loss: 18.07222 | train-TER: 61.15 | train-WER: 78.43 | lists/dev.lst-loss: 11.64541 | lists/dev.lst-TER: 40.44 | lists/dev.lst-WER: 59.94 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 551.56
epoch: 51 | nupdates: 39828 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 784.11 | smp(ms): 1.97 | fwd(ms): 273.27 | crit-fwd(ms): 19.14 | bwd(ms): 451.73 | optim(ms): 56.74 | loss: 17.90051 | train-TER: 58.90 | train-WER: 77.82 | lists/dev.lst-loss: 11.55510 | lists/dev.lst-TER: 42.42 | lists/dev.lst-WER: 60.66 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.56
epoch: 52 | nupdates: 40631 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 785.04 | smp(ms): 2.48 | fwd(ms): 273.49 | crit-fwd(ms): 19.19 | bwd(ms): 452.41 | optim(ms): 56.74 | loss: 17.77186 | train-TER: 65.13 | train-WER: 82.63 | lists/dev.lst-loss: 11.25446 | lists/dev.lst-TER: 41.19 | lists/dev.lst-WER: 59.41 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.91
epoch: 53 | nupdates: 41434 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:36 | bch(ms): 792.51 | smp(ms): 2.57 | fwd(ms): 273.13 | crit-fwd(ms): 19.25 | bwd(ms): 460.31 | optim(ms): 56.73 | loss: 17.62647 | train-TER: 59.90 | train-WER: 77.41 | lists/dev.lst-loss: 11.24384 | lists/dev.lst-TER: 40.31 | lists/dev.lst-WER: 59.57 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 548.69
epoch: 54 | nupdates: 42237 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 785.48 | smp(ms): 2.64 | fwd(ms): 273.64 | crit-fwd(ms): 19.18 | bwd(ms): 452.66 | optim(ms): 56.73 | loss: 17.61184 | train-TER: 58.94 | train-WER: 77.04 | lists/dev.lst-loss: 10.89010 | lists/dev.lst-TER: 36.05 | lists/dev.lst-WER: 55.75 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.60
epoch: 55 | nupdates: 43040 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:36 | bch(ms): 792.85 | smp(ms): 2.31 | fwd(ms): 274.02 | crit-fwd(ms): 19.25 | bwd(ms): 459.78 | optim(ms): 56.73 | loss: 17.28309 | train-TER: 58.99 | train-WER: 78.09 | lists/dev.lst-loss: 10.72556 | lists/dev.lst-TER: 35.27 | lists/dev.lst-WER: 55.38 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 548.45
epoch: 56 | nupdates: 43843 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:33 | bch(ms): 789.16 | smp(ms): 2.09 | fwd(ms): 273.18 | crit-fwd(ms): 19.14 | bwd(ms): 456.81 | optim(ms): 56.74 | loss: 17.31098 | train-TER: 61.26 | train-WER: 79.14 | lists/dev.lst-loss: 10.85581 | lists/dev.lst-TER: 39.39 | lists/dev.lst-WER: 57.86 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 551.02
epoch: 57 | nupdates: 44646 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 784.38 | smp(ms): 2.06 | fwd(ms): 273.78 | crit-fwd(ms): 19.19 | bwd(ms): 451.35 | optim(ms): 56.74 | loss: 17.18699 | train-TER: 54.94 | train-WER: 74.25 | lists/dev.lst-loss: 10.67680 | lists/dev.lst-TER: 34.52 | lists/dev.lst-WER: 54.91 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.38
epoch: 58 | nupdates: 45449 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:36 | bch(ms): 792.99 | smp(ms): 2.55 | fwd(ms): 274.28 | crit-fwd(ms): 19.21 | bwd(ms): 459.53 | optim(ms): 56.74 | loss: 17.03633 | train-TER: 58.63 | train-WER: 78.12 | lists/dev.lst-loss: 10.63238 | lists/dev.lst-TER: 36.20 | lists/dev.lst-WER: 56.03 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 548.36
epoch: 59 | nupdates: 46252 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 784.71 | smp(ms): 2.38 | fwd(ms): 273.46 | crit-fwd(ms): 19.17 | bwd(ms): 451.92 | optim(ms): 56.74 | loss: 16.83723 | train-TER: 55.33 | train-WER: 74.68 | lists/dev.lst-loss: 10.50423 | lists/dev.lst-TER: 37.70 | lists/dev.lst-WER: 56.00 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 554.14
epoch: 60 | nupdates: 47055 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 784.66 | smp(ms): 2.47 | fwd(ms): 273.40 | crit-fwd(ms): 19.25 | bwd(ms): 452.04 | optim(ms): 56.73 | loss: 16.66030 | train-TER: 56.77 | train-WER: 75.04 | lists/dev.lst-loss: 10.49715 | lists/dev.lst-TER: 36.78 | lists/dev.lst-WER: 55.47 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 554.18
epoch: 61 | nupdates: 47858 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:28 | bch(ms): 782.34 | smp(ms): 2.14 | fwd(ms): 273.39 | crit-fwd(ms): 19.17 | bwd(ms): 449.63 | optim(ms): 56.74 | loss: 16.70617 | train-TER: 61.55 | train-WER: 79.93 | lists/dev.lst-loss: 10.36924 | lists/dev.lst-TER: 35.97 | lists/dev.lst-WER: 55.30 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 555.82
epoch: 62 | nupdates: 48661 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:26 | bch(ms): 780.01 | smp(ms): 1.72 | fwd(ms): 273.22 | crit-fwd(ms): 19.21 | bwd(ms): 447.57 | optim(ms): 56.75 | loss: 16.56252 | train-TER: 59.03 | train-WER: 77.87 | lists/dev.lst-loss: 10.19095 | lists/dev.lst-TER: 35.71 | lists/dev.lst-WER: 54.30 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 557.48
epoch: 63 | nupdates: 49464 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:33 | bch(ms): 788.66 | smp(ms): 2.07 | fwd(ms): 273.75 | crit-fwd(ms): 19.29 | bwd(ms): 455.81 | optim(ms): 56.74 | loss: 16.36471 | train-TER: 58.48 | train-WER: 77.25 | lists/dev.lst-loss: 10.05331 | lists/dev.lst-TER: 34.43 | lists/dev.lst-WER: 53.15 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 551.37
epoch: 64 | nupdates: 50267 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:35 | bch(ms): 791.55 | smp(ms): 2.13 | fwd(ms): 274.24 | crit-fwd(ms): 19.15 | bwd(ms): 458.18 | optim(ms): 56.75 | loss: 16.44484 | train-TER: 55.74 | train-WER: 74.11 | lists/dev.lst-loss: 10.32363 | lists/dev.lst-TER: 38.73 | lists/dev.lst-WER: 56.95 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 549.35
epoch: 65 | nupdates: 51070 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:31 | bch(ms): 785.96 | smp(ms): 2.45 | fwd(ms): 274.35 | crit-fwd(ms): 19.29 | bwd(ms): 452.45 | optim(ms): 56.73 | loss: 16.24395 | train-TER: 55.65 | train-WER: 73.78 | lists/dev.lst-loss: 9.86370 | lists/dev.lst-TER: 32.31 | lists/dev.lst-WER: 51.45 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 553.26
epoch: 66 | nupdates: 51873 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:35 | bch(ms): 791.23 | smp(ms): 2.20 | fwd(ms): 273.92 | crit-fwd(ms): 19.12 | bwd(ms): 458.00 | optim(ms): 56.75 | loss: 16.09748 | train-TER: 55.87 | train-WER: 74.33 | lists/dev.lst-loss: 10.02467 | lists/dev.lst-TER: 36.44 | lists/dev.lst-WER: 54.78 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 549.58
epoch: 67 | nupdates: 52676 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 784.45 | smp(ms): 2.31 | fwd(ms): 273.10 | crit-fwd(ms): 19.18 | bwd(ms): 451.90 | optim(ms): 56.73 | loss: 16.18764 | train-TER: 53.86 | train-WER: 73.07 | lists/dev.lst-loss: 9.82866 | lists/dev.lst-TER: 35.16 | lists/dev.lst-WER: 53.60 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.33
epoch: 68 | nupdates: 53479 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 784.80 | smp(ms): 1.79 | fwd(ms): 273.71 | crit-fwd(ms): 19.18 | bwd(ms): 451.90 | optim(ms): 56.74 | loss: 16.01650 | train-TER: 53.16 | train-WER: 72.55 | lists/dev.lst-loss: 10.01695 | lists/dev.lst-TER: 35.48 | lists/dev.lst-WER: 53.61 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.08
epoch: 69 | nupdates: 54282 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:28 | bch(ms): 782.74 | smp(ms): 1.33 | fwd(ms): 273.76 | crit-fwd(ms): 19.18 | bwd(ms): 449.85 | optim(ms): 56.75 | loss: 15.85021 | train-TER: 55.06 | train-WER: 75.14 | lists/dev.lst-loss: 9.58773 | lists/dev.lst-TER: 32.90 | lists/dev.lst-WER: 51.14 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 555.54
epoch: 70 | nupdates: 55085 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:35 | bch(ms): 791.00 | smp(ms): 2.61 | fwd(ms): 274.02 | crit-fwd(ms): 19.27 | bwd(ms): 457.76 | optim(ms): 56.72 | loss: 15.77210 | train-TER: 52.83 | train-WER: 72.42 | lists/dev.lst-loss: 9.45364 | lists/dev.lst-TER: 29.94 | lists/dev.lst-WER: 48.76 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 549.73
epoch: 71 | nupdates: 55888 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:33 | bch(ms): 789.40 | smp(ms): 1.95 | fwd(ms): 273.64 | crit-fwd(ms): 19.16 | bwd(ms): 456.77 | optim(ms): 56.74 | loss: 15.73174 | train-TER: 56.39 | train-WER: 75.61 | lists/dev.lst-loss: 9.51342 | lists/dev.lst-TER: 33.31 | lists/dev.lst-WER: 51.20 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 550.85
epoch: 72 | nupdates: 56691 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 783.34 | smp(ms): 2.16 | fwd(ms): 273.48 | crit-fwd(ms): 19.14 | bwd(ms): 450.73 | optim(ms): 56.74 | loss: 15.69155 | train-TER: 49.76 | train-WER: 68.47 | lists/dev.lst-loss: 9.28585 | lists/dev.lst-TER: 31.79 | lists/dev.lst-WER: 49.74 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 555.11
epoch: 73 | nupdates: 57494 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:28 | bch(ms): 782.28 | smp(ms): 2.04 | fwd(ms): 273.83 | crit-fwd(ms): 19.20 | bwd(ms): 449.41 | optim(ms): 56.74 | loss: 15.66275 | train-TER: 53.83 | train-WER: 73.07 | lists/dev.lst-loss: 9.47034 | lists/dev.lst-TER: 33.58 | lists/dev.lst-WER: 51.51 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 555.86
epoch: 74 | nupdates: 58297 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:28 | bch(ms): 782.80 | smp(ms): 2.24 | fwd(ms): 273.50 | crit-fwd(ms): 19.15 | bwd(ms): 450.18 | optim(ms): 56.74 | loss: 15.60274 | train-TER: 51.76 | train-WER: 71.28 | lists/dev.lst-loss: 9.29017 | lists/dev.lst-TER: 31.26 | lists/dev.lst-WER: 49.41 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 555.49
epoch: 75 | nupdates: 59100 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:28 | bch(ms): 782.43 | smp(ms): 2.39 | fwd(ms): 273.23 | crit-fwd(ms): 19.22 | bwd(ms): 450.14 | optim(ms): 56.74 | loss: 15.42089 | train-TER: 51.87 | train-WER: 71.45 | lists/dev.lst-loss: 9.14141 | lists/dev.lst-TER: 29.49 | lists/dev.lst-WER: 48.15 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 555.76
epoch: 76 | nupdates: 59903 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:34 | bch(ms): 789.76 | smp(ms): 2.30 | fwd(ms): 273.42 | crit-fwd(ms): 19.22 | bwd(ms): 456.95 | optim(ms): 56.75 | loss: 15.37596 | train-TER: 55.92 | train-WER: 75.21 | lists/dev.lst-loss: 9.37688 | lists/dev.lst-TER: 32.30 | lists/dev.lst-WER: 50.36 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 550.60
epoch: 77 | nupdates: 60706 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:26 | bch(ms): 780.58 | smp(ms): 1.72 | fwd(ms): 273.35 | crit-fwd(ms): 19.17 | bwd(ms): 448.00 | optim(ms): 56.76 | loss: 15.37757 | train-TER: 53.11 | train-WER: 71.89 | lists/dev.lst-loss: 9.04403 | lists/dev.lst-TER: 28.35 | lists/dev.lst-WER: 46.62 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 557.08
epoch: 78 | nupdates: 61509 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:35 | bch(ms): 791.51 | smp(ms): 2.21 | fwd(ms): 274.19 | crit-fwd(ms): 19.22 | bwd(ms): 458.03 | optim(ms): 56.74 | loss: 15.24937 | train-TER: 55.19 | train-WER: 74.29 | lists/dev.lst-loss: 8.99970 | lists/dev.lst-TER: 29.46 | lists/dev.lst-WER: 47.50 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 549.38
epoch: 79 | nupdates: 62312 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 785.51 | smp(ms): 2.28 | fwd(ms): 273.38 | crit-fwd(ms): 19.17 | bwd(ms): 452.84 | optim(ms): 56.73 | loss: 15.20477 | train-TER: 55.10 | train-WER: 73.88 | lists/dev.lst-loss: 8.84125 | lists/dev.lst-TER: 27.50 | lists/dev.lst-WER: 46.03 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 553.58
epoch: 80 | nupdates: 63115 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:33 | bch(ms): 789.28 | smp(ms): 1.87 | fwd(ms): 273.47 | crit-fwd(ms): 19.17 | bwd(ms): 456.61 | optim(ms): 56.74 | loss: 15.10373 | train-TER: 50.03 | train-WER: 70.72 | lists/dev.lst-loss: 8.86748 | lists/dev.lst-TER: 28.79 | lists/dev.lst-WER: 46.85 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 550.94
epoch: 81 | nupdates: 63918 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 784.23 | smp(ms): 2.08 | fwd(ms): 273.40 | crit-fwd(ms): 19.19 | bwd(ms): 451.58 | optim(ms): 56.74 | loss: 14.94535 | train-TER: 51.41 | train-WER: 71.14 | lists/dev.lst-loss: 8.75686 | lists/dev.lst-TER: 27.75 | lists/dev.lst-WER: 45.92 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.48
epoch: 82 | nupdates: 64721 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:35 | bch(ms): 791.23 | smp(ms): 2.25 | fwd(ms): 274.15 | crit-fwd(ms): 19.20 | bwd(ms): 458.03 | optim(ms): 56.74 | loss: 14.99663 | train-TER: 49.27 | train-WER: 68.87 | lists/dev.lst-loss: 8.70356 | lists/dev.lst-TER: 26.10 | lists/dev.lst-WER: 44.93 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 549.57
epoch: 83 | nupdates: 65524 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:35 | bch(ms): 791.52 | smp(ms): 2.16 | fwd(ms): 274.01 | crit-fwd(ms): 19.16 | bwd(ms): 458.47 | optim(ms): 56.74 | loss: 14.85269 | train-TER: 51.67 | train-WER: 70.84 | lists/dev.lst-loss: 8.69007 | lists/dev.lst-TER: 27.74 | lists/dev.lst-WER: 46.04 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 549.37
epoch: 84 | nupdates: 66327 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 784.51 | smp(ms): 2.12 | fwd(ms): 273.50 | crit-fwd(ms): 19.16 | bwd(ms): 451.81 | optim(ms): 56.73 | loss: 14.89355 | train-TER: 53.23 | train-WER: 72.25 | lists/dev.lst-loss: 8.77165 | lists/dev.lst-TER: 28.76 | lists/dev.lst-WER: 46.13 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.29
epoch: 85 | nupdates: 67130 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 784.66 | smp(ms): 2.30 | fwd(ms): 273.40 | crit-fwd(ms): 19.23 | bwd(ms): 452.15 | optim(ms): 56.73 | loss: 14.59037 | train-TER: 47.44 | train-WER: 66.91 | lists/dev.lst-loss: 8.53470 | lists/dev.lst-TER: 26.44 | lists/dev.lst-WER: 44.67 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.18
epoch: 86 | nupdates: 67933 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:33 | bch(ms): 789.47 | smp(ms): 1.63 | fwd(ms): 273.40 | crit-fwd(ms): 19.18 | bwd(ms): 456.92 | optim(ms): 56.73 | loss: 14.69502 | train-TER: 52.98 | train-WER: 71.41 | lists/dev.lst-loss: 8.43605 | lists/dev.lst-TER: 26.53 | lists/dev.lst-WER: 44.68 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 550.80
epoch: 87 | nupdates: 68736 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 783.84 | smp(ms): 2.08 | fwd(ms): 273.60 | crit-fwd(ms): 19.16 | bwd(ms): 451.20 | optim(ms): 56.73 | loss: 14.56231 | train-TER: 49.18 | train-WER: 68.31 | lists/dev.lst-loss: 8.50964 | lists/dev.lst-TER: 26.13 | lists/dev.lst-WER: 44.57 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 554.75
epoch: 88 | nupdates: 69539 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:34 | bch(ms): 789.75 | smp(ms): 2.00 | fwd(ms): 273.93 | crit-fwd(ms): 19.23 | bwd(ms): 456.74 | optim(ms): 56.74 | loss: 14.55271 | train-TER: 46.94 | train-WER: 65.66 | lists/dev.lst-loss: 8.72622 | lists/dev.lst-TER: 28.99 | lists/dev.lst-WER: 46.37 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 550.60
epoch: 89 | nupdates: 70342 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:31 | bch(ms): 786.68 | smp(ms): 1.86 | fwd(ms): 274.64 | crit-fwd(ms): 19.27 | bwd(ms): 452.98 | optim(ms): 56.74 | loss: 14.37543 | train-TER: 47.30 | train-WER: 67.05 | lists/dev.lst-loss: 8.33864 | lists/dev.lst-TER: 25.79 | lists/dev.lst-WER: 43.47 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 552.76
epoch: 90 | nupdates: 71145 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:34 | bch(ms): 790.27 | smp(ms): 2.10 | fwd(ms): 274.17 | crit-fwd(ms): 19.14 | bwd(ms): 456.81 | optim(ms): 56.74 | loss: 14.36725 | train-TER: 48.65 | train-WER: 67.34 | lists/dev.lst-loss: 8.45145 | lists/dev.lst-TER: 27.36 | lists/dev.lst-WER: 44.86 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 550.24
epoch: 91 | nupdates: 71948 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 785.33 | smp(ms): 2.11 | fwd(ms): 273.70 | crit-fwd(ms): 19.15 | bwd(ms): 452.43 | optim(ms): 56.74 | loss: 14.37755 | train-TER: 50.28 | train-WER: 70.74 | lists/dev.lst-loss: 8.38597 | lists/dev.lst-TER: 27.26 | lists/dev.lst-WER: 44.51 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 553.71
epoch: 92 | nupdates: 72751 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:28 | bch(ms): 783.11 | smp(ms): 2.09 | fwd(ms): 273.08 | crit-fwd(ms): 19.23 | bwd(ms): 450.64 | optim(ms): 56.74 | loss: 14.25795 | train-TER: 52.53 | train-WER: 70.81 | lists/dev.lst-loss: 8.17078 | lists/dev.lst-TER: 25.17 | lists/dev.lst-WER: 43.20 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 555.27
epoch: 93 | nupdates: 73554 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:35 | bch(ms): 791.14 | smp(ms): 2.57 | fwd(ms): 273.72 | crit-fwd(ms): 19.22 | bwd(ms): 458.36 | optim(ms): 56.75 | loss: 14.10092 | train-TER: 47.50 | train-WER: 67.54 | lists/dev.lst-loss: 8.28106 | lists/dev.lst-TER: 25.78 | lists/dev.lst-WER: 42.86 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 549.64
epoch: 94 | nupdates: 74357 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:34 | bch(ms): 790.49 | smp(ms): 2.18 | fwd(ms): 273.98 | crit-fwd(ms): 19.15 | bwd(ms): 457.33 | optim(ms): 56.74 | loss: 14.00633 | train-TER: 47.22 | train-WER: 66.16 | lists/dev.lst-loss: 8.15311 | lists/dev.lst-TER: 24.19 | lists/dev.lst-WER: 41.99 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 550.09
epoch: 95 | nupdates: 75160 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:34 | bch(ms): 789.95 | smp(ms): 2.43 | fwd(ms): 274.20 | crit-fwd(ms): 19.17 | bwd(ms): 456.63 | optim(ms): 56.74 | loss: 14.09231 | train-TER: 47.63 | train-WER: 66.59 | lists/dev.lst-loss: 8.06845 | lists/dev.lst-TER: 24.24 | lists/dev.lst-WER: 41.89 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 550.47
epoch: 96 | nupdates: 75963 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:35 | bch(ms): 791.59 | smp(ms): 2.36 | fwd(ms): 273.72 | crit-fwd(ms): 19.19 | bwd(ms): 458.70 | optim(ms): 56.73 | loss: 13.95021 | train-TER: 44.48 | train-WER: 65.20 | lists/dev.lst-loss: 8.37734 | lists/dev.lst-TER: 27.58 | lists/dev.lst-WER: 44.16 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 549.33
epoch: 97 | nupdates: 76766 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 783.70 | smp(ms): 2.29 | fwd(ms): 273.40 | crit-fwd(ms): 19.20 | bwd(ms): 451.09 | optim(ms): 56.72 | loss: 13.93125 | train-TER: 48.51 | train-WER: 68.51 | lists/dev.lst-loss: 8.00367 | lists/dev.lst-TER: 24.25 | lists/dev.lst-WER: 41.68 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 554.86
epoch: 98 | nupdates: 77569 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:33 | bch(ms): 789.00 | smp(ms): 2.35 | fwd(ms): 273.51 | crit-fwd(ms): 19.27 | bwd(ms): 456.35 | optim(ms): 56.75 | loss: 13.87519 | train-TER: 45.67 | train-WER: 65.45 | lists/dev.lst-loss: 8.19040 | lists/dev.lst-TER: 25.66 | lists/dev.lst-WER: 43.03 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 551.13
epoch: 99 | nupdates: 78372 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:31 | bch(ms): 787.02 | smp(ms): 2.08 | fwd(ms): 273.90 | crit-fwd(ms): 19.21 | bwd(ms): 454.01 | optim(ms): 56.72 | loss: 13.91597 | train-TER: 50.67 | train-WER: 69.53 | lists/dev.lst-loss: 8.02425 | lists/dev.lst-TER: 24.43 | lists/dev.lst-WER: 41.57 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 552.52
epoch: 100 | nupdates: 79175 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:34 | bch(ms): 790.53 | smp(ms): 2.03 | fwd(ms): 273.96 | crit-fwd(ms): 19.14 | bwd(ms): 457.25 | optim(ms): 56.73 | loss: 13.82145 | train-TER: 43.45 | train-WER: 63.30 | lists/dev.lst-loss: 7.92053 | lists/dev.lst-TER: 24.06 | lists/dev.lst-WER: 41.35 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 550.07
epoch: 101 | nupdates: 79978 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:34 | bch(ms): 790.05 | smp(ms): 2.14 | fwd(ms): 273.45 | crit-fwd(ms): 19.14 | bwd(ms): 457.44 | optim(ms): 56.72 | loss: 13.63767 | train-TER: 47.09 | train-WER: 67.14 | lists/dev.lst-loss: 7.95350 | lists/dev.lst-TER: 23.86 | lists/dev.lst-WER: 40.98 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 550.40
epoch: 102 | nupdates: 80781 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:33 | bch(ms): 789.28 | smp(ms): 2.04 | fwd(ms): 274.24 | crit-fwd(ms): 19.13 | bwd(ms): 455.94 | optim(ms): 56.75 | loss: 13.69892 | train-TER: 46.31 | train-WER: 65.37 | lists/dev.lst-loss: 7.78659 | lists/dev.lst-TER: 24.00 | lists/dev.lst-WER: 40.78 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 124 | hrs: 96.99 | thrpt(sec/sec): 550.94
epoch: 103 | nupdates: 81584 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:33 | bch(ms): 789.21 | smp(ms): 1.74 | fwd(ms): 273.34 | crit-fwd(ms): 19.21 | bwd(ms): 456.73 | optim(ms): 56.74 | loss: 13.60302 | train-TER: 46.56 | train-WER: 65.52 | lists/dev.lst-loss: 7.79223 | lists/dev.lst-TER: 22.69 | lists/dev.lst-WER: 40.29 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 550.99
epoch: 104 | nupdates: 82387 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:33 | bch(ms): 789.05 | smp(ms): 2.36 | fwd(ms): 273.66 | crit-fwd(ms): 19.25 | bwd(ms): 456.24 | optim(ms): 56.73 | loss: 13.56559 | train-TER: 42.78 | train-WER: 62.94 | lists/dev.lst-loss: 7.81902 | lists/dev.lst-TER: 24.33 | lists/dev.lst-WER: 41.06 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 551.09
epoch: 105 | nupdates: 83190 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:28 | bch(ms): 783.12 | smp(ms): 1.35 | fwd(ms): 273.98 | crit-fwd(ms): 19.14 | bwd(ms): 450.07 | optim(ms): 56.73 | loss: 13.66669 | train-TER: 43.62 | train-WER: 62.56 | lists/dev.lst-loss: 7.81320 | lists/dev.lst-TER: 23.56 | lists/dev.lst-WER: 40.65 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 555.26
epoch: 106 | nupdates: 83993 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 783.90 | smp(ms): 2.41 | fwd(ms): 273.58 | crit-fwd(ms): 19.20 | bwd(ms): 451.21 | optim(ms): 56.73 | loss: 13.57221 | train-TER: 44.26 | train-WER: 63.04 | lists/dev.lst-loss: 8.00655 | lists/dev.lst-TER: 26.02 | lists/dev.lst-WER: 42.46 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.71
epoch: 107 | nupdates: 84796 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:28 | bch(ms): 782.87 | smp(ms): 1.86 | fwd(ms): 273.30 | crit-fwd(ms): 19.20 | bwd(ms): 450.44 | optim(ms): 56.74 | loss: 13.48876 | train-TER: 47.13 | train-WER: 66.36 | lists/dev.lst-loss: 7.79121 | lists/dev.lst-TER: 22.79 | lists/dev.lst-WER: 39.70 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 555.45
epoch: 108 | nupdates: 85599 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:32 | bch(ms): 787.84 | smp(ms): 1.90 | fwd(ms): 273.69 | crit-fwd(ms): 19.18 | bwd(ms): 455.08 | optim(ms): 56.77 | loss: 13.54249 | train-TER: 46.66 | train-WER: 66.07 | lists/dev.lst-loss: 7.68549 | lists/dev.lst-TER: 22.07 | lists/dev.lst-WER: 39.26 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 551.94
epoch: 109 | nupdates: 86402 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:36 | bch(ms): 793.06 | smp(ms): 2.42 | fwd(ms): 274.21 | crit-fwd(ms): 19.17 | bwd(ms): 459.69 | optim(ms): 56.73 | loss: 13.33789 | train-TER: 43.39 | train-WER: 63.17 | lists/dev.lst-loss: 7.70669 | lists/dev.lst-TER: 23.30 | lists/dev.lst-WER: 40.04 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 548.31
epoch: 110 | nupdates: 87205 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:28 | bch(ms): 782.84 | smp(ms): 1.43 | fwd(ms): 273.25 | crit-fwd(ms): 19.16 | bwd(ms): 450.30 | optim(ms): 56.75 | loss: 13.21468 | train-TER: 41.09 | train-WER: 60.36 | lists/dev.lst-loss: 7.62218 | lists/dev.lst-TER: 23.13 | lists/dev.lst-WER: 39.75 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 555.47
epoch: 111 | nupdates: 88008 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:28 | bch(ms): 782.91 | smp(ms): 2.36 | fwd(ms): 273.91 | crit-fwd(ms): 19.26 | bwd(ms): 449.90 | optim(ms): 56.74 | loss: 13.20864 | train-TER: 43.75 | train-WER: 63.70 | lists/dev.lst-loss: 7.61422 | lists/dev.lst-TER: 23.23 | lists/dev.lst-WER: 39.40 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 555.42
epoch: 112 | nupdates: 88811 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 783.67 | smp(ms): 2.18 | fwd(ms): 273.41 | crit-fwd(ms): 19.17 | bwd(ms): 451.09 | optim(ms): 56.74 | loss: 13.28425 | train-TER: 43.88 | train-WER: 62.72 | lists/dev.lst-loss: 7.70526 | lists/dev.lst-TER: 24.32 | lists/dev.lst-WER: 40.23 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 554.88
epoch: 113 | nupdates: 89614 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 784.26 | smp(ms): 2.05 | fwd(ms): 273.57 | crit-fwd(ms): 19.15 | bwd(ms): 451.46 | optim(ms): 56.74 | loss: 13.14738 | train-TER: 42.48 | train-WER: 61.46 | lists/dev.lst-loss: 7.61179 | lists/dev.lst-TER: 23.86 | lists/dev.lst-WER: 40.09 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.46
epoch: 114 | nupdates: 90417 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:31 | bch(ms): 787.04 | smp(ms): 2.42 | fwd(ms): 274.15 | crit-fwd(ms): 19.14 | bwd(ms): 453.54 | optim(ms): 56.74 | loss: 13.13681 | train-TER: 43.27 | train-WER: 62.64 | lists/dev.lst-loss: 7.50096 | lists/dev.lst-TER: 22.68 | lists/dev.lst-WER: 39.30 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 552.50
epoch: 115 | nupdates: 91220 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:28 | bch(ms): 782.95 | smp(ms): 2.27 | fwd(ms): 273.70 | crit-fwd(ms): 19.20 | bwd(ms): 450.03 | optim(ms): 56.74 | loss: 13.09075 | train-TER: 43.63 | train-WER: 63.97 | lists/dev.lst-loss: 7.70999 | lists/dev.lst-TER: 23.64 | lists/dev.lst-WER: 39.94 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 555.39
epoch: 116 | nupdates: 92023 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 785.40 | smp(ms): 2.13 | fwd(ms): 273.71 | crit-fwd(ms): 19.21 | bwd(ms): 452.56 | optim(ms): 56.72 | loss: 12.97437 | train-TER: 44.92 | train-WER: 63.86 | lists/dev.lst-loss: 7.42133 | lists/dev.lst-TER: 21.86 | lists/dev.lst-WER: 38.23 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.66
epoch: 117 | nupdates: 92826 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:37 | bch(ms): 793.64 | smp(ms): 2.30 | fwd(ms): 274.22 | crit-fwd(ms): 19.11 | bwd(ms): 460.23 | optim(ms): 56.73 | loss: 13.00274 | train-TER: 41.70 | train-WER: 61.52 | lists/dev.lst-loss: 7.68196 | lists/dev.lst-TER: 23.85 | lists/dev.lst-WER: 39.78 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 547.91
epoch: 118 | nupdates: 93629 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:32 | bch(ms): 787.10 | smp(ms): 2.51 | fwd(ms): 274.25 | crit-fwd(ms): 19.32 | bwd(ms): 453.74 | optim(ms): 56.73 | loss: 12.98837 | train-TER: 45.47 | train-WER: 64.44 | lists/dev.lst-loss: 7.50205 | lists/dev.lst-TER: 22.92 | lists/dev.lst-WER: 38.76 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 552.46
epoch: 119 | nupdates: 94432 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:32 | bch(ms): 787.66 | smp(ms): 2.19 | fwd(ms): 274.17 | crit-fwd(ms): 19.15 | bwd(ms): 454.37 | optim(ms): 56.73 | loss: 12.92465 | train-TER: 44.40 | train-WER: 63.80 | lists/dev.lst-loss: 7.48922 | lists/dev.lst-TER: 23.32 | lists/dev.lst-WER: 39.30 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 552.07
epoch: 120 | nupdates: 95235 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:31 | bch(ms): 785.93 | smp(ms): 2.26 | fwd(ms): 274.15 | crit-fwd(ms): 19.27 | bwd(ms): 452.64 | optim(ms): 56.73 | loss: 12.94680 | train-TER: 45.15 | train-WER: 65.39 | lists/dev.lst-loss: 7.45069 | lists/dev.lst-TER: 22.13 | lists/dev.lst-WER: 38.29 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 553.28
epoch: 121 | nupdates: 96038 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 784.05 | smp(ms): 2.43 | fwd(ms): 273.39 | crit-fwd(ms): 19.27 | bwd(ms): 451.44 | optim(ms): 56.75 | loss: 13.00947 | train-TER: 44.64 | train-WER: 63.10 | lists/dev.lst-loss: 7.34055 | lists/dev.lst-TER: 21.55 | lists/dev.lst-WER: 37.97 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.61
epoch: 122 | nupdates: 96841 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:34 | bch(ms): 789.85 | smp(ms): 2.52 | fwd(ms): 274.22 | crit-fwd(ms): 19.25 | bwd(ms): 456.45 | optim(ms): 56.75 | loss: 12.82009 | train-TER: 44.87 | train-WER: 64.09 | lists/dev.lst-loss: 7.52851 | lists/dev.lst-TER: 23.80 | lists/dev.lst-WER: 39.34 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 550.54
epoch: 123 | nupdates: 97644 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 784.22 | smp(ms): 1.94 | fwd(ms): 274.15 | crit-fwd(ms): 19.23 | bwd(ms): 450.90 | optim(ms): 56.75 | loss: 12.85941 | train-TER: 45.38 | train-WER: 65.61 | lists/dev.lst-loss: 7.59355 | lists/dev.lst-TER: 24.00 | lists/dev.lst-WER: 40.02 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.49
epoch: 124 | nupdates: 98447 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 784.15 | smp(ms): 2.40 | fwd(ms): 273.65 | crit-fwd(ms): 19.25 | bwd(ms): 451.41 | optim(ms): 56.74 | loss: 12.91564 | train-TER: 43.12 | train-WER: 62.32 | lists/dev.lst-loss: 7.25435 | lists/dev.lst-TER: 21.42 | lists/dev.lst-WER: 37.61 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 554.54
epoch: 125 | nupdates: 99250 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:34 | bch(ms): 790.18 | smp(ms): 2.52 | fwd(ms): 274.16 | crit-fwd(ms): 19.18 | bwd(ms): 456.87 | optim(ms): 56.74 | loss: 12.66314 | train-TER: 40.11 | train-WER: 58.87 | lists/dev.lst-loss: 7.26326 | lists/dev.lst-TER: 20.90 | lists/dev.lst-WER: 37.10 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 550.30
epoch: 126 | nupdates: 100053 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:35 | bch(ms): 790.83 | smp(ms): 2.14 | fwd(ms): 274.36 | crit-fwd(ms): 19.24 | bwd(ms): 457.34 | optim(ms): 56.74 | loss: 12.72953 | train-TER: 42.29 | train-WER: 60.87 | lists/dev.lst-loss: 7.35928 | lists/dev.lst-TER: 22.26 | lists/dev.lst-WER: 38.17 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 549.86
epoch: 127 | nupdates: 100856 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:27 | bch(ms): 781.74 | smp(ms): 2.51 | fwd(ms): 272.84 | crit-fwd(ms): 19.26 | bwd(ms): 449.77 | optim(ms): 56.74 | loss: 12.72491 | train-TER: 43.70 | train-WER: 62.00 | lists/dev.lst-loss: 7.38670 | lists/dev.lst-TER: 21.52 | lists/dev.lst-WER: 37.71 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 556.24
epoch: 128 | nupdates: 101659 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 784.14 | smp(ms): 2.16 | fwd(ms): 273.19 | crit-fwd(ms): 19.15 | bwd(ms): 451.72 | optim(ms): 56.73 | loss: 12.67162 | train-TER: 40.18 | train-WER: 60.07 | lists/dev.lst-loss: 7.44695 | lists/dev.lst-TER: 22.94 | lists/dev.lst-WER: 38.62 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 124 | hrs: 96.99 | thrpt(sec/sec): 554.55
epoch: 129 | nupdates: 102462 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:28 | bch(ms): 782.21 | smp(ms): 2.48 | fwd(ms): 273.69 | crit-fwd(ms): 19.25 | bwd(ms): 449.37 | optim(ms): 56.74 | loss: 12.55686 | train-TER: 37.93 | train-WER: 57.16 | lists/dev.lst-loss: 7.30990 | lists/dev.lst-TER: 21.98 | lists/dev.lst-WER: 37.51 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 555.92
epoch: 130 | nupdates: 103265 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:28 | bch(ms): 782.44 | smp(ms): 1.92 | fwd(ms): 273.36 | crit-fwd(ms): 19.14 | bwd(ms): 449.79 | optim(ms): 56.74 | loss: 12.42848 | train-TER: 38.45 | train-WER: 57.32 | lists/dev.lst-loss: 7.43615 | lists/dev.lst-TER: 22.21 | lists/dev.lst-WER: 38.00 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 555.75
epoch: 131 | nupdates: 104068 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 785.71 | smp(ms): 2.43 | fwd(ms): 274.05 | crit-fwd(ms): 19.17 | bwd(ms): 452.51 | optim(ms): 56.72 | loss: 12.61028 | train-TER: 39.27 | train-WER: 57.74 | lists/dev.lst-loss: 7.22433 | lists/dev.lst-TER: 21.13 | lists/dev.lst-WER: 36.93 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.44
epoch: 132 | nupdates: 104871 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:33 | bch(ms): 789.37 | smp(ms): 2.45 | fwd(ms): 273.49 | crit-fwd(ms): 19.18 | bwd(ms): 456.64 | optim(ms): 56.74 | loss: 12.63936 | train-TER: 42.15 | train-WER: 61.69 | lists/dev.lst-loss: 7.50304 | lists/dev.lst-TER: 23.46 | lists/dev.lst-WER: 38.84 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 550.87
epoch: 133 | nupdates: 105674 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 784.77 | smp(ms): 2.23 | fwd(ms): 273.64 | crit-fwd(ms): 19.21 | bwd(ms): 452.03 | optim(ms): 56.73 | loss: 12.30108 | train-TER: 43.85 | train-WER: 64.23 | lists/dev.lst-loss: 7.07055 | lists/dev.lst-TER: 20.04 | lists/dev.lst-WER: 36.24 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 554.10
epoch: 134 | nupdates: 106477 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:34 | bch(ms): 790.20 | smp(ms): 2.65 | fwd(ms): 273.45 | crit-fwd(ms): 19.24 | bwd(ms): 457.61 | optim(ms): 56.74 | loss: 12.38365 | train-TER: 39.44 | train-WER: 59.63 | lists/dev.lst-loss: 7.21884 | lists/dev.lst-TER: 21.13 | lists/dev.lst-WER: 36.90 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 550.29
epoch: 135 | nupdates: 107280 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 785.10 | smp(ms): 2.18 | fwd(ms): 273.95 | crit-fwd(ms): 19.16 | bwd(ms): 452.10 | optim(ms): 56.73 | loss: 12.22458 | train-TER: 41.44 | train-WER: 59.61 | lists/dev.lst-loss: 7.43682 | lists/dev.lst-TER: 22.31 | lists/dev.lst-WER: 37.95 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 553.87
epoch: 136 | nupdates: 108083 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 783.67 | smp(ms): 2.33 | fwd(ms): 273.62 | crit-fwd(ms): 19.17 | bwd(ms): 450.86 | optim(ms): 56.73 | loss: 12.39751 | train-TER: 39.37 | train-WER: 59.10 | lists/dev.lst-loss: 7.27914 | lists/dev.lst-TER: 22.23 | lists/dev.lst-WER: 37.62 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 554.88
epoch: 137 | nupdates: 108886 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 784.33 | smp(ms): 2.48 | fwd(ms): 273.78 | crit-fwd(ms): 19.18 | bwd(ms): 451.39 | optim(ms): 56.73 | loss: 12.36563 | train-TER: 37.64 | train-WER: 56.25 | lists/dev.lst-loss: 7.38748 | lists/dev.lst-TER: 22.44 | lists/dev.lst-WER: 37.95 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.41
epoch: 138 | nupdates: 109689 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:28 | bch(ms): 783.17 | smp(ms): 2.20 | fwd(ms): 273.48 | crit-fwd(ms): 19.27 | bwd(ms): 450.65 | optim(ms): 56.74 | loss: 12.21596 | train-TER: 42.95 | train-WER: 62.22 | lists/dev.lst-loss: 7.07706 | lists/dev.lst-TER: 20.14 | lists/dev.lst-WER: 36.12 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 555.23
epoch: 139 | nupdates: 110492 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:32 | bch(ms): 788.23 | smp(ms): 1.83 | fwd(ms): 273.46 | crit-fwd(ms): 19.23 | bwd(ms): 455.57 | optim(ms): 56.75 | loss: 12.22821 | train-TER: 38.89 | train-WER: 58.66 | lists/dev.lst-loss: 7.46277 | lists/dev.lst-TER: 23.90 | lists/dev.lst-WER: 39.20 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 551.67
epoch: 140 | nupdates: 111295 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 784.71 | smp(ms): 2.74 | fwd(ms): 273.46 | crit-fwd(ms): 19.25 | bwd(ms): 452.14 | optim(ms): 56.74 | loss: 12.25955 | train-TER: 41.29 | train-WER: 60.62 | lists/dev.lst-loss: 6.91378 | lists/dev.lst-TER: 19.61 | lists/dev.lst-WER: 35.41 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 554.14
epoch: 141 | nupdates: 112098 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:35 | bch(ms): 790.84 | smp(ms): 2.19 | fwd(ms): 274.21 | crit-fwd(ms): 19.22 | bwd(ms): 457.50 | optim(ms): 56.74 | loss: 12.13062 | train-TER: 39.93 | train-WER: 58.14 | lists/dev.lst-loss: 7.02651 | lists/dev.lst-TER: 19.48 | lists/dev.lst-WER: 35.26 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 549.85
epoch: 142 | nupdates: 112901 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:34 | bch(ms): 790.06 | smp(ms): 2.11 | fwd(ms): 273.52 | crit-fwd(ms): 19.23 | bwd(ms): 457.41 | optim(ms): 56.73 | loss: 12.27384 | train-TER: 43.59 | train-WER: 63.22 | lists/dev.lst-loss: 6.97346 | lists/dev.lst-TER: 20.10 | lists/dev.lst-WER: 35.71 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 550.39
epoch: 143 | nupdates: 113704 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:31 | bch(ms): 786.92 | smp(ms): 2.05 | fwd(ms): 273.83 | crit-fwd(ms): 19.25 | bwd(ms): 453.98 | optim(ms): 56.73 | loss: 11.92488 | train-TER: 40.77 | train-WER: 60.11 | lists/dev.lst-loss: 6.92973 | lists/dev.lst-TER: 19.52 | lists/dev.lst-WER: 35.12 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 552.59
epoch: 144 | nupdates: 114507 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:35 | bch(ms): 791.09 | smp(ms): 2.20 | fwd(ms): 274.29 | crit-fwd(ms): 19.23 | bwd(ms): 457.71 | optim(ms): 56.74 | loss: 11.98494 | train-TER: 39.02 | train-WER: 58.07 | lists/dev.lst-loss: 7.18368 | lists/dev.lst-TER: 21.92 | lists/dev.lst-WER: 37.10 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 549.67
epoch: 145 | nupdates: 115310 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 785.38 | smp(ms): 2.43 | fwd(ms): 273.84 | crit-fwd(ms): 19.17 | bwd(ms): 452.41 | optim(ms): 56.72 | loss: 12.13365 | train-TER: 35.18 | train-WER: 54.01 | lists/dev.lst-loss: 6.96346 | lists/dev.lst-TER: 19.51 | lists/dev.lst-WER: 35.15 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.67
epoch: 146 | nupdates: 116113 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:31 | bch(ms): 786.13 | smp(ms): 1.96 | fwd(ms): 273.95 | crit-fwd(ms): 19.24 | bwd(ms): 452.97 | optim(ms): 56.73 | loss: 12.09948 | train-TER: 40.69 | train-WER: 59.24 | lists/dev.lst-loss: 6.90644 | lists/dev.lst-TER: 19.21 | lists/dev.lst-WER: 34.69 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.14
epoch: 147 | nupdates: 116916 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:34 | bch(ms): 790.65 | smp(ms): 1.88 | fwd(ms): 273.68 | crit-fwd(ms): 19.09 | bwd(ms): 457.54 | optim(ms): 56.73 | loss: 12.02362 | train-TER: 37.31 | train-WER: 55.26 | lists/dev.lst-loss: 6.89484 | lists/dev.lst-TER: 19.25 | lists/dev.lst-WER: 34.82 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 549.98
epoch: 148 | nupdates: 117719 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 783.78 | smp(ms): 2.43 | fwd(ms): 273.93 | crit-fwd(ms): 19.23 | bwd(ms): 450.58 | optim(ms): 56.74 | loss: 11.82540 | train-TER: 41.57 | train-WER: 61.66 | lists/dev.lst-loss: 7.18098 | lists/dev.lst-TER: 21.69 | lists/dev.lst-WER: 36.74 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.80
epoch: 149 | nupdates: 118522 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:31 | bch(ms): 786.52 | smp(ms): 2.36 | fwd(ms): 273.97 | crit-fwd(ms): 19.11 | bwd(ms): 453.44 | optim(ms): 56.73 | loss: 11.97385 | train-TER: 42.66 | train-WER: 60.95 | lists/dev.lst-loss: 6.89108 | lists/dev.lst-TER: 19.75 | lists/dev.lst-WER: 35.22 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 552.87
epoch: 150 | nupdates: 119325 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 783.95 | smp(ms): 2.11 | fwd(ms): 273.95 | crit-fwd(ms): 19.21 | bwd(ms): 450.95 | optim(ms): 56.74 | loss: 11.98562 | train-TER: 41.75 | train-WER: 60.27 | lists/dev.lst-loss: 6.91172 | lists/dev.lst-TER: 20.15 | lists/dev.lst-WER: 35.11 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.68
epoch: 151 | nupdates: 120128 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 785.54 | smp(ms): 2.36 | fwd(ms): 274.37 | crit-fwd(ms): 19.14 | bwd(ms): 452.11 | optim(ms): 56.73 | loss: 11.76251 | train-TER: 37.65 | train-WER: 57.16 | lists/dev.lst-loss: 6.90813 | lists/dev.lst-TER: 19.00 | lists/dev.lst-WER: 34.46 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.56
epoch: 152 | nupdates: 120931 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:33 | bch(ms): 789.40 | smp(ms): 2.16 | fwd(ms): 274.07 | crit-fwd(ms): 19.14 | bwd(ms): 456.19 | optim(ms): 56.75 | loss: 11.92522 | train-TER: 37.56 | train-WER: 55.88 | lists/dev.lst-loss: 6.89448 | lists/dev.lst-TER: 20.33 | lists/dev.lst-WER: 35.28 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 550.85
epoch: 153 | nupdates: 121734 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 785.79 | smp(ms): 1.79 | fwd(ms): 274.14 | crit-fwd(ms): 19.23 | bwd(ms): 452.56 | optim(ms): 56.78 | loss: 11.84749 | train-TER: 37.95 | train-WER: 56.88 | lists/dev.lst-loss: 6.97123 | lists/dev.lst-TER: 20.80 | lists/dev.lst-WER: 35.72 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.38
epoch: 154 | nupdates: 122537 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:32 | bch(ms): 787.49 | smp(ms): 2.17 | fwd(ms): 274.36 | crit-fwd(ms): 19.16 | bwd(ms): 453.92 | optim(ms): 56.73 | loss: 11.82955 | train-TER: 36.13 | train-WER: 54.43 | lists/dev.lst-loss: 6.91485 | lists/dev.lst-TER: 19.90 | lists/dev.lst-WER: 34.89 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 552.19
epoch: 155 | nupdates: 123340 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 785.26 | smp(ms): 2.37 | fwd(ms): 273.71 | crit-fwd(ms): 19.20 | bwd(ms): 452.34 | optim(ms): 56.73 | loss: 11.89190 | train-TER: 40.16 | train-WER: 58.02 | lists/dev.lst-loss: 7.29460 | lists/dev.lst-TER: 23.26 | lists/dev.lst-WER: 38.05 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 553.76
epoch: 156 | nupdates: 124143 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:31 | bch(ms): 785.88 | smp(ms): 2.29 | fwd(ms): 273.85 | crit-fwd(ms): 19.19 | bwd(ms): 452.93 | optim(ms): 56.73 | loss: 11.77509 | train-TER: 40.83 | train-WER: 59.22 | lists/dev.lst-loss: 6.74269 | lists/dev.lst-TER: 18.94 | lists/dev.lst-WER: 34.25 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.32
epoch: 157 | nupdates: 124946 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:35 | bch(ms): 791.54 | smp(ms): 2.25 | fwd(ms): 274.38 | crit-fwd(ms): 19.26 | bwd(ms): 457.93 | optim(ms): 56.73 | loss: 11.72677 | train-TER: 43.82 | train-WER: 62.56 | lists/dev.lst-loss: 6.84915 | lists/dev.lst-TER: 19.69 | lists/dev.lst-WER: 34.57 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 549.36
epoch: 158 | nupdates: 125749 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:31 | bch(ms): 786.18 | smp(ms): 2.42 | fwd(ms): 274.03 | crit-fwd(ms): 19.22 | bwd(ms): 452.91 | optim(ms): 56.74 | loss: 11.76452 | train-TER: 39.46 | train-WER: 59.07 | lists/dev.lst-loss: 6.95592 | lists/dev.lst-TER: 19.30 | lists/dev.lst-WER: 34.41 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.11
epoch: 159 | nupdates: 126552 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 785.70 | smp(ms): 1.97 | fwd(ms): 274.08 | crit-fwd(ms): 19.16 | bwd(ms): 452.47 | optim(ms): 56.74 | loss: 11.67402 | train-TER: 35.93 | train-WER: 55.49 | lists/dev.lst-loss: 6.74855 | lists/dev.lst-TER: 18.86 | lists/dev.lst-WER: 34.13 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.45
epoch: 160 | nupdates: 127355 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:37 | bch(ms): 793.55 | smp(ms): 2.01 | fwd(ms): 274.86 | crit-fwd(ms): 19.25 | bwd(ms): 459.49 | optim(ms): 56.74 | loss: 11.76319 | train-TER: 38.51 | train-WER: 57.44 | lists/dev.lst-loss: 6.84038 | lists/dev.lst-TER: 19.14 | lists/dev.lst-WER: 34.22 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 547.97
epoch: 161 | nupdates: 128158 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:32 | bch(ms): 787.05 | smp(ms): 2.44 | fwd(ms): 274.72 | crit-fwd(ms): 19.20 | bwd(ms): 453.25 | optim(ms): 56.73 | loss: 11.83348 | train-TER: 36.56 | train-WER: 55.53 | lists/dev.lst-loss: 6.96606 | lists/dev.lst-TER: 20.74 | lists/dev.lst-WER: 35.50 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 552.49
epoch: 162 | nupdates: 128961 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 784.46 | smp(ms): 2.25 | fwd(ms): 274.16 | crit-fwd(ms): 19.26 | bwd(ms): 451.20 | optim(ms): 56.74 | loss: 11.74730 | train-TER: 39.19 | train-WER: 58.73 | lists/dev.lst-loss: 6.98058 | lists/dev.lst-TER: 21.03 | lists/dev.lst-WER: 35.42 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.32
epoch: 163 | nupdates: 129764 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:27 | bch(ms): 781.68 | smp(ms): 1.96 | fwd(ms): 273.50 | crit-fwd(ms): 19.16 | bwd(ms): 449.13 | optim(ms): 56.76 | loss: 11.51001 | train-TER: 34.27 | train-WER: 52.23 | lists/dev.lst-loss: 6.71252 | lists/dev.lst-TER: 18.79 | lists/dev.lst-WER: 33.71 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 556.29
epoch: 164 | nupdates: 130567 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:32 | bch(ms): 787.49 | smp(ms): 2.08 | fwd(ms): 273.49 | crit-fwd(ms): 19.12 | bwd(ms): 454.82 | optim(ms): 56.76 | loss: 11.67962 | train-TER: 39.44 | train-WER: 58.15 | lists/dev.lst-loss: 6.73159 | lists/dev.lst-TER: 18.48 | lists/dev.lst-WER: 33.65 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 552.18
epoch: 165 | nupdates: 131370 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:34 | bch(ms): 790.77 | smp(ms): 2.45 | fwd(ms): 273.70 | crit-fwd(ms): 19.07 | bwd(ms): 458.05 | optim(ms): 56.74 | loss: 11.51757 | train-TER: 41.31 | train-WER: 61.02 | lists/dev.lst-loss: 6.89288 | lists/dev.lst-TER: 20.14 | lists/dev.lst-WER: 34.65 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 549.90
epoch: 166 | nupdates: 132173 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 784.36 | smp(ms): 2.43 | fwd(ms): 273.55 | crit-fwd(ms): 19.23 | bwd(ms): 451.65 | optim(ms): 56.73 | loss: 11.72115 | train-TER: 36.54 | train-WER: 56.83 | lists/dev.lst-loss: 6.78101 | lists/dev.lst-TER: 19.46 | lists/dev.lst-WER: 34.23 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.39
epoch: 167 | nupdates: 132976 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:28 | bch(ms): 783.16 | smp(ms): 2.58 | fwd(ms): 272.97 | crit-fwd(ms): 19.15 | bwd(ms): 451.03 | optim(ms): 56.74 | loss: 11.46514 | train-TER: 34.89 | train-WER: 53.69 | lists/dev.lst-loss: 6.80438 | lists/dev.lst-TER: 19.74 | lists/dev.lst-WER: 34.58 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 555.24
epoch: 168 | nupdates: 133779 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 783.81 | smp(ms): 2.00 | fwd(ms): 273.60 | crit-fwd(ms): 19.19 | bwd(ms): 451.13 | optim(ms): 56.73 | loss: 11.50866 | train-TER: 33.35 | train-WER: 52.31 | lists/dev.lst-loss: 6.86309 | lists/dev.lst-TER: 19.94 | lists/dev.lst-WER: 34.39 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 554.78
epoch: 169 | nupdates: 134582 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 785.38 | smp(ms): 2.37 | fwd(ms): 273.82 | crit-fwd(ms): 19.18 | bwd(ms): 452.39 | optim(ms): 56.72 | loss: 11.33141 | train-TER: 33.77 | train-WER: 53.97 | lists/dev.lst-loss: 6.88659 | lists/dev.lst-TER: 20.44 | lists/dev.lst-WER: 34.61 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.67
epoch: 170 | nupdates: 135385 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:29 | bch(ms): 784.03 | smp(ms): 1.54 | fwd(ms): 273.20 | crit-fwd(ms): 19.21 | bwd(ms): 451.58 | optim(ms): 56.72 | loss: 11.45619 | train-TER: 37.62 | train-WER: 55.83 | lists/dev.lst-loss: 6.64296 | lists/dev.lst-TER: 19.05 | lists/dev.lst-WER: 33.72 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 554.62
epoch: 171 | nupdates: 136188 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:27 | bch(ms): 781.41 | smp(ms): 2.05 | fwd(ms): 272.92 | crit-fwd(ms): 19.18 | bwd(ms): 449.39 | optim(ms): 56.73 | loss: 11.38065 | train-TER: 37.54 | train-WER: 55.98 | lists/dev.lst-loss: 6.77847 | lists/dev.lst-TER: 19.94 | lists/dev.lst-WER: 34.37 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 556.49
epoch: 172 | nupdates: 136991 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:28 | bch(ms): 783.22 | smp(ms): 2.18 | fwd(ms): 273.98 | crit-fwd(ms): 19.17 | bwd(ms): 450.15 | optim(ms): 56.73 | loss: 11.36992 | train-TER: 39.07 | train-WER: 57.89 | lists/dev.lst-loss: 6.76174 | lists/dev.lst-TER: 19.85 | lists/dev.lst-WER: 34.44 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 555.20
epoch: 173 | nupdates: 137794 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:32 | bch(ms): 788.26 | smp(ms): 2.80 | fwd(ms): 274.25 | crit-fwd(ms): 19.22 | bwd(ms): 454.88 | optim(ms): 56.73 | loss: 11.42281 | train-TER: 36.56 | train-WER: 55.20 | lists/dev.lst-loss: 6.73172 | lists/dev.lst-TER: 18.91 | lists/dev.lst-WER: 33.57 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 551.65
epoch: 174 | nupdates: 138597 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:32 | bch(ms): 787.64 | smp(ms): 2.30 | fwd(ms): 273.87 | crit-fwd(ms): 19.22 | bwd(ms): 454.68 | optim(ms): 56.75 | loss: 11.46336 | train-TER: 35.38 | train-WER: 53.40 | lists/dev.lst-loss: 6.89235 | lists/dev.lst-TER: 21.02 | lists/dev.lst-WER: 35.14 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 552.08
epoch: 175 | nupdates: 139400 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 785.71 | smp(ms): 2.32 | fwd(ms): 274.34 | crit-fwd(ms): 19.15 | bwd(ms): 452.30 | optim(ms): 56.73 | loss: 11.36604 | train-TER: 38.06 | train-WER: 56.63 | lists/dev.lst-loss: 6.87792 | lists/dev.lst-TER: 20.18 | lists/dev.lst-WER: 34.31 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.44
epoch: 176 | nupdates: 140203 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:31 | bch(ms): 786.14 | smp(ms): 1.97 | fwd(ms): 274.65 | crit-fwd(ms): 19.18 | bwd(ms): 452.31 | optim(ms): 56.73 | loss: 11.38031 | train-TER: 38.13 | train-WER: 55.91 | lists/dev.lst-loss: 6.69457 | lists/dev.lst-TER: 18.23 | lists/dev.lst-WER: 33.00 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.13
epoch: 177 | nupdates: 141006 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:36 | bch(ms): 793.11 | smp(ms): 2.11 | fwd(ms): 274.53 | crit-fwd(ms): 19.11 | bwd(ms): 459.34 | optim(ms): 56.72 | loss: 11.22097 | train-TER: 40.22 | train-WER: 57.61 | lists/dev.lst-loss: 6.98225 | lists/dev.lst-TER: 20.51 | lists/dev.lst-WER: 34.61 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 548.27
epoch: 178 | nupdates: 141809 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:30 | bch(ms): 785.66 | smp(ms): 2.11 | fwd(ms): 274.52 | crit-fwd(ms): 19.20 | bwd(ms): 452.13 | optim(ms): 56.73 | loss: 11.22346 | train-TER: 37.51 | train-WER: 55.99 | lists/dev.lst-loss: 6.66853 | lists/dev.lst-TER: 18.14 | lists/dev.lst-WER: 32.64 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.47
epoch: 179 | nupdates: 142612 | lr: 0.400000 | lrcriterion: 0.400000 | runtime: 00:10:35 | bch(ms): 791.75 | smp(ms): 2.42 | fwd(ms): 274.35 | crit-fwd(ms): 19.15 | bwd(ms): 458.18 | optim(ms): 56.74 | loss: 11.24690 | train-TER: 40.54 | train-WER: 59.49 | lists/dev.lst-loss: 6.79366 | lists/dev.lst-TER: 20.03 | lists/dev.lst-WER: 34.29 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 549.21
epoch: 180 | nupdates: 143415 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:32 | bch(ms): 787.68 | smp(ms): 1.98 | fwd(ms): 274.56 | crit-fwd(ms): 19.23 | bwd(ms): 453.96 | optim(ms): 56.74 | loss: 10.98470 | train-TER: 36.07 | train-WER: 54.58 | lists/dev.lst-loss: 6.77555 | lists/dev.lst-TER: 19.20 | lists/dev.lst-WER: 33.41 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 552.06
epoch: 181 | nupdates: 144218 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:32 | bch(ms): 787.69 | smp(ms): 2.08 | fwd(ms): 274.56 | crit-fwd(ms): 19.17 | bwd(ms): 454.06 | optim(ms): 56.73 | loss: 11.02427 | train-TER: 38.19 | train-WER: 55.81 | lists/dev.lst-loss: 6.59204 | lists/dev.lst-TER: 18.42 | lists/dev.lst-WER: 32.62 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 552.05
epoch: 182 | nupdates: 145021 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:35 | bch(ms): 790.94 | smp(ms): 2.40 | fwd(ms): 274.46 | crit-fwd(ms): 19.20 | bwd(ms): 457.41 | optim(ms): 56.74 | loss: 11.06857 | train-TER: 34.51 | train-WER: 51.91 | lists/dev.lst-loss: 6.61927 | lists/dev.lst-TER: 19.43 | lists/dev.lst-WER: 33.27 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 549.78
epoch: 183 | nupdates: 145824 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:30 | bch(ms): 785.37 | smp(ms): 2.49 | fwd(ms): 274.24 | crit-fwd(ms): 19.19 | bwd(ms): 451.98 | optim(ms): 56.75 | loss: 10.87459 | train-TER: 33.51 | train-WER: 52.58 | lists/dev.lst-loss: 6.51529 | lists/dev.lst-TER: 18.17 | lists/dev.lst-WER: 32.40 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 553.68
epoch: 184 | nupdates: 146627 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:34 | bch(ms): 790.13 | smp(ms): 1.88 | fwd(ms): 274.35 | crit-fwd(ms): 19.15 | bwd(ms): 456.54 | optim(ms): 56.74 | loss: 11.06320 | train-TER: 35.73 | train-WER: 52.82 | lists/dev.lst-loss: 6.57975 | lists/dev.lst-TER: 19.14 | lists/dev.lst-WER: 33.13 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 550.34
epoch: 185 | nupdates: 147430 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:31 | bch(ms): 786.20 | smp(ms): 1.89 | fwd(ms): 274.81 | crit-fwd(ms): 19.22 | bwd(ms): 452.27 | optim(ms): 56.74 | loss: 10.94619 | train-TER: 36.66 | train-WER: 54.45 | lists/dev.lst-loss: 6.58858 | lists/dev.lst-TER: 19.10 | lists/dev.lst-WER: 33.25 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.09
epoch: 186 | nupdates: 148233 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:31 | bch(ms): 786.78 | smp(ms): 2.09 | fwd(ms): 274.21 | crit-fwd(ms): 19.07 | bwd(ms): 453.48 | optim(ms): 56.74 | loss: 10.76425 | train-TER: 36.67 | train-WER: 54.79 | lists/dev.lst-loss: 6.50925 | lists/dev.lst-TER: 19.20 | lists/dev.lst-WER: 33.05 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 552.68
epoch: 187 | nupdates: 149036 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:31 | bch(ms): 786.91 | smp(ms): 1.84 | fwd(ms): 274.64 | crit-fwd(ms): 19.16 | bwd(ms): 453.13 | optim(ms): 56.72 | loss: 10.93237 | train-TER: 32.78 | train-WER: 50.93 | lists/dev.lst-loss: 6.56154 | lists/dev.lst-TER: 19.02 | lists/dev.lst-WER: 32.94 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 552.59
epoch: 188 | nupdates: 149839 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:31 | bch(ms): 786.17 | smp(ms): 2.55 | fwd(ms): 273.99 | crit-fwd(ms): 19.21 | bwd(ms): 453.07 | optim(ms): 56.74 | loss: 10.76230 | train-TER: 35.54 | train-WER: 53.73 | lists/dev.lst-loss: 6.46922 | lists/dev.lst-TER: 18.58 | lists/dev.lst-WER: 32.64 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 553.11
epoch: 189 | nupdates: 150642 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:31 | bch(ms): 786.96 | smp(ms): 2.37 | fwd(ms): 274.69 | crit-fwd(ms): 19.17 | bwd(ms): 453.14 | optim(ms): 56.73 | loss: 10.76356 | train-TER: 34.75 | train-WER: 54.26 | lists/dev.lst-loss: 6.50256 | lists/dev.lst-TER: 18.65 | lists/dev.lst-WER: 32.54 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 552.56
epoch: 190 | nupdates: 151445 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:32 | bch(ms): 787.51 | smp(ms): 2.07 | fwd(ms): 274.38 | crit-fwd(ms): 19.19 | bwd(ms): 454.07 | optim(ms): 56.73 | loss: 10.92518 | train-TER: 38.46 | train-WER: 57.10 | lists/dev.lst-loss: 6.77908 | lists/dev.lst-TER: 20.72 | lists/dev.lst-WER: 34.44 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 552.17
epoch: 191 | nupdates: 152248 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:30 | bch(ms): 785.75 | smp(ms): 2.25 | fwd(ms): 274.08 | crit-fwd(ms): 19.14 | bwd(ms): 452.59 | optim(ms): 56.74 | loss: 10.73721 | train-TER: 36.10 | train-WER: 54.22 | lists/dev.lst-loss: 6.59410 | lists/dev.lst-TER: 19.54 | lists/dev.lst-WER: 33.35 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 553.41
epoch: 192 | nupdates: 153051 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:29 | bch(ms): 784.38 | smp(ms): 2.07 | fwd(ms): 274.16 | crit-fwd(ms): 19.20 | bwd(ms): 450.94 | optim(ms): 56.74 | loss: 10.73530 | train-TER: 40.64 | train-WER: 59.13 | lists/dev.lst-loss: 6.49267 | lists/dev.lst-TER: 18.27 | lists/dev.lst-WER: 32.46 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.38
epoch: 193 | nupdates: 153854 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:32 | bch(ms): 787.59 | smp(ms): 2.10 | fwd(ms): 274.12 | crit-fwd(ms): 19.15 | bwd(ms): 454.27 | optim(ms): 56.73 | loss: 10.84819 | train-TER: 36.43 | train-WER: 54.24 | lists/dev.lst-loss: 6.64641 | lists/dev.lst-TER: 19.26 | lists/dev.lst-WER: 32.98 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 552.12
epoch: 194 | nupdates: 154657 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:31 | bch(ms): 786.18 | smp(ms): 1.94 | fwd(ms): 274.69 | crit-fwd(ms): 19.12 | bwd(ms): 452.37 | optim(ms): 56.74 | loss: 10.75668 | train-TER: 38.07 | train-WER: 56.77 | lists/dev.lst-loss: 6.44928 | lists/dev.lst-TER: 17.53 | lists/dev.lst-WER: 31.79 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.10
epoch: 195 | nupdates: 155460 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:34 | bch(ms): 790.33 | smp(ms): 2.21 | fwd(ms): 274.54 | crit-fwd(ms): 19.16 | bwd(ms): 456.58 | optim(ms): 56.74 | loss: 10.89307 | train-TER: 38.31 | train-WER: 55.82 | lists/dev.lst-loss: 6.54689 | lists/dev.lst-TER: 19.25 | lists/dev.lst-WER: 32.83 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 550.20
epoch: 196 | nupdates: 156263 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:31 | bch(ms): 786.09 | smp(ms): 2.44 | fwd(ms): 274.30 | crit-fwd(ms): 19.25 | bwd(ms): 452.64 | optim(ms): 56.74 | loss: 10.82547 | train-TER: 36.27 | train-WER: 53.87 | lists/dev.lst-loss: 6.43098 | lists/dev.lst-TER: 18.08 | lists/dev.lst-WER: 32.07 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.17
epoch: 197 | nupdates: 157066 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:33 | bch(ms): 789.01 | smp(ms): 2.19 | fwd(ms): 274.62 | crit-fwd(ms): 19.26 | bwd(ms): 455.29 | optim(ms): 56.72 | loss: 10.76898 | train-TER: 33.48 | train-WER: 50.38 | lists/dev.lst-loss: 6.53490 | lists/dev.lst-TER: 18.82 | lists/dev.lst-WER: 32.81 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 124 | hrs: 96.99 | thrpt(sec/sec): 551.12
epoch: 198 | nupdates: 157869 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:31 | bch(ms): 785.84 | smp(ms): 2.24 | fwd(ms): 274.30 | crit-fwd(ms): 19.19 | bwd(ms): 452.37 | optim(ms): 56.74 | loss: 10.77399 | train-TER: 36.53 | train-WER: 54.89 | lists/dev.lst-loss: 6.57068 | lists/dev.lst-TER: 19.49 | lists/dev.lst-WER: 33.20 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 124 | hrs: 96.99 | thrpt(sec/sec): 553.34
epoch: 199 | nupdates: 158672 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:30 | bch(ms): 785.19 | smp(ms): 1.40 | fwd(ms): 274.15 | crit-fwd(ms): 19.17 | bwd(ms): 451.72 | optim(ms): 56.73 | loss: 10.69899 | train-TER: 39.24 | train-WER: 57.06 | lists/dev.lst-loss: 6.39472 | lists/dev.lst-TER: 17.90 | lists/dev.lst-WER: 31.93 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.80
epoch: 200 | nupdates: 159475 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:30 | bch(ms): 785.33 | smp(ms): 2.08 | fwd(ms): 274.52 | crit-fwd(ms): 19.10 | bwd(ms): 451.65 | optim(ms): 56.73 | loss: 10.78118 | train-TER: 38.35 | train-WER: 55.96 | lists/dev.lst-loss: 6.63195 | lists/dev.lst-TER: 19.00 | lists/dev.lst-WER: 32.91 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.71
epoch: 201 | nupdates: 160278 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:30 | bch(ms): 785.26 | smp(ms): 2.60 | fwd(ms): 274.03 | crit-fwd(ms): 19.16 | bwd(ms): 452.17 | optim(ms): 56.74 | loss: 10.73137 | train-TER: 34.88 | train-WER: 52.69 | lists/dev.lst-loss: 6.38703 | lists/dev.lst-TER: 17.57 | lists/dev.lst-WER: 31.67 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.75
epoch: 202 | nupdates: 161081 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:35 | bch(ms): 791.42 | smp(ms): 1.73 | fwd(ms): 274.47 | crit-fwd(ms): 19.18 | bwd(ms): 457.84 | optim(ms): 56.74 | loss: 10.61894 | train-TER: 34.49 | train-WER: 50.74 | lists/dev.lst-loss: 6.45778 | lists/dev.lst-TER: 18.36 | lists/dev.lst-WER: 32.26 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 124 | hrs: 96.99 | thrpt(sec/sec): 549.44
epoch: 203 | nupdates: 161884 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:30 | bch(ms): 785.52 | smp(ms): 2.47 | fwd(ms): 274.33 | crit-fwd(ms): 19.10 | bwd(ms): 451.96 | optim(ms): 56.74 | loss: 10.60532 | train-TER: 39.43 | train-WER: 57.52 | lists/dev.lst-loss: 6.53710 | lists/dev.lst-TER: 18.51 | lists/dev.lst-WER: 32.24 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 553.57
epoch: 204 | nupdates: 162687 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:30 | bch(ms): 784.70 | smp(ms): 1.76 | fwd(ms): 274.25 | crit-fwd(ms): 19.11 | bwd(ms): 451.29 | optim(ms): 56.76 | loss: 10.69073 | train-TER: 35.35 | train-WER: 53.21 | lists/dev.lst-loss: 6.39192 | lists/dev.lst-TER: 18.01 | lists/dev.lst-WER: 31.69 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.15
epoch: 205 | nupdates: 163490 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:27 | bch(ms): 781.62 | smp(ms): 2.13 | fwd(ms): 273.18 | crit-fwd(ms): 19.20 | bwd(ms): 449.37 | optim(ms): 56.74 | loss: 10.71213 | train-TER: 34.28 | train-WER: 52.45 | lists/dev.lst-loss: 6.57545 | lists/dev.lst-TER: 18.85 | lists/dev.lst-WER: 32.33 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 556.34
epoch: 206 | nupdates: 164293 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:28 | bch(ms): 782.37 | smp(ms): 2.26 | fwd(ms): 273.35 | crit-fwd(ms): 19.14 | bwd(ms): 449.88 | optim(ms): 56.74 | loss: 10.58860 | train-TER: 33.49 | train-WER: 51.93 | lists/dev.lst-loss: 6.46649 | lists/dev.lst-TER: 18.19 | lists/dev.lst-WER: 31.99 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 555.80
epoch: 207 | nupdates: 165096 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:30 | bch(ms): 785.21 | smp(ms): 2.10 | fwd(ms): 273.19 | crit-fwd(ms): 19.09 | bwd(ms): 452.83 | optim(ms): 56.72 | loss: 10.74558 | train-TER: 34.95 | train-WER: 53.85 | lists/dev.lst-loss: 6.43113 | lists/dev.lst-TER: 17.94 | lists/dev.lst-WER: 31.94 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 553.79
epoch: 208 | nupdates: 165899 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:28 | bch(ms): 782.89 | smp(ms): 2.14 | fwd(ms): 273.81 | crit-fwd(ms): 19.16 | bwd(ms): 449.90 | optim(ms): 56.74 | loss: 10.55780 | train-TER: 33.49 | train-WER: 51.10 | lists/dev.lst-loss: 6.36704 | lists/dev.lst-TER: 17.72 | lists/dev.lst-WER: 31.59 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 555.43
epoch: 209 | nupdates: 166702 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:33 | bch(ms): 788.75 | smp(ms): 1.90 | fwd(ms): 273.35 | crit-fwd(ms): 19.12 | bwd(ms): 456.21 | optim(ms): 56.73 | loss: 10.74741 | train-TER: 37.55 | train-WER: 55.27 | lists/dev.lst-loss: 6.71533 | lists/dev.lst-TER: 19.85 | lists/dev.lst-WER: 33.47 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 551.31
epoch: 210 | nupdates: 167505 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:28 | bch(ms): 783.20 | smp(ms): 2.41 | fwd(ms): 273.65 | crit-fwd(ms): 19.22 | bwd(ms): 450.43 | optim(ms): 56.73 | loss: 10.42826 | train-TER: 32.39 | train-WER: 50.69 | lists/dev.lst-loss: 6.48521 | lists/dev.lst-TER: 18.26 | lists/dev.lst-WER: 32.13 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 555.21
epoch: 211 | nupdates: 168308 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:29 | bch(ms): 783.67 | smp(ms): 2.17 | fwd(ms): 273.77 | crit-fwd(ms): 19.24 | bwd(ms): 450.85 | optim(ms): 56.72 | loss: 10.62273 | train-TER: 39.53 | train-WER: 58.03 | lists/dev.lst-loss: 6.50737 | lists/dev.lst-TER: 18.55 | lists/dev.lst-WER: 32.27 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.88
epoch: 212 | nupdates: 169111 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:28 | bch(ms): 782.33 | smp(ms): 2.15 | fwd(ms): 272.92 | crit-fwd(ms): 19.14 | bwd(ms): 450.15 | optim(ms): 56.74 | loss: 10.59295 | train-TER: 35.63 | train-WER: 53.44 | lists/dev.lst-loss: 6.36012 | lists/dev.lst-TER: 18.04 | lists/dev.lst-WER: 31.94 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 555.83
epoch: 213 | nupdates: 169914 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:26 | bch(ms): 780.19 | smp(ms): 1.40 | fwd(ms): 272.58 | crit-fwd(ms): 19.14 | bwd(ms): 448.38 | optim(ms): 56.73 | loss: 10.51814 | train-TER: 38.03 | train-WER: 55.48 | lists/dev.lst-loss: 6.49792 | lists/dev.lst-TER: 17.66 | lists/dev.lst-WER: 31.55 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 557.35
epoch: 214 | nupdates: 170717 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:35 | bch(ms): 790.96 | smp(ms): 1.99 | fwd(ms): 273.75 | crit-fwd(ms): 19.25 | bwd(ms): 458.17 | optim(ms): 56.74 | loss: 10.54457 | train-TER: 34.09 | train-WER: 53.24 | lists/dev.lst-loss: 6.55043 | lists/dev.lst-TER: 19.37 | lists/dev.lst-WER: 32.81 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 549.76
epoch: 215 | nupdates: 171520 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:30 | bch(ms): 785.34 | smp(ms): 2.16 | fwd(ms): 273.02 | crit-fwd(ms): 19.11 | bwd(ms): 453.15 | optim(ms): 56.71 | loss: 10.61777 | train-TER: 35.66 | train-WER: 53.85 | lists/dev.lst-loss: 6.55141 | lists/dev.lst-TER: 18.70 | lists/dev.lst-WER: 32.24 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.70
epoch: 216 | nupdates: 172323 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:28 | bch(ms): 783.13 | smp(ms): 2.15 | fwd(ms): 273.51 | crit-fwd(ms): 19.16 | bwd(ms): 450.16 | optim(ms): 56.73 | loss: 10.62580 | train-TER: 33.30 | train-WER: 51.20 | lists/dev.lst-loss: 6.48274 | lists/dev.lst-TER: 18.52 | lists/dev.lst-WER: 31.92 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 555.26
epoch: 217 | nupdates: 173126 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:30 | bch(ms): 784.67 | smp(ms): 2.05 | fwd(ms): 274.41 | crit-fwd(ms): 19.16 | bwd(ms): 451.04 | optim(ms): 56.75 | loss: 10.62084 | train-TER: 35.05 | train-WER: 52.60 | lists/dev.lst-loss: 6.33418 | lists/dev.lst-TER: 17.28 | lists/dev.lst-WER: 31.21 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 554.17
epoch: 218 | nupdates: 173929 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:32 | bch(ms): 787.37 | smp(ms): 2.43 | fwd(ms): 272.74 | crit-fwd(ms): 19.21 | bwd(ms): 455.42 | optim(ms): 56.73 | loss: 10.59605 | train-TER: 31.67 | train-WER: 48.49 | lists/dev.lst-loss: 6.39825 | lists/dev.lst-TER: 17.84 | lists/dev.lst-WER: 31.47 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 552.27
epoch: 219 | nupdates: 174732 | lr: 0.200000 | lrcriterion: 0.200000 | runtime: 00:10:32 | bch(ms): 787.15 | smp(ms): 2.20 | fwd(ms): 273.61 | crit-fwd(ms): 19.21 | bwd(ms): 454.43 | optim(ms): 56.72 | loss: 10.64473 | train-TER: 32.92 | train-WER: 50.87 | lists/dev.lst-loss: 6.39127 | lists/dev.lst-TER: 18.24 | lists/dev.lst-WER: 31.98 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 552.43
epoch: 220 | nupdates: 175535 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:28 | bch(ms): 782.91 | smp(ms): 1.77 | fwd(ms): 273.88 | crit-fwd(ms): 19.19 | bwd(ms): 449.89 | optim(ms): 56.73 | loss: 10.53841 | train-TER: 31.88 | train-WER: 48.36 | lists/dev.lst-loss: 6.42784 | lists/dev.lst-TER: 18.15 | lists/dev.lst-WER: 31.79 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 555.42
epoch: 221 | nupdates: 176338 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:30 | bch(ms): 785.06 | smp(ms): 1.88 | fwd(ms): 273.71 | crit-fwd(ms): 19.23 | bwd(ms): 452.32 | optim(ms): 56.73 | loss: 10.41773 | train-TER: 35.86 | train-WER: 53.93 | lists/dev.lst-loss: 6.42854 | lists/dev.lst-TER: 18.54 | lists/dev.lst-WER: 32.05 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.89
epoch: 222 | nupdates: 177141 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:30 | bch(ms): 784.85 | smp(ms): 2.12 | fwd(ms): 274.16 | crit-fwd(ms): 19.19 | bwd(ms): 451.57 | optim(ms): 56.74 | loss: 10.36161 | train-TER: 36.09 | train-WER: 53.96 | lists/dev.lst-loss: 6.42575 | lists/dev.lst-TER: 18.66 | lists/dev.lst-WER: 32.06 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.04
epoch: 223 | nupdates: 177944 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:31 | bch(ms): 786.39 | smp(ms): 1.98 | fwd(ms): 273.62 | crit-fwd(ms): 19.14 | bwd(ms): 453.65 | optim(ms): 56.72 | loss: 10.36105 | train-TER: 31.73 | train-WER: 49.15 | lists/dev.lst-loss: 6.40138 | lists/dev.lst-TER: 17.87 | lists/dev.lst-WER: 31.40 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 552.96
epoch: 224 | nupdates: 178747 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:30 | bch(ms): 784.68 | smp(ms): 2.21 | fwd(ms): 273.96 | crit-fwd(ms): 19.21 | bwd(ms): 451.49 | optim(ms): 56.72 | loss: 10.38223 | train-TER: 30.60 | train-WER: 47.09 | lists/dev.lst-loss: 6.41241 | lists/dev.lst-TER: 18.41 | lists/dev.lst-WER: 31.75 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 554.17
epoch: 225 | nupdates: 179550 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:27 | bch(ms): 781.75 | smp(ms): 1.44 | fwd(ms): 273.77 | crit-fwd(ms): 19.17 | bwd(ms): 448.74 | optim(ms): 56.74 | loss: 10.29468 | train-TER: 38.76 | train-WER: 56.52 | lists/dev.lst-loss: 6.39993 | lists/dev.lst-TER: 17.66 | lists/dev.lst-WER: 31.27 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 556.24
epoch: 226 | nupdates: 180353 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:30 | bch(ms): 785.69 | smp(ms): 1.93 | fwd(ms): 273.69 | crit-fwd(ms): 19.16 | bwd(ms): 452.85 | optim(ms): 56.73 | loss: 10.25394 | train-TER: 37.23 | train-WER: 55.39 | lists/dev.lst-loss: 6.38383 | lists/dev.lst-TER: 18.08 | lists/dev.lst-WER: 31.62 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 553.45
epoch: 227 | nupdates: 181156 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:30 | bch(ms): 785.14 | smp(ms): 2.31 | fwd(ms): 274.40 | crit-fwd(ms): 19.16 | bwd(ms): 451.58 | optim(ms): 56.73 | loss: 10.32262 | train-TER: 33.40 | train-WER: 50.59 | lists/dev.lst-loss: 6.52243 | lists/dev.lst-TER: 19.20 | lists/dev.lst-WER: 32.52 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.84
epoch: 228 | nupdates: 181959 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:29 | bch(ms): 783.99 | smp(ms): 2.43 | fwd(ms): 273.84 | crit-fwd(ms): 19.22 | bwd(ms): 450.94 | optim(ms): 56.74 | loss: 10.28221 | train-TER: 34.86 | train-WER: 52.23 | lists/dev.lst-loss: 6.36411 | lists/dev.lst-TER: 18.43 | lists/dev.lst-WER: 31.78 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 554.65
epoch: 229 | nupdates: 182762 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:29 | bch(ms): 784.10 | smp(ms): 1.85 | fwd(ms): 273.89 | crit-fwd(ms): 19.16 | bwd(ms): 451.16 | optim(ms): 56.73 | loss: 10.31650 | train-TER: 33.44 | train-WER: 51.01 | lists/dev.lst-loss: 6.32083 | lists/dev.lst-TER: 17.79 | lists/dev.lst-WER: 31.34 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 554.57
epoch: 230 | nupdates: 183565 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:28 | bch(ms): 782.85 | smp(ms): 2.09 | fwd(ms): 273.21 | crit-fwd(ms): 19.14 | bwd(ms): 450.47 | optim(ms): 56.73 | loss: 10.44297 | train-TER: 35.95 | train-WER: 53.15 | lists/dev.lst-loss: 6.32351 | lists/dev.lst-TER: 17.90 | lists/dev.lst-WER: 31.32 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 555.46
epoch: 231 | nupdates: 184368 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:30 | bch(ms): 785.52 | smp(ms): 1.84 | fwd(ms): 273.42 | crit-fwd(ms): 19.06 | bwd(ms): 452.78 | optim(ms): 56.75 | loss: 10.25216 | train-TER: 34.80 | train-WER: 53.14 | lists/dev.lst-loss: 6.38857 | lists/dev.lst-TER: 18.16 | lists/dev.lst-WER: 31.63 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 124 | hrs: 96.99 | thrpt(sec/sec): 553.57
epoch: 232 | nupdates: 185171 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:27 | bch(ms): 781.42 | smp(ms): 2.11 | fwd(ms): 273.29 | crit-fwd(ms): 19.20 | bwd(ms): 448.97 | optim(ms): 56.74 | loss: 10.41686 | train-TER: 37.88 | train-WER: 55.90 | lists/dev.lst-loss: 6.37435 | lists/dev.lst-TER: 18.02 | lists/dev.lst-WER: 31.43 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 556.48
epoch: 233 | nupdates: 185974 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:29 | bch(ms): 783.91 | smp(ms): 2.18 | fwd(ms): 273.72 | crit-fwd(ms): 19.19 | bwd(ms): 451.08 | optim(ms): 56.74 | loss: 10.34922 | train-TER: 35.33 | train-WER: 52.72 | lists/dev.lst-loss: 6.37986 | lists/dev.lst-TER: 18.50 | lists/dev.lst-WER: 31.70 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.71
epoch: 234 | nupdates: 186777 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:30 | bch(ms): 785.02 | smp(ms): 1.87 | fwd(ms): 273.96 | crit-fwd(ms): 19.15 | bwd(ms): 451.94 | optim(ms): 56.72 | loss: 10.46850 | train-TER: 37.59 | train-WER: 55.62 | lists/dev.lst-loss: 6.56190 | lists/dev.lst-TER: 19.08 | lists/dev.lst-WER: 32.23 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 553.92
epoch: 235 | nupdates: 187580 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:28 | bch(ms): 782.57 | smp(ms): 1.99 | fwd(ms): 272.88 | crit-fwd(ms): 19.08 | bwd(ms): 450.50 | optim(ms): 56.75 | loss: 10.34129 | train-TER: 36.29 | train-WER: 54.19 | lists/dev.lst-loss: 6.31790 | lists/dev.lst-TER: 17.75 | lists/dev.lst-WER: 31.32 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 555.66
epoch: 236 | nupdates: 188383 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:30 | bch(ms): 784.84 | smp(ms): 2.66 | fwd(ms): 273.37 | crit-fwd(ms): 19.20 | bwd(ms): 452.36 | optim(ms): 56.72 | loss: 10.28420 | train-TER: 36.50 | train-WER: 53.79 | lists/dev.lst-loss: 6.46919 | lists/dev.lst-TER: 18.45 | lists/dev.lst-WER: 31.70 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 554.05
epoch: 237 | nupdates: 189186 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:26 | bch(ms): 780.44 | smp(ms): 2.19 | fwd(ms): 273.03 | crit-fwd(ms): 19.15 | bwd(ms): 448.12 | optim(ms): 56.74 | loss: 10.22172 | train-TER: 30.47 | train-WER: 47.12 | lists/dev.lst-loss: 6.31541 | lists/dev.lst-TER: 18.01 | lists/dev.lst-WER: 31.40 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 557.17
epoch: 238 | nupdates: 189989 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:29 | bch(ms): 783.91 | smp(ms): 2.20 | fwd(ms): 273.48 | crit-fwd(ms): 19.20 | bwd(ms): 451.31 | optim(ms): 56.72 | loss: 10.20083 | train-TER: 36.24 | train-WER: 54.10 | lists/dev.lst-loss: 6.39222 | lists/dev.lst-TER: 18.11 | lists/dev.lst-WER: 31.46 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 554.71
epoch: 239 | nupdates: 190792 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:29 | bch(ms): 783.98 | smp(ms): 2.33 | fwd(ms): 273.37 | crit-fwd(ms): 19.20 | bwd(ms): 451.45 | optim(ms): 56.72 | loss: 10.32073 | train-TER: 34.16 | train-WER: 52.60 | lists/dev.lst-loss: 6.31201 | lists/dev.lst-TER: 17.46 | lists/dev.lst-WER: 31.03 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 554.66
epoch: 240 | nupdates: 191595 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:32 | bch(ms): 788.29 | smp(ms): 1.32 | fwd(ms): 273.02 | crit-fwd(ms): 19.20 | bwd(ms): 455.91 | optim(ms): 56.78 | loss: 10.22199 | train-TER: 37.90 | train-WER: 55.26 | lists/dev.lst-loss: 6.36060 | lists/dev.lst-TER: 18.06 | lists/dev.lst-WER: 31.42 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 122 | hrs: 96.99 | thrpt(sec/sec): 551.63
epoch: 241 | nupdates: 192398 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:31 | bch(ms): 785.92 | smp(ms): 2.35 | fwd(ms): 273.48 | crit-fwd(ms): 19.11 | bwd(ms): 453.24 | optim(ms): 56.72 | loss: 10.42578 | train-TER: 39.46 | train-WER: 58.00 | lists/dev.lst-loss: 6.41324 | lists/dev.lst-TER: 18.80 | lists/dev.lst-WER: 32.13 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 123 | hrs: 96.99 | thrpt(sec/sec): 553.29
epoch: 242 | nupdates: 193201 | lr: 0.100000 | lrcriterion: 0.100000 | runtime: 00:10:28 | bch(ms): 782.49 | smp(ms): 2.01 | fwd(ms): 273.34 | crit-fwd(ms): 19.21 | bwd(ms): 450.07 | optim(ms): 56.73 | loss: 10.27667 | train-TER: 32.70 | train-WER: 49.60 | lists/dev.lst-loss: 6.36963 | lists/dev.lst-TER: 17.98 | lists/dev.lst-WER: 31.36 | avg-isz: 679 | avg-tsz: 022 | max-tsz: 121 | hrs: 96.99 | thrpt(sec/sec): 555.71