diff --git a/egs/reverb/s5/RESULTS b/egs/reverb/s5/RESULTS index b92f144b458..bc994e05d48 100644 --- a/egs/reverb/s5/RESULTS +++ b/egs/reverb/s5/RESULTS @@ -1,121 +1,250 @@ ######################################## GMM RESULTs: exp/tri3/decode_dt_real_1ch -%WER 34.18 [ 500 / 1463, 24 ins, 125 del, 351 sub ] exp/tri3/decode_dt_real_1ch/wer_17_1.0_far_room1 -%WER 29.63 [ 475 / 1603, 24 ins, 127 del, 324 sub ] exp/tri3/decode_dt_real_1ch/wer_15_0.5_near_room1 +%WER 34.59 [ 506 / 1463, 40 ins, 113 del, 353 sub ] exp/tri3/decode_dt_real_1ch/wer_15_0.5_far_room1 +%WER 30.26 [ 485 / 1603, 42 ins, 112 del, 331 sub ] exp/tri3/decode_dt_real_1ch/wer_17_0.0_near_room1 exp/tri3/decode_dt_simu_1ch -%WER 6.78 [ 276 / 4071, 38 ins, 42 del, 196 sub ] exp/tri3/decode_dt_simu_1ch/wer_12_1.0_far_room1 -%WER 18.28 [ 742 / 4058, 65 ins, 155 del, 522 sub ] exp/tri3/decode_dt_simu_1ch/wer_14_0.5_far_room2 -%WER 19.78 [ 800 / 4045, 77 ins, 148 del, 575 sub ] exp/tri3/decode_dt_simu_1ch/wer_13_0.0_far_room3 -%WER 5.53 [ 225 / 4071, 36 ins, 29 del, 160 sub ] exp/tri3/decode_dt_simu_1ch/wer_12_1.0_near_room1 -%WER 7.81 [ 317 / 4058, 48 ins, 37 del, 232 sub ] exp/tri3/decode_dt_simu_1ch/wer_12_0.0_near_room2 -%WER 10.70 [ 433 / 4045, 47 ins, 86 del, 300 sub ] exp/tri3/decode_dt_simu_1ch/wer_13_0.5_near_room3 +%WER 6.73 [ 274 / 4071, 42 ins, 40 del, 192 sub ] exp/tri3/decode_dt_simu_1ch/wer_15_0.0_far_room1 +%WER 18.38 [ 746 / 4058, 83 ins, 133 del, 530 sub ] exp/tri3/decode_dt_simu_1ch/wer_12_0.5_far_room2 +%WER 19.70 [ 797 / 4045, 73 ins, 183 del, 541 sub ] exp/tri3/decode_dt_simu_1ch/wer_12_1.0_far_room3 +%WER 5.43 [ 221 / 4071, 34 ins, 38 del, 149 sub ] exp/tri3/decode_dt_simu_1ch/wer_13_1.0_near_room1 +%WER 7.74 [ 314 / 4058, 54 ins, 47 del, 213 sub ] exp/tri3/decode_dt_simu_1ch/wer_12_0.5_near_room2 +%WER 7.86 [ 318 / 4045, 38 ins, 53 del, 227 sub ] exp/tri3/decode_dt_simu_1ch/wer_16_0.0_near_room3 exp/tri3/decode_et_real_1ch -%WER 33.09 [ 980 / 2962, 103 ins, 157 del, 720 sub ] 
exp/tri3/decode_et_real_1ch/wer_13_0.0_far_room1 -%WER 33.18 [ 1039 / 3131, 104 ins, 194 del, 741 sub ] exp/tri3/decode_et_real_1ch/wer_16_0.0_near_room1 +%WER 32.82 [ 972 / 2962, 93 ins, 178 del, 701 sub ] exp/tri3/decode_et_real_1ch/wer_17_0.0_far_room1 +%WER 33.15 [ 1038 / 3131, 111 ins, 177 del, 750 sub ] exp/tri3/decode_et_real_1ch/wer_16_0.0_near_room1 exp/tri3/decode_et_simu_1ch -%WER 7.47 [ 441 / 5907, 73 ins, 48 del, 320 sub ] exp/tri3/decode_et_simu_1ch/wer_15_0.5_far_room1 -%WER 18.31 [ 1140 / 6226, 128 ins, 191 del, 821 sub ] exp/tri3/decode_et_simu_1ch/wer_13_0.0_far_room2 -%WER 21.81 [ 1280 / 5868, 109 ins, 273 del, 898 sub ] exp/tri3/decode_et_simu_1ch/wer_14_0.5_far_room3 -%WER 7.26 [ 429 / 5907, 77 ins, 42 del, 310 sub ] exp/tri3/decode_et_simu_1ch/wer_16_1.0_near_room1 -%WER 9.52 [ 593 / 6226, 78 ins, 86 del, 429 sub ] exp/tri3/decode_et_simu_1ch/wer_13_0.5_near_room2 -%WER 11.96 [ 702 / 5868, 60 ins, 151 del, 491 sub ] exp/tri3/decode_et_simu_1ch/wer_13_1.0_near_room3 -######################################## -TDNN RESULTs: -exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt* -%WER 19.62 [ 287 / 1463, 29 ins, 55 del, 203 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_real_1ch/wer_10_0.0_far_room1 -%WER 17.65 [ 283 / 1603, 27 ins, 67 del, 189 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_real_1ch/wer_12_0.0_near_room1 -%WER 3.29 [ 134 / 4071, 17 ins, 25 del, 92 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_1ch/wer_8_0.5_far_room1 -%WER 7.02 [ 285 / 4058, 27 ins, 53 del, 205 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_1ch/wer_7_0.5_far_room2 -%WER 6.85 [ 277 / 4045, 20 ins, 54 del, 203 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_1ch/wer_8_1.0_far_room3 -%WER 2.73 [ 111 / 4071, 10 ins, 18 del, 83 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_1ch/wer_8_0.5_near_room1 -%WER 3.45 [ 140 / 4058, 14 ins, 24 del, 102 sub ] 
exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_1ch/wer_9_0.5_near_room2 -%WER 3.93 [ 159 / 4045, 23 ins, 26 del, 110 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_1ch/wer_8_0.0_near_room3 - -exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et* -%WER 19.04 [ 564 / 2962, 53 ins, 94 del, 417 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_real_1ch/wer_10_0.5_far_room1 -%WER 18.17 [ 569 / 3131, 48 ins, 123 del, 398 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_real_1ch/wer_10_0.5_near_room1 -%WER 3.72 [ 220 / 5907, 24 ins, 41 del, 155 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_1ch/wer_9_1.0_far_room1 -%WER 7.40 [ 461 / 6226, 41 ins, 97 del, 323 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_1ch/wer_8_1.0_far_room2 -%WER 7.26 [ 426 / 5868, 33 ins, 101 del, 292 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_1ch/wer_9_1.0_far_room3 -%WER 3.18 [ 188 / 5907, 25 ins, 38 del, 125 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_1ch/wer_8_1.0_near_room1 -%WER 4.87 [ 303 / 6226, 31 ins, 64 del, 208 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_1ch/wer_9_1.0_near_room2 -%WER 4.84 [ 284 / 5868, 23 ins, 64 del, 197 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_1ch/wer_10_1.0_near_room3 - -######################################## -GMM RESULTs with WPE and Beamformit: -exp/tri3/decode_dt_real_1ch -%WER 27.48 [ 402 / 1463, 39 ins, 63 del, 300 sub ] exp/tri3/decode_dt_real_1ch/wer_14_0.5_far_room1 -%WER 22.33 [ 358 / 1603, 37 ins, 90 del, 231 sub ] exp/tri3/decode_dt_real_1ch/wer_16_0.0_near_room1 - -exp/tri3/decode_dt_simu_1ch -%WER 4.47 [ 182 / 4071, 35 ins, 26 del, 121 sub ] exp/tri3/decode_dt_simu_1ch/wer_14_0.0_far_room1 -%WER 6.78 [ 275 / 4058, 41 ins, 37 del, 197 sub ] exp/tri3/decode_dt_simu_1ch/wer_17_0.0_far_room2 -%WER 5.27 [ 213 / 4045, 27 ins, 32 del, 154 sub ] exp/tri3/decode_dt_simu_1ch/wer_13_1.0_far_room3 -%WER 
4.54 [ 185 / 4071, 34 ins, 24 del, 127 sub ] exp/tri3/decode_dt_simu_1ch/wer_15_0.0_near_room1 -%WER 5.54 [ 225 / 4058, 32 ins, 27 del, 166 sub ] exp/tri3/decode_dt_simu_1ch/wer_15_0.5_near_room2 -%WER 5.59 [ 226 / 4045, 29 ins, 37 del, 160 sub ] exp/tri3/decode_dt_simu_1ch/wer_14_0.5_near_room3 - -exp/tri3/decode_et_real_1ch -%WER 20.97 [ 621 / 2962, 113 ins, 79 del, 429 sub ] exp/tri3/decode_et_real_1ch/wer_13_0.0_far_room1 -%WER 21.65 [ 678 / 3131, 77 ins, 138 del, 463 sub ] exp/tri3/decode_et_real_1ch/wer_16_1.0_near_room1 - -exp/tri3/decode_et_simu_1ch -%WER 5.54 [ 327 / 5907, 65 ins, 40 del, 222 sub ] exp/tri3/decode_et_simu_1ch/wer_16_0.5_far_room1 -%WER 7.48 [ 466 / 6226, 64 ins, 61 del, 341 sub ] exp/tri3/decode_et_simu_1ch/wer_15_0.5_far_room2 -%WER 7.11 [ 417 / 5868, 64 ins, 64 del, 289 sub ] exp/tri3/decode_et_simu_1ch/wer_14_0.5_far_room3 -%WER 5.50 [ 325 / 5907, 58 ins, 44 del, 223 sub ] exp/tri3/decode_et_simu_1ch/wer_17_1.0_near_room1 -%WER 6.23 [ 388 / 6226, 60 ins, 52 del, 276 sub ] exp/tri3/decode_et_simu_1ch/wer_15_0.5_near_room2 -%WER 7.09 [ 416 / 5868, 67 ins, 60 del, 289 sub ] exp/tri3/decode_et_simu_1ch/wer_14_0.5_near_room3 +%WER 7.55 [ 446 / 5907, 79 ins, 55 del, 312 sub ] exp/tri3/decode_et_simu_1ch/wer_15_0.5_far_room1 +%WER 18.36 [ 1143 / 6226, 109 ins, 209 del, 825 sub ] exp/tri3/decode_et_simu_1ch/wer_13_0.5_far_room2 +%WER 20.60 [ 1209 / 5868, 140 ins, 244 del, 825 sub ] exp/tri3/decode_et_simu_1ch/wer_13_0.0_far_room3 +%WER 6.97 [ 412 / 5907, 70 ins, 44 del, 298 sub ] exp/tri3/decode_et_simu_1ch/wer_16_1.0_near_room1 +%WER 9.46 [ 589 / 6226, 54 ins, 116 del, 419 sub ] exp/tri3/decode_et_simu_1ch/wer_15_1.0_near_room2 +%WER 10.62 [ 623 / 5868, 81 ins, 105 del, 437 sub ] exp/tri3/decode_et_simu_1ch/wer_12_1.0_near_room3 + +exp/tri3/decode_dt_real_1ch_wpe +%WER 33.83 [ 495 / 1463, 42 ins, 97 del, 356 sub ] exp/tri3/decode_dt_real_1ch_wpe/wer_17_0.0_far_room1 +%WER 27.76 [ 445 / 1603, 34 ins, 110 del, 301 sub ] 
exp/tri3/decode_dt_real_1ch_wpe/wer_16_0.0_near_room1 + +exp/tri3/decode_dt_simu_1ch_wpe +%WER 6.61 [ 269 / 4071, 32 ins, 50 del, 187 sub ] exp/tri3/decode_dt_simu_1ch_wpe/wer_15_1.0_far_room1 +%WER 17.32 [ 703 / 4058, 74 ins, 123 del, 506 sub ] exp/tri3/decode_dt_simu_1ch_wpe/wer_16_0.0_far_room2 +%WER 18.34 [ 742 / 4045, 87 ins, 143 del, 512 sub ] exp/tri3/decode_dt_simu_1ch_wpe/wer_15_0.0_far_room3 +%WER 5.50 [ 224 / 4071, 35 ins, 43 del, 146 sub ] exp/tri3/decode_dt_simu_1ch_wpe/wer_16_1.0_near_room1 +%WER 7.20 [ 292 / 4058, 41 ins, 46 del, 205 sub ] exp/tri3/decode_dt_simu_1ch_wpe/wer_12_1.0_near_room2 +%WER 7.69 [ 311 / 4045, 30 ins, 59 del, 222 sub ] exp/tri3/decode_dt_simu_1ch_wpe/wer_15_1.0_near_room3 + +exp/tri3/decode_et_real_1ch_wpe +%WER 30.25 [ 896 / 2962, 84 ins, 178 del, 634 sub ] exp/tri3/decode_et_real_1ch_wpe/wer_16_0.5_far_room1 +%WER 31.46 [ 985 / 3131, 111 ins, 157 del, 717 sub ] exp/tri3/decode_et_real_1ch_wpe/wer_16_0.0_near_room1 + +exp/tri3/decode_et_simu_1ch_wpe +%WER 7.23 [ 427 / 5907, 71 ins, 51 del, 305 sub ] exp/tri3/decode_et_simu_1ch_wpe/wer_16_0.5_far_room1 +%WER 16.86 [ 1050 / 6226, 75 ins, 243 del, 732 sub ] exp/tri3/decode_et_simu_1ch_wpe/wer_14_1.0_far_room2 +%WER 19.90 [ 1168 / 5868, 134 ins, 250 del, 784 sub ] exp/tri3/decode_et_simu_1ch_wpe/wer_13_0.5_far_room3 +%WER 7.13 [ 421 / 5907, 76 ins, 39 del, 306 sub ] exp/tri3/decode_et_simu_1ch_wpe/wer_17_0.5_near_room1 +%WER 8.54 [ 532 / 6226, 55 ins, 96 del, 381 sub ] exp/tri3/decode_et_simu_1ch_wpe/wer_17_0.5_near_room2 +%WER 10.07 [ 591 / 5868, 94 ins, 80 del, 417 sub ] exp/tri3/decode_et_simu_1ch_wpe/wer_12_0.5_near_room3 + +exp/tri3/decode_dt_real_2ch_wpe +%WER 31.51 [ 461 / 1463, 39 ins, 87 del, 335 sub ] exp/tri3/decode_dt_real_2ch_wpe/wer_17_0.0_far_room1 +%WER 26.51 [ 425 / 1603, 31 ins, 105 del, 289 sub ] exp/tri3/decode_dt_real_2ch_wpe/wer_17_0.0_near_room1 + +exp/tri3/decode_dt_simu_2ch_wpe +%WER 6.24 [ 254 / 4071, 51 ins, 34 del, 169 sub ] 
exp/tri3/decode_dt_simu_2ch_wpe/wer_13_0.0_far_room1 +%WER 14.32 [ 581 / 4058, 78 ins, 98 del, 405 sub ] exp/tri3/decode_dt_simu_2ch_wpe/wer_13_0.0_far_room2 +%WER 17.33 [ 701 / 4045, 87 ins, 154 del, 460 sub ] exp/tri3/decode_dt_simu_2ch_wpe/wer_14_1.0_far_room3 +%WER 5.75 [ 234 / 4071, 35 ins, 40 del, 159 sub ] exp/tri3/decode_dt_simu_2ch_wpe/wer_17_1.0_near_room1 +%WER 7.07 [ 287 / 4058, 40 ins, 41 del, 206 sub ] exp/tri3/decode_dt_simu_2ch_wpe/wer_13_1.0_near_room2 +%WER 7.54 [ 305 / 4045, 41 ins, 45 del, 219 sub ] exp/tri3/decode_dt_simu_2ch_wpe/wer_13_0.5_near_room3 + +exp/tri3/decode_et_real_2ch_wpe +%WER 26.81 [ 794 / 2962, 113 ins, 116 del, 565 sub ] exp/tri3/decode_et_real_2ch_wpe/wer_16_0.0_far_room1 +%WER 28.11 [ 880 / 3131, 80 ins, 189 del, 611 sub ] exp/tri3/decode_et_real_2ch_wpe/wer_17_1.0_near_room1 + +exp/tri3/decode_et_simu_2ch_wpe +%WER 7.03 [ 415 / 5907, 73 ins, 45 del, 297 sub ] exp/tri3/decode_et_simu_2ch_wpe/wer_16_0.5_far_room1 +%WER 14.63 [ 911 / 6226, 93 ins, 161 del, 657 sub ] exp/tri3/decode_et_simu_2ch_wpe/wer_15_0.5_far_room2 +%WER 18.58 [ 1090 / 5868, 128 ins, 213 del, 749 sub ] exp/tri3/decode_et_simu_2ch_wpe/wer_14_0.5_far_room3 +%WER 7.06 [ 417 / 5907, 68 ins, 47 del, 302 sub ] exp/tri3/decode_et_simu_2ch_wpe/wer_17_1.0_near_room1 +%WER 8.75 [ 545 / 6226, 77 ins, 64 del, 404 sub ] exp/tri3/decode_et_simu_2ch_wpe/wer_13_0.5_near_room2 +%WER 9.08 [ 533 / 5868, 86 ins, 82 del, 365 sub ] exp/tri3/decode_et_simu_2ch_wpe/wer_12_1.0_near_room3 + +exp/tri3/decode_dt_real_8ch_wpe +%WER 27.41 [ 401 / 1463, 44 ins, 71 del, 286 sub ] exp/tri3/decode_dt_real_8ch_wpe/wer_15_1.0_far_room1 +%WER 23.96 [ 384 / 1603, 42 ins, 83 del, 259 sub ] exp/tri3/decode_dt_real_8ch_wpe/wer_15_1.0_near_room1 + +exp/tri3/decode_dt_simu_8ch_wpe +%WER 6.31 [ 257 / 4071, 43 ins, 46 del, 168 sub ] exp/tri3/decode_dt_simu_8ch_wpe/wer_16_1.0_far_room1 +%WER 8.92 [ 362 / 4058, 63 ins, 56 del, 243 sub ] exp/tri3/decode_dt_simu_8ch_wpe/wer_12_1.0_far_room2 +%WER 9.67 [ 
391 / 4045, 131 ins, 42 del, 218 sub ] exp/tri3/decode_dt_simu_8ch_wpe/wer_14_1.0_far_room3 +%WER 6.07 [ 247 / 4071, 39 ins, 39 del, 169 sub ] exp/tri3/decode_dt_simu_8ch_wpe/wer_16_1.0_near_room1 +%WER 7.22 [ 293 / 4058, 60 ins, 32 del, 201 sub ] exp/tri3/decode_dt_simu_8ch_wpe/wer_13_0.5_near_room2 +%WER 6.23 [ 252 / 4045, 54 ins, 25 del, 173 sub ] exp/tri3/decode_dt_simu_8ch_wpe/wer_14_0.0_near_room3 + +exp/tri3/decode_et_real_8ch_wpe +%WER 22.01 [ 652 / 2962, 118 ins, 87 del, 447 sub ] exp/tri3/decode_et_real_8ch_wpe/wer_17_0.5_far_room1 +%WER 23.95 [ 750 / 3131, 134 ins, 125 del, 491 sub ] exp/tri3/decode_et_real_8ch_wpe/wer_16_1.0_near_room1 + +exp/tri3/decode_et_simu_8ch_wpe +%WER 7.16 [ 423 / 5907, 89 ins, 44 del, 290 sub ] exp/tri3/decode_et_simu_8ch_wpe/wer_15_0.5_far_room1 +%WER 9.73 [ 606 / 6226, 87 ins, 90 del, 429 sub ] exp/tri3/decode_et_simu_8ch_wpe/wer_14_1.0_far_room2 +%WER 9.22 [ 541 / 5868, 105 ins, 77 del, 359 sub ] exp/tri3/decode_et_simu_8ch_wpe/wer_15_1.0_far_room3 +%WER 7.08 [ 418 / 5907, 70 ins, 45 del, 303 sub ] exp/tri3/decode_et_simu_8ch_wpe/wer_17_1.0_near_room1 +%WER 7.98 [ 497 / 6226, 61 ins, 80 del, 356 sub ] exp/tri3/decode_et_simu_8ch_wpe/wer_15_1.0_near_room2 +%WER 7.91 [ 464 / 5868, 83 ins, 67 del, 314 sub ] exp/tri3/decode_et_simu_8ch_wpe/wer_16_1.0_near_room3 exp/tri3/decode_dt_real_2ch_beamformit -%WER 25.91 [ 379 / 1463, 32 ins, 72 del, 275 sub ] exp/tri3/decode_dt_real_2ch_beamformit/wer_16_1.0_far_room1 -%WER 21.46 [ 344 / 1603, 36 ins, 87 del, 221 sub ] exp/tri3/decode_dt_real_2ch_beamformit/wer_17_0.0_near_room1 +%WER 28.43 [ 416 / 1463, 32 ins, 82 del, 302 sub ] exp/tri3/decode_dt_real_2ch_beamformit/wer_17_1.0_far_room1 +%WER 23.46 [ 376 / 1603, 26 ins, 98 del, 252 sub ] exp/tri3/decode_dt_real_2ch_beamformit/wer_17_1.0_near_room1 exp/tri3/decode_dt_simu_2ch_beamformit -%WER 4.91 [ 200 / 4071, 42 ins, 26 del, 132 sub ] exp/tri3/decode_dt_simu_2ch_beamformit/wer_17_0.0_far_room1 -%WER 6.38 [ 259 / 4058, 35 ins, 38 del, 
186 sub ] exp/tri3/decode_dt_simu_2ch_beamformit/wer_15_1.0_far_room2 -%WER 5.12 [ 207 / 4045, 34 ins, 29 del, 144 sub ] exp/tri3/decode_dt_simu_2ch_beamformit/wer_13_1.0_far_room3 -%WER 5.21 [ 212 / 4071, 56 ins, 27 del, 129 sub ] exp/tri3/decode_dt_simu_2ch_beamformit/wer_16_0.0_near_room1 -%WER 5.32 [ 216 / 4058, 30 ins, 33 del, 153 sub ] exp/tri3/decode_dt_simu_2ch_beamformit/wer_17_1.0_near_room2 -%WER 5.07 [ 205 / 4045, 35 ins, 26 del, 144 sub ] exp/tri3/decode_dt_simu_2ch_beamformit/wer_14_0.0_near_room3 +%WER 6.46 [ 263 / 4071, 57 ins, 36 del, 170 sub ] exp/tri3/decode_dt_simu_2ch_beamformit/wer_14_0.5_far_room1 +%WER 11.80 [ 479 / 4058, 59 ins, 87 del, 333 sub ] exp/tri3/decode_dt_simu_2ch_beamformit/wer_10_1.0_far_room2 +%WER 13.75 [ 556 / 4045, 97 ins, 90 del, 369 sub ] exp/tri3/decode_dt_simu_2ch_beamformit/wer_11_0.5_far_room3 +%WER 6.29 [ 256 / 4071, 49 ins, 41 del, 166 sub ] exp/tri3/decode_dt_simu_2ch_beamformit/wer_17_1.0_near_room1 +%WER 6.36 [ 258 / 4058, 42 ins, 33 del, 183 sub ] exp/tri3/decode_dt_simu_2ch_beamformit/wer_12_1.0_near_room2 +%WER 6.67 [ 270 / 4045, 42 ins, 45 del, 183 sub ] exp/tri3/decode_dt_simu_2ch_beamformit/wer_12_1.0_near_room3 exp/tri3/decode_et_real_2ch_beamformit -%WER 17.45 [ 517 / 2962, 74 ins, 91 del, 352 sub ] exp/tri3/decode_et_real_2ch_beamformit/wer_17_0.5_far_room1 -%WER 18.78 [ 588 / 3131, 88 ins, 99 del, 401 sub ] exp/tri3/decode_et_real_2ch_beamformit/wer_16_0.5_near_room1 +%WER 25.05 [ 742 / 2962, 75 ins, 159 del, 508 sub ] exp/tri3/decode_et_real_2ch_beamformit/wer_16_1.0_far_room1 +%WER 23.83 [ 746 / 3131, 87 ins, 146 del, 513 sub ] exp/tri3/decode_et_real_2ch_beamformit/wer_17_1.0_near_room1 exp/tri3/decode_et_simu_2ch_beamformit -%WER 5.43 [ 321 / 5907, 63 ins, 44 del, 214 sub ] exp/tri3/decode_et_simu_2ch_beamformit/wer_17_1.0_far_room1 -%WER 6.75 [ 420 / 6226, 50 ins, 62 del, 308 sub ] exp/tri3/decode_et_simu_2ch_beamformit/wer_14_1.0_far_room2 -%WER 6.87 [ 403 / 5868, 75 ins, 47 del, 281 sub ] 
exp/tri3/decode_et_simu_2ch_beamformit/wer_13_0.0_far_room3 -%WER 5.59 [ 330 / 5907, 70 ins, 46 del, 214 sub ] exp/tri3/decode_et_simu_2ch_beamformit/wer_17_1.0_near_room1 -%WER 5.89 [ 367 / 6226, 45 ins, 62 del, 260 sub ] exp/tri3/decode_et_simu_2ch_beamformit/wer_17_1.0_near_room2 -%WER 6.61 [ 388 / 5868, 55 ins, 67 del, 266 sub ] exp/tri3/decode_et_simu_2ch_beamformit/wer_17_0.5_near_room3 +%WER 6.97 [ 412 / 5907, 71 ins, 38 del, 303 sub ] exp/tri3/decode_et_simu_2ch_beamformit/wer_16_0.5_far_room1 +%WER 12.50 [ 778 / 6226, 104 ins, 104 del, 570 sub ] exp/tri3/decode_et_simu_2ch_beamformit/wer_12_0.0_far_room2 +%WER 15.59 [ 915 / 5868, 134 ins, 153 del, 628 sub ] exp/tri3/decode_et_simu_2ch_beamformit/wer_13_0.0_far_room3 +%WER 7.36 [ 435 / 5907, 80 ins, 48 del, 307 sub ] exp/tri3/decode_et_simu_2ch_beamformit/wer_17_1.0_near_room1 +%WER 7.73 [ 481 / 6226, 52 ins, 81 del, 348 sub ] exp/tri3/decode_et_simu_2ch_beamformit/wer_17_1.0_near_room2 +%WER 8.64 [ 507 / 5868, 78 ins, 77 del, 352 sub ] exp/tri3/decode_et_simu_2ch_beamformit/wer_13_1.0_near_room3 exp/tri3/decode_dt_real_8ch_beamformit -%WER 19.75 [ 289 / 1463, 41 ins, 38 del, 210 sub ] exp/tri3/decode_dt_real_8ch_beamformit/wer_15_1.0_far_room1 -%WER 15.41 [ 247 / 1603, 27 ins, 47 del, 173 sub ] exp/tri3/decode_dt_real_8ch_beamformit/wer_15_1.0_near_room1 +%WER 20.71 [ 303 / 1463, 41 ins, 43 del, 219 sub ] exp/tri3/decode_dt_real_8ch_beamformit/wer_14_1.0_far_room1 +%WER 17.28 [ 277 / 1603, 24 ins, 57 del, 196 sub ] exp/tri3/decode_dt_real_8ch_beamformit/wer_17_1.0_near_room1 exp/tri3/decode_dt_simu_8ch_beamformit -%WER 4.77 [ 194 / 4071, 39 ins, 27 del, 128 sub ] exp/tri3/decode_dt_simu_8ch_beamformit/wer_17_0.5_far_room1 -%WER 5.45 [ 221 / 4058, 46 ins, 24 del, 151 sub ] exp/tri3/decode_dt_simu_8ch_beamformit/wer_16_0.0_far_room2 -%WER 4.20 [ 170 / 4045, 25 ins, 26 del, 119 sub ] exp/tri3/decode_dt_simu_8ch_beamformit/wer_13_1.0_far_room3 -%WER 4.91 [ 200 / 4071, 55 ins, 20 del, 125 sub ] 
exp/tri3/decode_dt_simu_8ch_beamformit/wer_14_0.0_near_room1 -%WER 5.22 [ 212 / 4058, 33 ins, 26 del, 153 sub ] exp/tri3/decode_dt_simu_8ch_beamformit/wer_15_1.0_near_room2 -%WER 4.08 [ 165 / 4045, 28 ins, 20 del, 117 sub ] exp/tri3/decode_dt_simu_8ch_beamformit/wer_13_1.0_near_room3 +%WER 6.17 [ 251 / 4071, 41 ins, 43 del, 167 sub ] exp/tri3/decode_dt_simu_8ch_beamformit/wer_17_1.0_far_room1 +%WER 7.20 [ 292 / 4058, 58 ins, 44 del, 190 sub ] exp/tri3/decode_dt_simu_8ch_beamformit/wer_17_0.5_far_room2 +%WER 5.41 [ 219 / 4045, 43 ins, 27 del, 149 sub ] exp/tri3/decode_dt_simu_8ch_beamformit/wer_14_0.5_far_room3 +%WER 6.12 [ 249 / 4071, 51 ins, 37 del, 161 sub ] exp/tri3/decode_dt_simu_8ch_beamformit/wer_15_1.0_near_room1 +%WER 7.32 [ 297 / 4058, 105 ins, 27 del, 165 sub ] exp/tri3/decode_dt_simu_8ch_beamformit/wer_13_1.0_near_room2 +%WER 5.34 [ 216 / 4045, 48 ins, 31 del, 137 sub ] exp/tri3/decode_dt_simu_8ch_beamformit/wer_14_1.0_near_room3 exp/tri3/decode_et_real_8ch_beamformit -%WER 14.38 [ 426 / 2962, 72 ins, 71 del, 283 sub ] exp/tri3/decode_et_real_8ch_beamformit/wer_15_1.0_far_room1 -%WER 13.86 [ 434 / 3131, 68 ins, 70 del, 296 sub ] exp/tri3/decode_et_real_8ch_beamformit/wer_17_1.0_near_room1 +%WER 16.91 [ 501 / 2962, 93 ins, 71 del, 337 sub ] exp/tri3/decode_et_real_8ch_beamformit/wer_15_1.0_far_room1 +%WER 15.59 [ 488 / 3131, 86 ins, 74 del, 328 sub ] exp/tri3/decode_et_real_8ch_beamformit/wer_17_1.0_near_room1 exp/tri3/decode_et_simu_8ch_beamformit -%WER 5.59 [ 330 / 5907, 87 ins, 36 del, 207 sub ] exp/tri3/decode_et_simu_8ch_beamformit/wer_14_1.0_far_room1 -%WER 6.10 [ 380 / 6226, 51 ins, 55 del, 274 sub ] exp/tri3/decode_et_simu_8ch_beamformit/wer_15_1.0_far_room2 -%WER 6.24 [ 366 / 5868, 57 ins, 51 del, 258 sub ] exp/tri3/decode_et_simu_8ch_beamformit/wer_14_1.0_far_room3 -%WER 5.62 [ 332 / 5907, 74 ins, 44 del, 214 sub ] exp/tri3/decode_et_simu_8ch_beamformit/wer_16_1.0_near_room1 -%WER 5.73 [ 357 / 6226, 56 ins, 57 del, 244 sub ] 
exp/tri3/decode_et_simu_8ch_beamformit/wer_17_1.0_near_room2 -%WER 5.93 [ 348 / 5868, 62 ins, 52 del, 234 sub ] exp/tri3/decode_et_simu_8ch_beamformit/wer_14_1.0_near_room3 +%WER 6.57 [ 388 / 5907, 71 ins, 49 del, 268 sub ] exp/tri3/decode_et_simu_8ch_beamformit/wer_15_1.0_far_room1 +%WER 7.60 [ 473 / 6226, 81 ins, 65 del, 327 sub ] exp/tri3/decode_et_simu_8ch_beamformit/wer_15_0.5_far_room2 +%WER 7.26 [ 426 / 5868, 64 ins, 67 del, 295 sub ] exp/tri3/decode_et_simu_8ch_beamformit/wer_17_1.0_far_room3 +%WER 7.11 [ 420 / 5907, 77 ins, 53 del, 290 sub ] exp/tri3/decode_et_simu_8ch_beamformit/wer_17_1.0_near_room1 +%WER 7.07 [ 440 / 6226, 78 ins, 66 del, 296 sub ] exp/tri3/decode_et_simu_8ch_beamformit/wer_17_1.0_near_room2 +%WER 7.00 [ 411 / 5868, 83 ins, 59 del, 269 sub ] exp/tri3/decode_et_simu_8ch_beamformit/wer_14_1.0_near_room3 + +exp/tri3/decode_et_cln +%WER 6.74 [ 1213 / 18001, 234 ins, 158 del, 821 sub ] exp/tri3/decode_et_cln/wer_15_1.0_cln_room ######################################## +TDNN RESULTs: +exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt* +%WER 20.44 [ 299 / 1463, 22 ins, 75 del, 202 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_real_1ch/wer_10_0.5_far_room1 +%WER 18.59 [ 298 / 1603, 16 ins, 79 del, 203 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_real_1ch/wer_13_0.0_near_room1 +%WER 17.91 [ 262 / 1463, 24 ins, 59 del, 179 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_real_1ch_wpe/wer_8_0.5_far_room1 +%WER 16.16 [ 259 / 1603, 16 ins, 64 del, 179 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_real_1ch_wpe/wer_11_0.0_near_room1 +%WER 16.13 [ 236 / 1463, 21 ins, 66 del, 149 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_real_2ch_beamformit/wer_10_1.0_far_room1 +%WER 11.92 [ 191 / 1603, 16 ins, 37 del, 138 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_real_2ch_beamformit/wer_12_0.0_near_room1 +%WER 18.25 [ 267 / 1463, 21 ins, 70 del, 176 sub ] 
exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_real_2ch_wpe/wer_9_0.5_far_room1 +%WER 14.60 [ 234 / 1603, 14 ins, 51 del, 169 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_real_2ch_wpe/wer_10_0.0_near_room1 +%WER 12.24 [ 179 / 1463, 10 ins, 51 del, 118 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_real_8ch_beamformit/wer_11_1.0_far_room1 +%WER 9.61 [ 154 / 1603, 15 ins, 30 del, 109 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_real_8ch_beamformit/wer_11_0.0_near_room1 +%WER 16.20 [ 237 / 1463, 19 ins, 80 del, 138 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_real_8ch_wpe/wer_11_0.5_far_room1 +%WER 12.98 [ 208 / 1603, 20 ins, 54 del, 134 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_real_8ch_wpe/wer_10_0.0_near_room1 +%WER 3.19 [ 130 / 4071, 16 ins, 27 del, 87 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_1ch/wer_7_0.5_far_room1 +%WER 7.29 [ 296 / 4058, 35 ins, 51 del, 210 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_1ch/wer_7_0.5_far_room2 +%WER 7.17 [ 290 / 4045, 31 ins, 57 del, 202 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_1ch/wer_9_0.0_far_room3 +%WER 3.00 [ 122 / 4071, 14 ins, 22 del, 86 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_1ch/wer_9_0.0_near_room1 +%WER 3.43 [ 139 / 4058, 12 ins, 21 del, 106 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_1ch/wer_7_1.0_near_room2 +%WER 3.86 [ 156 / 4045, 19 ins, 28 del, 109 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_1ch/wer_7_0.0_near_room3 +%WER 3.12 [ 127 / 4071, 20 ins, 19 del, 88 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_1ch_wpe/wer_8_0.0_far_room1 +%WER 6.73 [ 273 / 4058, 33 ins, 46 del, 194 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_1ch_wpe/wer_7_0.5_far_room2 +%WER 6.50 [ 263 / 4045, 34 ins, 47 del, 182 sub ] 
exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_1ch_wpe/wer_9_0.0_far_room3 +%WER 3.00 [ 122 / 4071, 15 ins, 13 del, 94 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_1ch_wpe/wer_7_0.0_near_room1 +%WER 3.25 [ 132 / 4058, 21 ins, 15 del, 96 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_1ch_wpe/wer_8_0.0_near_room2 +%WER 3.78 [ 153 / 4045, 23 ins, 24 del, 106 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_1ch_wpe/wer_7_0.0_near_room3 +%WER 3.10 [ 126 / 4071, 22 ins, 18 del, 86 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_2ch_beamformit/wer_8_0.0_far_room1 +%WER 4.44 [ 180 / 4058, 16 ins, 36 del, 128 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_2ch_beamformit/wer_9_1.0_far_room2 +%WER 4.70 [ 190 / 4045, 30 ins, 26 del, 134 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_2ch_beamformit/wer_9_0.0_far_room3 +%WER 2.82 [ 115 / 4071, 12 ins, 18 del, 85 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_2ch_beamformit/wer_8_0.0_near_room1 +%WER 2.88 [ 117 / 4058, 8 ins, 26 del, 83 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_2ch_beamformit/wer_8_1.0_near_room2 +%WER 3.39 [ 137 / 4045, 25 ins, 20 del, 92 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_2ch_beamformit/wer_7_0.0_near_room3 +%WER 3.00 [ 122 / 4071, 19 ins, 17 del, 86 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_2ch_wpe/wer_8_0.0_far_room1 +%WER 5.40 [ 219 / 4058, 26 ins, 38 del, 155 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_2ch_wpe/wer_7_1.0_far_room2 +%WER 5.86 [ 237 / 4045, 22 ins, 44 del, 171 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_2ch_wpe/wer_9_0.5_far_room3 +%WER 2.97 [ 121 / 4071, 13 ins, 16 del, 92 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_2ch_wpe/wer_8_0.0_near_room1 +%WER 3.40 [ 138 / 4058, 20 ins, 20 del, 98 sub ] 
exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_2ch_wpe/wer_8_0.0_near_room2 +%WER 3.76 [ 152 / 4045, 14 ins, 30 del, 108 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_2ch_wpe/wer_8_1.0_near_room3 +%WER 3.00 [ 122 / 4071, 13 ins, 22 del, 87 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_8ch_beamformit/wer_7_0.5_far_room1 +%WER 3.03 [ 123 / 4058, 21 ins, 14 del, 88 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_8ch_beamformit/wer_7_0.0_far_room2 +%WER 2.94 [ 119 / 4045, 12 ins, 23 del, 84 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_8ch_beamformit/wer_8_1.0_far_room3 +%WER 2.95 [ 120 / 4071, 15 ins, 14 del, 91 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_8ch_beamformit/wer_7_0.0_near_room1 +%WER 2.64 [ 107 / 4058, 14 ins, 18 del, 75 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_8ch_beamformit/wer_8_0.0_near_room2 +%WER 2.84 [ 115 / 4045, 13 ins, 27 del, 75 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_8ch_beamformit/wer_9_1.0_near_room3 +%WER 2.92 [ 119 / 4071, 14 ins, 21 del, 84 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_8ch_wpe/wer_9_0.0_far_room1 +%WER 3.97 [ 161 / 4058, 14 ins, 38 del, 109 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_8ch_wpe/wer_8_1.0_far_room2 +%WER 3.44 [ 139 / 4045, 14 ins, 21 del, 104 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_8ch_wpe/wer_8_0.5_far_room3 +%WER 2.92 [ 119 / 4071, 13 ins, 18 del, 88 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_8ch_wpe/wer_9_0.0_near_room1 +%WER 3.30 [ 134 / 4058, 13 ins, 29 del, 92 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_8ch_wpe/wer_9_0.5_near_room2 +%WER 3.36 [ 136 / 4045, 15 ins, 27 del, 94 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt_simu_8ch_wpe/wer_9_0.5_near_room3 + +exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et* +%WER 3.55 [ 639 / 18001, 77 ins, 
125 del, 437 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_cln/wer_9_1.0_cln_room +%WER 19.85 [ 588 / 2962, 52 ins, 114 del, 422 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_real_1ch/wer_12_0.0_far_room1 +%WER 18.24 [ 571 / 3131, 39 ins, 159 del, 373 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_real_1ch/wer_10_1.0_near_room1 +%WER 18.10 [ 536 / 2962, 38 ins, 116 del, 382 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_real_1ch_wpe/wer_11_0.5_far_room1 +%WER 15.81 [ 495 / 3131, 61 ins, 96 del, 338 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_real_1ch_wpe/wer_10_0.0_near_room1 +%WER 14.21 [ 421 / 2962, 54 ins, 51 del, 316 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_real_2ch_beamformit/wer_11_0.0_far_room1 +%WER 11.27 [ 353 / 3131, 39 ins, 80 del, 234 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_real_2ch_beamformit/wer_11_0.5_near_room1 +%WER 15.94 [ 472 / 2962, 44 ins, 101 del, 327 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_real_2ch_wpe/wer_11_0.5_far_room1 +%WER 14.53 [ 455 / 3131, 52 ins, 97 del, 306 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_real_2ch_wpe/wer_10_0.5_near_room1 +%WER 10.23 [ 303 / 2962, 41 ins, 44 del, 218 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_real_8ch_beamformit/wer_10_0.5_far_room1 +%WER 9.17 [ 287 / 3131, 35 ins, 61 del, 191 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_real_8ch_beamformit/wer_10_1.0_near_room1 +%WER 12.90 [ 382 / 2962, 30 ins, 77 del, 275 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_real_8ch_wpe/wer_10_1.0_far_room1 +%WER 11.75 [ 368 / 3131, 58 ins, 65 del, 245 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_real_8ch_wpe/wer_10_0.0_near_room1 +%WER 3.74 [ 221 / 5907, 24 ins, 41 del, 156 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_1ch/wer_8_1.0_far_room1 +%WER 7.66 [ 477 / 6226, 43 ins, 100 del, 334 sub ] 
exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_1ch/wer_9_0.5_far_room2 +%WER 7.72 [ 453 / 5868, 33 ins, 114 del, 306 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_1ch/wer_9_1.0_far_room3 +%WER 3.28 [ 194 / 5907, 20 ins, 38 del, 136 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_1ch/wer_9_1.0_near_room1 +%WER 4.75 [ 296 / 6226, 27 ins, 66 del, 203 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_1ch/wer_9_1.0_near_room2 +%WER 4.91 [ 288 / 5868, 31 ins, 56 del, 201 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_1ch/wer_8_1.0_near_room3 +%WER 3.69 [ 218 / 5907, 29 ins, 36 del, 153 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_1ch_wpe/wer_8_0.5_far_room1 +%WER 7.04 [ 438 / 6226, 48 ins, 77 del, 313 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_1ch_wpe/wer_7_0.5_far_room2 +%WER 7.17 [ 421 / 5868, 37 ins, 94 del, 290 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_1ch_wpe/wer_8_1.0_far_room3 +%WER 3.22 [ 190 / 5907, 27 ins, 31 del, 132 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_1ch_wpe/wer_10_0.0_near_room1 +%WER 4.72 [ 294 / 6226, 29 ins, 64 del, 201 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_1ch_wpe/wer_9_1.0_near_room2 +%WER 4.87 [ 286 / 5868, 33 ins, 50 del, 203 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_1ch_wpe/wer_7_1.0_near_room3 +%WER 3.28 [ 194 / 5907, 20 ins, 36 del, 138 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_2ch_beamformit/wer_9_1.0_far_room1 +%WER 5.22 [ 325 / 6226, 36 ins, 72 del, 217 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_2ch_beamformit/wer_9_1.0_far_room2 +%WER 6.00 [ 352 / 5868, 39 ins, 70 del, 243 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_2ch_beamformit/wer_9_1.0_far_room3 +%WER 3.20 [ 189 / 5907, 28 ins, 29 del, 132 sub ] 
exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_2ch_beamformit/wer_10_0.0_near_room1 +%WER 4.18 [ 260 / 6226, 24 ins, 60 del, 176 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_2ch_beamformit/wer_9_1.0_near_room2 +%WER 4.26 [ 250 / 5868, 38 ins, 45 del, 167 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_2ch_beamformit/wer_8_0.5_near_room3 +%WER 3.39 [ 200 / 5907, 27 ins, 35 del, 138 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_2ch_wpe/wer_8_1.0_far_room1 +%WER 6.12 [ 381 / 6226, 28 ins, 94 del, 259 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_2ch_wpe/wer_11_1.0_far_room2 +%WER 6.58 [ 386 / 5868, 39 ins, 77 del, 270 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_2ch_wpe/wer_9_1.0_far_room3 +%WER 3.20 [ 189 / 5907, 29 ins, 30 del, 130 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_2ch_wpe/wer_10_0.0_near_room1 +%WER 4.53 [ 282 / 6226, 29 ins, 61 del, 192 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_2ch_wpe/wer_9_1.0_near_room2 +%WER 4.48 [ 263 / 5868, 26 ins, 49 del, 188 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_2ch_wpe/wer_9_1.0_near_room3 +%WER 3.54 [ 209 / 5907, 27 ins, 36 del, 146 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_8ch_beamformit/wer_9_0.5_far_room1 +%WER 4.11 [ 256 / 6226, 29 ins, 51 del, 176 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_8ch_beamformit/wer_8_1.0_far_room2 +%WER 3.89 [ 228 / 5868, 28 ins, 43 del, 157 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_8ch_beamformit/wer_8_1.0_far_room3 +%WER 3.22 [ 190 / 5907, 24 ins, 29 del, 137 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_8ch_beamformit/wer_8_0.5_near_room1 +%WER 3.71 [ 231 / 6226, 24 ins, 55 del, 152 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_8ch_beamformit/wer_9_1.0_near_room2 +%WER 3.66 [ 215 / 5868, 22 ins, 46 del, 147 sub ] 
exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_8ch_beamformit/wer_8_1.0_near_room3 +%WER 3.50 [ 207 / 5907, 19 ins, 42 del, 146 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_8ch_wpe/wer_9_1.0_far_room1 +%WER 5.08 [ 316 / 6226, 34 ins, 59 del, 223 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_8ch_wpe/wer_7_1.0_far_room2 +%WER 4.46 [ 262 / 5868, 33 ins, 48 del, 181 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_8ch_wpe/wer_10_0.5_far_room3 +%WER 3.35 [ 198 / 5907, 16 ins, 41 del, 141 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_8ch_wpe/wer_10_1.0_near_room1 +%WER 4.42 [ 275 / 6226, 27 ins, 56 del, 192 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_8ch_wpe/wer_8_1.0_near_room2 +%WER 3.92 [ 230 / 5868, 37 ins, 36 del, 157 sub ] exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_et_simu_8ch_wpe/wer_9_0.0_near_room3 diff --git a/egs/reverb/s5/local/compute_se_scores.sh b/egs/reverb/s5/local/compute_se_scores.sh new file mode 100755 index 00000000000..d65fbbca2f4 --- /dev/null +++ b/egs/reverb/s5/local/compute_se_scores.sh @@ -0,0 +1,39 @@ +#!/bin/bash +# Copyright 2018 Johns Hopkins University (Author: Aswin Shanmugam Subramanian) +# Apache 2.0 + +# This script computes the dereverberation scores given in REVERB challenge +# Eg. local/compute_se_scores.sh --nch 8 /export/corpora5/REVERB_2014/REVERB ${PWD}/wav ${PWD}/local + +. ./cmd.sh +. ./path.sh +set -e +set -u +set -o pipefail + +cmd=run.pl +nch=8 + +. 
utils/parse_options.sh || exit 1; + +if [ $# != 3 ]; then + echo "Wrong #arguments ($#, expected 3)" + echo "Usage: local/compute_se.sh [options] " + echo "options" + echo " --cmd # Command to run in parallel with" + echo " --nch # nch of WPE to use for computing SE scores" + exit 1; +fi + +reverb_data=$1 +enhancement_directory=$2 +pesqdir=$3 +enhancement_directory_sim=$enhancement_directory/WPE/${nch}ch/REVERB_WSJCAM0_dt/data/ +enhancement_directory_real=$enhancement_directory/WPE/${nch}ch/MC_WSJ_AV_Dev/ + +expdir=${PWD}/exp/compute_se_${nch}ch +pushd local/REVERB_scores_source/REVERB-SPEENHA.Release04Oct/evaltools +$cmd $expdir/compute_se_real.log matlab -nodisplay -nosplash -r "addpath('SRMRToolbox'); score_RealData('$reverb_data','$enhancement_directory_real');exit" +$cmd $expdir/compute_se_sim.log matlab -nodisplay -nosplash -r "addpath('SRMRToolbox'); score_SimData('$reverb_data','$enhancement_directory_sim','$pesqdir');exit" +popd +mv local/REVERB_scores_source/REVERB-SPEENHA.Release04Oct/scores $expdir/ diff --git a/egs/reverb/s5/local/download_se_eval_tool.sh b/egs/reverb/s5/local/download_se_eval_tool.sh new file mode 100755 index 00000000000..c7b272907b6 --- /dev/null +++ b/egs/reverb/s5/local/download_se_eval_tool.sh @@ -0,0 +1,33 @@ +#!/bin/bash +# Copyright 2018 Johns Hopkins University (Author: Aswin Shanmugam Subramanian) +# This script downloads the official REVERB challenge SE scripts and SRMR toolbox +# This script also downloads and compiles PESQ +# please make sure that you or your institution have the license to report PESQ +# Apache 2.0 + +wget 'https://www.itu.int/rec/dologin_pub.asp?lang=e&id=T-REC-P.862-200102-I!!SOFT-ZST-E&type=items' -O PESQ.zip +unzip PESQ.zip -d local/PESQ_sources +rm PESQ.zip +cd local/PESQ_sources/P862/Software/source +gcc *.c -lm -o PESQ +cd ../../../../../ +mv local/PESQ_sources/P862/Software/source/PESQ local/ + +wget 'https://reverb2014.dereverberation.com/tools/REVERB-SPEENHA.Release04Oct.zip' -O 
REVERB_scores.zip +unzip REVERB_scores.zip -d local/REVERB_scores_source +rm REVERB_scores.zip + +pushd local/REVERB_scores_source/REVERB-SPEENHA.Release04Oct/evaltools +sed -i 's/wavread/audioread/g' prog/score_sim.m +git clone https://github.com/MuSAELab/SRMRToolbox.git +sed -i 's/wavread/audioread/g' SRMRToolbox/libs/preprocess.m +sed -i 's/SRMR_main/SRMR/g' prog/score_real.m +sed -i 's/SRMR_main/SRMR/g' prog/score_sim.m +sed -i 's/+wb\ //g' prog/calcpesq.m +sed -i 's/pesq_/_pesq_/g' prog/calcpesq.m +sed -ie '30d;31d' prog/calcpesq.m +patch score_RealData.m -i ../../../score_RealData.patch -o score_RealData_new.m +mv score_RealData_new.m score_RealData.m +patch score_SimData.m -i ../../../score_SimData.patch -o score_SimData_new.m +mv score_SimData_new.m score_SimData.m +popd diff --git a/egs/reverb/s5/local/get_results.sh b/egs/reverb/s5/local/get_results.sh index e1fca60a2dd..8867961dcdd 100755 --- a/egs/reverb/s5/local/get_results.sh +++ b/egs/reverb/s5/local/get_results.sh @@ -15,6 +15,18 @@ echo "" echo "exp/tri3/decode_et_simu_1ch" cat exp/tri3/decode_et_simu_1ch/scoring_kaldi/best_wer* echo "" +echo "exp/tri3/decode_dt_real_1ch_wpe" +cat exp/tri3/decode_dt_real_1ch_wpe/scoring_kaldi/best_wer* +echo "" +echo "exp/tri3/decode_dt_simu_1ch_wpe" +cat exp/tri3/decode_dt_simu_1ch_wpe/scoring_kaldi/best_wer* +echo "" +echo "exp/tri3/decode_et_real_1ch_wpe" +cat exp/tri3/decode_et_real_1ch_wpe/scoring_kaldi/best_wer* +echo "" +echo "exp/tri3/decode_et_simu_1ch_wpe" +cat exp/tri3/decode_et_simu_1ch_wpe/scoring_kaldi/best_wer* +echo "" echo "exp/tri3/decode_dt_real_2ch_wpe" cat exp/tri3/decode_dt_real_2ch_wpe/scoring_kaldi/best_wer* echo "" @@ -60,8 +72,11 @@ echo "" echo "exp/tri3/decode_et_real_8ch_beamformit" cat exp/tri3/decode_et_real_8ch_beamformit/scoring_kaldi/best_wer* echo "" -echo "exp/tri3/decode_et_simu_8ch_beamformit" -cat exp/tri3/decode_et_simu_8ch_beamformit/scoring_kaldi/best_wer* +echo "exp/tri3/decode_dt_cln" +cat 
exp/tri3/decode_dt_cln/scoring_kaldi/best_wer* +echo "" +echo "exp/tri3/decode_et_cln" +cat exp/tri3/decode_et_cln/scoring_kaldi/best_wer* echo "########################################" echo "TDNN RESULTs:" echo "exp/chain_tr_simu_8ch/tdnn1a_sp/decode_test_tg_5k_dt*" diff --git a/egs/reverb/s5/local/prepare_simu_data.sh b/egs/reverb/s5/local/prepare_simu_data.sh index cfdc226dd1e..8757021ddd7 100755 --- a/egs/reverb/s5/local/prepare_simu_data.sh +++ b/egs/reverb/s5/local/prepare_simu_data.sh @@ -54,6 +54,12 @@ for nch in 1 2 8; do perl -se 'while (<>) { chomp; if (m/\/(\w{8})[^\/]+$/) { print $1, " ", $dir, $_, "\n"; } }' -- -dir=${reverb}/REVERB_WSJCAM0_${task}/data ${taskdir}/$x |\ sed -e "s/^\(...\)/\1_${x}_\1/" done > ${dir}/${task}_simu_${nch}ch_wav.scp + if [ ${nch} == 1 ]; then + for x in `ls ${taskdir} | grep SimData | grep _${task}_ | grep -e cln`; do + perl -se 'while (<>) { chomp; if (m/\/(\w{8})[^\/]+$/) { print $1, " ", $dir, $_, "\n"; } }' -- -dir=${reverb}/REVERB_WSJCAM0_${task}/data ${taskdir}/$x |\ + sed -e "s/^\(...\)/\1_${x}_\1/" + done > ${dir}/${task}_cln_wav.scp + fi done task=tr @@ -83,6 +89,14 @@ for nch in 1 2 8; do sed -e "s/^\(...\)/\1_${x}_\1/" done > ${dir}/${task}_simu_${nch}ch.trans1 || exit 1; cat ${dir}/${task}_simu_${nch}ch.trans1 | local/normalize_transcript.pl ${noiseword} > ${dir}/${task}_simu_${nch}ch.txt || exit 1; + if [ ${nch} == 1 ]; then + for x in `ls ${taskdir} | grep SimData | grep _${task}_ | grep -e cln`; do + perl -e 'while (<>) { chomp; if (m/\/(\w{8})[^\/]+$/) { print $1, "\n"; } }' ${taskdir}/$x |\ + perl local/find_transcripts_singledot.pl ${dir}/${task}.dot |\ + sed -e "s/^\(...\)/\1_${x}_\1/" + done > ${dir}/${task}_cln.trans1 || exit 1; + cat ${dir}/${task}_cln.trans1 | local/normalize_transcript.pl ${noiseword} > ${dir}/${task}_cln.txt || exit 1; + fi done # Make the utt2spk and spk2utt files. 
@@ -90,6 +104,10 @@ for nch in 1 2 8; do cat ${dir}/${task}_simu_${nch}ch_wav.scp | awk '{print $1}' | awk -F '_' '{print $0 " " $1}' > ${dir}/${task}_simu_${nch}ch.utt2spk || exit 1; cat ${dir}/${task}_simu_${nch}ch.utt2spk | ./utils/utt2spk_to_spk2utt.pl > ${dir}/${task}_simu_${nch}ch.spk2utt || exit 1; done + for task in dt et; do + cat ${dir}/${task}_cln_wav.scp | awk '{print $1}' | awk -F '_' '{print $0 " " $1}' > ${dir}/${task}_cln.utt2spk || exit 1; + cat ${dir}/${task}_cln.utt2spk | ./utils/utt2spk_to_spk2utt.pl > ${dir}/${task}_cln.spk2utt || exit 1; + done done # finally copy the above files to the data directory @@ -118,6 +136,14 @@ for nch in 1 2 8; do sort ${dir}/${task}_simu_1ch.utt2spk > ${datadir}/utt2spk sort ${dir}/${task}_simu_1ch.spk2utt > ${datadir}/spk2utt ./utils/fix_data_dir.sh ${datadir} + else + datadir=data/${task}_cln + mkdir -p ${datadir} + sort ${dir}/${task}_cln_wav.scp > ${datadir}/wav.scp + sort ${dir}/${task}_cln.txt > ${datadir}/text + sort ${dir}/${task}_cln.utt2spk > ${datadir}/utt2spk + sort ${dir}/${task}_cln.spk2utt > ${datadir}/spk2utt + ./utils/fix_data_dir.sh ${datadir} fi fi done diff --git a/egs/reverb/s5/local/score.sh b/egs/reverb/s5/local/score.sh index 00adb14d854..66bc976333f 100755 --- a/egs/reverb/s5/local/score.sh +++ b/egs/reverb/s5/local/score.sh @@ -63,6 +63,9 @@ mkdir -p $dir/scoring_kaldi if echo $data | grep -q "real"; then tasks="\ near_room1 far_room1" +elif echo $data | grep -q "cln"; then + tasks="\ + cln_room1 cln_room2 cln_room3" else tasks="\ near_room1 far_room1 \ diff --git a/egs/reverb/s5/run.sh b/egs/reverb/s5/run.sh index 3cc3efca9e7..89f77e3e01a 100755 --- a/egs/reverb/s5/run.sh +++ b/egs/reverb/s5/run.sh @@ -36,6 +36,10 @@ fi . ./path.sh stage=0 +nch_se=8 +# flag for turning on computation of dereverberation measures +# please make sure that you or your institution have the license to report PESQ before turning on the flag +compute_se=false . 
utils/parse_options.sh # Set bash to 'debug' mode, it prints the commands (option '-x') and exits on : @@ -57,7 +61,7 @@ fi #training set and test set train_set=tr_simu_8ch -test_sets="dt_real_1ch dt_simu_1ch et_real_1ch et_simu_1ch dt_real_2ch_beamformit dt_simu_2ch_beamformit et_real_2ch_beamformit et_simu_2ch_beamformit dt_real_8ch_beamformit dt_simu_8ch_beamformit et_real_8ch_beamformit et_simu_8ch_beamformit dt_real_1ch_wpe dt_simu_1ch_wpe et_real_1ch_wpe et_simu_1ch_wpe dt_real_2ch_wpe dt_simu_2ch_wpe et_real_2ch_wpe et_simu_2ch_wpe dt_real_8ch_wpe dt_simu_8ch_wpe et_real_8ch_wpe et_simu_8ch_wpe" +test_sets="dt_real_1ch dt_simu_1ch et_real_1ch et_simu_1ch dt_real_2ch_beamformit dt_simu_2ch_beamformit et_real_2ch_beamformit et_simu_2ch_beamformit dt_real_8ch_beamformit dt_simu_8ch_beamformit et_real_8ch_beamformit et_simu_8ch_beamformit dt_real_1ch_wpe dt_simu_1ch_wpe et_real_1ch_wpe et_simu_1ch_wpe dt_real_2ch_wpe dt_simu_2ch_wpe et_real_2ch_wpe et_simu_2ch_wpe dt_real_8ch_wpe dt_simu_8ch_wpe et_real_8ch_wpe et_simu_8ch_wpe dt_cln et_cln" # The language models with which to decode (tg_5k or bg_5k) lm="tg_5k" @@ -68,6 +72,7 @@ nj=92 decode_nj=10 wavdir=${PWD}/wav +pesqdir=${PWD}/local if [ ${stage} -le 1 ]; then # data preparation echo "stage 0: Data preparation" @@ -81,7 +86,18 @@ if [ $stage -le 2 ]; then local/run_beamform.sh ${wavdir}/WPE/ fi -if [ $stage -le 3 ]; then +# Compute dereverberation scores +if [ $stage -le 3 ] && $compute_se; then + if [ ! -d local/REVERB_scores_source ] || [ ! -d local/REVERB_scores_source/REVERB-SPEENHA.Release04Oct/evaltools/SRMRToolbox ] || [ ! -f local/PESQ ]; then + # download and install speech enhancement evaluation tools + local/download_se_eval_tool.sh + fi + local/compute_se_scores.sh --nch $nch_se $reverb $wavdir $pesqdir + cat exp/compute_se_${nch_se}ch/scores/score_SimData + cat exp/compute_se_${nch_se}ch/scores/score_RealData +fi + +if [ $stage -le 4 ]; then # Prepare wsjcam0 clean data and wsj0 language model. 
local/wsjcam0_data_prep.sh $wsjcam0 $wsj0 @@ -105,14 +121,14 @@ if [ $stage -le 3 ]; then data/lang $LM data/local/dict/lexicon.txt data/lang fi -if [ $stage -le 4 ]; then +if [ $stage -le 5 ]; then for dset in ${train_set} ${test_sets}; do utils/copy_data_dir.sh data/${dset} data/${dset}_nosplit utils/data/modify_speaker_info.sh --seconds-per-spk-max 180 data/${dset}_nosplit data/${dset} done fi -if [ $stage -le 5 ]; then +if [ $stage -le 6 ]; then # Extract MFCC features for train and test sets. mfccdir=mfcc for x in ${train_set} ${test_sets}; do @@ -122,13 +138,13 @@ if [ $stage -le 5 ]; then done fi -if [ $stage -le 6 ]; then +if [ $stage -le 7 ]; then # Starting basic training on MFCC features steps/train_mono.sh --nj $nj --cmd "$train_cmd" \ data/${train_set} data/lang exp/mono fi -if [ $stage -le 7 ]; then +if [ $stage -le 8 ]; then steps/align_si.sh --nj $nj --cmd "$train_cmd" \ data/${train_set} data/lang exp/mono exp/mono_ali @@ -136,7 +152,7 @@ if [ $stage -le 7 ]; then 2500 30000 data/${train_set} data/lang exp/mono_ali exp/tri1 fi -if [ $stage -le 8 ]; then +if [ $stage -le 9 ]; then steps/align_si.sh --nj $nj --cmd "$train_cmd" \ data/${train_set} data/lang exp/tri1 exp/tri1_ali @@ -144,7 +160,7 @@ if [ $stage -le 8 ]; then 4000 50000 data/${train_set} data/lang exp/tri1_ali exp/tri2 fi -if [ $stage -le 9 ]; then +if [ $stage -le 10 ]; then utils/mkgraph.sh data/lang_test_$lm exp/tri2 exp/tri2/graph for dset in ${test_sets}; do steps/decode.sh --nj $decode_nj --cmd "$decode_cmd" --num-threads 4 \ @@ -153,7 +169,7 @@ if [ $stage -le 9 ]; then wait fi -if [ $stage -le 10 ]; then +if [ $stage -le 11 ]; then steps/align_si.sh --nj $nj --cmd "$train_cmd" \ data/${train_set} data/lang exp/tri2 exp/tri2_ali @@ -161,7 +177,7 @@ if [ $stage -le 10 ]; then 5000 100000 data/${train_set} data/lang exp/tri2_ali exp/tri3 fi -if [ $stage -le 11 ]; then +if [ $stage -le 12 ]; then utils/mkgraph.sh data/lang_test_$lm exp/tri3 exp/tri3/graph for dset in ${test_sets}; 
do steps/decode_fmllr.sh --nj $decode_nj --cmd "$decode_cmd" --num-threads 4 \ @@ -170,13 +186,13 @@ if [ $stage -le 11 ]; then wait fi -if [ $stage -le 12 ]; then +if [ $stage -le 13 ]; then # chain TDNN local/chain/run_tdnn.sh --nj ${nj} --train-set ${train_set} --test-sets "$test_sets" --gmm tri3 --nnet3-affix _${train_set} \ --lm-suffix _test_$lm fi # get all WERs. -if [ $stage -le 13 ]; then +if [ $stage -le 14 ]; then local/get_results.sh fi