diff --git a/egs/dihard_2018/v2/run.sh b/egs/dihard_2018/v2/run.sh index b0fbdcc968c..6cd6630a838 100755 --- a/egs/dihard_2018/v2/run.sh +++ b/egs/dihard_2018/v2/run.sh @@ -75,6 +75,8 @@ if [ $stage -le 1 ]; then utils/fix_data_dir.sh data/${name}_cmn done + echo "0.01" > data/dihard_2018_dev_cmn/frame_shift + echo "0.01" > data/dihard_2018_eval_cmn/frame_shift echo "0.01" > data/train_cmn/frame_shift # Create segments to extract x-vectors from for PLDA training data. # The segments are created using an energy-based speech activity @@ -292,7 +294,7 @@ if [ $stage -le 12 ]; then > $nnet_dir/results/DER_threshold.txt der=$(grep -oP 'DIARIZATION\ ERROR\ =\ \K[0-9]+([.][0-9]+)?' \ $nnet_dir/results/DER_threshold.txt) - # Using supervised calibration, DER: 26.47% + # Using supervised calibration, DER: 26.30% echo "Using supervised calibration, DER: $der%" fi @@ -309,6 +311,6 @@ if [ $stage -le 13 ]; then > $nnet_dir/results/DER_num_spk.txt der=$(grep -oP 'DIARIZATION\ ERROR\ =\ \K[0-9]+([.][0-9]+)?' \ $nnet_dir/results/DER_num_spk.txt) - # Using the oracle number of speakers, DER: 23.90% + # Using the oracle number of speakers, DER: 23.42% echo "Using the oracle number of speakers, DER: $der%" fi diff --git a/egs/wsj/s5/utils/data/get_uniform_subsegments.py b/egs/wsj/s5/utils/data/get_uniform_subsegments.py index cc3015564a5..a963f35fa70 100755 --- a/egs/wsj/s5/utils/data/get_uniform_subsegments.py +++ b/egs/wsj/s5/utils/data/get_uniform_subsegments.py @@ -73,7 +73,7 @@ def run(args): new_utt = "{utt_id}-{s:08d}-{e:08d}".format( utt_id=utt_id, s=int(100 * start_relative), e=int(100 * end_relative)) - print ("{new_utt} {utt_id} {s} {e}".format( + print ("{new_utt} {utt_id} {s:.3f} {e:.3f}".format( new_utt=new_utt, utt_id=utt_id, s=start_relative, e=start_relative + args.max_segment_duration)) start += args.max_segment_duration - args.overlap_duration @@ -90,7 +90,7 @@ def run(args): new_utt = "{utt_id}-{s:08d}-{e:08d}".format( utt_id=utt_id, s=int(round(100 * (start - start_time))), e=int(round(100 * (end - start_time)))) - print ("{new_utt} {utt_id} {s} {e}".format( + print ("{new_utt} {utt_id} {s:.3f} {e:.3f}".format( new_utt=new_utt, utt_id=utt_id, s=start - start_time, e=end - start_time))