NVIDIA · blisc · Aug 4, 2022 · Aug 3, 2022 · Aug 4, 2022 · Aug 4, 2022
diff --git a/examples/tts/conf/aligner.yaml b/examples/tts/conf/aligner.yaml
@@ -19,7 +19,7 @@ lowfreq: 0
 highfreq: 8000
 window: hann
 
-phoneme_dict_path: "scripts/tts_dataset_files/cmudict-0.7b_nv22.07"
+phoneme_dict_path: "scripts/tts_dataset_files/cmudict-0.7b_nv22.08"
 heteronyms_path: "scripts/tts_dataset_files/heteronyms-052722"
 whitelist_path: "nemo_text_processing/text_normalization/en/data/whitelist/lj_speech.tsv"
 

diff --git a/examples/tts/conf/fastpitch_align_44100.yaml b/examples/tts/conf/fastpitch_align_44100.yaml
@@ -27,7 +27,7 @@ lowfreq: 0
 highfreq: null
 window: hann
 
-phoneme_dict_path: "scripts/tts_dataset_files/cmudict-0.7b_nv22.07"
+phoneme_dict_path: "scripts/tts_dataset_files/cmudict-0.7b_nv22.08"
 heteronyms_path: "scripts/tts_dataset_files/heteronyms-030921"
 whitelist_path: "nemo_text_processing/text_normalization/en/data/whitelist/lj_speech.tsv"
 

diff --git a/examples/tts/conf/fastpitch_align_ipa.yaml b/examples/tts/conf/fastpitch_align_ipa.yaml
@@ -27,7 +27,7 @@ lowfreq: 0
 highfreq: 8000
 window: hann
 
-phoneme_dict_path: "scripts/tts_dataset_files/ipa_cmudict-0.7b_nv22.06.txt"
+phoneme_dict_path: "scripts/tts_dataset_files/ipa_cmudict-0.7b_nv22.08.txt"
 heteronyms_path: "scripts/tts_dataset_files/heteronyms-052722"
 whitelist_path: "nemo_text_processing/text_normalization/en/data/whitelist/lj_speech.tsv"
 

diff --git a/examples/tts/conf/fastpitch_align_v1.05.yaml b/examples/tts/conf/fastpitch_align_v1.05.yaml
@@ -27,7 +27,7 @@ lowfreq: 0
 highfreq: 8000
 window: hann
 
-phoneme_dict_path: "scripts/tts_dataset_files/cmudict-0.7b_nv22.07"
+phoneme_dict_path: "scripts/tts_dataset_files/cmudict-0.7b_nv22.08"
 heteronyms_path: "scripts/tts_dataset_files/heteronyms-030921"
 whitelist_path: "nemo_text_processing/text_normalization/en/data/whitelist/lj_speech.tsv"
 

diff --git a/examples/tts/conf/mixer-tts.yaml b/examples/tts/conf/mixer-tts.yaml
@@ -27,7 +27,7 @@ lowfreq: 0
 highfreq: 8000
 window: hann
 
-phoneme_dict_path: "scripts/tts_dataset_files/cmudict-0.7b_nv22.07"
+phoneme_dict_path: "scripts/tts_dataset_files/cmudict-0.7b_nv22.08"
 heteronyms_path: "scripts/tts_dataset_files/heteronyms-030921"
 whitelist_path: "nemo_text_processing/text_normalization/en/data/whitelist/lj_speech.tsv"
 

diff --git a/examples/tts/conf/rad-tts_dec.yaml b/examples/tts/conf/rad-tts_dec.yaml
@@ -28,7 +28,7 @@ highfreq: 8000
 window: "hann"
 
 
-phoneme_dict_path: "scripts/tts_dataset_files/cmudict-0.7b_nv22.07"
+phoneme_dict_path: "scripts/tts_dataset_files/cmudict-0.7b_nv22.08"
 heteronyms_path: "scripts/tts_dataset_files/heteronyms-052722"
 
 model:

diff --git a/examples/tts/conf/rad-tts_feature_pred.yaml b/examples/tts/conf/rad-tts_feature_pred.yaml
@@ -27,7 +27,7 @@ lowfreq: 0
 highfreq: 8000
 window: "hann"
 
-phoneme_dict_path: "scripts/tts_dataset_files/cmudict-0.7b_nv22.07"
+phoneme_dict_path: "scripts/tts_dataset_files/cmudict-0.7b_nv22.08"
 heteronyms_path: "scripts/tts_dataset_files/heteronyms-052722" 
 
 model:

diff --git a/examples/tts/conf/tacotron2.yaml b/examples/tts/conf/tacotron2.yaml
@@ -9,7 +9,7 @@ validation_datasets: ???
 sup_data_path: null
 sup_data_types: null
 
-phoneme_dict_path: "scripts/tts_dataset_files/cmudict-0.7b_nv22.07"
+phoneme_dict_path: "scripts/tts_dataset_files/cmudict-0.7b_nv22.08"
 heteronyms_path: "scripts/tts_dataset_files/heteronyms-030921"
 whitelist_path: "nemo_text_processing/text_normalization/en/data/whitelist/lj_speech.tsv"
 

diff --git a/nemo/collections/tts/models/fastpitch.py b/nemo/collections/tts/models/fastpitch.py
@@ -47,7 +47,7 @@
 @dataclass
 class G2PConfig:
     _target_: str = "nemo.collections.tts.torch.g2ps.EnglishG2p"
-    phoneme_dict: str = "scripts/tts_dataset_files/cmudict-0.7b_nv22.07"
+    phoneme_dict: str = "scripts/tts_dataset_files/cmudict-0.7b_nv22.08"
     heteronyms: str = "scripts/tts_dataset_files/heteronyms-030921"
     phoneme_probability: float = 0.5
 

diff --git a/nemo/collections/tts/torch/g2ps.py b/nemo/collections/tts/torch/g2ps.py
@@ -139,7 +139,7 @@ def _parse_as_cmu_dict(phoneme_dict_path=None, encoding='latin-1'):
                 f"English g2p_dict will be used from nltk.corpus.cmudict.dict(), because phoneme_dict_path=None. "
                 "Note that nltk.corpus.cmudict.dict() has old version (0.6) of CMUDict. "
                 "You can use the latest official version of CMUDict (0.7b) with additional changes from NVIDIA directly from NeMo "
-                "using the path scripts/tts_dataset_files/cmudict-0.7b_nv22.07."
+                "using the path scripts/tts_dataset_files/cmudict-0.7b_nv22.08."
             )
 
             return nltk.corpus.cmudict.dict()
@@ -262,7 +262,7 @@ def __init__(
 
         Args:
             phoneme_dict (str, Path, Dict): Path to file in CMUdict format or dictionary of CMUdict-like entries.
-                Must be given for IPA G2P. (Consider using scripts/tts_dataset_files/ipa_cmudict-0.7b_nv22.06.txt.)
+                Must be given for IPA G2P. (Consider using scripts/tts_dataset_files/ipa_cmudict-0.7b_nv22.08.txt.)
             word_tokenize_func: Function for tokenizing text to words.
                 It has to return List[Tuple[Union[str, List[str]], bool]] where every tuple denotes word
                 representation and flag whether to leave unchanged or not.

diff --git a/nemo/collections/tts/torch/tts_dataset.yaml b/nemo/collections/tts/torch/tts_dataset.yaml
@@ -42,5 +42,5 @@ tts_dataset:
     pad_with_space: True
     g2p:
       _target_: nemo.collections.tts.torch.g2ps.EnglishG2p
-      phoneme_dict: "scripts/tts_dataset_files/cmudict-0.7b_nv22.07"
+      phoneme_dict: "scripts/tts_dataset_files/cmudict-0.7b_nv22.08"
       heteronyms: "scripts/tts_dataset_files/heteronyms-030921"
diff --git a/scripts/dataset_processing/tts/ljspeech/ds_conf/ds_for_fastpitch_align.yaml b/scripts/dataset_processing/tts/ljspeech/ds_conf/ds_for_fastpitch_align.yaml
@@ -4,7 +4,7 @@ manifest_filepath: "train_manifest.json"
 sup_data_path: "sup_data"
 sup_data_types: [ "align_prior_matrix", "pitch" ]
 whitelist_path: "nemo_text_processing/text_normalization/en/data/whitelist/lj_speech.tsv"
-phoneme_dict_path: "scripts/tts_dataset_files/cmudict-0.7b_nv22.07"
+phoneme_dict_path: "scripts/tts_dataset_files/cmudict-0.7b_nv22.08"
 heteronyms_path: "scripts/tts_dataset_files/heteronyms-030921"
 
 dataset:

diff --git a/scripts/dataset_processing/tts/ljspeech/ds_conf/ds_for_mixer_tts.yaml b/scripts/dataset_processing/tts/ljspeech/ds_conf/ds_for_mixer_tts.yaml
@@ -4,7 +4,7 @@ manifest_filepath: "train_manifest.json"
 sup_data_path: "sup_data"
 sup_data_types: [ "align_prior_matrix", "pitch" ]
 whitelist_path: "nemo_text_processing/text_normalization/en/data/whitelist/lj_speech.tsv"
-phoneme_dict_path: "scripts/tts_dataset_files/cmudict-0.7b_nv22.07"
+phoneme_dict_path: "scripts/tts_dataset_files/cmudict-0.7b_nv22.08"
 heteronyms_path: "scripts/tts_dataset_files/heteronyms-030921"
 
 dataset:

diff --git a/scripts/tts_dataset_files/cmudict-0.7b_nv22.07 b/scripts/tts_dataset_files/cmudict-0.7b_nv22.08
@@ -57166,7 +57166,7 @@ HURRAY  HH AH0 R EY1
 HURRELL  HH AO1 R AH0 L
 HURRI  HH ER1 IY0
 HURRICANE  HH ER1 AH0 K EY2 N
-HURRICANE(1)  HH AH1 R AH0 K EY2 N Z
+HURRICANE(1)  HH AH1 R AH0 K EY2 N
 HURRICANE'S  HH ER1 AH0 K EY2 N Z
 HURRICANES  HH ER1 AH0 K EY2 N Z
 HURRIED  HH ER1 IY0 D

diff --git a/scripts/tts_dataset_files/ipa_cmudict-0.7b_nv22.06.txt b/scripts/tts_dataset_files/ipa_cmudict-0.7b_nv22.08.txt
@@ -57581,7 +57581,7 @@ HURRAY  həˈɹeɪ
 HURRELL  ˈhɔɹəɫ
 HURRI  ˈhɝi
 HURRICANE  ˈhɝəˌkeɪn
-HURRICANE  ˈhəɹəˌkeɪnz
+HURRICANE  ˈhəɹəˌkeɪn
 HURRICANE'S  ˈhɝəˌkeɪnz
 HURRICANES  ˈhɝəˌkeɪnz
 HURRIED  ˈhɝid