Update japanese_bert.py

fishaudio · Sep 30, 2023 · bab550c · bab550c
1 parent 1e310ae
commit bab550c
Showing 1 changed file with 14 additions and 15 deletions.
diff --git a/text/japanese_bert.py b/text/japanese_bert.py
@@ -7,32 +7,31 @@
 tokenizer = AutoTokenizer.from_pretrained(BERT)
 # bert-large model has 25 hidden layers. You can decide which layer to use by setting this variable to a specific value
 # default value is 3 (untested)
-BERT_LAYER = 3
-
-
-def get_bert_feature(text, word2ph, device=None):
-    if (
+BERT_LAYER = 20
+if (
         sys.platform == "darwin"
         and torch.backends.mps.is_available()
         and device == "cpu"
     ):
         device = "mps"
-    if not device:
-        device = "cuda"
-    model = AutoModelForMaskedLM.from_pretrained(BERT).to(device)
+if not device:
+    device = "cuda"
+model = AutoModelForMaskedLM.from_pretrained(BERT).to(device)
+
+def get_bert_feature(text, word2ph, device=None):
     with torch.no_grad():
         inputs = tokenizer(text, return_tensors="pt")
         for i in inputs:
             inputs[i] = inputs[i].to(device)
         res = model(**inputs, output_hidden_states=True)
         res = res["hidden_states"][BERT_LAYER]
-    assert inputs["input_ids"].shape[-1] == len(word2ph)
-    word2phone = word2ph
+    #assert inputs["input_ids"].shape[-1] == len(word2ph)
+    #word2phone = word2ph
     phone_level_feature = []
-    for i in range(len(word2phone)):
-        repeat_feature = res[0][i].repeat(word2phone[i], 1)
-        phone_level_feature.append(repeat_feature)
+    #for i in range(len(word2phone)):
+    #    repeat_feature = res[0][i].repeat(word2phone[i], 1)
+    #    phone_level_feature.append(repeat_feature)
 
-    phone_level_feature = torch.cat(phone_level_feature, dim=0)
+    #phone_level_feature = torch.cat(phone_level_feature, dim=0)
 
-    return phone_level_feature.T
+    return res