From bab550c41ece7cc624c05f66ffadef96568d43d4 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Stardust=C2=B7=E5=87=8F?=
Date: Sat, 30 Sep 2023 09:36:03 +0800
Subject: [PATCH] Update japanese_bert.py

---
 text/japanese_bert.py | 29 ++++++++++++++---------------
 1 file changed, 14 insertions(+), 15 deletions(-)

diff --git a/text/japanese_bert.py b/text/japanese_bert.py
index 0953b1bd3..db9b6379f 100644
--- a/text/japanese_bert.py
+++ b/text/japanese_bert.py
@@ -7,32 +7,31 @@ tokenizer = AutoTokenizer.from_pretrained(BERT)
 
 # bert-large model has 25 hidden layers.You can decide which layer to use by setting this variable to a specific value
 # default value is 3(untested)
-BERT_LAYER = 3
-
-
-def get_bert_feature(text, word2ph, device=None):
-    if (
+BERT_LAYER = 20
+if (
         sys.platform == "darwin"
         and torch.backends.mps.is_available()
         and device == "cpu"
     ):
         device = "mps"
-    if not device:
-        device = "cuda"
-    model = AutoModelForMaskedLM.from_pretrained(BERT).to(device)
+if not device:
+    device = "cuda"
+model = AutoModelForMaskedLM.from_pretrained(BERT).to(device)
+
+def get_bert_feature(text, word2ph, device=None):
     with torch.no_grad():
         inputs = tokenizer(text, return_tensors="pt")
         for i in inputs:
             inputs[i] = inputs[i].to(device)
         res = model(**inputs, output_hidden_states=True)
         res = res["hidden_states"][BERT_LAYER]
-    assert inputs["input_ids"].shape[-1] == len(word2ph)
-    word2phone = word2ph
+    #assert inputs["input_ids"].shape[-1] == len(word2ph)
+    #word2phone = word2ph
     phone_level_feature = []
-    for i in range(len(word2phone)):
-        repeat_feature = res[0][i].repeat(word2phone[i], 1)
-        phone_level_feature.append(repeat_feature)
+    #for i in range(len(word2phone)):
+    #    repeat_feature = res[0][i].repeat(word2phone[i], 1)
+    #    phone_level_feature.append(repeat_feature)
 
-    phone_level_feature = torch.cat(phone_level_feature, dim=0)
+    #phone_level_feature = torch.cat(phone_level_feature, dim=0)
 
-    return phone_level_feature.T
+    return res
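
Note on the patched file: hoisting the device check and the model load to module scope leaves `device` undefined at the point `and device == "cpu"` runs, because `device` was previously a function parameter, so importing the module raises NameError. Below is a minimal sketch of the file after this patch with that fixed. Two things in it are my assumptions, not part of the patch: the `BERT` constant is defined above the hunk shown and its value here is purely illustrative, and defaulting the function's `device` parameter to the module-level device (so inputs land where the model lives) is my choice.

import sys

import torch
from transformers import AutoTokenizer, AutoModelForMaskedLM

# assumption: BERT is defined above the hunk shown; this path is illustrative
BERT = "./bert/bert-large-japanese-v2"

tokenizer = AutoTokenizer.from_pretrained(BERT)

# bert-large yields 25 hidden states (embedding output + 24 encoder layers);
# BERT_LAYER selects which one get_bert_feature returns
BERT_LAYER = 20

device = None  # fix: the patch reads `device` at module scope without assigning it first
if (
    sys.platform == "darwin"
    and torch.backends.mps.is_available()
    and device == "cpu"  # mirrors the patch; never true while device starts as None
):
    device = "mps"
if not device:
    device = "cuda"
model = AutoModelForMaskedLM.from_pretrained(BERT).to(device)


def get_bert_feature(text, word2ph, device=device):
    # word2ph is unused now that the phone-level expansion is commented out;
    # it is kept so existing call sites do not break
    with torch.no_grad():
        inputs = tokenizer(text, return_tensors="pt")
        for i in inputs:
            inputs[i] = inputs[i].to(device)  # keep inputs on the model's device
        res = model(**inputs, output_hidden_states=True)
    # token-level features from the chosen layer, shape (1, seq_len, hidden_size)
    return res["hidden_states"][BERT_LAYER]

Since `hidden_states[0]` is the embedding output, `BERT_LAYER = 20` picks the output of the 20th of bert-large's 24 encoder layers. And because the assert and the word2ph expansion are commented out, callers now receive a token-level tensor of shape (1, seq_len, hidden_size) instead of the previous phone-level (hidden_size, n_phones) transpose, so downstream code must be adjusted accordingly.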