CMU_DICT_FAST_PATH = os.path.join(current_file_path, "cmudict-fast.rep")
CMU_DICT_HOT_PATH = os.path.join(current_file_path, "engdict-hot.rep")
CACHE_PATH = os.path.join(current_file_path, "engdict_cache.pickle")
+NAMECACHE_PATH = os.path.join(current_file_path, "namedict_cache.pickle")

arpa = {
    "AH0",
@@ -162,6 +163,9 @@ def read_dict_new():
            line_index = line_index + 1
            line = f.readline()

+    return g2p_dict
+
+def hot_reload_hot(g2p_dict):
    with open(CMU_DICT_HOT_PATH) as f:
        line = f.readline()
        line_index = 1
@@ -175,7 +179,7 @@ def read_dict_new():

            line_index = line_index + 1
            line = f.readline()
-
+
    return g2p_dict


@@ -192,9 +196,21 @@ def get_dict():
        g2p_dict = read_dict_new()
        cache_dict(g2p_dict, CACHE_PATH)

+    g2p_dict = hot_reload_hot(g2p_dict)
+
    return g2p_dict


+def get_namedict():
+    if os.path.exists(NAMECACHE_PATH):
+        with open(NAMECACHE_PATH, "rb") as pickle_file:
+            name_dict = pickle.load(pickle_file)
+    else:
+        name_dict = {}
+
+    return name_dict
+
+
def text_normalize(text):
    # todo: eng text normalize
    # adapt punctuation for Chinese and g2p_en
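Note (editor's sketch, not part of this diff): get_namedict() only reads namedict_cache.pickle and falls back to an empty dict when the file is missing, so the cache has to be produced separately. A minimal, hypothetical builder is shown below; the source file name "namedict.rep", its line format, and the helper name are assumptions — only the value layout (lowercased word mapped to a list of phone lists, matching the name_dict[word][0] access used later in qryword) follows the diff.

import pickle

# Hypothetical, illustration only: build namedict_cache.pickle from a plain-text
# name list. Each line is assumed to be "Name PH1 PH2 ..." (ARPAbet phones).
def build_name_cache(src_path, cache_path):
    name_dict = {}
    with open(src_path) as f:
        for line in f:
            parts = line.strip().split(" ")
            if len(parts) < 2:
                continue
            # lowercased key, value shaped like the CMU dict entries:
            # a list of phone lists, so callers can read name_dict[word][0]
            name_dict[parts[0].lower()] = [parts[1:]]
    with open(cache_path, "wb") as pickle_file:
        pickle.dump(name_dict, pickle_file)
    return name_dict

# e.g. build_name_cache("namedict.rep", NAMECACHE_PATH)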
@@ -227,13 +243,18 @@ def __init__(self):
        # initialize the word segmenter
        wordsegment.load()

-        # extend the outdated dictionary
+        # extend the outdated dictionary, and add the name dictionary
        self.cmu = get_dict()
+        self.namedict = get_namedict()

        # drop a few abbreviations whose pronunciations are wrong
        for word in ["AE", "AI", "AR", "IOS", "HUD", "OS"]:
            del self.cmu[word.lower()]

+        # fix homographs
+        self.homograph2features["read"] = (['R', 'IY1', 'D'], ['R', 'EH1', 'D'], 'VBP')
+        self.homograph2features["complex"] = (['K', 'AH0', 'M', 'P', 'L', 'EH1', 'K', 'S'], ['K', 'AA1', 'M', 'P', 'L', 'EH0', 'K', 'S'], 'JJ')
+

    def __call__(self, text):
        # tokenization
@@ -260,25 +281,34 @@ def __call__(self, text):
                pron1, pron2, pos1 = self.homograph2features[word]
                if pos.startswith(pos1):
                    pron = pron1
+                # pos1 being longer than pos only happens for "read"
+                elif len(pos) < len(pos1) and pos == pos1[:len(pos)]:
+                    pron = pron1
                else:
                    pron = pron2
            else:
                # fall back to recursive lookup / prediction
-                pron = self.qryword(word)
+                pron = self.qryword(o_word)

            prons.extend(pron)
            prons.extend([" "])

        return prons[:-1]


-    def qryword(self, word):
+    def qryword(self, o_word):
+        word = o_word.lower()
+
        # dictionary lookup, except for single letters
        if len(word) > 1 and word in self.cmu:  # lookup CMU dict
            return self.cmu[word][0]

+        # look up the name dictionary only when the word is title-cased
+        if o_word.istitle() and word in self.namedict:
+            return self.namedict[word][0]
+
        # OOV words of length <= 3 are spelled out letter by letter
-        if (len(word) <= 3):
+        if len(word) <= 3:
            phones = []
            for w in word:
                # fix the pronunciation of a standalone "a"; uppercase cannot occur here
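Note (editor's sketch): the homograph handling in the hunk above can be read as a standalone rule — pick pron1 when the observed POS tag either extends the stored tag or is a strict prefix of it (the new elif, which matters when "read" gets a bare VB tag against the stored VBP), otherwise pick pron2. A small self-contained restatement, using the "read" entry registered in __init__ above:

def select_homograph_pron(pron1, pron2, pos1, pos):
    # original rule: the observed tag must start with the stored tag
    if pos.startswith(pos1):
        return pron1
    # rule added in this diff: also accept an observed tag that is a
    # strict prefix of the stored tag, e.g. pos='VB' vs. pos1='VBP'
    if len(pos) < len(pos1) and pos == pos1[:len(pos)]:
        return pron1
    return pron2

present, past = ['R', 'IY1', 'D'], ['R', 'EH1', 'D']   # the "read" entry
assert select_homograph_pron(present, past, 'VBP', 'VB') == present   # imperative "read"
assert select_homograph_pron(present, past, 'VBP', 'VBD') == past     # past-tense "read"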