Spaces:
Running
Running
delete
Browse files- bert/ProsodyModel.py +0 -75
- bert/__init__.py +0 -2
- bert/config.json +0 -19
- bert/prosody_model.pt +0 -3
- bert/prosody_tool.py +0 -426
- bert/vocab.txt +0 -0
bert/ProsodyModel.py
DELETED
@@ -1,75 +0,0 @@
|
|
1 |
-
import os
|
2 |
-
import torch
|
3 |
-
import torch.nn as nn
|
4 |
-
import torch.nn.functional as F
|
5 |
-
|
6 |
-
from transformers import BertModel, BertConfig, BertTokenizer
|
7 |
-
|
8 |
-
|
9 |
-
class CharEmbedding(nn.Module):
|
10 |
-
def __init__(self, model_dir):
|
11 |
-
super().__init__()
|
12 |
-
self.tokenizer = BertTokenizer.from_pretrained(model_dir)
|
13 |
-
self.bert_config = BertConfig.from_pretrained(model_dir)
|
14 |
-
self.hidden_size = self.bert_config.hidden_size
|
15 |
-
self.bert = BertModel(self.bert_config)
|
16 |
-
self.proj = nn.Linear(self.hidden_size, 256)
|
17 |
-
self.linear = nn.Linear(256, 3)
|
18 |
-
|
19 |
-
def text2Token(self, text):
|
20 |
-
token = self.tokenizer.tokenize(text)
|
21 |
-
txtid = self.tokenizer.convert_tokens_to_ids(token)
|
22 |
-
return txtid
|
23 |
-
|
24 |
-
def forward(self, inputs_ids, inputs_masks, tokens_type_ids):
|
25 |
-
out_seq = self.bert(input_ids=inputs_ids,
|
26 |
-
attention_mask=inputs_masks,
|
27 |
-
token_type_ids=tokens_type_ids)[0]
|
28 |
-
out_seq = self.proj(out_seq)
|
29 |
-
return out_seq
|
30 |
-
|
31 |
-
|
32 |
-
class TTSProsody(object):
|
33 |
-
def __init__(self, path, device):
|
34 |
-
self.device = device
|
35 |
-
self.char_model = CharEmbedding(path)
|
36 |
-
self.char_model.load_state_dict(
|
37 |
-
torch.load(
|
38 |
-
os.path.join(path, 'prosody_model.pt'),
|
39 |
-
map_location="cpu"
|
40 |
-
),
|
41 |
-
strict=False
|
42 |
-
)
|
43 |
-
self.char_model.eval()
|
44 |
-
self.char_model.to(self.device)
|
45 |
-
|
46 |
-
def get_char_embeds(self, text):
|
47 |
-
input_ids = self.char_model.text2Token(text)
|
48 |
-
input_masks = [1] * len(input_ids)
|
49 |
-
type_ids = [0] * len(input_ids)
|
50 |
-
input_ids = torch.LongTensor([input_ids]).to(self.device)
|
51 |
-
input_masks = torch.LongTensor([input_masks]).to(self.device)
|
52 |
-
type_ids = torch.LongTensor([type_ids]).to(self.device)
|
53 |
-
|
54 |
-
with torch.no_grad():
|
55 |
-
char_embeds = self.char_model(
|
56 |
-
input_ids, input_masks, type_ids).squeeze(0).cpu()
|
57 |
-
return char_embeds
|
58 |
-
|
59 |
-
def expand_for_phone(self, char_embeds, length): # length of phones for char
|
60 |
-
assert char_embeds.size(0) == len(length)
|
61 |
-
expand_vecs = list()
|
62 |
-
for vec, leng in zip(char_embeds, length):
|
63 |
-
vec = vec.expand(leng, -1)
|
64 |
-
expand_vecs.append(vec)
|
65 |
-
expand_embeds = torch.cat(expand_vecs, 0)
|
66 |
-
assert expand_embeds.size(0) == sum(length)
|
67 |
-
return expand_embeds.numpy()
|
68 |
-
|
69 |
-
|
70 |
-
if __name__ == "__main__":
|
71 |
-
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
|
72 |
-
prosody = TTSProsody('./bert/', device)
|
73 |
-
while True:
|
74 |
-
text = input("请输入文本:")
|
75 |
-
prosody.get_char_embeds(text)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
bert/__init__.py
DELETED
@@ -1,2 +0,0 @@
|
|
1 |
-
""" from https://github.com/PlayVoice/vits_chinese """
|
2 |
-
from .ProsodyModel import TTSProsody
|
|
|
|
|
|
bert/config.json
DELETED
@@ -1,19 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"attention_probs_dropout_prob": 0.1,
|
3 |
-
"directionality": "bidi",
|
4 |
-
"hidden_act": "gelu",
|
5 |
-
"hidden_dropout_prob": 0.1,
|
6 |
-
"hidden_size": 768,
|
7 |
-
"initializer_range": 0.02,
|
8 |
-
"intermediate_size": 3072,
|
9 |
-
"max_position_embeddings": 512,
|
10 |
-
"num_attention_heads": 12,
|
11 |
-
"num_hidden_layers": 12,
|
12 |
-
"pooler_fc_size": 768,
|
13 |
-
"pooler_num_attention_heads": 12,
|
14 |
-
"pooler_num_fc_layers": 3,
|
15 |
-
"pooler_size_per_head": 128,
|
16 |
-
"pooler_type": "first_token_transform",
|
17 |
-
"type_vocab_size": 2,
|
18 |
-
"vocab_size": 21128
|
19 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
bert/prosody_model.pt
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:3accec7a0d5cbfccaa8a42b96374a91d442a69801c6a01402baae3bf06b8c015
|
3 |
-
size 409941419
|
|
|
|
|
|
|
|
bert/prosody_tool.py
DELETED
@@ -1,426 +0,0 @@
|
|
1 |
-
def is_chinese(uchar):
|
2 |
-
if uchar >= u'\u4e00' and uchar <= u'\u9fa5':
|
3 |
-
return True
|
4 |
-
else:
|
5 |
-
return False
|
6 |
-
|
7 |
-
|
8 |
-
pinyin_dict = {
|
9 |
-
"a": ("^", "a"),
|
10 |
-
"ai": ("^", "ai"),
|
11 |
-
"an": ("^", "an"),
|
12 |
-
"ang": ("^", "ang"),
|
13 |
-
"ao": ("^", "ao"),
|
14 |
-
"ba": ("b", "a"),
|
15 |
-
"bai": ("b", "ai"),
|
16 |
-
"ban": ("b", "an"),
|
17 |
-
"bang": ("b", "ang"),
|
18 |
-
"bao": ("b", "ao"),
|
19 |
-
"be": ("b", "e"),
|
20 |
-
"bei": ("b", "ei"),
|
21 |
-
"ben": ("b", "en"),
|
22 |
-
"beng": ("b", "eng"),
|
23 |
-
"bi": ("b", "i"),
|
24 |
-
"bian": ("b", "ian"),
|
25 |
-
"biao": ("b", "iao"),
|
26 |
-
"bie": ("b", "ie"),
|
27 |
-
"bin": ("b", "in"),
|
28 |
-
"bing": ("b", "ing"),
|
29 |
-
"bo": ("b", "o"),
|
30 |
-
"bu": ("b", "u"),
|
31 |
-
"ca": ("c", "a"),
|
32 |
-
"cai": ("c", "ai"),
|
33 |
-
"can": ("c", "an"),
|
34 |
-
"cang": ("c", "ang"),
|
35 |
-
"cao": ("c", "ao"),
|
36 |
-
"ce": ("c", "e"),
|
37 |
-
"cen": ("c", "en"),
|
38 |
-
"ceng": ("c", "eng"),
|
39 |
-
"cha": ("ch", "a"),
|
40 |
-
"chai": ("ch", "ai"),
|
41 |
-
"chan": ("ch", "an"),
|
42 |
-
"chang": ("ch", "ang"),
|
43 |
-
"chao": ("ch", "ao"),
|
44 |
-
"che": ("ch", "e"),
|
45 |
-
"chen": ("ch", "en"),
|
46 |
-
"cheng": ("ch", "eng"),
|
47 |
-
"chi": ("ch", "iii"),
|
48 |
-
"chong": ("ch", "ong"),
|
49 |
-
"chou": ("ch", "ou"),
|
50 |
-
"chu": ("ch", "u"),
|
51 |
-
"chua": ("ch", "ua"),
|
52 |
-
"chuai": ("ch", "uai"),
|
53 |
-
"chuan": ("ch", "uan"),
|
54 |
-
"chuang": ("ch", "uang"),
|
55 |
-
"chui": ("ch", "uei"),
|
56 |
-
"chun": ("ch", "uen"),
|
57 |
-
"chuo": ("ch", "uo"),
|
58 |
-
"ci": ("c", "ii"),
|
59 |
-
"cong": ("c", "ong"),
|
60 |
-
"cou": ("c", "ou"),
|
61 |
-
"cu": ("c", "u"),
|
62 |
-
"cuan": ("c", "uan"),
|
63 |
-
"cui": ("c", "uei"),
|
64 |
-
"cun": ("c", "uen"),
|
65 |
-
"cuo": ("c", "uo"),
|
66 |
-
"da": ("d", "a"),
|
67 |
-
"dai": ("d", "ai"),
|
68 |
-
"dan": ("d", "an"),
|
69 |
-
"dang": ("d", "ang"),
|
70 |
-
"dao": ("d", "ao"),
|
71 |
-
"de": ("d", "e"),
|
72 |
-
"dei": ("d", "ei"),
|
73 |
-
"den": ("d", "en"),
|
74 |
-
"deng": ("d", "eng"),
|
75 |
-
"di": ("d", "i"),
|
76 |
-
"dia": ("d", "ia"),
|
77 |
-
"dian": ("d", "ian"),
|
78 |
-
"diao": ("d", "iao"),
|
79 |
-
"die": ("d", "ie"),
|
80 |
-
"ding": ("d", "ing"),
|
81 |
-
"diu": ("d", "iou"),
|
82 |
-
"dong": ("d", "ong"),
|
83 |
-
"dou": ("d", "ou"),
|
84 |
-
"du": ("d", "u"),
|
85 |
-
"duan": ("d", "uan"),
|
86 |
-
"dui": ("d", "uei"),
|
87 |
-
"dun": ("d", "uen"),
|
88 |
-
"duo": ("d", "uo"),
|
89 |
-
"e": ("^", "e"),
|
90 |
-
"ei": ("^", "ei"),
|
91 |
-
"en": ("^", "en"),
|
92 |
-
"ng": ("^", "en"),
|
93 |
-
"eng": ("^", "eng"),
|
94 |
-
"er": ("^", "er"),
|
95 |
-
"fa": ("f", "a"),
|
96 |
-
"fan": ("f", "an"),
|
97 |
-
"fang": ("f", "ang"),
|
98 |
-
"fei": ("f", "ei"),
|
99 |
-
"fen": ("f", "en"),
|
100 |
-
"feng": ("f", "eng"),
|
101 |
-
"fo": ("f", "o"),
|
102 |
-
"fou": ("f", "ou"),
|
103 |
-
"fu": ("f", "u"),
|
104 |
-
"ga": ("g", "a"),
|
105 |
-
"gai": ("g", "ai"),
|
106 |
-
"gan": ("g", "an"),
|
107 |
-
"gang": ("g", "ang"),
|
108 |
-
"gao": ("g", "ao"),
|
109 |
-
"ge": ("g", "e"),
|
110 |
-
"gei": ("g", "ei"),
|
111 |
-
"gen": ("g", "en"),
|
112 |
-
"geng": ("g", "eng"),
|
113 |
-
"gong": ("g", "ong"),
|
114 |
-
"gou": ("g", "ou"),
|
115 |
-
"gu": ("g", "u"),
|
116 |
-
"gua": ("g", "ua"),
|
117 |
-
"guai": ("g", "uai"),
|
118 |
-
"guan": ("g", "uan"),
|
119 |
-
"guang": ("g", "uang"),
|
120 |
-
"gui": ("g", "uei"),
|
121 |
-
"gun": ("g", "uen"),
|
122 |
-
"guo": ("g", "uo"),
|
123 |
-
"ha": ("h", "a"),
|
124 |
-
"hai": ("h", "ai"),
|
125 |
-
"han": ("h", "an"),
|
126 |
-
"hang": ("h", "ang"),
|
127 |
-
"hao": ("h", "ao"),
|
128 |
-
"he": ("h", "e"),
|
129 |
-
"hei": ("h", "ei"),
|
130 |
-
"hen": ("h", "en"),
|
131 |
-
"heng": ("h", "eng"),
|
132 |
-
"hong": ("h", "ong"),
|
133 |
-
"hou": ("h", "ou"),
|
134 |
-
"hu": ("h", "u"),
|
135 |
-
"hua": ("h", "ua"),
|
136 |
-
"huai": ("h", "uai"),
|
137 |
-
"huan": ("h", "uan"),
|
138 |
-
"huang": ("h", "uang"),
|
139 |
-
"hui": ("h", "uei"),
|
140 |
-
"hun": ("h", "uen"),
|
141 |
-
"huo": ("h", "uo"),
|
142 |
-
"ji": ("j", "i"),
|
143 |
-
"jia": ("j", "ia"),
|
144 |
-
"jian": ("j", "ian"),
|
145 |
-
"jiang": ("j", "iang"),
|
146 |
-
"jiao": ("j", "iao"),
|
147 |
-
"jie": ("j", "ie"),
|
148 |
-
"jin": ("j", "in"),
|
149 |
-
"jing": ("j", "ing"),
|
150 |
-
"jiong": ("j", "iong"),
|
151 |
-
"jiu": ("j", "iou"),
|
152 |
-
"ju": ("j", "v"),
|
153 |
-
"juan": ("j", "van"),
|
154 |
-
"jue": ("j", "ve"),
|
155 |
-
"jun": ("j", "vn"),
|
156 |
-
"ka": ("k", "a"),
|
157 |
-
"kai": ("k", "ai"),
|
158 |
-
"kan": ("k", "an"),
|
159 |
-
"kang": ("k", "ang"),
|
160 |
-
"kao": ("k", "ao"),
|
161 |
-
"ke": ("k", "e"),
|
162 |
-
"kei": ("k", "ei"),
|
163 |
-
"ken": ("k", "en"),
|
164 |
-
"keng": ("k", "eng"),
|
165 |
-
"kong": ("k", "ong"),
|
166 |
-
"kou": ("k", "ou"),
|
167 |
-
"ku": ("k", "u"),
|
168 |
-
"kua": ("k", "ua"),
|
169 |
-
"kuai": ("k", "uai"),
|
170 |
-
"kuan": ("k", "uan"),
|
171 |
-
"kuang": ("k", "uang"),
|
172 |
-
"kui": ("k", "uei"),
|
173 |
-
"kun": ("k", "uen"),
|
174 |
-
"kuo": ("k", "uo"),
|
175 |
-
"la": ("l", "a"),
|
176 |
-
"lai": ("l", "ai"),
|
177 |
-
"lan": ("l", "an"),
|
178 |
-
"lang": ("l", "ang"),
|
179 |
-
"lao": ("l", "ao"),
|
180 |
-
"le": ("l", "e"),
|
181 |
-
"lei": ("l", "ei"),
|
182 |
-
"leng": ("l", "eng"),
|
183 |
-
"li": ("l", "i"),
|
184 |
-
"lia": ("l", "ia"),
|
185 |
-
"lian": ("l", "ian"),
|
186 |
-
"liang": ("l", "iang"),
|
187 |
-
"liao": ("l", "iao"),
|
188 |
-
"lie": ("l", "ie"),
|
189 |
-
"lin": ("l", "in"),
|
190 |
-
"ling": ("l", "ing"),
|
191 |
-
"liu": ("l", "iou"),
|
192 |
-
"lo": ("l", "o"),
|
193 |
-
"long": ("l", "ong"),
|
194 |
-
"lou": ("l", "ou"),
|
195 |
-
"lu": ("l", "u"),
|
196 |
-
"lv": ("l", "v"),
|
197 |
-
"luan": ("l", "uan"),
|
198 |
-
"lve": ("l", "ve"),
|
199 |
-
"lue": ("l", "ve"),
|
200 |
-
"lun": ("l", "uen"),
|
201 |
-
"luo": ("l", "uo"),
|
202 |
-
"ma": ("m", "a"),
|
203 |
-
"mai": ("m", "ai"),
|
204 |
-
"man": ("m", "an"),
|
205 |
-
"mang": ("m", "ang"),
|
206 |
-
"mao": ("m", "ao"),
|
207 |
-
"me": ("m", "e"),
|
208 |
-
"mei": ("m", "ei"),
|
209 |
-
"men": ("m", "en"),
|
210 |
-
"meng": ("m", "eng"),
|
211 |
-
"mi": ("m", "i"),
|
212 |
-
"mian": ("m", "ian"),
|
213 |
-
"miao": ("m", "iao"),
|
214 |
-
"mie": ("m", "ie"),
|
215 |
-
"min": ("m", "in"),
|
216 |
-
"ming": ("m", "ing"),
|
217 |
-
"miu": ("m", "iou"),
|
218 |
-
"mo": ("m", "o"),
|
219 |
-
"mou": ("m", "ou"),
|
220 |
-
"mu": ("m", "u"),
|
221 |
-
"na": ("n", "a"),
|
222 |
-
"nai": ("n", "ai"),
|
223 |
-
"nan": ("n", "an"),
|
224 |
-
"nang": ("n", "ang"),
|
225 |
-
"nao": ("n", "ao"),
|
226 |
-
"ne": ("n", "e"),
|
227 |
-
"nei": ("n", "ei"),
|
228 |
-
"nen": ("n", "en"),
|
229 |
-
"neng": ("n", "eng"),
|
230 |
-
"ni": ("n", "i"),
|
231 |
-
"nia": ("n", "ia"),
|
232 |
-
"nian": ("n", "ian"),
|
233 |
-
"niang": ("n", "iang"),
|
234 |
-
"niao": ("n", "iao"),
|
235 |
-
"nie": ("n", "ie"),
|
236 |
-
"nin": ("n", "in"),
|
237 |
-
"ning": ("n", "ing"),
|
238 |
-
"niu": ("n", "iou"),
|
239 |
-
"nong": ("n", "ong"),
|
240 |
-
"nou": ("n", "ou"),
|
241 |
-
"nu": ("n", "u"),
|
242 |
-
"nv": ("n", "v"),
|
243 |
-
"nuan": ("n", "uan"),
|
244 |
-
"nve": ("n", "ve"),
|
245 |
-
"nue": ("n", "ve"),
|
246 |
-
"nuo": ("n", "uo"),
|
247 |
-
"o": ("^", "o"),
|
248 |
-
"ou": ("^", "ou"),
|
249 |
-
"pa": ("p", "a"),
|
250 |
-
"pai": ("p", "ai"),
|
251 |
-
"pan": ("p", "an"),
|
252 |
-
"pang": ("p", "ang"),
|
253 |
-
"pao": ("p", "ao"),
|
254 |
-
"pe": ("p", "e"),
|
255 |
-
"pei": ("p", "ei"),
|
256 |
-
"pen": ("p", "en"),
|
257 |
-
"peng": ("p", "eng"),
|
258 |
-
"pi": ("p", "i"),
|
259 |
-
"pian": ("p", "ian"),
|
260 |
-
"piao": ("p", "iao"),
|
261 |
-
"pie": ("p", "ie"),
|
262 |
-
"pin": ("p", "in"),
|
263 |
-
"ping": ("p", "ing"),
|
264 |
-
"po": ("p", "o"),
|
265 |
-
"pou": ("p", "ou"),
|
266 |
-
"pu": ("p", "u"),
|
267 |
-
"qi": ("q", "i"),
|
268 |
-
"qia": ("q", "ia"),
|
269 |
-
"qian": ("q", "ian"),
|
270 |
-
"qiang": ("q", "iang"),
|
271 |
-
"qiao": ("q", "iao"),
|
272 |
-
"qie": ("q", "ie"),
|
273 |
-
"qin": ("q", "in"),
|
274 |
-
"qing": ("q", "ing"),
|
275 |
-
"qiong": ("q", "iong"),
|
276 |
-
"qiu": ("q", "iou"),
|
277 |
-
"qu": ("q", "v"),
|
278 |
-
"quan": ("q", "van"),
|
279 |
-
"que": ("q", "ve"),
|
280 |
-
"qun": ("q", "vn"),
|
281 |
-
"ran": ("r", "an"),
|
282 |
-
"rang": ("r", "ang"),
|
283 |
-
"rao": ("r", "ao"),
|
284 |
-
"re": ("r", "e"),
|
285 |
-
"ren": ("r", "en"),
|
286 |
-
"reng": ("r", "eng"),
|
287 |
-
"ri": ("r", "iii"),
|
288 |
-
"rong": ("r", "ong"),
|
289 |
-
"rou": ("r", "ou"),
|
290 |
-
"ru": ("r", "u"),
|
291 |
-
"rua": ("r", "ua"),
|
292 |
-
"ruan": ("r", "uan"),
|
293 |
-
"rui": ("r", "uei"),
|
294 |
-
"run": ("r", "uen"),
|
295 |
-
"ruo": ("r", "uo"),
|
296 |
-
"sa": ("s", "a"),
|
297 |
-
"sai": ("s", "ai"),
|
298 |
-
"san": ("s", "an"),
|
299 |
-
"sang": ("s", "ang"),
|
300 |
-
"sao": ("s", "ao"),
|
301 |
-
"se": ("s", "e"),
|
302 |
-
"sen": ("s", "en"),
|
303 |
-
"seng": ("s", "eng"),
|
304 |
-
"sha": ("sh", "a"),
|
305 |
-
"shai": ("sh", "ai"),
|
306 |
-
"shan": ("sh", "an"),
|
307 |
-
"shang": ("sh", "ang"),
|
308 |
-
"shao": ("sh", "ao"),
|
309 |
-
"she": ("sh", "e"),
|
310 |
-
"shei": ("sh", "ei"),
|
311 |
-
"shen": ("sh", "en"),
|
312 |
-
"sheng": ("sh", "eng"),
|
313 |
-
"shi": ("sh", "iii"),
|
314 |
-
"shou": ("sh", "ou"),
|
315 |
-
"shu": ("sh", "u"),
|
316 |
-
"shua": ("sh", "ua"),
|
317 |
-
"shuai": ("sh", "uai"),
|
318 |
-
"shuan": ("sh", "uan"),
|
319 |
-
"shuang": ("sh", "uang"),
|
320 |
-
"shui": ("sh", "uei"),
|
321 |
-
"shun": ("sh", "uen"),
|
322 |
-
"shuo": ("sh", "uo"),
|
323 |
-
"si": ("s", "ii"),
|
324 |
-
"song": ("s", "ong"),
|
325 |
-
"sou": ("s", "ou"),
|
326 |
-
"su": ("s", "u"),
|
327 |
-
"suan": ("s", "uan"),
|
328 |
-
"sui": ("s", "uei"),
|
329 |
-
"sun": ("s", "uen"),
|
330 |
-
"suo": ("s", "uo"),
|
331 |
-
"ta": ("t", "a"),
|
332 |
-
"tai": ("t", "ai"),
|
333 |
-
"tan": ("t", "an"),
|
334 |
-
"tang": ("t", "ang"),
|
335 |
-
"tao": ("t", "ao"),
|
336 |
-
"te": ("t", "e"),
|
337 |
-
"tei": ("t", "ei"),
|
338 |
-
"teng": ("t", "eng"),
|
339 |
-
"ti": ("t", "i"),
|
340 |
-
"tian": ("t", "ian"),
|
341 |
-
"tiao": ("t", "iao"),
|
342 |
-
"tie": ("t", "ie"),
|
343 |
-
"ting": ("t", "ing"),
|
344 |
-
"tong": ("t", "ong"),
|
345 |
-
"tou": ("t", "ou"),
|
346 |
-
"tu": ("t", "u"),
|
347 |
-
"tuan": ("t", "uan"),
|
348 |
-
"tui": ("t", "uei"),
|
349 |
-
"tun": ("t", "uen"),
|
350 |
-
"tuo": ("t", "uo"),
|
351 |
-
"wa": ("^", "ua"),
|
352 |
-
"wai": ("^", "uai"),
|
353 |
-
"wan": ("^", "uan"),
|
354 |
-
"wang": ("^", "uang"),
|
355 |
-
"wei": ("^", "uei"),
|
356 |
-
"wen": ("^", "uen"),
|
357 |
-
"weng": ("^", "ueng"),
|
358 |
-
"wo": ("^", "uo"),
|
359 |
-
"wu": ("^", "u"),
|
360 |
-
"xi": ("x", "i"),
|
361 |
-
"xia": ("x", "ia"),
|
362 |
-
"xian": ("x", "ian"),
|
363 |
-
"xiang": ("x", "iang"),
|
364 |
-
"xiao": ("x", "iao"),
|
365 |
-
"xie": ("x", "ie"),
|
366 |
-
"xin": ("x", "in"),
|
367 |
-
"xing": ("x", "ing"),
|
368 |
-
"xiong": ("x", "iong"),
|
369 |
-
"xiu": ("x", "iou"),
|
370 |
-
"xu": ("x", "v"),
|
371 |
-
"xuan": ("x", "van"),
|
372 |
-
"xue": ("x", "ve"),
|
373 |
-
"xun": ("x", "vn"),
|
374 |
-
"ya": ("^", "ia"),
|
375 |
-
"yan": ("^", "ian"),
|
376 |
-
"yang": ("^", "iang"),
|
377 |
-
"yao": ("^", "iao"),
|
378 |
-
"ye": ("^", "ie"),
|
379 |
-
"yi": ("^", "i"),
|
380 |
-
"yin": ("^", "in"),
|
381 |
-
"ying": ("^", "ing"),
|
382 |
-
"yo": ("^", "iou"),
|
383 |
-
"yong": ("^", "iong"),
|
384 |
-
"you": ("^", "iou"),
|
385 |
-
"yu": ("^", "v"),
|
386 |
-
"yuan": ("^", "van"),
|
387 |
-
"yue": ("^", "ve"),
|
388 |
-
"yun": ("^", "vn"),
|
389 |
-
"za": ("z", "a"),
|
390 |
-
"zai": ("z", "ai"),
|
391 |
-
"zan": ("z", "an"),
|
392 |
-
"zang": ("z", "ang"),
|
393 |
-
"zao": ("z", "ao"),
|
394 |
-
"ze": ("z", "e"),
|
395 |
-
"zei": ("z", "ei"),
|
396 |
-
"zen": ("z", "en"),
|
397 |
-
"zeng": ("z", "eng"),
|
398 |
-
"zha": ("zh", "a"),
|
399 |
-
"zhai": ("zh", "ai"),
|
400 |
-
"zhan": ("zh", "an"),
|
401 |
-
"zhang": ("zh", "ang"),
|
402 |
-
"zhao": ("zh", "ao"),
|
403 |
-
"zhe": ("zh", "e"),
|
404 |
-
"zhei": ("zh", "ei"),
|
405 |
-
"zhen": ("zh", "en"),
|
406 |
-
"zheng": ("zh", "eng"),
|
407 |
-
"zhi": ("zh", "iii"),
|
408 |
-
"zhong": ("zh", "ong"),
|
409 |
-
"zhou": ("zh", "ou"),
|
410 |
-
"zhu": ("zh", "u"),
|
411 |
-
"zhua": ("zh", "ua"),
|
412 |
-
"zhuai": ("zh", "uai"),
|
413 |
-
"zhuan": ("zh", "uan"),
|
414 |
-
"zhuang": ("zh", "uang"),
|
415 |
-
"zhui": ("zh", "uei"),
|
416 |
-
"zhun": ("zh", "uen"),
|
417 |
-
"zhuo": ("zh", "uo"),
|
418 |
-
"zi": ("z", "ii"),
|
419 |
-
"zong": ("z", "ong"),
|
420 |
-
"zou": ("z", "ou"),
|
421 |
-
"zu": ("z", "u"),
|
422 |
-
"zuan": ("z", "uan"),
|
423 |
-
"zui": ("z", "uei"),
|
424 |
-
"zun": ("z", "uen"),
|
425 |
-
"zuo": ("z", "uo"),
|
426 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
bert/vocab.txt
DELETED
The diff for this file is too large to render.
See raw diff
|
|