forked from contr4l/SimilarCharacter
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Pronunciation.py
59 lines (53 loc) · 1.68 KB
/
Pronunciation.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
# coding=gbk
from pypinyin import pinyin,Style,lazy_pinyin
import Dict
import Character
from tqdm import tqdm
symbol = Character.Symbol_lst()
def similar(char1,char2): # char1,char2为拼音
if char1[0:2] not in ['zh','ch','sh']:
fst1 = char1[0] # 此处四行为声母韵母抽取
end1 = char1[1:]
else:
fst1 = char1[0:2]
end1 = char1[2:]
if char2[0:2] not in ['zh','ch','sh']:
fst2 = char2[0]
end2 = char2[1:]
else:
fst2 = char2[0:2]
end2 = char2[2:]
# 韵母相同,声母相近
if fst1 in Dict.similar_dict:
if Dict.similar_dict[fst1] == fst2 and end1 == end2:
return 0.8
# 声母相同,韵母相近
if end1 in Dict.similar_dict:
if Dict.similar_dict[end1] == end2 and fst1 == fst2:
return 0.8
# 声母韵母均相近
if fst1 in Dict.similar_dict and fst2 in Dict.similar_dict and end1 in Dict.similar_dict and end2 in Dict.similar_dict:
if Dict.similar_dict[fst1] == fst2 and Dict.similar_dict[end1] == end2:
return 0.6
return 0
# 判断路径存在,不存在则创建
# if not os.path.exists('D:/py'):
# os.mkdir('D:/py')
# file1 = open('D:/py/Announciation.txt', 'w')
def pronunciation_index(i,j):
similar_index = 0
# for i in tqdm(symbol):
# for j in symbol:
# # 若两字相同,则跳过
if i == j:
return 0
else:
tone1 = lazy_pinyin(i)[0]
tone2 = lazy_pinyin(j)[0]
if tone1 == tone2:
return 1
else:
return similar(tone1, tone2)
# # 此处添加相近音的写入文件
# file1.write('\n')
# file1.close()