# Pouleng.schema.yaml
# Rime schema
# encoding: UTF-8 w/o BOM
# 參考書目:
# 單字基於《莆田縣誌》同音字表 完工
# 增補《莆田市志》 同音字表 完工
# 詞彙《莆仙方言簡明詞彙》完工 校對中
# 增補《莆田市誌》分類詞表 完工
# 增補《莆仙方言大詞典》未面世 請期待
# 本字不明的詞週邊若有寫法可暫時借用
# Schema identity and descriptive metadata.
schema:
  schema_id: Pouleng
  name: 莆仙話拼音-莆田
  # Quoted so the dotted version is kept as a string.
  version: "2019.11.22.1"
  author:
    # NOTE(review): the address below looks like an e-mail obfuscation
    # placeholder rather than a real contact; restore the real one if known.
    - 文本:芽油 <[email protected]>
    - 程序:子善
  # Folded scalar: the two lines are joined with a single space, which is the
  # same value the original multi-line plain scalar produces.
  description: >-
    測試版 v0.1詞彙錄入中
    討論羣「莆仙興化閩語 643608959」
  # luna_pinyin is the dictionary named by the reverse_lookup section.
  dependencies:
    - luna_pinyin
# User-visible toggles; each entry names an option and its two state labels.
switches:
  - name: ascii_mode
    # NOTE(review): presumably resets this switch to its first state when the
    # schema is (re)selected; confirm against the Rime schema documentation.
    reset: 0
    states: [汉字, 字母]
  - name: full_shape
    states: [半角, 全角]
  - name: simplification
    states: [繁體, 简体]
# Engine pipeline: the component names used for each of the four stages.
# The order inside every list is kept exactly as in the original.
engine:
  processors:
    - ascii_composer
    - recognizer
    - key_binder
    - speller
    - punctuator
    - selector
    - navigator
    - express_editor
  segmentors:
    - ascii_segmentor
    - matcher
    - abc_segmentor
    - punct_segmentor
    - fallback_segmentor
  translators:
    - punct_translator
    - script_translator
    - reverse_lookup_translator
  filters:
    - simplifier
    - uniquifier
# Spelling configuration: accepted letters, syllable delimiters, and the
# spelling-algebra rules. Rule order and rule text are unchanged.
speller:
  alphabet: zyxwvutsrqponmlkjihgfedcba
  # Either a space or an apostrophe separates syllables.
  delimiter: " '"
  algebra:
    # Strip trailing tone digits and any surrounding {} from a code.
    - xform/^\{?([a-z]+)([0-9]*)\}?$/$1/
    # Abbreviate a multi-letter syllable to its initial (rule by Radium).
    - abbrev/^([gkhlnmbpdtzcs]|ng)[aoeiuyr]+(ng|h|k)?$/$1/
    # ------ Fuzzy spellings ------
    # Mandarin Pinyin habits.
    # Templates for adding more rules:
    # - derive/<original code>/<fuzzy spelling>/
    # - derive/^<original code, whole-word match>/<fuzzy spelling>/
    - derive/y/v/
    - derive/oe/ee/
    - derive/au/ao/
    - derive/ieng/ian/
    - derive/ieu/iao/
    - derive/^ieng/yan/
    - derive/yorng/iong/
    # Shortened input.
    - derive/yor/yo/
    - derive/yor/io/
    - derive/yorng/yong/
    - derive/yorh/yoh/
    - derive/yorng/ion/
    - derive/orh/oq/
    - derive/orng/om/
    - derive/zyor/jo/
    - derive/zyorng/jong/
    - derive/zyorng/jon/
    - derive/ung/ng/
    # Mandarin Pinyin spellings for zero-initial syllables (y-/w- forms).
    - derive/^ia/ya/
    - derive/^i/yi/
    - derive/^iu/you/
    - derive/^y/yu/
    - derive/^yorng/yong/
    - derive/uang/wan/
    - derive/^ue/wei/
    - derive/^ui/wui/
    - derive/^ua/wa/
    - derive/^u/wu/
    # Simplified nasal codas (-ng typed as -n).
    - derive/ang/an/
    - derive/ing/in/
    - derive/yng/yn/
    - derive/ong/on/
    - derive/eng/en/
    - derive/orng/orn/
    - derive/ieng/ien/
    - derive/ung/un/
    - derive/uang/uan/
    # Palatalization (z/c/s before i or y typed as j/q/x).
    - derive/zi/ji/
    - derive/ci/qi/
    - derive/si/xi/
    - derive/zy/ju/
    - derive/cy/qu/
    - derive/sy/xu/
    # Entering tone: a final h or k may be dropped, or typed as either letter.
    - derive/^(.+)[hk]$/$1/
    - derive/^(.+)[hk]$/$1h/
    - derive/^(.+)[hk]$/$1k/
    # Conversion between the Pinyin-like and IPA-like spellings.
    - derive/z/ts/
    - derive/c/tsh/
    # Older-generation pronunciation.
    - derive/ieu/iau/
    - derive/ieh/iah/
    - derive/ieng/iang/
    # Newer-generation pronunciation.
    - derive/o/er/
    - derive/ong/erng/
    - derive/oh/erh/
    - derive/ue/uei/
    # Typo tolerance (-ng typed as -g or -m).
    # NOTE(review): yorng maps to "yorg" here but to "yom" (not "yorm") below;
    # confirm the dropped "r" is intended.
    - derive/ang/ag/
    - derive/eng/eg/
    - derive/oeng/oeg/
    - derive/ieng/ieg/
    - derive/ing/ig/
    - derive/yng/yg/
    - derive/yorng/yorg/
    - derive/ang/am/
    - derive/eng/em/
    - derive/oeng/oem/
    - derive/ieng/iem/
    - derive/ing/im/
    - derive/yng/ym/
    - derive/yorng/yom/
    # Other accents.
    - derive/ue/uai/
# Main translator settings for the Pouleng dictionary.
translator:
  dictionary: Pouleng
  spelling_hints: 12
  enable_sentence: true
  enable_encoder: true
  preedit_format:
    # Expand the shortcut key: every "f" in the preedit is shown as "ng".
    # NOTE(review): no speller algebra rule in this file derives "f" from
    # "ng"; confirm the shortcut is still intended.
    - xform/f/ng/
  # Anchored so the reverse_lookup section can reuse the same rules.
  comment_format: &comment_rules
    # Show tone digits 0-8 as superscripts.
    - xlit/012345678/⁰¹²³⁴⁵⁶⁷⁸/
# Reverse lookup through the luna_pinyin dictionary, entered between a
# backtick prefix and an apostrophe suffix.
reverse_lookup:
  dictionary: luna_pinyin
  prefix: "`"
  suffix: "'"
  tips: 〔普通話拼音反查〕
  preedit_format:
    # Show "v" as "ü" after n/l, "ue" as "üe" after n/l, and as plain "u"
    # after j/q/x/y.
    - xform/([nl])v/$1ü/
    - xform/([nl])ue/$1üe/
    - xform/([jqxy])v/$1u/
  # Alias of the rule list anchored at translator/comment_format.
  comment_format: *comment_rules
# Punctuation settings are taken from the "default" preset.
punctuator:
  import_preset: default
# Key bindings are taken from the "default" preset.
key_binder:
  import_preset: default
# Input patterns: the "default" preset plus one schema-specific pattern.
recognizer:
  import_preset: default
  patterns:
    # A backtick, then lowercase letters, then an optional closing apostrophe;
    # this matches the prefix and suffix declared in reverse_lookup.
    reverse_lookup: "`[a-z]*'?$"