forked from rime/rime-cantonese
-
Notifications
You must be signed in to change notification settings - Fork 0
/
jyut6ping3.schema.yaml
225 lines (201 loc) · 6.37 KB
/
jyut6ping3.schema.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
# Rime schema
# encoding: utf-8
schema:
schema_id: jyut6ping3
name: 粵語拼音
version: "2020.11.26"
author:
- sgalal <[email protected]>
- LeiMaau <[email protected]>
- chaaklau <[email protected]>
- laubonghaudoi <[email protected]>
- tanxpyox <[email protected]>
- William915 <[email protected]>
- szc126 (@szc126)
- Bing Jeung <[email protected]>
- Ayaka Mikazuki <[email protected]>
description: |-
採用香港語言學學會粵語拼音方案
https://www.lshk.org/jyutping
支援聲調顯示同輸入
Telegram 用户交流組 https://t.me/rime_cantonese
dependencies:
- luna_pinyin
- loengfan
- stroke
- cangjie5
switches:
- name: ascii_mode
reset: 0
states: [ 中文, 西文 ]
- name: full_shape
states: [ 半角, 全角 ]
- options: [ noop, variants_hk, trad_tw, simplification ]
states: [ 傳統漢字, 香港傳統漢字, 臺灣傳統漢字, 大陆简化汉字 ]
# 修改下行,改變預設用字 [0, 1, 2, 3 --> 對應上表]
reset: 1
- name: ascii_punct
states: [ 。,, ., ]
- name: emoji_suggestion
# 取消下行註釋,預設啓動 emoji
#reset: 1
states: [ 冇 Emoji, 有 Emoji ]
engine:
processors:
- ascii_composer
- recognizer
- key_binder
- speller
- punctuator
- selector
- navigator
- express_editor
segmentors:
- ascii_segmentor
- matcher
- affix_segmentor@luna_pinyin
- affix_segmentor@loengfan
- affix_segmentor@stroke
- affix_segmentor@cangjie5
- abc_segmentor
- punct_segmentor
- fallback_segmentor
translators:
- punct_translator
- script_translator
- script_translator@luna_pinyin
- script_translator@loengfan
- table_translator@stroke
- table_translator@cangjie5
filters:
- simplifier@variants_hk
- simplifier@trad_tw
- simplifier
- simplifier@emoji_suggestion
- uniquifier
- reverse_lookup_filter@jyut6ping3_reverse_lookup
speller:
alphabet: zyxwvutsrqponmlkjihgfedcba
delimiter: " '"
algebra:
# 取消下兩行註釋,支援疑影交替: ng- 通 Ø-,Ø- 通 ng-
- derive/^ng([aeiou])/$1/
- derive/^([aeiou])/ng$1/
# 取消下行註釋,支援泥來合流: n- 併入 l- ,如「你」讀若「理」
- derive/^n(?!g)/l/
# 取消下行註釋,支援圓唇輔音合口韻缺位: gw-, kw- 併入 g-, k- ,如「國」讀若「各」、「廓」讀若「確」
- derive/^(g|k)w/$1/
# 取消下行註釋,支援獨立鼻音韻 ng 併入 m,如「吳」讀若「唔」
- derive/^ng([123456])$/m$1/
# fuzzy match addition by Bala
- derive/^s([aeiou])/sh$1/ #fuzzy match s with sh
- derive/^b([aeiou])/p$1/ #fuzzy match p with b
- derive/^g([aeiou])/k$1/ #fuzzy match g with k
- derive/^z([aeiouy])/j$1/ #fuzzy match z with j
- derive/^z([aiu])/t$1/ #fuzzy match z with t for short forms
- derive/^z([aeiou])/ts$1/ #fuzzy match z with ts
#- derive/^cy([iou])/ch$1/ # cy/ch
- derive/^cy([iou])/ts$1/ # cy/ts
- derive/^c([aeiouy])/ch$1/ # c/ch
- derive/[123456]// # 忽略聲調
- xform/1/v/ # 陰平
- xform/4/vv/ # 陽平
- xform/2/x/ # 陰上
- xform/5/xx/ # 陽上
- xform/3/q/ # 陰去
- xform/6/qq/ # 陽去
- derive/^([aeiou])/q$1/ # 增加 q 表示喉塞
- derive/^jy?([aeiou])/y$1/ # 容錯 je -> ye, jyu -> yu
- derive/^jyu/ju/ # 容錯 jyu -> ju
#- derive/yu/y/ # 容錯 jyu -> jy
#- derive/yut$/uet/ # Bala yut and uet ie. syut = suet
- derive/^yu?([tn])/yue$1/ # Bala yu*/yue*
- derive/yu(t|n)$/ue$1/ # Bala *yu(t|n)/*ue(t|n)
- derive/yu$/hue/ # Bala *yu/*hue
- derive/eoi$/oey/ # 容錯
- derive/eoi$/eoy/ # 容錯
- derive/eo/oe/ # 容錯 eo/oe 不分
- derive/eoi$/ui/ # Bala eoi/ui
- derive/oe(ng|k)$/eo$1/ # 容錯
- derive/oeng$/eung/ # Bala oe/eu ng
- derive/oe(n|t|k)$/u$1/ # Bala *oe/*u n/t/k
- derive/aa([iutpknm])/a$1/ # Bala aa/a
- derive/aa$/a/ # 容錯
- abbrev/^([a-z]).+$/$1/ # 首字母簡拼
- abbrev/^([a-z]{2}).+$/$1/ # 首2字母簡拼
- abbrev/^([a-z]{3}).+$/$1/ # Bala 首3字母簡拼
translator:
dictionary: jyut6ping3
spelling_hints: 8 # 將呢度改作 0,可以去除候選字後邊嘅粵拼提示
preedit_format:
- xform/([aeioumngptk])vv/${1}4/
- xform/([aeioumngptk])xx/${1}5/
- xform/([aeioumngptk])qq/${1}6/
- xform/([aeioumngptk])v/${1}1/
- xform/([aeioumngptk])x/${1}2/
- xform/([aeioumngptk])q/${1}3/
luna_pinyin:
tag: luna_pinyin
dictionary: luna_pinyin
prefix: "`"
suffix: ";"
tips: 〔普通話拼音〕
preedit_format:
- xform/([nl])v/$1ü/
- xform/([nl])ue/$1üe/
- xform/([jqxy])v/$1u/
loengfan:
tag: loengfan
dictionary: loengfan
prefix: "r"
suffix: ";"
tips: 〔粵語兩分〕
stroke:
tag: stroke
dictionary: stroke
prefix: "x"
suffix: ";"
tips: 〔筆畫〕
preedit_format:
- xlit/hspnz/一丨丿丶乙/
cangjie5:
tag: cangjie5
dictionary: cangjie5
enable_user_dict: false
prefix: "v"
suffix: ";"
tips: 〔倉頡五代〕
preedit_format:
- 'xform/^([a-z]*)$/$1\t(\U$1\E)/'
- "xlit|ABCDEFGHIJKLMNOPQRSTUVWXYZ|日月金木水火土竹戈十大中一弓人心手口尸廿山女田難卜符|"
comment_format:
- "xlit|abcdefghijklmnopqrstuvwxyz~|日月金木水火土竹戈十大中一弓人心手口尸廿山女田難卜符~|"
disable_user_dict_for_patterns:
- "^z.*$"
- "^yyy.*$"
jyut6ping3_reverse_lookup:
tags: [ luna_pinyin, loengfan, stroke, cangjie5 ]
overwrite_comment: false
dictionary: jyut6ping3
variants_hk:
option_name: variants_hk
opencc_config: t2hkf.json
trad_tw:
option_name: trad_tw
opencc_config: t2tw.json
emoji_suggestion:
opencc_config: emoji.json
option_name: emoji_suggestion
tips: all
punctuator:
import_preset: symbols_cantonese
key_binder:
import_preset: default
recognizer:
import_preset: default
patterns:
punct: "^/([0-9]0?|[a-z]+)$"
luna_pinyin: "^`[a-z']*;?$"
loengfan: "^r[a-z']*;?$"
stroke: "^x[hspnz]*;?$"
cangjie5: "^v[a-z]*;?$"