-
Notifications
You must be signed in to change notification settings - Fork 0
/
gninpou_ipa.schema.yaml
265 lines (244 loc) · 6.73 KB
/
gninpou_ipa.schema.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
# Rime schema
# encoding: utf-8
schema:
schema_id: gninpou_ipa
name: 寧波話(IPA版)
version: "0.1.1"
author:
- Shin Zoqchiuq <shinzoqchiuq@outlook.com>
description: |
採用學堂式吳語拼音(顯示IPA)
老三區口音
https://www.wugniu.com/
https://github.com/shinzoqchiuq/rime-gninpou-variant/
dependencies:
- luna_pinyin
- stroke
switches:
- name: ascii_mode
reset: 0
states: [ 中文, 西文 ]
- name: full_shape
states: [ 半角, 全角 ]
- name: simplification
reset: 1
states: [ 漢字, 汉字 ]
- name: ascii_punct
states: [ 。,, ., ]
engine:
processors:
- ascii_composer
- recognizer
- key_binder
- speller
- punctuator
- selector
- navigator
- express_editor
segmentors:
- ascii_segmentor
- matcher
- affix_segmentor@luna_pinyin # 自定義tag luna_pinyin
- affix_segmentor@stroke # 自定義tag stroke
- abc_segmentor
- punct_segmentor
- fallback_segmentor
translators:
- punct_translator
- script_translator # 主翻譯器
- script_translator@luna_pinyin # 用於反查的luna_pinyin翻譯器
- table_translator@stroke # 用於反查的stroke翻譯器
- table_translator@custom_phrase # 用戶短語
filters:
- simplifier
- uniquifier
- reverse_lookup_filter@reverse_lookup # 反查濾鏡
speller:
alphabet: abcdefghijklmnopqrstuvwxyz
delimiter: " '"
algebra:
- xform/^([bcdfghjklpqstvwxyz])$/$1_/
# 還原城區音系
- xform/(\w*)-(\w*)/$1/
# io韻消失
- erase/(^|c|j|gn|kn|[csz]h)(y|i)o$/
# 兼容吳語協會式拼音
- derive/q/h/
- derive/(i|y)au/$1o/
- derive/([gk])ni(?=[nqh]|\d|\b)/nyi/
- derive/([gk])ni(?=[aoue])/ny/
- derive/(?<=[szh])yu(?=[nqh])/oe/
- derive/er/r/
# 胡符不分
- derive/wu$/vu/
- derive/vu$/wu/
# 亂漏不分
- derive/loe/leu/
# 新派
# 且采不分
- derive/c(h)?ie$/ts$1e/
- derive/jie$/dze/
- derive/(?<=[sz])hie$/e/
- derive/^ye$/ghe/
# 降壯不分
- derive/ciaon/tsaon/
# 穿秋不分
- derive/ts(h)?oe$/c$1ieu/
- derive/dzoe$/jieu/
- derive/^(s|z)oe$/$1hieu/
# 掛架不分
- derive/(kh?)uo/$1o/
# 話夏不分
- derive/wo/gho/
- derive/^(h)?uo/$1o/
# 官孤不分
- derive/(?<![iy])un/u/
# 春沖不分 出促不分
- derive/(?<=[szh])(yu|oe)(?=[nqh])/o/
# 羣窮不分 缺吃不分
- derive/(^y|i)u(?=[nqh])/$1o/
- derive/(^y|i)o(?=[nqh])/$1u/
# 約一不分
- derive/ia(?=q|h)/i/
- derive/ya(?=q|h)/yi/
# 清鼻邊音
- derive/([mnl])h/$1/
- derive/kn/gn/
- derive/nk/ng/
# 容錯 gn(ny) => n kn => nh
- derive/(gn|ny)i/ni/
- derive/kni/nhi/
- derive/ny(?=[aoue])/ni/
# 簡拼
- abbrev/^([a-z]).+$/$1/
- abbrev/^([pmtnlszckg]h|[kg]n|n[kg]|tsh?|dz).+$/$1/
# 容錯 un => oe
- derive/([pbmw]|ph)un/$1oe/
- derive/^([kgh]|kh)?un/$1uoe/
# 容錯 au => ao
- derive/au/ao/
# c組聲母後自動加i
- derive/^(c|j|gn|kn|[csz]h)i(?=[aoue])/$1/
# 容錯 介音、主元音順序調換
- derive/^(.+)([iu])([aeou])([euonqh])$/$1$3$2$4/
# 容錯 oe => eo
- derive/oe/eo/
# 容錯 ao => oa
- derive/ao/oa/
# 容錯 ae => ea
- derive/ae/ea/
# 主翻譯器 寧波吳拼
translator:
dictionary: wugniu_gninpou # 調取詞典wugniu_gninpou
prism: gninpou_ipa # 根據拼寫運算生成棱鏡文件gninpou_ipa
preedit_format:
- "xform/'/ /"
- xform/(?<=[aeiou])h\b/q/
- xform/\bni/gni/
- xform/\bnhi/kni/
- xform/\bnyi/gni/
- xform/\bnhyi/kni/
- xform/\bny/gni/
- xform/\bnhy/kni/
- xform/\br\b/er/
- xform/oe(?=[qhn])/yu/
- xform/(?<=[iy])o\b/au/
- xform/oa/ao/
- xform/ao(?!n)/au/
- xform/eo/oe/
- xform/ea/ae/
- xform/\b(.+)([aeou])([iu])([euonqh])\b/$1$3$2$4/
- xform/\b([cj]|gn|kn|[csz]h)(?=[aoue])/$1i/
- xform/\by\b/ɦi/
- xform/\bw\b/ɦu/
- xform/\b([ptck]|ts)h/$1ʰ/
- xform/\bc/tɕ/
- xform/\bj/dʑ/
- xform/\bgn/ȵ/
- xform/\bkn/ʔȵ/
- xform/\bsh/ɕ/
- xform/\bzh/ʑ/
- xform/\bng/ŋ/
- xform/\bnk/ʔŋ/
- xform/\b([mnl])h/ʔ$1/
- xform/\bgh/ɦ/
- xform/\bg/ɡ/
- xform/\byi|\by(?=a|e)/ɦi/
- xform/\bwu|\bw(?=a|e|o)/ɦu/
- xform/\byu|\by(?=o)/ɦy/
- xform/ʔ(m|n)\b/ʔ$1̩/
- xform/\b(m|n)\b/$1̩/
- xform/\bŋ\b/ŋ̍/
- xform/ʔŋ\b/ʔŋ̍/
- xform/(s|z|sʰ)yu/$1ʮ/
- xform/(s|z|sʰ)y/$1ɿ/
- xform/iu|i(?=o|ao)/y/
- xform/a[ou]/ɔ/
- xform/iɔ/io/
- xform/ae/ɛ/
- xform/([pbmtdnlu]|pʰ|tʰ)oe/$1ø/
- xform/oe/ʏ/
- xform/ieu/iʏ/
- xform/ei/ɐɪ/
- xform/ou/əu/
- xform/eu/œʏ/
- xform/e(?=n)/ə/
- xform/y(?=n|q)/yə/
- xform/ʮ(?=n)/ʮø/
- xform/a(?=q)/ɐ/
- xform/i(?=q)/iɪ/
- xform/ʮ(?=q)/ʮœ/
- xform/(a|ɔ|u)n/$1̃/
- xform/(?<=[əioø])n(?=\b)/ŋ/
- xform/q(?=\b)/ʔ/
- xform/er/əl/
# 副翻譯器1 朙月拼音
luna_pinyin:
tag: luna_pinyin
dictionary: luna_pinyin # 調取詞典luna_pinyin
enable_user_dict: false # 關閉用戶詞典
prefix: '`' # 引導鍵「`」
suffix: "'" # 結束鍵「'」
tips: 〔反查〕 # 輸入前提示〔反查〕
closing_tips: 〔吳語(寧波)〕
preedit_format:
- xform/([nl])v/$1ü/
- xform/([nl])ue/$1üe/
- xform/([jqxy])v/$1u/
# 副翻譯器2 五筆畫
stroke:
tag: stroke
dictionary: stroke # 調取詞典stroke
enable_user_dict: false # 關閉用戶詞典
prefix: '`' # 引導鍵「`」
suffix: "'" # 結束鍵「'」
tips: 〔反查〕 # 輸入前提示〔反查〕
closing_tips: 〔吳語(寧波)〕
preedit_format:
- xlit/hspnz/一丨丿丶乙/
# 副翻譯器3 用戶短語
custom_phrase:
dictionary: ""
user_dict: custom_phrase # 用戶詞典名
db_class: stabledb # 詞典類型爲只讀格式
enable_completion: false
enable_sentence: false
initial_quality: 1
# 反查濾鏡
reverse_lookup:
tags: [luna_pinyin, stroke] # 掛在翻譯器luna_pinyin和stroke上
overwrite_comment: true # 覆蓋其他提示
dictionary: wugniu_gninpou # 反查所得爲寧波吳拼
comment_format:
# 還原城區音系
- xform/(\w*)-(\w*)/$1/
punctuator:
import_preset: symbols # 句讀處理器,統一從外部導入
key_binder:
import_preset: default # 快捷鍵,統一從外部導入
recognizer:
import_preset: default # 特殊規則輸入碼,統一從外部導入
patterns:
punct: "^/([0-9]|10|[A-Za-z]+)$" # 按 / 輸入符號
luna_pinyin: "`[hspnz]*[aeiouv][a-z]*'?$|`[a-gi-moqrt-y][a-z]*'?$"
stroke: "`[hspnz]+'?$"