-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathshanghe_xhipin.schema.yaml
249 lines (233 loc) · 6.24 KB
/
shanghe_xhipin.schema.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
# Rime schema
# encoding: utf-8
schema:
schema_id: shanghe_xhipin
name: 上海中派(錢拼)
version: "0.3.1"
author:
- Shin Zoqchiuq <[email protected]> (schema)
description: |
中派上海話輸入方案(錢拼)
採用上海話拼音方案 正式(錢拼)
本方案依賴於
- 上海吳語拼音輸入方案 ℞ NGLI/rime-wugniu_zaonhe
https://github.com/shinzoqchiuq/rime-shanghainese/
dependencies:
- luna_pinyin
- stroke
switches:
- name: ascii_mode
reset: 0
states: [ 中文, 西文 ]
- name: full_shape
states: [ 半角, 全角 ]
- name: simplification
reset: 1
states: [ 漢字, 汉字 ]
- name: ascii_punct
states: [ 。,, ., ]
engine:
processors:
- ascii_composer
- recognizer
- key_binder
- speller
- punctuator
- selector
- navigator
- express_editor
segmentors:
- ascii_segmentor
- matcher
- affix_segmentor@luna_pinyin # 自定義tag luna_pinyin
- affix_segmentor@stroke # 自定義tag stroke
- abc_segmentor
- punct_segmentor
- fallback_segmentor
translators:
- punct_translator
- script_translator # 主翻譯器
- script_translator@luna_pinyin # 用於反查的luna_pinyin翻譯器
- table_translator@stroke # 用於反查的stroke翻譯器
- table_translator@custom_phrase # 用戶短語
filters:
- simplifier
- uniquifier
- reverse_lookup_filter@reverse_lookup # 反查濾鏡
speller:
alphabet: abcdefghijklmnopqrstuvwxyz
delimiter: " '"
algebra:
- xform/^([bcdfghjklpqstvwxyz])$/$1_/
# 轉換爲錢拼
- xform/^([mnl])/$1h/
- xform/^([mnl])hh/$1/
- xform/^gn/nh/
- xform/^kn/n/
- xform/^nhk/ng/
- xform/^gh/hh/
- xform/^(c|j|[csz]h)i(?=u)/$1/
- xform/^([bdgj])/$1h/
- xform/q/k/
- xform/ch/q/
- xform/c/j/
- xform/^sh/x/
- xform/zh/xh/
- xform/z/sh/
- xform/tsh/c/
- xform/ts/z/
- xform/^p(?!h)/b/
- xform/^t(?!h)/d/
- xform/^k(?!h)/g/
- xform/^([ptk])h/$1/
- xform/v/fh/
- xform/^([yw])/$1h/
- xform/^i(?=[aeou])/y/
- xform/^u(?=[aeo])/w/
- xform/^i(?=n|k|$)/yi/
- xform/^u$/wu/
- xform/iu/yu/
- xform/(yh?)oe/$1uoe/
- xform/(jh?|q|xh?)ioe/$1uoe/
- xform/(nh?)ioe/$1yuoe/
- xform/au/ao/
- xform/eu/ou/
- xform/iou/iu/
- xform/aon/ang/
- xform/on/ong/
- xform/uk/uik/
# 尖團不分
- derive/zi/ji/
- derive/ci/qi/
- derive/^s(h?)i/x$1i/
- derive/zyu/ju/
- derive/cyu/qu/
- derive/^s(h?)yu/x$1u/
# 清鼻邊音
- derive/^([mnl])h/$1/
# fh => v
- derive/^fh/v/
# 干官不分
- derive/^([gkh])uoe/$1oe/
- derive/^whoe/hhoe/
- derive/^woe/oe/
# 余圓不分
- derive/^(yh?|jh?|q|xh?)uoe$/$1u/
- derive/^(nh?)yuoe$/$1yu/
# 打黨不分
- derive/ang$/an/
- derive/an$/ang/
# 格割不分
- derive/ek/ak/
- derive/([bmfdnlsjxgh]h)a(?=k)/$1e/
- derive/(?<![iyh])a(?=k)/e/
# 約一不分
- derive/ia(?=k)/i/
- derive/(yh?)a(?=k)/$1i/
- derive/(?<!u)i(?=k)/ia/
- derive/(yh?)i(?=k)/$1a/
# 容錯 yuik => yuk
- derive/uik/uk/
# 聲母簡拼
- abbrev/^([a-z]).+$/$1/
- abbrev/^([bmfdnlsjxghyw]h|ng|nhg).+$/$1/
# 容錯 ao => oa
- derive/ao/oa/
# 容錯 介音、主元音順序調換
- derive/^(.+)([iu])([aeou])([euonk])$/$1$3$2$4/
# 容錯 oe => eo
- derive/oe/eo/
# 容錯 ong => on
- derive/ong/on/
# 主翻譯器
translator:
dictionary: wugniu_zaonhe # 調取詞典wugniu_zaonhe
prism: shanghe_xhipin # 根據拼寫運算生成棱鏡文件shanghe_xhipin
spelling_hints: 5 # 標註拼音
comment_format:
# 轉換爲錢拼
- xform/\b([mnl])/$1h/
- xform/\b([mnl])hh/$1/
- xform/\bgn/nh/
- xform/\bkn/n/
- xform/\bnhk/ng/
- xform/\bgh/hh/
- xform/\b(c|j|[csz]h)i(?=u)/$1/
- xform/\b([bdgj])/$1h/
- xform/q/k/
- xform/ch/q/
- xform/c/j/
- xform/\bsh/x/
- xform/zh/xh/
- xform/z/sh/
- xform/tsh/c/
- xform/ts/z/
- xform/\bp(?!h)/b/
- xform/\bt(?!h)/d/
- xform/\bk(?!h)/g/
- xform/\b([ptk])h/$1/
- xform/v/fh/
- xform/\b([yw])/$1h/
- xform/\bi(?=[aeou])/y/
- xform/\bu(?=[aeo])/w/
- xform/\bi(?=n|k|\b)/yi/
- xform/\bu\b/wu/
- xform/iu/yu/
- xform/(yh?)oe/$1uoe/
- xform/(jh?|q|xh?)ioe/$1uoe/
- xform/(nh?)ioe/$1yuoe/
- xform/au/ao/
- xform/eu/ou/
- xform/iou/iu/
- xform/aon/ang/
- xform/on/ong/
- xform/uk/uik/
# 副翻譯器1 朙月拼音
luna_pinyin:
tag: luna_pinyin
dictionary: luna_pinyin # 調取詞典luna_pinyin
enable_user_dict: false # 關閉用戶詞典
prefix: '`' # 引導鍵「`」
suffix: "'" # 結束鍵「'」
tips: 〔拼音〕 # 輸入前提示〔拼音〕
closing_tips: 〔錢拼〕
preedit_format:
- xform/([nl])v/$1ü/
- xform/([nl])ue/$1üe/
- xform/([jqxy])v/$1u/
# 副翻譯器2 五筆畫
stroke:
tag: stroke
dictionary: stroke # 調取詞典stroke
enable_user_dict: false # 關閉用戶詞典
prefix: '`' # 引導鍵「`」
suffix: "'" # 結束鍵「'」
tips: 〔筆畫〕 # 輸入前提示〔筆畫〕
closing_tips: 〔錢拼〕
preedit_format:
- xlit/hspnz/一丨丿丶乙/
# 副翻譯器3 用戶短語
custom_phrase:
dictionary: ""
user_dict: custom_phrase # 用戶詞典名
db_class: stabledb # 詞典類型爲只讀格式
enable_completion: false
enable_sentence: false
initial_quality: 1
# 反查濾鏡
reverse_lookup:
tags: [luna_pinyin, stroke] # 掛在翻譯器luna_pinyin和stroke上
overwrite_comment: true # 覆蓋其他提示
dictionary: wugniu_zaonhe # 反查所得爲上海吳語
comment_format:
__include: translator/comment_format
punctuator:
import_preset: symbols # 句讀處理器,統一從外部導入
key_binder:
import_preset: default # 快捷鍵,統一從外部導入
recognizer:
import_preset: default # 特殊規則輸入碼,統一從外部導入
patterns:
punct: "^/([0-9]|10|[A-Za-z]+)$" # 按 / 輸入符號
luna_pinyin: "`[hspnz]*[aeiouv][a-z]*'?$|`[a-gi-moqrt-y][a-z]*'?$"
stroke: "`[hspnz]+'?$"