forked from Mintimate/oh-my-rime
-
Notifications
You must be signed in to change notification settings - Fork 0
/
rime_mint.schema.yaml
executable file
·334 lines (315 loc) · 13.3 KB
/
rime_mint.schema.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
# Rime schema
# encoding: utf-8
schema:
schema_id: rime_mint
name: 薄荷拼音-全拼输入
version: "24.02.15"
author:
- mintimate < @Mintimate|https://www.mintimate.cn >
description: |
Mintimate的薄荷拼音方案。
除了参考官方明月拼音,还参考:
* chenhe: https://chenhe.me
* rime wiki: https://github.com/rime/home/wiki
* rime ice: https://github.com/iDvel/rime-ice
* Chewing - 新酷音
* opencc - 開放中文轉換
dependencies:
- radical_pinyin_flypy # 参考 https://github.com/mirtlecn/rime-radical-pinyin
- wubi98_mint # 98五笔库 https://github.com/yanhuacuo/98wubi-tables
- stroke
- melt_eng # 英文方案
key_binder:
import_preset: default
bindings:
- {accept: "Control+Shift+E", toggle: emoji_suggestion, when: always}
- {accept: "Control+Shift+exclam", toggle: transcription, when: has_menu}
- {accept: "Control+Shift+1", toggle: transcription, when: has_menu}
- {accept: minus, send: Page_Up, when: paging} # 使用`-`进行向上翻页(第一页时候无效)
- {accept: equal, send: Page_Down, when: has_menu} # 使用`=`进行向下翻页
switches:
- name: ascii_mode
reset: 0
states: [ 中文, 英文 ]
- name: emoji_suggestion
reset: 1
states: [ "😣️","😁️"]
- name: full_shape
states: [ 半角, 全角 ]
- name: transcription
reset: 0
states: [ 简体 , 繁体 ]
- name: ascii_punct
states: [ 。,, ., ]
engine:
processors:
- lua_processor@*select_character # 以词定字
- lua_processor@*codeLengthLimit_processor # 使用Lua限制输入内容的最大长度(防止过长而卡顿)
- ascii_composer # ※ 處理西文模式及中西文切換
- recognizer # ※ 與 matcher 搭配,處理符合特定規則的輸入碼,如網址、反查等
- key_binder # ※ 在特定條件下將按鍵綁定到其他按鍵,如重定義逗號、句號爲候選翻頁鍵
- speller
- punctuator
- selector
- navigator
- express_editor
segmentors:
- ascii_segmentor # 標識西文段落
- matcher # 標識符合特定規則的段落,如網址、反查等
- affix_segmentor@wubi98_mint
- affix_segmentor@radical_reverse_lookup
- affix_segmentor@stroke
- abc_segmentor # 標識常規的文字段落
- punct_segmentor # 標識句讀段落
- fallback_segmentor # 標識其他未標識段落
translators:
- punct_translator # ※ 轉換標點符號
- script_translator
- lua_translator@*date_translator # 日期Lua
- lua_translator@*time_translator # 时间Lua
- lua_translator@*week_translator # 星期Lua
- lua_translator@*number_translator # 金额大小写
- lua_translator@*chineseLunarCalendar_translator # 农历
- table_translator@melt_eng # 英文输入(作为子翻译器,优先级需要比原生的低)
- table_translator@cn_en # 中英混合词汇
# - echo_translator # ※ 没有候选词,返回字符
- reverse_lookup_translator@wubi98_mint
- reverse_lookup_translator@radical_reverse_lookup
- reverse_lookup_translator@stroke
# - reverse_lookup_translator # 反查模块,多标签情况下去除
filters:
- lua_filter@*corrector_filter # 错音错字提示
- lua_filter@*autocap_filter # 英文自动大写
- simplifier@emoji_suggestion
- simplifier@transcription_cc
- lua_filter@*reduce_english_filter # 降低部分英语单词在候选项的位置
- uniquifier # 去重
# 简繁切换
transcription_cc:
option_name: transcription
opencc_config: s2t.json # s2t.json | s2hk.json | s2tw.json | s2twp.json
tips: none # 转换提示: all 都显示 | char 仅单字显示 | none 不显示。
excluded_types: [ reverse_lookup ] # 不转换反查(两分拼字)的内容
# 最大输入长度
codeLengthLimit_processor: 25
# Emoji模块
emoji_suggestion:
opencc_config: emoji.json
option_name: emoji_suggestion
tips: all
inherit_comment: false
# Lua 配置: 降低部分英语单词在候选项的位置。
# 详细介绍 https://dvel.me/posts/make-rime-en-better/#短单词置顶的问题
# 正常情况: 输入 rug 得到 「1.rug 2.如果 …… 」
# 降低之后: 输入 rug 得到 「1.如果 2.rug …… 」
# 几种模式:
# all 使用 reduce_english_filter 自带的降频词库(降低所有 3~4 位长度、前 2~3 位是完整拼音、最后一位是声母的单词)
# none 不降低任何单词,相当于没有启用这个 Lua
# custom 自定义,只降低 words 里的
# 『留白』 不设置该选项,使用 reduce_english_filter 内全局设置内容
# (匹配的是编码,不是单词)
reduce_english_filter:
mode: all # all | none | custom | 『留白』
idx: 2 # 降低到第 idx 个位置
# 自定义的单词列表,示例列表没有降低部分常用单词,如 and cat mail Mac but bad shit ……
words: [aid, ann,
bail, bait, bam, band, bans, bat, bay, bend, bent, benz, bib, bid, bien, biz, boc, bop, bos, bud, buf,
cab, cad, cain, cam, cans, cap, cas, cef, chad, chan, chap, chef, cher, chew, chic, chin, chip, chit, coup, cum, cunt, cur,
dab, dag, dal, dam, dent, dew, dial, diet, dim, din, dip, dis, dit, doug, dub, dug, dunn,
fab, fax, fob, fog, foul, fur,
gag, gail, gain, gal, gam, gaol, ged, gel, ger, guam, gus, gut,
hail, ham, hank, hans, hat, hay, heil, heir, hem, hep, hud, hum, hung, hunk, hut,
jim, jug,
kat,
lab, lad, lag, laid, lam, laos, lap, lat, lax, lay, led, leg, lex, liam, lib, lid, lied, lien, lies, linn, lip, lit, liz, lob, lug, lund, lung, lux,
mag, maid, mann, mar, mat, med, mel, mend, mens, ment, mil, mins, mint, mob, moc, mop, mos, mot, mud, mug, mum, nail,
nap, nat, nay, neil, nib, nip, noun, nous, nun, nut,
pac, paid, pail, pain, pair, pak, pal, pam, pans, pant, pap, par, pat, paw, pax, pens, pic, pier, pies, pins, pint, pit, pix, pod, pop, pos, pot, pour, pow, pub,
rand, rant, rent, rep, res, ret, rex, rib, rid, rig, rim, rub, rug, rum, runc, runs,
sac, sail, sal, sam, sans, sap, saw, sax, sew, sham, shaw, shin, sig, sin, sip, sis, suit, sung, suns, sup, sur, sus,
tad, tail, taj, tar, tax, tec, ted, tel, ter, tex, tic, tied, tier, ties, tim, tin, tit, tour, tout, tum,
wag, wand, womens, wap, wax, weir, won,
yan, yen]
# 中国农历配置
chineseLunarCalendar_translator: lunar
translator:
# 字典文件
dictionary: rime_mint # 使用的字典文件
spelling_hints: 8 # corrector.lua :为了让错音错字提示的 Lua 同时适配全拼双拼,将拼音显示在 comment 中
always_show_comments: true # corrector.lua :Rime 默认在 preedit 等于 comment 时取消显示 comment,这里强制一直显示,供 corrector.lua 做判断用。
preedit_format:
- xform/([nl])v/$1ü/
- xform/([nl])ue/$1üe/
- xform/([jqxy])v/$1u/
initial_quality: 1.2
melt_eng:
dictionary: melt_eng # 英文词典
enable_sentence: false # 关闭自动造句
enable_completion: false # 关闭自动提示
initial_quality: 0.8
# 中英混合词汇
cn_en:
dictionary: "" # 中英混输,直接使用短语词典,普通字典直接留空即可
user_dict: dicts/rime_ice.cn_en
db_class: stabledb
enable_completion: false
enable_sentence: false
initial_quality: 0.5
comment_format:
- xform/^.+$//
speller:
# 如果不想让什么标点直接上屏,可以加在 alphabet,或者编辑标点符号为两个及以上的映射;默认没用大写字母,使用大写字母方便中英混熟词典生效
alphabet: zyxwvutsrqponmlkjihgfedcbaZYXWVUTSRQPONMLKJIHGFEDCBA
# 第一位 「空格」是拼音之间的默认分隔符;第二位「`」表示可以手动输入单引号来分割拼音
delimiter: " `"
# 拼写匹配
algebra:
- erase/^xx$/ # 首选保留
# - derive/^([zcs])h/$1/ # zh, ch, sh => z, c, s
# - derive/^([zcs])([^h])/$1h$2/ # z, c, s => zh, ch, sh
# - derive/([aei])n$/$1ng/ # en => eng, in => ing
# - derive/([aei])ng$/$1n/ # eng => en, ing => in
# - derive/([iu])an$/$lan/ # ian => iang, uan => uang
# - derive/([iu])ang$/$lan/ # iang => ian, uang => uan
- derive/([aeiou])ng$/$1gn/ # dagn => dang
- derive/([dtngkhrzcs])o(u|ng)$/$1o/ # zho => zhong|zhou
- derive/ong$/on/ # zhonguo => zhong guo
- abbrev/^([a-z]).+$/$1/ #简拼(首字母)
- abbrev/^([zcs]h).+$/$1/ #简拼(zh, ch, sh)
### 自动纠错
# 有些规则对全拼简拼混输有副作用:如「x'ai 喜爱」被纠错为「xia 下」
# zh、ch、sh
- derive/([zcs])h(a|e|i|u|ai|ei|an|en|ou|uo|ua|un|ui|uan|uai|uang|ang|eng|ong)$/h$1$2/ # hzi → zhi
- derive/([zcs])h([aeiu])$/$1$2h/ # zih → zhi
# ai
- derive/^([wghk])ai$/$1ia/ # wia → wai
# ia
- derive/([qjx])ia$/$1ai/ # qai → qia
# ei
- derive/([wtfghkz])ei$/$1ie/
# ie
- derive/([jqx])ie$/$1ei/
# ao
- derive/([rtypsdghklzcbnm])ao$/$1oa/
# ou
- derive/([ypfm])ou$/$1uo/
# uo(无)
# an
- derive/([wrtypsdfghklzcbnm])an$/$1na/
# en
- derive/([wrpsdfghklzcbnm])en$/$1ne/
# ang
- derive/([wrtypsdfghklzcbnm])ang$/$1nag/
- derive/([wrtypsdfghklzcbnm])ang$/$1agn/
# eng
- derive/([wrtpsdfghklzcbnm])eng$/$1neg/
- derive/([wrtpsdfghklzcbnm])eng$/$1egn/
# ing
- derive/([qtypdjlxbnm])ing$/$1nig/
- derive/([qtypdjlxbnm])ing$/$1ign/
# ong
- derive/([rtysdghklzcn])ong$/$1nog/
- derive/([rtysdghklzcn])ong$/$1ogn/
# iao
- derive/([qtpdjlxbnm])iao$/$1ioa/
- derive/([qtpdjlxbnm])iao$/$1oia/
# ui
- derive/([rtsghkzc])ui$/$1iu/
# iu
- derive/([qjlxnm])iu$/$1ui/
# ian
- derive/([qtpdjlxbnm])ian$/$1ain/
# - derive/([qtpdjlxbnm])ian$/$1ina/ # 和「李娜、蒂娜、缉拿」等常用词有冲突
# in
- derive/([qypjlxbnm])in$/$1ni/
# iang
- derive/([qjlxn])iang$/$1aing/
- derive/([qjlxn])iang$/$1inag/
# ua
- derive/([g|k|h|zh|sh])ua$/$1au/
# uai
- derive/([g|h|k|zh|ch|sh])uai$/$1aui/
- derive/([g|h|k|zh|ch|sh])uai$/$1uia/
# uan
- derive/([qrtysdghjklzxcn])uan$/$1aun/
# - derive/([qrtysdghjklzxcn])uan$/$1una/ # 和「去哪、露娜」等常用词有冲突
# un
- derive/([qrtysdghjklzxc])un$/$1nu/
# ue
- derive/([nlyjqx])ue$/$1eu/
# uang
- derive/([g|h|k|zh|ch|sh])uang$/$1aung/
- derive/([g|h|k|zh|ch|sh])uang$/$1uagn/
- derive/([g|h|k|zh|ch|sh])uang$/$1unag/
- derive/([g|h|k|zh|ch|sh])uang$/$1augn/
# iong
- derive/([jqx])iong$/$1inog/
- derive/([jqx])iong$/$1oing/
- derive/([jqx])iong$/$1iogn/
- derive/([jqx])iong$/$1oign/
# 其他
- derive/([rtsdghkzc])o(u|ng)$/$1o/ # do → dou|dong
- derive/ong$/on/ # lon → long
- derive/([tl])eng$/$1en/ # ten → teng
- derive/([qwrtypsdfghjklzxcbnm])([aeio])ng$/$1ng/ # lng → lang、leng、ling、long
wubi98_mint:
tag: wubi98_mint
dictionary: wubi98_mint
enable_user_dict: false
enable_completion: true
prefix: "uw"
suffix: "'"
tips: 〔五笔〕
stroke:
tag: stroke
dictionary: stroke
enable_user_dict: false
prefix: 'ui'
suffix: "'"
tips: 〔笔画〕
preedit_format:
- xlit/hspnz/一丨丿丶乙/
radical_reverse_lookup:
tag: radical_lookup
dictionary: radical_pinyin
enable_completion: false
enable_sentence: false
prefix: "uu"
suffix: " '"
comment_format:
- erase/^.*$//
tips: 〔拆字〕
reverse_lookup:
tags: [wubi98_mint,stroke,radical_lookup]
overwrite_comment: true
dictionary: dicts/rime_ice.8105
punctuator:
import_preset: symbols
# 定义部分半角字符
half_shape:
"#": "#"
"*": "*"
'.' : { commit: 。 }
"`": "`"
"~": "~"
"@": "@"
"=": "="
"/": ["/", "÷",]
'\': "、"
"_" : "──"
"'": {pair: ["「", "」"]}
"[": ["【", "["]
"]": ["】", "]"]
"$": ["¥", "$", "€", "£", "¢", "¤"]
"<": ["《", "〈", "«", "<"]
">": ["》", "〉", "»", ">"]
recognizer:
import_preset: default
patterns:
url: "^[a-z]+[.].+$"
punct: "^/([0-9]0?|[a-z]+)$"
wubi98_mint: "uw[a-z]*'?$"
stroke: "ui[a-z]*'?$"
radical_lookup: "uu[a-z]*'?$"
rmb: "^R[0-9]+[.]?[0-9]*" # 响应 lua_translator@number_translator 脚本将自动获取第 2 个字符作为触发前缀
gregorian_to_lunar: "^N[0-9]{1,8}" # 响应 lua_translator@Chinese_lunar_calendar 公历转农历,输入 N20240115 得到「二〇二四年腊月初五」,脚本将自动获取第 2 个字符作为触发前缀