Skip to content

Commit 6f51bdd

Browse files
committed
feat: 不派生中英混输词库的大写形式; close #344
1 parent 67979e9 commit 6f51bdd

8 files changed

+2755
-2741
lines changed

en_dicts/cn_en.dict.yaml

+456-455
Large diffs are not rendered by default.

en_dicts/cn_en_double_pinyin.dict.yaml

+456-455
Large diffs are not rendered by default.

en_dicts/cn_en_double_pinyin_abc.dict.yaml

+456-455
Large diffs are not rendered by default.

en_dicts/cn_en_double_pinyin_flypy.dict.yaml

+456-455
Large diffs are not rendered by default.

en_dicts/cn_en_double_pinyin_mspy.dict.yaml

+456-455
Large diffs are not rendered by default.

en_dicts/cn_en_double_pinyin_ziguang.dict.yaml

+456-455
Large diffs are not rendered by default.

melt_eng.schema.yaml

+10-4
Original file line numberDiff line numberDiff line change
@@ -86,16 +86,19 @@ speller:
8686
- derive/[@]//
8787
- derive/[-]//
8888
- derive/[_]//
89+
90+
# 下面规则中出现的 ⓘ 是中英混输词库编码的前缀标记,用于避免这些编码被派生出纯大写
91+
8992
# 派生无任何非字母数字字符的拼写
90-
- derive/[^a-zA-Z0-9]//
93+
- derive/[^a-zA-Z0-9ⓘ]//
9194
# 禁用非英文、数字开头的编码
92-
- erase/^[\W|_].+$/
95+
- erase/^[^a-zA-Z0-9ⓘ].+$/
9396
# 全小写
9497
- derive/^.+$/\L$0/
9598
# 全大写
96-
- derive/^.+$/\U$0/
99+
- derive/^(?!ⓘ).+$/\U$0/
97100
# 首字母大写
98-
- derive/^./\U$0/
101+
- derive/^(?!ⓘ)./\U$0/
99102
# 前 2~10 个字母大写
100103
- derive/^([a-z]{2})/\U$1/
101104
- derive/^([a-z]{3})/\U$1/
@@ -106,6 +109,9 @@ speller:
106109
- derive/^([a-z]{8})/\U$1/
107110
- derive/^([a-z]{9})/\U$1/
108111
- derive/^([a-z]{10})/\U$1/
112+
# 派生中英混输词库(词库编码以ⓘ开头)
113+
- derive/^ⓘ(.+)$/$1/
114+
- derive/^ⓘ(.+)$/\L$1/
109115

110116
translator:
111117
dictionary: melt_eng

others/script/rime/cn_en.go

+9-7
Original file line numberDiff line numberDiff line change
@@ -65,10 +65,11 @@ var polyphones = map[string]string{
6565
"AB血型 > 血": "xue",
6666
"O型血 > 血": "xue",
6767
"O血型 > 血": "xue",
68-
"没Bug > 没": "mei",
69-
"没有Bug > 没": "mei",
70-
"卡Bug > 卡": "ka",
71-
"提Bug > 提": "ti",
68+
"没bug > 没": "mei",
69+
"没有bug > 没": "mei",
70+
"卡bug > 卡": "ka",
71+
"查bug > 查": "cha",
72+
"提bug > 提": "ti",
7273
"CT检查 > 查": "cha",
7374
"N卡 > 卡": "ka",
7475
"A卡 > 卡": "ka",
@@ -412,7 +413,7 @@ func CnEn() {
412413
uniq.Add(line)
413414
for _, schema := range schemas {
414415
code := textToPinyin(line, schema)
415-
_, err := schema.file.WriteString(line + "\t" + code + "\n")
416+
_, err := schema.file.WriteString(line + "\t" + "ⓘ" + code + "\n")
416417
if err != nil {
417418
log.Fatalln(err)
418419
}
@@ -432,8 +433,9 @@ func writePrefix(s schema) {
432433
#
433434
# https://github.com/iDvel/rime-ice
434435
# ------- 中英混输词库 for %s -------
435-
# 由 others/cn_en.txt 生成
436-
#
436+
# 由 others/cn_en.txt 自动生成
437+
# 编码前的 ⓘ 符号是为了防止英文方案拼写派生时派生出全大写字母
438+
# 示例:输入 txu 得到 T恤;输入 Txu 得到 T恤; 输入 TXU 则只会得到 TXU
437439
---
438440
name: %s
439441
version: "1"

0 commit comments

Comments
 (0)