mirror of
https://gitee.com/ShopeX/OMS
synced 2026-04-13 01:05:42 +08:00
293 lines
4.3 KiB
INI
293 lines
4.3 KiB
INI
;
|
||
; auto rules (utf-8)
|
||
; $Id$
|
||
;
|
||
; Special words: terms containing symbols such as "+", "#", "&", "-" or "/".
; One term per line.
; NOTE(review): presumably the consumer keeps each of these as a single token - confirm.
|
||
;
|
||
|
||
[special]
|
||
C++
|
||
C#
|
||
R&B
|
||
P&G
|
||
J++
|
||
J#
|
||
UTF-8
|
||
PS/2
|
||
|
||
;
|
||
; nostats: list of common lowercase English function words, one per line.
; NOTE(review): the section name suggests these words are left out of
; statistics by the consumer - confirm against the code that reads this file.
|
||
;
|
||
[nostats]
|
||
about
|
||
all
|
||
also
|
||
an
|
||
and
|
||
any
|
||
are
|
||
as
|
||
at
|
||
be
|
||
but
|
||
by
|
||
both
|
||
can
|
||
for
|
||
from
|
||
have
|
||
here
|
||
if
|
||
in
|
||
is
|
||
it
|
||
no
|
||
not
|
||
of
|
||
on
|
||
or
|
||
our
|
||
out
|
||
that
|
||
the
|
||
this
|
||
to
|
||
up
|
||
us
|
||
|
||
;
|
||
; Part-of-speech grammar rule table.
; Each entry has the form "<tag> + <tag> = <number>"; one of the two tags
; carries a "(1)" marker and "*" appears in place of a tag in the last two rules.
; NOTE(review): presumably the number is a weight applied when the two tags
; occur next to each other - confirm against the consumer.
|
||
;
|
||
[attrs]
|
||
; c is the conjunction tag
; NOTE(review): the rule "n + m(1) = 500" is listed twice in this section;
; confirm whether the second occurrence is intentional.
|
||
p(1) + n = 5
|
||
n + f(1) = 300
|
||
n + m(1) = 500
|
||
n(1) + v = 100
|
||
n + v(1) = 10
|
||
r + n(1) = 1000
|
||
r(1) + n = 100
|
||
d(1) + r = 100
|
||
d(1) + v = 100
|
||
v(1) + r = 100
|
||
n + m(1) = 500
|
||
v + f(1) = 30
|
||
v(1) + m = 100
|
||
v(1) + n = 3
|
||
a + u(1) = 5
|
||
v + n(1) = 5
|
||
u(1) + a = 2
|
||
c(1) + * = 50
|
||
* + c(1) = 50
|
||
|
||
;
|
||
; Stop-word table for names.
; This section is named in the ":exclude" list of the name and place sections
; ([pubname], [pubname2], [pubname3], [surname], [surname2], [areaname], [areaname2]).
; NOTE(review): with ":line = no" each character is presumably a separate entry - confirm.
|
||
;
|
||
[noname]
|
||
:line = no
|
||
给的说对在和是被最所那这有将
|
||
你会与他为不没很了啊哦呵把去
|
||
|
||
;
|
||
; Double-byte symbols.
; This section is named in the ":exclude" list of the name and place sections.
; Note that the data lines below contain ";" characters but do not start with
; one, so they are data rather than comments.
|
||
;
|
||
[symbol]
|
||
:type = none
|
||
:line = no
|
||
`-=[]、‘;/。,|?》《:“{}+—)(*…%¥#·!~
|
||
’”〕〈〉「」『』〖〗【】<>
|
||
|
||
;
|
||
; Characters shared by surnames and foreign names.
; This section is named in the ":include" list of [foregin].
; NOTE(review): ":tf" / ":idf" look like term weights and ":attr = nr" like a
; part-of-speech tag for the recognised word - confirm against the consumer.
|
||
;
|
||
[pubname]
|
||
:type = prefix
|
||
:line = no
|
||
:exclude = noname,symbol,alpha,chnum2
|
||
:znum = 1,2
|
||
:tf = 5.0
|
||
:idf = 3.5
|
||
:attr = nr
|
||
艾安贝卜戴费福盖戈古赫华霍吉贾金柯赖劳雷黎利林卢
|
||
鲁伦罗洛马麦米莫穆齐乔冉萨沙史斯温谢尤詹诸
|
||
|
||
|
||
; pubname2: two further name-prefix characters, configured like [pubname]
; but without a ":znum" line.
; This section is named in the ":include" lists of [chnum4] and [foregin].
[pubname2]
|
||
:type = prefix
|
||
:line = no
|
||
:exclude = noname,symbol,alpha,chnum2
|
||
:tf = 5.0
|
||
:idf = 3.5
|
||
:attr = nr
|
||
伍陆
|
||
|
||
; pubname3: two further name-prefix characters, configured like [pubname]
; but without a ":znum" line.
; This section is named in the ":include" lists of [chnum0], [chnum1],
; [chnum2], [chnum4], [chnum5] and [foregin].
[pubname3]
|
||
:type = prefix
|
||
:line = no
|
||
:exclude = noname,symbol,alpha,chnum2
|
||
:tf = 5.0
|
||
:idf = 3.5
|
||
:attr = nr
|
||
万章
|
||
|
||
;
|
||
; Single-character surnames.
; NOTE(review): with ":line = no" each character on the data lines is
; presumably a separate entry - confirm.
|
||
;
|
||
[surname]
|
||
:type = prefix
|
||
:line = no
|
||
:exclude = noname,symbol,alpha,chnum2
|
||
:tf = 5.0
|
||
:idf = 3.5
|
||
:attr = nr
|
||
:znum = 1,2
|
||
|
||
敖白班包宝保鲍毕边卞柏蔡曹岑柴昌常车陈成程迟池褚
|
||
楚储淳崔刀邓狄刁丁董窦杜端段樊范方房斐丰封冯凤伏
|
||
傅甘高耿龚宫勾苟辜谷顾官关管桂郭韩杭郝禾何贺衡洪
|
||
侯胡花黄稽姬纪季简翦姜江蒋焦晋靳荆居康空孔匡邝况
|
||
蓝郎朗乐冷李理厉励连廉练良梁廖凌刘柳隆龙楼娄吕路
|
||
骆麻满茅毛梅孟苗缪闵明牟倪聂牛钮农潘庞裴彭皮朴平
|
||
蒲溥浦戚祁钱强秦丘邱仇裘屈瞿权饶任荣容阮瑞芮赛单
|
||
商邵佘申沈盛石寿舒宋苏孙邰谭谈汤唐陶滕田佟仝屠涂
|
||
汪王危韦魏卫蔚闻翁巫邬武吴奚习夏鲜席冼项萧解辛邢
|
||
幸熊徐许宣薛荀颜阎言严彦晏燕杨阳姚叶蚁易殷银尹应
|
||
英游于於鱼虞俞余禹喻郁尉袁岳云臧曾查翟湛张赵甄郑
|
||
钟周朱竺祝庄卓宗邹祖左肖
|
||
|
||
;
|
||
; Compound surnames (every entry below is two characters long).
; Unlike [surname], this section sets ":line = yes" and lists one entry per line.
|
||
;
|
||
[surname2]
|
||
:type = prefix
|
||
:line = yes
|
||
:exclude = noname,symbol,alpha,chnum2
|
||
:tf = 5.0
|
||
:idf = 3.5
|
||
:attr = nr
|
||
:znum = 1, 2
|
||
东郭
|
||
公孙
|
||
皇甫
|
||
慕容
|
||
欧阳
|
||
单于
|
||
司空
|
||
司马
|
||
司徒
|
||
澹台
|
||
诸葛
|
||
|
||
;
|
||
; Place names: single-character endings (county, city, town, village,
; township, district), declared with ":type = suffix".
; NOTE(review): ":attr = ns" looks like the part-of-speech tag given to the
; recognised place name - confirm against the consumer.
|
||
;
|
||
[areaname]
|
||
:type = suffix
|
||
:znum = 2
|
||
:exclude = noname,symbol,alpha,chnum2
|
||
:tf = 4.5
|
||
:idf = 3.0
|
||
:attr = ns
|
||
:line = no
|
||
|
||
县市镇村乡区
|
||
|
||
;
|
||
; Two-character place names (road and street endings), one entry per line.
; Same directives as [areaname] except ":line = yes".
|
||
;
|
||
[areaname2]
|
||
:type = suffix
|
||
:znum = 2
|
||
:exclude = noname,symbol,alpha,chnum2
|
||
:tf = 4.5
|
||
:idf = 3.0
|
||
:attr = ns
|
||
:line = yes
|
||
东路
|
||
西路
|
||
支路
|
||
街道
|
||
南路
|
||
北路
|
||
|
||
|
||
; munit: character list named in the ":include" lists of [chnum0], [chnum1],
; [chnum2], [chnum4] and [chnum5].
; NOTE(review): presumably unit / measure characters that may follow a
; number - confirm against the consumer.
[munit]
|
||
:type = none
|
||
:line = no
|
||
萬亿零年点分秒回节名个多届次集
|
||
|
||
; chnum0: the full-width digit zero.
; Named in the ":include" lists of [chnum1] and [chnum2].
[chnum0]
|
||
:type = prefix
|
||
:line = no
|
||
:tf = 2.5
|
||
:idf = 1.0
|
||
:attr = mt
|
||
:include = chnum2,chnum3,munit,pubname3
|
||
0
|
||
|
||
; chnum1: Chinese numeral characters (one to ten, hundred, thousand).
; The ":include" list names this section itself and is also named by [chnum5].
[chnum1]
|
||
:type = prefix
|
||
:include = chnum0,chnum1,munit,pubname3
|
||
:tf = 3.0
|
||
:idf = 1.0
|
||
:attr = mt
|
||
:line = no
|
||
一二三四五六七八九十百千
|
||
|
||
; chnum2: the full-width digits 1 to 9.
; Named in the ":exclude" list of the name and place sections and in the
; ":include" lists of [chnum0], [chnum5] and this section itself.
[chnum2]
|
||
:type = prefix
|
||
:line = no
|
||
:tf = 3.0
|
||
:idf = 1.0
|
||
:attr = mt
|
||
:include = chnum0,chnum2,chnum3,munit,pubname3
|
||
123456789
|
||
|
||
; chnum3: the full-width full stop.
; Named in the ":include" lists of [chnum0] and [chnum2].
; NOTE(review): presumably acts as a decimal point inside numbers - confirm.
[chnum3]
|
||
:type = none
|
||
:line = no
|
||
.
|
||
|
||
; chnum4: formal (financial) Chinese numeral characters.
; The characters for 5 and 6 are not in the list below; they appear in
; [pubname2], which this section names in its ":include" list.
[chnum4]
|
||
:type = prefix
|
||
:line = no
|
||
:tf = 3.0
|
||
:idf = 1.0
|
||
:attr = mt
|
||
:include = chnum4,munit,pubname2,pubname3
|
||
|
||
壹贰叁肆柒捌玖拾佰仟
|
||
|
||
; chnum5: two prefix characters (the ordinal marker and "every") whose
; ":include" list names the numeral sections [chnum1] and [chnum2].
; Unlike the other chnum* sections this one uses ":attr = nz".
[chnum5]
|
||
:type = prefix
|
||
:line = no
|
||
:tf = 3.5
|
||
:idf = 2.0
|
||
:attr = nz
|
||
:include = chnum1,munit,pubname3,chnum2
|
||
|
||
第每
|
||
|
||
; alpha: full-width Latin letters, lowercase then uppercase; the uppercase
; line ends with an apostrophe character.
; The ":include" list names this section itself, and the section is named in
; the ":exclude" list of the name and place sections.
[alpha]
|
||
:type = prefix
|
||
:line = no
|
||
:tf = 2.5
|
||
:idf = 1.0
|
||
:attr = en
|
||
:include = alpha
|
||
|
||
abcdefghijklmnopqrstuvwxyz
|
||
ABCDEFGHIJKLMNOPQRSTUVWXYZ'
|
||
|
||
; foregin (sic): character list tagged ":attr = nr" whose ":include" list
; names this section plus [pubname], [pubname2] and [pubname3].
; NOTE(review): presumably characters used to transliterate foreign names - confirm.
; The section name is spelled "foregin" both here and in its own ":include"
; line; do not rename one without the other.
[foregin]
|
||
:type = prefix
|
||
:line = no
|
||
:tf = 4.0
|
||
:idf = 3.0
|
||
:attr = nr
|
||
:include = foregin,pubname,pubname2,pubname3
|
||
阿克拉加内亚巴尔姆爱兰西伊杰纳布可夫勒特坦芬尼根登都
|
||
伯泰胥俄科索沃森奥瓦茨普蒂塞维大莱德冈墨哥弗库澳哈兹
|
||
乌奇切诺里基延达塔卡雅来波迈蓬什比摩曼乃休合娜迪凯帕
|
||
桑佩蒙博托格泽及希匹印埃努烈累法图喀土腓耶逊宾
|