mirror of
https://gitee.com/ShopeX/OMS
synced 2026-04-13 01:05:42 +08:00
291 lines
4.3 KiB
INI
291 lines
4.3 KiB
INI
;
; Automatic recognition rules (UTF-8)
; $Id$
;
; Special words: terms containing punctuation, listed verbatim, one per line.
; NOTE(review): presumably these are kept as single tokens - confirm against
; the rule loader.
;

[special]
C++
C#
R&B
P&G
J++
J#
UTF-8
PS/2

;
; nostats: common English function words, one per line.
; NOTE(review): presumably these words are left out of statistics - confirm
; against the consumer of this section.
;
[nostats]
about
all
also
an
and
any
are
as
at
be
but
by
both
can
for
from
have
here
if
in
is
it
no
not
of
on
or
our
out
that
the
this
to
up
us

;
; Part-of-speech grammar rule table.
; Each row has the form "attr1 + attr2 = ratio"; "(1)" marks one side of the
; pair and "*" stands in place of an attribute.
; NOTE(review): the exact meaning of "(1)" and of the ratio value is not
; visible in this file - confirm against the rule loader.
; Each attribute pair is listed once.
;
[attrs]
; c is the conjunction attribute
n + f(1) = 300
n + m(1) = 500
n(1) + v = 100
n + v(1) = 10
r + n(1) = 1000
r(1) + n = 100
d(1) + r = 100
d(1) + v = 100
v(1) + r = 100
v + f(1) = 30
v(1) + m = 100
v(1) + n = 5
a + u(1) = 5
v + n(1) = 5
c(1) + * = 50
* + c(1) = 50

;
; Name stop-character list.
; Referenced by the ":exclude" lists of the name and place sections.
; NOTE(review): with ":line = no" each row appears to be read as a run of
; single-character entries - confirm against the rule loader.
;
[noname]
:line = no
給的說對在和是被最所那這有將
你會與他為不沒很了啊哦呵把去

;
; Double-byte symbols.
; Referenced by the ":exclude" lists of the name and place sections.
; The "|" inside the first row is a real entry and must stay.
;
[symbol]
:type = none
:line = no
`-=[]、‘;/。,|?》《:“{}+—)(*…%¥#·!~
’”〕〈〉「」『』〖〗【】<>

;
; Characters shared by surnames and foreign names.
; NOTE(review): ":znum" looks like a min,max character count and ":tf" /
; ":idf" like weights given to a matched word - confirm against the rule
; loader.
;
[pubname]
:type = prefix
:line = no
:exclude = noname,symbol,alpha,chnum2
:znum = 1,2
:tf = 5.0
:idf = 3.5
:attr = nr
艾安貝卜戴費福蓋戈古赫華霍吉賈金柯賴勞雷黎利林盧
魯倫羅洛馬麥米莫穆齊喬冉薩沙史斯溫謝尤詹諸

; Name-prefix characters that are also named in the ":include" list of
; [chnum4]. Same attributes as [pubname] except that no ":znum" is set.
[pubname2]
:type = prefix
:line = no
:exclude = noname,symbol,alpha,chnum2
:tf = 5.0
:idf = 3.5
:attr = nr
伍陸

; Name-prefix characters that are also named in the ":include" lists of the
; [chnum*] sections. Same attributes as [pubname2].
[pubname3]
:type = prefix
:line = no
:exclude = noname,symbol,alpha,chnum2
:tf = 5.0
:idf = 3.5
:attr = nr
萬章

;
; Single-character surnames.
; Every character should appear only once in the rows below.
; NOTE(review): some characters (樑, 遊, 鬱, 樸, 鐘) look like over-converted
; forms of the surnames 梁, 游, 郁, 朴, 鍾 - confirm against the upstream
; simplified-Chinese list before changing them.
;
[surname]
:type = prefix
:line = no
:exclude = noname,symbol,alpha,chnum2
:tf = 5.0
:idf = 3.5
:attr = nr
:znum = 1,2

敖白班包寶保鮑畢邊卞柏蔡曹岑柴昌常車陳成程遲池褚
楚儲淳崔刀鄧狄刁丁董竇杜端段樊范方房斐豐封馮鳳伏
傅甘高耿龔宮勾苟辜谷顧官關管桂郭韓杭郝禾何賀衡洪
侯胡花黃稽姬紀季簡翦姜江蔣焦晉靳荊居康空孔匡鄺況
藍郎朗樂冷李理厲勵連廉練良樑廖凌劉柳隆龍樓婁呂路
駱麻滿茅毛梅孟苗繆閔明牟倪聶牛鈕農潘龐裴彭皮樸平
蒲溥浦戚祁錢強秦丘邱仇裘屈瞿權饒任榮容阮瑞芮賽單
商邵佘申沈盛石壽舒宋蘇孫邰譚談湯唐陶滕田佟仝屠塗
汪王危韋魏衛蔚聞翁巫鄔武吳奚習夏鮮席冼項蕭解辛邢
幸熊徐許宣薛荀顏閻言嚴彥晏燕楊陽姚葉蟻易殷銀尹應
英遊于於魚虞俞余禹喻鬱尉袁岳雲臧曾查翟湛張趙甄鄭
鐘周朱竺祝莊卓宗鄒祖左肖

;
; Compound (two-character) surnames, one per line (":line = yes").
; NOTE(review): 澹台 may also be written 澹臺 in traditional text - confirm
; which form the input uses.
;
[surname2]
:type = prefix
:line = yes
:exclude = noname,symbol,alpha,chnum2
:tf = 5.0
:idf = 3.5
:attr = nr
:znum = 1,2
東郭
公孫
皇甫
慕容
歐陽
單于
司空
司馬
司徒
澹台
諸葛

;
; Place names: single-character suffixes (":type = suffix").
;
[areaname]
:type = suffix
:znum = 2
:exclude = noname,symbol,alpha,chnum2
:tf = 4.5
:idf = 3.0
:attr = ns
:line = no

縣市鎮村鄉區

;
; Place names: two-character suffixes, one per line (":line = yes").
;
[areaname2]
:type = suffix
:znum = 2
:exclude = noname,symbol,alpha,chnum2
:tf = 4.5
:idf = 3.0
:attr = ns
:line = yes
東路
西路
支路
街道
南路
北路

; Characters named in the ":include" lists of the [chnum*] sections.
; NOTE(review): 萬 is also listed in [pubname3]; confirm which section is
; meant to own it.
[munit]
:type = none
:line = no
萬億零年點分秒回節名個多屆次集

; The digit zero.
; NOTE(review): ":include" presumably names the sections whose entries may
; continue a match started here - confirm against the rule loader.
[chnum0]
:type = prefix
:line = no
:tf = 2.5
:idf = 1.0
:attr = mt
:include = chnum2,chnum3,munit,pubname3
0

; Everyday Chinese numerals (one to nine, ten, hundred, thousand).
[chnum1]
:type = prefix
:include = chnum0,chnum1,munit,pubname3
:tf = 3.0
:idf = 1.0
:attr = mt
:line = no
一二三四五六七八九十百千

; The digits one to nine. This section is also named in the ":exclude" lists
; of the name and place sections.
[chnum2]
:type = prefix
:line = no
:tf = 3.0
:idf = 1.0
:attr = mt
:include = chnum0,chnum2,chnum3,munit,pubname3
123456789

; The dot character, named in the ":include" lists of [chnum0] and [chnum2].
[chnum3]
:type = none
:line = no
.

; Formal (financial) Chinese numerals. The forms for five and six (伍陸) are
; reached through [pubname2] in the ":include" list.
; Three is written in its formal form 叁 here; the everyday 三 belongs to
; [chnum1] and must not be repeated in this row.
[chnum4]
:type = prefix
:line = no
:tf = 3.0
:idf = 1.0
:attr = mt
:include = chnum4,munit,pubname2,pubname3

壹貳叁肆柒捌玖拾佰仟

; Prefix characters 第 and 每; the ":include" list names the numeral sections
; [chnum1] and [chnum2] plus [munit] and [pubname3].
[chnum5]
:type = prefix
:line = no
:tf = 3.5
:idf = 2.0
:attr = nz
:include = chnum1,munit,pubname3,chnum2

第每

; Latin letters (lower and upper case) plus the apostrophe. The section lists
; itself in ":include". It is also named in the ":exclude" lists of the name
; and place sections.
[alpha]
:type = prefix
:line = no
:tf = 2.5
:idf = 1.0
:attr = en
:include = alpha

abcdefghijklmnopqrstuvwxyz
ABCDEFGHIJKLMNOPQRSTUVWXYZ'

[foregin]
|
||
:type = prefix
|
||
:line = no
|
||
:tf = 4.0
|
||
:idf = 3.0
|
||
:attr = nr
|
||
:include = foregin,pubname,pubname2,pubname3
|
||
阿克拉加內亞巴爾姆愛蘭西伊傑納布可夫勒特坦芬尼根登都
|
||
伯泰胥俄科索沃森奧瓦茨普蒂塞維大萊德岡墨哥弗庫澳哈茲
|
||
烏奇切諾裡基延達塔卡雅來波邁蓬什比摩曼乃休合娜迪凱帕
|
||
桑佩蒙博托格澤及希匹印埃努烈累法圖喀土腓耶遜賓
|