mirror of
https://gitee.com/lionsoul/friso.git
synced 2024-12-02 03:07:52 +08:00
61 lines
1.5 KiB
INI
61 lines
1.5 KiB
INI
#friso configuration file.
|
|
# do not change the name of the left key.
|
|
# @email chenxin619315@gmail.com
|
|
# @date 2012-12-20
|
|
#
|
|
|
|
#charset, only UTF8 and GBK are supported.
|
|
#set it with UTF8(0) or GBK(1)
|
|
friso.charset = 0
|
|
|
|
#lexicon directory absolute path.
|
|
# the value must end with '/'
|
|
#this will tell friso how to find friso.lex.ini configuration file and all the lexicon files.
|
|
friso.lex_dir = /c/products/friso/dict/UTF-8/
|
|
|
|
#the maximum matching length.
|
|
friso.max_len = 5
|
|
|
|
#1 to enable chinese name recognition.
|
|
# and 0 to disable it.
|
|
friso.r_name = 1
|
|
|
|
#the maximum length for the cjk words in a
|
|
# chinese and english mixed word.
|
|
friso.mix_len = 2
|
|
|
|
#the maximum length for the chinese last name adorn (adornment word).
|
|
friso.lna_len = 1
|
|
|
|
#append the synonyms words
|
|
friso.add_syn = 1
|
|
|
|
#clear the stopwords or not (1 to open it and 0 to close it)
|
|
#@date 2013-06-13
|
|
friso.clr_stw = 0
|
|
|
|
#keep the unrecognized words or not (1 to open it and 0 to close it)
|
|
#@date 2013-06-13
|
|
friso.keep_urec = 0
|
|
|
|
#use sphinx output style like 'admire|love|enjoy einsten'
|
|
#@date 2013-10-25
|
|
friso.spx_out = 0
|
|
|
|
#start the secondary segmentation for complex english token.
|
|
friso.en_sseg = 1
|
|
|
|
#min length of the secondary segmentation token. (better larger than 1)
|
|
friso.st_minl = 2
|
|
|
|
#punctuation characters kept by default inside an english token.
|
|
friso.kpuncs = @%.#&+
|
|
|
|
#the threshold value for a char not a part of a chinese name.
|
|
friso.nthreshold = 2000000
|
|
|
|
#default mode for friso.
|
|
# 1 : simple mode - simple maximum matching algorithm.
|
|
# 2 : complex mode - four rules of mmseg algorithm.
|
|
friso.mode = 2
|