-
Notifications
You must be signed in to change notification settings - Fork 3
/
dicrc
36 lines (30 loc) · 1.03 KB
/
dicrc
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
; List of features.
; These are the feature columns that the %f[N] placeholders in the
; format strings of this file refer to.
; f[0]: pos1
; f[1]: pos2
; f[2]: pos3
; f[3]: pos4
; f[4]: pinyin pronunciation
; f[5]: traditional Chinese character form
; f[6]: simplified Chinese character form
; f[7]: definition
; NOTE(review): presumably the scaling factor MeCab applies when converting
; trained weights into integer costs -- confirm against the MeCab docs.
cost-factor = 700
; Feature string used for the sentence-boundary (BOS/EOS) nodes.
; NOTE(review): this string carries more "*" placeholders than the eight
; feature columns listed above -- confirm the extra columns are intentional.
bos-feature = BOS/EOS,*,*,*,*,*,*,*,*,*,*,*,*,*,*,*,*
; eval-size sets the criterion for judging an analysis result correct when the
; target is a known word.
; Unlike Japanese, Chinese has no conjugation, so only the first four
; elements (pos1, pos2, pos3, pos4) are evaluated. The remaining elements,
; such as pronunciation information, are ignored.
eval-size = 4
; NOTE(review): presumably the same criterion applied to unknown words --
; confirm against the MeCab docs.
unk-eval-size = 4
; NOTE(review): presumably the character encoding of the dictionary
; configuration files -- confirm against the MeCab docs.
config-charset = utf8
; Default output format; "cedict" refers to the *-format-cedict entries below.
output-format-type = cedict
; Known word: %m, a tab, then all eight features f[0]..f[7] separated by
; commas, followed by a newline. (%m is the token's surface form per the
; MeCab output-format docs.)
node-format-cedict = %m\t%f[0],%f[1],%f[2],%f[3],%f[4],%f[5],%f[6],%f[7]\n
; Unknown word: same layout, but only f[0]..f[5] are emitted.
; NOTE(review): this gives six feature columns versus eight for known words --
; confirm that downstream consumers expect the shorter line.
unk-format-cedict = %m\t%f[0],%f[1],%f[2],%f[3],%f[4],%f[5]\n
; Nothing is emitted at the beginning of a sentence.
bos-format-cedict =
; Each sentence is terminated by a literal "EOS" line.
eos-format-cedict = EOS\n
; "traditional" output format: for each token emit only f[5] (the traditional
; Chinese character form), with no separator between tokens.
node-format-traditional = %f[5]
; Unknown words also emit f[5].
; NOTE(review): confirm that unknown-word entries carry a meaningful value in
; f[5]; otherwise the surface form (%m) may be what is wanted here.
unk-format-traditional = %f[5]
; Nothing is emitted at the beginning of a sentence.
bos-format-traditional =
; A newline ends each sentence.
eos-format-traditional = \n
; "simplified" output format: for each token emit only f[6] (the simplified
; Chinese character form), with no separator between tokens.
node-format-simplified = %f[6]
; Unknown words also emit f[6].
; NOTE(review): unk-format-cedict in this file only goes up to f[5]; confirm
; that unknown-word entries actually define an f[6] column, otherwise the
; surface form (%m) may be what is wanted here.
unk-format-simplified = %f[6]
; Nothing is emitted at the beginning of a sentence.
bos-format-simplified =
; A newline ends each sentence.
eos-format-simplified = \n