-
Notifications
You must be signed in to change notification settings - Fork 0
/
matxin-spa.spa.cfg.in
68 lines (57 loc) · 2.07 KB
/
matxin-spa.spa.cfg.in
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
##
#### default configuration file for Spanish analyzer
##
#### General options
Lang=es
Locale=default
# Whether to treat each newline as a sentence end (yes/no)
AlwaysFlush=no
#### Tokenizer options
TokenizerFile=@prefix@/share/matxin/matxin-spa/freeling/tokenizer.dat
#### Splitter options
SplitterFile=@prefix@/share/matxin/matxin-spa/freeling/splitter.dat
#### Morphological analysis options
AffixAnalysis=yes
MultiwordsDetection=yes
NumbersDetection=yes
PunctuationDetection=yes
DatesDetection=yes
QuantitiesDetection=yes
DictionarySearch=yes
ProbabilityAssignment=yes
OrthographicCorrection=no
DecimalPoint=,
ThousandPoint=.
LocutionsFile=@prefix@/share/matxin/matxin-spa/freeling/locucions.dat
QuantitiesFile=@prefix@/share/matxin/matxin-spa/freeling/quantities.dat
AffixFile=@prefix@/share/matxin/matxin-spa/freeling/afixos.dat
ProbabilityFile=@prefix@/share/matxin/matxin-spa/freeling/probabilitats.dat
DictionaryFile=@prefix@/share/matxin/matxin-spa/freeling/dicc.src
PunctuationFile=@prefix@/share/matxin/matxin-spa/freeling/common/punct.dat
ProbabilityThreshold=0.001
# NER options
NERecognition=yes
#NPDataFile=@prefix@/share/matxin/matxin-spa/freeling/np.dat
## --- The NPDataFile line below selects the richer NE recognizer
## --- (higher accuracy, lower speed). To use the faster, less accurate
## --- one instead, comment it out and uncomment the NPDataFile line above.
NPDataFile=@prefix@/share/matxin/matxin-spa/freeling/nerc/ner/ner-ab-rich.dat
#Spelling Corrector config file
CorrectorFile=@prefix@/share/matxin/matxin-spa/freeling/corrector/corrector.dat
## NEC options
NEClassification=yes
NECFile=@prefix@/share/matxin/matxin-spa/freeling/nerc/nec/nec-ab-rich.dat
#### Tagger options
#Tagger=hmm
Tagger=relax
TaggerHMMFile=@prefix@/share/matxin/matxin-spa/freeling/tagger.dat
TaggerRelaxFile=@prefix@/share/matxin/matxin-spa/freeling/constr_gram.dat
TaggerRelaxMaxIter=500
TaggerRelaxScaleFactor=670.0
TaggerRelaxEpsilon=0.001
#TaggerRelaxEpsilon=0.00001
TaggerRetokenize=yes
TaggerForceSelect=retok
#### Parser options
GrammarFile=@prefix@/share/matxin/matxin-spa/freeling/chunker/grammar-chunk.dat
#### Dependency parser options
DepTxalaFile=@prefix@/share/matxin/matxin-spa/freeling/dep/dependences.dat