# (file-viewer metadata: 36 lines, 1.3 KiB, detected as XML)
## tagger training invoked at Sat Oct 08 12:21:50 PDT 2016 with arguments:
model = spanish.tagger
arch = left3words,naacl2003unknowns,allwordshapes(-1,1)
wordFunction =
trainFile = format=TREES,/u/nlp/data/spanish/ancora/ancora.train;format=TREES,/u/nlp/data/spanish/ldc/ldc-DF.train;format=TREES,/u/nlp/data/spanish/ldc/ldc-NW.train
closedClassTags =
closedClassTagThreshold = 40
curWordMinFeatureThresh = 2
debug = true
debugPrefix =
tagSeparator = _
encoding = utf-8
iterations = 100
lang = spanish
learnClosedClassTags = false
minFeatureThresh = 2
openClassTags =
rareWordMinFeatureThresh = 10
rareWordThresh = 5
search = qn
sgml = false
sigmaSquared = 0.0
regL1 = 0.75
tagInside =
tokenize = true
tokenizerFactory =
tokenizerOptions = quotes=ascii
verbose = false
verboseResults = true
veryCommonWordThresh = 250
xmlInput = null
outputFile =
outputFormat = slashTags
outputFormatOptions =
nthreads = 16