CofeehousePy/services/corenlp/scripts/pos-tagger/chinese-distsim.tagger.props

## tagger training invoked at Fri Feb 14 01:19:49 PST 2014 with arguments:
                   model = chinese-distsim.tagger
                    arch = generic,suffix(4),prefix(4),unicodeshapes(-1,1),unicodeshapeconjunction(-1,1),words(-2,-2),words(2,2),distsim(/u/nlp/data/chinese/distsim/xin_cmn_2000-2010.ldc.seg.utf8.1M.random-c1000,-1,1),distsimconjunction(/u/nlp/data/chinese/distsim/xin_cmn_2000-2010.ldc.seg.utf8.1M.random-c1000,-1,1)
            wordFunction = edu.stanford.nlp.util.UTF8EquivalenceFunction
               trainFile = format=TREES,/u/nlp/data/chinese/ctb7/train.mrg
         closedClassTags = 
 closedClassTagThreshold = 40
 curWordMinFeatureThresh = 1
                   debug = false
             debugPrefix = 
            tagSeparator = #
                encoding = utf-8
              iterations = 100
                    lang = chinese
    learnClosedClassTags = false
        minFeatureThresh = 3
           openClassTags = 
rareWordMinFeatureThresh = 3
          rareWordThresh = 20
                  search = owlqn
                    sgml = false
            sigmaSquared = 0.0
                   regL1 = 0.75
               tagInside = 
                tokenize = false
        tokenizerFactory = 
        tokenizerOptions = 
                 verbose = false
          verboseResults = true
    veryCommonWordThresh = 250
                xmlInput = null
              outputFile = 
            outputFormat = slashTags
     outputFormatOptions = 
                nthreads = 1
Added CoreNLP 2021-01-09 03:43:33 +01:00			`## tagger training invoked at Fri Feb 14 01:19:49 PST 2014 with arguments:`
			`model = chinese-distsim.tagger`
			`arch = generic,suffix(4),prefix(4),unicodeshapes(-1,1),unicodeshapeconjunction(-1,1),words(-2,-2),words(2,2),distsim(/u/nlp/data/chinese/distsim/xin_cmn_2000-2010.ldc.seg.utf8.1M.random-c1000,-1,1),distsimconjunction(/u/nlp/data/chinese/distsim/xin_cmn_2000-2010.ldc.seg.utf8.1M.random-c1000,-1,1)`
			`wordFunction = edu.stanford.nlp.util.UTF8EquivalenceFunction`
			`trainFile = format=TREES,/u/nlp/data/chinese/ctb7/train.mrg`
			`closedClassTags =`
			`closedClassTagThreshold = 40`
			`curWordMinFeatureThresh = 1`
			`debug = false`
			`debugPrefix =`
			`tagSeparator = #`
			`encoding = utf-8`
			`iterations = 100`
			`lang = chinese`
			`learnClosedClassTags = false`
			`minFeatureThresh = 3`
			`openClassTags =`
			`rareWordMinFeatureThresh = 3`
			`rareWordThresh = 20`
			`search = owlqn`
			`sgml = false`
			`sigmaSquared = 0.0`
			`regL1 = 0.75`
			`tagInside =`
			`tokenize = false`
			`tokenizerFactory =`
			`tokenizerOptions =`
			`verbose = false`
			`verboseResults = true`
			`veryCommonWordThresh = 250`
			`xmlInput = null`
			`outputFile =`
			`outputFormat = slashTags`
			`outputFormatOptions =`
			`nthreads = 1`