# CofeehousePy/services/corenlp/scripts/pos-tagger/chinese-nodistsim.tagger.props

## tagger training invoked at Fri Feb 14 02:20:03 PST 2014 with arguments:
                   model = chinese-nodistsim.tagger
                    arch = generic,suffix(4),prefix(4),unicodeshapes(-1,1),unicodeshapeconjunction(-1,1),words(-2,-2),words(2,2)
            wordFunction = edu.stanford.nlp.util.UTF8EquivalenceFunction
               trainFile = format=TREES,/u/nlp/data/chinese/ctb7/train.mrg
         closedClassTags = 
 closedClassTagThreshold = 40
 curWordMinFeatureThresh = 1
                   debug = false
             debugPrefix = 
            tagSeparator = #
                encoding = utf-8
              iterations = 100
                    lang = chinese
    learnClosedClassTags = false
        minFeatureThresh = 3
           openClassTags = 
rareWordMinFeatureThresh = 3
          rareWordThresh = 20
                  search = owlqn
                    sgml = false
            sigmaSquared = 0.0
                   regL1 = 0.75
               tagInside = 
                tokenize = false
        tokenizerFactory = 
        tokenizerOptions = 
                 verbose = false
          verboseResults = true
    veryCommonWordThresh = 250
                xmlInput = null
              outputFile = 
            outputFormat = slashTags
     outputFormatOptions = 
                nthreads = 1
# Added NSFW classification 2021-01-14 08:07:24 +01:00
			`## tagger training invoked at Fri Feb 14 02:20:03 PST 2014 with arguments:`
			`model = chinese-nodistsim.tagger`
			`arch = generic,suffix(4),prefix(4),unicodeshapes(-1,1),unicodeshapeconjunction(-1,1),words(-2,-2),words(2,2)`
			`wordFunction = edu.stanford.nlp.util.UTF8EquivalenceFunction`
			`trainFile = format=TREES,/u/nlp/data/chinese/ctb7/train.mrg`
			`closedClassTags =`
			`closedClassTagThreshold = 40`
			`curWordMinFeatureThresh = 1`
			`debug = false`
			`debugPrefix =`
			`tagSeparator = #`
			`encoding = utf-8`
			`iterations = 100`
			`lang = chinese`
			`learnClosedClassTags = false`
			`minFeatureThresh = 3`
			`openClassTags =`
			`rareWordMinFeatureThresh = 3`
			`rareWordThresh = 20`
			`search = owlqn`
			`sgml = false`
			`sigmaSquared = 0.0`
			`regL1 = 0.75`
			`tagInside =`
			`tokenize = false`
			`tokenizerFactory =`
			`tokenizerOptions =`
			`verbose = false`
			`verboseResults = true`
			`veryCommonWordThresh = 250`
			`xmlInput = null`
			`outputFile =`
			`outputFormat = slashTags`
			`outputFormatOptions =`
			`nthreads = 1`