annotate src/classifiers/english.all.3class.distsim.prop @ 6:50aeb96a8ee9

bugfix: person ml
author jdamerow
date Thu, 01 Nov 2012 13:23:25 -0700
parents 036535fcd179
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
036535fcd179 anteater
jdamerow
parents:
diff changeset
1 trainFile = /u/nlp/data/ner/goodClassifiers/data/all.3class.train
036535fcd179 anteater
jdamerow
parents:
diff changeset
2 testFile = /u/nlp/data/ner/column_data/conll.testa
036535fcd179 anteater
jdamerow
parents:
diff changeset
3 serializeTo = english.all.3class.distsim.crf.ser.gz
036535fcd179 anteater
jdamerow
parents:
diff changeset
4
036535fcd179 anteater
jdamerow
parents:
diff changeset
5 type = crf
036535fcd179 anteater
jdamerow
parents:
diff changeset
6
036535fcd179 anteater
jdamerow
parents:
diff changeset
7 #distSimLexicon = /u/nlp/data/pos_tags_are_useless/englishGigaword.200.pruned
036535fcd179 anteater
jdamerow
parents:
diff changeset
8 #distSimLexicon = /u/nlp/data/pos_tags_are_useless/egw.bnc.200
036535fcd179 anteater
jdamerow
parents:
diff changeset
9 distSimLexicon = /u/nlp/data/pos_tags_are_useless/egw4-reut.512.clusters
036535fcd179 anteater
jdamerow
parents:
diff changeset
10 useDistSim = true
036535fcd179 anteater
jdamerow
parents:
diff changeset
11
036535fcd179 anteater
jdamerow
parents:
diff changeset
12 map = word=0,answer=1
036535fcd179 anteater
jdamerow
parents:
diff changeset
13
036535fcd179 anteater
jdamerow
parents:
diff changeset
14 saveFeatureIndexToDisk = true
036535fcd179 anteater
jdamerow
parents:
diff changeset
15
036535fcd179 anteater
jdamerow
parents:
diff changeset
16 useClassFeature=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
17 useWord=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
18 #useWordPairs=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
19 useNGrams=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
20 noMidNGrams=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
21 maxNGramLeng=6
036535fcd179 anteater
jdamerow
parents:
diff changeset
22 usePrev=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
23 useNext=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
24 #useTags=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
25 #useWordTag=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
26 useLongSequences=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
27 useSequences=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
28 usePrevSequences=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
29 maxLeft=1
036535fcd179 anteater
jdamerow
parents:
diff changeset
30 useTypeSeqs=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
31 useTypeSeqs2=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
32 useTypeySequences=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
33 useOccurrencePatterns=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
34 useLastRealWord=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
35 useNextRealWord=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
36 #useReverse=false
036535fcd179 anteater
jdamerow
parents:
diff changeset
37 normalize=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
38 # normalizeTimex=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
39 wordShape=chris2useLC
036535fcd179 anteater
jdamerow
parents:
diff changeset
40 useDisjunctive=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
41 disjunctionWidth=5
036535fcd179 anteater
jdamerow
parents:
diff changeset
42 #useDisjunctiveShapeInteraction=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
43
036535fcd179 anteater
jdamerow
parents:
diff changeset
44 readerAndWriter=edu.stanford.nlp.sequences.ColumnDocumentReaderAndWriter
036535fcd179 anteater
jdamerow
parents:
diff changeset
45
036535fcd179 anteater
jdamerow
parents:
diff changeset
46 useObservedSequencesOnly=true
036535fcd179 anteater
jdamerow
parents:
diff changeset
47
036535fcd179 anteater
jdamerow
parents:
diff changeset
48 useQN = true
036535fcd179 anteater
jdamerow
parents:
diff changeset
49 QNsize = 25
036535fcd179 anteater
jdamerow
parents:
diff changeset
50
036535fcd179 anteater
jdamerow
parents:
diff changeset
51 # makes it go faster: features whose weights differ by less than this threshold are dropped, giving a smaller model
036535fcd179 anteater
jdamerow
parents:
diff changeset
52 featureDiffThresh=0.05