|
|||||||||
PREV CLASS NEXT CLASS | FRAMES NO FRAMES | ||||||||
SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD |
java.lang.Object
java.util.Dictionary<K,V>
java.util.Hashtable<java.lang.Object,java.lang.Object>
java.util.Properties
edu.stanford.nlp.tagger.maxent.TaggerConfig
public class TaggerConfig extends java.util.Properties
Reads and stores configuration information for a POS tagger. Implementation note: To add a new parameter: (1) define a default String value, (2) add it to the defaultValues hash, (3) add a line to the constructor, (4) add a getter method, (5) add it to the dump() method, (6) add it to the printGenProps() method, (7) add it to the class javadoc of MaxentTagger.
Nested Class Summary | |
---|---|
static class |
TaggerConfig.Mode
|
Field Summary | |
---|---|
static java.lang.String |
APPROXIMATE
|
static java.lang.String |
ARCH
|
static java.lang.String |
CLOSED_CLASS_THRESHOLD
|
static java.lang.String |
CUR_WORD_MIN_FEATURE_THRESH
|
static java.lang.String |
DEBUG
|
static java.lang.String |
DEFAULT_REG_L1
|
static java.lang.String |
ENCODING
|
static java.lang.String |
ENCODING_PROPERTY
|
static java.lang.String |
INIT_FROM_TREES
|
static java.lang.String |
ITERATIONS
|
static java.lang.String |
LANG
|
static java.lang.String |
LEARN_CLOSED_CLASS
|
static java.lang.String |
MIN_FEATURE_THRESH
|
static java.lang.String |
OCCURING_TAGS_ONLY
|
static java.lang.String |
OUTPUT_FILE
|
static java.lang.String |
OUTPUT_FORMAT
|
static java.lang.String |
OUTPUT_FORMAT_OPTIONS
|
static java.lang.String |
POSSIBLE_TAGS_ONLY
|
static java.lang.String |
RARE_WORD_MIN_FEATURE_THRESH
|
static java.lang.String |
RARE_WORD_THRESH
|
static java.lang.String |
SEARCH
|
static java.lang.String |
SGML
|
static java.lang.String |
SIGMA_SQUARED
|
static java.lang.String |
TAG_INSIDE
|
static java.lang.String |
TAG_SEPARATOR
|
static java.lang.String |
TAG_SEPARATOR_PROPERTY
|
static java.lang.String |
TOKENIZE
|
static java.lang.String |
TOKENIZER_FACTORY
|
static java.lang.String |
TOKENIZER_OPTIONS
|
static java.lang.String |
TREE_NORMALIZER
|
static java.lang.String |
TREE_RANGE
|
static java.lang.String |
TREE_TRANSFORMER
|
static java.lang.String |
VERBOSE
|
static java.lang.String |
VERBOSE_RESULTS
|
static java.lang.String |
VERY_COMMON_WORD_THRESH
|
static java.lang.String |
XML_INPUT
|
Fields inherited from class java.util.Properties |
---|
defaults |
Constructor Summary | |
---|---|
TaggerConfig(java.util.Properties props)
|
|
TaggerConfig(java.lang.String... args)
|
|
TaggerConfig(TaggerConfig old)
Requires a TaggerConfig argument rather than an instance of any superclass, so that we know the argument error checking has already occurred. |
Method Summary | |
---|---|
void |
dump()
|
void |
dump(java.io.PrintStream stream)
|
java.lang.String |
getArch()
|
java.lang.String[] |
getClosedClassTags()
|
int |
getClosedTagThreshold()
|
int |
getCurWordMinFeatureThresh()
|
boolean |
getDebug()
|
java.lang.String |
getDebugPrefix()
|
double |
getDefaultScore()
Returns a default score to be used for each tag that is incompatible with the current word (e.g., the tag CC for the word "apple"). |
static java.lang.String |
getDefaultTagSeparator()
|
java.lang.String |
getEncoding()
|
java.lang.String |
getFile()
|
int |
getIterations()
|
java.lang.String |
getJarModel()
|
java.lang.String |
getLang()
|
boolean |
getLearnClosedClassTags()
|
int |
getMinFeatureThresh()
|
TaggerConfig.Mode |
getMode()
|
java.lang.String |
getModel()
|
java.lang.String[] |
getOpenClassTags()
|
java.lang.String |
getOutputFile()
|
java.lang.String |
getOutputFormat()
|
boolean |
getOutputLemmas()
|
java.lang.String[] |
getOutputOptions()
|
boolean |
getOutputOptionsContains(java.lang.String sought)
|
boolean |
getOutputVerbosity()
|
int |
getRareWordMinFeatureThresh()
|
int |
getRareWordThresh()
|
double |
getRegL1()
|
java.lang.String |
getSearch()
|
java.lang.String |
getSentenceDelimiter()
This returns the sentence delimiter used when tokenizing text using the tokenizer requested in this config. |
boolean |
getSGML()
|
double |
getSigmaSquared()
|
java.lang.String |
getTagInside()
Return a regex of XML elements to tag inside of. |
java.lang.String |
getTagSeparator()
|
boolean |
getTokenize()
|
java.lang.String |
getTokenizerFactory()
|
boolean |
getTokenizerInvertible()
|
java.lang.String |
getTokenizerOptions()
|
boolean |
getVerbose()
|
boolean |
getVerboseResults()
|
int |
getVeryCommonWordThresh()
|
java.lang.String[] |
getXMLInput()
|
boolean |
occuringTagsOnly()
|
boolean |
possibleTagsOnly()
|
static TaggerConfig |
readConfig(java.io.DataInputStream stream)
Read in a TaggerConfig. |
void |
saveConfig(java.io.OutputStream os)
Serialize the TaggerConfig. |
java.lang.String |
toString()
|
boolean |
useStdin()
Returns whether or not we should use stdin for reading when tagging data. |
Methods inherited from class java.util.Properties |
---|
getProperty, getProperty, list, list, load, load, loadFromXML, propertyNames, save, setProperty, store, store, storeToXML, storeToXML, stringPropertyNames |
Methods inherited from class java.util.Hashtable |
---|
clear, clone, contains, containsKey, containsValue, elements, entrySet, equals, get, hashCode, isEmpty, keys, keySet, put, putAll, rehash, remove, size, values |
Methods inherited from class java.lang.Object |
---|
finalize, getClass, notify, notifyAll, wait, wait, wait |
Field Detail |
---|
public static final java.lang.String SEARCH
public static final java.lang.String TAG_SEPARATOR
public static final java.lang.String TOKENIZE
public static final java.lang.String DEBUG
public static final java.lang.String ITERATIONS
public static final java.lang.String ARCH
public static final java.lang.String RARE_WORD_THRESH
public static final java.lang.String MIN_FEATURE_THRESH
public static final java.lang.String CUR_WORD_MIN_FEATURE_THRESH
public static final java.lang.String RARE_WORD_MIN_FEATURE_THRESH
public static final java.lang.String VERY_COMMON_WORD_THRESH
public static final java.lang.String OCCURING_TAGS_ONLY
public static final java.lang.String POSSIBLE_TAGS_ONLY
public static final java.lang.String SIGMA_SQUARED
public static final java.lang.String ENCODING
public static final java.lang.String LEARN_CLOSED_CLASS
public static final java.lang.String CLOSED_CLASS_THRESHOLD
public static final java.lang.String VERBOSE
public static final java.lang.String VERBOSE_RESULTS
public static final java.lang.String SGML
public static final java.lang.String INIT_FROM_TREES
public static final java.lang.String LANG
public static final java.lang.String TOKENIZER_FACTORY
public static final java.lang.String XML_INPUT
public static final java.lang.String TREE_TRANSFORMER
public static final java.lang.String TREE_NORMALIZER
public static final java.lang.String TREE_RANGE
public static final java.lang.String TAG_INSIDE
public static final java.lang.String APPROXIMATE
public static final java.lang.String TOKENIZER_OPTIONS
public static final java.lang.String DEFAULT_REG_L1
public static final java.lang.String OUTPUT_FILE
public static final java.lang.String OUTPUT_FORMAT
public static final java.lang.String OUTPUT_FORMAT_OPTIONS
public static final java.lang.String ENCODING_PROPERTY
public static final java.lang.String TAG_SEPARATOR_PROPERTY
Constructor Detail |
---|
public TaggerConfig(TaggerConfig old)
public TaggerConfig(java.lang.String... args)
public TaggerConfig(java.util.Properties props)
Method Detail |
---|
public java.lang.String getModel()
public java.lang.String getJarModel()
public java.lang.String getFile()
public java.lang.String getOutputFile()
public java.lang.String getOutputFormat()
public java.lang.String[] getOutputOptions()
public boolean getOutputVerbosity()
public boolean getOutputLemmas()
public boolean getOutputOptionsContains(java.lang.String sought)
public java.lang.String getSearch()
public double getSigmaSquared()
public int getIterations()
public int getRareWordThresh()
public int getMinFeatureThresh()
public int getCurWordMinFeatureThresh()
public int getRareWordMinFeatureThresh()
public int getVeryCommonWordThresh()
public boolean occuringTagsOnly()
public boolean possibleTagsOnly()
public java.lang.String getLang()
public java.lang.String[] getOpenClassTags()
public java.lang.String[] getClosedClassTags()
public boolean getLearnClosedClassTags()
public int getClosedTagThreshold()
public java.lang.String getArch()
public boolean getDebug()
public java.lang.String getDebugPrefix()
public java.lang.String getTokenizerFactory()
public static java.lang.String getDefaultTagSeparator()
public final java.lang.String getTagSeparator()
public boolean getTokenize()
public java.lang.String getEncoding()
public double getRegL1()
public java.lang.String[] getXMLInput()
public boolean getVerbose()
public boolean getVerboseResults()
public boolean getSGML()
public java.lang.String getTagInside()
public java.lang.String getTokenizerOptions()
public boolean getTokenizerInvertible()
public double getDefaultScore()
public void dump()
public void dump(java.io.PrintStream stream)
public java.lang.String toString()
Overrides: toString in class java.util.Hashtable<java.lang.Object,java.lang.Object>
public java.lang.String getSentenceDelimiter()
public boolean useStdin()
public TaggerConfig.Mode getMode()
public void saveConfig(java.io.OutputStream os) throws java.io.IOException
os
- Where to write this TaggerConfig
java.io.IOException
- If any IO problems occur
public static TaggerConfig readConfig(java.io.DataInputStream stream) throws java.io.IOException, java.lang.ClassNotFoundException
stream
- Where to read from
java.io.IOException
- If an I/O error occurs
java.lang.ClassNotFoundException
- If a required class cannot be found
|
|||||||||
PREV CLASS NEXT CLASS | FRAMES NO FRAMES | ||||||||
SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD |