Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | KEY_VAL_DELIM | ":" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | LEMMA_MARK | "\|\|\|" |
public static final java.lang.String | MORPHO_MARK | "~#" |
public static final java.lang.String | NO_ANALYSIS | "XXX" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | defaultEncoding | "utf-8" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | TAG_SEPARATOR | "/" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | TAG_LABEL | 2 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | EMPTY_STRING | "\*t\*" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | LEMMA_LABEL | 1 |
public static final int | TAG_LABEL | 2 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | CASE_INSENSITIVE | 2 |
public static final int | NORMALIZE | 4 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | GROUP_AFTER_MATCH | -2147483647 |
public static final int | GROUP_BEFORE_MATCH | -2147483648 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | COMPOSITE_RULE_TYPE | "composite" |
public static final java.lang.String | FILTER_RULE_TYPE | "filter" |
public static final java.lang.String | TEXT_PATTERN_RULE_TYPE | "text" |
public static final java.lang.String | TOKEN_PATTERN_RULE_TYPE | "tokens" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | BACKREF | 12 |
public static final int | DEFAULT | 0 |
public static final int | EOF | 0 |
public static final int | IDENTIFIER | 7 |
public static final int | INT | 14 |
public static final int | LONGINT | 15 |
public static final int | NONNEGINT | 13 |
public static final int | NUMCMP | 19 |
public static final int | REAL | 16 |
public static final int | REGEX | 17 |
public static final int | REGEXGROUP | 9 |
public static final int | REGEXMRGROUP | 11 |
public static final int | REGEXMRVAR | 10 |
public static final int | REGEXVAR | 8 |
public static final int | STR | 18 |
public static final int | STRREGEXCMP | 20 |
public static final int | STRSIMPLE | 21 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | TYPE_ANNOTATION_KEY | "ANNOKEY" |
public static final java.lang.String | TYPE_BOOLEAN | "BOOLEAN" |
public static final java.lang.String | TYPE_CLASS | "CLASS" |
public static final java.lang.String | TYPE_COMPOSITE | "COMPOSITE" |
public static final java.lang.String | TYPE_FUNCTION | "FUNCTION" |
public static final java.lang.String | TYPE_LIST | "LIST" |
public static final java.lang.String | TYPE_NUMBER | "NUMBER" |
public static final java.lang.String | TYPE_REGEX | "REGEX" |
public static final java.lang.String | TYPE_REGEXMATCHVAR | "REGEXMATCHVAR" |
public static final java.lang.String | TYPE_SET | "SET" |
public static final java.lang.String | TYPE_STRING | "STRING" |
public static final java.lang.String | TYPE_STRING_REGEX | "STRING_REGEX" |
public static final java.lang.String | TYPE_TOKEN_REGEX | "TOKEN_REGEX" |
public static final java.lang.String | TYPE_TOKENS | "TOKENS" |
public static final java.lang.String | TYPE_VAR | "VAR" |
public static final java.lang.String | VAR_SELF | "_" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final boolean | DEBUG_LEXICON | false |
protected static final boolean | DEBUG_LEXICON_SCORE | false |
protected static final short | nullTag | -1 |
protected static final int | nullWord | -1 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final boolean | DEFAULT_USE_GOOD_TURNING_UNKNOWN_WORD_MODEL | false |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | ANY_DISTANCE_INT | -1 |
public static final java.lang.String | LEFT | "left" |
public static final java.lang.String | RIGHT | "right" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | ANY | ".*." |
public static final int | ANY_TAG_INT | -1 |
public static final int | ANY_WORD_INT | -1 |
public static final java.lang.String | STOP | "STOP" |
public static final int | STOP_TAG_INT | -2 |
public static final int | STOP_WORD_INT | -2 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | BOUNDARY | ".$." |
public static final java.lang.String | BOUNDARY_TAG | ".$$." |
public static final java.lang.String | UNKNOWN_WORD | "UNK" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final double | MIN_PROBABILITY | 1.0E-40 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | DEFAULT_WORD_VECTOR_FILE | "/scr/nlp/deeplearning/datasets/turian/embeddings-scaled.EMBEDDING_SIZE=25.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final double | SUPPCUTOFF | 100.0 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final boolean | DO_TAGS | true |
public static final double | SUPPCUTOFF | 100.0 |
Modifier and Type | Constant Field | Value |
---|---|---|
public final boolean | exhaustiveTest | false |
public final boolean | pcfgThreshold | false |
public final double | pcfgThresholdValue | -2.0 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | DEFAULT_BATCH_SIZE | 25 |
public static final double | DEFAULT_DELTA_MARGIN | 0.1 |
public static final int | DEFAULT_K_BEST | 100 |
public static final double | DEFAULT_LEARNING_RATE | 0.1 |
public static final int | DEFAULT_QN_ITERATIONS_PER_BATCH | 1 |
public static final double | DEFAULT_REGCOST | 1.0E-4 |
public static final double | DEFAULT_SCALING_FOR_INIT | 0.5 |
public static final int | DEFAULT_STALLED_ITERATION_LIMIT | 12 |
public static final int | DEFAULT_TRAINING_ITERATIONS | 40 |
public static final java.lang.String | DEFAULT_UNK_WORD | "\*UNK\*" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final short | nullTag | -1 |
public static final int | nullWord | -1 |
public static final java.lang.String | unknown | "UNK" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | STANFORD_CLEAN_XML | "cleanxml" |
public static final java.lang.String | STANFORD_DETERMINISTIC_COREF | "dcoref" |
public static final java.lang.String | STANFORD_GENDER | "gender" |
public static final java.lang.String | STANFORD_LEMMA | "lemma" |
public static final java.lang.String | STANFORD_NER | "ner" |
public static final java.lang.String | STANFORD_PARSE | "parse" |
public static final java.lang.String | STANFORD_POS | "pos" |
public static final java.lang.String | STANFORD_REGEXNER | "regexner" |
public static final java.lang.String | STANFORD_RELATION | "relation" |
public static final java.lang.String | STANFORD_SENTIMENT | "sentiment" |
public static final java.lang.String | STANFORD_SSPLIT | "ssplit" |
public static final java.lang.String | STANFORD_TOKENIZE | "tokenize" |
public static final java.lang.String | STANFORD_TRUECASE | "truecase" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | DONT_CAPITALIZE_TIMEX | 1 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | NOWORDSHAPE | -1 |
public static final int | WORDSHAPECHINESE | 14 |
public static final int | WORDSHAPECHRIS1 | 1 |
public static final int | WORDSHAPECHRIS2 | 8 |
public static final int | WORDSHAPECHRIS2USELC | 9 |
public static final int | WORDSHAPECHRIS3 | 10 |
public static final int | WORDSHAPECHRIS3USELC | 11 |
public static final int | WORDSHAPECHRIS4 | 12 |
public static final int | WORDSHAPECLUSTER1 | 15 |
public static final int | WORDSHAPEDAN1 | 0 |
public static final int | WORDSHAPEDAN2 | 2 |
public static final int | WORDSHAPEDAN2BIO | 4 |
public static final int | WORDSHAPEDAN2BIOUSELC | 5 |
public static final int | WORDSHAPEDAN2USELC | 3 |
public static final int | WORDSHAPEDIGITS | 13 |
public static final int | WORDSHAPEJENNY1 | 6 |
public static final int | WORDSHAPEJENNY1USELC | 7 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | DEFAULT_BOUNDARY_REGEX | "\\.\|[!?]+" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | DEFAULT_BACKGROUND_SYMBOL | "O" |
public static final java.lang.String | DEFAULT_PLAIN_TEXT_READER | "edu.stanford.nlp.sequences.PlainTextDocumentReaderAndWriter" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | EOS_TAG | ".$$." |
public static final java.lang.String | EOS_WORD | ".$." |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | ENCODING | "encoding" |
public static final java.lang.String | FORMAT | "format" |
public static final java.lang.String | TAG_COLUMN | "tagColumn" |
public static final java.lang.String | TAG_SEPARATOR | "tagSeparator" |
public static final java.lang.String | TREE_FILTER | "treeFilter" |
public static final java.lang.String | TREE_NORMALIZER | "treeNormalizer" |
public static final java.lang.String | TREE_RANGE | "treeRange" |
public static final java.lang.String | TREE_READER | "trf" |
public static final java.lang.String | TREE_TRANSFORMER | "treeTransformer" |
public static final java.lang.String | WORD_COLUMN | "wordColumn" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | BASE_TAGGER_HOME | "$NLP_DATA_HOME/data/pos-tagger/distrib" |
public static final java.lang.String | DEFAULT_DISTRIBUTION_PATH | "models/english-left3words-distsim.tagger" |
public static final java.lang.String | DEFAULT_JAR_PATH | "edu/stanford/nlp/models/pos-tagger/english-left3words/english-left3words-distsim.tagger" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | APPROXIMATE | "-1.0" |
public static final java.lang.String | ARCH | "" |
public static final java.lang.String | CLOSED_CLASS_THRESHOLD | "40" |
public static final java.lang.String | CUR_WORD_MIN_FEATURE_THRESH | "2" |
public static final java.lang.String | DEBUG | "false" |
public static final java.lang.String | DEFAULT_REG_L1 | "1.0" |
public static final java.lang.String | ENCODING | "UTF-8" |
public static final java.lang.String | ENCODING_PROPERTY | "encoding" |
public static final java.lang.String | ITERATIONS | "100" |
public static final java.lang.String | LANG | "" |
public static final java.lang.String | LEARN_CLOSED_CLASS | "false" |
public static final java.lang.String | MIN_FEATURE_THRESH | "5" |
public static final java.lang.String | NTHREADS | "1" |
public static final java.lang.String | OCCURRING_TAGS_ONLY | "false" |
public static final java.lang.String | OUTPUT_FILE | "" |
public static final java.lang.String | OUTPUT_FORMAT | "slashTags" |
public static final java.lang.String | OUTPUT_FORMAT_OPTIONS | "" |
public static final java.lang.String | POSSIBLE_TAGS_ONLY | "false" |
public static final java.lang.String | RARE_WORD_MIN_FEATURE_THRESH | "10" |
public static final java.lang.String | RARE_WORD_THRESH | "5" |
public static final java.lang.String | SEARCH | "qn" |
public static final java.lang.String | SGML | "false" |
public static final java.lang.String | TAG_INSIDE | "" |
public static final java.lang.String | TAG_SEPARATOR | "/" |
public static final java.lang.String | TAG_SEPARATOR_PROPERTY | "tagSeparator" |
public static final java.lang.String | TOKENIZE | "true" |
public static final java.lang.String | TOKENIZER_FACTORY | "" |
public static final java.lang.String | TOKENIZER_OPTIONS | "" |
public static final java.lang.String | VERBOSE | "false" |
public static final java.lang.String | VERBOSE_RESULTS | "true" |
public static final java.lang.String | VERY_COMMON_WORD_THRESH | "250" |
public static final java.lang.String | WORD_FUNCTION | "" |
public static final java.lang.String | XML_INPUT | "" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final boolean | DBG | false |
protected static final int | kBestSize | 1 |
protected static final java.lang.String | naTag | "NA" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | DEFAULT_ENCODING | "UTF-8" |
protected static final char | DEFAULT_GF_CHAR | 45 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | CoNLLX_FieldCount | 10 |
public static final int | CoNLLX_GovField | 6 |
public static final int | CoNLLX_POSField | 3 |
public static final int | CoNLLX_RelnField | 7 |
public static final int | CoNLLX_WordField | 1 |
public static final java.lang.String | DEFAULT_PARSER_FILE | "/u/nlp/data/lexparser/englishPCFG.ser.gz" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | TEMPORAL_9 | 9 |
public static final int | TEMPORAL_ACL03PCFG | 1 |
public static final int | TEMPORAL_ALL_NP | 4 |
public static final int | TEMPORAL_ALL_NP_AND_PP | 5 |
public static final int | TEMPORAL_ALL_NP_EVEN_UNDER_PP | 7 |
public static final int | TEMPORAL_ALL_NP_PP_ADVP | 8 |
public static final int | TEMPORAL_ALL_TERMINALS | 3 |
public static final int | TEMPORAL_ANY_TMP_PERCOLATED | 2 |
public static final int | TEMPORAL_NONE | 0 |
public static final int | TEMPORAL_NP_AND_PP_WITH_NP_HEAD | 6 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | DEFAULT_TREE_FILE_SUFFIX | "mrg" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | DEFAULT_ENCODING | "UTF-8" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | headMark | "=H" |
public static final java.lang.String | rootLabelOnlyFormat | "rootSymbolOnly" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | ENCODING | "utf-8" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | ASCII | 1 |
public static final int | DELETE | 3 |
public static final int | DELETE_EXCEPT_BETWEEN_ASCII | 4 |
public static final int | FULLWIDTH | 2 |
public static final int | LEAVE | 0 |
public static final int | MAX_LEGAL | 4 |
public static final java.lang.String | MID_DOT_REGEX_STR | "[\u00b7\u0387\u2022\u2024\u2027\u2219\u22c5\u30fb]" |
public static final int | NORMALIZE | 1 |
public static final java.lang.String | NUMBERS | "[\u4e00\u4e8c\u4e09\u56db\u4e94\u516d\u4e03\u516b\u4e5d\u5341]" |
public static final java.lang.String | ONEWHITE | "[\\s\\p{Zs}]" |
public static final java.lang.String | WHITE | "[\\s\\p{Zs}]*" |
public static final java.lang.String | WHITEPLUS | "[\\s\\p{Zs}]+" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | JJTLOCATION | 2 |
public static final int | JJTNODENAME | 5 |
public static final int | JJTNODESELECTION | 4 |
public static final int | JJTNODESELECTIONLIST | 3 |
public static final int | JJTOPERATION | 1 |
public static final int | JJTROOT | 0 |
public static final int | JJTTREEDTRS | 9 |
public static final int | JJTTREELIST | 6 |
public static final int | JJTTREENODE | 8 |
public static final int | JJTTREEROOT | 7 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | HASH_MAP_PROPERTY | "edu.stanford.nlp.hashmap.impl" |
public static final java.lang.String | HASH_SET_PROPERTY | "edu.stanford.nlp.hashset.impl" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | INTERVAL_OPEN_BEGIN | 1 |
public static final int | INTERVAL_OPEN_END | 2 |
protected static final int | REL_FLAGS_AFTER | 4 |
protected static final int | REL_FLAGS_BEFORE | 2 |
public static final int | REL_FLAGS_EE_AFTER | 16384 |
public static final int | REL_FLAGS_EE_BEFORE | 8192 |
public static final int | REL_FLAGS_EE_SAME | 4096 |
protected static final int | REL_FLAGS_EE_SHIFT | 12 |
public static final int | REL_FLAGS_EE_UNKNOWN | 28672 |
public static final int | REL_FLAGS_ES_AFTER | 1024 |
public static final int | REL_FLAGS_ES_BEFORE | 512 |
public static final int | REL_FLAGS_ES_SAME | 256 |
protected static final int | REL_FLAGS_ES_SHIFT | 8 |
public static final int | REL_FLAGS_ES_UNKNOWN | 1792 |
public static final int | REL_FLAGS_INTERVAL_AFTER | 262144 |
public static final int | REL_FLAGS_INTERVAL_ALMOST_AFTER | 16777216 |
public static final int | REL_FLAGS_INTERVAL_ALMOST_BEFORE | 16777216 |
public static final int | REL_FLAGS_INTERVAL_ALMOST_SAME | 16777216 |
public static final int | REL_FLAGS_INTERVAL_BEFORE | 131072 |
public static final int | REL_FLAGS_INTERVAL_CONTAIN | 4194304 |
public static final int | REL_FLAGS_INTERVAL_FUZZY | -2147483648 |
public static final int | REL_FLAGS_INTERVAL_INSIDE | 2097152 |
public static final int | REL_FLAGS_INTERVAL_OVERLAP | 1048576 |
public static final int | REL_FLAGS_INTERVAL_SAME | 65536 |
public static final int | REL_FLAGS_INTERVAL_UNKNOWN | 7798784 |
protected static final int | REL_FLAGS_SAME | 1 |
public static final int | REL_FLAGS_SE_AFTER | 64 |
public static final int | REL_FLAGS_SE_BEFORE | 32 |
public static final int | REL_FLAGS_SE_SAME | 16 |
protected static final int | REL_FLAGS_SE_SHIFT | 4 |
public static final int | REL_FLAGS_SE_UNKNOWN | 112 |
public static final int | REL_FLAGS_SS_AFTER | 4 |
public static final int | REL_FLAGS_SS_BEFORE | 2 |
public static final int | REL_FLAGS_SS_SAME | 1 |
protected static final int | REL_FLAGS_SS_SHIFT | 0 |
public static final int | REL_FLAGS_SS_UNKNOWN | 7 |
protected static final int | REL_FLAGS_UNKNOWN | 7 |