public class Dictionaries
extends java.lang.Object
Modifier and Type | Class and Description |
---|---|
static class |
Dictionaries.Animacy |
static class |
Dictionaries.Gender |
static class |
Dictionaries.MentionType |
static class |
Dictionaries.Number |
static class |
Dictionaries.Person |
Modifier and Type | Field and Description |
---|---|
java.util.Set<java.lang.String> |
allPronouns |
java.util.Set<java.lang.String> |
animatePronouns |
java.util.Set<java.lang.String> |
animateWords |
java.util.Set<java.lang.String> |
copulas |
java.util.ArrayList<Counter<Pair<java.lang.String,java.lang.String>>> |
corefDict |
Counter<Pair<java.lang.String,java.lang.String>> |
corefDictPMI |
java.util.Set<java.lang.String> |
countries |
java.util.Set<java.lang.String> |
dateTimePronouns |
java.util.Set<java.lang.String> |
demonymSet |
java.util.Set<java.lang.String> |
determiners |
java.util.Set<java.lang.String> |
facilityVehicleWeaponPronouns |
java.util.Set<java.lang.String> |
femalePronouns |
java.util.Set<java.lang.String> |
femaleWords |
java.util.Set<java.lang.String> |
firstPersonPronouns |
java.util.Map<java.util.List<java.lang.String>,Dictionaries.Gender> |
genderNumber |
java.util.Set<java.lang.String> |
GPEPronouns |
java.util.Set<java.lang.String> |
inanimatePronouns |
java.util.Set<java.lang.String> |
inanimateWords |
java.util.Set<java.lang.String> |
indefinitePronouns |
java.util.Set<java.lang.String> |
locationPronouns |
java.util.Set<java.lang.String> |
malePronouns |
java.util.Set<java.lang.String> |
maleWords |
java.util.Set<java.lang.String> |
miscPronouns |
java.util.Set<java.lang.String> |
modals |
java.util.Set<java.lang.String> |
moneyPercentNumberPronouns |
java.util.Map<java.lang.String,Counter<java.lang.String>> |
NE_signatures |
java.util.Set<java.lang.String> |
neg_relations |
java.util.Set<java.lang.String> |
negations |
java.util.Set<java.lang.String> |
neutralPronouns |
java.util.Set<java.lang.String> |
neutralWords |
java.util.Set<java.lang.String> |
nonWords |
java.util.Set<java.lang.String> |
notOrganizationPRP |
java.util.Set<java.lang.String> |
organizationPronouns |
java.util.Set<java.lang.String> |
otherPronouns |
java.util.Set<java.lang.String> |
parts |
java.util.Set<java.lang.String> |
personPronouns |
java.util.Set<java.lang.String> |
pluralPronouns |
java.util.Set<java.lang.String> |
pluralWords |
java.util.Set<java.lang.String> |
possessivePronouns |
java.util.Set<java.lang.String> |
quantifiers |
java.util.Set<java.lang.String> |
quantifiers2 |
java.util.Set<java.lang.String> |
reflexivePronouns |
java.util.Set<java.lang.String> |
relativePronouns |
java.util.Set<java.lang.String> |
reportNoun |
java.util.Set<java.lang.String> |
reportVerb |
java.util.Set<java.lang.String> |
secondPersonPronouns |
java.util.Set<java.lang.String> |
singularPronouns |
java.util.Set<java.lang.String> |
singularWords |
java.util.Map<java.lang.String,java.lang.String> |
statesAbbreviation |
java.util.Set<java.lang.String> |
statesAndProvinces |
java.util.Set<java.lang.String> |
stopWords |
java.util.Set<java.lang.String> |
temporals |
java.util.Set<java.lang.String> |
thirdPersonPronouns |
java.util.Set<java.lang.String> |
transparentNouns |
Constructor and Description |
---|
Dictionaries() |
Dictionaries(java.util.Properties props) |
Dictionaries(java.lang.String demonymWords,
java.lang.String animateWords,
java.lang.String inanimateWords,
java.lang.String maleWords,
java.lang.String neutralWords,
java.lang.String femaleWords,
java.lang.String pluralWords,
java.lang.String singularWords,
java.lang.String statesWords,
java.lang.String genderNumber,
java.lang.String countries,
java.lang.String states,
boolean loadCorefDict,
java.lang.String[] corefDictFiles,
java.lang.String corefDictPMIFile,
java.lang.String signaturesFile) |
Modifier and Type | Method and Description |
---|---|
java.util.Set<java.lang.String> |
getDemonyms(java.lang.String name)
Returns a set of demonyms for a country (or city or region).
|
boolean |
isAdjectivalDemonym(java.lang.String token)
Returns whether this mention (possibly multi-word) is the
adjectival form of a demonym, like "African" or "Iraqi".
|
void |
loadStateAbbreviation(java.lang.String statesFile)
The format of each line of this file is
fullStateName ( TAB abbrev )*
The file is cased, and lookups against it are case-sensitive.
|
java.lang.String |
lookupCanonicalAmericanStateName(java.lang.String name)
If the input string is an abbreviation of a U.S. state name or the canonical name, the canonical name is returned.
|
static java.lang.String |
signature(java.util.Properties props) |
public final java.util.Set<java.lang.String> reportVerb
public final java.util.Set<java.lang.String> reportNoun
public final java.util.Set<java.lang.String> nonWords
public final java.util.Set<java.lang.String> copulas
public final java.util.Set<java.lang.String> quantifiers
public final java.util.Set<java.lang.String> parts
public final java.util.Set<java.lang.String> temporals
public final java.util.Set<java.lang.String> femalePronouns
public final java.util.Set<java.lang.String> malePronouns
public final java.util.Set<java.lang.String> neutralPronouns
public final java.util.Set<java.lang.String> possessivePronouns
public final java.util.Set<java.lang.String> otherPronouns
public final java.util.Set<java.lang.String> thirdPersonPronouns
public final java.util.Set<java.lang.String> secondPersonPronouns
public final java.util.Set<java.lang.String> firstPersonPronouns
public final java.util.Set<java.lang.String> moneyPercentNumberPronouns
public final java.util.Set<java.lang.String> dateTimePronouns
public final java.util.Set<java.lang.String> organizationPronouns
public final java.util.Set<java.lang.String> locationPronouns
public final java.util.Set<java.lang.String> inanimatePronouns
public final java.util.Set<java.lang.String> animatePronouns
public final java.util.Set<java.lang.String> indefinitePronouns
public final java.util.Set<java.lang.String> relativePronouns
public final java.util.Set<java.lang.String> GPEPronouns
public final java.util.Set<java.lang.String> pluralPronouns
public final java.util.Set<java.lang.String> singularPronouns
public final java.util.Set<java.lang.String> facilityVehicleWeaponPronouns
public final java.util.Set<java.lang.String> miscPronouns
public final java.util.Set<java.lang.String> reflexivePronouns
public final java.util.Set<java.lang.String> transparentNouns
public final java.util.Set<java.lang.String> stopWords
public final java.util.Set<java.lang.String> notOrganizationPRP
public final java.util.Set<java.lang.String> quantifiers2
public final java.util.Set<java.lang.String> determiners
public final java.util.Set<java.lang.String> negations
public final java.util.Set<java.lang.String> neg_relations
public final java.util.Set<java.lang.String> modals
public final java.util.Set<java.lang.String> personPronouns
public final java.util.Set<java.lang.String> allPronouns
public final java.util.Map<java.lang.String,java.lang.String> statesAbbreviation
public final java.util.Set<java.lang.String> demonymSet
public final java.util.Set<java.lang.String> countries
public final java.util.Set<java.lang.String> statesAndProvinces
public final java.util.Set<java.lang.String> neutralWords
public final java.util.Set<java.lang.String> femaleWords
public final java.util.Set<java.lang.String> maleWords
public final java.util.Set<java.lang.String> pluralWords
public final java.util.Set<java.lang.String> singularWords
public final java.util.Set<java.lang.String> inanimateWords
public final java.util.Set<java.lang.String> animateWords
public final java.util.Map<java.util.List<java.lang.String>,Dictionaries.Gender> genderNumber
public final java.util.ArrayList<Counter<Pair<java.lang.String,java.lang.String>>> corefDict
public final java.util.Map<java.lang.String,Counter<java.lang.String>> NE_signatures
public Dictionaries(java.util.Properties props)
public Dictionaries(java.lang.String demonymWords, java.lang.String animateWords, java.lang.String inanimateWords, java.lang.String maleWords, java.lang.String neutralWords, java.lang.String femaleWords, java.lang.String pluralWords, java.lang.String singularWords, java.lang.String statesWords, java.lang.String genderNumber, java.lang.String countries, java.lang.String states, boolean loadCorefDict, java.lang.String[] corefDictFiles, java.lang.String corefDictPMIFile, java.lang.String signaturesFile)
public Dictionaries()
public void loadStateAbbreviation(java.lang.String statesFile)
public java.lang.String lookupCanonicalAmericanStateName(java.lang.String name)
name
- Is treated as a cased string, i.e. "ME" != "me".
public java.util.Set<java.lang.String> getDemonyms(java.lang.String name)
name
- Some string, perhaps a country name like "Australia".
public boolean isAdjectivalDemonym(java.lang.String token)
public static java.lang.String signature(java.util.Properties props)