public class Dictionaries
extends java.lang.Object
Modifier and Type | Class and Description |
---|---|
static class | Dictionaries.Animacy |
static class | Dictionaries.Gender |
static class | Dictionaries.MentionType |
static class | Dictionaries.Number |
static class | Dictionaries.Person |
Modifier and Type | Field and Description |
---|---|
java.util.Set<java.lang.String> | allPronouns |
java.util.Set<java.lang.String> | animatePronouns |
java.util.Set<java.lang.String> | animateWords |
java.util.Set<java.lang.String> | copulas |
java.util.ArrayList<Counter<Pair<java.lang.String,java.lang.String>>> | corefDict |
Counter<Pair<java.lang.String,java.lang.String>> | corefDictPMI |
java.util.Set<java.lang.String> | countries |
java.util.Set<java.lang.String> | dateTimePronouns |
java.util.Set<java.lang.String> | demonymSet |
java.util.Set<java.lang.String> | determiners |
Counter<java.lang.String> | dictScore |
int | dimVector |
java.util.Set<java.lang.String> | facilityVehicleWeaponPronouns |
java.util.Set<java.lang.String> | femalePronouns |
java.util.Set<java.lang.String> | femaleWords |
java.util.Set<java.lang.String> | firstPersonPronouns |
java.util.Map<java.util.List<java.lang.String>,Dictionaries.Gender> | genderNumber |
java.util.Set<java.lang.String> | GPEPronouns |
java.util.Set<java.lang.String> | inanimatePronouns |
java.util.Set<java.lang.String> | inanimateWords |
java.util.Set<java.lang.String> | indefinitePronouns |
java.util.Set<java.lang.String> | interrogativePronouns |
java.util.Set<java.lang.String> | locationPronouns |
java.util.Set<java.lang.String> | malePronouns |
java.util.Set<java.lang.String> | maleWords |
java.util.Set<java.lang.String> | miscPronouns |
java.util.Set<java.lang.String> | modals |
java.util.Set<java.lang.String> | moneyPercentNumberPronouns |
java.util.Map<java.lang.String,Counter<java.lang.String>> | NE_signatures |
java.util.Set<java.lang.String> | neg_relations |
java.util.Set<java.lang.String> | negations |
java.util.Set<java.lang.String> | neutralPronouns |
java.util.Set<java.lang.String> | neutralWords |
java.util.Set<java.lang.String> | nonWords |
java.util.Set<java.lang.String> | notOrganizationPRP |
java.util.Set<java.lang.String> | organizationPronouns |
java.util.Set<java.lang.String> | otherPronouns |
java.util.Set<java.lang.String> | parts |
java.util.Set<java.lang.String> | personPronouns |
java.util.Set<java.lang.String> | pluralPronouns |
java.util.Set<java.lang.String> | pluralWords |
java.util.Set<java.lang.String> | possessivePronouns |
java.util.Set<java.lang.String> | quantifiers |
java.util.Set<java.lang.String> | quantifiers2 |
java.util.Set<java.lang.String> | reflexivePronouns |
java.util.Set<java.lang.String> | relativePronouns |
java.util.Set<java.lang.String> | removeChars |
java.util.Set<java.lang.String> | removeWords |
java.util.Set<java.lang.String> | reportNoun |
java.util.Set<java.lang.String> | reportVerb |
java.util.Set<java.lang.String> | secondPersonPronouns |
java.util.Set<java.lang.String> | singularPronouns |
java.util.Set<java.lang.String> | singularWords |
java.util.Map<java.lang.String,java.lang.String> | statesAbbreviation |
java.util.Set<java.lang.String> | statesAndProvinces |
java.util.Set<java.lang.String> | stopWords |
java.util.Map<java.lang.String,java.lang.String> | strToEntity |
java.util.Set<java.lang.String> | temporals |
java.util.Set<java.lang.String> | thirdPersonPronouns |
java.util.Set<java.lang.String> | titleWords |
java.util.Set<java.lang.String> | transparentNouns |
VectorMap | vectors |
Constructor and Description |
---|
Dictionaries() |
Dictionaries(java.util.Properties props) |
Dictionaries(java.lang.String language, java.lang.String demonymWords, java.lang.String animateWords, java.lang.String inanimateWords, java.lang.String maleWords, java.lang.String neutralWords, java.lang.String femaleWords, java.lang.String pluralWords, java.lang.String singularWords, java.lang.String statesWords, java.lang.String genderNumber, java.lang.String countries, java.lang.String states, boolean loadCorefDict, java.lang.String[] corefDictFiles, java.lang.String corefDictPMIFile, java.lang.String signaturesFile) |
Modifier and Type | Method and Description |
---|---|
java.util.Set<java.lang.String> | getDemonyms(java.lang.String name)<br>Returns a set of demonyms for a country (or city or region). |
boolean | isAdjectivalDemonym(java.lang.String token)<br>Returns whether this mention (possibly multi-word) is the adjectival form of a demonym, like "African" or "Iraqi". |
void | loadSemantics(java.util.Properties props) |
java.lang.String | lookupCanonicalAmericanStateName(java.lang.String name)<br>If the input string is an abbreviation of a U.S. state name, returns the canonical state name. |
static java.lang.String | signature(java.util.Properties props) |
public java.util.Set<java.lang.String> reportVerb
public java.util.Set<java.lang.String> reportNoun
public java.util.Set<java.lang.String> nonWords
public java.util.Set<java.lang.String> copulas
public java.util.Set<java.lang.String> quantifiers
public java.util.Set<java.lang.String> parts
public java.util.Set<java.lang.String> temporals
public java.util.Set<java.lang.String> femalePronouns
public java.util.Set<java.lang.String> malePronouns
public java.util.Set<java.lang.String> neutralPronouns
public java.util.Set<java.lang.String> possessivePronouns
public java.util.Set<java.lang.String> otherPronouns
public java.util.Set<java.lang.String> thirdPersonPronouns
public java.util.Set<java.lang.String> secondPersonPronouns
public java.util.Set<java.lang.String> firstPersonPronouns
public java.util.Set<java.lang.String> moneyPercentNumberPronouns
public java.util.Set<java.lang.String> dateTimePronouns
public java.util.Set<java.lang.String> organizationPronouns
public java.util.Set<java.lang.String> locationPronouns
public java.util.Set<java.lang.String> inanimatePronouns
public java.util.Set<java.lang.String> animatePronouns
public java.util.Set<java.lang.String> indefinitePronouns
public java.util.Set<java.lang.String> relativePronouns
public java.util.Set<java.lang.String> interrogativePronouns
public java.util.Set<java.lang.String> GPEPronouns
public java.util.Set<java.lang.String> pluralPronouns
public java.util.Set<java.lang.String> singularPronouns
public java.util.Set<java.lang.String> facilityVehicleWeaponPronouns
public java.util.Set<java.lang.String> miscPronouns
public java.util.Set<java.lang.String> reflexivePronouns
public java.util.Set<java.lang.String> transparentNouns
public java.util.Set<java.lang.String> stopWords
public java.util.Set<java.lang.String> notOrganizationPRP
public java.util.Set<java.lang.String> quantifiers2
public java.util.Set<java.lang.String> determiners
public java.util.Set<java.lang.String> negations
public java.util.Set<java.lang.String> neg_relations
public java.util.Set<java.lang.String> modals
public java.util.Set<java.lang.String> titleWords
public java.util.Set<java.lang.String> removeWords
public java.util.Set<java.lang.String> removeChars
public final java.util.Set<java.lang.String> personPronouns
public final java.util.Set<java.lang.String> allPronouns
public final java.util.Map<java.lang.String,java.lang.String> statesAbbreviation
public final java.util.Set<java.lang.String> demonymSet
public final java.util.Set<java.lang.String> countries
public final java.util.Set<java.lang.String> statesAndProvinces
public final java.util.Set<java.lang.String> neutralWords
public final java.util.Set<java.lang.String> femaleWords
public final java.util.Set<java.lang.String> maleWords
public final java.util.Set<java.lang.String> pluralWords
public final java.util.Set<java.lang.String> singularWords
public final java.util.Set<java.lang.String> inanimateWords
public final java.util.Set<java.lang.String> animateWords
public final java.util.Map<java.util.List<java.lang.String>,Dictionaries.Gender> genderNumber
public final java.util.ArrayList<Counter<Pair<java.lang.String,java.lang.String>>> corefDict
public final java.util.Map<java.lang.String,Counter<java.lang.String>> NE_signatures
public int dimVector
public VectorMap vectors
public java.util.Map<java.lang.String,java.lang.String> strToEntity
public Counter<java.lang.String> dictScore
public Dictionaries(java.util.Properties props) throws java.lang.ClassNotFoundException, java.io.IOException
java.lang.ClassNotFoundException
java.io.IOException
public Dictionaries(java.lang.String language, java.lang.String demonymWords, java.lang.String animateWords, java.lang.String inanimateWords, java.lang.String maleWords, java.lang.String neutralWords, java.lang.String femaleWords, java.lang.String pluralWords, java.lang.String singularWords, java.lang.String statesWords, java.lang.String genderNumber, java.lang.String countries, java.lang.String states, boolean loadCorefDict, java.lang.String[] corefDictFiles, java.lang.String corefDictPMIFile, java.lang.String signaturesFile)
public Dictionaries() throws java.lang.ClassNotFoundException, java.io.IOException
java.lang.ClassNotFoundException
java.io.IOException
public java.lang.String lookupCanonicalAmericanStateName(java.lang.String name)
name
- Is treated as a cased string: "ME" != "me".
public java.util.Set<java.lang.String> getDemonyms(java.lang.String name)
name
- Some string, perhaps a country name like "Australia".
public boolean isAdjectivalDemonym(java.lang.String token)
public void loadSemantics(java.util.Properties props) throws java.lang.ClassNotFoundException, java.io.IOException
java.lang.ClassNotFoundException
java.io.IOException
public static java.lang.String signature(java.util.Properties props)