public class PatternFactory
extends java.lang.Object
Modifier and Type | Class and Description |
---|---|
static class |
PatternFactory.PatternType |
Modifier and Type | Field and Description |
---|---|
static java.util.List<java.lang.String> |
fillerWords |
static java.util.regex.Pattern |
ignoreWordRegex
By default, does not ignore anything.
|
static java.lang.String |
numWordsCompound
Either a single number (if it is the same for all labels) or a per-label list of the form "Label1,2;Label2,3;...."
|
static java.util.Map<java.lang.String,java.lang.Integer> |
numWordsCompoundMapped |
static int |
numWordsCompoundMax |
static boolean |
useLemmaContextTokens
Use lemmas instead of words for the context tokens.
|
static boolean |
useNER |
static boolean |
useStopWordsBeforeTerm
Allow stop words to be matched before a target term.
|
static boolean |
useTargetNERRestriction
Add an NER restriction to the target phrase in the patterns.
|
Constructor and Description |
---|
PatternFactory() |
Modifier and Type | Method and Description |
---|---|
static boolean |
doNotUse(java.lang.String word,
java.util.Set<CandidatePhrase> stopWords) |
static java.util.Map<java.lang.Integer,java.util.Set> |
getPatternsAroundTokens(PatternFactory.PatternType patternType,
DataInstance sent,
java.util.Set<CandidatePhrase> stopWords) |
static void |
setUp(java.util.Properties props,
PatternFactory.PatternType patternType,
java.util.Set<java.lang.String> labels) |
@ArgumentParser.Option(name="useStopWordsBeforeTerm") public static boolean useStopWordsBeforeTerm
@ArgumentParser.Option(name="useTargetNERRestriction") public static boolean useTargetNERRestriction
@ArgumentParser.Option(name="useNER") public static boolean useNER
@ArgumentParser.Option(name="numWordsCompound") public static java.lang.String numWordsCompound
public static java.util.Map<java.lang.String,java.lang.Integer> numWordsCompoundMapped
public static int numWordsCompoundMax
@ArgumentParser.Option(name="useLemmaContextTokens") public static boolean useLemmaContextTokens
public static java.util.List<java.lang.String> fillerWords
public static java.util.regex.Pattern ignoreWordRegex
public static void setUp(java.util.Properties props, PatternFactory.PatternType patternType, java.util.Set<java.lang.String> labels)
public static boolean doNotUse(java.lang.String word, java.util.Set<CandidatePhrase> stopWords)
public static java.util.Map<java.lang.Integer,java.util.Set> getPatternsAroundTokens(PatternFactory.PatternType patternType, DataInstance sent, java.util.Set<CandidatePhrase> stopWords)