public class InvertedIndexByTokens<E extends Pattern> extends SentenceIndex<E> implements java.io.Serializable
Constructor and Description |
---|
InvertedIndexByTokens(java.util.Properties props,
java.util.Set<java.lang.String> stopWords,
java.util.function.Function<CoreLabel,java.util.Map<java.lang.String,java.lang.String>> transformSentenceToString) |
InvertedIndexByTokens(java.util.Properties props,
java.util.Set<java.lang.String> stopWords,
java.util.function.Function<CoreLabel,java.util.Map<java.lang.String,java.lang.String>> transformSentenceToString,
java.util.Map<java.lang.String,java.util.Set<java.lang.String>> index) |
Modifier and Type | Method and Description |
---|---|
protected void |
add(java.util.List<CoreLabel> sent,
java.lang.String sentId,
boolean addProcessedText) |
void |
add(java.util.Map<java.lang.String,DataInstance> sents,
boolean addProcessedText)
The addProcessedText flag is true when the sentences are being inserted for the first time.
|
static InvertedIndexByTokens |
createIndex(java.util.Map<java.lang.String,java.util.List<CoreLabel>> sentences,
java.util.Properties props,
java.util.Set<java.lang.String> stopWords,
java.lang.String dir,
java.util.function.Function<CoreLabel,java.util.Map<java.lang.String,java.lang.String>> transformCoreLabeltoString) |
void |
finishUpdating() |
java.util.Set<java.lang.String> |
getFileSentIds(CollectionValuedMap<java.lang.String,java.lang.String> relevantWords) |
java.util.Map<E,java.util.Set<java.lang.String>> |
getFileSentIdsFromPats(java.util.Collection<E> pats) |
static InvertedIndexByTokens |
loadIndex(java.util.Properties props,
java.util.Set<java.lang.String> stopwords,
java.lang.String dir,
java.util.function.Function<CoreLabel,java.util.Map<java.lang.String,java.lang.String>> transformSentenceToString) |
java.util.Map<E,java.util.Set<java.lang.String>> |
queryIndex(java.util.Collection<E> patterns) |
void |
saveIndex(java.lang.String dir) |
void |
update(java.util.List<CoreLabel> tokens,
java.lang.String sentid) |
Methods inherited from class SentenceIndex: createIndex, loadIndex, setUp, size
public InvertedIndexByTokens(java.util.Properties props, java.util.Set<java.lang.String> stopWords, java.util.function.Function<CoreLabel,java.util.Map<java.lang.String,java.lang.String>> transformSentenceToString)
public InvertedIndexByTokens(java.util.Properties props, java.util.Set<java.lang.String> stopWords, java.util.function.Function<CoreLabel,java.util.Map<java.lang.String,java.lang.String>> transformSentenceToString, java.util.Map<java.lang.String,java.util.Set<java.lang.String>> index)
public void add(java.util.Map<java.lang.String,DataInstance> sents, boolean addProcessedText)
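Description copied from class SentenceIndex: the addProcessedText flag is true when the sentences are being inserted for the first time.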
add
in class SentenceIndex<E extends Pattern>
protected void add(java.util.List<CoreLabel> sent, java.lang.String sentId, boolean addProcessedText)
add
in class SentenceIndex<E extends Pattern>
public void finishUpdating()
finishUpdating
in class SentenceIndex<E extends Pattern>
public void update(java.util.List<CoreLabel> tokens, java.lang.String sentid)
update
in class SentenceIndex<E extends Pattern>
public java.util.Set<java.lang.String> getFileSentIds(CollectionValuedMap<java.lang.String,java.lang.String> relevantWords)
public java.util.Map<E,java.util.Set<java.lang.String>> getFileSentIdsFromPats(java.util.Collection<E> pats)
public static InvertedIndexByTokens createIndex(java.util.Map<java.lang.String,java.util.List<CoreLabel>> sentences, java.util.Properties props, java.util.Set<java.lang.String> stopWords, java.lang.String dir, java.util.function.Function<CoreLabel,java.util.Map<java.lang.String,java.lang.String>> transformCoreLabeltoString)
public java.util.Map<E,java.util.Set<java.lang.String>> queryIndex(java.util.Collection<E> patterns)
queryIndex
in class SentenceIndex<E extends Pattern>
public void saveIndex(java.lang.String dir)
saveIndex
in class SentenceIndex<E extends Pattern>
public static InvertedIndexByTokens loadIndex(java.util.Properties props, java.util.Set<java.lang.String> stopwords, java.lang.String dir, java.util.function.Function<CoreLabel,java.util.Map<java.lang.String,java.lang.String>> transformSentenceToString)