public class InvertedIndexByTokens<E extends Pattern> extends SentenceIndex<E> implements java.io.Serializable
| Constructor and Description |
|---|
InvertedIndexByTokens(java.util.Properties props,
java.util.Set<java.lang.String> stopWords,
java.util.function.Function<CoreLabel,java.util.Map<java.lang.String,java.lang.String>> transformSentenceToString) |
InvertedIndexByTokens(java.util.Properties props,
java.util.Set<java.lang.String> stopWords,
java.util.function.Function<CoreLabel,java.util.Map<java.lang.String,java.lang.String>> transformSentenceToString,
java.util.Map<java.lang.String,java.util.Set<java.lang.String>> index) |
| Modifier and Type | Method and Description |
|---|---|
protected void |
add(java.util.List<CoreLabel> sent,
java.lang.String sentId,
boolean addProcessedText) |
void |
add(java.util.Map<java.lang.String,DataInstance> sents,
boolean addProcessedText)
addProcessedText is true when inserting sentences for the first time
|
static InvertedIndexByTokens |
createIndex(java.util.Map<java.lang.String,java.util.List<CoreLabel>> sentences,
java.util.Properties props,
java.util.Set<java.lang.String> stopWords,
java.lang.String dir,
java.util.function.Function<CoreLabel,java.util.Map<java.lang.String,java.lang.String>> transformCoreLabeltoString) |
void |
finishUpdating() |
java.util.Set<java.lang.String> |
getFileSentIds(CollectionValuedMap<java.lang.String,java.lang.String> relevantWords) |
java.util.Map<E,java.util.Set<java.lang.String>> |
getFileSentIdsFromPats(java.util.Collection<E> pats) |
static InvertedIndexByTokens |
loadIndex(java.util.Properties props,
java.util.Set<java.lang.String> stopwords,
java.lang.String dir,
java.util.function.Function<CoreLabel,java.util.Map<java.lang.String,java.lang.String>> transformSentenceToString) |
java.util.Map<E,java.util.Set<java.lang.String>> |
queryIndex(java.util.Collection<E> patterns) |
void |
saveIndex(java.lang.String dir) |
void |
update(java.util.List<CoreLabel> tokens,
java.lang.String sentid) |
createIndex, loadIndex, setUp, size
public InvertedIndexByTokens(java.util.Properties props,
java.util.Set<java.lang.String> stopWords,
java.util.function.Function<CoreLabel,java.util.Map<java.lang.String,java.lang.String>> transformSentenceToString)
public InvertedIndexByTokens(java.util.Properties props,
java.util.Set<java.lang.String> stopWords,
java.util.function.Function<CoreLabel,java.util.Map<java.lang.String,java.lang.String>> transformSentenceToString,
java.util.Map<java.lang.String,java.util.Set<java.lang.String>> index)
public void add(java.util.Map<java.lang.String,DataInstance> sents, boolean addProcessedText)
SentenceIndex
add in class SentenceIndex<E extends Pattern>
protected void add(java.util.List<CoreLabel> sent, java.lang.String sentId, boolean addProcessedText)
add in class SentenceIndex<E extends Pattern>
public void finishUpdating()
finishUpdating in class SentenceIndex<E extends Pattern>
public void update(java.util.List<CoreLabel> tokens, java.lang.String sentid)
update in class SentenceIndex<E extends Pattern>
public java.util.Set<java.lang.String> getFileSentIds(CollectionValuedMap<java.lang.String,java.lang.String> relevantWords)
public java.util.Map<E,java.util.Set<java.lang.String>> getFileSentIdsFromPats(java.util.Collection<E> pats)
public static InvertedIndexByTokens createIndex(java.util.Map<java.lang.String,java.util.List<CoreLabel>> sentences, java.util.Properties props, java.util.Set<java.lang.String> stopWords, java.lang.String dir, java.util.function.Function<CoreLabel,java.util.Map<java.lang.String,java.lang.String>> transformCoreLabeltoString)
public java.util.Map<E,java.util.Set<java.lang.String>> queryIndex(java.util.Collection<E> patterns)
queryIndex in class SentenceIndex<E extends Pattern>
public void saveIndex(java.lang.String dir)
saveIndex in class SentenceIndex<E extends Pattern>
public static InvertedIndexByTokens loadIndex(java.util.Properties props, java.util.Set<java.lang.String> stopwords, java.lang.String dir, java.util.function.Function<CoreLabel,java.util.Map<java.lang.String,java.lang.String>> transformSentenceToString)