public class LuceneKeywordCPFE extends LuceneKeywordPFE implements PairFeatureExtractor
LuceneNGramPFE.

| Modifier and Type | Field and Description |
|---|---|
static String |
KEYWORD_NGRAM_FIELD_COMBO |
protected int |
ngramMaxNCombo |
protected int |
ngramMinNCombo |
protected boolean |
ngramUseSymmetricalCombos |
protected int |
ngramUseTopKCombo |
static String |
PARAM_KEYWORD_NGRAM_MAX_N_COMBO
Maximum token length of the combination.
|
static String |
PARAM_KEYWORD_NGRAM_MIN_N_COMBO
Minimum token length of the combination.
|
static String |
PARAM_KEYWORD_NGRAM_SYMMETRY_COMBO
If true, both orderings of ngram combinations will be used.
|
static String |
PARAM_KEYWORD_NGRAM_USE_TOP_K_COMBO
Use this number of most frequent combinations.
|
protected de.tudarmstadt.ukp.dkpro.core.api.frequency.util.FrequencyDistribution<String> |
topKSetCombo |
includeCommas, KEYWORD_NGRAM_FIELD, KEYWORD_NGRAM_FIELD1, KEYWORD_NGRAM_FIELD2, keywordMaxN, keywordMinN, keywordNgramUseTopK, keywords, keywordsFile, markSentenceBoundary, markSentenceLocation, markViewBlindNgramsWithLocalView, ngramMaxN1, ngramMaxN2, ngramMinN1, ngramMinN2, PARAM_KEYWORD_NGRAM_INCLUDE_COMMAS, PARAM_KEYWORD_NGRAM_MARK_SENTENCE_BOUNDARY, PARAM_KEYWORD_NGRAM_MARK_SENTENCE_LOCATION, PARAM_KEYWORD_NGRAM_MAX_N, PARAM_KEYWORD_NGRAM_MAX_N_VIEW1, PARAM_KEYWORD_NGRAM_MAX_N_VIEW2, PARAM_KEYWORD_NGRAM_MIN_N, PARAM_KEYWORD_NGRAM_MIN_N_VIEW1, PARAM_KEYWORD_NGRAM_MIN_N_VIEW2, PARAM_KEYWORD_NGRAM_USE_TOP_K, PARAM_MARK_VIEWBLIND_KEYWORD_NGRAMS_WITH_LOCAL_VIEW, PARAM_NGRAM_KEYWORDS_FILE, PARAM_USE_VIEW1_KEYWORD_NGRAMS_AS_FEATURES, PARAM_USE_VIEW2_KEYWORD_NGRAMS_AS_FEATURES, PARAM_USE_VIEWBLIND_KEYWORD_NGRAMS_AS_FEATURES, useView1NgramsAsFeatures, useView2NgramsAsFeatures, useViewBlindNgramsAsFeatures

fieldOfTheMoment, kngramUseTopK, ngramBinaryFeatureValuesCombos, ngramUseTopK1, ngramUseTopK2, PARAM_NGRAM_BINARY_FEATURE_VALUES_COMBO, PARAM_NGRAM_USE_TOP_K_VIEW1, PARAM_NGRAM_USE_TOP_K_VIEW2, topKSetView1, topKSetView2, topNOfTheMoment

forceRereadFromIndex, LUCENE_NGRAM_FIELD, luceneDir, PARAM_SOURCE_LOCATION

dfStore, filterPartialStopwordMatches, ngramFreqThreshold, ngramLowerCase, ngramStopwordsFile, ngramUseTopK, PARAM_FILTER_PARTIAL_STOPWORD_MATCHES, PARAM_NGRAM_FREQ_THRESHOLD, PARAM_NGRAM_LOWER_CASE, PARAM_NGRAM_MAX_N, PARAM_NGRAM_MIN_N, PARAM_NGRAM_STOPWORDS_FILE, PARAM_NGRAM_USE_TOP_K, PARAM_TF_IDF_CALCULATION, prefix, stopwords, tfIdfCalculation, topKSet

featureExtractorName, PARAM_UNIQUE_EXTRACTOR_NAME

| Constructor and Description |
|---|
LuceneKeywordCPFE() |
| Modifier and Type | Method and Description |
|---|---|
Set<Feature> |
extract(org.apache.uima.jcas.JCas view1,
org.apache.uima.jcas.JCas view2) |
List<MetaCollectorConfiguration> |
getMetaCollectorClasses(Map<String,Object> parameterSettings) |
boolean |
initialize(org.apache.uima.resource.ResourceSpecifier aSpecifier,
Map<String,Object> aAdditionalParams) |
protected boolean |
passesScreening(String term) |
getFeaturePrefix, getFieldName, getTopN, getViewNgrams

addToFeatureArray

getTopNgrams, logSelectionProcess

afterResourcesInitialized, getLogger, getResourceName

public static final String PARAM_KEYWORD_NGRAM_MIN_N_COMBO
protected int ngramMinNCombo
public static final String PARAM_KEYWORD_NGRAM_MAX_N_COMBO
protected int ngramMaxNCombo
public static final String PARAM_KEYWORD_NGRAM_USE_TOP_K_COMBO
protected int ngramUseTopKCombo
public static final String PARAM_KEYWORD_NGRAM_SYMMETRY_COMBO
protected boolean ngramUseSymmetricalCombos
public static final String KEYWORD_NGRAM_FIELD_COMBO
protected de.tudarmstadt.ukp.dkpro.core.api.frequency.util.FrequencyDistribution<String> topKSetCombo
public List<MetaCollectorConfiguration> getMetaCollectorClasses(Map<String,Object> parameterSettings) throws org.apache.uima.resource.ResourceInitializationException
Specified by: getMetaCollectorClasses in interface MetaDependent
Overrides: getMetaCollectorClasses in class LuceneKeywordPFE
Throws: org.apache.uima.resource.ResourceInitializationException

public boolean initialize(org.apache.uima.resource.ResourceSpecifier aSpecifier,
Map<String,Object> aAdditionalParams)
throws org.apache.uima.resource.ResourceInitializationException
Specified by: initialize in interface org.apache.uima.resource.Resource
Overrides: initialize in class LuceneKeywordPFE
Throws: org.apache.uima.resource.ResourceInitializationException

public Set<Feature> extract(org.apache.uima.jcas.JCas view1, org.apache.uima.jcas.JCas view2) throws org.dkpro.tc.api.exception.TextClassificationException
Specified by: extract in interface PairFeatureExtractor
Overrides: extract in class LuceneKeywordPFE
Throws: org.dkpro.tc.api.exception.TextClassificationException

protected boolean passesScreening(String term)
Overrides: passesScreening in class LuceneFeatureExtractorBase

Copyright © 2013–2018 Ubiquitous Knowledge Processing (UKP) Lab. All rights reserved.