public class LvgBaseTokenAnnotator
extends JCasAnnotator_ImplBase
Modifier and Type | Class and Description |
---|---|
(package private) class |
LvgBaseTokenAnnotator.LemmaLocalClass
Basic class to group a lemma word with its various parts of speech.
|
Modifier and Type | Field and Description |
---|---|
private java.lang.String |
cmdCacheFileLocation |
private int |
cmdCacheFreqCutoff |
private UimaContext |
context |
private java.util.Set |
exclusionSet |
private java.lang.String |
lemmaCacheFileLocation |
private int |
lemmaCacheFreqCutoff |
private java.util.Map |
lemmaCacheMap |
private Logger |
logger |
private LvgCmdApi |
lvgCmd |
private java.lang.String |
LVGCMDAPI_RESRC_KEY |
private LvgLexItemApi |
lvgLexItem |
private java.util.Map |
normCacheMap |
static java.lang.String |
PARAM_LEMMA_CACHE_FILE_LOCATION
Value is "LemmaCacheFileLocation".
|
static java.lang.String |
PARAM_LEMMA_CACHE_FREQUENCY_CUTOFF
Value is "LemmaCacheFrequencyCutoff".
|
static java.lang.String |
PARAM_POST_LEMMAS
Value is "PostLemmas".
|
static java.lang.String |
PARAM_USE_LEMMA_CACHE
Value is "UseLemmaCache".
|
private boolean |
postLemmas |
private java.util.Set |
skipSegmentsSet |
private boolean |
useCmdCache |
private boolean |
useLemmaCache |
private boolean |
useSegments |
private java.util.Map |
xeroxTreebankMap |
Constructor and Description |
---|
LvgBaseTokenAnnotator() |
Modifier and Type | Method and Description |
---|---|
protected void |
annotateRange(JCas jcas,
java.lang.String text,
int rangeBegin,
int rangeEnd)
A utility method that annotates a given range.
|
private void |
configInit()
Sets configuration parameters with values from the descriptor.
|
void |
initialize(UimaContext aContext)
Performs initialization logic.
|
private void |
loadCmdCacheFile(java.lang.String cpLocation)
Helper method that loads a Norm cache file.
|
private void |
loadLemmaCacheFile(java.lang.String cpLocation)
Helper method that loads a Lemma cache file.
|
void |
process(JCas jcas)
Invokes this annotator's analysis logic.
|
private void |
setLemma(BaseToken wordAnnotation,
java.lang.String word,
JCas jcas) |
private void |
setNormalizedForm(BaseToken tokenAnnotation,
java.lang.String token) |
public static final java.lang.String PARAM_POST_LEMMAS
public static final java.lang.String PARAM_USE_LEMMA_CACHE
public static final java.lang.String PARAM_LEMMA_CACHE_FILE_LOCATION
public static final java.lang.String PARAM_LEMMA_CACHE_FREQUENCY_CUTOFF
private Logger logger
private final java.lang.String LVGCMDAPI_RESRC_KEY
private LvgCmdApi lvgCmd
private LvgLexItemApi lvgLexItem
private UimaContext context
private boolean useSegments
private java.util.Set skipSegmentsSet
private boolean useCmdCache
private java.lang.String cmdCacheFileLocation
private int cmdCacheFreqCutoff
private java.util.Map xeroxTreebankMap
private boolean postLemmas
private boolean useLemmaCache
private java.lang.String lemmaCacheFileLocation
private int lemmaCacheFreqCutoff
private java.util.Map normCacheMap
private java.util.Map lemmaCacheMap
private java.util.Set exclusionSet
public void initialize(UimaContext aContext) throws ResourceInitializationException
Throws: ResourceInitializationException
See Also: org.apache.uima.analysis_engine.annotator.BaseAnnotator#initialize(AnnotatorContext)
private void configInit() throws ResourceInitializationException
Throws: ResourceInitializationException
public void process(JCas jcas) throws AnalysisEngineProcessException
Throws: AnalysisEngineProcessException
protected void annotateRange(JCas jcas, java.lang.String text, int rangeBegin, int rangeEnd) throws AnalysisEngineProcessException
Throws: AnalysisEngineProcessException
private void setNormalizedForm(BaseToken tokenAnnotation, java.lang.String token) throws AnalysisEngineProcessException
Throws: AnalysisEngineProcessException
private void setLemma(BaseToken wordAnnotation, java.lang.String word, JCas jcas) throws AnalysisEngineProcessException
Throws: AnalysisEngineProcessException
private void loadCmdCacheFile(java.lang.String cpLocation) throws java.io.FileNotFoundException, java.io.IOException
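Parameters:
location - (no description given; the documented name differs from the signature's cpLocation argument)
Throws:
java.io.FileNotFoundException
java.io.IOException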
private void loadLemmaCacheFile(java.lang.String cpLocation) throws java.io.FileNotFoundException, java.io.IOException
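Parameters:
location - (no description given; the documented name differs from the signature's cpLocation argument)
Throws:
java.io.FileNotFoundException
java.io.IOException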