@PipeBitInfo(name="Regex Sectionizer (A)", description="Annotates Document Sections by detecting Section Headers using Regular Expressions.", products=SECTION) public abstract class RegexSectionizer extends org.apache.uima.fit.component.JCasAnnotator_ImplBase
Modifier and Type | Class and Description |
---|---|
protected static class |
RegexSectionizer.SectionType
Holder for a section type as defined in the user's specification BSV file
|
Modifier and Type | Field and Description |
---|---|
static String |
DIVIDER_LINE_NAME |
protected static org.apache.ctakes.core.ae.RegexSectionizer.SectionTag |
LINE_DIVIDER_TAG |
static String |
PARAM_TAG_DIVIDERS |
Constructor and Description |
---|
RegexSectionizer() |
Modifier and Type | Method and Description |
---|---|
protected static void |
addSectionType(RegexSectionizer.SectionType sectionType) |
static Map<String,RegexSectionizer.SectionType> |
getSectionTypes() |
void |
initialize(org.apache.uima.UimaContext context) |
protected static boolean |
isBoolean(String text) |
protected abstract void |
loadSections()
Load Sections in a manner appropriate for the Regex Sectionizer
|
void |
process(org.apache.uima.jcas.JCas jcas) |
static boolean |
shouldParseSegment(String segmentId)
Normally I would put this in a singleton, but I'm not sure that a singleton will work well with/as a UIMA AE
|
getRequiredCasInterface, process
getCasInstancesRequired, hasNext, next
public static final String PARAM_TAG_DIVIDERS
public static final String DIVIDER_LINE_NAME
protected static final org.apache.ctakes.core.ae.RegexSectionizer.SectionTag LINE_DIVIDER_TAG
public static boolean shouldParseSegment(String segmentId)
segmentId
- id of a section / segment
protected static void addSectionType(RegexSectionizer.SectionType sectionType)
public static Map<String,RegexSectionizer.SectionType> getSectionTypes()
public void initialize(org.apache.uima.UimaContext context) throws org.apache.uima.resource.ResourceInitializationException
initialize
in interface org.apache.uima.analysis_component.AnalysisComponent
initialize
in class org.apache.uima.fit.component.JCasAnnotator_ImplBase
org.apache.uima.resource.ResourceInitializationException
public void process(org.apache.uima.jcas.JCas jcas) throws org.apache.uima.analysis_engine.AnalysisEngineProcessException
process
in class org.apache.uima.analysis_component.JCasAnnotator_ImplBase
org.apache.uima.analysis_engine.AnalysisEngineProcessException
protected abstract void loadSections() throws org.apache.uima.resource.ResourceInitializationException
org.apache.uima.resource.ResourceInitializationException
protected static boolean isBoolean(String text)
text
Copyright © 2012-2017 The Apache Software Foundation. All Rights Reserved.