public static class WekaFormatterFactory.WekaFormatter extends BaseSparseDataFormatter
Modifier and Type | Field and Description |
---|---|
static java.lang.String |
CLASS |
static java.lang.String |
INSTANCE_ID |
(package private) InstanceData |
instanceLabel |
(package private) FastVector |
wekaAttributes |
exportProperties, kernelUtil, labelToClassIndexMap, maxAttributeIndex, nominalAttributeMap, numericAttributeMap, outdir
ATTR_INSTANCE_ID, SCOPE, SCOPE_FOLD, SCOPE_LABEL
Constructor and Description |
---|
WekaFormatterFactory.WekaFormatter(KernelUtil kernelUtil) |
Modifier and Type | Method and Description |
---|---|
private void |
addNominalAttribute(java.lang.String attributeName,
java.util.SortedSet<java.lang.String> attributeValues,
boolean addDummy0)
Add a nominal attribute to the list of attributes
|
private void |
addWordsToInstances(Instances instances,
SparseData bagOfWordsData,
java.util.SortedMap<java.lang.Long,java.lang.String> instanceClasses)
add sparse data to instances
|
void |
clearFold()
clear all data structures set up during initializeFold
|
void |
clearLabel() |
void |
exportFold(SparseData sparseData,
java.util.SortedMap<java.lang.Long,java.lang.String> sortedMap,
boolean train,
java.lang.String label,
java.lang.Integer run,
java.lang.Integer fold)
export the fold train/test set.
|
protected void |
initializeAttributes(SparseData bagOfWordsData,
java.util.SortedSet<java.lang.String> classNames)
initialize attributes
|
void |
initializeExport(InstanceData instanceLabel,
java.util.Properties properties,
SparseData sparseData)
get needed properties out of outdir.
|
void |
initializeFold(SparseData sparseData,
java.lang.String label,
java.lang.Integer run,
java.lang.Integer fold,
java.util.SortedMap<java.lang.Boolean,java.util.SortedMap<java.lang.Long,java.lang.String>> foldInstanceLabelMap)
initialize data structures for the fold that will be exported.
|
Instances |
initializeInstances(SparseData sparseData,
java.util.SortedMap<java.lang.Long,java.lang.String> instanceClasses,
boolean train,
java.lang.String label,
java.lang.Integer run,
java.lang.Integer fold)
initialize the weka Instances
|
void |
initializeLabel(java.lang.String label,
java.util.SortedMap<java.lang.Integer,java.util.SortedMap<java.lang.Integer,java.util.SortedMap<java.lang.Boolean,java.util.SortedMap<java.lang.Long,java.lang.String>>>> labelInstances,
java.util.Properties properties,
SparseData sparseData)
initialize attributes on a per-label basis even if the data is the
same across all labels.
|
addNumericAttribute, exportAttributeNames, exportAttributeNames, exportSparseMatrix, exportSparseRow, getSparseLineValues, updateLabelClassMapTransductive
public static final java.lang.String CLASS
public static final java.lang.String INSTANCE_ID
InstanceData instanceLabel
FastVector wekaAttributes
public WekaFormatterFactory.WekaFormatter(KernelUtil kernelUtil)
private void addNominalAttribute(java.lang.String attributeName, java.util.SortedSet<java.lang.String> attributeValues, boolean addDummy0)
attributeName
- attributeValues
- addDummy0
- if true, add a dummy attribute as the first attribute
value in the list of potential attribute values.
private void addWordsToInstances(Instances instances, SparseData bagOfWordsData, java.util.SortedMap<java.lang.Long,java.lang.String> instanceClasses) throws java.io.IOException
instances
- bagOfWordsData
- instanceClasses
- java.io.IOException
public void clearFold()
SparseDataFormatter
public void clearLabel()
public void exportFold(SparseData sparseData, java.util.SortedMap<java.lang.Long,java.lang.String> sortedMap, boolean train, java.lang.String label, java.lang.Integer run, java.lang.Integer fold) throws java.io.IOException
SparseDataFormatter
java.io.IOException
protected void initializeAttributes(SparseData bagOfWordsData, java.util.SortedSet<java.lang.String> classNames)
bagOfWordsData
- classNames
-
public void initializeExport(InstanceData instanceLabel, java.util.Properties properties, SparseData sparseData) throws java.io.IOException
BaseSparseDataFormatter
initializeExport
in interface SparseDataFormatter
initializeExport
in class BaseSparseDataFormatter
java.io.IOException
public void initializeFold(SparseData sparseData, java.lang.String label, java.lang.Integer run, java.lang.Integer fold, java.util.SortedMap<java.lang.Boolean,java.util.SortedMap<java.lang.Long,java.lang.String>> foldInstanceLabelMap) throws java.io.IOException
SparseDataFormatter
java.io.IOException
public Instances initializeInstances(SparseData sparseData, java.util.SortedMap<java.lang.Long,java.lang.String> instanceClasses, boolean train, java.lang.String label, java.lang.Integer run, java.lang.Integer fold) throws java.io.IOException
arffRelation
- sql
- classLabels
- idfMap
- docLengthMap
- java.io.IOException
public void initializeLabel(java.lang.String label, java.util.SortedMap<java.lang.Integer,java.util.SortedMap<java.lang.Integer,java.util.SortedMap<java.lang.Boolean,java.util.SortedMap<java.lang.Long,java.lang.String>>>> labelInstances, java.util.Properties properties, SparseData sparseData) throws java.io.IOException
java.io.IOException