public class CorrelationMatrixHadoopJob extends HadoopJob implements TextProducer, ImageProducer, CommandlineRunnable
Modifier and Type | Field and Description |
---|---|
static java.lang.String |
OUTPUT_SUBDIR
Subdirectory of the output directory for storing results to
|
COLT_JAR, DISTRIBUTED_WEKA_BASE_JAR, DISTRIBUTED_WEKA_HADOOP_JAR, JCOMMON_JAR, JFREECHART_JAR, LA4J_JAR, OPEN_CSV_JAR, TDIGEST_JAR
Constructor and Description |
---|
CorrelationMatrixHadoopJob()
Constructor
|
Modifier and Type | Method and Description |
---|---|
java.lang.String |
classAttributeTipText()
Tip text for this property
|
java.lang.String |
getClassAttribute()
Get the name or index of the class attribute.
|
java.lang.String |
getCorrelationMapTaskOptions()
Get options for the correlation map tasks
|
java.lang.String |
getCSVMapTaskOptions()
Get the options for the csv map tasks
|
java.awt.Image |
getImage() |
java.lang.String[] |
getJobOptionsOnly()
Get just the job options
|
Matrix |
getMatrix()
Get the matrix generated by this job, or null if the job has not been run
yet.
|
java.lang.String |
getNumNodesInCluster()
Get the number of nodes in the Hadoop cluster
|
java.lang.String[] |
getOptions() |
boolean |
getRunPCA()
Get whether to run a PCA analysis (using the generated correlation matrix
as input) as a post-processing step
|
java.lang.String |
getText() |
java.lang.String |
globalInfo()
Textual help info for this job
|
java.util.Enumeration<Option> |
listOptions() |
static void |
main(java.lang.String[] args)
Main method for executing this job from the command line
|
java.lang.String |
numNodesInClusterTipText()
Tip text for this property
|
void |
run(java.lang.Object toRun,
java.lang.String[] args) |
boolean |
runJob() |
java.lang.String |
runPCATipText()
Tip text for this property
|
void |
setClassAttribute(java.lang.String c)
Set the name or index of the class attribute.
|
void |
setCorrelationMapTaskOptions(java.lang.String opts)
Set options for the correlation map tasks
|
void |
setCSVMapTaskOptions(java.lang.String opts)
Set the options for the csv map tasks
|
void |
setNumNodesInCluster(java.lang.String n)
Set the number of nodes in the Hadoop cluster
|
void |
setOptions(java.lang.String[] options) |
void |
setRunPCA(boolean runPCA)
Set whether to run a PCA analysis (using the generated correlation matrix
as input) as a post-processing step
|
additionalWekaPackagesTipText, cleanOutputDirectory, deubgTipText, getAdditionalWekaPackages, getBaseOptionsOnly, getDebug, getLoggingInterval, getMapNumber, getMapReduceJobConfig, getMapReduceNumber, getPathToWekaJar, getReduceNumber, loggingIntervalTipText, logMessage, pathToWekaJarTipText, setAdditionalWekaPackages, setDebug, setLoggingInterval, setMapReduceJobConfig, setPathToWekaJar
environmentSubstitute, getAdditionalWekaPackageNames, getJobName, getJobStatus, getLog, logMessage, logMessage, makeOptionsStr, objectRowToInstance, parseInstance, postExecution, preExecution, setEnvironment, setJobDescription, setJobName, setJobStatus, setLog, setStatusMessagePrefix, stackTraceToString, statusMessage, stopJob
equals, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
postExecution, preExecution
public static final java.lang.String OUTPUT_SUBDIR
public java.lang.String globalInfo()
public void setCSVMapTaskOptions(java.lang.String opts)
opts
- options for the csv map tasks
public java.lang.String getCSVMapTaskOptions()
public void setCorrelationMapTaskOptions(java.lang.String opts)
opts
- options for the correlation map tasks
public java.lang.String getCorrelationMapTaskOptions()
public java.lang.String numNodesInClusterTipText()
public void setNumNodesInCluster(java.lang.String n)
n
- the number of nodes in the Hadoop cluster
public java.lang.String getNumNodesInCluster()
public Matrix getMatrix()
public java.util.Enumeration<Option> listOptions()
listOptions
in interface OptionHandler
listOptions
in class HadoopJob
public void setOptions(java.lang.String[] options) throws java.lang.Exception
setOptions
in interface OptionHandler
setOptions
in class HadoopJob
java.lang.Exception
public java.lang.String[] getOptions()
getOptions
in interface OptionHandler
getOptions
in class HadoopJob
public java.lang.String[] getJobOptionsOnly()
public java.lang.String classAttributeTipText()
public void setClassAttribute(java.lang.String c)
c
- the name or index of the class attribute
public java.lang.String getClassAttribute()
public java.lang.String runPCATipText()
public void setRunPCA(boolean runPCA)
runPCA
- true if PCA should be run after the correlation job finishes
public boolean getRunPCA()
public boolean runJob() throws weka.distributed.DistributedWekaException
runJob
in class distributed.core.DistributedJob
weka.distributed.DistributedWekaException
public java.lang.String getText()
getText
in interface TextProducer
public java.awt.Image getImage()
getImage
in interface ImageProducer
public static void main(java.lang.String[] args)
args
- arguments to the job
public void run(java.lang.Object toRun, java.lang.String[] args)
run
in interface CommandlineRunnable
run
in class distributed.core.DistributedJob