@KFStep(name="Join", category="Flow", toolTipText="Performs an inner join on two incoming datasets/instance streams (IMPORTANT: assumes that both datasets are sorted in ascending order of the key fields). If data is not sorted then use a Sorter step to sort both into ascending order of the key fields. Does not handle the case where keys are not unique in one or both inputs.", iconPath="weka/gui/knowledgeflow/icons/Join.gif") public class Join extends BaseStep
Modifier and Type | Field and Description |
---|---|
static java.lang.String |
KEY_SPEC_SEPARATOR
Separator used to separate first and second input key specifications
|
Constructor and Description |
---|
Join() |
Modifier and Type | Method and Description |
---|---|
java.util.List<java.lang.String> |
getConnectedInputNames()
Get the names of the connected steps as a list
|
java.lang.String |
getCustomEditorForStep()
Return the fully qualified name of a custom editor component (JComponent)
to use for editing the properties of the step.
|
Instances |
getFirstInputStructure()
Get the Instances structure being produced by the first input
|
java.util.List<java.lang.String> |
getIncomingConnectionTypes()
Get a list of incoming connection types that this step can accept.
|
java.lang.String |
getKeySpec()
Get the key specification (in internal format -
k11,k12,...,k1nKEY_SPEC_SEPARATORk21,k22,...,k2n)
|
java.util.List<java.lang.String> |
getOutgoingConnectionTypes()
Get a list of outgoing connection types that this step can produce.
|
Instances |
getSecondInputStructure()
Get the Instances structure being produced by the second input
|
void |
processIncoming(Data data)
Process some incoming data
|
void |
setKeySpec(java.lang.String ks)
Set the key specification (in internal format -
k11,k12,...,k1nKEY_SPEC_SEPARATORk21,k22,...,k2n)
|
void |
stepInit()
Initialize the step
|
environmentSubstitute, getDefaultSettings, getInteractiveViewers, getInteractiveViewersImpls, getName, getStepManager, globalInfo, isResourceIntensive, isStopRequested, outputStructureForConnectionType, outputStructureForConnectionType, setName, setStepIsResourceIntensive, setStepManager, setStepMustRunSingleThreaded, start, stepMustRunSingleThreaded, stop
public static final java.lang.String KEY_SPEC_SEPARATOR
public void setKeySpec(java.lang.String ks)
ks
- the key specification
public java.lang.String getKeySpec()
public java.util.List<java.lang.String> getConnectedInputNames()
public Instances getFirstInputStructure() throws WekaException
WekaException
- if a problem occurs
public Instances getSecondInputStructure() throws WekaException
WekaException
- if a problem occurs
public void stepInit() throws WekaException
WekaException
- if a problem occurs
public void processIncoming(Data data) throws WekaException
processIncoming
in interface BaseStepExtender
processIncoming
in interface Step
processIncoming
in class BaseStep
data
- the data to process
WekaException
- if a problem occurs
public java.util.List<java.lang.String> getIncomingConnectionTypes()
public java.util.List<java.lang.String> getOutgoingConnectionTypes()
public java.lang.String getCustomEditorForStep()
getCustomEditorForStep
in interface Step
getCustomEditorForStep
in class BaseStep