Use of org.knime.core.data.container.CellFactory in project knime-core by knime.
The class PCANodeModel, method execute.
/**
 * Performs the PCA on the selected input columns and appends the projected
 * coordinates to the input table.
 * <p>
 * The work is split into four progress slices of the given execution context:
 * mean vector (0.2), covariance matrix (0.2), eigenvalue decomposition (0.2)
 * and the column rearrangement that writes the projected cells (0.4).
 *
 * {@inheritDoc}
 *
 * @throws IllegalArgumentException if the input table has fewer than two rows,
 *             if the covariance computation reports skipped rows while
 *             fail-on-missing-values is enabled, or if the number of target
 *             dimensions is smaller than 1 or larger than the number of
 *             selected input columns
 */
@Override
protected PortObject[] execute(final PortObject[] inData, final ExecutionContext exec) throws Exception {
    // Resolve the input table and its spec once; every later step reuses them
    // instead of re-casting inData with a hard-coded port index.
    final BufferedDataTable dataTable = (BufferedDataTable) inData[DATA_INPORT];
    final DataTableSpec inSpec = dataTable.getDataTableSpec();

    if (dataTable.size() == 0) {
        throw new IllegalArgumentException("Input table is empty!");
    }
    if (dataTable.size() == 1) {
        throw new IllegalArgumentException("Input table has only one row!");
    }

    final double[] meanVector =
        getMeanVector(dataTable, m_inputColumnIndices, false, exec.createSubExecutionContext(0.2));

    // getCovarianceMatrix fills m in place and returns the number of rows it had to skip.
    final double[][] m = new double[m_inputColumnIndices.length][m_inputColumnIndices.length];
    final int missingValues =
        getCovarianceMatrix(exec.createSubExecutionContext(0.2), dataTable, m_inputColumnIndices, meanVector, m);
    if (missingValues > 0) {
        if (m_failOnMissingValues.getBooleanValue()) {
            throw new IllegalArgumentException("missing, infinite or impossible values in table");
        }
        setWarningMessage(missingValues + " rows ignored because of missing, infinite or impossible values");
    }
    // Only wrap the raw array once we know execution is going to continue.
    final Matrix covarianceMatrix = new Matrix(m);

    final ExecutionContext evdContext = exec.createSubExecutionContext(0.2);
    evdContext.setMessage("computing spectral decomposition");
    final EigenvalueDecomposition eig = covarianceMatrix.eig();
    exec.checkCanceled();
    evdContext.setProgress(0.8);

    final double[] evs = EigenValue.extractEVVector(eig);
    final int dimensions;
    m_dimSelection.setEigenValues(evs);
    try {
        dimensions = m_dimSelection.getNeededDimensions();
    } finally {
        // don't remember these in case input changes -- also when the lookup fails
        m_dimSelection.setEigenValues(null);
    }
    // adjust to selected numerical columns
    if (dimensions > m_inputColumnIndices.length || dimensions < 1) {
        throw new IllegalArgumentException("invalid number of dimensions to reduce to: " + dimensions);
    }
    exec.checkCanceled();
    evdContext.setProgress(0.9);

    final Matrix eigenvectors = EigenValue.getSortedEigenVectors(eig.getV().getArray(), evs, dimensions);
    exec.checkCanceled();
    evdContext.setProgress(1);

    final DataColumnSpec[] specs = createAddTableSpec(inSpec, dimensions);
    // Produces the projected cells for each input row via convertInputRow.
    final CellFactory fac = new CellFactory() {
        @Override
        public DataCell[] getCells(final DataRow row) {
            return convertInputRow(eigenvectors, row, meanVector, m_inputColumnIndices, dimensions, false);
        }

        @Override
        public DataColumnSpec[] getColumnSpecs() {
            return specs;
        }

        @Override
        public void setProgress(final int curRowNr, final int rowCount, final RowKey lastKey,
            final ExecutionMonitor texec) {
            texec.setProgress(curRowNr / (double) rowCount, "processing " + curRowNr + " of " + rowCount);
        }
    };

    final ColumnRearranger cr = new ColumnRearranger(inSpec);
    cr.append(fac);
    if (m_removeOriginalCols.getBooleanValue()) {
        cr.remove(m_inputColumnIndices);
    }
    final BufferedDataTable result = exec.createColumnRearrangeTable(dataTable, cr, exec.createSubProgress(0.4));

    final PortObject[] out = new PortObject[1];
    out[DATA_OUTPORT] = result;
    return out;
}
Aggregations