Search in sources :

Example 1 with PMMLDiscretize

use of org.knime.core.util.binning.auto.pmml.PMMLDiscretize in project knime-core by knime.

the class AutoBinnerUtility method createDisretizeOp.

/**
 * Assembles the discretize preprocessing operation for the given columns.
 * <p>
 * Every entry of {@code includeCols} gets an output column name: the column's own name when
 * {@code settings.getReplaceColumn()} is {@code true}, otherwise the name with {@code " [Binned]"} appended.
 * Each output name is mapped to a {@link PMMLDiscretize} that refers to the source column and carries the
 * bins {@code createBins} returned for that column.
 *
 * @param settings settings handed to {@code createBins} and queried for the replace-column flag
 * @param edgesMap passed through to {@code createBins}
 * @param includeCols names of the columns to process; output names are collected in this order
 * @return a {@link PMMLPreprocDiscretize} wrapping the assembled {@link DisretizeConfiguration}
 */
private static PMMLPreprocDiscretize createDisretizeOp(final AutoBinnerLearnSettings settings, final Map<String, double[]> edgesMap, final String[] includeCols) {
    final Map<String, List<PMMLDiscretizeBin>> binsPerColumn = createBins(settings, edgesMap, includeCols);
    final Map<String, PMMLDiscretize> opsByOutputName = new HashMap<>();
    final List<String> outputNames = new ArrayList<>();
    for (final String sourceColumn : includeCols) {
        final String outputName;
        if (settings.getReplaceColumn()) {
            // Replacing in place: the binned column keeps the source column's name.
            outputName = sourceColumn;
        } else {
            outputName = sourceColumn + " [Binned]";
        }
        outputNames.add(outputName);
        opsByOutputName.put(outputName, new PMMLDiscretize(sourceColumn, binsPerColumn.get(sourceColumn)));
    }
    return new PMMLPreprocDiscretize(new DisretizeConfiguration(outputNames, opsByOutputName));
}
Also used : HashMap(java.util.HashMap) LinkedHashMap(java.util.LinkedHashMap) DisretizeConfiguration(org.knime.core.util.binning.auto.pmml.DisretizeConfiguration) ArrayList(java.util.ArrayList) PMMLDiscretize(org.knime.core.util.binning.auto.pmml.PMMLDiscretize) LinkedList(java.util.LinkedList) List(java.util.List) PMMLPreprocDiscretize(org.knime.core.util.binning.auto.pmml.PMMLPreprocDiscretize)

Example 2 with PMMLDiscretize

use of org.knime.core.util.binning.auto.pmml.PMMLDiscretize in project knime-core by knime.

the class AutoBinnerUtility method translate.

/**
 * Translates a {@link PMMLPreprocDiscretize} object into a {@link PMMLPortObject}.
 * <p>
 * For every name listed in the discretize configuration, the associated bins are converted with
 * {@code getNumericBin} and stored under the original column name ({@link PMMLDiscretize#getField()}).
 * The original column is additionally mapped to the configured name, or to {@code null} when both names
 * are equal. Both maps are then used to build a {@link PMMLBinningTranslator} whose exported
 * transformation dictionary is added to the returned port object.
 *
 * @param pmmlDiscretize the {@link PMMLPreprocDiscretize} object to translate
 * @param dataTableSpec the {@link DataTableSpec} of the incoming {@link BufferedDataTable}
 * @return a {@link PMMLPortObject} containing the required parameters for the binning operation
 */
public static PMMLPortObject translate(final PMMLPreprocDiscretize pmmlDiscretize, final DataTableSpec dataTableSpec) {
    final Map<String, Bin[]> binsBySource = new HashMap<>();
    final Map<String, String> appendNameBySource = new HashMap<>();
    for (final String outputName : pmmlDiscretize.getConfiguration().getNames()) {
        final PMMLDiscretize op = pmmlDiscretize.getConfiguration().getDiscretize(outputName);
        final List<PMMLDiscretizeBin> pmmlBins = op.getBins();
        final String sourceName = op.getField();

        // A null entry records that the output name is identical to the source column name.
        String appendName = null;
        if (!outputName.equals(sourceName)) {
            appendName = outputName;
        }
        appendNameBySource.put(sourceName, appendName);

        final NumericBin[] converted = pmmlBins.stream()
            .map(AutoBinnerUtility::getNumericBin)
            .toArray(size -> new NumericBin[size]);
        binsBySource.put(sourceName, converted);
    }

    final DataTableSpec extendedSpec = createNewDataTableSpec(dataTableSpec, appendNameBySource);
    final PMMLPortObjectSpecCreator specCreator = new PMMLPortObjectSpecCreator(extendedSpec);
    final PMMLPortObject result = new PMMLPortObject(specCreator.createSpec(), null, extendedSpec);

    final DerivedFieldMapper fieldMapper = new DerivedFieldMapper(result);
    final PMMLBinningTranslator translator = new PMMLBinningTranslator(binsBySource, appendNameBySource, fieldMapper);
    final TransformationDictionary dictionary = translator.exportToTransDict();
    result.addGlobalTransformations(dictionary);
    return result;
}
Also used : NumericBin(org.knime.core.util.binning.numeric.NumericBin) DataTableSpec(org.knime.core.data.DataTableSpec) HashMap(java.util.HashMap) LinkedHashMap(java.util.LinkedHashMap) TransformationDictionary(org.dmg.pmml.TransformationDictionaryDocument.TransformationDictionary) PMMLDiscretizeBin(org.knime.core.util.binning.auto.pmml.PMMLDiscretizeBin) DerivedFieldMapper(org.knime.core.node.port.pmml.preproc.DerivedFieldMapper) PMMLPortObject(org.knime.core.node.port.pmml.PMMLPortObject) PMMLBinningTranslator(org.knime.core.util.binning.numeric.PMMLBinningTranslator) PMMLDiscretize(org.knime.core.util.binning.auto.pmml.PMMLDiscretize) PMMLPortObjectSpecCreator(org.knime.core.node.port.pmml.PMMLPortObjectSpecCreator)

Aggregations

HashMap (java.util.HashMap)2 LinkedHashMap (java.util.LinkedHashMap)2 PMMLDiscretize (org.knime.core.util.binning.auto.pmml.PMMLDiscretize)2 ArrayList (java.util.ArrayList)1 LinkedList (java.util.LinkedList)1 List (java.util.List)1 TransformationDictionary (org.dmg.pmml.TransformationDictionaryDocument.TransformationDictionary)1 DataTableSpec (org.knime.core.data.DataTableSpec)1 PMMLPortObject (org.knime.core.node.port.pmml.PMMLPortObject)1 PMMLPortObjectSpecCreator (org.knime.core.node.port.pmml.PMMLPortObjectSpecCreator)1 DerivedFieldMapper (org.knime.core.node.port.pmml.preproc.DerivedFieldMapper)1 DisretizeConfiguration (org.knime.core.util.binning.auto.pmml.DisretizeConfiguration)1 PMMLDiscretizeBin (org.knime.core.util.binning.auto.pmml.PMMLDiscretizeBin)1 PMMLPreprocDiscretize (org.knime.core.util.binning.auto.pmml.PMMLPreprocDiscretize)1 NumericBin (org.knime.core.util.binning.numeric.NumericBin)1 PMMLBinningTranslator (org.knime.core.util.binning.numeric.PMMLBinningTranslator)1