Search in sources :

Example 71 with RowMeta

use of org.pentaho.di.core.row.RowMeta in project pentaho-kettle by pentaho.

the class DimensionLookup method setDimLookup.

/**
 * table: dimension table keys[]: which dim-fields do we use to look up key? retval: name of the key to return
 * datefield: do we have a datefield? datefrom, dateto: date-range, if any.
 */
private void setDimLookup(RowMetaInterface rowMeta) throws KettleDatabaseException {
    DatabaseMeta databaseMeta = meta.getDatabaseMeta();
    data.lookupRowMeta = new RowMeta();
    /*
     * DEFAULT, SYSDATE, START_TRANS, COLUMN_VALUE :
     *
     * SELECT <tk>, <version>, ... , FROM <table> WHERE key1=keys[1] AND key2=keys[2] ... AND <datefrom> <= <datefield>
     * AND <dateto> > <datefield> ;
     *
     * NULL :
     *
     * SELECT <tk>, <version>, ... , FROM <table> WHERE key1=keys[1] AND key2=keys[2] ... AND ( <datefrom> is null OR
     * <datefrom> <= <datefield> ) AND <dateto> >= <datefield>
     */
    String sql = "SELECT " + databaseMeta.quoteField(meta.getKeyField()) + ", " + databaseMeta.quoteField(meta.getVersionField());
    if (!Utils.isEmpty(meta.getFieldLookup())) {
        for (int i = 0; i < meta.getFieldLookup().length; i++) {
            // Don't retrieve the fields without input
            if (!Utils.isEmpty(meta.getFieldLookup()[i]) && !DimensionLookupMeta.isUpdateTypeWithoutArgument(meta.isUpdate(), meta.getFieldUpdate()[i])) {
                sql += ", " + databaseMeta.quoteField(meta.getFieldLookup()[i]);
                if (!Utils.isEmpty(meta.getFieldStream()[i]) && !meta.getFieldLookup()[i].equals(meta.getFieldStream()[i])) {
                    sql += " AS " + databaseMeta.quoteField(meta.getFieldStream()[i]);
                }
            }
        }
    }
    if (meta.getCacheSize() >= 0) {
        sql += ", " + databaseMeta.quoteField(meta.getDateFrom()) + ", " + databaseMeta.quoteField(meta.getDateTo());
    }
    sql += " FROM " + data.schemaTable + " WHERE ";
    for (int i = 0; i < meta.getKeyLookup().length; i++) {
        if (i != 0) {
            sql += " AND ";
        }
        sql += databaseMeta.quoteField(meta.getKeyLookup()[i]) + " = ? ";
        data.lookupRowMeta.addValueMeta(rowMeta.getValueMeta(data.keynrs[i]));
    }
    String dateFromField = databaseMeta.quoteField(meta.getDateFrom());
    String dateToField = databaseMeta.quoteField(meta.getDateTo());
    if (meta.isUsingStartDateAlternative() && (meta.getStartDateAlternative() == DimensionLookupMeta.START_DATE_ALTERNATIVE_NULL) || (meta.getStartDateAlternative() == DimensionLookupMeta.START_DATE_ALTERNATIVE_COLUMN_VALUE)) {
        // Null as a start date is possible...
        // 
        sql += " AND ( " + dateFromField + " IS NULL OR " + dateFromField + " <= ? )" + Const.CR;
        sql += " AND " + dateToField + " > ?" + Const.CR;
        data.lookupRowMeta.addValueMeta(new ValueMetaDate(meta.getDateFrom()));
        data.lookupRowMeta.addValueMeta(new ValueMetaDate(meta.getDateTo()));
    } else {
        // Null as a start date is NOT possible
        // 
        sql += " AND ? >= " + dateFromField + Const.CR;
        sql += " AND ? < " + dateToField + Const.CR;
        data.lookupRowMeta.addValueMeta(new ValueMetaDate(meta.getDateFrom()));
        data.lookupRowMeta.addValueMeta(new ValueMetaDate(meta.getDateTo()));
    }
    try {
        logDetailed("Dimension Lookup setting preparedStatement to [" + sql + "]");
        data.prepStatementLookup = data.db.getConnection().prepareStatement(databaseMeta.stripCR(sql));
        if (databaseMeta.supportsSetMaxRows()) {
            // alywas get only 1 line back!
            data.prepStatementLookup.setMaxRows(1);
        }
        if (databaseMeta.getDatabaseInterface().isMySQLVariant()) {
            // Make sure to DISABLE Streaming Result sets
            data.prepStatementLookup.setFetchSize(0);
        }
        logDetailed("Finished preparing dimension lookup statement.");
    } catch (SQLException ex) {
        throw new KettleDatabaseException("Unable to prepare dimension lookup", ex);
    }
}
Also used : RowMeta(org.pentaho.di.core.row.RowMeta) SQLException(java.sql.SQLException) KettleDatabaseException(org.pentaho.di.core.exception.KettleDatabaseException) DatabaseMeta(org.pentaho.di.core.database.DatabaseMeta) ValueMetaDate(org.pentaho.di.core.row.value.ValueMetaDate)

Example 72 with RowMeta

use of org.pentaho.di.core.row.RowMeta in project pentaho-kettle by pentaho.

the class DimensionLookup method dimPunchThrough.

// This updates all versions of a dimension entry.
// 
public void dimPunchThrough(RowMetaInterface rowMeta, Object[] row) throws KettleDatabaseException {
    if (data.prepStatementPunchThrough == null) {
        // first time: construct prepared statement
        DatabaseMeta databaseMeta = meta.getDatabaseMeta();
        data.punchThroughRowMeta = new RowMeta();
        /*
       * UPDATE table SET punchv1 = fieldx, ... , last_updated = <now> WHERE keylookup[] = keynrs[] ;
       */
        String sql_upd = "UPDATE " + data.schemaTable + Const.CR;
        sql_upd += "SET ";
        boolean first = true;
        for (int i = 0; i < meta.getFieldLookup().length; i++) {
            if (meta.getFieldUpdate()[i] == DimensionLookupMeta.TYPE_UPDATE_DIM_PUNCHTHROUGH) {
                if (!first) {
                    sql_upd += ", ";
                } else {
                    sql_upd += "  ";
                }
                first = false;
                sql_upd += databaseMeta.quoteField(meta.getFieldLookup()[i]) + " = ?" + Const.CR;
                data.punchThroughRowMeta.addValueMeta(rowMeta.getValueMeta(data.fieldnrs[i]));
            }
        }
        // 
        for (int i = 0; i < meta.getFieldUpdate().length; i++) {
            ValueMetaInterface valueMeta = null;
            switch(meta.getFieldUpdate()[i]) {
                case DimensionLookupMeta.TYPE_UPDATE_DATE_INSUP:
                case DimensionLookupMeta.TYPE_UPDATE_DATE_UPDATED:
                    valueMeta = new ValueMetaDate(meta.getFieldLookup()[i]);
                    break;
                default:
                    break;
            }
            if (valueMeta != null) {
                sql_upd += ", " + databaseMeta.quoteField(valueMeta.getName()) + " = ?" + Const.CR;
                data.punchThroughRowMeta.addValueMeta(valueMeta);
            }
        }
        sql_upd += "WHERE ";
        for (int i = 0; i < meta.getKeyLookup().length; i++) {
            if (i > 0) {
                sql_upd += "AND   ";
            }
            sql_upd += databaseMeta.quoteField(meta.getKeyLookup()[i]) + " = ?" + Const.CR;
            data.punchThroughRowMeta.addValueMeta(rowMeta.getValueMeta(data.keynrs[i]));
        }
        try {
            data.prepStatementPunchThrough = data.db.getConnection().prepareStatement(meta.getDatabaseMeta().stripCR(sql_upd));
        } catch (SQLException ex) {
            throw new KettleDatabaseException("Unable to prepare dimension punchThrough update statement : " + Const.CR + sql_upd, ex);
        }
    }
    Object[] punchThroughRow = new Object[data.punchThroughRowMeta.size()];
    int punchIndex = 0;
    for (int i = 0; i < meta.getFieldLookup().length; i++) {
        if (meta.getFieldUpdate()[i] == DimensionLookupMeta.TYPE_UPDATE_DIM_PUNCHTHROUGH) {
            punchThroughRow[punchIndex++] = row[data.fieldnrs[i]];
        }
    }
    for (int i = 0; i < meta.getFieldUpdate().length; i++) {
        switch(meta.getFieldUpdate()[i]) {
            case DimensionLookupMeta.TYPE_UPDATE_DATE_INSUP:
            case DimensionLookupMeta.TYPE_UPDATE_DATE_UPDATED:
                punchThroughRow[punchIndex++] = new Date();
                break;
            default:
                break;
        }
    }
    for (int i = 0; i < data.keynrs.length; i++) {
        punchThroughRow[punchIndex++] = row[data.keynrs[i]];
    }
    // UPDATE VALUES
    // set values for
    data.db.setValues(data.punchThroughRowMeta, punchThroughRow, data.prepStatementPunchThrough);
    // update
    // do the actual punch through update
    data.db.insertRow(data.prepStatementPunchThrough);
}
Also used : RowMeta(org.pentaho.di.core.row.RowMeta) SQLException(java.sql.SQLException) KettleDatabaseException(org.pentaho.di.core.exception.KettleDatabaseException) DatabaseMeta(org.pentaho.di.core.database.DatabaseMeta) ValueMetaDate(org.pentaho.di.core.row.value.ValueMetaDate) Date(java.util.Date) ValueMetaDate(org.pentaho.di.core.row.value.ValueMetaDate) ValueMetaInterface(org.pentaho.di.core.row.ValueMetaInterface)

Example 73 with RowMeta

use of org.pentaho.di.core.row.RowMeta in project pentaho-kettle by pentaho.

the class DimensionLookup method dimInsert.

/**
 * This inserts new record into dimension Optionally, if the entry already exists, update date range from previous
 * version of the entry.
 */
public Long dimInsert(RowMetaInterface inputRowMeta, Object[] row, Long technicalKey, boolean newEntry, Long versionNr, Date dateFrom, Date dateTo) throws KettleException {
    DatabaseMeta databaseMeta = meta.getDatabaseMeta();
    if (data.prepStatementInsert == null && data.prepStatementUpdate == null) {
        // first time: construct prepared statement
        RowMetaInterface insertRowMeta = new RowMeta();
        /*
       * Construct the SQL statement...
       *
       * INSERT INTO d_customer(keyfield, versionfield, datefrom, dateto, key[], fieldlookup[], last_updated,
       * last_inserted, last_version) VALUES (val_key ,val_version , val_datfrom, val_datto, keynrs[], fieldnrs[],
       * last_updated, last_inserted, last_version) ;
       */
        String sql = "INSERT INTO " + data.schemaTable + "( ";
        if (!isAutoIncrement()) {
            // NO
            sql += databaseMeta.quoteField(meta.getKeyField()) + ", ";
            // AUTOINCREMENT
            // the first return value
            insertRowMeta.addValueMeta(data.outputRowMeta.getValueMeta(inputRowMeta.size()));
        // after the input
        } else {
            if (databaseMeta.needsPlaceHolder()) {
                // placeholder on informix!
                sql += "0, ";
            }
        }
        sql += databaseMeta.quoteField(meta.getVersionField()) + ", " + databaseMeta.quoteField(meta.getDateFrom()) + ", " + databaseMeta.quoteField(meta.getDateTo());
        insertRowMeta.addValueMeta(new ValueMetaInteger(meta.getVersionField()));
        insertRowMeta.addValueMeta(new ValueMetaDate(meta.getDateFrom()));
        insertRowMeta.addValueMeta(new ValueMetaDate(meta.getDateTo()));
        for (int i = 0; i < meta.getKeyLookup().length; i++) {
            sql += ", " + databaseMeta.quoteField(meta.getKeyLookup()[i]);
            insertRowMeta.addValueMeta(inputRowMeta.getValueMeta(data.keynrs[i]));
        }
        for (int i = 0; i < meta.getFieldLookup().length; i++) {
            // 
            if (!DimensionLookupMeta.isUpdateTypeWithoutArgument(meta.isUpdate(), meta.getFieldUpdate()[i])) {
                sql += ", " + databaseMeta.quoteField(meta.getFieldLookup()[i]);
                insertRowMeta.addValueMeta(inputRowMeta.getValueMeta(data.fieldnrs[i]));
            }
        }
        // 
        for (int i = 0; i < meta.getFieldUpdate().length; i++) {
            ValueMetaInterface valueMeta = null;
            switch(meta.getFieldUpdate()[i]) {
                case DimensionLookupMeta.TYPE_UPDATE_DATE_INSUP:
                case DimensionLookupMeta.TYPE_UPDATE_DATE_INSERTED:
                    valueMeta = new ValueMetaDate(meta.getFieldLookup()[i]);
                    break;
                case DimensionLookupMeta.TYPE_UPDATE_LAST_VERSION:
                    valueMeta = new ValueMetaBoolean(meta.getFieldLookup()[i]);
                    break;
                default:
                    break;
            }
            if (valueMeta != null) {
                sql += ", " + databaseMeta.quoteField(valueMeta.getName());
                insertRowMeta.addValueMeta(valueMeta);
            }
        }
        sql += ") VALUES (";
        if (!isAutoIncrement()) {
            sql += "?, ";
        }
        sql += "?, ?, ?";
        for (int i = 0; i < data.keynrs.length; i++) {
            sql += ", ?";
        }
        for (int i = 0; i < meta.getFieldLookup().length; i++) {
            // 
            if (!DimensionLookupMeta.isUpdateTypeWithoutArgument(meta.isUpdate(), meta.getFieldUpdate()[i])) {
                sql += ", ?";
            }
        }
        // 
        for (int i = 0; i < meta.getFieldUpdate().length; i++) {
            switch(meta.getFieldUpdate()[i]) {
                case DimensionLookupMeta.TYPE_UPDATE_DATE_INSUP:
                case DimensionLookupMeta.TYPE_UPDATE_DATE_INSERTED:
                case DimensionLookupMeta.TYPE_UPDATE_LAST_VERSION:
                    sql += ", ?";
                    break;
                default:
                    break;
            }
        }
        sql += " )";
        try {
            if (technicalKey == null && databaseMeta.supportsAutoGeneratedKeys()) {
                logDetailed("SQL w/ return keys=[" + sql + "]");
                data.prepStatementInsert = data.db.getConnection().prepareStatement(databaseMeta.stripCR(sql), Statement.RETURN_GENERATED_KEYS);
            } else {
                logDetailed("SQL=[" + sql + "]");
                data.prepStatementInsert = data.db.getConnection().prepareStatement(databaseMeta.stripCR(sql));
            }
        // pstmt=con.prepareStatement(sql, new String[] { "klant_tk" } );
        } catch (SQLException ex) {
            throw new KettleDatabaseException("Unable to prepare dimension insert :" + Const.CR + sql, ex);
        }
        /*
       * UPDATE d_customer SET dateto = val_datnow, last_updated = <now> last_version = false WHERE keylookup[] =
       * keynrs[] AND versionfield = val_version - 1 ;
       */
        RowMetaInterface updateRowMeta = new RowMeta();
        String sql_upd = "UPDATE " + data.schemaTable + Const.CR;
        // The end of the date range
        // 
        sql_upd += "SET " + databaseMeta.quoteField(meta.getDateTo()) + " = ?" + Const.CR;
        updateRowMeta.addValueMeta(new ValueMetaDate(meta.getDateTo()));
        // 
        for (int i = 0; i < meta.getFieldUpdate().length; i++) {
            ValueMetaInterface valueMeta = null;
            switch(meta.getFieldUpdate()[i]) {
                case DimensionLookupMeta.TYPE_UPDATE_DATE_INSUP:
                case DimensionLookupMeta.TYPE_UPDATE_DATE_UPDATED:
                    valueMeta = new ValueMetaDate(meta.getFieldLookup()[i]);
                    break;
                case DimensionLookupMeta.TYPE_UPDATE_LAST_VERSION:
                    valueMeta = new ValueMetaBoolean(meta.getFieldLookup()[i]);
                    break;
                default:
                    break;
            }
            if (valueMeta != null) {
                sql_upd += ", " + databaseMeta.quoteField(valueMeta.getName()) + " = ?" + Const.CR;
                updateRowMeta.addValueMeta(valueMeta);
            }
        }
        sql_upd += "WHERE ";
        for (int i = 0; i < meta.getKeyLookup().length; i++) {
            if (i > 0) {
                sql_upd += "AND   ";
            }
            sql_upd += databaseMeta.quoteField(meta.getKeyLookup()[i]) + " = ?" + Const.CR;
            updateRowMeta.addValueMeta(inputRowMeta.getValueMeta(data.keynrs[i]));
        }
        sql_upd += "AND   " + databaseMeta.quoteField(meta.getVersionField()) + " = ? ";
        updateRowMeta.addValueMeta(new ValueMetaInteger(meta.getVersionField()));
        try {
            logDetailed("Preparing update: " + Const.CR + sql_upd + Const.CR);
            data.prepStatementUpdate = data.db.getConnection().prepareStatement(databaseMeta.stripCR(sql_upd));
        } catch (SQLException ex) {
            throw new KettleDatabaseException("Unable to prepare dimension update :" + Const.CR + sql_upd, ex);
        }
        data.insertRowMeta = insertRowMeta;
        data.updateRowMeta = updateRowMeta;
    }
    Object[] insertRow = new Object[data.insertRowMeta.size()];
    int insertIndex = 0;
    if (!isAutoIncrement()) {
        insertRow[insertIndex++] = technicalKey;
    }
    // Caller is responsible for setting proper version number depending
    // on if newEntry == true
    insertRow[insertIndex++] = versionNr;
    switch(data.startDateChoice) {
        case DimensionLookupMeta.START_DATE_ALTERNATIVE_NONE:
            insertRow[insertIndex++] = dateFrom;
            break;
        case DimensionLookupMeta.START_DATE_ALTERNATIVE_SYSDATE:
            // use the time the step execution begins as the date from (passed in as dateFrom).
            // before, the current system time was used. this caused an exclusion of the row in the
            // lookup portion of the step that uses this 'valueDate' and not the current time.
            // the result was multiple inserts for what should have been 1 [PDI-4317]
            insertRow[insertIndex++] = dateFrom;
            break;
        case DimensionLookupMeta.START_DATE_ALTERNATIVE_START_OF_TRANS:
            insertRow[insertIndex++] = getTrans().getStartDate();
            break;
        case DimensionLookupMeta.START_DATE_ALTERNATIVE_NULL:
            insertRow[insertIndex++] = null;
            break;
        case DimensionLookupMeta.START_DATE_ALTERNATIVE_COLUMN_VALUE:
            insertRow[insertIndex++] = inputRowMeta.getDate(row, data.startDateFieldIndex);
            break;
        default:
            throw new KettleStepException(BaseMessages.getString(PKG, "DimensionLookup.Exception.IllegalStartDateSelection", Integer.toString(data.startDateChoice)));
    }
    insertRow[insertIndex++] = dateTo;
    for (int i = 0; i < data.keynrs.length; i++) {
        insertRow[insertIndex++] = row[data.keynrs[i]];
    }
    for (int i = 0; i < data.fieldnrs.length; i++) {
        if (data.fieldnrs[i] >= 0) {
            // Ignore last_version, last_updated, etc. These are handled below...
            // 
            insertRow[insertIndex++] = row[data.fieldnrs[i]];
        }
    }
    // 
    for (int i = 0; i < meta.getFieldUpdate().length; i++) {
        switch(meta.getFieldUpdate()[i]) {
            case DimensionLookupMeta.TYPE_UPDATE_DATE_INSUP:
            case DimensionLookupMeta.TYPE_UPDATE_DATE_INSERTED:
                insertRow[insertIndex++] = new Date();
                break;
            case DimensionLookupMeta.TYPE_UPDATE_LAST_VERSION:
                insertRow[insertIndex++] = Boolean.TRUE;
                // Always the last version on insert.
                break;
            default:
                break;
        }
    }
    if (isDebug()) {
        logDebug("rins, size=" + data.insertRowMeta.size() + ", values=" + data.insertRowMeta.getString(insertRow));
    }
    // INSERT NEW VALUE!
    data.db.setValues(data.insertRowMeta, insertRow, data.prepStatementInsert);
    data.db.insertRow(data.prepStatementInsert);
    if (isDebug()) {
        logDebug("Row inserted!");
    }
    if (technicalKey == null && databaseMeta.supportsAutoGeneratedKeys()) {
        try {
            RowMetaAndData keys = data.db.getGeneratedKeys(data.prepStatementInsert);
            if (keys.getRowMeta().size() > 0) {
                technicalKey = keys.getRowMeta().getInteger(keys.getData(), 0);
            } else {
                throw new KettleDatabaseException("Unable to retrieve value of auto-generated technical key : no value found!");
            }
        } catch (Exception e) {
            throw new KettleDatabaseException("Unable to retrieve value of auto-generated technical key : unexpected error: ", e);
        }
    }
    if (!newEntry) {
        // we have to update the previous version in the dimension!
        /*
       * UPDATE d_customer SET dateto = val_datfrom , last_updated = <now> , last_version = false WHERE keylookup[] =
       * keynrs[] AND versionfield = val_version - 1 ;
       */
        Object[] updateRow = new Object[data.updateRowMeta.size()];
        int updateIndex = 0;
        switch(data.startDateChoice) {
            case DimensionLookupMeta.START_DATE_ALTERNATIVE_NONE:
                updateRow[updateIndex++] = dateFrom;
                break;
            case DimensionLookupMeta.START_DATE_ALTERNATIVE_SYSDATE:
                updateRow[updateIndex++] = new Date();
                break;
            case DimensionLookupMeta.START_DATE_ALTERNATIVE_START_OF_TRANS:
                updateRow[updateIndex++] = getTrans().getCurrentDate();
                break;
            case DimensionLookupMeta.START_DATE_ALTERNATIVE_NULL:
                updateRow[updateIndex++] = null;
                break;
            case DimensionLookupMeta.START_DATE_ALTERNATIVE_COLUMN_VALUE:
                updateRow[updateIndex++] = inputRowMeta.getDate(row, data.startDateFieldIndex);
                break;
            default:
                throw new KettleStepException(BaseMessages.getString("DimensionLookup.Exception.IllegalStartDateSelection", Integer.toString(data.startDateChoice)));
        }
        // 
        for (int i = 0; i < meta.getFieldUpdate().length; i++) {
            switch(meta.getFieldUpdate()[i]) {
                case DimensionLookupMeta.TYPE_UPDATE_DATE_INSUP:
                    updateRow[updateIndex++] = new Date();
                    break;
                case DimensionLookupMeta.TYPE_UPDATE_LAST_VERSION:
                    updateRow[updateIndex++] = Boolean.FALSE;
                    // Never the last version on this update
                    break;
                case DimensionLookupMeta.TYPE_UPDATE_DATE_UPDATED:
                    updateRow[updateIndex++] = new Date();
                    break;
                default:
                    break;
            }
        }
        for (int i = 0; i < data.keynrs.length; i++) {
            updateRow[updateIndex++] = row[data.keynrs[i]];
        }
        updateRow[updateIndex++] = versionNr - 1;
        if (isRowLevel()) {
            logRowlevel("UPDATE using rupd=" + data.updateRowMeta.getString(updateRow));
        }
        // UPDATE VALUES
        // set values for update
        // 
        data.db.setValues(data.updateRowMeta, updateRow, data.prepStatementUpdate);
        if (isDebug()) {
            logDebug("Values set for update (" + data.updateRowMeta.size() + ")");
        }
        // do the actual update
        data.db.insertRow(data.prepStatementUpdate);
        if (isDebug()) {
            logDebug("Row updated!");
        }
    }
    return technicalKey;
}
Also used : KettleStepException(org.pentaho.di.core.exception.KettleStepException) RowMeta(org.pentaho.di.core.row.RowMeta) SQLException(java.sql.SQLException) KettleDatabaseException(org.pentaho.di.core.exception.KettleDatabaseException) RowMetaInterface(org.pentaho.di.core.row.RowMetaInterface) ValueMetaBoolean(org.pentaho.di.core.row.value.ValueMetaBoolean) DatabaseMeta(org.pentaho.di.core.database.DatabaseMeta) Date(java.util.Date) ValueMetaDate(org.pentaho.di.core.row.value.ValueMetaDate) KettleException(org.pentaho.di.core.exception.KettleException) KettleDatabaseException(org.pentaho.di.core.exception.KettleDatabaseException) SQLException(java.sql.SQLException) KettleValueException(org.pentaho.di.core.exception.KettleValueException) KettleStepException(org.pentaho.di.core.exception.KettleStepException) ValueMetaInterface(org.pentaho.di.core.row.ValueMetaInterface) RowMetaAndData(org.pentaho.di.core.RowMetaAndData) ValueMetaInteger(org.pentaho.di.core.row.value.ValueMetaInteger) ValueMetaDate(org.pentaho.di.core.row.value.ValueMetaDate)

Example 74 with RowMeta

use of org.pentaho.di.core.row.RowMeta in project pentaho-kettle by pentaho.

the class ExcelInput method processRow.

public boolean processRow(StepMetaInterface smi, StepDataInterface sdi) throws KettleException {
    meta = (ExcelInputMeta) smi;
    data = (ExcelInputData) sdi;
    if (first) {
        first = false;
        // start from scratch!
        data.outputRowMeta = new RowMeta();
        meta.getFields(data.outputRowMeta, getStepname(), null, null, this, repository, metaStore);
        if (meta.isAcceptingFilenames()) {
            // Read the files from the specified input stream...
            data.files.getFiles().clear();
            int idx = -1;
            RowSet rowSet = findInputRowSet(meta.getAcceptingStepName());
            Object[] fileRow = getRowFrom(rowSet);
            while (fileRow != null) {
                if (idx < 0) {
                    idx = rowSet.getRowMeta().indexOfValue(meta.getAcceptingField());
                    if (idx < 0) {
                        logError(BaseMessages.getString(PKG, "ExcelInput.Error.FilenameFieldNotFound", "" + meta.getAcceptingField()));
                        setErrors(1);
                        stopAll();
                        return false;
                    }
                }
                String fileValue = rowSet.getRowMeta().getString(fileRow, idx);
                try {
                    data.files.addFile(KettleVFS.getFileObject(fileValue, getTransMeta()));
                } catch (KettleFileException e) {
                    throw new KettleException(BaseMessages.getString(PKG, "ExcelInput.Exception.CanNotCreateFileObject", fileValue), e);
                }
                // Grab another row
                fileRow = getRowFrom(rowSet);
            }
        }
        handleMissingFiles();
    }
    // We are done processing if the filenr >= number of files.
    if (data.filenr >= data.files.nrOfFiles()) {
        if (log.isDetailed()) {
            logDetailed(BaseMessages.getString(PKG, "ExcelInput.Log.NoMoreFiles", "" + data.filenr));
        }
        // signal end to receiver(s)
        setOutputDone();
        // end of data or error.
        return false;
    }
    // in this case we have to stop a row "earlier", since we start a row number 0 !!!
    if ((meta.getRowLimit() > 0 && data.rownr > meta.getRowLimit()) || (meta.readAllSheets() && meta.getRowLimit() > 0 && data.defaultStartRow == 0 && data.rownr > meta.getRowLimit() - 1) || (!meta.readAllSheets() && meta.getRowLimit() > 0 && data.startRow[data.sheetnr] == 0 && data.rownr > meta.getRowLimit() - 1)) {
        // The close of the openFile is in dispose()
        if (log.isDetailed()) {
            logDetailed(BaseMessages.getString(PKG, "ExcelInput.Log.RowLimitReached", "" + meta.getRowLimit()));
        }
        // signal end to receiver(s)
        setOutputDone();
        // end of data or error.
        return false;
    }
    Object[] r = getRowFromWorkbooks();
    if (r != null) {
        incrementLinesInput();
        // OK, see if we need to repeat values.
        if (data.previousRow != null) {
            for (int i = 0; i < meta.getField().length; i++) {
                ValueMetaInterface valueMeta = data.outputRowMeta.getValueMeta(i);
                Object valueData = r[i];
                if (valueMeta.isNull(valueData) && meta.getField()[i].isRepeated()) {
                    // Take the value from the previous row.
                    r[i] = data.previousRow[i];
                }
            }
        }
        // Remember this row for the next time around!
        data.previousRow = data.outputRowMeta.cloneRow(r);
        // Send out the good news: we found a row of data!
        putRow(data.outputRowMeta, r);
        return true;
    } else {
        // We continue though.
        return true;
    }
}
Also used : KettleException(org.pentaho.di.core.exception.KettleException) KettleFileException(org.pentaho.di.core.exception.KettleFileException) RowMeta(org.pentaho.di.core.row.RowMeta) RowSet(org.pentaho.di.core.RowSet) FileObject(org.apache.commons.vfs2.FileObject) ValueMetaInterface(org.pentaho.di.core.row.ValueMetaInterface)

Example 75 with RowMeta

use of org.pentaho.di.core.row.RowMeta in project pentaho-kettle by pentaho.

the class ExcelInputMeta method getEmptyFields.

public RowMetaInterface getEmptyFields() {
    RowMetaInterface row = new RowMeta();
    if (field != null) {
        for (int i = 0; i < field.length; i++) {
            ValueMetaInterface v;
            try {
                v = ValueMetaFactory.createValueMeta(field[i].getName(), field[i].getType());
            } catch (KettlePluginException e) {
                v = new ValueMetaNone(field[i].getName());
            }
            row.addValueMeta(v);
        }
    }
    return row;
}
Also used : KettlePluginException(org.pentaho.di.core.exception.KettlePluginException) ValueMetaNone(org.pentaho.di.core.row.value.ValueMetaNone) RowMeta(org.pentaho.di.core.row.RowMeta) RowMetaInterface(org.pentaho.di.core.row.RowMetaInterface) ValueMetaInterface(org.pentaho.di.core.row.ValueMetaInterface)

Aggregations

RowMeta (org.pentaho.di.core.row.RowMeta)540 RowMetaInterface (org.pentaho.di.core.row.RowMetaInterface)280 ValueMetaString (org.pentaho.di.core.row.value.ValueMetaString)249 ValueMetaInterface (org.pentaho.di.core.row.ValueMetaInterface)209 Test (org.junit.Test)174 ValueMetaInteger (org.pentaho.di.core.row.value.ValueMetaInteger)135 KettleException (org.pentaho.di.core.exception.KettleException)112 ArrayList (java.util.ArrayList)68 KettleStepException (org.pentaho.di.core.exception.KettleStepException)56 RowMetaAndData (org.pentaho.di.core.RowMetaAndData)52 ValueMetaDate (org.pentaho.di.core.row.value.ValueMetaDate)44 ValueMetaNumber (org.pentaho.di.core.row.value.ValueMetaNumber)41 RowSet (org.pentaho.di.core.RowSet)34 KettleDatabaseException (org.pentaho.di.core.exception.KettleDatabaseException)27 ValueMetaBase (org.pentaho.di.core.row.value.ValueMetaBase)26 SQLException (java.sql.SQLException)24 FileObject (org.apache.commons.vfs2.FileObject)24 ValueMetaBoolean (org.pentaho.di.core.row.value.ValueMetaBoolean)23 StepMeta (org.pentaho.di.trans.step.StepMeta)23 ErrorDialog (org.pentaho.di.ui.core.dialog.ErrorDialog)23