Search in sources :

Example 1 with ColumnIndex

use of org.apache.apex.malhar.lib.streamquery.index.ColumnIndex in project apex-malhar by apache.

the class GroupByOperatorTest method testSqlGroupBy.

@SuppressWarnings({ "rawtypes", "unchecked" })
@Test
public void testSqlGroupBy() {
    // create operator
    GroupByHavingOperator oper = new GroupByHavingOperator();
    oper.addColumnGroupByIndex(new ColumnIndex("b", null));
    try {
        oper.addAggregateIndex(new SumFunction("c", null));
    } catch (Exception e) {
        // TODO Auto-generated catch block
        e.printStackTrace();
        return;
    }
    EqualValueCondition condition = new EqualValueCondition();
    condition.addEqualValue("a", 1);
    oper.setCondition(condition);
    CollectorTestSink sink = new CollectorTestSink();
    oper.outport.setSink(sink);
    oper.setup(null);
    oper.beginWindow(1);
    HashMap<String, Object> tuple = new HashMap<String, Object>();
    tuple.put("a", 1);
    tuple.put("b", 1);
    tuple.put("c", 2);
    oper.inport.process(tuple);
    tuple = new HashMap<String, Object>();
    tuple.put("a", 1);
    tuple.put("b", 1);
    tuple.put("c", 4);
    oper.inport.process(tuple);
    tuple = new HashMap<String, Object>();
    tuple.put("a", 1);
    tuple.put("b", 2);
    tuple.put("c", 6);
    oper.inport.process(tuple);
    tuple = new HashMap<String, Object>();
    tuple.put("a", 1);
    tuple.put("b", 2);
    tuple.put("c", 7);
    oper.inport.process(tuple);
    oper.endWindow();
    oper.teardown();
    LOG.debug("{}", sink.collectedTuples);
}
Also used : SumFunction(org.apache.apex.malhar.contrib.misc.streamquery.function.SumFunction) ColumnIndex(org.apache.apex.malhar.lib.streamquery.index.ColumnIndex) EqualValueCondition(org.apache.apex.malhar.contrib.misc.streamquery.condition.EqualValueCondition) HashMap(java.util.HashMap) CollectorTestSink(org.apache.apex.malhar.lib.testbench.CollectorTestSink) Test(org.junit.Test)

Example 2 with ColumnIndex

use of org.apache.apex.malhar.lib.streamquery.index.ColumnIndex in project apex-malhar by apache.

the class InnerJoinOperatorTest method testSqlSelect.

@SuppressWarnings({ "rawtypes", "unchecked" })
@Test
public void testSqlSelect() {
    // create operator
    InnerJoinOperator oper = new InnerJoinOperator();
    CollectorTestSink sink = new CollectorTestSink();
    oper.outport.setSink(sink);
    // set column join condition
    Condition cond = new JoinColumnEqualCondition("a", "a");
    oper.setJoinCondition(cond);
    // add columns
    oper.selectTable1Column(new ColumnIndex("b", null));
    oper.selectTable2Column(new ColumnIndex("c", null));
    oper.setup(null);
    oper.beginWindow(1);
    HashMap<String, Object> tuple = new HashMap<String, Object>();
    tuple.put("a", 0);
    tuple.put("b", 1);
    tuple.put("c", 2);
    oper.inport1.process(tuple);
    tuple = new HashMap<String, Object>();
    tuple.put("a", 1);
    tuple.put("b", 3);
    tuple.put("c", 4);
    oper.inport1.process(tuple);
    tuple = new HashMap<String, Object>();
    tuple.put("a", 0);
    tuple.put("b", 7);
    tuple.put("c", 8);
    oper.inport2.process(tuple);
    tuple = new HashMap<String, Object>();
    tuple.put("a", 1);
    tuple.put("b", 5);
    tuple.put("c", 6);
    oper.inport2.process(tuple);
    oper.endWindow();
    oper.teardown();
    LOG.debug("{}", sink.collectedTuples);
}
Also used : Condition(org.apache.apex.malhar.lib.streamquery.condition.Condition) JoinColumnEqualCondition(org.apache.apex.malhar.lib.streamquery.condition.JoinColumnEqualCondition) ColumnIndex(org.apache.apex.malhar.lib.streamquery.index.ColumnIndex) HashMap(java.util.HashMap) JoinColumnEqualCondition(org.apache.apex.malhar.lib.streamquery.condition.JoinColumnEqualCondition) CollectorTestSink(org.apache.apex.malhar.lib.testbench.CollectorTestSink) Test(org.junit.Test)

Example 3 with ColumnIndex

use of org.apache.apex.malhar.lib.streamquery.index.ColumnIndex in project apex-malhar by apache.

the class GroupByHavingOperator method endWindow.

/**
 * Create aggregate at end window.
 */
@Override
public void endWindow() {
    // group names
    if (columnGroupIndexes.size() == 0) {
        rows = new ArrayList<Map<String, Object>>();
        return;
    }
    // group rows
    HashMap<MultiKeyCompare, ArrayList<Map<String, Object>>> groups = new HashMap<MultiKeyCompare, ArrayList<Map<String, Object>>>();
    for (Map<String, Object> row : rows) {
        MultiKeyCompare key = new MultiKeyCompare();
        for (ColumnIndex index : columnGroupIndexes) {
            key.addCompareKey(row.get(index.getColumn()));
        }
        ArrayList<Map<String, Object>> subRows;
        if (groups.containsKey(key)) {
            subRows = groups.get(key);
        } else {
            subRows = new ArrayList<Map<String, Object>>();
            groups.put(key, subRows);
        }
        subRows.add(row);
    }
    // Iterate over groups and emit aggregate values
    for (Map.Entry<MultiKeyCompare, ArrayList<Map<String, Object>>> entry : groups.entrySet()) {
        ArrayList<Map<String, Object>> subRows = entry.getValue();
        // get result
        Map<String, Object> result = new HashMap<String, Object>();
        for (ColumnIndex index : columnGroupIndexes) {
            index.filter(subRows.get(0), result);
        }
        // append aggregate values
        for (FunctionIndex aggregate : aggregates) {
            try {
                aggregate.filter(subRows, result);
            } catch (Exception e) {
                e.printStackTrace();
            }
        }
        // check valid having aggregate
        boolean isValidHaving = true;
        for (HavingCondition condition : havingConditions) {
            try {
                isValidHaving &= condition.isValidAggregate(subRows);
            } catch (Exception e) {
                e.printStackTrace();
                return;
            }
        }
        if (isValidHaving) {
            outport.emit(result);
        }
    }
    rows = new ArrayList<Map<String, Object>>();
}
Also used : HashMap(java.util.HashMap) ArrayList(java.util.ArrayList) ColumnIndex(org.apache.apex.malhar.lib.streamquery.index.ColumnIndex) FunctionIndex(org.apache.apex.malhar.contrib.misc.streamquery.function.FunctionIndex) HavingCondition(org.apache.apex.malhar.contrib.misc.streamquery.condition.HavingCondition) Map(java.util.Map) HashMap(java.util.HashMap)

Example 4 with ColumnIndex

use of org.apache.apex.malhar.lib.streamquery.index.ColumnIndex in project apex-malhar by apache.

the class BetweenConditionTest method testSqlSelect.

@SuppressWarnings({ "rawtypes", "unchecked" })
@Test
public void testSqlSelect() {
    // create operator
    SelectOperator oper = new SelectOperator();
    oper.addIndex(new ColumnIndex("b", null));
    oper.addIndex(new ColumnIndex("c", null));
    BetweenCondition cond = new BetweenCondition("a", 0, 2);
    oper.setCondition(cond);
    CollectorTestSink sink = new CollectorTestSink();
    oper.outport.setSink(sink);
    oper.setup(null);
    oper.beginWindow(1);
    HashMap<String, Object> tuple = new HashMap<String, Object>();
    tuple.put("a", 0);
    tuple.put("b", 1);
    tuple.put("c", 2);
    oper.inport.process(tuple);
    tuple = new HashMap<String, Object>();
    tuple.put("a", 1);
    tuple.put("b", 3);
    tuple.put("c", 4);
    oper.inport.process(tuple);
    tuple = new HashMap<String, Object>();
    tuple.put("a", 2);
    tuple.put("b", 5);
    tuple.put("c", 6);
    oper.inport.process(tuple);
    tuple = new HashMap<String, Object>();
    tuple.put("a", 3);
    tuple.put("b", 7);
    tuple.put("c", 8);
    oper.inport.process(tuple);
    oper.endWindow();
    oper.teardown();
    LOG.debug("{}", sink.collectedTuples);
}
Also used : SelectOperator(org.apache.apex.malhar.contrib.misc.streamquery.SelectOperator) ColumnIndex(org.apache.apex.malhar.lib.streamquery.index.ColumnIndex) HashMap(java.util.HashMap) BetweenCondition(org.apache.apex.malhar.contrib.misc.streamquery.condition.BetweenCondition) CollectorTestSink(org.apache.apex.malhar.lib.testbench.CollectorTestSink) Test(org.junit.Test)

Example 5 with ColumnIndex

use of org.apache.apex.malhar.lib.streamquery.index.ColumnIndex in project apex-malhar by apache.

the class InConditionTest method testSqlSelect.

@SuppressWarnings({ "rawtypes", "unchecked" })
@Test
public void testSqlSelect() {
    // create operator
    SelectOperator oper = new SelectOperator();
    oper.addIndex(new ColumnIndex("b", null));
    oper.addIndex(new ColumnIndex("c", null));
    InCondition cond = new InCondition("a");
    cond.addInValue(0);
    cond.addInValue(1);
    oper.setCondition(cond);
    CollectorTestSink sink = new CollectorTestSink();
    oper.outport.setSink(sink);
    oper.setup(null);
    oper.beginWindow(1);
    HashMap<String, Object> tuple = new HashMap<String, Object>();
    tuple.put("a", 0);
    tuple.put("b", 1);
    tuple.put("c", 2);
    oper.inport.process(tuple);
    tuple = new HashMap<String, Object>();
    tuple.put("a", 1);
    tuple.put("b", 3);
    tuple.put("c", 4);
    oper.inport.process(tuple);
    tuple = new HashMap<String, Object>();
    tuple.put("a", 2);
    tuple.put("b", 5);
    tuple.put("c", 6);
    oper.inport.process(tuple);
    tuple = new HashMap<String, Object>();
    tuple.put("a", 3);
    tuple.put("b", 7);
    tuple.put("c", 8);
    oper.inport.process(tuple);
    oper.endWindow();
    oper.teardown();
    LOG.debug("{}", sink.collectedTuples);
}
Also used : SelectOperator(org.apache.apex.malhar.contrib.misc.streamquery.SelectOperator) ColumnIndex(org.apache.apex.malhar.lib.streamquery.index.ColumnIndex) HashMap(java.util.HashMap) InCondition(org.apache.apex.malhar.contrib.misc.streamquery.condition.InCondition) CollectorTestSink(org.apache.apex.malhar.lib.testbench.CollectorTestSink) Test(org.junit.Test)

Aggregations

ColumnIndex (org.apache.apex.malhar.lib.streamquery.index.ColumnIndex)15 HashMap (java.util.HashMap)14 CollectorTestSink (org.apache.apex.malhar.lib.testbench.CollectorTestSink)13 Test (org.junit.Test)13 Condition (org.apache.apex.malhar.lib.streamquery.condition.Condition)6 JoinColumnEqualCondition (org.apache.apex.malhar.lib.streamquery.condition.JoinColumnEqualCondition)6 SelectOperator (org.apache.apex.malhar.contrib.misc.streamquery.SelectOperator)5 EqualValueCondition (org.apache.apex.malhar.contrib.misc.streamquery.condition.EqualValueCondition)5 HavingCondition (org.apache.apex.malhar.contrib.misc.streamquery.condition.HavingCondition)2 FunctionIndex (org.apache.apex.malhar.contrib.misc.streamquery.function.FunctionIndex)2 SumFunction (org.apache.apex.malhar.contrib.misc.streamquery.function.SumFunction)2 ArrayList (java.util.ArrayList)1 Map (java.util.Map)1 BetweenCondition (org.apache.apex.malhar.contrib.misc.streamquery.condition.BetweenCondition)1 CompoundCondition (org.apache.apex.malhar.contrib.misc.streamquery.condition.CompoundCondition)1 HavingCompareValue (org.apache.apex.malhar.contrib.misc.streamquery.condition.HavingCompareValue)1 InCondition (org.apache.apex.malhar.contrib.misc.streamquery.condition.InCondition)1 LikeCondition (org.apache.apex.malhar.contrib.misc.streamquery.condition.LikeCondition)1