Search in sources :

Example 11 with ColumnIndex

use of org.apache.apex.malhar.lib.streamquery.index.ColumnIndex in project apex-malhar by apache.

the class FullOuterJoinOperatorTest method testSqlSelect.

@SuppressWarnings({ "rawtypes", "unchecked" })
@Test
public void testSqlSelect() {
    // create operator
    OuterJoinOperator oper = new OuterJoinOperator();
    oper.setFullJoin(true);
    CollectorTestSink sink = new CollectorTestSink();
    oper.outport.setSink(sink);
    // set column join condition
    Condition cond = new JoinColumnEqualCondition("a", "a");
    oper.setJoinCondition(cond);
    // add columns
    oper.selectTable1Column(new ColumnIndex("b", null));
    oper.selectTable2Column(new ColumnIndex("c", null));
    oper.setup(null);
    oper.beginWindow(1);
    HashMap<String, Object> tuple = new HashMap<String, Object>();
    tuple.put("a", 0);
    tuple.put("b", 1);
    tuple.put("c", 2);
    oper.inport1.process(tuple);
    tuple = new HashMap<String, Object>();
    tuple.put("a", 1);
    tuple.put("b", 3);
    tuple.put("c", 4);
    oper.inport1.process(tuple);
    tuple = new HashMap<String, Object>();
    tuple.put("a", 2);
    tuple.put("b", 11);
    tuple.put("c", 12);
    oper.inport1.process(tuple);
    tuple = new HashMap<String, Object>();
    tuple.put("a", 0);
    tuple.put("b", 7);
    tuple.put("c", 8);
    oper.inport2.process(tuple);
    tuple = new HashMap<String, Object>();
    tuple.put("a", 1);
    tuple.put("b", 5);
    tuple.put("c", 6);
    oper.inport2.process(tuple);
    oper.endWindow();
    oper.teardown();
    LOG.debug("{}", sink.collectedTuples);
}
Also used : Condition(org.apache.apex.malhar.lib.streamquery.condition.Condition) JoinColumnEqualCondition(org.apache.apex.malhar.lib.streamquery.condition.JoinColumnEqualCondition) ColumnIndex(org.apache.apex.malhar.lib.streamquery.index.ColumnIndex) HashMap(java.util.HashMap) JoinColumnEqualCondition(org.apache.apex.malhar.lib.streamquery.condition.JoinColumnEqualCondition) CollectorTestSink(org.apache.apex.malhar.lib.testbench.CollectorTestSink) Test(org.junit.Test)

Example 12 with ColumnIndex

use of org.apache.apex.malhar.lib.streamquery.index.ColumnIndex in project apex-malhar by apache.

the class HavingOperatorTest method testSqlGroupBy.

@SuppressWarnings({ "rawtypes", "unchecked" })
@Test
public void testSqlGroupBy() throws Exception {
    // create operator
    GroupByHavingOperator oper = new GroupByHavingOperator();
    oper.addColumnGroupByIndex(new ColumnIndex("b", null));
    FunctionIndex sum = new SumFunction("c", null);
    oper.addAggregateIndex(sum);
    // create having condition
    HavingCondition having = new HavingCompareValue<Double>(sum, 6.0, 0);
    oper.addHavingCondition(having);
    EqualValueCondition condition = new EqualValueCondition();
    condition.addEqualValue("a", 1);
    oper.setCondition(condition);
    CollectorTestSink sink = new CollectorTestSink();
    oper.outport.setSink(sink);
    oper.setup(null);
    oper.beginWindow(1);
    HashMap<String, Object> tuple = new HashMap<String, Object>();
    tuple.put("a", 1);
    tuple.put("b", 1);
    tuple.put("c", 2);
    oper.inport.process(tuple);
    tuple = new HashMap<String, Object>();
    tuple.put("a", 1);
    tuple.put("b", 1);
    tuple.put("c", 4);
    oper.inport.process(tuple);
    tuple = new HashMap<String, Object>();
    tuple.put("a", 1);
    tuple.put("b", 2);
    tuple.put("c", 6);
    oper.inport.process(tuple);
    tuple = new HashMap<String, Object>();
    tuple.put("a", 1);
    tuple.put("b", 2);
    tuple.put("c", 7);
    oper.inport.process(tuple);
    oper.endWindow();
    oper.teardown();
    LOG.debug("{}", sink.collectedTuples);
}
Also used : SumFunction(org.apache.apex.malhar.contrib.misc.streamquery.function.SumFunction) ColumnIndex(org.apache.apex.malhar.lib.streamquery.index.ColumnIndex) EqualValueCondition(org.apache.apex.malhar.contrib.misc.streamquery.condition.EqualValueCondition) FunctionIndex(org.apache.apex.malhar.contrib.misc.streamquery.function.FunctionIndex) HashMap(java.util.HashMap) HavingCondition(org.apache.apex.malhar.contrib.misc.streamquery.condition.HavingCondition) HavingCompareValue(org.apache.apex.malhar.contrib.misc.streamquery.condition.HavingCompareValue) CollectorTestSink(org.apache.apex.malhar.lib.testbench.CollectorTestSink) Test(org.junit.Test)

Example 13 with ColumnIndex

use of org.apache.apex.malhar.lib.streamquery.index.ColumnIndex in project apex-malhar by apache.

the class AntiJoinOperatorTest method testSqlSelect.

@Test
public void testSqlSelect() {
    // create operator
    AntiJoinOperator oper = new AntiJoinOperator();
    CollectorTestSink sink = new CollectorTestSink();
    TestUtils.setSink(oper.outport, sink);
    // set column join condition
    Condition cond = new JoinColumnEqualCondition("a", "a");
    oper.setJoinCondition(cond);
    // add columns
    oper.selectTable1Column(new ColumnIndex("b", null));
    oper.selectTable1Column(new ColumnIndex("c", null));
    oper.setup(null);
    HashMap<String, Object> tuple = new HashMap<>();
    // test 1, positive result
    oper.beginWindow(1);
    tuple.put("a", 0);
    tuple.put("b", 1);
    tuple.put("c", 2);
    oper.inport1.process(tuple);
    tuple = new HashMap<>();
    tuple.put("a", 1);
    tuple.put("b", 3);
    tuple.put("c", 4);
    oper.inport1.process(tuple);
    tuple = new HashMap<>();
    tuple.put("a", 0);
    tuple.put("b", 7);
    tuple.put("c", 8);
    oper.inport2.process(tuple);
    tuple = new HashMap<>();
    tuple.put("a", 2);
    tuple.put("b", 5);
    tuple.put("c", 6);
    oper.inport2.process(tuple);
    oper.endWindow();
    // expected anti-joined result: {b=3, c=4}
    Assert.assertEquals("number of anti-join result", 1, sink.collectedTuples.size());
    sink.clear();
    // test 2, negative result (empty result)
    oper.beginWindow(2);
    tuple.put("a", 0);
    tuple.put("b", 1);
    tuple.put("c", 2);
    oper.inport1.process(tuple);
    tuple = new HashMap<>();
    tuple.put("a", 1);
    tuple.put("b", 3);
    tuple.put("c", 4);
    oper.inport1.process(tuple);
    tuple = new HashMap<>();
    tuple.put("a", 0);
    tuple.put("b", 7);
    tuple.put("c", 8);
    oper.inport2.process(tuple);
    tuple = new HashMap<>();
    tuple.put("a", 1);
    tuple.put("b", 5);
    tuple.put("c", 6);
    oper.inport2.process(tuple);
    oper.endWindow();
    oper.teardown();
    // expected anti-joined result: []
    Assert.assertEquals("number of anti-join result (empty)", 0, sink.collectedTuples.size());
}
Also used : Condition(org.apache.apex.malhar.lib.streamquery.condition.Condition) JoinColumnEqualCondition(org.apache.apex.malhar.lib.streamquery.condition.JoinColumnEqualCondition) ColumnIndex(org.apache.apex.malhar.lib.streamquery.index.ColumnIndex) HashMap(java.util.HashMap) JoinColumnEqualCondition(org.apache.apex.malhar.lib.streamquery.condition.JoinColumnEqualCondition) CollectorTestSink(org.apache.apex.malhar.lib.testbench.CollectorTestSink) Test(org.junit.Test)

Example 14 with ColumnIndex

use of org.apache.apex.malhar.lib.streamquery.index.ColumnIndex in project apex-malhar by apache.

the class SemiJoinOperatorTest method testSqlSelect.

@Test
public void testSqlSelect() {
    // create operator
    SemiJoinOperator oper = new SemiJoinOperator();
    CollectorTestSink sink = new CollectorTestSink();
    TestUtils.setSink(oper.outport, sink);
    // set column join condition
    Condition cond = new JoinColumnEqualCondition("a", "a");
    oper.setJoinCondition(cond);
    // add columns (only columns from the left table)
    oper.selectTable1Column(new ColumnIndex("b", null));
    oper.selectTable1Column(new ColumnIndex("c", null));
    oper.setup(null);
    HashMap<String, Object> tuple = new HashMap<>();
    /**
     * test 1, positive result
     *
     * table1                      table2
     * ======                      ======
     *    a     b    c             a    e    f
     *    -------------            -----------
     *    0     1    2             0    7    8
     *    1     3    4             2    5    6
     *    0     6    8
     *
     * select b, c
     * from   table1 semi-join table2
     * where  table1.a = table2.a
     *
     * result:
     *
     *         b    c
     *    -------------
     *         1    2
     *         6    8
     */
    oper.beginWindow(1);
    tuple.put("a", 0);
    tuple.put("b", 1);
    tuple.put("c", 2);
    oper.inport1.process(tuple);
    tuple = new HashMap<>();
    tuple.put("a", 1);
    tuple.put("b", 3);
    tuple.put("c", 4);
    oper.inport1.process(tuple);
    tuple = new HashMap<>();
    tuple.put("a", 0);
    tuple.put("b", 6);
    tuple.put("c", 8);
    oper.inport1.process(tuple);
    tuple = new HashMap<>();
    tuple.put("a", 0);
    tuple.put("e", 7);
    tuple.put("f", 8);
    oper.inport2.process(tuple);
    tuple = new HashMap<>();
    tuple.put("a", 2);
    tuple.put("e", 5);
    tuple.put("f", 6);
    oper.inport2.process(tuple);
    oper.endWindow();
    // expected semi-joined result: {1,2}, {6, 8} (two rows)
    Assert.assertEquals("number of semi-join result", 2, sink.collectedTuples.size());
    sink.clear();
    /**
     * test 2, negative result (empty result)
     *
     * table1                      table2
     * ======                      ======
     *    a     b    c             a    e    f
     *    -------------            -----------
     *    1     1    2             0    7    8
     *    1     3    4             2    5    6
     *    3     6    8
     *
     * select b, c
     * from   table1 semi-join table2
     * where  table1.a = table2.a
     *
     * result:
     *
     *         b    c
     *    -------------
     *
     *    (0 row)
     */
    oper.beginWindow(2);
    tuple.put("a", 1);
    tuple.put("b", 1);
    tuple.put("c", 2);
    oper.inport1.process(tuple);
    tuple = new HashMap<>();
    tuple.put("a", 1);
    tuple.put("b", 3);
    tuple.put("c", 4);
    oper.inport1.process(tuple);
    tuple = new HashMap<>();
    tuple.put("a", 3);
    tuple.put("b", 6);
    tuple.put("c", 8);
    oper.inport1.process(tuple);
    tuple = new HashMap<>();
    tuple.put("a", 0);
    tuple.put("e", 7);
    tuple.put("f", 8);
    oper.inport2.process(tuple);
    tuple = new HashMap<>();
    tuple.put("a", 2);
    tuple.put("e", 5);
    tuple.put("f", 6);
    oper.inport2.process(tuple);
    oper.endWindow();
    oper.teardown();
    // expected semi-joined result: [] (empty)
    Assert.assertEquals("number of semi-join result (empty)", 0, sink.collectedTuples.size());
}
Also used : Condition(org.apache.apex.malhar.lib.streamquery.condition.Condition) JoinColumnEqualCondition(org.apache.apex.malhar.lib.streamquery.condition.JoinColumnEqualCondition) ColumnIndex(org.apache.apex.malhar.lib.streamquery.index.ColumnIndex) HashMap(java.util.HashMap) JoinColumnEqualCondition(org.apache.apex.malhar.lib.streamquery.condition.JoinColumnEqualCondition) CollectorTestSink(org.apache.apex.malhar.lib.testbench.CollectorTestSink) Test(org.junit.Test)

Example 15 with ColumnIndex

use of org.apache.apex.malhar.lib.streamquery.index.ColumnIndex in project apex-malhar by apache.

the class Application method getFilteredMessagesOperator.

private SelectOperator getFilteredMessagesOperator(String name, DAG dag) {
    SelectOperator oper = dag.addOperator(name, new SelectOperator());
    oper.addIndex(new ColumnIndex(APACHE_KEYS.host.value, null));
    oper.addIndex(new ColumnIndex(APACHE_KEYS.request.value, null));
    oper.addIndex(new ColumnIndex(APACHE_KEYS.response.value, null));
    EqualValueCondition condition = new EqualValueCondition();
    condition.addEqualValue(APACHE_KEYS.response.value, "404");
    oper.setCondition(condition);
    return oper;
}
Also used : SelectOperator(org.apache.apex.malhar.contrib.misc.streamquery.SelectOperator) ColumnIndex(org.apache.apex.malhar.lib.streamquery.index.ColumnIndex) EqualValueCondition(org.apache.apex.malhar.contrib.misc.streamquery.condition.EqualValueCondition)

Aggregations

ColumnIndex (org.apache.apex.malhar.lib.streamquery.index.ColumnIndex)15 HashMap (java.util.HashMap)14 CollectorTestSink (org.apache.apex.malhar.lib.testbench.CollectorTestSink)13 Test (org.junit.Test)13 Condition (org.apache.apex.malhar.lib.streamquery.condition.Condition)6 JoinColumnEqualCondition (org.apache.apex.malhar.lib.streamquery.condition.JoinColumnEqualCondition)6 SelectOperator (org.apache.apex.malhar.contrib.misc.streamquery.SelectOperator)5 EqualValueCondition (org.apache.apex.malhar.contrib.misc.streamquery.condition.EqualValueCondition)5 HavingCondition (org.apache.apex.malhar.contrib.misc.streamquery.condition.HavingCondition)2 FunctionIndex (org.apache.apex.malhar.contrib.misc.streamquery.function.FunctionIndex)2 SumFunction (org.apache.apex.malhar.contrib.misc.streamquery.function.SumFunction)2 ArrayList (java.util.ArrayList)1 Map (java.util.Map)1 BetweenCondition (org.apache.apex.malhar.contrib.misc.streamquery.condition.BetweenCondition)1 CompoundCondition (org.apache.apex.malhar.contrib.misc.streamquery.condition.CompoundCondition)1 HavingCompareValue (org.apache.apex.malhar.contrib.misc.streamquery.condition.HavingCompareValue)1 InCondition (org.apache.apex.malhar.contrib.misc.streamquery.condition.InCondition)1 LikeCondition (org.apache.apex.malhar.contrib.misc.streamquery.condition.LikeCondition)1