use of org.apache.apex.malhar.lib.streamquery.index.ColumnIndex in project apex-malhar by apache.
the class FullOuterJoinOperatorTest method testSqlSelect.
@SuppressWarnings({ "rawtypes", "unchecked" })
@Test
public void testSqlSelect() {
// create operator
OuterJoinOperator oper = new OuterJoinOperator();
oper.setFullJoin(true);
CollectorTestSink sink = new CollectorTestSink();
oper.outport.setSink(sink);
// set column join condition
Condition cond = new JoinColumnEqualCondition("a", "a");
oper.setJoinCondition(cond);
// add columns
oper.selectTable1Column(new ColumnIndex("b", null));
oper.selectTable2Column(new ColumnIndex("c", null));
oper.setup(null);
oper.beginWindow(1);
HashMap<String, Object> tuple = new HashMap<String, Object>();
tuple.put("a", 0);
tuple.put("b", 1);
tuple.put("c", 2);
oper.inport1.process(tuple);
tuple = new HashMap<String, Object>();
tuple.put("a", 1);
tuple.put("b", 3);
tuple.put("c", 4);
oper.inport1.process(tuple);
tuple = new HashMap<String, Object>();
tuple.put("a", 2);
tuple.put("b", 11);
tuple.put("c", 12);
oper.inport1.process(tuple);
tuple = new HashMap<String, Object>();
tuple.put("a", 0);
tuple.put("b", 7);
tuple.put("c", 8);
oper.inport2.process(tuple);
tuple = new HashMap<String, Object>();
tuple.put("a", 1);
tuple.put("b", 5);
tuple.put("c", 6);
oper.inport2.process(tuple);
oper.endWindow();
oper.teardown();
LOG.debug("{}", sink.collectedTuples);
}
use of org.apache.apex.malhar.lib.streamquery.index.ColumnIndex in project apex-malhar by apache.
the class HavingOperatorTest method testSqlGroupBy.
@SuppressWarnings({ "rawtypes", "unchecked" })
@Test
public void testSqlGroupBy() throws Exception {
// create operator
GroupByHavingOperator oper = new GroupByHavingOperator();
oper.addColumnGroupByIndex(new ColumnIndex("b", null));
FunctionIndex sum = new SumFunction("c", null);
oper.addAggregateIndex(sum);
// create having condition
HavingCondition having = new HavingCompareValue<Double>(sum, 6.0, 0);
oper.addHavingCondition(having);
EqualValueCondition condition = new EqualValueCondition();
condition.addEqualValue("a", 1);
oper.setCondition(condition);
CollectorTestSink sink = new CollectorTestSink();
oper.outport.setSink(sink);
oper.setup(null);
oper.beginWindow(1);
HashMap<String, Object> tuple = new HashMap<String, Object>();
tuple.put("a", 1);
tuple.put("b", 1);
tuple.put("c", 2);
oper.inport.process(tuple);
tuple = new HashMap<String, Object>();
tuple.put("a", 1);
tuple.put("b", 1);
tuple.put("c", 4);
oper.inport.process(tuple);
tuple = new HashMap<String, Object>();
tuple.put("a", 1);
tuple.put("b", 2);
tuple.put("c", 6);
oper.inport.process(tuple);
tuple = new HashMap<String, Object>();
tuple.put("a", 1);
tuple.put("b", 2);
tuple.put("c", 7);
oper.inport.process(tuple);
oper.endWindow();
oper.teardown();
LOG.debug("{}", sink.collectedTuples);
}
use of org.apache.apex.malhar.lib.streamquery.index.ColumnIndex in project apex-malhar by apache.
the class AntiJoinOperatorTest method testSqlSelect.
@Test
public void testSqlSelect() {
// create operator
AntiJoinOperator oper = new AntiJoinOperator();
CollectorTestSink sink = new CollectorTestSink();
TestUtils.setSink(oper.outport, sink);
// set column join condition
Condition cond = new JoinColumnEqualCondition("a", "a");
oper.setJoinCondition(cond);
// add columns
oper.selectTable1Column(new ColumnIndex("b", null));
oper.selectTable1Column(new ColumnIndex("c", null));
oper.setup(null);
HashMap<String, Object> tuple = new HashMap<>();
// test 1, positive result
oper.beginWindow(1);
tuple.put("a", 0);
tuple.put("b", 1);
tuple.put("c", 2);
oper.inport1.process(tuple);
tuple = new HashMap<>();
tuple.put("a", 1);
tuple.put("b", 3);
tuple.put("c", 4);
oper.inport1.process(tuple);
tuple = new HashMap<>();
tuple.put("a", 0);
tuple.put("b", 7);
tuple.put("c", 8);
oper.inport2.process(tuple);
tuple = new HashMap<>();
tuple.put("a", 2);
tuple.put("b", 5);
tuple.put("c", 6);
oper.inport2.process(tuple);
oper.endWindow();
// expected anti-joined result: {b=3, c=4}
Assert.assertEquals("number of anti-join result", 1, sink.collectedTuples.size());
sink.clear();
// test 2, negative result (empty result)
oper.beginWindow(2);
tuple.put("a", 0);
tuple.put("b", 1);
tuple.put("c", 2);
oper.inport1.process(tuple);
tuple = new HashMap<>();
tuple.put("a", 1);
tuple.put("b", 3);
tuple.put("c", 4);
oper.inport1.process(tuple);
tuple = new HashMap<>();
tuple.put("a", 0);
tuple.put("b", 7);
tuple.put("c", 8);
oper.inport2.process(tuple);
tuple = new HashMap<>();
tuple.put("a", 1);
tuple.put("b", 5);
tuple.put("c", 6);
oper.inport2.process(tuple);
oper.endWindow();
oper.teardown();
// expected anti-joined result: []
Assert.assertEquals("number of anti-join result (empty)", 0, sink.collectedTuples.size());
}
use of org.apache.apex.malhar.lib.streamquery.index.ColumnIndex in project apex-malhar by apache.
the class SemiJoinOperatorTest method testSqlSelect.
@Test
public void testSqlSelect() {
// create operator
SemiJoinOperator oper = new SemiJoinOperator();
CollectorTestSink sink = new CollectorTestSink();
TestUtils.setSink(oper.outport, sink);
// set column join condition
Condition cond = new JoinColumnEqualCondition("a", "a");
oper.setJoinCondition(cond);
// add columns (only columns from the left table)
oper.selectTable1Column(new ColumnIndex("b", null));
oper.selectTable1Column(new ColumnIndex("c", null));
oper.setup(null);
HashMap<String, Object> tuple = new HashMap<>();
/**
* test 1, positive result
*
* table1 table2
* ====== ======
* a b c a e f
* ------------- -----------
* 0 1 2 0 7 8
* 1 3 4 2 5 6
* 0 6 8
*
* select b, c
* from table1 semi-join table2
* where table1.a = table2.a
*
* result:
*
* b c
* -------------
* 1 2
* 6 8
*/
oper.beginWindow(1);
tuple.put("a", 0);
tuple.put("b", 1);
tuple.put("c", 2);
oper.inport1.process(tuple);
tuple = new HashMap<>();
tuple.put("a", 1);
tuple.put("b", 3);
tuple.put("c", 4);
oper.inport1.process(tuple);
tuple = new HashMap<>();
tuple.put("a", 0);
tuple.put("b", 6);
tuple.put("c", 8);
oper.inport1.process(tuple);
tuple = new HashMap<>();
tuple.put("a", 0);
tuple.put("e", 7);
tuple.put("f", 8);
oper.inport2.process(tuple);
tuple = new HashMap<>();
tuple.put("a", 2);
tuple.put("e", 5);
tuple.put("f", 6);
oper.inport2.process(tuple);
oper.endWindow();
// expected semi-joined result: {1,2}, {6, 8} (two rows)
Assert.assertEquals("number of semi-join result", 2, sink.collectedTuples.size());
sink.clear();
/**
* test 2, negative result (empty result)
*
* table1 table2
* ====== ======
* a b c a e f
* ------------- -----------
* 1 1 2 0 7 8
* 1 3 4 2 5 6
* 3 6 8
*
* select b, c
* from table1 semi-join table2
* where table1.a = table2.a
*
* result:
*
* b c
* -------------
*
* (0 row)
*/
oper.beginWindow(2);
tuple.put("a", 1);
tuple.put("b", 1);
tuple.put("c", 2);
oper.inport1.process(tuple);
tuple = new HashMap<>();
tuple.put("a", 1);
tuple.put("b", 3);
tuple.put("c", 4);
oper.inport1.process(tuple);
tuple = new HashMap<>();
tuple.put("a", 3);
tuple.put("b", 6);
tuple.put("c", 8);
oper.inport1.process(tuple);
tuple = new HashMap<>();
tuple.put("a", 0);
tuple.put("e", 7);
tuple.put("f", 8);
oper.inport2.process(tuple);
tuple = new HashMap<>();
tuple.put("a", 2);
tuple.put("e", 5);
tuple.put("f", 6);
oper.inport2.process(tuple);
oper.endWindow();
oper.teardown();
// expected semi-joined result: [] (empty)
Assert.assertEquals("number of semi-join result (empty)", 0, sink.collectedTuples.size());
}
use of org.apache.apex.malhar.lib.streamquery.index.ColumnIndex in project apex-malhar by apache.
the class Application method getFilteredMessagesOperator.
private SelectOperator getFilteredMessagesOperator(String name, DAG dag) {
SelectOperator oper = dag.addOperator(name, new SelectOperator());
oper.addIndex(new ColumnIndex(APACHE_KEYS.host.value, null));
oper.addIndex(new ColumnIndex(APACHE_KEYS.request.value, null));
oper.addIndex(new ColumnIndex(APACHE_KEYS.response.value, null));
EqualValueCondition condition = new EqualValueCondition();
condition.addEqualValue(APACHE_KEYS.response.value, "404");
oper.setCondition(condition);
return oper;
}
Aggregations