Search in sources :

Example 6 with Event

use of org.apache.flink.cep.Event in project flink by apache.

the class CEPOperatorTest method testKeyedCEPOperatorCheckpointing.

/**
 * Runs a keyed CEP operator through two snapshot/restore cycles and checks that, after the
 * final restore, exactly one start/middle/end match followed by the closing watermark is emitted.
 */
@Test
public void testKeyedCEPOperatorCheckpointing() throws Exception {
    final Event begin = new Event(42, "start", 1.0);
    final SubEvent middle = new SubEvent(42, "foo", 1.0, 10.0);
    final Event finish = new Event(42, "end", 1.0);

    // --- first life cycle: feed two elements, then snapshot while they are still pending
    final OneInputStreamOperatorTestHarness<Event, Map<String, Event>> firstHarness = getCepTestHarness(false);
    firstHarness.open();
    firstHarness.processElement(new StreamRecord<>(begin, 1L));
    firstHarness.processElement(new StreamRecord<>(new Event(42, "foobar", 1.0), 2L));
    final OperatorStateHandles firstSnapshot = firstHarness.snapshot(0L, 0L);
    firstHarness.close();

    // --- second life cycle: restore from the first snapshot and keep feeding
    final OneInputStreamOperatorTestHarness<Event, Map<String, Event>> secondHarness = getCepTestHarness(false);
    secondHarness.setup();
    secondHarness.initializeState(firstSnapshot);
    secondHarness.open();
    secondHarness.processWatermark(new Watermark(Long.MIN_VALUE));
    secondHarness.processElement(new StreamRecord<Event>(new SubEvent(42, "barfoo", 1.0, 5.0), 3L));
    // a wrongly checkpointed/restored element timestamp would surface here as a
    // pruning time underflow exception in the NFA
    secondHarness.processWatermark(new Watermark(2L));
    secondHarness.processElement(new StreamRecord<Event>(middle, 3L));
    secondHarness.processElement(new StreamRecord<>(new Event(42, "start", 1.0), 4L));
    secondHarness.processElement(new StreamRecord<>(finish, 5L));
    // second snapshot, taken after the middle/start/end elements were handed to the operator
    final OperatorStateHandles secondSnapshot = secondHarness.snapshot(1L, 1L);
    secondHarness.close();

    // --- third life cycle: restore from the second snapshot and flush everything
    final OneInputStreamOperatorTestHarness<Event, Map<String, Event>> thirdHarness = getCepTestHarness(false);
    thirdHarness.setup();
    thirdHarness.initializeState(secondSnapshot);
    thirdHarness.open();
    thirdHarness.processWatermark(new Watermark(Long.MAX_VALUE));

    // the output must hold the single match and then the final watermark
    final Queue<Object> emitted = thirdHarness.getOutput();
    assertEquals(2, emitted.size());
    verifyPattern(emitted.poll(), begin, middle, finish);
    verifyWatermark(emitted.poll(), Long.MAX_VALUE);
    thirdHarness.close();
}
Also used : SubEvent(org.apache.flink.cep.SubEvent) OperatorStateHandles(org.apache.flink.streaming.runtime.tasks.OperatorStateHandles) Event(org.apache.flink.cep.Event) SubEvent(org.apache.flink.cep.SubEvent) HashMap(java.util.HashMap) Map(java.util.Map) Watermark(org.apache.flink.streaming.api.watermark.Watermark) Test(org.junit.Test)

Example 7 with Event

use of org.apache.flink.cep.Event in project flink by apache.

the class CEPOperatorTest method testKeyedAdvancingTimeWithoutElements.

/**
 * Checks that watermarks alone move the internal time of a CEP operator forward: after a single
 * start element and two watermarks, the output must be the first watermark, a {@code Left}
 * record carrying the partial match together with the second watermark's timestamp, and then
 * the second watermark. See FLINK-5033.
 */
@Test
public void testKeyedAdvancingTimeWithoutElements() throws Exception {
    final long firstWatermarkTs = 5L;
    final long secondWatermarkTs = 13L;
    final KeySelector<Event, Integer> selector = new TestKeySelector();
    final Event begin = new Event(42, "start", 1.0);

    // the only event that should appear in the Left-side result
    final Map<String, Event> expectedPartialMatch = new HashMap<>(2);
    expectedPartialMatch.put("start", begin);

    OneInputStreamOperatorTestHarness<Event, Either<Tuple2<Map<String, Event>, Long>, Map<String, Event>>> harness =
        new KeyedOneInputStreamOperatorTestHarness<>(
            new TimeoutKeyedCEPPatternOperator<>(
                Event.createTypeSerializer(), false, selector, IntSerializer.INSTANCE, new NFAFactory(true), true),
            selector,
            BasicTypeInfo.INT_TYPE_INFO);
    try {
        harness.setup(new KryoSerializer<>((Class<Either<Tuple2<Map<String, Event>, Long>, Map<String, Event>>>) (Object) Either.class, new ExecutionConfig()));
        harness.open();

        // one element, then nothing but watermarks
        harness.processElement(new StreamRecord<>(begin, 3L));
        harness.processWatermark(new Watermark(firstWatermarkTs));
        harness.processWatermark(new Watermark(secondWatermarkTs));

        Queue<Object> emitted = harness.getOutput();
        assertEquals(3L, emitted.size());
        final Object first = emitted.poll();
        final Object second = emitted.poll();
        final Object third = emitted.poll();

        // 1) the first watermark is forwarded as is
        assertTrue(first instanceof Watermark);
        assertEquals(firstWatermarkTs, ((Watermark) first).getTimestamp());

        // 2) a Left record with the partial match and the second watermark's timestamp
        assertTrue(second instanceof StreamRecord);
        StreamRecord<Either<Tuple2<Map<String, Event>, Long>, Map<String, Event>>> record = (StreamRecord<Either<Tuple2<Map<String, Event>, Long>, Map<String, Event>>>) second;
        assertTrue(record.getValue() instanceof Either.Left);
        Tuple2<Map<String, Event>, Long> leftPayload = ((Either.Left<Tuple2<Map<String, Event>, Long>, Map<String, Event>>) record.getValue()).left();
        assertEquals(secondWatermarkTs, (long) leftPayload.f1);
        assertEquals(expectedPartialMatch, leftPayload.f0);

        // 3) the second watermark follows the Left record
        assertTrue(third instanceof Watermark);
        assertEquals(secondWatermarkTs, ((Watermark) third).getTimestamp());
    } finally {
        harness.close();
    }
}
Also used : HashMap(java.util.HashMap) ExecutionConfig(org.apache.flink.api.common.ExecutionConfig) KeyedOneInputStreamOperatorTestHarness(org.apache.flink.streaming.util.KeyedOneInputStreamOperatorTestHarness) Either(org.apache.flink.types.Either) StreamRecord(org.apache.flink.streaming.runtime.streamrecord.StreamRecord) Tuple2(org.apache.flink.api.java.tuple.Tuple2) Event(org.apache.flink.cep.Event) SubEvent(org.apache.flink.cep.SubEvent) HashMap(java.util.HashMap) Map(java.util.Map) Watermark(org.apache.flink.streaming.api.watermark.Watermark) Test(org.junit.Test)

Example 8 with Event

use of org.apache.flink.cep.Event in project flink by apache.

the class CEPOperatorTest method testCEPOperatorCleanupEventTime.

/**
 * Feeds events for two keys (42 and 43) into a keyed CEP operator in event time and checks, after
 * each batch of watermarks, how many keys are still registered for the watermark callback and
 * whether each key still has a non-empty priority queue and NFA. Also verifies the emitted
 * patterns and watermarks in output order.
 */
@Test
public void testCEPOperatorCleanupEventTime() throws Exception {
    // fixtures: every event below uses key 42 except startEventK2, which uses key 43
    Event startEvent1 = new Event(42, "start", 1.0);
    Event startEvent2 = new Event(42, "start", 2.0);
    SubEvent middleEvent1 = new SubEvent(42, "foo1", 1.0, 10.0);
    SubEvent middleEvent2 = new SubEvent(42, "foo2", 1.0, 10.0);
    SubEvent middleEvent3 = new SubEvent(42, "foo3", 1.0, 10.0);
    Event endEvent1 = new Event(42, "end", 1.0);
    Event endEvent2 = new Event(42, "end", 2.0);
    Event startEventK2 = new Event(43, "start", 1.0);
    TestKeySelector keySelector = new TestKeySelector();
    // the operator reference is kept so its internal state can be inspected below
    KeyedCEPPatternOperator<Event, Integer> operator = getKeyedCepOpearator(false, keySelector);
    OneInputStreamOperatorTestHarness<Event, Map<String, Event>> harness = getCepTestHarness(operator);
    harness.open();
    harness.processWatermark(new Watermark(Long.MIN_VALUE));
    // four elements for key 42 and one for key 43, with timestamps 1..3
    harness.processElement(new StreamRecord<>(startEvent1, 1L));
    harness.processElement(new StreamRecord<>(startEventK2, 1L));
    harness.processElement(new StreamRecord<>(new Event(42, "foobar", 1.0), 2L));
    harness.processElement(new StreamRecord<Event>(middleEvent1, 2L));
    harness.processElement(new StreamRecord<Event>(new SubEvent(42, "barfoo", 1.0, 5.0), 3L));
    // there must be 2 keys 42, 43 registered for the watermark callback
    // all the seen elements must be in the priority queues but no NFA yet.
    assertEquals(2L, harness.numKeysForWatermarkCallback());
    assertEquals(4L, operator.getPQSize(42));
    assertEquals(1L, operator.getPQSize(43));
    assertTrue(!operator.hasNonEmptyNFA(42));
    assertTrue(!operator.hasNonEmptyNFA(43));
    harness.processWatermark(new Watermark(2L));
    // drain the two watermarks sent so far from the head of the output queue
    verifyWatermark(harness.getOutput().poll(), Long.MIN_VALUE);
    verifyWatermark(harness.getOutput().poll(), 2L);
    // still the 2 keys
    // one element in PQ for 42 (the barfoo) as it arrived early
    // for 43 the element entered the NFA and the PQ is empty
    assertEquals(2L, harness.numKeysForWatermarkCallback());
    assertTrue(operator.hasNonEmptyNFA(42));
    assertEquals(1L, operator.getPQSize(42));
    assertTrue(operator.hasNonEmptyNFA(43));
    assertTrue(!operator.hasNonEmptyPQ(43));
    // second batch for key 42 (timestamps 4..6), then advance the watermark to 11 and 12
    harness.processElement(new StreamRecord<>(startEvent2, 4L));
    harness.processElement(new StreamRecord<Event>(middleEvent2, 5L));
    harness.processElement(new StreamRecord<>(endEvent1, 6L));
    harness.processWatermark(11L);
    harness.processWatermark(12L);
    // now we have 1 key because the 43 expired and was removed.
    // 42 is still there due to startEvent2
    // NOTE(review): the expiry presumably comes from a time window on the pattern, which is
    // defined outside this method - confirm against the NFA factory used by the operator.
    assertEquals(1L, harness.numKeysForWatermarkCallback());
    assertTrue(operator.hasNonEmptyNFA(42));
    assertTrue(!operator.hasNonEmptyPQ(42));
    assertTrue(!operator.hasNonEmptyNFA(43));
    assertTrue(!operator.hasNonEmptyPQ(43));
    // three matches ending in endEvent1 are expected, followed by the two watermarks
    verifyPattern(harness.getOutput().poll(), startEvent1, middleEvent1, endEvent1);
    verifyPattern(harness.getOutput().poll(), startEvent1, middleEvent2, endEvent1);
    verifyPattern(harness.getOutput().poll(), startEvent2, middleEvent2, endEvent1);
    verifyWatermark(harness.getOutput().poll(), 11L);
    verifyWatermark(harness.getOutput().poll(), 12L);
    // third batch for key 42 (timestamps 12 and 13), then advance the watermark to 20 and 21
    harness.processElement(new StreamRecord<Event>(middleEvent3, 12L));
    harness.processElement(new StreamRecord<>(endEvent2, 13L));
    harness.processWatermark(20L);
    harness.processWatermark(21L);
    // at this point key 42 must be gone as well: no NFA, no queued elements, no registered key
    assertTrue(!operator.hasNonEmptyNFA(42));
    assertTrue(!operator.hasNonEmptyPQ(42));
    assertEquals(0L, harness.numKeysForWatermarkCallback());
    // two matches ending in endEvent2 are expected, followed by the last two watermarks
    verifyPattern(harness.getOutput().poll(), startEvent2, middleEvent2, endEvent2);
    verifyPattern(harness.getOutput().poll(), startEvent2, middleEvent3, endEvent2);
    verifyWatermark(harness.getOutput().poll(), 20L);
    verifyWatermark(harness.getOutput().poll(), 21L);
    harness.close();
}
Also used : SubEvent(org.apache.flink.cep.SubEvent) Event(org.apache.flink.cep.Event) SubEvent(org.apache.flink.cep.SubEvent) HashMap(java.util.HashMap) Map(java.util.Map) Watermark(org.apache.flink.streaming.api.watermark.Watermark) Test(org.junit.Test)

Example 9 with Event

use of org.apache.flink.cep.Event in project flink by apache.

the class CEPOperatorTest method testKeyedCEPOperatorWatermarkForwarding.

/**
 * Verifies that a watermark handed to the keyed CEP operator is the first element of the
 * harness output and carries the same timestamp.
 */
@Test
public void testKeyedCEPOperatorWatermarkForwarding() throws Exception {
    OneInputStreamOperatorTestHarness<Event, Map<String, Event>> harness = getCepTestHarness(false);
    try {
        harness.open();
        Watermark expectedWatermark = new Watermark(42L);
        harness.processWatermark(expectedWatermark);
        // check against the watermark that was actually sent instead of repeating the literal
        verifyWatermark(harness.getOutput().poll(), expectedWatermark.getTimestamp());
    } finally {
        // close the harness even when the verification above fails
        harness.close();
    }
}
Also used : Event(org.apache.flink.cep.Event) SubEvent(org.apache.flink.cep.SubEvent) HashMap(java.util.HashMap) Map(java.util.Map) Watermark(org.apache.flink.streaming.api.watermark.Watermark) Test(org.junit.Test)

Example 10 with Event

use of org.apache.flink.cep.Event in project flink by apache.

the class CEPOperatorTest method testKeyedCEPOperatorCheckpointingWithRocksDB.

/**
 * Same snapshot/restore scenario as the plain checkpointing test, but every harness is backed by
 * a {@code RocksDBStateBackend} that stores its data under one shared temporary folder. After
 * the second restore, exactly one start/middle/end match followed by the closing watermark must
 * be emitted.
 */
@Test
public void testKeyedCEPOperatorCheckpointingWithRocksDB() throws Exception {
    final String storagePath = tempFolder.newFolder().getAbsolutePath();
    final RocksDBStateBackend firstBackend = rocksDbBackendAt(storagePath);

    // --- first life cycle: feed two elements, then snapshot while they are still pending
    final OneInputStreamOperatorTestHarness<Event, Map<String, Event>> firstHarness = getCepTestHarness(false);
    firstHarness.setStateBackend(firstBackend);
    firstHarness.open();
    final Event begin = new Event(42, "start", 1.0);
    final SubEvent middle = new SubEvent(42, "foo", 1.0, 10.0);
    final Event finish = new Event(42, "end", 1.0);
    firstHarness.processElement(new StreamRecord<>(begin, 1L));
    firstHarness.processElement(new StreamRecord<>(new Event(42, "foobar", 1.0), 2L));
    final OperatorStateHandles firstSnapshot = firstHarness.snapshot(0L, 0L);
    firstHarness.close();

    // --- second life cycle: fresh backend on the same path, restored from the first snapshot
    final OneInputStreamOperatorTestHarness<Event, Map<String, Event>> secondHarness = getCepTestHarness(false);
    secondHarness.setStateBackend(rocksDbBackendAt(storagePath));
    secondHarness.setup();
    secondHarness.initializeState(firstSnapshot);
    secondHarness.open();
    secondHarness.processWatermark(new Watermark(Long.MIN_VALUE));
    secondHarness.processElement(new StreamRecord<Event>(new SubEvent(42, "barfoo", 1.0, 5.0), 3L));
    // a wrongly checkpointed/restored element timestamp would surface here as a
    // pruning time underflow exception in the NFA
    secondHarness.processWatermark(new Watermark(2L));
    // second snapshot, taken directly after the watermark and before any further element
    final OperatorStateHandles secondSnapshot = secondHarness.snapshot(1L, 1L);
    secondHarness.close();

    // --- third life cycle: restore from the second snapshot, finish the pattern and flush
    final OneInputStreamOperatorTestHarness<Event, Map<String, Event>> thirdHarness = getCepTestHarness(false);
    thirdHarness.setStateBackend(rocksDbBackendAt(storagePath));
    thirdHarness.setup();
    thirdHarness.initializeState(secondSnapshot);
    thirdHarness.open();
    thirdHarness.processElement(new StreamRecord<Event>(middle, 3L));
    thirdHarness.processElement(new StreamRecord<>(new Event(42, "start", 1.0), 4L));
    thirdHarness.processElement(new StreamRecord<>(finish, 5L));
    thirdHarness.processWatermark(new Watermark(Long.MAX_VALUE));

    // the output must hold the single match and then the final watermark
    final Queue<Object> emitted = thirdHarness.getOutput();
    assertEquals(2, emitted.size());
    verifyPattern(emitted.poll(), begin, middle, finish);
    verifyWatermark(emitted.poll(), Long.MAX_VALUE);
    thirdHarness.close();
}

/**
 * Builds a new RocksDB state backend on top of a {@code MemoryStateBackend} and points its
 * storage at the given path.
 *
 * @param storagePath directory handed to {@code setDbStoragePath}
 * @return the configured backend
 */
private RocksDBStateBackend rocksDbBackendAt(String storagePath) throws Exception {
    RocksDBStateBackend backend = new RocksDBStateBackend(new MemoryStateBackend());
    backend.setDbStoragePath(storagePath);
    return backend;
}
Also used : RocksDBStateBackend(org.apache.flink.contrib.streaming.state.RocksDBStateBackend) SubEvent(org.apache.flink.cep.SubEvent) MemoryStateBackend(org.apache.flink.runtime.state.memory.MemoryStateBackend) OperatorStateHandles(org.apache.flink.streaming.runtime.tasks.OperatorStateHandles) Event(org.apache.flink.cep.Event) SubEvent(org.apache.flink.cep.SubEvent) HashMap(java.util.HashMap) Map(java.util.Map) Watermark(org.apache.flink.streaming.api.watermark.Watermark) Test(org.junit.Test)

Aggregations

Event (org.apache.flink.cep.Event)20 Test (org.junit.Test)20 Map (java.util.Map)17 SubEvent (org.apache.flink.cep.SubEvent)14 HashMap (java.util.HashMap)13 StreamRecord (org.apache.flink.streaming.runtime.streamrecord.StreamRecord)11 Watermark (org.apache.flink.streaming.api.watermark.Watermark)9 ArrayList (java.util.ArrayList)7 HashSet (java.util.HashSet)5 FilterFunction (org.apache.flink.api.common.functions.FilterFunction)4 OperatorStateHandles (org.apache.flink.streaming.runtime.tasks.OperatorStateHandles)4 KeySelector (org.apache.flink.api.java.functions.KeySelector)3 KeyedOneInputStreamOperatorTestHarness (org.apache.flink.streaming.util.KeyedOneInputStreamOperatorTestHarness)3 ByteArrayInputStream (java.io.ByteArrayInputStream)2 ObjectInputStream (java.io.ObjectInputStream)2 ObjectOutputStream (java.io.ObjectOutputStream)2 NullByteKeySelector (org.apache.flink.api.java.functions.NullByteKeySelector)2 Tuple2 (org.apache.flink.api.java.tuple.Tuple2)2 LinkedHashMultimap (com.google.common.collect.LinkedHashMultimap)1 ByteArrayOutputStream (java.io.ByteArrayOutputStream)1