Search in sources :

Example 6 with Limit

use of org.apache.drill.exec.physical.config.Limit in project drill by apache.

the class TestLimitBatchEmitOutcome method testMultipleLimitWithEMITOutcome.

/**
 * Verifies that limit resets its state after the first EMIT outcome and
 * applies the limit from scratch to the batches that follow.
 * <p>
 * The first set of input (OK_NEW_SCHEMA followed by EMIT) is expected to
 * yield only 1 record even though the limit is 2, so the output carries just
 * that record.
 * <p>
 * After that EMIT, the third input batch (2 records, EMIT outcome) is
 * expected to produce an output batch with 2 records rather than 1, because
 * the record count starts over.
 */
@Test
public void testMultipleLimitWithEMITOutcome() throws Throwable {
    final RowSet.SingleRowSet nonEmptyInputRowSet2 = operatorFixture.rowSetBuilder(inputSchema)
        .addRow(2, 20, "item2")
        .addRow(3, 30, "item3")
        .build();

    // NOTE(review): four containers are queued but only three outcomes are
    // registered; presumably the fourth container is never pulled because the
    // limit reports NONE first -- confirm against MockRecordBatch.
    inputContainer.add(nonEmptyInputRowSet.container());
    inputContainer.add(emptyInputRowSet.container());
    inputContainer.add(nonEmptyInputRowSet2.container());
    inputContainer.add(emptyInputRowSet.container());

    inputOutcomes.add(RecordBatch.IterOutcome.OK_NEW_SCHEMA);
    inputOutcomes.add(RecordBatch.IterOutcome.EMIT);
    inputOutcomes.add(RecordBatch.IterOutcome.EMIT);

    final MockRecordBatch mockInputBatch = new MockRecordBatch(
        operatorFixture.getFragmentContext(), opContext, inputContainer, inputOutcomes,
        emptyInputRowSet.container().getSchema());
    // Only set for this Test class
    mockInputBatch.useUnnestKillHandlingForLimit(true);

    final Limit limitConf = new Limit(null, 0, 2);
    @SuppressWarnings("resource")
    final LimitRecordBatch limitBatch = new LimitRecordBatch(
        limitConf, operatorFixture.getFragmentContext(), mockInputBatch);

    // First limit evaluation. assertEquals (rather than assertTrue(a == b)) is
    // used so a failure reports both the expected and the actual outcome.
    assertEquals(RecordBatch.IterOutcome.OK_NEW_SCHEMA, limitBatch.next());
    assertEquals(1, limitBatch.getRecordCount());
    assertEquals(RecordBatch.IterOutcome.EMIT, limitBatch.next());
    assertEquals(0, limitBatch.getRecordCount());

    // After seeing EMIT, limit refreshes its state and evaluates the limit again on the next set of input batches
    assertEquals(RecordBatch.IterOutcome.EMIT, limitBatch.next());
    assertEquals(2, limitBatch.getRecordCount());

    // Since limit is hit it will return NONE
    assertEquals(RecordBatch.IterOutcome.NONE, limitBatch.next());
}
Also used : RowSet(org.apache.drill.exec.physical.rowSet.RowSet) MockRecordBatch(org.apache.drill.exec.physical.impl.MockRecordBatch) Limit(org.apache.drill.exec.physical.config.Limit) OperatorTest(org.apache.drill.categories.OperatorTest) Test(org.junit.Test)

Example 7 with Limit

use of org.apache.drill.exec.physical.config.Limit in project drill by apache.

the class TestLimitBatchEmitOutcome method testLimitNonEmptyFirst_NonEmptyOK_EmptyBatchEmitOutcome.

/**
 * Verifies that limit keeps operating across multiple input batches until it
 * either collects the limit number of records or sees an EMIT outcome that
 * refreshes its state.
 * <p>
 * Input is four batches with outcomes OK_NEW_SCHEMA, OK, OK and EMIT; the
 * limit is 2. The test expects three outputs: OK_NEW_SCHEMA with 1 record,
 * OK with 1 record, and EMIT with 0 records.
 */
@Test
public void testLimitNonEmptyFirst_NonEmptyOK_EmptyBatchEmitOutcome() throws Throwable {
    final RowSet.SingleRowSet nonEmptyInputRowSet2 = operatorFixture.rowSetBuilder(inputSchema)
        .addRow(2, 20, "item2")
        .build();

    inputContainer.add(nonEmptyInputRowSet.container());
    inputContainer.add(emptyInputRowSet.container());
    inputContainer.add(nonEmptyInputRowSet2.container());
    inputContainer.add(emptyInputRowSet.container());

    inputOutcomes.add(RecordBatch.IterOutcome.OK_NEW_SCHEMA);
    inputOutcomes.add(RecordBatch.IterOutcome.OK);
    inputOutcomes.add(RecordBatch.IterOutcome.OK);
    inputOutcomes.add(RecordBatch.IterOutcome.EMIT);

    final MockRecordBatch mockInputBatch = new MockRecordBatch(
        operatorFixture.getFragmentContext(), opContext, inputContainer, inputOutcomes,
        emptyInputRowSet.container().getSchema());
    // Only set for this Test class
    mockInputBatch.useUnnestKillHandlingForLimit(true);

    final Limit limitConf = new Limit(null, 0, 2);
    @SuppressWarnings("resource")
    final LimitRecordBatch limitBatch = new LimitRecordBatch(
        limitConf, operatorFixture.getFragmentContext(), mockInputBatch);

    // assertEquals (rather than assertTrue(a == b)) makes a failure report
    // both the expected and the actual outcome.
    assertEquals(RecordBatch.IterOutcome.OK_NEW_SCHEMA, limitBatch.next());
    assertEquals(1, limitBatch.getRecordCount());
    assertEquals(RecordBatch.IterOutcome.OK, limitBatch.next());
    assertEquals(1, limitBatch.getRecordCount());
    assertEquals(RecordBatch.IterOutcome.EMIT, limitBatch.next());
    assertEquals(0, limitBatch.getRecordCount());

    // Explicitly clear the row set built locally by this test.
    nonEmptyInputRowSet2.clear();
}
Also used : RowSet(org.apache.drill.exec.physical.rowSet.RowSet) MockRecordBatch(org.apache.drill.exec.physical.impl.MockRecordBatch) Limit(org.apache.drill.exec.physical.config.Limit) OperatorTest(org.apache.drill.categories.OperatorTest) Test(org.junit.Test)

Example 8 with Limit

use of org.apache.drill.exec.physical.config.Limit in project drill by apache.

the class TestLimitBatchEmitOutcome method testLimitNonEmptyBatchEmitOutcome.

/**
 * Validates that limit considers all the data until it sees an EMIT outcome
 * and returns an output batch with the data that meets the limit criteria.
 * <p>
 * Input is an empty batch with OK_NEW_SCHEMA followed by a non-empty batch
 * with EMIT; the limit is 1. The running total kept in
 * {@code outputRecordCount} (declared outside this method) is expected to be
 * 0 after the first output and 1 after the second.
 */
@Test
public void testLimitNonEmptyBatchEmitOutcome() throws Throwable {
    inputContainer.add(emptyInputRowSet.container());
    inputContainer.add(nonEmptyInputRowSet.container());

    inputOutcomes.add(RecordBatch.IterOutcome.OK_NEW_SCHEMA);
    inputOutcomes.add(RecordBatch.IterOutcome.EMIT);

    final MockRecordBatch mockInputBatch = new MockRecordBatch(
        operatorFixture.getFragmentContext(), opContext, inputContainer, inputOutcomes,
        emptyInputRowSet.container().getSchema());
    // Only set for this Test class
    mockInputBatch.useUnnestKillHandlingForLimit(true);

    final Limit limitConf = new Limit(null, 0, 1);
    @SuppressWarnings("resource")
    final LimitRecordBatch limitBatch = new LimitRecordBatch(
        limitConf, operatorFixture.getFragmentContext(), mockInputBatch);

    // assertEquals (rather than assertTrue(a == b)) makes a failure report
    // both the expected and the actual outcome.
    assertEquals(RecordBatch.IterOutcome.OK_NEW_SCHEMA, limitBatch.next());
    outputRecordCount += limitBatch.getRecordCount();
    assertEquals(0, outputRecordCount);

    assertEquals(RecordBatch.IterOutcome.EMIT, limitBatch.next());
    outputRecordCount += limitBatch.getRecordCount();
    assertEquals(1, outputRecordCount);
}
Also used : MockRecordBatch(org.apache.drill.exec.physical.impl.MockRecordBatch) Limit(org.apache.drill.exec.physical.config.Limit) OperatorTest(org.apache.drill.categories.OperatorTest) Test(org.junit.Test)

Example 9 with Limit

use of org.apache.drill.exec.physical.config.Limit in project drill by apache.

the class TestLimitBatchEmitOutcome method testLimitResetsAfterFirstEmitOutcome.

/**
 * Verifies that once the limit number of records has been produced from the
 * first set of batches, a batch with EMIT outcome refreshes the limit state
 * so the limit is applied again to the next set of batches with data.
 * <p>
 * Input outcomes are OK_NEW_SCHEMA, EMIT and OK; the limit is 1. The test
 * expects 1 record, then 0 records with EMIT, then 1 record with OK, and
 * finally NONE.
 */
@Test
public void testLimitResetsAfterFirstEmitOutcome() throws Throwable {
    final RowSet.SingleRowSet nonEmptyInputRowSet2 = operatorFixture.rowSetBuilder(inputSchema)
        .addRow(2, 20, "item2")
        .addRow(3, 30, "item3")
        .build();

    inputContainer.add(nonEmptyInputRowSet.container());
    inputContainer.add(emptyInputRowSet.container());
    inputContainer.add(nonEmptyInputRowSet2.container());

    inputOutcomes.add(RecordBatch.IterOutcome.OK_NEW_SCHEMA);
    inputOutcomes.add(RecordBatch.IterOutcome.EMIT);
    inputOutcomes.add(RecordBatch.IterOutcome.OK);

    final MockRecordBatch mockInputBatch = new MockRecordBatch(
        operatorFixture.getFragmentContext(), opContext, inputContainer, inputOutcomes,
        emptyInputRowSet.container().getSchema());
    // Only set for this Test class
    mockInputBatch.useUnnestKillHandlingForLimit(true);

    final Limit limitConf = new Limit(null, 0, 1);
    @SuppressWarnings("resource")
    final LimitRecordBatch limitBatch = new LimitRecordBatch(
        limitConf, operatorFixture.getFragmentContext(), mockInputBatch);

    // assertEquals (rather than assertTrue(a == b)) makes a failure report
    // both the expected and the actual outcome.
    assertEquals(RecordBatch.IterOutcome.OK_NEW_SCHEMA, limitBatch.next());
    assertEquals(1, limitBatch.getRecordCount());

    assertEquals(RecordBatch.IterOutcome.EMIT, limitBatch.next());
    // State refresh happens and limit again works on new data batches
    assertEquals(0, limitBatch.getRecordCount());

    assertEquals(RecordBatch.IterOutcome.OK, limitBatch.next());
    assertEquals(1, limitBatch.getRecordCount());

    assertEquals(RecordBatch.IterOutcome.NONE, limitBatch.next());
}
Also used : RowSet(org.apache.drill.exec.physical.rowSet.RowSet) MockRecordBatch(org.apache.drill.exec.physical.impl.MockRecordBatch) Limit(org.apache.drill.exec.physical.config.Limit) OperatorTest(org.apache.drill.categories.OperatorTest) Test(org.junit.Test)

Example 10 with Limit

use of org.apache.drill.exec.physical.config.Limit in project drill by apache.

the class TestNullInputMiniPlan method testLimitEmpty.

/**
 * Builds a {@link Limit} operator config with the arguments (null, 10, 5) and
 * hands it to {@code testSingleInputNullBatchHandling}.
 * <p>
 * NOTE(review): the constructor arguments are presumably (child, first, last)
 * -- confirm against the Limit class before relying on that reading.
 */
@Test
public void testLimitEmpty() throws Exception {
    // Declared as PhysicalOperator so the same helper overload is selected.
    final PhysicalOperator limitOperator = new Limit(null, 10, 5);

    testSingleInputNullBatchHandling(limitOperator);
}
Also used : PhysicalOperator(org.apache.drill.exec.physical.base.PhysicalOperator) Limit(org.apache.drill.exec.physical.config.Limit) Test(org.junit.Test)

Aggregations

Limit (org.apache.drill.exec.physical.config.Limit): 17, Test (org.junit.Test): 15, OperatorTest (org.apache.drill.categories.OperatorTest): 6, MockRecordBatch (org.apache.drill.exec.physical.impl.MockRecordBatch): 6, PhysicalOperator (org.apache.drill.exec.physical.base.PhysicalOperator): 4, RowSet (org.apache.drill.exec.physical.rowSet.RowSet): 3, PartitionLimit (org.apache.drill.exec.physical.config.PartitionLimit): 1