Search in sources :

Example 1 with START_INCLUSIVE

use of com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.START_INCLUSIVE in project bullet-core by yahoo.

In the class QuantileSketchingStrategyTest, the method testNegativeSize:

/**
 * Checks a PMF distribution built from a configuration whose first argument (MAX_POINTS, per the original
 * author's note) is -1. The expected outcome is a single split point at 0.0, i.e. exactly two ranges.
 */
@Test
public void testNegativeSize() {
    // Original author's note: MAX_POINTS is configured to -1, so the strategy ends up using the minimum of
    // BulletConfig.DEFAULT_DISTRIBUTION_AGGREGATION_MAX_POINTS and the aggregation size, which is 1.
    QuantileSketchingStrategy strategy = makeDistribution(makeConfiguration(-1, 128), 1, "field", DistributionType.PMF, 10);

    // Feed the values 0.0, 1.0, ..., 99.0 under the "field" key.
    for (int i = 0; i < 100; i++) {
        double value = i;
        strategy.consume(RecordBox.get().add("field", value).getRecord());
    }

    Clip clip = strategy.getResult();

    Map<String, Object> meta = (Map<String, Object>) clip.getMeta().asMap().get("meta");
    Assert.assertEquals(meta.size(), 7);
    Assert.assertFalse((Boolean) meta.get("isEst"));

    List<BulletRecord> actual = clip.getRecords();
    Assert.assertEquals(actual.size(), 2);

    // Nothing lies below 0.0; all 100 values land in the range starting at 0.0.
    String belowZero = NEGATIVE_INFINITY_START + SEPARATOR + 0.0 + END_EXCLUSIVE;
    String zeroAndUp = START_INCLUSIVE + 0.0 + SEPARATOR + POSITIVE_INFINITY_END;
    BulletRecord expectedBelow = RecordBox.get()
                                          .add(RANGE_FIELD, belowZero)
                                          .add(COUNT_FIELD, 0.0)
                                          .add(PROBABILITY_FIELD, 0.0)
                                          .getRecord();
    BulletRecord expectedAbove = RecordBox.get()
                                          .add(RANGE_FIELD, zeroAndUp)
                                          .add(COUNT_FIELD, 100.0)
                                          .add(PROBABILITY_FIELD, 1.0)
                                          .getRecord();
    Assert.assertEquals(actual.get(0), expectedBelow);
    Assert.assertEquals(actual.get(1), expectedAbove);

    // The piecewise accessors must agree with the combined result.
    Assert.assertEquals(strategy.getRecords(), clip.getRecords());
    Assert.assertEquals(strategy.getMetadata().asMap(), clip.getMeta().asMap());
}
Also used : LinearDistribution(com.yahoo.bullet.query.aggregations.LinearDistribution) IntStream(java.util.stream.IntStream) Arrays(java.util.Arrays) ManualDistribution(com.yahoo.bullet.query.aggregations.ManualDistribution) RegionDistribution(com.yahoo.bullet.query.aggregations.RegionDistribution) START_INCLUSIVE(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.START_INCLUSIVE) END_EXCLUSIVE(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.END_EXCLUSIVE) PROBABILITY_FIELD(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.PROBABILITY_FIELD) Concept(com.yahoo.bullet.result.Meta.Concept) Test(org.testng.annotations.Test) RecordBox(com.yahoo.bullet.result.RecordBox) NEGATIVE_INFINITY_START(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.NEGATIVE_INFINITY_START) Clip(com.yahoo.bullet.result.Clip) Family(com.yahoo.sketches.Family) HashSet(java.util.HashSet) Pair(org.apache.commons.lang3.tuple.Pair) Assert(org.testng.Assert) VALUE_FIELD(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.VALUE_FIELD) Arrays.asList(java.util.Arrays.asList) Map(java.util.Map) Distribution(com.yahoo.bullet.query.aggregations.Distribution) POSITIVE_INFINITY_END(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.POSITIVE_INFINITY_END) BulletRecord(com.yahoo.bullet.record.BulletRecord) DoublesSketch(com.yahoo.sketches.quantiles.DoublesSketch) QUANTILE_FIELD(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.QUANTILE_FIELD) Set(java.util.Set) Collectors(java.util.stream.Collectors) List(java.util.List) TestHelpers.assertApproxEquals(com.yahoo.bullet.TestHelpers.assertApproxEquals) RANGE_FIELD(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.RANGE_FIELD) TestHelpers.addMetadata(com.yahoo.bullet.TestHelpers.addMetadata) BulletConfig(com.yahoo.bullet.common.BulletConfig) DistributionType(com.yahoo.bullet.query.aggregations.DistributionType) 
COUNT_FIELD(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.COUNT_FIELD) SEPARATOR(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.SEPARATOR) Collections(java.util.Collections) Clip(com.yahoo.bullet.result.Clip) BulletRecord(com.yahoo.bullet.record.BulletRecord) Map(java.util.Map) Test(org.testng.annotations.Test)

Example 2 with START_INCLUSIVE

use of com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.START_INCLUSIVE in project bullet-core by yahoo.

In the class QuantileSketchingStrategyTest, the method testPMF:

/**
 * Checks a PMF distribution with the points 5.0 and 2.5 over the inputs i * 0.1 for i in [0, 100).
 * Expects three ranges split at 2.5 and 5.0, holding 25, 25 and 50 values respectively.
 */
@Test
public void testPMF() {
    QuantileSketchingStrategy strategy = makeDistribution(DistributionType.PMF, asList(5.0, 2.5));

    // Feed the values 0.0, 0.1, ..., 9.9 under the "field" key.
    for (int i = 0; i < 100; i++) {
        double value = (i * 0.1);
        strategy.consume(RecordBox.get().add("field", value).getRecord());
    }

    Clip clip = strategy.getResult();

    Map<String, Object> meta = (Map<String, Object>) clip.getMeta().asMap().get("meta");
    Assert.assertEquals(meta.size(), 7);
    Assert.assertFalse((Boolean) meta.get("isEst"));

    List<BulletRecord> actual = clip.getRecords();
    Assert.assertEquals(actual.size(), 3);

    // The points were supplied as (5.0, 2.5) but the expected ranges are in ascending order.
    String lowRange = NEGATIVE_INFINITY_START + SEPARATOR + 2.5 + END_EXCLUSIVE;
    String midRange = START_INCLUSIVE + 2.5 + SEPARATOR + 5.0 + END_EXCLUSIVE;
    String highRange = START_INCLUSIVE + 5.0 + SEPARATOR + POSITIVE_INFINITY_END;
    BulletRecord expectedLow = RecordBox.get()
                                        .add(RANGE_FIELD, lowRange)
                                        .add(COUNT_FIELD, 25.0)
                                        .add(PROBABILITY_FIELD, 0.25)
                                        .getRecord();
    BulletRecord expectedMid = RecordBox.get()
                                        .add(RANGE_FIELD, midRange)
                                        .add(COUNT_FIELD, 25.0)
                                        .add(PROBABILITY_FIELD, 0.25)
                                        .getRecord();
    BulletRecord expectedHigh = RecordBox.get()
                                         .add(RANGE_FIELD, highRange)
                                         .add(COUNT_FIELD, 50.0)
                                         .add(PROBABILITY_FIELD, 0.5)
                                         .getRecord();
    Assert.assertEquals(actual.get(0), expectedLow);
    Assert.assertEquals(actual.get(1), expectedMid);
    Assert.assertEquals(actual.get(2), expectedHigh);

    // The piecewise accessors must agree with the combined result.
    Assert.assertEquals(strategy.getRecords(), clip.getRecords());
    Assert.assertEquals(strategy.getMetadata().asMap(), clip.getMeta().asMap());
}
Also used : LinearDistribution(com.yahoo.bullet.query.aggregations.LinearDistribution) IntStream(java.util.stream.IntStream) Arrays(java.util.Arrays) ManualDistribution(com.yahoo.bullet.query.aggregations.ManualDistribution) RegionDistribution(com.yahoo.bullet.query.aggregations.RegionDistribution) START_INCLUSIVE(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.START_INCLUSIVE) END_EXCLUSIVE(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.END_EXCLUSIVE) PROBABILITY_FIELD(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.PROBABILITY_FIELD) Concept(com.yahoo.bullet.result.Meta.Concept) Test(org.testng.annotations.Test) RecordBox(com.yahoo.bullet.result.RecordBox) NEGATIVE_INFINITY_START(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.NEGATIVE_INFINITY_START) Clip(com.yahoo.bullet.result.Clip) Family(com.yahoo.sketches.Family) HashSet(java.util.HashSet) Pair(org.apache.commons.lang3.tuple.Pair) Assert(org.testng.Assert) VALUE_FIELD(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.VALUE_FIELD) Arrays.asList(java.util.Arrays.asList) Map(java.util.Map) Distribution(com.yahoo.bullet.query.aggregations.Distribution) POSITIVE_INFINITY_END(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.POSITIVE_INFINITY_END) BulletRecord(com.yahoo.bullet.record.BulletRecord) DoublesSketch(com.yahoo.sketches.quantiles.DoublesSketch) QUANTILE_FIELD(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.QUANTILE_FIELD) Set(java.util.Set) Collectors(java.util.stream.Collectors) List(java.util.List) TestHelpers.assertApproxEquals(com.yahoo.bullet.TestHelpers.assertApproxEquals) RANGE_FIELD(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.RANGE_FIELD) TestHelpers.addMetadata(com.yahoo.bullet.TestHelpers.addMetadata) BulletConfig(com.yahoo.bullet.common.BulletConfig) DistributionType(com.yahoo.bullet.query.aggregations.DistributionType) 
COUNT_FIELD(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.COUNT_FIELD) SEPARATOR(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.SEPARATOR) Collections(java.util.Collections) Clip(com.yahoo.bullet.result.Clip) BulletRecord(com.yahoo.bullet.record.BulletRecord) Map(java.util.Map) Test(org.testng.annotations.Test)

Example 3 with START_INCLUSIVE

use of com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.START_INCLUSIVE in project bullet-core by yahoo.

In the class QuantileSketchingStrategyTest, the method testCasting:

/**
 * Checks a PMF distribution with a single point at 50.0 when the field arrives as a mix of numeric strings,
 * non-numeric strings and doubles. The expected counts (25 and 50) show that the 25 numeric strings are
 * counted and the two garbage strings are not.
 */
@Test
public void testCasting() {
    QuantileSketchingStrategy strategy = makeDistribution(DistributionType.PMF, Collections.singletonList(50.0));

    // The integers 0..24 supplied as Strings.
    for (int i = 0; i < 25; i++) {
        String text = String.valueOf(i);
        strategy.consume(RecordBox.get().add("field", text).getRecord());
    }

    // Two values that are not clean numbers.
    strategy.consume(RecordBox.get().add("field", "garbage").getRecord());
    strategy.consume(RecordBox.get().add("field", "1.0 garbage").getRecord());

    // The values 50.0..99.0 supplied as doubles.
    for (int i = 50; i < 100; i++) {
        double value = i;
        strategy.consume(RecordBox.get().add("field", value).getRecord());
    }

    Clip clip = strategy.getResult();

    Map<String, Object> meta = (Map<String, Object>) clip.getMeta().asMap().get("meta");
    Assert.assertEquals(meta.size(), 7);
    Assert.assertFalse((Boolean) meta.get("isEst"));

    List<BulletRecord> actual = clip.getRecords();
    Assert.assertEquals(actual.size(), 2);

    // 75 values are expected in total: 25 below 50.0 and 50 at or above it.
    String belowFifty = NEGATIVE_INFINITY_START + SEPARATOR + 50.0 + END_EXCLUSIVE;
    String fiftyAndUp = START_INCLUSIVE + 50.0 + SEPARATOR + POSITIVE_INFINITY_END;
    BulletRecord expectedBelow = RecordBox.get()
                                          .add(RANGE_FIELD, belowFifty)
                                          .add(COUNT_FIELD, 25.0)
                                          .add(PROBABILITY_FIELD, 1.0 / 3)
                                          .getRecord();
    BulletRecord expectedAbove = RecordBox.get()
                                          .add(RANGE_FIELD, fiftyAndUp)
                                          .add(COUNT_FIELD, 50.0)
                                          .add(PROBABILITY_FIELD, 2.0 / 3)
                                          .getRecord();
    Assert.assertEquals(actual.get(0), expectedBelow);
    Assert.assertEquals(actual.get(1), expectedAbove);

    // The piecewise accessors must agree with the combined result.
    Assert.assertEquals(strategy.getRecords(), clip.getRecords());
    Assert.assertEquals(strategy.getMetadata().asMap(), clip.getMeta().asMap());
}
Also used : LinearDistribution(com.yahoo.bullet.query.aggregations.LinearDistribution) IntStream(java.util.stream.IntStream) Arrays(java.util.Arrays) ManualDistribution(com.yahoo.bullet.query.aggregations.ManualDistribution) RegionDistribution(com.yahoo.bullet.query.aggregations.RegionDistribution) START_INCLUSIVE(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.START_INCLUSIVE) END_EXCLUSIVE(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.END_EXCLUSIVE) PROBABILITY_FIELD(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.PROBABILITY_FIELD) Concept(com.yahoo.bullet.result.Meta.Concept) Test(org.testng.annotations.Test) RecordBox(com.yahoo.bullet.result.RecordBox) NEGATIVE_INFINITY_START(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.NEGATIVE_INFINITY_START) Clip(com.yahoo.bullet.result.Clip) Family(com.yahoo.sketches.Family) HashSet(java.util.HashSet) Pair(org.apache.commons.lang3.tuple.Pair) Assert(org.testng.Assert) VALUE_FIELD(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.VALUE_FIELD) Arrays.asList(java.util.Arrays.asList) Map(java.util.Map) Distribution(com.yahoo.bullet.query.aggregations.Distribution) POSITIVE_INFINITY_END(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.POSITIVE_INFINITY_END) BulletRecord(com.yahoo.bullet.record.BulletRecord) DoublesSketch(com.yahoo.sketches.quantiles.DoublesSketch) QUANTILE_FIELD(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.QUANTILE_FIELD) Set(java.util.Set) Collectors(java.util.stream.Collectors) List(java.util.List) TestHelpers.assertApproxEquals(com.yahoo.bullet.TestHelpers.assertApproxEquals) RANGE_FIELD(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.RANGE_FIELD) TestHelpers.addMetadata(com.yahoo.bullet.TestHelpers.addMetadata) BulletConfig(com.yahoo.bullet.common.BulletConfig) DistributionType(com.yahoo.bullet.query.aggregations.DistributionType) 
COUNT_FIELD(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.COUNT_FIELD) SEPARATOR(com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.SEPARATOR) Collections(java.util.Collections) Clip(com.yahoo.bullet.result.Clip) BulletRecord(com.yahoo.bullet.record.BulletRecord) Map(java.util.Map) Test(org.testng.annotations.Test)

Aggregations

TestHelpers.addMetadata (com.yahoo.bullet.TestHelpers.addMetadata)3 TestHelpers.assertApproxEquals (com.yahoo.bullet.TestHelpers.assertApproxEquals)3 BulletConfig (com.yahoo.bullet.common.BulletConfig)3 Distribution (com.yahoo.bullet.query.aggregations.Distribution)3 DistributionType (com.yahoo.bullet.query.aggregations.DistributionType)3 LinearDistribution (com.yahoo.bullet.query.aggregations.LinearDistribution)3 ManualDistribution (com.yahoo.bullet.query.aggregations.ManualDistribution)3 RegionDistribution (com.yahoo.bullet.query.aggregations.RegionDistribution)3 COUNT_FIELD (com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.COUNT_FIELD)3 END_EXCLUSIVE (com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.END_EXCLUSIVE)3 NEGATIVE_INFINITY_START (com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.NEGATIVE_INFINITY_START)3 POSITIVE_INFINITY_END (com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.POSITIVE_INFINITY_END)3 PROBABILITY_FIELD (com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.PROBABILITY_FIELD)3 QUANTILE_FIELD (com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.QUANTILE_FIELD)3 RANGE_FIELD (com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.RANGE_FIELD)3 SEPARATOR (com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.SEPARATOR)3 START_INCLUSIVE (com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.START_INCLUSIVE)3 VALUE_FIELD (com.yahoo.bullet.querying.aggregations.sketches.QuantileSketch.VALUE_FIELD)3 BulletRecord (com.yahoo.bullet.record.BulletRecord)3 Clip (com.yahoo.bullet.result.Clip)3