use of io.prestosql.spi.dynamicfilter.HashSetDynamicFilter in project hetu-core by openlookeng.
the class TestDynamicFiltersCollector method TestCollectingGlobalDynamicFilters.
@Test
public void TestCollectingGlobalDynamicFilters() throws InterruptedException {
final QueryId queryId = new QueryId("test_query");
final String filterId = "1";
final String columnName = "column";
final TestingColumnHandle columnHandle = new TestingColumnHandle(columnName);
final Set<String> valueSet = ImmutableSet.of("1", "2", "3");
TaskContext taskContext = mock(TaskContext.class);
Session session = testSessionBuilder().setQueryId(queryId).setSystemProperty(ENABLE_DYNAMIC_FILTERING, "true").setSystemProperty(DYNAMIC_FILTERING_DATA_TYPE, "HASHSET").build();
when(taskContext.getSession()).thenReturn(session);
// set up state store and merged dynamic filters map
Map mockMap = new HashMap<>();
StateStoreProvider stateStoreProvider = mock(StateStoreProvider.class);
StateStore stateStore = mock(StateStore.class);
StateMap stateMap = new MockStateMap<>("test-map", mockMap);
when(stateStoreProvider.getStateStore()).thenReturn(stateStore);
when(stateStore.getStateCollection(any())).thenReturn(stateMap);
when(stateStore.createStateMap(any())).thenReturn(stateMap);
when(stateStore.getOrCreateStateCollection(any(), any())).thenReturn(stateMap);
// set up state store listener and dynamic filter cache
StateStoreListenerManager stateStoreListenerManager = new StateStoreListenerManager(stateStoreProvider);
DynamicFilterCacheManager dynamicFilterCacheManager = new DynamicFilterCacheManager();
stateStoreListenerManager.addStateStoreListener(new DynamicFilterListener(dynamicFilterCacheManager), MERGED_DYNAMIC_FILTERS);
LocalDynamicFiltersCollector collector = new LocalDynamicFiltersCollector(taskContext, Optional.empty(), dynamicFilterCacheManager);
TableScanNode tableScan = mock(TableScanNode.class);
when(tableScan.getAssignments()).thenReturn(ImmutableMap.of(new Symbol(columnName), columnHandle));
List<DynamicFilters.Descriptor> dynamicFilterDescriptors = ImmutableList.of(new DynamicFilters.Descriptor(filterId, new VariableReferenceExpression(columnName, BIGINT)));
collector.initContext(ImmutableList.of(dynamicFilterDescriptors), SymbolUtils.toLayOut(tableScan.getOutputSymbols()));
assertTrue(collector.getDynamicFilters(tableScan).isEmpty(), "there should be no dynamic filter available");
// put some values in state store as a new dynamic filter
// and wait for the listener to process the event
stateMap.put(createKey(DynamicFilterUtils.FILTERPREFIX, filterId, queryId.getId()), valueSet);
TimeUnit.MILLISECONDS.sleep(100);
// get available dynamic filter and verify it
List<Map<ColumnHandle, DynamicFilter>> dynamicFilters = collector.getDynamicFilters(tableScan);
assertEquals(dynamicFilters.size(), 1, "there should be a new dynamic filter");
assertEquals(dynamicFilters.size(), 1);
DynamicFilter dynamicFilter = dynamicFilters.get(0).get(columnHandle);
assertTrue(dynamicFilter instanceof HashSetDynamicFilter, "new dynamic filter should be hashset");
assertEquals(dynamicFilter.getSize(), valueSet.size(), "new dynamic filter should have correct size");
for (String value : valueSet) {
assertTrue(dynamicFilter.contains(value), "new dynamic filter should contain correct values");
}
// clean up when task finishes
collector.removeDynamicFilter(true);
DynamicFilter cachedFilter = dynamicFilterCacheManager.getDynamicFilter(DynamicFilterCacheManager.createCacheKey(filterId, queryId.getId()));
assertNull(cachedFilter, "cached dynamic filter should have been removed");
}
use of io.prestosql.spi.dynamicfilter.HashSetDynamicFilter in project hetu-core by openlookeng.
the class TestDynamicFilterServiceWithHashSet method testRegisterAndMergeDynamicFiltersHashSet.
@Test
public void testRegisterAndMergeDynamicFiltersHashSet() throws InterruptedException {
setUpHashSet();
filterId = "df2";
registerDf(filterId, session, PARTITIONED, dynamicFilterService);
// Test getDynamicFilterSupplier
VariableReferenceExpression mockExpression = mock(VariableReferenceExpression.class);
when(mockExpression.getName()).thenReturn("name");
ColumnHandle mockColumnHandle = mock(ColumnHandle.class);
Supplier<List<Set<DynamicFilter>>> dynamicFilterSupplier = DynamicFilterService.getDynamicFilterSupplier(session.getQueryId(), ImmutableList.of(ImmutableList.of(new DynamicFilters.Descriptor(filterId, mockExpression))), ImmutableMap.of(new Symbol("name"), mockColumnHandle));
assertTrue(dynamicFilterSupplier.get().isEmpty(), "should return empty dynamic filter set when dynamic filters are not available");
mockLocalDynamicFilterHashSet("task1.0", filterId, session.getQueryId().toString(), Arrays.asList("11", "12", "13", "14"));
mockLocalDynamicFilterHashSet("task1.1", filterId, session.getQueryId().toString(), Arrays.asList("15", "16", "17", "18"));
Thread.sleep(2000);
Set hs = fetchDynamicFilterHashSet(filterId, session.getQueryId().toString());
for (int i = 11; i < 19; i++) {
Assert.assertEquals(true, hs.contains(i + ""));
}
Assert.assertEquals(false, hs.contains("10"));
// Test getDynamicFilterSupplier
dynamicFilterSupplier = DynamicFilterService.getDynamicFilterSupplier(session.getQueryId(), ImmutableList.of(ImmutableList.of(new DynamicFilters.Descriptor(filterId, mockExpression))), ImmutableMap.of(new Symbol("name"), mockColumnHandle));
List<Set<DynamicFilter>> dynamicFilters = dynamicFilterSupplier.get();
assertFalse(dynamicFilters == null, "dynamic filters should be ready");
assertEquals(dynamicFilters.size(), 1, "there should be 1 dynamic filter in supplier");
HashSetDynamicFilter hsDF = ((HashSetDynamicFilter) dynamicFilters.get(0).toArray()[0]);
assertEquals(hs, hsDF.getSetValues(), "dynamic filter in supplier should be the same as the one merged");
dynamicFilterSupplier = DynamicFilterService.getDynamicFilterSupplier(new QueryId("invalid"), ImmutableList.of(ImmutableList.of(new DynamicFilters.Descriptor(filterId, mockExpression))), ImmutableMap.of(new Symbol("name"), mockColumnHandle));
assertTrue(dynamicFilterSupplier.get().isEmpty(), "should return empty dynamic filter set for invalid or non-existing queryId");
String queryId = session.getQueryId().getId();
assertEquals(stateStoreProvider.getStateStore().getStateCollection(createKey(DynamicFilterUtils.PARTIALPREFIX, filterId, queryId)).size(), 2);
assertEquals(stateStoreProvider.getStateStore().getStateCollection(createKey(DynamicFilterUtils.TASKSPREFIX, filterId, queryId)).size(), 2);
dynamicFilterService.clearDynamicFiltersForQuery(queryId);
Thread.sleep(1000);
assertEquals(stateStoreProvider.getStateStore().getStateCollection(createKey(DynamicFilterUtils.PARTIALPREFIX, filterId, queryId)).size(), 0);
assertEquals(stateStoreProvider.getStateStore().getStateCollection(createKey(DynamicFilterUtils.TASKSPREFIX, filterId, queryId)).size(), 0);
}
use of io.prestosql.spi.dynamicfilter.HashSetDynamicFilter in project hetu-core by openlookeng.
the class TestHiveUtil method testIsPartitionFilteredWithNonPartitionFilter.
@Test
public void testIsPartitionFilteredWithNonPartitionFilter() {
TypeManager typeManager = new TestingTypeManager();
Set<DynamicFilter> dynamicFilters = new HashSet<>();
List<HivePartitionKey> partitions = new ArrayList<>();
partitions.add(new HivePartitionKey("pt_d", "0"));
partitions.add(new HivePartitionKey("app_id", "10000"));
ColumnHandle nameColumn = new HiveColumnHandle("name", HIVE_STRING, parseTypeSignature(VARCHAR), 0, REGULAR, Optional.empty());
Set nameFilter = new HashSet();
nameFilter.add("Alice");
dynamicFilters.add(new HashSetDynamicFilter("1", nameColumn, nameFilter, DynamicFilter.Type.GLOBAL));
assertFalse(isPartitionFiltered(partitions, ImmutableList.of(dynamicFilters), typeManager), "Should not filter partition if dynamicFilter is on non-partition column");
}
use of io.prestosql.spi.dynamicfilter.HashSetDynamicFilter in project hetu-core by openlookeng.
the class DataCenterPageSource method applyDynamicFilters.
private void applyDynamicFilters(Map<ColumnHandle, DynamicFilter> dynamicFilters) {
ImmutableMap.Builder<String, byte[]> builder = new ImmutableMap.Builder();
for (Map.Entry<ColumnHandle, DynamicFilter> entry : dynamicFilters.entrySet()) {
if (!appliedDynamicFilters.contains(entry.getKey().getColumnName())) {
DynamicFilter df = entry.getValue();
String columnName = entry.getKey().getColumnName();
if (df instanceof HashSetDynamicFilter) {
// FIXME: Read fpp from config
BloomFilterDynamicFilter bloomFilterDynamicFilter = BloomFilterDynamicFilter.fromHashSetDynamicFilter((HashSetDynamicFilter) df);
builder.put(columnName, bloomFilterDynamicFilter.createSerializedBloomFilter());
} else if (df instanceof CombinedDynamicFilter) {
BloomFilterDynamicFilter bloomFilterDynamicFilter = BloomFilterDynamicFilter.fromCombinedDynamicFilter((CombinedDynamicFilter) df);
if (bloomFilterDynamicFilter != null) {
builder.put(columnName, bloomFilterDynamicFilter.createSerializedBloomFilter());
}
} else if (df instanceof BloomFilterDynamicFilter) {
builder.put(columnName, ((BloomFilterDynamicFilter) df).getBloomFilterSerialized());
} else {
LOGGER.info("Dynamic Filter (type: " + df.getClass().getSimpleName() + ") skipped for DC connector");
}
}
}
Map<String, byte[]> newDynamicFilters = builder.build();
if (!newDynamicFilters.isEmpty()) {
if (client.applyDynamicFilters(newDynamicFilters)) {
appliedDynamicFilters.addAll(newDynamicFilters.keySet());
}
}
}
use of io.prestosql.spi.dynamicfilter.HashSetDynamicFilter in project hetu-core by openlookeng.
the class TestDynamicFilterSourceOperator method testGlobalDynamicFilterSourceOperatorHashSet.
@Test
public void testGlobalDynamicFilterSourceOperatorHashSet() {
String filterId = "22";
DynamicFilterSourceOperatorFactory operatorFactory = createOperatorFactory(GLOBAL, HASHSET, 1, channel(0, BIGINT, filterId));
// will finish before noMoreOperators()
DynamicFilterSourceOperator op1 = createOperator(operatorFactory);
verifyPassthrough(op1, ImmutableList.of(BIGINT), new Page(createLongsBlock(1, 2)), new Page(createLongsBlock(12, 21)), new Page(createLongsBlock(13, 22)), new Page(createLongsBlock(3, 5)));
String key = DynamicFilterUtils.createKey(PARTIALPREFIX, filterId, TEST_SESSION.getQueryId().toString());
StateSet states = ((StateSet) stateStoreProvider.getStateStore().getStateCollection(key));
for (Object bfSerialized : states.getAll()) {
HashSetDynamicFilter bfdf = new HashSetDynamicFilter(filterId, null, (Set) bfSerialized, GLOBAL);
assertTrue(bfdf.contains(22L));
assertEquals(bfdf.getSize(), 8);
}
assertEquals(stateStoreProvider.getStateStore().getStateCollection(DynamicFilterUtils.createKey(TASKSPREFIX, filterId, TEST_SESSION.getQueryId().toString())).size(), 1);
}
Aggregations