prestodb · highker · Oct 12, 2021 · Sep 24, 2021 · highker · Oct 7, 2021
@@ -318,7 +318,7 @@ public Page getLoadedPage()
 
     public Page getLoadedPage(int channel)
     {
-        return wrapBlocksWithoutCopy(positionCount, new Block[]{this.blocks[channel].getLoadedBlock()});
+        return wrapBlocksWithoutCopy(positionCount, new Block[] {this.blocks[channel].getLoadedBlock()});
     }
 
     public Page getLoadedPage(int... channels)
@@ -377,7 +377,7 @@ public Page copyPositions(int[] retainedPositions, int offset, int length)
 
     public Page extractChannel(int channel)
     {
-        return wrapBlocksWithoutCopy(positionCount, new Block[]{this.blocks[channel]});
+        return wrapBlocksWithoutCopy(positionCount, new Block[] {this.blocks[channel]});
     }
 
     public Page extractChannels(int[] channels)
@@ -404,6 +404,18 @@ public Page prependColumn(Block column)
         return wrapBlocksWithoutCopy(positionCount, result);
     }
 
+    /**
+     * Returns a page holding every block of this page except the one at {@code channelIndex}.
+     * The remaining blocks keep their relative order and are handed to
+     * {@code wrapBlocksWithoutCopy} together with this page's position count.
+     *
+     * @param channelIndex zero-based index of the channel to leave out
+     * @return a page with one channel fewer than this page
+     * @throws IndexOutOfBoundsException if {@code channelIndex} is negative or not less than the channel count
+     */
+    public Page dropColumn(int channelIndex)
+    {
+        int channelCount = getChannelCount();
+        boolean validChannel = channelIndex >= 0 && channelIndex < channelCount;
+        if (!validChannel) {
+            throw new IndexOutOfBoundsException(format("Invalid channel %d in page with %s channels", channelIndex, channelCount));
+        }
+
+        Block[] remaining = new Block[channelCount - 1];
+        int trailingChannels = channelCount - channelIndex - 1;
+        // Channels before the dropped one keep their index; channels after it shift left by one
+        System.arraycopy(blocks, 0, remaining, 0, channelIndex);
+        System.arraycopy(blocks, channelIndex + 1, remaining, channelIndex, trailingChannels);
+        return wrapBlocksWithoutCopy(positionCount, remaining);
+    }
+
     private long updateRetainedSize()
     {
         long retainedSizeInBytes = INSTANCE_SIZE + sizeOf(blocks);

@@ -147,6 +147,21 @@ public int getPositionCount()
         return nullCheckBlock.getPositionCount();
     }
 
+    /**
+     * Counts the positions for which {@link #isNull(int)} returns false.
+     *
+     * @return the number of non-null positions; equal to {@link #getPositionCount()}
+     *         when {@code nullCheckBlock} reports that it cannot contain nulls
+     */
+    public int getNonNullPositionCount()
+    {
+        // Skip the per-position scan entirely when the null-check block cannot hold nulls
+        if (!nullCheckBlock.mayHaveNull()) {
+            return getPositionCount();
+        }
+
+        int nonNullPositions = 0;
+        int position = 0;
+        while (position < getPositionCount()) {
+            nonNullPositions += isNull(position) ? 0 : 1;
+            position++;
+        }
+        return nonNullPositions;
+    }
+
     public boolean isNull(int position)
     {
         return nullCheckBlock.isNull(position);

@@ -125,6 +125,7 @@ public final class SystemSessionProperties
     public static final String JOIN_SPILL_ENABLED = "join_spill_enabled";
     public static final String AGGREGATION_SPILL_ENABLED = "aggregation_spill_enabled";
     public static final String DISTINCT_AGGREGATION_SPILL_ENABLED = "distinct_aggregation_spill_enabled";
+    public static final String DEDUP_BASED_DISTINCT_AGGREGATION_SPILL_ENABLED = "dedup_based_distinct_aggregation_spill_enabled";
     public static final String ORDER_BY_AGGREGATION_SPILL_ENABLED = "order_by_aggregation_spill_enabled";
     public static final String WINDOW_SPILL_ENABLED = "window_spill_enabled";
     public static final String ORDER_BY_SPILL_ENABLED = "order_by_spill_enabled";
@@ -630,6 +631,11 @@ public SystemSessionProperties(
                         "Enable spill for distinct aggregations if spill_enabled and aggregation_spill_enabled",
                         featuresConfig.isDistinctAggregationSpillEnabled(),
                         false),
+                booleanProperty(
+                        DEDUP_BASED_DISTINCT_AGGREGATION_SPILL_ENABLED,
+                        "Perform deduplication of input data for distinct aggregates before spilling",
+                        featuresConfig.isDedupBasedDistinctAggregationSpillEnabled(),
+                        false),
                 booleanProperty(
                         ORDER_BY_AGGREGATION_SPILL_ENABLED,
                         "Enable spill for order-by aggregations if spill_enabled and aggregation_spill_enabled",
@@ -1506,6 +1512,11 @@ public static boolean isDistinctAggregationSpillEnabled(Session session)
         return session.getSystemProperty(DISTINCT_AGGREGATION_SPILL_ENABLED, Boolean.class) && isAggregationSpillEnabled(session);
     }
 
+    /**
+     * Reads the {@code DEDUP_BASED_DISTINCT_AGGREGATION_SPILL_ENABLED} system property of the session.
+     * Unlike {@code isDistinctAggregationSpillEnabled}, the value is returned as-is and is not
+     * combined with {@code isAggregationSpillEnabled}.
+     *
+     * @param session the session whose system property is read
+     * @return the value of the property for this session
+     */
+    public static boolean isDedupBasedDistinctAggregationSpillEnabled(Session session)
+    {
+        Boolean dedupEnabled = session.getSystemProperty(DEDUP_BASED_DISTINCT_AGGREGATION_SPILL_ENABLED, Boolean.class);
+        return dedupEnabled;
+    }
+
     public static boolean isOrderByAggregationSpillEnabled(Session session)
     {
         return session.getSystemProperty(ORDER_BY_AGGREGATION_SPILL_ENABLED, Boolean.class) && isAggregationSpillEnabled(session);

@@ -164,6 +164,14 @@ public Work<?> addPage(Page page)
         return new AddPageWork(page.getBlock(hashChannel));
     }
 
+    /**
+     * Intentionally unimplemented: per the author's note, nothing in the code invokes this
+     * method on this implementation. Supply a real implementation if that changes.
+     *
+     * @throws UnsupportedOperationException always
+     */
+    @Override
+    public List<Page> getBufferedPages()
+    {
+        String message = "BigIntGroupByHash does not support getBufferedPages";
+        throw new UnsupportedOperationException(message);
+    }
+
     @Override
     public Work<GroupByIdBlock> getGroupIds(Page page)
     {

@@ -69,6 +69,8 @@ static GroupByHash createGroupByHash(
 
     Work<?> addPage(Page page);
 
+    List<Page> getBufferedPages(); // some implementations throw UnsupportedOperationException instead of returning pages
+
     Work<GroupByIdBlock> getGroupIds(Page page);
 
     boolean contains(int position, Page page, int[] hashChannels);

@@ -60,6 +60,11 @@ public int getCapacity()
         return groupByHash.getCapacity();
     }
 
+    /**
+     * Returns whatever {@code groupByHash.getBufferedPages()} yields for the underlying hash.
+     *
+     * @return the pages reported as buffered by {@code groupByHash}
+     */
+    public List<Page> getDistinctPages()
+    {
+        List<Page> bufferedPages = groupByHash.getBufferedPages();
+        return bufferedPages;
+    }
+
     private Block processNextGroupIds(GroupByIdBlock ids)
     {
         int positions = ids.getPositionCount();

@@ -224,6 +224,25 @@ public Work<?> addPage(Page page)
         return new AddNonDictionaryPageWork(page);
     }
 
+    /**
+     * Assembles pages from the per-channel block builders held in {@code channelBuilders}.
+     * The number of pages is taken from the first channel's builder list; for each page index,
+     * the builder of every channel in {@code channels} is built into a block and the blocks are
+     * combined into one page. Pages with zero positions are left out of the result.
+     *
+     * @return an immutable list of the non-empty pages
+     */
+    @Override
+    public List<Page> getBufferedPages()
+    {
+        ImmutableList.Builder<Page> bufferedPages = ImmutableList.builder();
+        int pageCount = channelBuilders.get(0).size();
+        for (int pageIndex = 0; pageIndex < pageCount; pageIndex++) {
+            Block[] pageBlocks = new Block[channels.length];
+            for (int channel = 0; channel < pageBlocks.length; channel++) {
+                BlockBuilder builder = (BlockBuilder) channelBuilders.get(channel).get(pageIndex);
+                pageBlocks[channel] = builder.build();
+            }
+
+            Page bufferedPage = new Page(pageBlocks);
+            if (bufferedPage.getPositionCount() <= 0) {
+                // Nothing was appended to this page's builders; skip it
+                continue;
+            }
+            bufferedPages.add(bufferedPage);
+        }
+        return bufferedPages.build();
+    }
+
     @Override
     public Work<GroupByIdBlock> getGroupIds(Page page)
     {

@@ -75,6 +75,14 @@ public Work<?> addPage(Page page)
         return new CompletedWork<>(0);
     }
 
+    /**
+     * Intentionally unimplemented: per the author's note, nothing in the code invokes this
+     * method on this implementation. Supply a real implementation if that changes.
+     *
+     * @throws UnsupportedOperationException always
+     */
+    @Override
+    public List<Page> getBufferedPages()
+    {
+        String message = "NoChannelGroupByHash does not support getBufferedPages";
+        throw new UnsupportedOperationException(message);
+    }
+
     @Override
     public Work<GroupByIdBlock> getGroupIds(Page page)
     {