HIVE-28600: Iceberg: Check that table/partition requires compaction b… #5529

Open
wants to merge 2 commits into base: master
10 changes: 8 additions & 2 deletions common/src/java/org/apache/hadoop/hive/conf/HiveConf.java
@@ -2229,12 +2229,18 @@ public static enum ConfVars {
HIVE_ICEBERG_EXPIRE_SNAPSHOT_NUMTHREADS("hive.iceberg.expire.snapshot.numthreads", 4,
"The number of threads to be used for deleting files during expire snapshot. If set to 0 or below it uses the" +
" defult DirectExecutorService"),

HIVE_ICEBERG_MASK_DEFAULT_LOCATION("hive.iceberg.mask.default.location", false,
"If this is set to true the URI for auth will have the default location masked with DEFAULT_TABLE_LOCATION"),
HIVE_ICEBERG_ALLOW_DATAFILES_IN_TABLE_LOCATION_ONLY("hive.iceberg.allow.datafiles.in.table.location.only", false,
"If this is set to true, then all the data files being read should be withing the table location"),

HIVE_ICEBERG_MAJOR_COMPACTION_FILE_SIZE_THRESHOLD("hive.iceberg.major.compaction.file.size.threshold", "96mb",
new SizeValidator(), "Iceberg data file size in megabytes below which a file needs to be compacted."),
HIVE_ICEBERG_MINOR_COMPACTION_FILE_SIZE_THRESHOLD("hive.iceberg.minor.compaction.file.size.threshold", "16mb",
new SizeValidator(), "Iceberg data file size in megabytes below which a file needs to be compacted."),
ICEBERG_COMPACTION_FILE_SIZE_RATIO("hive.iceberg.compaction.file.size.ratio", 0.1f,
"Ratio of # data files below threshold / # data files above threshold above which compaction is needed"),
ICEBERG_COMPACTION_DELETE_RECORDS_THRESHOLD("hive.iceberg.delete.records.threshold", 100,
"Number of delete records in a table/partition above which a file needs to be compacted."),
HIVE_USE_EXPLICIT_RCFILE_HEADER("hive.exec.rcfile.use.explicit.header", true,
"If this is set the header for RCFiles will simply be RCF. If this is not\n" +
"set the header will be that borrowed from sequence files, e.g. SEQ- followed\n" +
@@ -63,6 +63,7 @@
import org.apache.hadoop.hive.metastore.Warehouse;
import org.apache.hadoop.hive.metastore.api.ColumnStatistics;
import org.apache.hadoop.hive.metastore.api.ColumnStatisticsObj;
import org.apache.hadoop.hive.metastore.api.CompactionType;
import org.apache.hadoop.hive.metastore.api.EnvironmentContext;
import org.apache.hadoop.hive.metastore.api.FieldSchema;
import org.apache.hadoop.hive.metastore.api.InvalidObjectException;
@@ -2232,4 +2233,59 @@ private static List<FieldSchema> schema(List<VirtualColumn> exprs) {
private static List<FieldSchema> orderBy(VirtualColumn... exprs) {
return schema(Arrays.asList(exprs));
}

@Override
public boolean canCompact(HiveConf hiveConf, org.apache.hadoop.hive.ql.metadata.Table table, String partitionPath,
CompactionType compactionType) throws HiveException {
Table icebergTable = IcebergTableUtil.getTable(hiveConf, table.getTTable());
return canCompact(hiveConf, icebergTable, partitionPath, compactionType);
}

@VisibleForTesting
boolean canCompact(HiveConf hiveConf, Table icebergTable, String partitionPath,
CompactionType compactionType) throws HiveException {

if (icebergTable.currentSnapshot() == null) {
LOG.info("Table {}{} doesn't require compaction because it is empty", icebergTable,
partitionPath == null ? "" : " partition " + partitionPath);
return false;
}

int deleteRecordsThreshold = HiveConf.getIntVar(hiveConf, ConfVars.ICEBERG_COMPACTION_DELETE_RECORDS_THRESHOLD);
long deleteRecordsCount = IcebergTableUtil.countDeleteRecords(icebergTable, partitionPath);
if (deleteRecordsCount > deleteRecordsThreshold) {
return true;
}

int dataFilesCount = IcebergTableUtil.getDataFiles(icebergTable, partitionPath).size();
if (dataFilesCount < 2) {
LOG.info("Table {}{} doesn't require compaction because it has less than 2 data files", icebergTable,
partitionPath == null ? "" : " partition " + partitionPath);
return false;
}

long fileSizeInBytesThreshold;
switch (compactionType) {
case MAJOR:
fileSizeInBytesThreshold = HiveConf.getSizeVar(hiveConf,
ConfVars.HIVE_ICEBERG_MAJOR_COMPACTION_FILE_SIZE_THRESHOLD);
break;
case MINOR:
fileSizeInBytesThreshold = HiveConf.getSizeVar(hiveConf,
ConfVars.HIVE_ICEBERG_MINOR_COMPACTION_FILE_SIZE_THRESHOLD);
break;
default:
throw new HiveException(String.format("Invalid compaction type: %s", compactionType.name()));
}

float fileSizeRatioThreshold = HiveConf.getFloatVar(hiveConf, ConfVars.ICEBERG_COMPACTION_FILE_SIZE_RATIO);
float fileSizeRatio = IcebergTableUtil.getUncompactedRatio(icebergTable, partitionPath, fileSizeInBytesThreshold);
if (fileSizeRatio > fileSizeRatioThreshold) {
return true;
}
LOG.info("Table {}{} doesn't require compaction because its uncompacted ratio of {} is below the threshold of {}",
icebergTable, partitionPath == null ? "" : " partition " + partitionPath, fileSizeRatio,
fileSizeRatioThreshold);
return false;
}
}
@@ -458,6 +458,52 @@ public static List<DeleteFile> getDeleteFiles(Table table, String partitionPath)
t -> ((PositionDeletesScanTask) t).file()));
}

public static float getUncompactedRatio(Table table, String partitionPath, long fileSizeInBytesThreshold) {
long uncompactedFilesCount = getDataFileCount(table, partitionPath, fileSizeInBytesThreshold, true);
long compactedFilesCount = getDataFileCount(table, partitionPath, fileSizeInBytesThreshold, false);
Contributor:
Why is fileSizeInBytesThreshold used as the comparator for deciding whether a file is compacted or uncompacted?
Isn't there a better approach for this check?

Contributor Author (@difin), Nov 14, 2024:
A file is classified as compacted or uncompacted by comparing its actual size with the threshold defined in Conf for the given compaction type:

HIVE_ICEBERG_MAJOR_COMPACTION_FILE_SIZE_THRESHOLD("hive.iceberg.major.compaction.file.size.threshold", "96mb",
        new SizeValidator(), "Iceberg data file size in megabytes below which a file needs to be compacted."),
HIVE_ICEBERG_MINOR_COMPACTION_FILE_SIZE_THRESHOLD("hive.iceberg.minor.compaction.file.size.threshold", "16mb",
        new SizeValidator(), "Iceberg data file size in megabytes below which a file needs to be compacted."),

fileSizeInBytesThreshold gets the value from these configs depending on compaction type.
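
A minimal sketch (not part of the PR's diff) of the classification described above, using only calls that already appear in this change; dataFile stands for any org.apache.iceberg.DataFile returned by the scan, and the MAJOR threshold is assumed (the MINOR case is identical):

// Resolve the size threshold for the chosen compaction type.
long fileSizeInBytesThreshold = HiveConf.getSizeVar(hiveConf,
    ConfVars.HIVE_ICEBERG_MAJOR_COMPACTION_FILE_SIZE_THRESHOLD);
// A data file counts as uncompacted when its size is below the configured threshold.
boolean uncompacted = dataFile.fileSizeInBytes() < fileSizeInBytesThreshold;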


if (uncompactedFilesCount == 0) {
return 0;
} else if (compactedFilesCount == 0) {
return 1;
} else {
return uncompactedFilesCount * 1.0f / (uncompactedFilesCount + compactedFilesCount);
}
}

private static long getDataFileCount(Table table, String partitionPath, long fileSizeInBytesThreshold,
boolean isLess) {
CloseableIterable<FileScanTask> fileScanTasks =
table.newScan().useSnapshot(table.currentSnapshot().snapshotId()).ignoreResiduals().planFiles();
CloseableIterable<FileScanTask> filteredFileScanTasks =
CloseableIterable.filter(fileScanTasks, t -> {
DataFile file = t.asFileScanTask().file();
return (!table.spec().isPartitioned() ||
partitionPath == null && file.specId() != table.spec().specId() ||
Contributor:
Please use better separation between operands to make it readable/understandable and reliable, since now the precedence can cause issues.

Like: ((a==b && c!=2) && (a!=b && c=2) && (...) )

Contributor Author (@difin), Nov 14, 2024:
Previously I used braces in a very similar case, and @deniskuzZ asked to remove them: #5389 (comment)

The precedence won't cause issues because in Java the && operator has higher precedence than ||, so the expression is evaluated deterministically (see the explicitly parenthesized restatement after this method).

partitionPath != null &&
table.specs().get(file.specId()).partitionToPath(file.partition()).equals(partitionPath)) &&
(isLess ? file.fileSizeInBytes() < fileSizeInBytesThreshold :
file.fileSizeInBytes() >= fileSizeInBytesThreshold);
});
return Lists.newArrayList(filteredFileScanTasks).size();
}
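
For readers following the precedence discussion above, here is the same filter predicate with the grouping that Java's operator precedence already implies written out explicitly; this is a readability aid only, not a change proposed in the PR:

DataFile file = t.asFileScanTask().file();
return (!table.spec().isPartitioned()
    || (partitionPath == null && file.specId() != table.spec().specId())
    || (partitionPath != null
        && table.specs().get(file.specId()).partitionToPath(file.partition()).equals(partitionPath)))
    && (isLess ? file.fileSizeInBytes() < fileSizeInBytesThreshold
               : file.fileSizeInBytes() >= fileSizeInBytesThreshold);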

public static long countDeleteRecords(Table table, String partitionPath) {
Table deletesTable =
MetadataTableUtils.createMetadataTableInstance(table, MetadataTableType.POSITION_DELETES);
CloseableIterable<ScanTask> deletesScanTasks = deletesTable.newBatchScan().planFiles();
CloseableIterable<ScanTask> filteredDeletesScanTasks =
CloseableIterable.filter(deletesScanTasks, t -> {
DeleteFile file = ((PositionDeletesScanTask) t).file();
return !table.spec().isPartitioned() ||
Contributor:
Please use better separation between operands to make it readable/understandable and reliable, since now the precedence can cause issues.

Like: ((a==b && c!=2) && (a!=b && c=2) && (...) )

Contributor Author (@difin), Nov 14, 2024:
As in the previous comment, I used braces in a very similar case before, and @deniskuzZ asked to remove them: #5389 (comment)

The precedence won't cause issues because in Java the && operator has higher precedence than ||, so the expression is evaluated deterministically.

Contributor:
Highly disagree. Please check this:

boolean x = false;
boolean y = true;
boolean z = true;
if(x && y ||z){
  System.out.println("true");
}else{
  System.out.println("false");
}

if(x && (y ||z)){
  System.out.println("true");
}else{
  System.out.println("false");
}

The result for the first is true, for the second it is false.

Contributor Author (@difin), Nov 14, 2024:
There seems to be no contradiction; your test confirms that && has higher precedence than ||, as it gets evaluated first.

First case:

x && y || z
false && true || true
false || true
true

Second case:

x && (y || z)
false && (true || true)
false && (true)
false

partitionPath == null && file.specId() != table.spec().specId() ||
partitionPath != null &&
table.specs().get(file.specId()).partitionToPath(file.partition()).equals(partitionPath);
});
return Lists.newArrayList(CloseableIterable.transform(filteredDeletesScanTasks,
t -> ((PositionDeletesScanTask) t).file().recordCount())).stream().mapToLong(Long::longValue).sum();
}

public static Expression generateExpressionFromPartitionSpec(Table table, Map<String, String> partitionSpec)
throws SemanticException {
Map<String, PartitionField> partitionFieldMap = getPartitionFields(table).stream()