Blazer-007 commented on code in PR #4058: URL: https://github.com/apache/gobblin/pull/4058#discussion_r1813222492
########## gobblin-data-management/src/main/java/org/apache/gobblin/data/management/copy/iceberg/IcebergTable.java: ########## @@ -237,31 +238,35 @@ protected void registerIcebergTable(TableMetadata srcMetadata, TableMetadata dst * @throws RuntimeException if error occurred while reading the manifest file */ public List<DataFile> getPartitionSpecificDataFiles(Predicate<StructLike> icebergPartitionFilterPredicate) - throws TableNotFoundException { + throws IOException { TableMetadata tableMetadata = accessTableMetadata(); Snapshot currentSnapshot = tableMetadata.currentSnapshot(); long currentSnapshotId = currentSnapshot.snapshotId(); List<DataFile> knownDataFiles = new ArrayList<>(); - log.info("~{}~ for snapshot '{}' - '{}' total known iceberg datafiles", tableId, currentSnapshotId, - knownDataFiles.size()); + GrowthMilestoneTracker growthMilestoneTracker = new GrowthMilestoneTracker(); //TODO: Add support for deleteManifests as well later // Currently supporting dataManifests only List<ManifestFile> dataManifestFiles = currentSnapshot.dataManifests(this.tableOps.io()); for (ManifestFile manifestFile : dataManifestFiles) { + if (growthMilestoneTracker.isAnotherMilestone(knownDataFiles.size())) { + log.info("~{}~ for snapshot '{}' - before manifest-file '{}' '{}' total known iceberg datafiles", tableId, + currentSnapshotId, + manifestFile.path(), + knownDataFiles.size() + ); + } Review Comment: Yes, that seems like a valid approach; let me remove the GrowthMilestoneTracker from that function. -- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. To unsubscribe, e-mail: dev-unsubscr...@gobblin.apache.org For queries about this service, please contact Infrastructure at: us...@infra.apache.org