codope commented on issue #7209:
URL: https://github.com/apache/hudi/issues/7209#issuecomment-1330149146

   I inspected the last clean instant in the above timeline but did not hit the 
same issue.
   ```
   scala> import org.apache.hudi.common.table.HoodieTableMetaClient
   import org.apache.hudi.common.table.HoodieTableMetaClient
   
   scala> import org.apache.hudi.common.table.timeline.TimelineMetadataUtils
   import org.apache.hudi.common.table.timeline.TimelineMetadataUtils
   
   scala> import org.apache.hudi.avro.model.HoodieCleanMetadata
   import org.apache.hudi.avro.model.HoodieCleanMetadata
   
   scala> val metaClient = 
HoodieTableMetaClient.builder().setConf(sc.hadoopConfiguration).setBasePath("file:///opt/issue-7209").build()
   metaClient: org.apache.hudi.common.table.HoodieTableMetaClient = 
HoodieTableMetaClient{basePath='file:/opt/issue-7209', 
metaPath='file:/opt/issue-7209/.hoodie', tableType=MERGE_ON_READ}
   
   scala> val lastCleanInstant = 
metaClient.getActiveTimeline().getCleanerTimeline().filterCompletedInstants().lastInstant()
   lastCleanInstant: 
org.apache.hudi.common.util.Option[org.apache.hudi.common.table.timeline.HoodieInstant]
 = Option{val=[20221110205549920__clean__COMPLETED]}
   
   scala> val cleanMetadata = 
TimelineMetadataUtils.deserializeHoodieCleanMetadata(metaClient.getActiveTimeline().getInstantDetails(lastCleanInstant.get()).get())
   cleanMetadata: org.apache.hudi.avro.model.HoodieCleanMetadata = 
{"startCleanTime": "20221110205549920", "timeTakenInMillis": 2354, 
"totalFilesDeleted": 2668, "earliestCommitToRetain": "20221110201240334", 
"lastCompletedCommitTimestamp": "", "partitionMetadata": 
{"year=2022/month=10/week=41/day=11/hour=06/app=mapy/os=android": 
{"partitionPath": 
"year=2022/month=10/week=41/day=11/hour=06/app=mapy/os=android", "policy": 
"KEEP_LATEST_COMMITS", "deletePathPatterns": 
["e4eff7fe-2c45-4a54-a64a-447f05c5c271-0_393-184-83092_20221110194231092.parquet"],
 "successDeleteFiles": 
["e4eff7fe-2c45-4a54-a64a-447f05c5c271-0_393-184-83092_20221110194231092.parquet"],
 "failedDeleteFiles": [], "isPartitionDeleted": false}, 
"year=2022/month=11/week=44/day=05/hour=18/app=sbrowser/os=android": 
{"partitionPath":...
   scala>
   ```
   
   It looks like the offending commit `20221115122551524` is not present in the 
attached timeline.
   Just before the error, we see the following logs:
   ```
   2022-11-15 12:32:28,321 INFO fs.FSUtils: Removed directory at 
/hits/app/hudi_cileni/.hoodie/.temp/20221115122551524
   2022-11-15 12:32:28,321 INFO client.BaseHoodieWriteClient: Async cleaner has 
been spawned. Waiting for it to finish
   2022-11-15 12:32:28,321 INFO async.AsyncCleanerService: Waiting for async 
clean service to finish
   ```
   
   We need to inspect this commit. @koldic Do you have the above commit info?


-- 
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.

To unsubscribe, e-mail: [email protected]

For queries about this service, please contact Infrastructure at:
[email protected]

Reply via email to