Ethan Guo created HUDI-3398:
-------------------------------

             Summary: Schema validation fails for metadata table base file
                 Key: HUDI-3398
                 URL: https://issues.apache.org/jira/browse/HUDI-3398
             Project: Apache Hudi
          Issue Type: Bug
          Components: writer-core
            Reporter: Ethan Guo
            Assignee: Ethan Guo
             Fix For: 0.11.0


Stacktrace:
{code:java}
java.lang.IllegalArgumentException: Unknown file format :file:/Users/ethan/Work/data/hudi/metadata_test_ds_mor_continuous_4/.hoodie/metadata/files/files-0000_0-93-815_20220208164926830001.hfile
    at org.apache.hudi.common.table.TableSchemaResolver.getTableParquetSchemaFromDataFile(TableSchemaResolver.java:103)
    at org.apache.hudi.common.table.TableSchemaResolver.getTableAvroSchemaFromDataFile(TableSchemaResolver.java:119)
    at org.apache.hudi.common.table.TableSchemaResolver.hasOperationField(TableSchemaResolver.java:480)
    at org.apache.hudi.common.table.TableSchemaResolver.<init>(TableSchemaResolver.java:65)
    at org.apache.hudi.table.HoodieTable.validateSchema(HoodieTable.java:682)
    at org.apache.hudi.table.HoodieTable.validateUpsertSchema(HoodieTable.java:698)
    at org.apache.hudi.client.SparkRDDWriteClient.upsertPreppedRecords(SparkRDDWriteClient.java:173)
    at org.apache.hudi.metadata.SparkHoodieBackedTableMetadataWriter.commit(SparkHoodieBackedTableMetadataWriter.java:154)
    at org.apache.hudi.metadata.HoodieBackedTableMetadataWriter.processAndCommit(HoodieBackedTableMetadataWriter.java:663)
    at org.apache.hudi.metadata.HoodieBackedTableMetadataWriter.update(HoodieBackedTableMetadataWriter.java:675)
    at org.apache.hudi.client.BaseHoodieWriteClient.lambda$writeTableMetadata$0(BaseHoodieWriteClient.java:273)
    at org.apache.hudi.common.util.Option.ifPresent(Option.java:96)
    at org.apache.hudi.client.BaseHoodieWriteClient.writeTableMetadata(BaseHoodieWriteClient.java:273)
    at org.apache.hudi.client.BaseHoodieWriteClient.commit(BaseHoodieWriteClient.java:229)
    at org.apache.hudi.client.BaseHoodieWriteClient.commitStats(BaseHoodieWriteClient.java:199)
    at org.apache.hudi.client.SparkRDDWriteClient.commit(SparkRDDWriteClient.java:127)
    at org.apache.hudi.utilities.deltastreamer.DeltaSync.writeToSink(DeltaSync.java:609)
    at org.apache.hudi.utilities.deltastreamer.DeltaSync.syncOnce(DeltaSync.java:329)
    at org.apache.hudi.utilities.deltastreamer.HoodieDeltaStreamer$DeltaSyncService.lambda$startService$0(HoodieDeltaStreamer.java:652)
    at java.util.concurrent.CompletableFuture$AsyncSupply.run(CompletableFuture.java:1604)
    at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149)
    at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624)
    at java.lang.Thread.run(Thread.java:748)
{code}
Full logs: https://gist.github.com/yihua/e00a1caddacbdc570b5b757049750f39



--
This message was sent by Atlassian Jira
(v8.20.1#820001)

Reply via email to