[I] Query failure for 0.14.0 [hudi]

via GitHub Sun, 30 Nov 2025 01:12:46 -0800


hudi-bot opened a new issue, #16278:
URL: https://github.com/apache/hudi/issues/16278


   {code:java}
   Caused by: org.apache.spark.SparkException: Job aborted due to stage 
failure: ShuffleMapStage 1054 (run at AccessController.java:0) has failed the 
maximum allowable number of times: 4. Most recent failure 
reason:org.apache.spark.shuffle.MetadataFetchFailedException: Missing an output 
location for shuffle 259 partition 31   at 
org.apache.spark.MapOutputTracker$.validateStatus(MapOutputTracker.scala:1705)  
     at 
org.apache.spark.MapOutputTracker$.$anonfun$convertMapStatuses$10(MapOutputTracker.scala:1652)
       at 
org.apache.spark.MapOutputTracker$.$anonfun$convertMapStatuses$10$adapted(MapOutputTracker.scala:1651)
       at scala.collection.Iterator.foreach(Iterator.scala:943)        at 
scala.collection.Iterator.foreach$(Iterator.scala:943)       at 
scala.collection.AbstractIterator.foreach(Iterator.scala:1431)       at 
org.apache.spark.MapOutputTracker$.convertMapStatuses(MapOutputTracker.scala:1651)
   at 
org.apache.spark.MapOutputTrackerWorker.getMapSizesByExecutorIdImpl(MapOutputTracker.scala:1294)
     at 
org.apache.spark.MapOutputTrackerWorker.getMapSizesByExecutorId(MapOutputTracker.scala:1256)   
at 
org.apache.spark.shuffle.sort.SortShuffleManager.getReader(SortShuffleManager.scala:140)
     at 
org.apache.spark.shuffle.ShuffleManager.getReader(ShuffleManager.scala:63)   at 
org.apache.spark.shuffle.ShuffleManager.getReader$(ShuffleManager.scala:57)  at 
org.apache.spark.shuffle.sort.SortShuffleManager.getReader(SortShuffleManager.scala:73)
      at 
org.apache.spark.sql.execution.ShuffledRowRDD.compute(ShuffledRowRDD.scala:208) 
     at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:365)      at 
org.apache.spark.rdd.RDD.iterator(RDD.scala:329)     at 
org.apache.spark.rdd.ZippedPartitionsRDD2.compute(ZippedPartitionsRDD.scala:89) 
     at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:365)      at 
org.apache.spark.rdd.RDD.iterator(RDD.scala:329)     at 
org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)     at 
org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:365)      at 
org.apache.spark.rdd.RDD.iterator(RDD.scala:329)     at 
org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)     at 
org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:365)      at 
org.apache.spark.rdd.RDD.iterator(RDD.scala:329)     at 
org.apache.spark.shuffle.ShuffleWriteProcessor.write(ShuffleWriteProcessor.scala:59)
 at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:99)  
 at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:52)  
 at org.apache.spark.scheduler.Task.run(Task.scala:138)  at 
org.apache.spark.executor.Executor$TaskRunner.$anonfun$run$3(Executor.scala:548)
     at org.apache.spark.util.Utils$.tryWithSafeFinally(Utils.scala:1516)    at 
org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:551)        at 
java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149) 
     at 
java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624) 
     at java.lang.Thread.run(Thread.java:750)
        at 
org.apache.spark.scheduler.DAGScheduler.failJobAndIndependentStages(DAGScheduler.scala:2863)
 at 
org.apache.spark.scheduler.DAGScheduler.$anonfun$abortStage$2(DAGScheduler.scala:2799)
       at 
org.apache.spark.scheduler.DAGScheduler.$anonfun$abortStage$2$adapted(DAGScheduler.scala:2798)
       at 
scala.collection.mutable.ResizableArray.foreach(ResizableArray.scala:62)     at 
scala.collection.mutable.ResizableArray.foreach$(ResizableArray.scala:55)    at 
scala.collection.mutable.ArrayBuffer.foreach(ArrayBuffer.scala:49)   at 
org.apache.spark.scheduler.DAGScheduler.abortStage(DAGScheduler.scala:2798)  at 
org.apache.spark.scheduler.DAGScheduler.handleTaskCompletion(DAGScheduler.scala:1995)
        at 
org.apache.spark.scheduler.DAGSchedulerEventProcessLoop.doOnReceive(DAGScheduler.scala:3048)
 at 
org.apache.spark.scheduler.DAGSchedulerEventProcessLoop.onReceive(DAGScheduler.scala:2993)
   at 
org.apache.spark.scheduler.DAGSchedulerEventProcessLoop.onReceive(DAGScheduler.scala:2982)
   at 
org.apache.spark.util.EventLoop$$anon$1.run(EventLoop.scala:49)        at 
org.apache.spark.sql.execution.adaptive.AdaptiveExecutor.checkNoFailures(AdaptiveExecutor.scala:154)
 at 
org.apache.spark.sql.execution.adaptive.AdaptiveExecutor.doRun(AdaptiveExecutor.scala:88)
    at 
org.apache.spark.sql.execution.adaptive.AdaptiveExecutor.tryRunningAndGetFuture(AdaptiveExecutor.scala:66)
   at 
org.apache.spark.sql.execution.adaptive.AdaptiveExecutor.execute(AdaptiveExecutor.scala:57)
  at 
org.apache.spark.sql.execution.adaptive.AdaptiveSparkPlanExec.$anonfun$getFinalPhysicalPlan$1(AdaptiveSparkPlanExec.scala:249)
       at org.apache.spark.sql.SparkSession.withActive(SparkSession.scala:779) 
at 
org.apache.spark.sql.execution.adaptive.AdaptiveSparkPlanExec.getFinalPhysicalPlan(AdaptiveSparkPlanExec.scala:248)
  at 
org.apache.spark.sql.execution.adaptive.AdaptiveSparkPlanExec.withFinalPlanUpdate(AdaptiveSparkPlanExec.scala:521)
   at 
org.apache.spark.sql.execution.adaptive.AdaptiveSparkPlanExec.executeCollect(AdaptiveSparkPlanExec.scala:483)
        at 
org.apache.spark.sql.Dataset.collectFromPlan(Dataset.scala:3932)       at 
org.apache.spark.sql.Dataset.$anonfun$collect$1(Dataset.scala:3161)  at 
org.apache.spark.sql.Dataset.$anonfun$withAction$2(Dataset.scala:3922)       at 
org.apache.spark.sql.execution.QueryExecution$.withInternalError(QueryExecution.scala:554)
   at org.apache.spark.sql.Dataset.$anonfun$withAction$1(Dataset.scala:3920)    
   at 
org.apache.spark.sql.catalyst.QueryPlanningTracker$.withTracker(QueryPlanningTracker.scala:107)
      at 
org.apache.spark.sql.execution.SQLExecution$.withTracker(SQLExecution.scala:224)
     at 
org.apache.spark.sql.execution.SQLExecution$.executeQuery$1(SQLExecution.scala:114)
  at 
org.apache.spark.sql.execution.SQLExecution$.$anonfun$withNewExecutionId$7(SQLExecution.scala:139)
   at 
org.apache.spark.sql.catalyst.QueryPlanningTracker$.withTracker(QueryPlanningTracker.scala:107)
      at 
org.apache.spark.sql.execution.SQLExecution$.withTracker(SQLExecution.scala:224)
     at 
org.apache.spark.sql.execution.SQLExecution$.$anonfun$withNewExecutionId$6(SQLExecution.scala:139)  at 
org.apache.spark.sql.execution.SQLExecution$.withSQLConfPropagated(SQLExecution.scala:245)
   at 
org.apache.spark.sql.execution.SQLExecution$.$anonfun$withNewExecutionId$1(SQLExecution.scala:138)
   at org.apache.spark.sql.SparkSession.withActive(SparkSession.scala:779) at 
org.apache.spark.sql.execution.SQLExecution$.withNewExecutionId(SQLExecution.scala:68)
       at org.apache.spark.sql.Dataset.withAction(Dataset.scala:3920)  at 
org.apache.spark.sql.Dataset.collect(Dataset.scala:3161)     at 
org.apache.spark.sql.hive.thriftserver.SparkExecuteStatementOperation.org$apache$spark$sql$hive$thriftserver$SparkExecuteStatementOperation$$execute(SparkExecuteStatementOperation.scala:300)
       ... 16 more
        at 
org.apache.hive.jdbc.HiveStatement.waitForOperationToComplete(HiveStatement.java:401)
 ~[hive-jdbc-3.1.3.jar:3.1.3]   at 
org.apache.hive.jdbc.HiveStatement.execute(HiveStatement.java:266) 
~[hive-jdbc-3.1.3.jar:3.1.3]      at 
com.microsoft.lst_bench.common.LSTBenchmarkExecutor$Worker.executeTask(LSTBenchmarkExecutor.java:274)
 ~[lst-bench-0.1-SNAPSHOT.jar:?]        at 
com.microsoft.lst_bench.common.LSTBenchmarkExecutor$Worker.call(LSTBenchmarkExecutor.java:248)
 ~[lst-bench-0.1-SNAPSHOT.jar:?]       at 
com.microsoft.lst_bench.common.LSTBenchmarkExecutor$Worker.call(LSTBenchmarkExecutor.java:222)
 ~[lst-bench-0.1-SNAPSHOT.jar:?]       at 
java.util.concurrent.FutureTask.run(FutureTask.java:264) ~[?:?]      at 
java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1128) 
~[?:?]       at 
java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:628) 
~[?:?]       at java.lang.Thread.run(Thread.java:829) ~[?:?] {code}
   
   ## JIRA info
   
   - Link: https://issues.apache.org/jira/browse/HUDI-6988
   - Type: Sub-task


-- 
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.

To unsubscribe, e-mail: [email protected]

For queries about this service, please contact Infrastructure at:
[email protected]

[I] Query failure for 0.14.0 [hudi]

Reply via email to