[
https://issues.apache.org/jira/browse/HIVE-29658?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=18088365#comment-18088365
]
tanishqchugh commented on HIVE-29658:
-------------------------------------
[~zabetak] I have updated the description and added the entire trace as an
attachment as well.
> OrcEncodedDataReader runs into NPE when LLAP IO cache is disabled
> -----------------------------------------------------------------
>
> Key: HIVE-29658
> URL: https://issues.apache.org/jira/browse/HIVE-29658
> Project: Hive
> Issue Type: Bug
> Reporter: tanishqchugh
> Assignee: tanishqchugh
> Priority: Major
> Labels: pull-request-available
> Attachments: complete_error_trace.log
>
>
> When the LLAP IO cache is disabled by setting _hive.llap.io.memory.mode_ to
> {_}none{_}, queries using the ORC reader run into an NPE.
> Minimal Queries to Repro:
> {code:java}
> CREATE TABLE llap_none_orc_src (
> id INT,
> name STRING
> )
> STORED AS ORC;
> INSERT INTO llap_none_orc_src VALUES (1, 'a'), (2, 'b');
> CREATE TABLE llap_none_orc_merged STORED AS ORC AS
> SELECT id, name FROM llap_none_orc_src;{code}
> Error Stack Trace:
> {code:java}
> org.apache.hadoop.hive.ql.exec.tez.TezRuntimeException: Vertex failed,
> vertexName=Map 1, vertexId=vertex_1781205777276_0001_2_00, diagnostics=[Task
> failed, taskId=task_1781205777276_0001_2_00_000000, diagnostics=[TaskAttempt
> 0 failed, info=[Error: Error while running task ( failure ) :
> attempt_1781205777276_0001_2_00_000000_0:java.lang.RuntimeException:
> org.apache.hadoop.hive.ql.metadata.HiveException: java.io.IOException:
> java.lang.NullPointerException: Cannot invoke
> "org.apache.hadoop.hive.llap.cache.PathCache.touch(Object, String)" because
> "this.pathCache" is null
> at
> org.apache.hadoop.hive.ql.exec.tez.TezProcessor.initializeAndRunProcessor(TezProcessor.java:341)
> at org.apache.hadoop.hive.ql.exec.tez.TezProcessor.run(TezProcessor.java:276)
> at
> org.apache.tez.runtime.LogicalIOProcessorRuntimeTask.run(LogicalIOProcessorRuntimeTask.java:381)
> at
> org.apache.tez.runtime.task.TaskRunner2Callable$1.run(TaskRunner2Callable.java:86)
> at
> org.apache.tez.runtime.task.TaskRunner2Callable$1.run(TaskRunner2Callable.java:72)
> at
> java.base/java.security.AccessController.doPrivileged(AccessController.java:714)
> at java.base/javax.security.auth.Subject.doAs(Subject.java:525)
> at
> org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:1953)
> at
> org.apache.tez.runtime.task.TaskRunner2Callable.callInternal(TaskRunner2Callable.java:72)
> at
> org.apache.tez.runtime.task.TaskRunner2Callable.callInternal(TaskRunner2Callable.java:42)
> at org.apache.tez.common.CallableWithNdc.call(CallableWithNdc.java:36)
> at
> org.apache.hadoop.hive.llap.daemon.impl.StatsRecordingThreadPool$WrappedCallable.call(StatsRecordingThreadPool.java:111)
> at java.base/java.util.concurrent.FutureTask.run(FutureTask.java:317)
> at
> java.base/java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1144)
> at
> java.base/java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:642)
> at java.base/java.lang.Thread.run(Thread.java:1583)
> Caused by: org.apache.hadoop.hive.ql.metadata.HiveException:
> java.io.IOException: java.lang.NullPointerException: Cannot invoke
> "org.apache.hadoop.hive.llap.cache.PathCache.touch(Object, String)" because
> "this.pathCache" is null
> at
> org.apache.hadoop.hive.ql.exec.tez.MapRecordSource.pushRecord(MapRecordSource.java:89)
>
> at
> org.apache.hadoop.hive.ql.exec.tez.MapRecordProcessor.run(MapRecordProcessor.java:417)
>
> at
> org.apache.hadoop.hive.ql.exec.tez.TezProcessor.initializeAndRunProcessor(TezProcessor.java:293)
>
> ... 15 more
> Caused by: java.io.IOException: java.lang.NullPointerException: Cannot invoke
> "org.apache.hadoop.hive.llap.cache.PathCache.touch(Object, String)" because
> "this.pathCache" is null
> at
> org.apache.hadoop.hive.llap.io.api.impl.LlapRecordReader.rethrowErrorIfAny(LlapRecordReader.java:611)
>
> at
> org.apache.hadoop.hive.llap.io.api.impl.LlapRecordReader.nextCvb(LlapRecordReader.java:564)
>
> at
> org.apache.hadoop.hive.llap.io.api.impl.LlapRecordReader.next(LlapRecordReader.java:387)
>
> at
> org.apache.hadoop.hive.llap.io.api.impl.LlapRecordReader.next(LlapRecordReader.java:89)
>
> at
> org.apache.hadoop.hive.ql.io.HiveContextAwareRecordReader.doNext(HiveContextAwareRecordReader.java:374)
>
> at
> org.apache.hadoop.hive.ql.io.HiveRecordReader.doNext(HiveRecordReader.java:82)
>
> at
> org.apache.hadoop.hive.ql.io.HiveContextAwareRecordReader.next(HiveContextAwareRecordReader.java:118)
>
> at
> org.apache.hadoop.hive.ql.io.HiveContextAwareRecordReader.next(HiveContextAwareRecordReader.java:58)
>
> at
> org.apache.hadoop.mapred.split.TezGroupedSplitsInputFormat$TezGroupedSplitsRecordReader.next(TezGroupedSplitsInputFormat.java:208)
>
> at org.apache.tez.mapreduce.lib.MRReaderMapred.next(MRReaderMapred.java:116)
> at
> org.apache.hadoop.hive.ql.exec.tez.MapRecordSource.pushRecord(MapRecordSource.java:75)
>
> ... 17 more
> Caused by: java.lang.NullPointerException: Cannot invoke
> "org.apache.hadoop.hive.llap.cache.PathCache.touch(Object, String)" because
> "this.pathCache" is null
> at
> org.apache.hadoop.hive.llap.io.encoded.OrcEncodedDataReader.performDataRead(OrcEncodedDataReader.java:380)
>
> at
> org.apache.hadoop.hive.llap.io.encoded.OrcEncodedDataReader.lambda$callInternal$0(OrcEncodedDataReader.java:294)
>
> at
> java.base/java.security.AccessController.doPrivileged(AccessController.java:714)
>
> at java.base/javax.security.auth.Subject.doAs(Subject.java:525)
> at
> org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:1953)
>
> at
> org.apache.hadoop.hive.llap.io.encoded.OrcEncodedDataReader.callInternal(OrcEncodedDataReader.java:290)
>
> at
> org.apache.hadoop.hive.llap.io.encoded.OrcEncodedDataReader.callInternal(OrcEncodedDataReader.java:120)
>
> at org.apache.tez.common.CallableWithNdc.call(CallableWithNdc.java:36)
> at
> org.apache.hadoop.hive.llap.io.decode.EncodedDataConsumer$CpuRecordingCallable.call(EncodedDataConsumer.java:88)
>
> at
> org.apache.hadoop.hive.llap.io.decode.EncodedDataConsumer$CpuRecordingCallable.call(EncodedDataConsumer.java:73)
> ... 5 more{code}
--
This message was sent by Atlassian Jira
(v8.20.10#820010)