nyq created IMPALA-13161:
----------------------------

             Summary: impalad crash -- 
impala::DelimitedTextParser<true>::ParseFieldLocations
                 Key: IMPALA-13161
                 URL: https://issues.apache.org/jira/browse/IMPALA-13161
             Project: IMPALA
          Issue Type: Bug
          Components: be
    Affects Versions: Impala 4.0.0
            Reporter: nyq


Impala version: 4.0.0

 

Problem:

impalad crashes when querying a text table that has a 3 GB data file 
containing only '\x00' characters.

 

Steps to reproduce:

python -c 'f=open("impala_0_3gb.data.csv", "wb");tmp="\x00"*1024*1024*3; 
[f.write(tmp) for i in range(1024)] ;f.close()'

create table impala_0_3gb (id int)

hdfs dfs -put impala_0_3gb.data.csv /user/hive/warehouse/impala_0_3gb/

refresh impala_0_3gb

select count(1) from impala_0_3gb

 

Errors:

Wrote minidump to 1dcf110f-5a2e-49a2-be4eb7a5-4709ed19.dmp

#

# A fatal error has been detected by the Java Runtime Environment:

#

#  SIGSEGV (0xb) at pc=0x000000000181861c, pid=956182, tid=0x00007fc6b340e700

#

# JRE version: OpenJDK Runtime Environment (8.0) (build 1.8.0)

# Java VM: OpenJDK 64-Bit Server VM

# Problematic frame:

# C  [impalad+0x141861c]  
impala::DelimitedTextParser<true>::ParseFieldLocations(int, long, char**, 
char**, impala::FieldLocation*, int*, int*, char**)+0x7cc

#

# Failed to write core dump. Core dumps have been disabled. To enable core 
dumping, try "ulimit -c unlimited" before starting Java again

#

# An error report file with more information is saved as:

# /tmp/hs_err_pid956182.log

#

#

 

 

C  [impalad+0x141861c]  
impala::DelimitedTextParser<true>::ParseFieldLocations(int, long, char**, 
char**, impala::FieldLocation*, int*, int*, char**)+0x7cc

C  [impalad+0x136fe11]  
impala::HdfsTextScanner::ProcessRange(impala::RowBatch*, int*)+0x1a1

C  [impalad+0x137100e]  
impala::HdfsTextScanner::FinishScanRange(impala::RowBatch*)+0x3be

C  [impalad+0x13721ac]  
impala::HdfsTextScanner::GetNextInternal(impala::RowBatch*)+0x12c

C  [impalad+0x131cdfc]  impala::HdfsScanner::ProcessSplit()+0x19c

C  [impalad+0x1443e17]  
impala::HdfsScanNode::ProcessSplit(std::vector<impala::FilterContext, 
std::allocator<impala::FilterContext> > const&, impala::MemPool*, 
impala::io::ScanRange*, long*)+0x7e7

C  [impalad+0x1447001]  impala::HdfsScanNode::ScannerThread(bool, long)+0x541

 



--
This message was sent by Atlassian Jira
(v8.20.10#820010)

Reply via email to