[
https://issues.apache.org/jira/browse/CARBONDATA-3954?page=com.atlassian.jira.plugin.system.issuetabpanels:all-tabpanel
]
xiaohui updated CARBONDATA-3954:
--------------------------------
Description:
ORC table SQL test:
create table array_orc(name string, col array<String>,fee int) STORED AS orc;
insert into array_orc values("xiao3",array('上呼吸道疾病 1','白内障1','胃溃疡1'),2);
insert into array_orc values("xiao3",array('上呼吸道疾病1 ','白内障1','胃溃疡1'),2);
insert into array_orc values("xiao3",array('上呼吸道疾病1','白内障 1','胃溃疡1'),2);
insert into array_orc values("xiao3",array('上呼吸道疾病1','白内障1','胃溃疡 1'),2);
insert into array_orc values("xiao3",array('上呼吸道疾病1','白内障1','胃溃疡1'),2);
insert into array_orc values("xiao5",array(null,'白内障1','胃溃疡1'),2);
insert into array_orc values("xiao5",null,2);
insert into array_orc values("xiao3",array('jjjjj'),2);
insert into array_orc values("xiao4",array('jjjjj','jjjjj'),2);
insert into array_orc values("xiao4",NULL,2);
0: jdbc:hive2://localhost:10000> use dict;
+---------+--+
| Result |
+---------+--+
+---------+--+
No rows selected (0.391 seconds)
0: jdbc:hive2://localhost:10000> select * from array_orc;
+--------+-------------------------------+------+--+
| name | col | fee |
+--------+-------------------------------+------+--+
| xiao3 | ["",null,"jkkkk"] | 3 |
| xiao2 | ["上呼吸道疾病1","白内障1","胃溃疡1"] | 2 |
| xiao3 | ["",null,"jkkkk"] | 3 |
| xiao1 | ["上呼吸道疾病","白内障","胃溃疡"] | 1 |
| xiao9 | NULL | 3 |
| xiao9 | NULL | 3 |
| xiao3 | NULL | 3 |
| xiao6 | NULL | 3 |
| xiao2 | ["上呼吸道疾病 1","白内障 1","胃溃疡 1"] | 2 |
| xiao1 | ["上呼吸道疾病 ","白内障 ","胃溃疡 "] | 1 |
| xiao3 | NULL | 3 |
| xiao3 | [null] | 3 |
| xiao3 | [""] | 3 |
+--------+-------------------------------+------+--+
13 rows selected (0.416 seconds)
0: jdbc:hive2://localhost:10000> create table array_carbon4(name string, col
array<String>,fee int) STORED AS carbondata TBLPROPERTIES
('SORT_COLUMNS'='name',
0: jdbc:hive2://localhost:10000> 'TABLE_BLOCKSIZE'='128',
0: jdbc:hive2://localhost:10000> 'TABLE_BLOCKLET_SIZE'='128',
0: jdbc:hive2://localhost:10000> 'SORT_SCOPE'='no_SORT');
+---------+--+
| Result |
+---------+--+
+---------+--+
No rows selected (1.04 seconds)
0: jdbc:hive2://localhost:10000> insert overwrite table array_carbon4 select
name,col,fee from array_orc;
+---------+--+
| Result |
+---------+--+
+---------+--+
No rows selected (5.065 seconds)
0: jdbc:hive2://localhost:10000> create table array_carbon5(name string, col
array<String>,fee int) STORED AS carbondata TBLPROPERTIES
('SORT_COLUMNS'='name',
0: jdbc:hive2://localhost:10000> 'TABLE_BLOCKSIZE'='128',
0: jdbc:hive2://localhost:10000> 'TABLE_BLOCKLET_SIZE'='128',
0: jdbc:hive2://localhost:10000> 'SORT_SCOPE'='global_SORT');
+---------+--+
| Result |
+---------+--+
+---------+--+
No rows selected (0.098 seconds)
0: jdbc:hive2://localhost:10000> insert overwrite table array_carbon5 select
name,col,fee from array_orc;
Error: java.lang.Exception: DataLoad failure (state=,code=0)
was:
orcdata
create table array_orc(name string, col array<String>,fee int) STORED AS orc;
insert into array_orc values("xiao3",array('上呼吸道疾病 1','白内障1','胃溃疡1'),2);
insert into array_orc values("xiao3",array('上呼吸道疾病1 ','白内障1','胃溃疡1'),2);
insert into array_orc values("xiao3",array('上呼吸道疾病1','白内障 1','胃溃疡1'),2);
insert into array_orc values("xiao3",array('上呼吸道疾病1','白内障1','胃溃疡 1'),2);
insert into array_orc values("xiao3",array('上呼吸道疾病1','白内障1','胃溃疡1'),2);
insert into array_orc values("xiao5",array(null,'白内障1','胃溃疡1'),2);
insert into array_orc values("xiao5",null,2);
insert into array_orc values("xiao3",array('jjjjj'),2);
insert into array_orc values("xiao4",array('jjjjj','jjjjj'),2);
insert into array_orc values("xiao4",NULL,2);
0: jdbc:hive2://localhost:10000> use dict;
+---------+--+
| Result |
+---------+--+
+---------+--+
No rows selected (0.391 seconds)
0: jdbc:hive2://localhost:10000> select * from array_orc;
+--------+-------------------------------+------+--+
| name | col | fee |
+--------+-------------------------------+------+--+
| xiao3 | ["",null,"jkkkk"] | 3 |
| xiao2 | ["上呼吸道疾病1","白内障1","胃溃疡1"] | 2 |
| xiao3 | ["",null,"jkkkk"] | 3 |
| xiao1 | ["上呼吸道疾病","白内障","胃溃疡"] | 1 |
| xiao9 | NULL | 3 |
| xiao9 | NULL | 3 |
| xiao3 | NULL | 3 |
| xiao6 | NULL | 3 |
| xiao2 | ["上呼吸道疾病 1","白内障 1","胃溃疡 1"] | 2 |
| xiao1 | ["上呼吸道疾病 ","白内障 ","胃溃疡 "] | 1 |
| xiao3 | NULL | 3 |
| xiao3 | [null] | 3 |
| xiao3 | [""] | 3 |
+--------+-------------------------------+------+--+
13 rows selected (0.416 seconds)
0: jdbc:hive2://localhost:10000> create table array_carbon4(name string, col
array<String>,fee int) STORED AS carbondata TBLPROPERTIES
('SORT_COLUMNS'='name',
0: jdbc:hive2://localhost:10000> 'TABLE_BLOCKSIZE'='128',
0: jdbc:hive2://localhost:10000> 'TABLE_BLOCKLET_SIZE'='128',
0: jdbc:hive2://localhost:10000> 'SORT_SCOPE'='no_SORT');
+---------+--+
| Result |
+---------+--+
+---------+--+
No rows selected (1.04 seconds)
0: jdbc:hive2://localhost:10000> insert overwrite table array_carbon4 select
name,col,fee from array_orc;
+---------+--+
| Result |
+---------+--+
+---------+--+
No rows selected (5.065 seconds)
0: jdbc:hive2://localhost:10000> create table array_carbon5(name string, col
array<String>,fee int) STORED AS carbondata TBLPROPERTIES
('SORT_COLUMNS'='name',
0: jdbc:hive2://localhost:10000> 'TABLE_BLOCKSIZE'='128',
0: jdbc:hive2://localhost:10000> 'TABLE_BLOCKLET_SIZE'='128',
0: jdbc:hive2://localhost:10000> 'SORT_SCOPE'='global_SORT');
+---------+--+
| Result |
+---------+--+
+---------+--+
No rows selected (0.098 seconds)
0: jdbc:hive2://localhost:10000> insert overwrite table array_carbon5 select
name,col,fee from array_orc;
Error: java.lang.Exception: DataLoad failure (state=,code=0)
> Loading an array column with global sort fails with a DataLoad error when reading from an ORC table and writing to a carbon table;
> the same load succeeds when SORT_SCOPE is no_sort
> --------------------------------------------------------------------------------------------------------
>
> Key: CARBONDATA-3954
> URL: https://issues.apache.org/jira/browse/CARBONDATA-3954
> Project: CarbonData
> Issue Type: Bug
> Components: spark-integration
> Affects Versions: 2.0.0
> Reporter: xiaohui
> Priority: Major
> Attachments: [email protected], [email protected]
>
>
> ORC table SQL test:
> create table array_orc(name string, col array<String>,fee int) STORED AS orc;
> insert into array_orc values("xiao3",array('上呼吸道疾病 1','白内障1','胃溃疡1'),2);
> insert into array_orc values("xiao3",array('上呼吸道疾病1 ','白内障1','胃溃疡1'),2);
> insert into array_orc values("xiao3",array('上呼吸道疾病1','白内障 1','胃溃疡1'),2);
> insert into array_orc values("xiao3",array('上呼吸道疾病1','白内障1','胃溃疡 1'),2);
> insert into array_orc values("xiao3",array('上呼吸道疾病1','白内障1','胃溃疡1'),2);
> insert into array_orc values("xiao5",array(null,'白内障1','胃溃疡1'),2);
> insert into array_orc values("xiao5",null,2);
> insert into array_orc values("xiao3",array('jjjjj'),2);
> insert into array_orc values("xiao4",array('jjjjj','jjjjj'),2);
> insert into array_orc values("xiao4",NULL,2);
> 0: jdbc:hive2://localhost:10000> use dict;
> +---------+--+
> | Result |
> +---------+--+
> +---------+--+
> No rows selected (0.391 seconds)
> 0: jdbc:hive2://localhost:10000> select * from array_orc;
> +--------+-------------------------------+------+--+
> | name | col | fee |
> +--------+-------------------------------+------+--+
> | xiao3 | ["",null,"jkkkk"] | 3 |
> | xiao2 | ["上呼吸道疾病1","白内障1","胃溃疡1"] | 2 |
> | xiao3 | ["",null,"jkkkk"] | 3 |
> | xiao1 | ["上呼吸道疾病","白内障","胃溃疡"] | 1 |
> | xiao9 | NULL | 3 |
> | xiao9 | NULL | 3 |
> | xiao3 | NULL | 3 |
> | xiao6 | NULL | 3 |
> | xiao2 | ["上呼吸道疾病 1","白内障 1","胃溃疡 1"] | 2 |
> | xiao1 | ["上呼吸道疾病 ","白内障 ","胃溃疡 "] | 1 |
> | xiao3 | NULL | 3 |
> | xiao3 | [null] | 3 |
> | xiao3 | [""] | 3 |
> +--------+-------------------------------+------+--+
> 13 rows selected (0.416 seconds)
> 0: jdbc:hive2://localhost:10000> create table array_carbon4(name string, col
> array<String>,fee int) STORED AS carbondata TBLPROPERTIES
> ('SORT_COLUMNS'='name',
> 0: jdbc:hive2://localhost:10000> 'TABLE_BLOCKSIZE'='128',
> 0: jdbc:hive2://localhost:10000> 'TABLE_BLOCKLET_SIZE'='128',
> 0: jdbc:hive2://localhost:10000> 'SORT_SCOPE'='no_SORT');
> +---------+--+
> | Result |
> +---------+--+
> +---------+--+
> No rows selected (1.04 seconds)
> 0: jdbc:hive2://localhost:10000> insert overwrite table array_carbon4 select
> name,col,fee from array_orc;
> +---------+--+
> | Result |
> +---------+--+
> +---------+--+
> No rows selected (5.065 seconds)
> 0: jdbc:hive2://localhost:10000> create table array_carbon5(name string, col
> array<String>,fee int) STORED AS carbondata TBLPROPERTIES
> ('SORT_COLUMNS'='name',
> 0: jdbc:hive2://localhost:10000> 'TABLE_BLOCKSIZE'='128',
> 0: jdbc:hive2://localhost:10000> 'TABLE_BLOCKLET_SIZE'='128',
> 0: jdbc:hive2://localhost:10000> 'SORT_SCOPE'='global_SORT');
> +---------+--+
> | Result |
> +---------+--+
> +---------+--+
> No rows selected (0.098 seconds)
> 0: jdbc:hive2://localhost:10000> insert overwrite table array_carbon5 select
> name,col,fee from array_orc;
> Error: java.lang.Exception: DataLoad failure (state=,code=0)
--
This message was sent by Atlassian Jira
(v8.3.4#803005)