xuchuanyin created CARBONDATA-2799:
--------------------------------------
Summary: Query failed with bloom datamap on preagg table with
dictionary column
Key: CARBONDATA-2799
URL: https://issues.apache.org/jira/browse/CARBONDATA-2799
Project: CarbonData
Issue Type: Bug
Reporter: xuchuanyin
Assignee: xuchuanyin
Steps to reproduce:
CREATE TABLE datamap_test (id int,name string,salary float,dob date)STORED BY
'carbondata' TBLPROPERTIES('dictionary_include'='id');
LOAD DATA INPATH 'hdfs://hacluster/user/surbhi/datamap_test.csv' into table
datamap_test OPTIONS('DELIMITER'=',',
'QUOTECHAR'='"','BAD_RECORDS_ACTION'='FORCE','FILEHEADER'='id,name,salary,dob');
LOAD DATA INPATH 'hdfs://hacluster/user/surbhi/datamap_test.csv' into table
datamap_test OPTIONS('DELIMITER'=',',
'QUOTECHAR'='"','BAD_RECORDS_ACTION'='FORCE','FILEHEADER'='id,name,salary,dob');
LOAD DATA INPATH 'hdfs://hacluster/user/surbhi/datamap_test.csv' into table
datamap_test OPTIONS('DELIMITER'=',',
'QUOTECHAR'='"','BAD_RECORDS_ACTION'='FORCE','FILEHEADER'='id,name,salary,dob');
CREATE DATAMAP dm_datamap_test2 ON TABLE datamap_test USING 'bloomfilter'
DMPROPERTIES ('INDEX_COLUMNS' = 'id', 'BLOOM_SIZE'='320000',
'BLOOM_FPP'='0.01', 'BLOOM_COMPRESS'='true');
LOAD DATA INPATH 'hdfs://hacluster/user/surbhi/datamap_test.csv' into table
datamap_test OPTIONS('DELIMITER'=',',
'QUOTECHAR'='"','BAD_RECORDS_ACTION'='FORCE','FILEHEADER'='id,name,salary,dob');
create datamap datamap_preaggr ON TABLE datamap_test USING "preaggregate" as
select id,count(id) from datamap_test group by id;
create datamap dm_preag_bloom_cust_id on table datamap_test_datamap_preaggr
using 'bloomfilter' dmproperties('index_columns'='datamap_test_id');
select id,count(id) from datamap_test where id = 12 group by id;
QUERY FAILED: Error:
org.apache.spark.sql.catalyst.errors.package$TreeNodeException: execute, tree:
drop datamap dm_preag_bloom_cust_id on table datamap_test_datamap_preaggr;
select id,count(id) from datamap_test where id = 12 group by id;
QUERY OK
create datamap dm_preag_bloom_cust_id on table datamap_test_datamap_preaggr
using 'bloomfilter' dmproperties('index_columns'='datamap_test_id');
drop datamap dm_preag_bloom_cust_id on table datamap_test_datamap_preaggr;
select id,count(id) from datamap_test where id = 12 group by id;
QUERY FAILED: Error: org.apache.spark.SparkException: Job aborted due to stage
failure: Task 0 in stage 117.0 failed 4 times
--
This message was sent by Atlassian JIRA
(v7.6.3#76005)