HIVE-18079 : Statistics: Allow HyperLogLog to be merged to the 
lowest-common-denominator bit-size (Gopal V via Prasanth J)

Signed-off-by: Ashutosh Chauhan <[email protected]>


Project: http://git-wip-us.apache.org/repos/asf/hive/repo
Commit: http://git-wip-us.apache.org/repos/asf/hive/commit/13960aa9
Tree: http://git-wip-us.apache.org/repos/asf/hive/tree/13960aa9
Diff: http://git-wip-us.apache.org/repos/asf/hive/diff/13960aa9

Branch: refs/heads/master
Commit: 13960aa999aeeba5105fd64fef79dc6ed2fbe220
Parents: 5aa8f87
Author: Gopal V <[email protected]>
Authored: Sat Dec 2 21:20:00 2017 -0800
Committer: Ashutosh Chauhan <[email protected]>
Committed: Thu Jun 7 22:59:43 2018 -0700

----------------------------------------------------------------------
 .../clientpositive/autoColumnStats_2.q.out      |   16 +-
 .../clientpositive/autoColumnStats_9.q.out      |    4 +-
 .../test/results/clientpositive/bitvector.q.out |    2 +-
 .../clientpositive/compute_stats_date.q.out     |    2 +-
 .../confirm_initial_tbl_stats.q.out             |   14 +-
 .../clientpositive/cross_join_merge.q.out       |   80 +-
 .../results/clientpositive/describe_table.q.out |    4 +-
 .../encrypted/encryption_move_tbl.q.out         |    4 +-
 ql/src/test/results/clientpositive/hll.q.out    |    6 +-
 .../clientpositive/llap/autoColumnStats_2.q.out |   16 +-
 .../clientpositive/llap/auto_join1.q.out        |    8 +-
 .../clientpositive/llap/auto_join21.q.out       |   10 +-
 .../clientpositive/llap/auto_join29.q.out       |   90 +-
 .../clientpositive/llap/auto_join30.q.out       |   16 +-
 .../llap/auto_sortmerge_join_6.q.out            |  558 ++--
 .../clientpositive/llap/bucket_groupby.q.out    |   16 +-
 .../llap/bucket_map_join_tez1.q.out             |  198 +-
 .../llap/bucket_map_join_tez2.q.out             |  312 +-
 .../clientpositive/llap/check_constraint.q.out  |    4 +-
 .../llap/correlationoptimizer1.q.out            |   86 +-
 .../llap/correlationoptimizer2.q.out            |   20 +-
 .../llap/correlationoptimizer3.q.out            |   68 +-
 .../llap/correlationoptimizer6.q.out            |  148 +-
 .../clientpositive/llap/cross_join.q.out        |    8 +-
 .../llap/dynamic_semijoin_reduction.q.out       |    8 +-
 .../llap/dynamic_semijoin_reduction_sw.q.out    |    8 +-
 .../llap/dynamic_semijoin_user_level.q.out      |    8 +-
 .../clientpositive/llap/explainanalyze_2.q.out  | 1455 ++++-----
 .../clientpositive/llap/explainuser_1.q.out     |   44 +-
 .../clientpositive/llap/explainuser_2.q.out     | 2788 +++++++++---------
 .../clientpositive/llap/explainuser_4.q.out     |   14 +-
 .../results/clientpositive/llap/groupby1.q.out  |    6 +-
 .../results/clientpositive/llap/groupby2.q.out  |   10 +-
 .../llap/groupby_resolution.q.out               |   16 +-
 .../llap/hybridgrace_hashjoin_1.q.out           |   12 +-
 .../llap/hybridgrace_hashjoin_2.q.out           |   24 +-
 .../results/clientpositive/llap/join1.q.out     |    8 +-
 .../clientpositive/llap/join32_lessSize.q.out   |  173 +-
 .../llap/join_max_hashtable.q.out               |   32 +-
 .../llap/limit_join_transpose.q.out             |    8 +-
 .../clientpositive/llap/limit_pushdown.q.out    |   14 +-
 .../clientpositive/llap/limit_pushdown3.q.out   |   34 +-
 .../llap/llap_vector_nohybridgrace.q.out        |    4 +-
 .../clientpositive/llap/llapdecider.q.out       |   64 +-
 .../clientpositive/llap/mapjoin_decimal.q.out   |    8 +-
 .../clientpositive/llap/mapjoin_mapjoin.q.out   |   18 +-
 .../test/results/clientpositive/llap/mrr.q.out  |   42 +-
 .../clientpositive/llap/multiMapJoin2.q.out     |   58 +-
 .../llap/offset_limit_ppd_optimizer.q.out       |   18 +-
 .../clientpositive/llap/partialdhj.q.out        |    8 +-
 .../clientpositive/llap/quotedid_smb.q.out      |    4 +-
 .../llap/reduce_deduplicate_extended.q.out      |   58 +-
 .../clientpositive/llap/results_cache_1.q.out   |    4 +-
 .../llap/results_cache_lifetime.q.out           |    2 +-
 .../results/clientpositive/llap/semijoin.q.out  |    4 +-
 .../clientpositive/llap/semijoin_hint.q.out     |   26 +-
 .../clientpositive/llap/sharedworkext.q.out     |   62 +-
 .../results/clientpositive/llap/skewjoin.q.out  |   14 +-
 .../clientpositive/llap/smb_mapjoin_6.q.out     |   12 +-
 .../clientpositive/llap/subquery_corr.q.out     |   12 +-
 .../clientpositive/llap/subquery_exists.q.out   |    8 +-
 .../clientpositive/llap/subquery_in.q.out       |   52 +-
 .../llap/subquery_in_having.q.out               |   32 +-
 .../clientpositive/llap/subquery_multi.q.out    |   24 +-
 .../clientpositive/llap/subquery_notin.q.out    |   36 +-
 .../clientpositive/llap/subquery_scalar.q.out   |   16 +-
 .../clientpositive/llap/subquery_select.q.out   |   12 +-
 .../clientpositive/llap/subquery_views.q.out    |   18 +-
 .../llap/tez_bmj_schema_evolution.q.out         |    8 +-
 .../llap/tez_dynpart_hashjoin_2.q.out           |   24 +-
 .../clientpositive/llap/tez_join_hash.q.out     |   22 +-
 .../clientpositive/llap/tez_join_tests.q.out    |   12 +-
 .../clientpositive/llap/tez_joins_explain.q.out |   12 +-
 .../clientpositive/llap/tez_smb_main.q.out      |    4 +-
 .../results/clientpositive/llap/tez_union.q.out |   64 +-
 .../clientpositive/llap/tez_union2.q.out        |   16 +-
 .../llap/tez_union_multiinsert.q.out            |   24 +-
 .../llap/tez_vector_dynpart_hashjoin_2.q.out    |   24 +-
 .../clientpositive/llap/unionDistinct_1.q.out   |   38 +-
 .../clientpositive/llap/unionDistinct_3.q.out   |   48 +-
 .../clientpositive/llap/union_fast_stats.q.out  |    8 +-
 .../clientpositive/llap/union_top_level.q.out   |   16 +-
 .../llap/vector_cast_constant.q.out             |   12 +-
 .../llap/vector_count_distinct.q.out            |    6 +-
 .../llap/vector_groupby_mapjoin.q.out           |    4 +-
 .../llap/vector_groupby_reduce.q.out            |   26 +-
 .../llap/vector_left_outer_join.q.out           |    4 +-
 .../llap/vector_llap_text_1.q.out               |    8 +-
 .../clientpositive/llap/vectorization_0.q.out   |   14 +-
 .../llap/vectorization_div0.q.out               |    8 +-
 .../vectorization_input_format_excludes.q.out   |   40 +-
 .../llap/vectorization_limit.q.out              |   34 +-
 .../llap/vectorization_short_regress.q.out      |   26 +-
 .../llap/vectorized_context.q.out               |   10 +-
 .../llap/vectorized_distinct_gby.q.out          |    8 +-
 .../llap/vectorized_mapjoin.q.out               |    4 +-
 .../llap/vectorized_nested_mapjoin.q.out        |    6 +-
 .../llap/vectorized_parquet.q.out               |   10 +-
 .../llap/vectorized_shufflejoin.q.out           |    4 +-
 .../clientpositive/mapjoin_mapjoin.q.out        |   30 +-
 .../spark/bucket_map_join_tez1.q.out            |   76 +-
 .../spark/bucket_map_join_tez2.q.out            |  208 +-
 .../clientpositive/spark/join32_lessSize.q.out  |   90 +-
 .../clientpositive/spark/mapjoin_mapjoin.q.out  |   26 +-
 .../spark/spark_explainuser_1.q.out             |   44 +-
 .../clientpositive/tez/explainanalyze_1.q.out   |   14 +-
 .../clientpositive/tez/explainanalyze_3.q.out   |    4 +-
 .../clientpositive/tez/explainanalyze_4.q.out   |   12 +-
 .../clientpositive/tez/explainanalyze_5.q.out   |    6 +-
 .../clientpositive/tez/explainuser_3.q.out      |    4 +-
 .../tez/hybridgrace_hashjoin_1.q.out            |   12 +-
 .../tez/hybridgrace_hashjoin_2.q.out            |   24 +-
 .../results/clientpositive/tez/tez-tag.q.out    |    2 +-
 .../ndv/NumDistinctValueEstimatorFactory.java   |    7 +-
 .../hive/common/ndv/hll/HLLDenseRegister.java   |   25 +
 .../hive/common/ndv/hll/HLLSparseRegister.java  |   13 +
 .../hadoop/hive/common/ndv/hll/HyperLogLog.java |   63 +-
 .../hive/common/ndv/hll/HyperLogLogUtils.java   |   19 +-
 .../hive/common/ndv/hll/TestHyperLogLog.java    |  124 +-
 .../common/ndv/hll/TestHyperLogLogMerge.java    |  147 +
 120 files changed, 4444 insertions(+), 4018 deletions(-)
----------------------------------------------------------------------


http://git-wip-us.apache.org/repos/asf/hive/blob/13960aa9/ql/src/test/results/clientpositive/autoColumnStats_2.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/autoColumnStats_2.q.out 
b/ql/src/test/results/clientpositive/autoColumnStats_2.q.out
index b9c6835..854c779 100644
--- a/ql/src/test/results/clientpositive/autoColumnStats_2.q.out
+++ b/ql/src/test/results/clientpositive/autoColumnStats_2.q.out
@@ -129,7 +129,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              0                                                       
                                         
-distinct_count         309                                                     
                                         
+distinct_count         316                                                     
                                         
 avg_col_len            2.812                                                   
                                         
 max_col_len            3                                                       
                                         
 num_trues                                                                      
                                         
@@ -148,7 +148,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              0                                                       
                                         
-distinct_count         309                                                     
                                         
+distinct_count         316                                                     
                                         
 avg_col_len            2.812                                                   
                                         
 max_col_len            3                                                       
                                         
 num_trues                                                                      
                                         
@@ -253,7 +253,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              0                                                       
                                         
-distinct_count         309                                                     
                                         
+distinct_count         316                                                     
                                         
 avg_col_len            2.812                                                   
                                         
 max_col_len            3                                                       
                                         
 num_trues                                                                      
                                         
@@ -272,7 +272,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              0                                                       
                                         
-distinct_count         309                                                     
                                         
+distinct_count         307                                                     
                                         
 avg_col_len            6.812                                                   
                                         
 max_col_len            7                                                       
                                         
 num_trues                                                                      
                                         
@@ -301,7 +301,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              10                                                      
                                         
-distinct_count         309                                                     
                                         
+distinct_count         316                                                     
                                         
 avg_col_len            2.812                                                   
                                         
 max_col_len            3                                                       
                                         
 num_trues                                                                      
                                         
@@ -320,7 +320,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              10                                                      
                                         
-distinct_count         309                                                     
                                         
+distinct_count         307                                                     
                                         
 avg_col_len            6.812                                                   
                                         
 max_col_len            7                                                       
                                         
 num_trues                                                                      
                                         
@@ -349,7 +349,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              20                                                      
                                         
-distinct_count         309                                                     
                                         
+distinct_count         316                                                     
                                         
 avg_col_len            2.812                                                   
                                         
 max_col_len            3                                                       
                                         
 num_trues                                                                      
                                         
@@ -368,7 +368,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              10                                                      
                                         
-distinct_count         319                                                     
                                         
+distinct_count         316                                                     
                                         
 avg_col_len            8.0                                                     
                                         
 max_col_len            8                                                       
                                         
 num_trues                                                                      
                                         

http://git-wip-us.apache.org/repos/asf/hive/blob/13960aa9/ql/src/test/results/clientpositive/autoColumnStats_9.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/autoColumnStats_9.q.out 
b/ql/src/test/results/clientpositive/autoColumnStats_9.q.out
index 898598f..f2a8cdc 100644
--- a/ql/src/test/results/clientpositive/autoColumnStats_9.q.out
+++ b/ql/src/test/results/clientpositive/autoColumnStats_9.q.out
@@ -253,7 +253,7 @@ data_type                   int
 min                    0                                                       
                                         
 max                    498                                                     
                                         
 num_nulls              0                                                       
                                         
-distinct_count         309                                                     
                                         
+distinct_count         303                                                     
                                         
 avg_col_len                                                                    
                                         
 max_col_len                                                                    
                                         
 num_trues                                                                      
                                         
@@ -272,7 +272,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              0                                                       
                                         
-distinct_count         309                                                     
                                         
+distinct_count         307                                                     
                                         
 avg_col_len            6.834630350194552                                       
                                         
 max_col_len            7                                                       
                                         
 num_trues                                                                      
                                         

http://git-wip-us.apache.org/repos/asf/hive/blob/13960aa9/ql/src/test/results/clientpositive/bitvector.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/bitvector.q.out 
b/ql/src/test/results/clientpositive/bitvector.q.out
index 1e0284f..e310ebe 100644
--- a/ql/src/test/results/clientpositive/bitvector.q.out
+++ b/ql/src/test/results/clientpositive/bitvector.q.out
@@ -9,7 +9,7 @@ data_type               string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              0                                                       
                                         
-distinct_count         309                                                     
                                         
+distinct_count         316                                                     
                                         
 avg_col_len            2.812                                                   
                                         
 max_col_len            3                                                       
                                         
 num_trues                                                                      
                                         

http://git-wip-us.apache.org/repos/asf/hive/blob/13960aa9/ql/src/test/results/clientpositive/compute_stats_date.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/compute_stats_date.q.out 
b/ql/src/test/results/clientpositive/compute_stats_date.q.out
index 35c0f8d..58d2d70 100644
--- a/ql/src/test/results/clientpositive/compute_stats_date.q.out
+++ b/ql/src/test/results/clientpositive/compute_stats_date.q.out
@@ -43,7 +43,7 @@ POSTHOOK: query: select compute_stats(fl_date, 'hll') from 
tab_date
 POSTHOOK: type: QUERY
 POSTHOOK: Input: default@tab_date
 #### A masked pattern was here ####
-{"columntype":"Date","min":"2000-11-20","max":"2010-10-29","countnulls":0,"numdistinctvalues":19,"ndvbitvector":HLL����!���]����������������Y���T��P��R������W���
�ĈN������������}
+{"columntype":"Date","min":"2000-11-20","max":"2010-10-29","countnulls":0,"numdistinctvalues":19,"ndvbitvector":HLL�Ǫ����!���]����������������Y���T���P��R������W���
�ĈN������������}
 PREHOOK: query: explain
 analyze table tab_date compute statistics for columns fl_date
 PREHOOK: type: ANALYZE_TABLE

http://git-wip-us.apache.org/repos/asf/hive/blob/13960aa9/ql/src/test/results/clientpositive/confirm_initial_tbl_stats.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/confirm_initial_tbl_stats.q.out 
b/ql/src/test/results/clientpositive/confirm_initial_tbl_stats.q.out
index a900194..3d64168 100644
--- a/ql/src/test/results/clientpositive/confirm_initial_tbl_stats.q.out
+++ b/ql/src/test/results/clientpositive/confirm_initial_tbl_stats.q.out
@@ -19,7 +19,7 @@ data_type             string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              0                                                       
                                         
-distinct_count         309                                                     
                                         
+distinct_count         316                                                     
                                         
 avg_col_len            2.812                                                   
                                         
 max_col_len            3                                                       
                                         
 num_trues                                                                      
                                         
@@ -105,7 +105,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              0                                                       
                                         
-distinct_count         309                                                     
                                         
+distinct_count         307                                                     
                                         
 avg_col_len            6.812                                                   
                                         
 max_col_len            7                                                       
                                         
 num_trues                                                                      
                                         
@@ -134,7 +134,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              0                                                       
                                         
-distinct_count         430                                                     
                                         
+distinct_count         431                                                     
                                         
 avg_col_len            6.802                                                   
                                         
 max_col_len            7                                                       
                                         
 num_trues                                                                      
                                         
@@ -163,7 +163,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              0                                                       
                                         
-distinct_count         309                                                     
                                         
+distinct_count         307                                                     
                                         
 avg_col_len            6.812                                                   
                                         
 max_col_len            7                                                       
                                         
 num_trues                                                                      
                                         
@@ -199,7 +199,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              0                                                       
                                         
-distinct_count         309                                                     
                                         
+distinct_count         316                                                     
                                         
 avg_col_len            2.812                                                   
                                         
 max_col_len            3                                                       
                                         
 num_trues                                                                      
                                         
@@ -237,7 +237,7 @@ data_type                   tinyint
 min                    -64                                                     
                                         
 max                    62                                                      
                                         
 num_nulls              3115                                                    
                                         
-distinct_count         127                                                     
                                         
+distinct_count         130                                                     
                                         
 avg_col_len                                                                    
                                         
 max_col_len                                                                    
                                         
 num_trues                                                                      
                                         
@@ -275,7 +275,7 @@ data_type                   timestamp
 min                    -30                                                     
                                         
 max                    31                                                      
                                         
 num_nulls              3115                                                    
                                         
-distinct_count         35                                                      
                                         
+distinct_count         36                                                      
                                         
 avg_col_len                                                                    
                                         
 max_col_len                                                                    
                                         
 num_trues                                                                      
                                         

http://git-wip-us.apache.org/repos/asf/hive/blob/13960aa9/ql/src/test/results/clientpositive/cross_join_merge.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/cross_join_merge.q.out 
b/ql/src/test/results/clientpositive/cross_join_merge.q.out
index 84d78f3..3389638 100644
--- a/ql/src/test/results/clientpositive/cross_join_merge.q.out
+++ b/ql/src/test/results/clientpositive/cross_join_merge.q.out
@@ -233,7 +233,7 @@ STAGE PLANS:
       Processor Tree:
         ListSink
 
-Warning: Shuffle Join JOIN[11][tables = [$hdt$_0, $hdt$_1]] in Stage 
'Stage-1:MAPRED' is a cross product
+Warning: Shuffle Join JOIN[14][tables = [$hdt$_0, $hdt$_1, $hdt$_2]] in Stage 
'Stage-2:MAPRED' is a cross product
 PREHOOK: query: explain
 select src1.key from src src1 join src src2 on 5 = src2.key join src src3 on 
src1.key=src3.key
 PREHOOK: type: QUERY
@@ -250,7 +250,7 @@ STAGE PLANS:
     Map Reduce
       Map Operator Tree:
           TableScan
-            alias: src3
+            alias: src1
             Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE 
Column stats: NONE
             Filter Operator
               predicate: key is not null (type: boolean)
@@ -260,29 +260,34 @@ STAGE PLANS:
                 outputColumnNames: _col0
                 Statistics: Num rows: 500 Data size: 5312 Basic stats: 
COMPLETE Column stats: NONE
                 Reduce Output Operator
-                  sort order: 
+                  key expressions: _col0 (type: string)
+                  sort order: +
+                  Map-reduce partition columns: _col0 (type: string)
                   Statistics: Num rows: 500 Data size: 5312 Basic stats: 
COMPLETE Column stats: NONE
-                  value expressions: _col0 (type: string)
           TableScan
-            alias: src2
+            alias: src3
             Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE 
Column stats: NONE
             Filter Operator
-              predicate: (UDFToDouble(key) = 5.0D) (type: boolean)
-              Statistics: Num rows: 250 Data size: 2656 Basic stats: COMPLETE 
Column stats: NONE
+              predicate: key is not null (type: boolean)
+              Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE 
Column stats: NONE
               Select Operator
-                Statistics: Num rows: 250 Data size: 2656 Basic stats: 
COMPLETE Column stats: NONE
+                expressions: key (type: string)
+                outputColumnNames: _col0
+                Statistics: Num rows: 500 Data size: 5312 Basic stats: 
COMPLETE Column stats: NONE
                 Reduce Output Operator
-                  sort order: 
-                  Statistics: Num rows: 250 Data size: 2656 Basic stats: 
COMPLETE Column stats: NONE
+                  key expressions: _col0 (type: string)
+                  sort order: +
+                  Map-reduce partition columns: _col0 (type: string)
+                  Statistics: Num rows: 500 Data size: 5312 Basic stats: 
COMPLETE Column stats: NONE
       Reduce Operator Tree:
         Join Operator
           condition map:
                Inner Join 0 to 1
           keys:
-            0 
-            1 
+            0 _col0 (type: string)
+            1 _col0 (type: string)
           outputColumnNames: _col0
-          Statistics: Num rows: 125000 Data size: 2781000 Basic stats: 
COMPLETE Column stats: NONE
+          Statistics: Num rows: 550 Data size: 5843 Basic stats: COMPLETE 
Column stats: NONE
           File Output Operator
             compressed: false
             table:
@@ -295,45 +300,36 @@ STAGE PLANS:
       Map Operator Tree:
           TableScan
             Reduce Output Operator
-              key expressions: _col0 (type: string)
-              sort order: +
-              Map-reduce partition columns: _col0 (type: string)
-              Statistics: Num rows: 125000 Data size: 2781000 Basic stats: 
COMPLETE Column stats: NONE
+              sort order: 
+              Statistics: Num rows: 550 Data size: 5843 Basic stats: COMPLETE 
Column stats: NONE
+              value expressions: _col0 (type: string)
           TableScan
-            alias: src1
+            alias: src2
             Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE 
Column stats: NONE
             Filter Operator
-              predicate: key is not null (type: boolean)
-              Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE 
Column stats: NONE
+              predicate: (UDFToDouble(key) = 5.0D) (type: boolean)
+              Statistics: Num rows: 250 Data size: 2656 Basic stats: COMPLETE 
Column stats: NONE
               Select Operator
-                expressions: key (type: string)
-                outputColumnNames: _col0
-                Statistics: Num rows: 500 Data size: 5312 Basic stats: 
COMPLETE Column stats: NONE
+                Statistics: Num rows: 250 Data size: 2656 Basic stats: 
COMPLETE Column stats: NONE
                 Reduce Output Operator
-                  key expressions: _col0 (type: string)
-                  sort order: +
-                  Map-reduce partition columns: _col0 (type: string)
-                  Statistics: Num rows: 500 Data size: 5312 Basic stats: 
COMPLETE Column stats: NONE
+                  sort order: 
+                  Statistics: Num rows: 250 Data size: 2656 Basic stats: 
COMPLETE Column stats: NONE
       Reduce Operator Tree:
         Join Operator
           condition map:
                Inner Join 0 to 1
           keys:
-            0 _col0 (type: string)
-            1 _col0 (type: string)
-          outputColumnNames: _col2
-          Statistics: Num rows: 137500 Data size: 3059100 Basic stats: 
COMPLETE Column stats: NONE
-          Select Operator
-            expressions: _col2 (type: string)
-            outputColumnNames: _col0
-            Statistics: Num rows: 137500 Data size: 3059100 Basic stats: 
COMPLETE Column stats: NONE
-            File Output Operator
-              compressed: false
-              Statistics: Num rows: 137500 Data size: 3059100 Basic stats: 
COMPLETE Column stats: NONE
-              table:
-                  input format: 
org.apache.hadoop.mapred.SequenceFileInputFormat
-                  output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
-                  serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+            0 
+            1 
+          outputColumnNames: _col0
+          Statistics: Num rows: 137500 Data size: 3059050 Basic stats: 
COMPLETE Column stats: NONE
+          File Output Operator
+            compressed: false
+            Statistics: Num rows: 137500 Data size: 3059050 Basic stats: 
COMPLETE Column stats: NONE
+            table:
+                input format: org.apache.hadoop.mapred.SequenceFileInputFormat
+                output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
+                serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
 
   Stage: Stage-0
     Fetch Operator

http://git-wip-us.apache.org/repos/asf/hive/blob/13960aa9/ql/src/test/results/clientpositive/describe_table.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/describe_table.q.out 
b/ql/src/test/results/clientpositive/describe_table.q.out
index d88424f..8c7a16c 100644
--- a/ql/src/test/results/clientpositive/describe_table.q.out
+++ b/ql/src/test/results/clientpositive/describe_table.q.out
@@ -206,7 +206,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              0                                                       
                                         
-distinct_count         309                                                     
                                         
+distinct_count         316                                                     
                                         
 avg_col_len            2.812                                                   
                                         
 max_col_len            3                                                       
                                         
 num_trues                                                                      
                                         
@@ -304,7 +304,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              0                                                       
                                         
-distinct_count         309                                                     
                                         
+distinct_count         316                                                     
                                         
 avg_col_len            2.812                                                   
                                         
 max_col_len            3                                                       
                                         
 num_trues                                                                      
                                         

http://git-wip-us.apache.org/repos/asf/hive/blob/13960aa9/ql/src/test/results/clientpositive/encrypted/encryption_move_tbl.q.out
----------------------------------------------------------------------
diff --git 
a/ql/src/test/results/clientpositive/encrypted/encryption_move_tbl.q.out 
b/ql/src/test/results/clientpositive/encrypted/encryption_move_tbl.q.out
index a63cd86..b73f3ac 100644
--- a/ql/src/test/results/clientpositive/encrypted/encryption_move_tbl.q.out
+++ b/ql/src/test/results/clientpositive/encrypted/encryption_move_tbl.q.out
@@ -66,7 +66,7 @@ data_type             int
 min                    0                                                       
                                         
 max                    498                                                     
                                         
 num_nulls              0                                                       
                                         
-distinct_count         309                                                     
                                         
+distinct_count         303                                                     
                                         
 avg_col_len                                                                    
                                         
 max_col_len                                                                    
                                         
 num_trues                                                                      
                                         
@@ -85,7 +85,7 @@ data_type             string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              0                                                       
                                         
-distinct_count         309                                                     
                                         
+distinct_count         307                                                     
                                         
 avg_col_len            6.812                                                   
                                         
 max_col_len            7                                                       
                                         
 num_trues                                                                      
                                         

http://git-wip-us.apache.org/repos/asf/hive/blob/13960aa9/ql/src/test/results/clientpositive/hll.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/hll.q.out 
b/ql/src/test/results/clientpositive/hll.q.out
index 12f6a36..4b445ea 100644
--- a/ql/src/test/results/clientpositive/hll.q.out
+++ b/ql/src/test/results/clientpositive/hll.q.out
@@ -182,7 +182,7 @@ data_type                   int
 min                    0                                                       
                                         
 max                    498                                                     
                                         
 num_nulls              0                                                       
                                         
-distinct_count         309                                                     
                                         
+distinct_count         303                                                     
                                         
 avg_col_len                                                                    
                                         
 max_col_len                                                                    
                                         
 num_trues                                                                      
                                         
@@ -236,7 +236,7 @@ data_type                   double
 min                    0.0                                                     
                                         
 max                    498.0                                                   
                                         
 num_nulls              0                                                       
                                         
-distinct_count         309                                                     
                                         
+distinct_count         316                                                     
                                         
 avg_col_len                                                                    
                                         
 max_col_len                                                                    
                                         
 num_trues                                                                      
                                         
@@ -290,7 +290,7 @@ data_type                   decimal(10,0)
 min                    0                                                       
                                         
 max                    498                                                     
                                         
 num_nulls              0                                                       
                                         
-distinct_count         309                                                     
                                         
+distinct_count         316                                                     
                                         
 avg_col_len                                                                    
                                         
 max_col_len                                                                    
                                         
 num_trues                                                                      
                                         

http://git-wip-us.apache.org/repos/asf/hive/blob/13960aa9/ql/src/test/results/clientpositive/llap/autoColumnStats_2.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/llap/autoColumnStats_2.q.out 
b/ql/src/test/results/clientpositive/llap/autoColumnStats_2.q.out
index 83c538b..7f0867a 100644
--- a/ql/src/test/results/clientpositive/llap/autoColumnStats_2.q.out
+++ b/ql/src/test/results/clientpositive/llap/autoColumnStats_2.q.out
@@ -127,7 +127,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              0                                                       
                                         
-distinct_count         309                                                     
                                         
+distinct_count         316                                                     
                                         
 avg_col_len            2.812                                                   
                                         
 max_col_len            3                                                       
                                         
 num_trues                                                                      
                                         
@@ -146,7 +146,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              0                                                       
                                         
-distinct_count         309                                                     
                                         
+distinct_count         316                                                     
                                         
 avg_col_len            2.812                                                   
                                         
 max_col_len            3                                                       
                                         
 num_trues                                                                      
                                         
@@ -251,7 +251,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              0                                                       
                                         
-distinct_count         309                                                     
                                         
+distinct_count         316                                                     
                                         
 avg_col_len            2.812                                                   
                                         
 max_col_len            3                                                       
                                         
 num_trues                                                                      
                                         
@@ -270,7 +270,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              0                                                       
                                         
-distinct_count         309                                                     
                                         
+distinct_count         307                                                     
                                         
 avg_col_len            6.812                                                   
                                         
 max_col_len            7                                                       
                                         
 num_trues                                                                      
                                         
@@ -299,7 +299,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              10                                                      
                                         
-distinct_count         309                                                     
                                         
+distinct_count         316                                                     
                                         
 avg_col_len            2.812                                                   
                                         
 max_col_len            3                                                       
                                         
 num_trues                                                                      
                                         
@@ -318,7 +318,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              10                                                      
                                         
-distinct_count         309                                                     
                                         
+distinct_count         307                                                     
                                         
 avg_col_len            6.812                                                   
                                         
 max_col_len            7                                                       
                                         
 num_trues                                                                      
                                         
@@ -347,7 +347,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              20                                                      
                                         
-distinct_count         309                                                     
                                         
+distinct_count         316                                                     
                                         
 avg_col_len            2.812                                                   
                                         
 max_col_len            3                                                       
                                         
 num_trues                                                                      
                                         
@@ -366,7 +366,7 @@ data_type                   string
 min                                                                            
                                         
 max                                                                            
                                         
 num_nulls              10                                                      
                                         
-distinct_count         319                                                     
                                         
+distinct_count         316                                                     
                                         
 avg_col_len            8.0                                                     
                                         
 max_col_len            8                                                       
                                         
 num_trues                                                                      
                                         

http://git-wip-us.apache.org/repos/asf/hive/blob/13960aa9/ql/src/test/results/clientpositive/llap/auto_join1.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/llap/auto_join1.q.out 
b/ql/src/test/results/clientpositive/llap/auto_join1.q.out
index 61cedb7..17987a7 100644
--- a/ql/src/test/results/clientpositive/llap/auto_join1.q.out
+++ b/ql/src/test/results/clientpositive/llap/auto_join1.q.out
@@ -69,14 +69,14 @@ STAGE PLANS:
                         outputColumnNames: _col0, _col2
                         input vertices:
                           0 Map 1
-                        Statistics: Num rows: 809 Data size: 144002 Basic 
stats: COMPLETE Column stats: COMPLETE
+                        Statistics: Num rows: 791 Data size: 140798 Basic 
stats: COMPLETE Column stats: COMPLETE
                         Select Operator
                           expressions: UDFToInteger(_col0) (type: int), _col2 
(type: string)
                           outputColumnNames: _col0, _col1
-                          Statistics: Num rows: 809 Data size: 76855 Basic 
stats: COMPLETE Column stats: COMPLETE
+                          Statistics: Num rows: 791 Data size: 75145 Basic 
stats: COMPLETE Column stats: COMPLETE
                           File Output Operator
                             compressed: false
-                            Statistics: Num rows: 809 Data size: 76855 Basic 
stats: COMPLETE Column stats: COMPLETE
+                            Statistics: Num rows: 791 Data size: 75145 Basic 
stats: COMPLETE Column stats: COMPLETE
                             table:
                                 input format: 
org.apache.hadoop.mapred.TextInputFormat
                                 output format: 
org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
@@ -85,7 +85,7 @@ STAGE PLANS:
                           Select Operator
                             expressions: _col0 (type: int), _col1 (type: 
string)
                             outputColumnNames: key, value
-                            Statistics: Num rows: 809 Data size: 76855 Basic 
stats: COMPLETE Column stats: COMPLETE
+                            Statistics: Num rows: 791 Data size: 75145 Basic 
stats: COMPLETE Column stats: COMPLETE
                             Group By Operator
                               aggregations: compute_stats(key, 'hll'), 
compute_stats(value, 'hll')
                               mode: hash

http://git-wip-us.apache.org/repos/asf/hive/blob/13960aa9/ql/src/test/results/clientpositive/llap/auto_join21.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/llap/auto_join21.q.out 
b/ql/src/test/results/clientpositive/llap/auto_join21.q.out
index 64e6422..5889720 100644
--- a/ql/src/test/results/clientpositive/llap/auto_join21.q.out
+++ b/ql/src/test/results/clientpositive/llap/auto_join21.q.out
@@ -75,25 +75,25 @@ STAGE PLANS:
                   1 key (type: string)
                   2 key (type: string)
                 outputColumnNames: _col0, _col1, _col5, _col6, _col10, _col11
-                Statistics: Num rows: 434 Data size: 231756 Basic stats: 
COMPLETE Column stats: COMPLETE
+                Statistics: Num rows: 415 Data size: 221610 Basic stats: 
COMPLETE Column stats: COMPLETE
                 Select Operator
                   expressions: _col0 (type: string), _col1 (type: string), 
_col5 (type: string), _col6 (type: string), _col10 (type: string), _col11 
(type: string)
                   outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
-                  Statistics: Num rows: 434 Data size: 231756 Basic stats: 
COMPLETE Column stats: COMPLETE
+                  Statistics: Num rows: 415 Data size: 221610 Basic stats: 
COMPLETE Column stats: COMPLETE
                   Reduce Output Operator
                     key expressions: _col0 (type: string), _col1 (type: 
string), _col2 (type: string), _col3 (type: string), _col4 (type: string), 
_col5 (type: string)
                     sort order: ++++++
-                    Statistics: Num rows: 434 Data size: 231756 Basic stats: 
COMPLETE Column stats: COMPLETE
+                    Statistics: Num rows: 415 Data size: 221610 Basic stats: 
COMPLETE Column stats: COMPLETE
         Reducer 3 
             Execution mode: vectorized, llap
             Reduce Operator Tree:
               Select Operator
                 expressions: KEY.reducesinkkey0 (type: string), 
KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: string), 
KEY.reducesinkkey3 (type: string), KEY.reducesinkkey4 (type: string), 
KEY.reducesinkkey5 (type: string)
                 outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
-                Statistics: Num rows: 434 Data size: 231756 Basic stats: 
COMPLETE Column stats: COMPLETE
+                Statistics: Num rows: 415 Data size: 221610 Basic stats: 
COMPLETE Column stats: COMPLETE
                 File Output Operator
                   compressed: false
-                  Statistics: Num rows: 434 Data size: 231756 Basic stats: 
COMPLETE Column stats: COMPLETE
+                  Statistics: Num rows: 415 Data size: 221610 Basic stats: 
COMPLETE Column stats: COMPLETE
                   table:
                       input format: 
org.apache.hadoop.mapred.SequenceFileInputFormat
                       output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat

http://git-wip-us.apache.org/repos/asf/hive/blob/13960aa9/ql/src/test/results/clientpositive/llap/auto_join29.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/llap/auto_join29.q.out 
b/ql/src/test/results/clientpositive/llap/auto_join29.q.out
index c357c1f..3891ea0 100644
--- a/ql/src/test/results/clientpositive/llap/auto_join29.q.out
+++ b/ql/src/test/results/clientpositive/llap/auto_join29.q.out
@@ -75,25 +75,25 @@ STAGE PLANS:
                   1 key (type: string)
                   2 key (type: string)
                 outputColumnNames: _col0, _col1, _col5, _col6, _col10, _col11
-                Statistics: Num rows: 434 Data size: 231756 Basic stats: 
COMPLETE Column stats: COMPLETE
+                Statistics: Num rows: 415 Data size: 221610 Basic stats: 
COMPLETE Column stats: COMPLETE
                 Select Operator
                   expressions: _col0 (type: string), _col1 (type: string), 
_col5 (type: string), _col6 (type: string), _col10 (type: string), _col11 
(type: string)
                   outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
-                  Statistics: Num rows: 434 Data size: 231756 Basic stats: 
COMPLETE Column stats: COMPLETE
+                  Statistics: Num rows: 415 Data size: 221610 Basic stats: 
COMPLETE Column stats: COMPLETE
                   Reduce Output Operator
                     key expressions: _col0 (type: string), _col1 (type: 
string), _col2 (type: string), _col3 (type: string), _col4 (type: string), 
_col5 (type: string)
                     sort order: ++++++
-                    Statistics: Num rows: 434 Data size: 231756 Basic stats: 
COMPLETE Column stats: COMPLETE
+                    Statistics: Num rows: 415 Data size: 221610 Basic stats: 
COMPLETE Column stats: COMPLETE
         Reducer 3 
             Execution mode: vectorized, llap
             Reduce Operator Tree:
               Select Operator
                 expressions: KEY.reducesinkkey0 (type: string), 
KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: string), 
KEY.reducesinkkey3 (type: string), KEY.reducesinkkey4 (type: string), 
KEY.reducesinkkey5 (type: string)
                 outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
-                Statistics: Num rows: 434 Data size: 231756 Basic stats: 
COMPLETE Column stats: COMPLETE
+                Statistics: Num rows: 415 Data size: 221610 Basic stats: 
COMPLETE Column stats: COMPLETE
                 File Output Operator
                   compressed: false
-                  Statistics: Num rows: 434 Data size: 231756 Basic stats: 
COMPLETE Column stats: COMPLETE
+                  Statistics: Num rows: 415 Data size: 221610 Basic stats: 
COMPLETE Column stats: COMPLETE
                   table:
                       input format: 
org.apache.hadoop.mapred.SequenceFileInputFormat
                       output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -693,25 +693,25 @@ STAGE PLANS:
                   1 key (type: string)
                   2 key (type: string)
                 outputColumnNames: _col0, _col1, _col5, _col6, _col10, _col11
-                Statistics: Num rows: 143 Data size: 76362 Basic stats: 
COMPLETE Column stats: COMPLETE
+                Statistics: Num rows: 137 Data size: 73158 Basic stats: 
COMPLETE Column stats: COMPLETE
                 Select Operator
                   expressions: _col0 (type: string), _col1 (type: string), 
_col5 (type: string), _col6 (type: string), _col10 (type: string), _col11 
(type: string)
                   outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
-                  Statistics: Num rows: 143 Data size: 76362 Basic stats: 
COMPLETE Column stats: COMPLETE
+                  Statistics: Num rows: 137 Data size: 73158 Basic stats: 
COMPLETE Column stats: COMPLETE
                   Reduce Output Operator
                     key expressions: _col0 (type: string), _col1 (type: 
string), _col2 (type: string), _col3 (type: string), _col4 (type: string), 
_col5 (type: string)
                     sort order: ++++++
-                    Statistics: Num rows: 143 Data size: 76362 Basic stats: 
COMPLETE Column stats: COMPLETE
+                    Statistics: Num rows: 137 Data size: 73158 Basic stats: 
COMPLETE Column stats: COMPLETE
         Reducer 3 
             Execution mode: vectorized, llap
             Reduce Operator Tree:
               Select Operator
                 expressions: KEY.reducesinkkey0 (type: string), 
KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: string), 
KEY.reducesinkkey3 (type: string), KEY.reducesinkkey4 (type: string), 
KEY.reducesinkkey5 (type: string)
                 outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
-                Statistics: Num rows: 143 Data size: 76362 Basic stats: 
COMPLETE Column stats: COMPLETE
+                Statistics: Num rows: 137 Data size: 73158 Basic stats: 
COMPLETE Column stats: COMPLETE
                 File Output Operator
                   compressed: false
-                  Statistics: Num rows: 143 Data size: 76362 Basic stats: 
COMPLETE Column stats: COMPLETE
+                  Statistics: Num rows: 137 Data size: 73158 Basic stats: 
COMPLETE Column stats: COMPLETE
                   table:
                       input format: 
org.apache.hadoop.mapred.SequenceFileInputFormat
                       output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -1311,25 +1311,25 @@ STAGE PLANS:
                   1 key (type: string)
                   2 key (type: string)
                 outputColumnNames: _col0, _col1, _col5, _col6, _col10, _col11
-                Statistics: Num rows: 432 Data size: 230688 Basic stats: 
COMPLETE Column stats: COMPLETE
+                Statistics: Num rows: 415 Data size: 221610 Basic stats: 
COMPLETE Column stats: COMPLETE
                 Select Operator
                   expressions: _col0 (type: string), _col1 (type: string), 
_col5 (type: string), _col6 (type: string), _col10 (type: string), _col11 
(type: string)
                   outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
-                  Statistics: Num rows: 432 Data size: 230688 Basic stats: 
COMPLETE Column stats: COMPLETE
+                  Statistics: Num rows: 415 Data size: 221610 Basic stats: 
COMPLETE Column stats: COMPLETE
                   Reduce Output Operator
                     key expressions: _col0 (type: string), _col1 (type: 
string), _col2 (type: string), _col3 (type: string), _col4 (type: string), 
_col5 (type: string)
                     sort order: ++++++
-                    Statistics: Num rows: 432 Data size: 230688 Basic stats: 
COMPLETE Column stats: COMPLETE
+                    Statistics: Num rows: 415 Data size: 221610 Basic stats: 
COMPLETE Column stats: COMPLETE
         Reducer 3 
             Execution mode: vectorized, llap
             Reduce Operator Tree:
               Select Operator
                 expressions: KEY.reducesinkkey0 (type: string), 
KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: string), 
KEY.reducesinkkey3 (type: string), KEY.reducesinkkey4 (type: string), 
KEY.reducesinkkey5 (type: string)
                 outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
-                Statistics: Num rows: 432 Data size: 230688 Basic stats: 
COMPLETE Column stats: COMPLETE
+                Statistics: Num rows: 415 Data size: 221610 Basic stats: 
COMPLETE Column stats: COMPLETE
                 File Output Operator
                   compressed: false
-                  Statistics: Num rows: 432 Data size: 230688 Basic stats: 
COMPLETE Column stats: COMPLETE
+                  Statistics: Num rows: 415 Data size: 221610 Basic stats: 
COMPLETE Column stats: COMPLETE
                   table:
                       input format: 
org.apache.hadoop.mapred.SequenceFileInputFormat
                       output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -1938,25 +1938,25 @@ STAGE PLANS:
                   1 key (type: string)
                   2 key (type: string)
                 outputColumnNames: _col0, _col1, _col5, _col6, _col10, _col11
-                Statistics: Num rows: 434 Data size: 231756 Basic stats: 
COMPLETE Column stats: COMPLETE
+                Statistics: Num rows: 415 Data size: 221610 Basic stats: 
COMPLETE Column stats: COMPLETE
                 Select Operator
                   expressions: _col0 (type: string), _col1 (type: string), 
_col5 (type: string), _col6 (type: string), _col10 (type: string), _col11 
(type: string)
                   outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
-                  Statistics: Num rows: 434 Data size: 231756 Basic stats: 
COMPLETE Column stats: COMPLETE
+                  Statistics: Num rows: 415 Data size: 221610 Basic stats: 
COMPLETE Column stats: COMPLETE
                   Reduce Output Operator
                     key expressions: _col0 (type: string), _col1 (type: 
string), _col2 (type: string), _col3 (type: string), _col4 (type: string), 
_col5 (type: string)
                     sort order: ++++++
-                    Statistics: Num rows: 434 Data size: 231756 Basic stats: 
COMPLETE Column stats: COMPLETE
+                    Statistics: Num rows: 415 Data size: 221610 Basic stats: 
COMPLETE Column stats: COMPLETE
         Reducer 3 
             Execution mode: vectorized, llap
             Reduce Operator Tree:
               Select Operator
                 expressions: KEY.reducesinkkey0 (type: string), 
KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: string), 
KEY.reducesinkkey3 (type: string), KEY.reducesinkkey4 (type: string), 
KEY.reducesinkkey5 (type: string)
                 outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
-                Statistics: Num rows: 434 Data size: 231756 Basic stats: 
COMPLETE Column stats: COMPLETE
+                Statistics: Num rows: 415 Data size: 221610 Basic stats: 
COMPLETE Column stats: COMPLETE
                 File Output Operator
                   compressed: false
-                  Statistics: Num rows: 434 Data size: 231756 Basic stats: 
COMPLETE Column stats: COMPLETE
+                  Statistics: Num rows: 415 Data size: 221610 Basic stats: 
COMPLETE Column stats: COMPLETE
                   table:
                       input format: 
org.apache.hadoop.mapred.SequenceFileInputFormat
                       output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -2567,25 +2567,25 @@ STAGE PLANS:
                   1 key (type: string)
                   2 key (type: string)
                 outputColumnNames: _col0, _col1, _col5, _col6, _col10, _col11
-                Statistics: Num rows: 143 Data size: 76362 Basic stats: 
COMPLETE Column stats: COMPLETE
+                Statistics: Num rows: 135 Data size: 72090 Basic stats: 
COMPLETE Column stats: COMPLETE
                 Select Operator
                   expressions: _col0 (type: string), _col1 (type: string), 
_col5 (type: string), _col6 (type: string), _col10 (type: string), _col11 
(type: string)
                   outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
-                  Statistics: Num rows: 143 Data size: 76362 Basic stats: 
COMPLETE Column stats: COMPLETE
+                  Statistics: Num rows: 135 Data size: 72090 Basic stats: 
COMPLETE Column stats: COMPLETE
                   Reduce Output Operator
                     key expressions: _col0 (type: string), _col1 (type: 
string), _col2 (type: string), _col3 (type: string), _col4 (type: string), 
_col5 (type: string)
                     sort order: ++++++
-                    Statistics: Num rows: 143 Data size: 76362 Basic stats: 
COMPLETE Column stats: COMPLETE
+                    Statistics: Num rows: 135 Data size: 72090 Basic stats: 
COMPLETE Column stats: COMPLETE
         Reducer 3 
             Execution mode: vectorized, llap
             Reduce Operator Tree:
               Select Operator
                 expressions: KEY.reducesinkkey0 (type: string), 
KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: string), 
KEY.reducesinkkey3 (type: string), KEY.reducesinkkey4 (type: string), 
KEY.reducesinkkey5 (type: string)
                 outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
-                Statistics: Num rows: 143 Data size: 76362 Basic stats: 
COMPLETE Column stats: COMPLETE
+                Statistics: Num rows: 135 Data size: 72090 Basic stats: 
COMPLETE Column stats: COMPLETE
                 File Output Operator
                   compressed: false
-                  Statistics: Num rows: 143 Data size: 76362 Basic stats: 
COMPLETE Column stats: COMPLETE
+                  Statistics: Num rows: 135 Data size: 72090 Basic stats: 
COMPLETE Column stats: COMPLETE
                   table:
                       input format: 
org.apache.hadoop.mapred.SequenceFileInputFormat
                       output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -2685,25 +2685,25 @@ STAGE PLANS:
                   1 key (type: string)
                   2 key (type: string)
                 outputColumnNames: _col0, _col1, _col5, _col6, _col10, _col11
-                Statistics: Num rows: 143 Data size: 76362 Basic stats: 
COMPLETE Column stats: COMPLETE
+                Statistics: Num rows: 136 Data size: 72624 Basic stats: 
COMPLETE Column stats: COMPLETE
                 Select Operator
                   expressions: _col0 (type: string), _col1 (type: string), 
_col5 (type: string), _col6 (type: string), _col10 (type: string), _col11 
(type: string)
                   outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
-                  Statistics: Num rows: 143 Data size: 76362 Basic stats: 
COMPLETE Column stats: COMPLETE
+                  Statistics: Num rows: 136 Data size: 72624 Basic stats: 
COMPLETE Column stats: COMPLETE
                   Reduce Output Operator
                     key expressions: _col0 (type: string), _col1 (type: 
string), _col2 (type: string), _col3 (type: string), _col4 (type: string), 
_col5 (type: string)
                     sort order: ++++++
-                    Statistics: Num rows: 143 Data size: 76362 Basic stats: 
COMPLETE Column stats: COMPLETE
+                    Statistics: Num rows: 136 Data size: 72624 Basic stats: 
COMPLETE Column stats: COMPLETE
         Reducer 3 
             Execution mode: vectorized, llap
             Reduce Operator Tree:
               Select Operator
                 expressions: KEY.reducesinkkey0 (type: string), 
KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: string), 
KEY.reducesinkkey3 (type: string), KEY.reducesinkkey4 (type: string), 
KEY.reducesinkkey5 (type: string)
                 outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
-                Statistics: Num rows: 143 Data size: 76362 Basic stats: 
COMPLETE Column stats: COMPLETE
+                Statistics: Num rows: 136 Data size: 72624 Basic stats: 
COMPLETE Column stats: COMPLETE
                 File Output Operator
                   compressed: false
-                  Statistics: Num rows: 143 Data size: 76362 Basic stats: 
COMPLETE Column stats: COMPLETE
+                  Statistics: Num rows: 136 Data size: 72624 Basic stats: 
COMPLETE Column stats: COMPLETE
                   table:
                       input format: 
org.apache.hadoop.mapred.SequenceFileInputFormat
                       output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -3263,15 +3263,15 @@ STAGE PLANS:
                     input vertices:
                       1 Map 3
                       2 Map 4
-                    Statistics: Num rows: 143 Data size: 76362 Basic stats: 
COMPLETE Column stats: COMPLETE
+                    Statistics: Num rows: 136 Data size: 72624 Basic stats: 
COMPLETE Column stats: COMPLETE
                     Select Operator
                       expressions: _col0 (type: string), _col1 (type: string), 
_col5 (type: string), _col6 (type: string), _col10 (type: string), _col11 
(type: string)
                       outputColumnNames: _col0, _col1, _col2, _col3, _col4, 
_col5
-                      Statistics: Num rows: 143 Data size: 76362 Basic stats: 
COMPLETE Column stats: COMPLETE
+                      Statistics: Num rows: 136 Data size: 72624 Basic stats: 
COMPLETE Column stats: COMPLETE
                       Reduce Output Operator
                         key expressions: _col0 (type: string), _col1 (type: 
string), _col2 (type: string), _col3 (type: string), _col4 (type: string), 
_col5 (type: string)
                         sort order: ++++++
-                        Statistics: Num rows: 143 Data size: 76362 Basic 
stats: COMPLETE Column stats: COMPLETE
+                        Statistics: Num rows: 136 Data size: 72624 Basic 
stats: COMPLETE Column stats: COMPLETE
             Execution mode: vectorized, llap
             LLAP IO: no inputs
         Map 3 
@@ -3312,10 +3312,10 @@ STAGE PLANS:
               Select Operator
                 expressions: KEY.reducesinkkey0 (type: string), 
KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: string), 
KEY.reducesinkkey3 (type: string), KEY.reducesinkkey4 (type: string), 
KEY.reducesinkkey5 (type: string)
                 outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
-                Statistics: Num rows: 143 Data size: 76362 Basic stats: 
COMPLETE Column stats: COMPLETE
+                Statistics: Num rows: 136 Data size: 72624 Basic stats: 
COMPLETE Column stats: COMPLETE
                 File Output Operator
                   compressed: false
-                  Statistics: Num rows: 143 Data size: 76362 Basic stats: 
COMPLETE Column stats: COMPLETE
+                  Statistics: Num rows: 136 Data size: 72624 Basic stats: 
COMPLETE Column stats: COMPLETE
                   table:
                       input format: 
org.apache.hadoop.mapred.SequenceFileInputFormat
                       output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -3394,15 +3394,15 @@ STAGE PLANS:
                       input vertices:
                         0 Map 1
                         2 Map 4
-                      Statistics: Num rows: 431 Data size: 230154 Basic stats: 
COMPLETE Column stats: COMPLETE
+                      Statistics: Num rows: 414 Data size: 221076 Basic stats: 
COMPLETE Column stats: COMPLETE
                       Select Operator
                         expressions: _col0 (type: string), _col1 (type: 
string), _col5 (type: string), _col6 (type: string), _col10 (type: string), 
_col11 (type: string)
                         outputColumnNames: _col0, _col1, _col2, _col3, _col4, 
_col5
-                        Statistics: Num rows: 431 Data size: 230154 Basic 
stats: COMPLETE Column stats: COMPLETE
+                        Statistics: Num rows: 414 Data size: 221076 Basic 
stats: COMPLETE Column stats: COMPLETE
                         Reduce Output Operator
                           key expressions: _col0 (type: string), _col1 (type: 
string), _col2 (type: string), _col3 (type: string), _col4 (type: string), 
_col5 (type: string)
                           sort order: ++++++
-                          Statistics: Num rows: 431 Data size: 230154 Basic 
stats: COMPLETE Column stats: COMPLETE
+                          Statistics: Num rows: 414 Data size: 221076 Basic 
stats: COMPLETE Column stats: COMPLETE
             Execution mode: vectorized, llap
             LLAP IO: no inputs
         Map 4 
@@ -3427,10 +3427,10 @@ STAGE PLANS:
               Select Operator
                 expressions: KEY.reducesinkkey0 (type: string), 
KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: string), 
KEY.reducesinkkey3 (type: string), KEY.reducesinkkey4 (type: string), 
KEY.reducesinkkey5 (type: string)
                 outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
-                Statistics: Num rows: 431 Data size: 230154 Basic stats: 
COMPLETE Column stats: COMPLETE
+                Statistics: Num rows: 414 Data size: 221076 Basic stats: 
COMPLETE Column stats: COMPLETE
                 File Output Operator
                   compressed: false
-                  Statistics: Num rows: 431 Data size: 230154 Basic stats: 
COMPLETE Column stats: COMPLETE
+                  Statistics: Num rows: 414 Data size: 221076 Basic stats: 
COMPLETE Column stats: COMPLETE
                   table:
                       input format: 
org.apache.hadoop.mapred.SequenceFileInputFormat
                       output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -3511,15 +3511,15 @@ STAGE PLANS:
                       input vertices:
                         1 Map 3
                         2 Map 4
-                      Statistics: Num rows: 143 Data size: 76362 Basic stats: 
COMPLETE Column stats: COMPLETE
+                      Statistics: Num rows: 135 Data size: 72090 Basic stats: 
COMPLETE Column stats: COMPLETE
                       Select Operator
                         expressions: _col0 (type: string), _col1 (type: 
string), _col5 (type: string), _col6 (type: string), _col10 (type: string), 
_col11 (type: string)
                         outputColumnNames: _col0, _col1, _col2, _col3, _col4, 
_col5
-                        Statistics: Num rows: 143 Data size: 76362 Basic 
stats: COMPLETE Column stats: COMPLETE
+                        Statistics: Num rows: 135 Data size: 72090 Basic 
stats: COMPLETE Column stats: COMPLETE
                         Reduce Output Operator
                           key expressions: _col0 (type: string), _col1 (type: 
string), _col2 (type: string), _col3 (type: string), _col4 (type: string), 
_col5 (type: string)
                           sort order: ++++++
-                          Statistics: Num rows: 143 Data size: 76362 Basic 
stats: COMPLETE Column stats: COMPLETE
+                          Statistics: Num rows: 135 Data size: 72090 Basic 
stats: COMPLETE Column stats: COMPLETE
             Execution mode: vectorized, llap
             LLAP IO: no inputs
         Map 3 
@@ -3560,10 +3560,10 @@ STAGE PLANS:
               Select Operator
                 expressions: KEY.reducesinkkey0 (type: string), 
KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: string), 
KEY.reducesinkkey3 (type: string), KEY.reducesinkkey4 (type: string), 
KEY.reducesinkkey5 (type: string)
                 outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
-                Statistics: Num rows: 143 Data size: 76362 Basic stats: 
COMPLETE Column stats: COMPLETE
+                Statistics: Num rows: 135 Data size: 72090 Basic stats: 
COMPLETE Column stats: COMPLETE
                 File Output Operator
                   compressed: false
-                  Statistics: Num rows: 143 Data size: 76362 Basic stats: 
COMPLETE Column stats: COMPLETE
+                  Statistics: Num rows: 135 Data size: 72090 Basic stats: 
COMPLETE Column stats: COMPLETE
                   table:
                       input format: 
org.apache.hadoop.mapred.SequenceFileInputFormat
                       output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat

http://git-wip-us.apache.org/repos/asf/hive/blob/13960aa9/ql/src/test/results/clientpositive/llap/auto_join30.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/llap/auto_join30.q.out 
b/ql/src/test/results/clientpositive/llap/auto_join30.q.out
index 19d6c55..1f95237 100644
--- a/ql/src/test/results/clientpositive/llap/auto_join30.q.out
+++ b/ql/src/test/results/clientpositive/llap/auto_join30.q.out
@@ -67,7 +67,7 @@ STAGE PLANS:
                         outputColumnNames: _col2, _col3
                         input vertices:
                           0 Map 1
-                        Statistics: Num rows: 809 Data size: 144002 Basic 
stats: COMPLETE Column stats: COMPLETE
+                        Statistics: Num rows: 791 Data size: 140798 Basic 
stats: COMPLETE Column stats: COMPLETE
                         Group By Operator
                           aggregations: sum(hash(_col2,_col3))
                           mode: hash
@@ -167,7 +167,7 @@ STAGE PLANS:
                       outputColumnNames: _col2, _col3
                       input vertices:
                         1 Map 3
-                      Statistics: Num rows: 809 Data size: 144002 Basic stats: 
COMPLETE Column stats: COMPLETE
+                      Statistics: Num rows: 791 Data size: 140798 Basic stats: 
COMPLETE Column stats: COMPLETE
                       Group By Operator
                         aggregations: sum(hash(_col2,_col3))
                         mode: hash
@@ -300,7 +300,7 @@ STAGE PLANS:
                       outputColumnNames: _col2, _col3
                       input vertices:
                         0 Map 1
-                      Statistics: Num rows: 809 Data size: 144002 Basic stats: 
COMPLETE Column stats: COMPLETE
+                      Statistics: Num rows: 791 Data size: 140798 Basic stats: 
COMPLETE Column stats: COMPLETE
                       Group By Operator
                         aggregations: sum(hash(_col2,_col3))
                         mode: hash
@@ -431,7 +431,7 @@ STAGE PLANS:
                         input vertices:
                           0 Map 1
                           2 Map 4
-                        Statistics: Num rows: 1309 Data size: 233002 Basic 
stats: COMPLETE Column stats: COMPLETE
+                        Statistics: Num rows: 1251 Data size: 222678 Basic 
stats: COMPLETE Column stats: COMPLETE
                         Group By Operator
                           aggregations: sum(hash(_col2,_col3))
                           mode: hash
@@ -605,7 +605,7 @@ STAGE PLANS:
                   1 _col0 (type: string)
                   2 _col0 (type: string)
                 outputColumnNames: _col2, _col3
-                Statistics: Num rows: 1309 Data size: 233002 Basic stats: 
COMPLETE Column stats: COMPLETE
+                Statistics: Num rows: 1251 Data size: 222678 Basic stats: 
COMPLETE Column stats: COMPLETE
                 Group By Operator
                   aggregations: sum(hash(_col2,_col3))
                   mode: hash
@@ -758,7 +758,7 @@ STAGE PLANS:
                   1 _col0 (type: string)
                   2 _col0 (type: string)
                 outputColumnNames: _col2, _col3
-                Statistics: Num rows: 1309 Data size: 233002 Basic stats: 
COMPLETE Column stats: COMPLETE
+                Statistics: Num rows: 1251 Data size: 222678 Basic stats: 
COMPLETE Column stats: COMPLETE
                 Group By Operator
                   aggregations: sum(hash(_col2,_col3))
                   mode: hash
@@ -911,7 +911,7 @@ STAGE PLANS:
                   1 _col0 (type: string)
                   2 _col0 (type: string)
                 outputColumnNames: _col2, _col3
-                Statistics: Num rows: 1309 Data size: 233002 Basic stats: 
COMPLETE Column stats: COMPLETE
+                Statistics: Num rows: 1251 Data size: 222678 Basic stats: 
COMPLETE Column stats: COMPLETE
                 Group By Operator
                   aggregations: sum(hash(_col2,_col3))
                   mode: hash
@@ -1064,7 +1064,7 @@ STAGE PLANS:
                   1 _col0 (type: string)
                   2 _col0 (type: string)
                 outputColumnNames: _col2, _col3
-                Statistics: Num rows: 1309 Data size: 233002 Basic stats: 
COMPLETE Column stats: COMPLETE
+                Statistics: Num rows: 1251 Data size: 222678 Basic stats: 
COMPLETE Column stats: COMPLETE
                 Group By Operator
                   aggregations: sum(hash(_col2,_col3))
                   mode: hash

Reply via email to