http://git-wip-us.apache.org/repos/asf/hive/blob/76148bb6/ql/src/test/results/clientpositive/spark/vectorization_14.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/spark/vectorization_14.q.out 
b/ql/src/test/results/clientpositive/spark/vectorization_14.q.out
index 95bf29b..5266764 100644
--- a/ql/src/test/results/clientpositive/spark/vectorization_14.q.out
+++ b/ql/src/test/results/clientpositive/spark/vectorization_14.q.out
@@ -84,7 +84,7 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: alltypesorc
-                  Statistics: Num rows: 12288 Data size: 2641964 Basic stats: 
COMPLETE Column stats: NONE
+                  Statistics: Num rows: 12288 Data size: 2907994 Basic stats: 
COMPLETE Column stats: NONE
                   TableScan Vectorization:
                       native: true
                       vectorizationSchemaColumns: [0:ctinyint:tinyint, 
1:csmallint:smallint, 2:cint:int, 3:cbigint:bigint, 4:cfloat:float, 
5:cdouble:double, 6:cstring1:string, 7:cstring2:string, 
8:ctimestamp1:timestamp, 9:ctimestamp2:timestamp, 10:cboolean1:boolean, 
11:cboolean2:boolean, 
12:ROW__ID:struct<writeid:bigint,bucketid:int,rowid:bigint>]
@@ -94,7 +94,7 @@ STAGE PLANS:
                         native: true
                         predicateExpression: FilterExprAndExpr(children: 
FilterLongColLessEqualLongColumn(col 0:bigint, col 3:bigint)(children: col 
0:tinyint), FilterExprOrExpr(children: FilterDoubleColLessEqualDoubleColumn(col 
13:double, col 5:double)(children: CastLongToDouble(col 2:int) -> 13:double), 
FilterTimestampColLessTimestampColumn(col 9:timestamp, col 8:timestamp)), 
FilterDoubleColLessDoubleColumn(col 5:double, col 13:double)(children: 
CastLongToDouble(col 0:tinyint) -> 13:double), FilterExprOrExpr(children: 
FilterLongColGreaterLongScalar(col 3:bigint, val -257), 
FilterDoubleColLessDoubleColumn(col 4:float, col 13:float)(children: 
CastLongToFloatViaLongToDouble(col 2:int) -> 13:float)))
                     predicate: (((UDFToDouble(cint) <= cdouble) or 
(ctimestamp2 < ctimestamp1)) and ((cbigint > -257L) or (cfloat < 
UDFToFloat(cint))) and (UDFToLong(ctinyint) <= cbigint) and (cdouble < 
UDFToDouble(ctinyint))) (type: boolean)
-                    Statistics: Num rows: 606 Data size: 130292 Basic stats: 
COMPLETE Column stats: NONE
+                    Statistics: Num rows: 606 Data size: 143411 Basic stats: 
COMPLETE Column stats: NONE
                     Select Operator
                       expressions: ctimestamp1 (type: timestamp), cfloat 
(type: float), cstring1 (type: string), cboolean1 (type: boolean), cdouble 
(type: double), (- (-26.28D + cdouble)) (type: double), ((- (-26.28D + 
cdouble)) * (- (-26.28D + cdouble))) (type: double), UDFToDouble(cfloat) (type: 
double), (UDFToDouble(cfloat) * UDFToDouble(cfloat)) (type: double)
                       outputColumnNames: _col0, _col1, _col2, _col3, _col4, 
_col5, _col6, _col7, _col8
@@ -103,7 +103,7 @@ STAGE PLANS:
                           native: true
                           projectedOutputColumnNums: [8, 4, 6, 10, 5, 14, 13, 
4, 15]
                           selectExpressions: DoubleColUnaryMinus(col 
13:double)(children: DoubleScalarAddDoubleColumn(val -26.28, col 5:double) -> 
13:double) -> 14:double, DoubleColMultiplyDoubleColumn(col 15:double, col 
16:double)(children: DoubleColUnaryMinus(col 13:double)(children: 
DoubleScalarAddDoubleColumn(val -26.28, col 5:double) -> 13:double) -> 
15:double, DoubleColUnaryMinus(col 13:double)(children: 
DoubleScalarAddDoubleColumn(val -26.28, col 5:double) -> 13:double) -> 
16:double) -> 13:double, DoubleColMultiplyDoubleColumn(col 4:double, col 
4:double)(children: col 4:float, col 4:float) -> 15:double
-                      Statistics: Num rows: 606 Data size: 130292 Basic stats: 
COMPLETE Column stats: NONE
+                      Statistics: Num rows: 606 Data size: 143411 Basic stats: 
COMPLETE Column stats: NONE
                       Group By Operator
                         aggregations: sum(_col6), sum(_col5), count(_col5), 
max(_col1), sum(_col8), sum(_col7), count(_col1)
                         Group By Vectorization:
@@ -117,7 +117,7 @@ STAGE PLANS:
                         keys: _col2 (type: string), _col1 (type: float), _col4 
(type: double), _col0 (type: timestamp), _col3 (type: boolean)
                         mode: hash
                         outputColumnNames: _col0, _col1, _col2, _col3, _col4, 
_col5, _col6, _col7, _col8, _col9, _col10, _col11
-                        Statistics: Num rows: 606 Data size: 130292 Basic 
stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 606 Data size: 143411 Basic 
stats: COMPLETE Column stats: NONE
                         Reduce Output Operator
                           key expressions: _col0 (type: string), _col1 (type: 
float), _col2 (type: double), _col3 (type: timestamp), _col4 (type: boolean)
                           sort order: +++++
@@ -128,7 +128,7 @@ STAGE PLANS:
                               native: true
                               nativeConditionsMet: 
hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine 
spark IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS 
true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true
                               valueColumnNums: [5, 6, 7, 8, 9, 10, 11]
-                          Statistics: Num rows: 606 Data size: 130292 Basic 
stats: COMPLETE Column stats: NONE
+                          Statistics: Num rows: 606 Data size: 143411 Basic 
stats: COMPLETE Column stats: NONE
                           value expressions: _col5 (type: double), _col6 
(type: double), _col7 (type: bigint), _col8 (type: float), _col9 (type: 
double), _col10 (type: double), _col11 (type: bigint)
             Execution mode: vectorized
             Map Vectorization:
@@ -175,7 +175,7 @@ STAGE PLANS:
                 keys: KEY._col0 (type: string), KEY._col1 (type: float), 
KEY._col2 (type: double), KEY._col3 (type: timestamp), KEY._col4 (type: boolean)
                 mode: mergepartial
                 outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, 
_col6, _col7, _col8, _col9, _col10, _col11
-                Statistics: Num rows: 303 Data size: 65146 Basic stats: 
COMPLETE Column stats: NONE
+                Statistics: Num rows: 303 Data size: 71705 Basic stats: 
COMPLETE Column stats: NONE
                 Select Operator
                   expressions: _col3 (type: timestamp), _col1 (type: float), 
_col0 (type: string), _col4 (type: boolean), _col2 (type: double), (-26.28D + 
_col2) (type: double), (- (-26.28D + _col2)) (type: double), power(((_col5 - 
((_col6 * _col6) / _col7)) / CASE WHEN ((_col7 = 1L)) THEN (null) ELSE ((_col7 
- 1)) END), 0.5) (type: double), (_col1 * -26.28) (type: float), _col8 (type: 
float), (- _col1) (type: float), (- _col8) (type: float), ((- (-26.28D + 
_col2)) / 10.175D) (type: double), power(((_col9 - ((_col10 * _col10) / 
_col11)) / _col11), 0.5) (type: double), _col11 (type: bigint), (- ((- (-26.28D 
+ _col2)) / 10.175D)) (type: double), (-1.389D % power(((_col5 - ((_col6 * 
_col6) / _col7)) / CASE WHEN ((_col7 = 1L)) THEN (null) ELSE ((_col7 - 1)) 
END), 0.5)) (type: double), (UDFToDouble(_col1) - _col2) (type: double), 
((_col9 - ((_col10 * _col10) / _col11)) / _col11) (type: double), (((_col9 - 
((_col10 * _col10) / _col11)) / _col11) % 10.175D) (type: double), ((_col9 - 
((_col
 10 * _col10) / _col11)) / CASE WHEN ((_col11 = 1L)) THEN (null) ELSE ((_col11 
- 1)) END) (type: double), (- (UDFToDouble(_col1) - _col2)) (type: double)
                   outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, 
_col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, 
_col16, _col17, _col18, _col19, _col20, _col21
@@ -184,7 +184,7 @@ STAGE PLANS:
                       native: true
                       projectedOutputColumnNums: [3, 1, 0, 4, 2, 12, 14, 13, 
15, 8, 19, 20, 21, 22, 11, 24, 25, 23, 29, 28, 31, 34]
                       selectExpressions: DoubleScalarAddDoubleColumn(val 
-26.28, col 2:double) -> 12:double, DoubleColUnaryMinus(col 
13:double)(children: DoubleScalarAddDoubleColumn(val -26.28, col 2:double) -> 
13:double) -> 14:double, FuncPowerDoubleToDouble(col 15:double)(children: 
DoubleColDivideLongColumn(col 13:double, col 18:bigint)(children: 
DoubleColSubtractDoubleColumn(col 5:double, col 15:double)(children: 
DoubleColDivideLongColumn(col 13:double, col 7:bigint)(children: 
DoubleColMultiplyDoubleColumn(col 6:double, col 6:double) -> 13:double) -> 
15:double) -> 13:double, IfExprNullCondExpr(col 16:boolean, null, col 
17:bigint)(children: LongColEqualLongScalar(col 7:bigint, val 1) -> 16:boolean, 
LongColSubtractLongScalar(col 7:bigint, val 1) -> 17:bigint) -> 18:bigint) -> 
15:double) -> 13:double, DoubleColMultiplyDoubleScalar(col 1:float, val 
-26.280000686645508) -> 15:float, DoubleColUnaryMinus(col 1:float) -> 19:float, 
DoubleColUnaryMinus(col 8:float) -> 20:float, DoubleColDi
 videDoubleScalar(col 22:double, val 10.175)(children: DoubleColUnaryMinus(col 
21:double)(children: DoubleScalarAddDoubleColumn(val -26.28, col 2:double) -> 
21:double) -> 22:double) -> 21:double, FuncPowerDoubleToDouble(col 
23:double)(children: DoubleColDivideLongColumn(col 22:double, col 
11:bigint)(children: DoubleColSubtractDoubleColumn(col 9:double, col 
23:double)(children: DoubleColDivideLongColumn(col 22:double, col 
11:bigint)(children: DoubleColMultiplyDoubleColumn(col 10:double, col 
10:double) -> 22:double) -> 23:double) -> 22:double) -> 23:double) -> 
22:double, DoubleColUnaryMinus(col 23:double)(children: 
DoubleColDivideDoubleScalar(col 24:double, val 10.175)(children: 
DoubleColUnaryMinus(col 23:double)(children: DoubleScalarAddDoubleColumn(val 
-26.28, col 2:double) -> 23:double) -> 24:double) -> 23:double) -> 24:double, 
DoubleScalarModuloDoubleColumn(val -1.389, col 23:double)(children: 
FuncPowerDoubleToDouble(col 25:double)(children: DoubleColDivideLongColumn(col 
23:double,
  col 27:bigint)(children: DoubleColSubtractDoubleColumn(col 5:double, col 
25:double)(children: DoubleColDivideLongColumn(col 23:double, col 
7:bigint)(children: DoubleColMultiplyDoubleColumn(col 6:double, col 6:double) 
-> 23:double) -> 25:double) -> 23:double, IfExprNullCondExpr(col 18:boolean, 
null, col 26:bigint)(children: LongColEqualLongScalar(col 7:bigint, val 1) -> 
18:boolean, LongColSubtractLongScalar(col 7:bigint, val 1) -> 26:bigint) -> 
27:bigint) -> 25:double) -> 23:double) -> 25:double, 
DoubleColSubtractDoubleColumn(col 1:double, col 2:double)(children: col 
1:float) -> 23:double, DoubleColDivideLongColumn(col 28:double, col 
11:bigint)(children: DoubleColSubtractDoubleColumn(col 9:double, col 
29:double)(children: DoubleColDivideLongColumn(col 28:double, col 
11:bigint)(children: DoubleColMultiplyDoubleColumn(col 10:double, col 
10:double) -> 28:double) -> 29:double) -> 28:double) -> 29:double, 
DoubleColModuloDoubleScalar(col 30:double, val 10.175)(children: 
DoubleColDivideLon
 gColumn(col 28:double, col 11:bigint)(children: 
DoubleColSubtractDoubleColumn(col 9:double, col 30:double)(children: 
DoubleColDivideLongColumn(col 28:double, col 11:bigint)(children: 
DoubleColMultiplyDoubleColumn(col 10:double, col 10:double) -> 28:double) -> 
30:double) -> 28:double) -> 30:double) -> 28:double, 
DoubleColDivideLongColumn(col 30:double, col 33:bigint)(children: 
DoubleColSubtractDoubleColumn(col 9:double, col 31:double)(children: 
DoubleColDivideLongColumn(col 30:double, col 11:bigint)(children: 
DoubleColMultiplyDoubleColumn(col 10:double, col 10:double) -> 30:double) -> 
31:double) -> 30:double, IfExprNullCondExpr(col 27:boolean, null, col 
32:bigint)(children: LongColEqualLongScalar(col 11:bigint, val 1) -> 
27:boolean, LongColSubtractLongScalar(col 11:bigint, val 1) -> 32:bigint) -> 
33:bigint) -> 31:double, DoubleColUnaryMinus(col 30:double)(children: 
DoubleColSubtractDoubleColumn(col 1:double, col 2:double)(children: col 
1:float) -> 30:double) -> 34:double
-                  Statistics: Num rows: 303 Data size: 65146 Basic stats: 
COMPLETE Column stats: NONE
+                  Statistics: Num rows: 303 Data size: 71705 Basic stats: 
COMPLETE Column stats: NONE
                   Reduce Output Operator
                     key expressions: _col2 (type: string), _col1 (type: 
float), _col4 (type: double), _col0 (type: timestamp)
                     sort order: ++++
@@ -194,7 +194,7 @@ STAGE PLANS:
                         native: true
                         nativeConditionsMet: 
hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine 
spark IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS 
true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true
                         valueColumnNums: [4, 12, 14, 13, 15, 8, 19, 20, 21, 
22, 11, 24, 25, 23, 29, 28, 31, 34]
-                    Statistics: Num rows: 303 Data size: 65146 Basic stats: 
COMPLETE Column stats: NONE
+                    Statistics: Num rows: 303 Data size: 71705 Basic stats: 
COMPLETE Column stats: NONE
                     value expressions: _col3 (type: boolean), _col5 (type: 
double), _col6 (type: double), _col7 (type: double), _col8 (type: float), _col9 
(type: float), _col10 (type: float), _col11 (type: float), _col12 (type: 
double), _col13 (type: double), _col14 (type: bigint), _col15 (type: double), 
_col16 (type: double), _col17 (type: double), _col18 (type: double), _col19 
(type: double), _col20 (type: double), _col21 (type: double)
         Reducer 3 
             Execution mode: vectorized
@@ -219,13 +219,13 @@ STAGE PLANS:
                     className: VectorSelectOperator
                     native: true
                     projectedOutputColumnNums: [3, 1, 0, 4, 2, 5, 6, 7, 8, 9, 
10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21]
-                Statistics: Num rows: 303 Data size: 65146 Basic stats: 
COMPLETE Column stats: NONE
+                Statistics: Num rows: 303 Data size: 71705 Basic stats: 
COMPLETE Column stats: NONE
                 File Output Operator
                   compressed: false
                   File Sink Vectorization:
                       className: VectorFileSinkOperator
                       native: false
-                  Statistics: Num rows: 303 Data size: 65146 Basic stats: 
COMPLETE Column stats: NONE
+                  Statistics: Num rows: 303 Data size: 71705 Basic stats: 
COMPLETE Column stats: NONE
                   table:
                       input format: 
org.apache.hadoop.mapred.SequenceFileInputFormat
                       output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat

http://git-wip-us.apache.org/repos/asf/hive/blob/76148bb6/ql/src/test/results/clientpositive/spark/vectorization_15.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/spark/vectorization_15.q.out 
b/ql/src/test/results/clientpositive/spark/vectorization_15.q.out
index d0b03b3..5d51c87 100644
--- a/ql/src/test/results/clientpositive/spark/vectorization_15.q.out
+++ b/ql/src/test/results/clientpositive/spark/vectorization_15.q.out
@@ -80,7 +80,7 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: alltypesorc
-                  Statistics: Num rows: 12288 Data size: 2641964 Basic stats: 
COMPLETE Column stats: NONE
+                  Statistics: Num rows: 12288 Data size: 2907994 Basic stats: 
COMPLETE Column stats: NONE
                   TableScan Vectorization:
                       native: true
                       vectorizationSchemaColumns: [0:ctinyint:tinyint, 
1:csmallint:smallint, 2:cint:int, 3:cbigint:bigint, 4:cfloat:float, 
5:cdouble:double, 6:cstring1:string, 7:cstring2:string, 
8:ctimestamp1:timestamp, 9:ctimestamp2:timestamp, 10:cboolean1:boolean, 
11:cboolean2:boolean, 
12:ROW__ID:struct<writeid:bigint,bucketid:int,rowid:bigint>]
@@ -90,7 +90,7 @@ STAGE PLANS:
                         native: true
                         predicateExpression: FilterExprOrExpr(children: 
FilterStringColLikeStringScalar(col 7:string, pattern %ss%), 
FilterStringColLikeStringScalar(col 6:string, pattern 10%), 
FilterExprAndExpr(children: FilterLongColGreaterEqualLongScalar(col 2:int, val 
-75), FilterLongColEqualLongColumn(col 0:smallint, col 1:smallint)(children: 
col 0:tinyint), FilterDoubleColGreaterEqualDoubleScalar(col 5:double, val 
-3728.0)))
                     predicate: (((cint >= -75) and (UDFToShort(ctinyint) = 
csmallint) and (cdouble >= -3728.0D)) or (cstring1 like '10%') or (cstring2 
like '%ss%')) (type: boolean)
-                    Statistics: Num rows: 12288 Data size: 2641964 Basic 
stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 12288 Data size: 2907994 Basic 
stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: cfloat (type: float), cboolean1 (type: 
boolean), cdouble (type: double), cstring1 (type: string), ctinyint (type: 
tinyint), cint (type: int), ctimestamp1 (type: timestamp), UDFToDouble(cfloat) 
(type: double), (UDFToDouble(cfloat) * UDFToDouble(cfloat)) (type: double), 
UDFToDouble(ctinyint) (type: double), (UDFToDouble(ctinyint) * 
UDFToDouble(ctinyint)) (type: double), UDFToDouble(cint) (type: double), 
(UDFToDouble(cint) * UDFToDouble(cint)) (type: double)
                       outputColumnNames: _col0, _col1, _col2, _col3, _col4, 
_col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12
@@ -99,7 +99,7 @@ STAGE PLANS:
                           native: true
                           projectedOutputColumnNums: [4, 10, 5, 6, 0, 2, 8, 4, 
13, 14, 17, 15, 19]
                           selectExpressions: DoubleColMultiplyDoubleColumn(col 
4:double, col 4:double)(children: col 4:float, col 4:float) -> 13:double, 
CastLongToDouble(col 0:tinyint) -> 14:double, DoubleColMultiplyDoubleColumn(col 
15:double, col 16:double)(children: CastLongToDouble(col 0:tinyint) -> 
15:double, CastLongToDouble(col 0:tinyint) -> 16:double) -> 17:double, 
CastLongToDouble(col 2:int) -> 15:double, DoubleColMultiplyDoubleColumn(col 
16:double, col 18:double)(children: CastLongToDouble(col 2:int) -> 16:double, 
CastLongToDouble(col 2:int) -> 18:double) -> 19:double
-                      Statistics: Num rows: 12288 Data size: 2641964 Basic 
stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 12288 Data size: 2907994 Basic 
stats: COMPLETE Column stats: NONE
                       Group By Operator
                         aggregations: sum(_col8), sum(_col7), count(_col0), 
min(_col2), sum(_col10), sum(_col9), count(_col4), sum(_col12), sum(_col11), 
count(_col5)
                         Group By Vectorization:
@@ -113,7 +113,7 @@ STAGE PLANS:
                         keys: _col0 (type: float), _col1 (type: boolean), 
_col2 (type: double), _col3 (type: string), _col4 (type: tinyint), _col5 (type: 
int), _col6 (type: timestamp)
                         mode: hash
                         outputColumnNames: _col0, _col1, _col2, _col3, _col4, 
_col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, 
_col15, _col16
-                        Statistics: Num rows: 12288 Data size: 2641964 Basic 
stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 12288 Data size: 2907994 Basic 
stats: COMPLETE Column stats: NONE
                         Reduce Output Operator
                           key expressions: _col0 (type: float), _col1 (type: 
boolean), _col2 (type: double), _col3 (type: string), _col4 (type: tinyint), 
_col5 (type: int), _col6 (type: timestamp)
                           sort order: +++++++
@@ -124,7 +124,7 @@ STAGE PLANS:
                               native: true
                               nativeConditionsMet: 
hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine 
spark IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS 
true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true
                               valueColumnNums: [7, 8, 9, 10, 11, 12, 13, 14, 
15, 16]
-                          Statistics: Num rows: 12288 Data size: 2641964 Basic 
stats: COMPLETE Column stats: NONE
+                          Statistics: Num rows: 12288 Data size: 2907994 Basic 
stats: COMPLETE Column stats: NONE
                           value expressions: _col7 (type: double), _col8 
(type: double), _col9 (type: bigint), _col10 (type: double), _col11 (type: 
double), _col12 (type: double), _col13 (type: bigint), _col14 (type: double), 
_col15 (type: double), _col16 (type: bigint)
             Execution mode: vectorized
             Map Vectorization:
@@ -153,15 +153,15 @@ STAGE PLANS:
                 keys: KEY._col0 (type: float), KEY._col1 (type: boolean), 
KEY._col2 (type: double), KEY._col3 (type: string), KEY._col4 (type: tinyint), 
KEY._col5 (type: int), KEY._col6 (type: timestamp)
                 mode: mergepartial
                 outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, 
_col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, 
_col16
-                Statistics: Num rows: 6144 Data size: 1320982 Basic stats: 
COMPLETE Column stats: NONE
+                Statistics: Num rows: 6144 Data size: 1453997 Basic stats: 
COMPLETE Column stats: NONE
                 Select Operator
                   expressions: _col0 (type: float), _col1 (type: boolean), 
_col2 (type: double), _col3 (type: string), _col4 (type: tinyint), _col5 (type: 
int), _col6 (type: timestamp), power(((_col7 - ((_col8 * _col8) / _col9)) / 
CASE WHEN ((_col9 = 1L)) THEN (null) ELSE ((_col9 - 1)) END), 0.5) (type: 
double), (-26.28 - CAST( _col5 AS decimal(10,0))) (type: decimal(13,2)), _col10 
(type: double), (_col2 * 79.553D) (type: double), (33.0 % _col0) (type: float), 
power(((_col11 - ((_col12 * _col12) / _col13)) / CASE WHEN ((_col13 = 1L)) THEN 
(null) ELSE ((_col13 - 1)) END), 0.5) (type: double), ((_col11 - ((_col12 * 
_col12) / _col13)) / _col13) (type: double), (-23.0D % _col2) (type: double), 
(- _col4) (type: tinyint), ((_col14 - ((_col15 * _col15) / _col16)) / CASE WHEN 
((_col16 = 1L)) THEN (null) ELSE ((_col16 - 1)) END) (type: double), 
(UDFToFloat(_col5) - _col0) (type: float), (-23 % UDFToInteger(_col4)) (type: 
int), (- (-26.28 - CAST( _col5 AS decimal(10,0)))) (type: decimal(13,2)
 ), power(((_col14 - ((_col15 * _col15) / _col16)) / _col16), 0.5) (type: 
double)
                   outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, 
_col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, 
_col16, _col17, _col18, _col19, _col20
-                  Statistics: Num rows: 6144 Data size: 1320982 Basic stats: 
COMPLETE Column stats: NONE
+                  Statistics: Num rows: 6144 Data size: 1453997 Basic stats: 
COMPLETE Column stats: NONE
                   Reduce Output Operator
                     key expressions: _col0 (type: float), _col1 (type: 
boolean), _col2 (type: double), _col3 (type: string), _col4 (type: tinyint), 
_col5 (type: int), _col6 (type: timestamp)
                     sort order: +++++++
-                    Statistics: Num rows: 6144 Data size: 1320982 Basic stats: 
COMPLETE Column stats: NONE
+                    Statistics: Num rows: 6144 Data size: 1453997 Basic stats: 
COMPLETE Column stats: NONE
                     value expressions: _col7 (type: double), _col8 (type: 
decimal(13,2)), _col9 (type: double), _col10 (type: double), _col11 (type: 
float), _col12 (type: double), _col13 (type: double), _col14 (type: double), 
_col15 (type: tinyint), _col16 (type: double), _col17 (type: float), _col18 
(type: int), _col19 (type: decimal(13,2)), _col20 (type: double)
         Reducer 3 
             Reduce Vectorization:
@@ -172,10 +172,10 @@ STAGE PLANS:
               Select Operator
                 expressions: KEY.reducesinkkey0 (type: float), 
KEY.reducesinkkey1 (type: boolean), KEY.reducesinkkey2 (type: double), 
KEY.reducesinkkey3 (type: string), KEY.reducesinkkey4 (type: tinyint), 
KEY.reducesinkkey5 (type: int), KEY.reducesinkkey6 (type: timestamp), 
VALUE._col0 (type: double), VALUE._col1 (type: decimal(13,2)), VALUE._col2 
(type: double), VALUE._col3 (type: double), VALUE._col4 (type: float), 
VALUE._col5 (type: double), VALUE._col6 (type: double), VALUE._col7 (type: 
double), VALUE._col8 (type: tinyint), VALUE._col9 (type: double), VALUE._col10 
(type: float), VALUE._col11 (type: int), VALUE._col12 (type: decimal(13,2)), 
VALUE._col13 (type: double)
                 outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, 
_col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, 
_col16, _col17, _col18, _col19, _col20
-                Statistics: Num rows: 6144 Data size: 1320982 Basic stats: 
COMPLETE Column stats: NONE
+                Statistics: Num rows: 6144 Data size: 1453997 Basic stats: 
COMPLETE Column stats: NONE
                 File Output Operator
                   compressed: false
-                  Statistics: Num rows: 6144 Data size: 1320982 Basic stats: 
COMPLETE Column stats: NONE
+                  Statistics: Num rows: 6144 Data size: 1453997 Basic stats: 
COMPLETE Column stats: NONE
                   table:
                       input format: 
org.apache.hadoop.mapred.SequenceFileInputFormat
                       output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat

http://git-wip-us.apache.org/repos/asf/hive/blob/76148bb6/ql/src/test/results/clientpositive/spark/vectorization_16.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/spark/vectorization_16.q.out 
b/ql/src/test/results/clientpositive/spark/vectorization_16.q.out
index 8798ebe..56bbb89 100644
--- a/ql/src/test/results/clientpositive/spark/vectorization_16.q.out
+++ b/ql/src/test/results/clientpositive/spark/vectorization_16.q.out
@@ -57,7 +57,7 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: alltypesorc
-                  Statistics: Num rows: 12288 Data size: 2641964 Basic stats: 
COMPLETE Column stats: NONE
+                  Statistics: Num rows: 12288 Data size: 2907994 Basic stats: 
COMPLETE Column stats: NONE
                   TableScan Vectorization:
                       native: true
                       vectorizationSchemaColumns: [0:ctinyint:tinyint, 
1:csmallint:smallint, 2:cint:int, 3:cbigint:bigint, 4:cfloat:float, 
5:cdouble:double, 6:cstring1:string, 7:cstring2:string, 
8:ctimestamp1:timestamp, 9:ctimestamp2:timestamp, 10:cboolean1:boolean, 
11:cboolean2:boolean, 
12:ROW__ID:struct<writeid:bigint,bucketid:int,rowid:bigint>]
@@ -67,7 +67,7 @@ STAGE PLANS:
                         native: true
                         predicateExpression: FilterExprAndExpr(children: 
FilterStringColLikeStringScalar(col 7:string, pattern %b%), 
FilterExprOrExpr(children: FilterDoubleColGreaterEqualDoubleScalar(col 
5:double, val -1.389), FilterStringGroupColLessStringScalar(col 6:string, val 
a)))
                     predicate: (((cdouble >= -1.389D) or (cstring1 < 'a')) and 
(cstring2 like '%b%')) (type: boolean)
-                    Statistics: Num rows: 4096 Data size: 880654 Basic stats: 
COMPLETE Column stats: NONE
+                    Statistics: Num rows: 4096 Data size: 969331 Basic stats: 
COMPLETE Column stats: NONE
                     Select Operator
                       expressions: cstring1 (type: string), cdouble (type: 
double), ctimestamp1 (type: timestamp), (cdouble * cdouble) (type: double)
                       outputColumnNames: _col0, _col1, _col2, _col3
@@ -76,7 +76,7 @@ STAGE PLANS:
                           native: true
                           projectedOutputColumnNums: [6, 5, 8, 13]
                           selectExpressions: DoubleColMultiplyDoubleColumn(col 
5:double, col 5:double) -> 13:double
-                      Statistics: Num rows: 4096 Data size: 880654 Basic 
stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 4096 Data size: 969331 Basic 
stats: COMPLETE Column stats: NONE
                       Group By Operator
                         aggregations: count(_col1), sum(_col3), sum(_col1), 
min(_col1)
                         Group By Vectorization:
@@ -90,7 +90,7 @@ STAGE PLANS:
                         keys: _col0 (type: string), _col1 (type: double), 
_col2 (type: timestamp)
                         mode: hash
                         outputColumnNames: _col0, _col1, _col2, _col3, _col4, 
_col5, _col6
-                        Statistics: Num rows: 4096 Data size: 880654 Basic 
stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 4096 Data size: 969331 Basic 
stats: COMPLETE Column stats: NONE
                         Reduce Output Operator
                           key expressions: _col0 (type: string), _col1 (type: 
double), _col2 (type: timestamp)
                           sort order: +++
@@ -101,7 +101,7 @@ STAGE PLANS:
                               native: true
                               nativeConditionsMet: 
hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine 
spark IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS 
true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true
                               valueColumnNums: [3, 4, 5, 6]
-                          Statistics: Num rows: 4096 Data size: 880654 Basic 
stats: COMPLETE Column stats: NONE
+                          Statistics: Num rows: 4096 Data size: 969331 Basic 
stats: COMPLETE Column stats: NONE
                           value expressions: _col3 (type: bigint), _col4 
(type: double), _col5 (type: double), _col6 (type: double)
             Execution mode: vectorized
             Map Vectorization:
@@ -148,7 +148,7 @@ STAGE PLANS:
                 keys: KEY._col0 (type: string), KEY._col1 (type: double), 
KEY._col2 (type: timestamp)
                 mode: mergepartial
                 outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, 
_col6
-                Statistics: Num rows: 2048 Data size: 440327 Basic stats: 
COMPLETE Column stats: NONE
+                Statistics: Num rows: 2048 Data size: 484665 Basic stats: 
COMPLETE Column stats: NONE
                 Select Operator
                   expressions: _col0 (type: string), _col1 (type: double), 
_col2 (type: timestamp), (_col1 - 9763215.5639D) (type: double), (- (_col1 - 
9763215.5639D)) (type: double), _col3 (type: bigint), power(((_col4 - ((_col5 * 
_col5) / _col3)) / CASE WHEN ((_col3 = 1L)) THEN (null) ELSE ((_col3 - 1)) 
END), 0.5) (type: double), (- power(((_col4 - ((_col5 * _col5) / _col3)) / CASE 
WHEN ((_col3 = 1L)) THEN (null) ELSE ((_col3 - 1)) END), 0.5)) (type: double), 
(power(((_col4 - ((_col5 * _col5) / _col3)) / CASE WHEN ((_col3 = 1L)) THEN 
(null) ELSE ((_col3 - 1)) END), 0.5) * UDFToDouble(_col3)) (type: double), 
_col6 (type: double), (9763215.5639D / _col1) (type: double), (CAST( _col3 AS 
decimal(19,0)) / -1.389) (type: decimal(28,6)), power(((_col4 - ((_col5 * 
_col5) / _col3)) / CASE WHEN ((_col3 = 1L)) THEN (null) ELSE ((_col3 - 1)) 
END), 0.5) (type: double)
                   outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, 
_col6, _col7, _col8, _col9, _col10, _col11, _col12
@@ -157,13 +157,13 @@ STAGE PLANS:
                       native: true
                       projectedOutputColumnNums: [0, 1, 2, 7, 9, 3, 8, 14, 20, 
6, 10, 22, 17]
                       selectExpressions: DoubleColSubtractDoubleScalar(col 
1:double, val 9763215.5639) -> 7:double, DoubleColUnaryMinus(col 
8:double)(children: DoubleColSubtractDoubleScalar(col 1:double, val 
9763215.5639) -> 8:double) -> 9:double, FuncPowerDoubleToDouble(col 
10:double)(children: DoubleColDivideLongColumn(col 8:double, col 
13:bigint)(children: DoubleColSubtractDoubleColumn(col 4:double, col 
10:double)(children: DoubleColDivideLongColumn(col 8:double, col 
3:bigint)(children: DoubleColMultiplyDoubleColumn(col 5:double, col 5:double) 
-> 8:double) -> 10:double) -> 8:double, IfExprNullCondExpr(col 11:boolean, 
null, col 12:bigint)(children: LongColEqualLongScalar(col 3:bigint, val 1) -> 
11:boolean, LongColSubtractLongScalar(col 3:bigint, val 1) -> 12:bigint) -> 
13:bigint) -> 10:double) -> 8:double, DoubleColUnaryMinus(col 
10:double)(children: FuncPowerDoubleToDouble(col 14:double)(children: 
DoubleColDivideLongColumn(col 10:double, col 16:bigint)(children: 
DoubleColSubtract
 DoubleColumn(col 4:double, col 14:double)(children: 
DoubleColDivideLongColumn(col 10:double, col 3:bigint)(children: 
DoubleColMultiplyDoubleColumn(col 5:double, col 5:double) -> 10:double) -> 
14:double) -> 10:double, IfExprNullCondExpr(col 13:boolean, null, col 
15:bigint)(children: LongColEqualLongScalar(col 3:bigint, val 1) -> 13:boolean, 
LongColSubtractLongScalar(col 3:bigint, val 1) -> 15:bigint) -> 16:bigint) -> 
14:double) -> 10:double) -> 14:double, DoubleColMultiplyDoubleColumn(col 
10:double, col 17:double)(children: FuncPowerDoubleToDouble(col 
17:double)(children: DoubleColDivideLongColumn(col 10:double, col 
19:bigint)(children: DoubleColSubtractDoubleColumn(col 4:double, col 
17:double)(children: DoubleColDivideLongColumn(col 10:double, col 
3:bigint)(children: DoubleColMultiplyDoubleColumn(col 5:double, col 5:double) 
-> 10:double) -> 17:double) -> 10:double, IfExprNullCondExpr(col 16:boolean, 
null, col 18:bigint)(children: LongColEqualLongScalar(col 3:bigint, val 1) -> 
16:boo
 lean, LongColSubtractLongScalar(col 3:bigint, val 1) -> 18:bigint) -> 
19:bigint) -> 17:double) -> 10:double, CastLongToDouble(col 3:bigint) -> 
17:double) -> 20:double, DoubleScalarDivideDoubleColumn(val 9763215.5639, col 
1:double) -> 10:double, DecimalColDivideDecimalScalar(col 21:decimal(19,0), val 
-1.389)(children: CastLongToDecimal(col 3:bigint) -> 21:decimal(19,0)) -> 
22:decimal(28,6), FuncPowerDoubleToDouble(col 23:double)(children: 
DoubleColDivideLongColumn(col 17:double, col 25:bigint)(children: 
DoubleColSubtractDoubleColumn(col 4:double, col 23:double)(children: 
DoubleColDivideLongColumn(col 17:double, col 3:bigint)(children: 
DoubleColMultiplyDoubleColumn(col 5:double, col 5:double) -> 17:double) -> 
23:double) -> 17:double, IfExprNullCondExpr(col 19:boolean, null, col 
24:bigint)(children: LongColEqualLongScalar(col 3:bigint, val 1) -> 19:boolean, 
LongColSubtractLongScalar(col 3:bigint, val 1) -> 24:bigint) -> 25:bigint) -> 
23:double) -> 17:double
-                  Statistics: Num rows: 2048 Data size: 440327 Basic stats: 
COMPLETE Column stats: NONE
+                  Statistics: Num rows: 2048 Data size: 484665 Basic stats: 
COMPLETE Column stats: NONE
                   File Output Operator
                     compressed: false
                     File Sink Vectorization:
                         className: VectorFileSinkOperator
                         native: false
-                    Statistics: Num rows: 2048 Data size: 440327 Basic stats: 
COMPLETE Column stats: NONE
+                    Statistics: Num rows: 2048 Data size: 484665 Basic stats: 
COMPLETE Column stats: NONE
                     table:
                         input format: 
org.apache.hadoop.mapred.SequenceFileInputFormat
                         output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat

http://git-wip-us.apache.org/repos/asf/hive/blob/76148bb6/ql/src/test/results/clientpositive/spark/vectorization_17.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/spark/vectorization_17.q.out 
b/ql/src/test/results/clientpositive/spark/vectorization_17.q.out
index c333ab1..1877fb3 100644
--- a/ql/src/test/results/clientpositive/spark/vectorization_17.q.out
+++ b/ql/src/test/results/clientpositive/spark/vectorization_17.q.out
@@ -65,7 +65,7 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: alltypesorc
-                  Statistics: Num rows: 12288 Data size: 2641964 Basic stats: 
COMPLETE Column stats: NONE
+                  Statistics: Num rows: 12288 Data size: 2907994 Basic stats: 
COMPLETE Column stats: NONE
                   TableScan Vectorization:
                       native: true
                       vectorizationSchemaColumns: [0:ctinyint:tinyint, 
1:csmallint:smallint, 2:cint:int, 3:cbigint:bigint, 4:cfloat:float, 
5:cdouble:double, 6:cstring1:string, 7:cstring2:string, 
8:ctimestamp1:timestamp, 9:ctimestamp2:timestamp, 10:cboolean1:boolean, 
11:cboolean2:boolean, 
12:ROW__ID:struct<writeid:bigint,bucketid:int,rowid:bigint>]
@@ -75,7 +75,7 @@ STAGE PLANS:
                         native: true
                         predicateExpression: FilterExprAndExpr(children: 
FilterLongColGreaterLongScalar(col 3:bigint, val -23), 
FilterExprOrExpr(children: FilterDoubleColNotEqualDoubleScalar(col 5:double, 
val 988888.0), FilterDecimalColGreaterDecimalScalar(col 13:decimal(13,3), val 
-863.257)(children: CastLongToDecimal(col 2:int) -> 13:decimal(13,3))), 
FilterExprOrExpr(children: FilterLongColGreaterEqualLongScalar(col 0:tinyint, 
val 33), FilterLongColGreaterEqualLongColumn(col 1:bigint, col 
3:bigint)(children: col 1:smallint), FilterDoubleColEqualDoubleColumn(col 
4:double, col 5:double)(children: col 4:float)))
                     predicate: (((cdouble <> 988888.0D) or (CAST( cint AS 
decimal(13,3)) > -863.257)) and ((ctinyint >= 33Y) or (UDFToLong(csmallint) >= 
cbigint) or (UDFToDouble(cfloat) = cdouble)) and (cbigint > -23L)) (type: 
boolean)
-                    Statistics: Num rows: 4096 Data size: 880654 Basic stats: 
COMPLETE Column stats: NONE
+                    Statistics: Num rows: 4096 Data size: 969331 Basic stats: 
COMPLETE Column stats: NONE
                     Select Operator
                       expressions: cfloat (type: float), cstring1 (type: 
string), cint (type: int), ctimestamp1 (type: timestamp), cdouble (type: 
double), cbigint (type: bigint), (UDFToDouble(cfloat) / UDFToDouble(ctinyint)) 
(type: double), (UDFToLong(cint) % cbigint) (type: bigint), (- cdouble) (type: 
double), (cdouble + (UDFToDouble(cfloat) / UDFToDouble(ctinyint))) (type: 
double), (cdouble / UDFToDouble(cint)) (type: double), (- (- cdouble)) (type: 
double), (9763215.5639 % CAST( cbigint AS decimal(19,0))) (type: 
decimal(11,4)), (2563.58D + (- (- cdouble))) (type: double)
                       outputColumnNames: _col0, _col1, _col2, _col3, _col4, 
_col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13
@@ -84,7 +84,7 @@ STAGE PLANS:
                           native: true
                           projectedOutputColumnNums: [4, 6, 2, 8, 5, 3, 15, 
16, 14, 17, 19, 20, 22, 18]
                           selectExpressions: DoubleColDivideDoubleColumn(col 
4:double, col 14:double)(children: col 4:float, CastLongToDouble(col 0:tinyint) 
-> 14:double) -> 15:double, LongColModuloLongColumn(col 2:bigint, col 
3:bigint)(children: col 2:int) -> 16:bigint, DoubleColUnaryMinus(col 5:double) 
-> 14:double, DoubleColAddDoubleColumn(col 5:double, col 18:double)(children: 
DoubleColDivideDoubleColumn(col 4:double, col 17:double)(children: col 4:float, 
CastLongToDouble(col 0:tinyint) -> 17:double) -> 18:double) -> 17:double, 
DoubleColDivideDoubleColumn(col 5:double, col 18:double)(children: 
CastLongToDouble(col 2:int) -> 18:double) -> 19:double, DoubleColUnaryMinus(col 
18:double)(children: DoubleColUnaryMinus(col 5:double) -> 18:double) -> 
20:double, DecimalScalarModuloDecimalColumn(val 9763215.5639, col 
21:decimal(19,0))(children: CastLongToDecimal(col 3:bigint) -> 
21:decimal(19,0)) -> 22:decimal(11,4), DoubleScalarAddDoubleColumn(val 2563.58, 
col 23:double)(children: Double
 ColUnaryMinus(col 18:double)(children: DoubleColUnaryMinus(col 5:double) -> 
18:double) -> 23:double) -> 18:double
-                      Statistics: Num rows: 4096 Data size: 880654 Basic 
stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 4096 Data size: 969331 Basic 
stats: COMPLETE Column stats: NONE
                       Reduce Output Operator
                         key expressions: _col5 (type: bigint), _col0 (type: 
float)
                         sort order: ++
@@ -94,7 +94,7 @@ STAGE PLANS:
                             native: true
                             nativeConditionsMet: 
hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine 
spark IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS 
true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true
                             valueColumnNums: [6, 2, 8, 5, 15, 16, 14, 17, 19, 
20, 22, 18]
-                        Statistics: Num rows: 4096 Data size: 880654 Basic 
stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 4096 Data size: 969331 Basic 
stats: COMPLETE Column stats: NONE
                         value expressions: _col1 (type: string), _col2 (type: 
int), _col3 (type: timestamp), _col4 (type: double), _col6 (type: double), 
_col7 (type: bigint), _col8 (type: double), _col9 (type: double), _col10 (type: 
double), _col11 (type: double), _col12 (type: decimal(11,4)), _col13 (type: 
double)
             Execution mode: vectorized
             Map Vectorization:
@@ -135,13 +135,13 @@ STAGE PLANS:
                     className: VectorSelectOperator
                     native: true
                     projectedOutputColumnNums: [1, 2, 3, 4, 5, 0, 6, 7, 8, 9, 
10, 11, 12, 13]
-                Statistics: Num rows: 4096 Data size: 880654 Basic stats: 
COMPLETE Column stats: NONE
+                Statistics: Num rows: 4096 Data size: 969331 Basic stats: 
COMPLETE Column stats: NONE
                 File Output Operator
                   compressed: false
                   File Sink Vectorization:
                       className: VectorFileSinkOperator
                       native: false
-                  Statistics: Num rows: 4096 Data size: 880654 Basic stats: 
COMPLETE Column stats: NONE
+                  Statistics: Num rows: 4096 Data size: 969331 Basic stats: 
COMPLETE Column stats: NONE
                   table:
                       input format: 
org.apache.hadoop.mapred.SequenceFileInputFormat
                       output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat

http://git-wip-us.apache.org/repos/asf/hive/blob/76148bb6/ql/src/test/results/clientpositive/spark/vectorization_2.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/spark/vectorization_2.q.out 
b/ql/src/test/results/clientpositive/spark/vectorization_2.q.out
index 99afc2b..1af403a 100644
--- a/ql/src/test/results/clientpositive/spark/vectorization_2.q.out
+++ b/ql/src/test/results/clientpositive/spark/vectorization_2.q.out
@@ -63,7 +63,7 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: alltypesorc
-                  Statistics: Num rows: 12288 Data size: 2641964 Basic stats: 
COMPLETE Column stats: NONE
+                  Statistics: Num rows: 12288 Data size: 2907994 Basic stats: 
COMPLETE Column stats: NONE
                   TableScan Vectorization:
                       native: true
                       vectorizationSchemaColumns: [0:ctinyint:tinyint, 
1:csmallint:smallint, 2:cint:int, 3:cbigint:bigint, 4:cfloat:float, 
5:cdouble:double, 6:cstring1:string, 7:cstring2:string, 
8:ctimestamp1:timestamp, 9:ctimestamp2:timestamp, 10:cboolean1:boolean, 
11:cboolean2:boolean, 
12:ROW__ID:struct<writeid:bigint,bucketid:int,rowid:bigint>]
@@ -73,7 +73,7 @@ STAGE PLANS:
                         native: true
                         predicateExpression: FilterExprOrExpr(children: 
FilterExprAndExpr(children: FilterTimestampColLessTimestampColumn(col 
8:timestamp, col 9:timestamp), FilterStringColLikeStringScalar(col 7:string, 
pattern b%), FilterDoubleColLessEqualDoubleScalar(col 4:float, val 
-5638.14990234375)), FilterExprAndExpr(children: 
FilterDoubleColLessDoubleColumn(col 5:double, col 13:double)(children: 
CastLongToDouble(col 0:tinyint) -> 13:double), FilterExprOrExpr(children: 
FilterDoubleColNotEqualDoubleScalar(col 13:double, val -10669.0)(children: 
CastTimestampToDouble(col 9:timestamp) -> 13:double), 
FilterLongColLessLongScalar(col 2:int, val 359))))
                     predicate: (((cdouble < UDFToDouble(ctinyint)) and 
((UDFToDouble(ctimestamp2) <> -10669.0D) or (cint < 359))) or ((ctimestamp1 < 
ctimestamp2) and (cstring2 like 'b%') and (cfloat <= -5638.15))) (type: boolean)
-                    Statistics: Num rows: 4778 Data size: 1027287 Basic stats: 
COMPLETE Column stats: NONE
+                    Statistics: Num rows: 4778 Data size: 1130728 Basic stats: 
COMPLETE Column stats: NONE
                     Select Operator
                       expressions: csmallint (type: smallint), cfloat (type: 
float), cbigint (type: bigint), ctinyint (type: tinyint), cdouble (type: 
double), UDFToDouble(cbigint) (type: double), (UDFToDouble(cbigint) * 
UDFToDouble(cbigint)) (type: double)
                       outputColumnNames: _col0, _col1, _col2, _col3, _col4, 
_col5, _col6
@@ -82,7 +82,7 @@ STAGE PLANS:
                           native: true
                           projectedOutputColumnNums: [1, 4, 3, 0, 5, 13, 16]
                           selectExpressions: CastLongToDouble(col 3:bigint) -> 
13:double, DoubleColMultiplyDoubleColumn(col 14:double, col 
15:double)(children: CastLongToDouble(col 3:bigint) -> 14:double, 
CastLongToDouble(col 3:bigint) -> 15:double) -> 16:double
-                      Statistics: Num rows: 4778 Data size: 1027287 Basic 
stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 4778 Data size: 1130728 Basic 
stats: COMPLETE Column stats: NONE
                       Group By Operator
                         aggregations: sum(_col0), count(_col0), sum(_col1), 
sum(_col6), sum(_col5), count(_col2), count(), min(_col3), sum(_col4), 
count(_col4)
                         Group By Vectorization:

http://git-wip-us.apache.org/repos/asf/hive/blob/76148bb6/ql/src/test/results/clientpositive/spark/vectorization_3.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/spark/vectorization_3.q.out 
b/ql/src/test/results/clientpositive/spark/vectorization_3.q.out
index 2bccf64..51d04cc 100644
--- a/ql/src/test/results/clientpositive/spark/vectorization_3.q.out
+++ b/ql/src/test/results/clientpositive/spark/vectorization_3.q.out
@@ -68,7 +68,7 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: alltypesorc
-                  Statistics: Num rows: 12288 Data size: 2641964 Basic stats: 
COMPLETE Column stats: NONE
+                  Statistics: Num rows: 12288 Data size: 2907994 Basic stats: 
COMPLETE Column stats: NONE
                   TableScan Vectorization:
                       native: true
                       vectorizationSchemaColumns: [0:ctinyint:tinyint, 
1:csmallint:smallint, 2:cint:int, 3:cbigint:bigint, 4:cfloat:float, 
5:cdouble:double, 6:cstring1:string, 7:cstring2:string, 
8:ctimestamp1:timestamp, 9:ctimestamp2:timestamp, 10:cboolean1:boolean, 
11:cboolean2:boolean, 
12:ROW__ID:struct<writeid:bigint,bucketid:int,rowid:bigint>]
@@ -78,7 +78,7 @@ STAGE PLANS:
                         native: true
                         predicateExpression: FilterExprOrExpr(children: 
FilterExprAndExpr(children: FilterDoubleColLessEqualDoubleColumn(col 13:float, 
col 4:float)(children: CastLongToFloatViaLongToDouble(col 2:int) -> 13:float), 
FilterDecimalColNotEqualDecimalScalar(col 14:decimal(22,3), val 
79.553)(children: CastLongToDecimal(col 3:bigint) -> 14:decimal(22,3)), 
FilterDoubleColEqualDoubleScalar(col 13:double, val -29071.0)(children: 
CastTimestampToDouble(col 9:timestamp) -> 13:double)), 
FilterExprAndExpr(children: FilterDoubleColGreaterDoubleColumn(col 13:double, 
col 5:double)(children: CastLongToDouble(col 3:bigint) -> 13:double), 
FilterDecimalColGreaterEqualDecimalScalar(col 15:decimal(8,3), val 
79.553)(children: CastLongToDecimal(col 1:smallint) -> 15:decimal(8,3)), 
FilterTimestampColGreaterTimestampColumn(col 8:timestamp, col 9:timestamp)))
                     predicate: (((UDFToDouble(cbigint) > cdouble) and (CAST( 
csmallint AS decimal(8,3)) >= 79.553) and (ctimestamp1 > ctimestamp2)) or 
((UDFToFloat(cint) <= cfloat) and (CAST( cbigint AS decimal(22,3)) <> 79.553) 
and (UDFToDouble(ctimestamp2) = -29071.0D))) (type: boolean)
-                    Statistics: Num rows: 2503 Data size: 538153 Basic stats: 
COMPLETE Column stats: NONE
+                    Statistics: Num rows: 2503 Data size: 592342 Basic stats: 
COMPLETE Column stats: NONE
                     Select Operator
                       expressions: csmallint (type: smallint), ctinyint (type: 
tinyint), cfloat (type: float), cint (type: int), UDFToDouble(csmallint) (type: 
double), (UDFToDouble(csmallint) * UDFToDouble(csmallint)) (type: double), 
UDFToDouble(ctinyint) (type: double), (UDFToDouble(ctinyint) * 
UDFToDouble(ctinyint)) (type: double), UDFToDouble(cfloat) (type: double), 
(UDFToDouble(cfloat) * UDFToDouble(cfloat)) (type: double), UDFToDouble(cint) 
(type: double), (UDFToDouble(cint) * UDFToDouble(cint)) (type: double)
                       outputColumnNames: _col0, _col1, _col2, _col3, _col4, 
_col5, _col6, _col7, _col8, _col9, _col10, _col11
@@ -87,7 +87,7 @@ STAGE PLANS:
                           native: true
                           projectedOutputColumnNums: [1, 0, 4, 2, 13, 18, 16, 
20, 4, 17, 19, 23]
                           selectExpressions: CastLongToDouble(col 1:smallint) 
-> 13:double, DoubleColMultiplyDoubleColumn(col 16:double, col 
17:double)(children: CastLongToDouble(col 1:smallint) -> 16:double, 
CastLongToDouble(col 1:smallint) -> 17:double) -> 18:double, 
CastLongToDouble(col 0:tinyint) -> 16:double, DoubleColMultiplyDoubleColumn(col 
17:double, col 19:double)(children: CastLongToDouble(col 0:tinyint) -> 
17:double, CastLongToDouble(col 0:tinyint) -> 19:double) -> 20:double, 
DoubleColMultiplyDoubleColumn(col 4:double, col 4:double)(children: col 
4:float, col 4:float) -> 17:double, CastLongToDouble(col 2:int) -> 19:double, 
DoubleColMultiplyDoubleColumn(col 21:double, col 22:double)(children: 
CastLongToDouble(col 2:int) -> 21:double, CastLongToDouble(col 2:int) -> 
22:double) -> 23:double
-                      Statistics: Num rows: 2503 Data size: 538153 Basic 
stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 2503 Data size: 592342 Basic 
stats: COMPLETE Column stats: NONE
                       Group By Operator
                         aggregations: sum(_col5), sum(_col4), count(_col0), 
sum(_col7), sum(_col6), count(_col1), sum(_col9), sum(_col8), count(_col2), 
sum(_col2), sum(_col3), count(_col3), sum(_col11), sum(_col10)
                         Group By Vectorization:

http://git-wip-us.apache.org/repos/asf/hive/blob/76148bb6/ql/src/test/results/clientpositive/spark/vectorization_4.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/spark/vectorization_4.q.out 
b/ql/src/test/results/clientpositive/spark/vectorization_4.q.out
index 922eb90..07d30cf 100644
--- a/ql/src/test/results/clientpositive/spark/vectorization_4.q.out
+++ b/ql/src/test/results/clientpositive/spark/vectorization_4.q.out
@@ -63,7 +63,7 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: alltypesorc
-                  Statistics: Num rows: 12288 Data size: 2641964 Basic stats: 
COMPLETE Column stats: NONE
+                  Statistics: Num rows: 12288 Data size: 2907994 Basic stats: 
COMPLETE Column stats: NONE
                   TableScan Vectorization:
                       native: true
                       vectorizationSchemaColumns: [0:ctinyint:tinyint, 
1:csmallint:smallint, 2:cint:int, 3:cbigint:bigint, 4:cfloat:float, 
5:cdouble:double, 6:cstring1:string, 7:cstring2:string, 
8:ctimestamp1:timestamp, 9:ctimestamp2:timestamp, 10:cboolean1:boolean, 
11:cboolean2:boolean, 
12:ROW__ID:struct<writeid:bigint,bucketid:int,rowid:bigint>]
@@ -73,7 +73,7 @@ STAGE PLANS:
                         native: true
                         predicateExpression: FilterExprOrExpr(children: 
FilterLongColGreaterEqualLongColumn(col 1:int, col 2:int)(children: col 
1:smallint), FilterExprAndExpr(children: FilterLongColLessEqualLongScalar(col 
0:int, val -89010)(children: col 0:tinyint), 
FilterDoubleColGreaterDoubleScalar(col 5:double, val 79.553)), 
FilterExprAndExpr(children: FilterLongColNotEqualLongScalar(col 3:bigint, val 
-563), FilterExprOrExpr(children: FilterLongColNotEqualLongColumn(col 0:bigint, 
col 3:bigint)(children: col 0:tinyint), 
FilterDoubleColLessEqualDoubleScalar(col 5:double, val -3728.0))))
                     predicate: (((UDFToInteger(ctinyint) <= -89010) and 
(cdouble > 79.553D)) or ((cbigint <> -563L) and ((UDFToLong(ctinyint) <> 
cbigint) or (cdouble <= -3728.0D))) or (UDFToInteger(csmallint) >= cint)) 
(type: boolean)
-                    Statistics: Num rows: 12288 Data size: 2641964 Basic 
stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 12288 Data size: 2907994 Basic 
stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: cint (type: int), cdouble (type: double), 
ctinyint (type: tinyint), (cdouble * cdouble) (type: double)
                       outputColumnNames: _col0, _col1, _col2, _col3
@@ -82,7 +82,7 @@ STAGE PLANS:
                           native: true
                           projectedOutputColumnNums: [2, 5, 0, 13]
                           selectExpressions: DoubleColMultiplyDoubleColumn(col 
5:double, col 5:double) -> 13:double
-                      Statistics: Num rows: 12288 Data size: 2641964 Basic 
stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 12288 Data size: 2907994 Basic 
stats: COMPLETE Column stats: NONE
                       Group By Operator
                         aggregations: sum(_col0), sum(_col3), sum(_col1), 
count(_col1), min(_col2)
                         Group By Vectorization:

http://git-wip-us.apache.org/repos/asf/hive/blob/76148bb6/ql/src/test/results/clientpositive/spark/vectorization_5.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/spark/vectorization_5.q.out 
b/ql/src/test/results/clientpositive/spark/vectorization_5.q.out
index 4cf4548..0fb430e 100644
--- a/ql/src/test/results/clientpositive/spark/vectorization_5.q.out
+++ b/ql/src/test/results/clientpositive/spark/vectorization_5.q.out
@@ -57,7 +57,7 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: alltypesorc
-                  Statistics: Num rows: 12288 Data size: 2641964 Basic stats: 
COMPLETE Column stats: NONE
+                  Statistics: Num rows: 12288 Data size: 2907994 Basic stats: 
COMPLETE Column stats: NONE
                   TableScan Vectorization:
                       native: true
                       vectorizationSchemaColumns: [0:ctinyint:tinyint, 
1:csmallint:smallint, 2:cint:int, 3:cbigint:bigint, 4:cfloat:float, 
5:cdouble:double, 6:cstring1:string, 7:cstring2:string, 
8:ctimestamp1:timestamp, 9:ctimestamp2:timestamp, 10:cboolean1:boolean, 
11:cboolean2:boolean, 
12:ROW__ID:struct<writeid:bigint,bucketid:int,rowid:bigint>]
@@ -67,7 +67,7 @@ STAGE PLANS:
                         native: true
                         predicateExpression: FilterExprOrExpr(children: 
FilterExprAndExpr(children: SelectColumnIsNotNull(col 11:boolean), 
FilterStringColLikeStringScalar(col 6:string, pattern %b%)), 
FilterExprAndExpr(children: FilterDoubleColEqualDoubleColumn(col 13:double, col 
5:double)(children: CastLongToDouble(col 0:tinyint) -> 13:double), 
SelectColumnIsNotNull(col 9:timestamp), FilterStringColLikeStringScalar(col 
7:string, pattern a)))
                     predicate: (((UDFToDouble(ctinyint) = cdouble) and 
ctimestamp2 is not null and (cstring2 like 'a')) or (cboolean2 is not null and 
(cstring1 like '%b%'))) (type: boolean)
-                    Statistics: Num rows: 9216 Data size: 1981473 Basic stats: 
COMPLETE Column stats: NONE
+                    Statistics: Num rows: 9216 Data size: 2180995 Basic stats: 
COMPLETE Column stats: NONE
                     Select Operator
                       expressions: ctinyint (type: tinyint), csmallint (type: 
smallint), cint (type: int)
                       outputColumnNames: ctinyint, csmallint, cint
@@ -75,7 +75,7 @@ STAGE PLANS:
                           className: VectorSelectOperator
                           native: true
                           projectedOutputColumnNums: [0, 1, 2]
-                      Statistics: Num rows: 9216 Data size: 1981473 Basic 
stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 9216 Data size: 2180995 Basic 
stats: COMPLETE Column stats: NONE
                       Group By Operator
                         aggregations: max(csmallint), count(), min(csmallint), 
sum(cint), max(ctinyint)
                         Group By Vectorization:

http://git-wip-us.apache.org/repos/asf/hive/blob/76148bb6/ql/src/test/results/clientpositive/spark/vectorization_6.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/spark/vectorization_6.q.out 
b/ql/src/test/results/clientpositive/spark/vectorization_6.q.out
index ebf4849..bdb014c 100644
--- a/ql/src/test/results/clientpositive/spark/vectorization_6.q.out
+++ b/ql/src/test/results/clientpositive/spark/vectorization_6.q.out
@@ -57,7 +57,7 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: alltypesorc
-                  Statistics: Num rows: 12288 Data size: 2641964 Basic stats: 
COMPLETE Column stats: NONE
+                  Statistics: Num rows: 12288 Data size: 2907994 Basic stats: 
COMPLETE Column stats: NONE
                   TableScan Vectorization:
                       native: true
                       vectorizationSchemaColumns: [0:ctinyint:tinyint, 
1:csmallint:smallint, 2:cint:int, 3:cbigint:bigint, 4:cfloat:float, 
5:cdouble:double, 6:cstring1:string, 7:cstring2:string, 
8:ctimestamp1:timestamp, 9:ctimestamp2:timestamp, 10:cboolean1:boolean, 
11:cboolean2:boolean, 
12:ROW__ID:struct<writeid:bigint,bucketid:int,rowid:bigint>]
@@ -67,7 +67,7 @@ STAGE PLANS:
                         native: true
                         predicateExpression: FilterExprAndExpr(children: 
FilterLongColNotEqualLongScalar(col 0:tinyint, val 0), 
FilterExprOrExpr(children: FilterExprAndExpr(children: 
FilterLongColLessEqualLongScalar(col 10:boolean, val 0), 
FilterLongColGreaterEqualLongColumn(col 11:boolean, col 10:boolean)), 
FilterExprAndExpr(children: SelectColumnIsNotNull(col 3:bigint), 
FilterExprOrExpr(children: FilterStringColLikeStringScalar(col 7:string, 
pattern %a), FilterDoubleColLessEqualDoubleScalar(col 4:float, val -257.0)))))
                     predicate: ((((cboolean1 <= 0) and (cboolean2 >= 
cboolean1)) or (cbigint is not null and ((cstring2 like '%a') or (cfloat <= 
-257)))) and (ctinyint <> 0Y)) (type: boolean)
-                    Statistics: Num rows: 11605 Data size: 2495116 Basic 
stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 11605 Data size: 2746359 Basic 
stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: cboolean1 (type: boolean), cfloat (type: 
float), cstring1 (type: string), (988888 * UDFToInteger(csmallint)) (type: 
int), (- csmallint) (type: smallint), (- cfloat) (type: float), (-26.28D / 
UDFToDouble(cfloat)) (type: double), (cfloat * 359.0) (type: float), (cint % 
UDFToInteger(ctinyint)) (type: int), (- cdouble) (type: double), 
(UDFToInteger(ctinyint) - -75) (type: int), (762 * (cint % 
UDFToInteger(ctinyint))) (type: int)
                       outputColumnNames: _col0, _col1, _col2, _col3, _col4, 
_col5, _col6, _col7, _col8, _col9, _col10, _col11
@@ -76,13 +76,13 @@ STAGE PLANS:
                           native: true
                           projectedOutputColumnNums: [10, 4, 6, 13, 14, 15, 
16, 17, 18, 19, 20, 22]
                           selectExpressions: LongScalarMultiplyLongColumn(val 
988888, col 1:int)(children: col 1:smallint) -> 13:int, LongColUnaryMinus(col 
1:smallint) -> 14:smallint, DoubleColUnaryMinus(col 4:float) -> 15:float, 
DoubleScalarDivideDoubleColumn(val -26.28, col 4:double)(children: col 4:float) 
-> 16:double, DoubleColMultiplyDoubleScalar(col 4:float, val 359.0) -> 
17:float, LongColModuloLongColumn(col 2:int, col 0:int)(children: col 
0:tinyint) -> 18:int, DoubleColUnaryMinus(col 5:double) -> 19:double, 
LongColSubtractLongScalar(col 0:int, val -75)(children: col 0:tinyint) -> 
20:int, LongScalarMultiplyLongColumn(val 762, col 21:int)(children: 
LongColModuloLongColumn(col 2:int, col 0:int)(children: col 0:tinyint) -> 
21:int) -> 22:int
-                      Statistics: Num rows: 11605 Data size: 2495116 Basic 
stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 11605 Data size: 2746359 Basic 
stats: COMPLETE Column stats: NONE
                       File Output Operator
                         compressed: false
                         File Sink Vectorization:
                             className: VectorFileSinkOperator
                             native: false
-                        Statistics: Num rows: 11605 Data size: 2495116 Basic 
stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 11605 Data size: 2746359 Basic 
stats: COMPLETE Column stats: NONE
                         table:
                             input format: 
org.apache.hadoop.mapred.SequenceFileInputFormat
                             output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat

http://git-wip-us.apache.org/repos/asf/hive/blob/76148bb6/ql/src/test/results/clientpositive/spark/vectorization_9.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/spark/vectorization_9.q.out 
b/ql/src/test/results/clientpositive/spark/vectorization_9.q.out
index 8798ebe..56bbb89 100644
--- a/ql/src/test/results/clientpositive/spark/vectorization_9.q.out
+++ b/ql/src/test/results/clientpositive/spark/vectorization_9.q.out
@@ -57,7 +57,7 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: alltypesorc
-                  Statistics: Num rows: 12288 Data size: 2641964 Basic stats: 
COMPLETE Column stats: NONE
+                  Statistics: Num rows: 12288 Data size: 2907994 Basic stats: 
COMPLETE Column stats: NONE
                   TableScan Vectorization:
                       native: true
                       vectorizationSchemaColumns: [0:ctinyint:tinyint, 
1:csmallint:smallint, 2:cint:int, 3:cbigint:bigint, 4:cfloat:float, 
5:cdouble:double, 6:cstring1:string, 7:cstring2:string, 
8:ctimestamp1:timestamp, 9:ctimestamp2:timestamp, 10:cboolean1:boolean, 
11:cboolean2:boolean, 
12:ROW__ID:struct<writeid:bigint,bucketid:int,rowid:bigint>]
@@ -67,7 +67,7 @@ STAGE PLANS:
                         native: true
                         predicateExpression: FilterExprAndExpr(children: 
FilterStringColLikeStringScalar(col 7:string, pattern %b%), 
FilterExprOrExpr(children: FilterDoubleColGreaterEqualDoubleScalar(col 
5:double, val -1.389), FilterStringGroupColLessStringScalar(col 6:string, val 
a)))
                     predicate: (((cdouble >= -1.389D) or (cstring1 < 'a')) and 
(cstring2 like '%b%')) (type: boolean)
-                    Statistics: Num rows: 4096 Data size: 880654 Basic stats: 
COMPLETE Column stats: NONE
+                    Statistics: Num rows: 4096 Data size: 969331 Basic stats: 
COMPLETE Column stats: NONE
                     Select Operator
                       expressions: cstring1 (type: string), cdouble (type: 
double), ctimestamp1 (type: timestamp), (cdouble * cdouble) (type: double)
                       outputColumnNames: _col0, _col1, _col2, _col3
@@ -76,7 +76,7 @@ STAGE PLANS:
                           native: true
                           projectedOutputColumnNums: [6, 5, 8, 13]
                           selectExpressions: DoubleColMultiplyDoubleColumn(col 
5:double, col 5:double) -> 13:double
-                      Statistics: Num rows: 4096 Data size: 880654 Basic 
stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 4096 Data size: 969331 Basic 
stats: COMPLETE Column stats: NONE
                       Group By Operator
                         aggregations: count(_col1), sum(_col3), sum(_col1), 
min(_col1)
                         Group By Vectorization:
@@ -90,7 +90,7 @@ STAGE PLANS:
                         keys: _col0 (type: string), _col1 (type: double), 
_col2 (type: timestamp)
                         mode: hash
                         outputColumnNames: _col0, _col1, _col2, _col3, _col4, 
_col5, _col6
-                        Statistics: Num rows: 4096 Data size: 880654 Basic 
stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 4096 Data size: 969331 Basic 
stats: COMPLETE Column stats: NONE
                         Reduce Output Operator
                           key expressions: _col0 (type: string), _col1 (type: 
double), _col2 (type: timestamp)
                           sort order: +++
@@ -101,7 +101,7 @@ STAGE PLANS:
                               native: true
                               nativeConditionsMet: 
hive.vectorized.execution.reducesink.new.enabled IS true, hive.execution.engine 
spark IN [tez, spark] IS true, No PTF TopN IS true, No DISTINCT columns IS 
true, BinarySortableSerDe for keys IS true, LazyBinarySerDe for values IS true
                               valueColumnNums: [3, 4, 5, 6]
-                          Statistics: Num rows: 4096 Data size: 880654 Basic 
stats: COMPLETE Column stats: NONE
+                          Statistics: Num rows: 4096 Data size: 969331 Basic 
stats: COMPLETE Column stats: NONE
                           value expressions: _col3 (type: bigint), _col4 
(type: double), _col5 (type: double), _col6 (type: double)
             Execution mode: vectorized
             Map Vectorization:
@@ -148,7 +148,7 @@ STAGE PLANS:
                 keys: KEY._col0 (type: string), KEY._col1 (type: double), 
KEY._col2 (type: timestamp)
                 mode: mergepartial
                 outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, 
_col6
-                Statistics: Num rows: 2048 Data size: 440327 Basic stats: 
COMPLETE Column stats: NONE
+                Statistics: Num rows: 2048 Data size: 484665 Basic stats: 
COMPLETE Column stats: NONE
                 Select Operator
                   expressions: _col0 (type: string), _col1 (type: double), 
_col2 (type: timestamp), (_col1 - 9763215.5639D) (type: double), (- (_col1 - 
9763215.5639D)) (type: double), _col3 (type: bigint), power(((_col4 - ((_col5 * 
_col5) / _col3)) / CASE WHEN ((_col3 = 1L)) THEN (null) ELSE ((_col3 - 1)) 
END), 0.5) (type: double), (- power(((_col4 - ((_col5 * _col5) / _col3)) / CASE 
WHEN ((_col3 = 1L)) THEN (null) ELSE ((_col3 - 1)) END), 0.5)) (type: double), 
(power(((_col4 - ((_col5 * _col5) / _col3)) / CASE WHEN ((_col3 = 1L)) THEN 
(null) ELSE ((_col3 - 1)) END), 0.5) * UDFToDouble(_col3)) (type: double), 
_col6 (type: double), (9763215.5639D / _col1) (type: double), (CAST( _col3 AS 
decimal(19,0)) / -1.389) (type: decimal(28,6)), power(((_col4 - ((_col5 * 
_col5) / _col3)) / CASE WHEN ((_col3 = 1L)) THEN (null) ELSE ((_col3 - 1)) 
END), 0.5) (type: double)
                   outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, 
_col6, _col7, _col8, _col9, _col10, _col11, _col12
@@ -157,13 +157,13 @@ STAGE PLANS:
                       native: true
                       projectedOutputColumnNums: [0, 1, 2, 7, 9, 3, 8, 14, 20, 
6, 10, 22, 17]
                       selectExpressions: DoubleColSubtractDoubleScalar(col 
1:double, val 9763215.5639) -> 7:double, DoubleColUnaryMinus(col 
8:double)(children: DoubleColSubtractDoubleScalar(col 1:double, val 
9763215.5639) -> 8:double) -> 9:double, FuncPowerDoubleToDouble(col 
10:double)(children: DoubleColDivideLongColumn(col 8:double, col 
13:bigint)(children: DoubleColSubtractDoubleColumn(col 4:double, col 
10:double)(children: DoubleColDivideLongColumn(col 8:double, col 
3:bigint)(children: DoubleColMultiplyDoubleColumn(col 5:double, col 5:double) 
-> 8:double) -> 10:double) -> 8:double, IfExprNullCondExpr(col 11:boolean, 
null, col 12:bigint)(children: LongColEqualLongScalar(col 3:bigint, val 1) -> 
11:boolean, LongColSubtractLongScalar(col 3:bigint, val 1) -> 12:bigint) -> 
13:bigint) -> 10:double) -> 8:double, DoubleColUnaryMinus(col 
10:double)(children: FuncPowerDoubleToDouble(col 14:double)(children: 
DoubleColDivideLongColumn(col 10:double, col 16:bigint)(children: 
DoubleColSubtractDoubleColumn(col 4:double, col 14:double)(children: 
DoubleColDivideLongColumn(col 10:double, col 3:bigint)(children: 
DoubleColMultiplyDoubleColumn(col 5:double, col 5:double) -> 10:double) -> 
14:double) -> 10:double, IfExprNullCondExpr(col 13:boolean, null, col 
15:bigint)(children: LongColEqualLongScalar(col 3:bigint, val 1) -> 13:boolean, 
LongColSubtractLongScalar(col 3:bigint, val 1) -> 15:bigint) -> 16:bigint) -> 
14:double) -> 10:double) -> 14:double, DoubleColMultiplyDoubleColumn(col 
10:double, col 17:double)(children: FuncPowerDoubleToDouble(col 
17:double)(children: DoubleColDivideLongColumn(col 10:double, col 
19:bigint)(children: DoubleColSubtractDoubleColumn(col 4:double, col 
17:double)(children: DoubleColDivideLongColumn(col 10:double, col 
3:bigint)(children: DoubleColMultiplyDoubleColumn(col 5:double, col 5:double) 
-> 10:double) -> 17:double) -> 10:double, IfExprNullCondExpr(col 16:boolean, 
null, col 18:bigint)(children: LongColEqualLongScalar(col 3:bigint, val 1) -> 
16:boolean, LongColSubtractLongScalar(col 3:bigint, val 1) -> 18:bigint) -> 
19:bigint) -> 17:double) -> 10:double, CastLongToDouble(col 3:bigint) -> 
17:double) -> 20:double, DoubleScalarDivideDoubleColumn(val 9763215.5639, col 
1:double) -> 10:double, DecimalColDivideDecimalScalar(col 21:decimal(19,0), val 
-1.389)(children: CastLongToDecimal(col 3:bigint) -> 21:decimal(19,0)) -> 
22:decimal(28,6), FuncPowerDoubleToDouble(col 23:double)(children: 
DoubleColDivideLongColumn(col 17:double, col 25:bigint)(children: 
DoubleColSubtractDoubleColumn(col 4:double, col 23:double)(children: 
DoubleColDivideLongColumn(col 17:double, col 3:bigint)(children: 
DoubleColMultiplyDoubleColumn(col 5:double, col 5:double) -> 17:double) -> 
23:double) -> 17:double, IfExprNullCondExpr(col 19:boolean, null, col 
24:bigint)(children: LongColEqualLongScalar(col 3:bigint, val 1) -> 19:boolean, 
LongColSubtractLongScalar(col 3:bigint, val 1) -> 24:bigint) -> 25:bigint) -> 
23:double) -> 17:double
-                  Statistics: Num rows: 2048 Data size: 440327 Basic stats: 
COMPLETE Column stats: NONE
+                  Statistics: Num rows: 2048 Data size: 484665 Basic stats: 
COMPLETE Column stats: NONE
                   File Output Operator
                     compressed: false
                     File Sink Vectorization:
                         className: VectorFileSinkOperator
                         native: false
-                    Statistics: Num rows: 2048 Data size: 440327 Basic stats: 
COMPLETE Column stats: NONE
+                    Statistics: Num rows: 2048 Data size: 484665 Basic stats: 
COMPLETE Column stats: NONE
                     table:
                         input format: 
org.apache.hadoop.mapred.SequenceFileInputFormat
                         output format: 
org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat

Reply via email to