Modified: hive/branches/branch-0.14/ql/src/test/results/clientpositive/dynpart_sort_opt_vectorization.q.out URL: http://svn.apache.org/viewvc/hive/branches/branch-0.14/ql/src/test/results/clientpositive/dynpart_sort_opt_vectorization.q.out?rev=1628877&r1=1628876&r2=1628877&view=diff ============================================================================== --- hive/branches/branch-0.14/ql/src/test/results/clientpositive/dynpart_sort_opt_vectorization.q.out (original) +++ hive/branches/branch-0.14/ql/src/test/results/clientpositive/dynpart_sort_opt_vectorization.q.out Thu Oct 2 01:59:44 2014 @@ -342,11 +342,11 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3, _col4 Statistics: Num rows: 1048 Data size: 310873 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col4 (type: tinyint), -1 (type: int) + key expressions: _col4 (type: tinyint), '_bucket_number' (type: string) sort order: ++ Map-reduce partition columns: _col4 (type: tinyint) Statistics: Num rows: 1048 Data size: 310873 Basic stats: COMPLETE Column stats: NONE - value expressions: _col0 (type: smallint), _col1 (type: int), _col2 (type: bigint), _col3 (type: float), _col4 (type: tinyint) + value expressions: _col0 (type: smallint), _col1 (type: int), _col2 (type: bigint), _col3 (type: float), _col4 (type: tinyint), '_bucket_number' (type: string) Execution mode: vectorized Reduce Operator Tree: Extract @@ -399,11 +399,11 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3, _col4 Statistics: Num rows: 1048 Data size: 310873 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col4 (type: tinyint), -1 (type: int), _col3 (type: float) + key expressions: _col4 (type: tinyint), '_bucket_number' (type: string), _col3 (type: float) sort order: +++ Map-reduce partition columns: _col4 (type: tinyint) Statistics: Num rows: 1048 Data size: 310873 Basic stats: COMPLETE Column stats: NONE - value expressions: _col0 (type: smallint), _col1 (type: int), _col2 (type: bigint), _col3 (type: float), _col4 (type: tinyint) + value expressions: _col0 (type: smallint), _col1 (type: int), _col2 (type: bigint), _col3 (type: float), _col4 (type: tinyint), '_bucket_number' (type: string) Execution mode: vectorized Reduce Operator Tree: Extract @@ -691,11 +691,11 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3, _col4 Statistics: Num rows: 1048 Data size: 310873 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col4 (type: tinyint), -1 (type: int) + key expressions: _col4 (type: tinyint), '_bucket_number' (type: string) sort order: ++ Map-reduce partition columns: _col4 (type: tinyint) Statistics: Num rows: 1048 Data size: 310873 Basic stats: COMPLETE Column stats: NONE - value expressions: _col0 (type: smallint), _col1 (type: int), _col2 (type: bigint), _col3 (type: float), _col4 (type: tinyint) + value expressions: _col0 (type: smallint), _col1 (type: int), _col2 (type: bigint), _col3 (type: float), _col4 (type: tinyint), '_bucket_number' (type: string) Execution mode: vectorized Reduce Operator Tree: Extract @@ -748,11 +748,11 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3, _col4 Statistics: Num rows: 1048 Data size: 310873 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col4 (type: tinyint), -1 (type: int), _col3 (type: float) + key expressions: _col4 (type: tinyint), '_bucket_number' (type: string), _col3 (type: float) sort order: +++ Map-reduce partition columns: _col4 (type: tinyint) Statistics: Num rows: 1048 Data size: 310873 Basic stats: COMPLETE Column stats: NONE - value expressions: _col0 (type: smallint), _col1 (type: int), _col2 (type: bigint), _col3 (type: float), _col4 (type: tinyint) + value expressions: _col0 (type: smallint), _col1 (type: int), _col2 (type: bigint), _col3 (type: float), _col4 (type: tinyint), '_bucket_number' (type: string) Execution mode: vectorized Reduce Operator Tree: Extract @@ -2063,11 +2063,11 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3, _col4 Statistics: Num rows: 1048 Data size: 310873 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col4 (type: tinyint), -1 (type: int), _col3 (type: float) + key expressions: _col4 (type: tinyint), '_bucket_number' (type: string), _col3 (type: float) sort order: +++ Map-reduce partition columns: _col4 (type: tinyint) Statistics: Num rows: 1048 Data size: 310873 Basic stats: COMPLETE Column stats: NONE - value expressions: _col0 (type: smallint), _col1 (type: int), _col2 (type: bigint), _col3 (type: float), _col4 (type: tinyint) + value expressions: _col0 (type: smallint), _col1 (type: int), _col2 (type: bigint), _col3 (type: float), _col4 (type: tinyint), '_bucket_number' (type: string) Execution mode: vectorized Reduce Operator Tree: Extract
Modified: hive/branches/branch-0.14/ql/src/test/results/clientpositive/dynpart_sort_optimization.q.out URL: http://svn.apache.org/viewvc/hive/branches/branch-0.14/ql/src/test/results/clientpositive/dynpart_sort_optimization.q.out?rev=1628877&r1=1628876&r2=1628877&view=diff ============================================================================== --- hive/branches/branch-0.14/ql/src/test/results/clientpositive/dynpart_sort_optimization.q.out (original) +++ hive/branches/branch-0.14/ql/src/test/results/clientpositive/dynpart_sort_optimization.q.out Thu Oct 2 01:59:44 2014 @@ -275,11 +275,11 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3, _col4 Statistics: Num rows: 4442 Data size: 106611 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col4 (type: tinyint), -1 (type: int) + key expressions: _col4 (type: tinyint), '_bucket_number' (type: string) sort order: ++ Map-reduce partition columns: _col4 (type: tinyint) Statistics: Num rows: 4442 Data size: 106611 Basic stats: COMPLETE Column stats: NONE - value expressions: _col0 (type: smallint), _col1 (type: int), _col2 (type: bigint), _col3 (type: float), _col4 (type: tinyint) + value expressions: _col0 (type: smallint), _col1 (type: int), _col2 (type: bigint), _col3 (type: float), _col4 (type: tinyint), '_bucket_number' (type: string) Reduce Operator Tree: Extract Statistics: Num rows: 4442 Data size: 106611 Basic stats: COMPLETE Column stats: NONE @@ -331,11 +331,11 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3, _col4 Statistics: Num rows: 4442 Data size: 106611 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col4 (type: tinyint), -1 (type: int), _col3 (type: float) + key expressions: _col4 (type: tinyint), '_bucket_number' (type: string), _col3 (type: float) sort order: +++ Map-reduce partition columns: _col4 (type: tinyint) Statistics: Num rows: 4442 Data size: 106611 Basic stats: COMPLETE Column stats: NONE - value expressions: _col0 (type: smallint), _col1 (type: int), _col2 (type: bigint), _col3 (type: float), _col4 (type: tinyint) + value expressions: _col0 (type: smallint), _col1 (type: int), _col2 (type: bigint), _col3 (type: float), _col4 (type: tinyint), '_bucket_number' (type: string) Reduce Operator Tree: Extract Statistics: Num rows: 4442 Data size: 106611 Basic stats: COMPLETE Column stats: NONE @@ -598,11 +598,11 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3, _col4 Statistics: Num rows: 4442 Data size: 106611 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col4 (type: tinyint), -1 (type: int) + key expressions: _col4 (type: tinyint), '_bucket_number' (type: string) sort order: ++ Map-reduce partition columns: _col4 (type: tinyint) Statistics: Num rows: 4442 Data size: 106611 Basic stats: COMPLETE Column stats: NONE - value expressions: _col0 (type: smallint), _col1 (type: int), _col2 (type: bigint), _col3 (type: float), _col4 (type: tinyint) + value expressions: _col0 (type: smallint), _col1 (type: int), _col2 (type: bigint), _col3 (type: float), _col4 (type: tinyint), '_bucket_number' (type: string) Reduce Operator Tree: Extract Statistics: Num rows: 4442 Data size: 106611 Basic stats: COMPLETE Column stats: NONE @@ -654,11 +654,11 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3, _col4 Statistics: Num rows: 4442 Data size: 106611 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col4 (type: tinyint), -1 (type: int), _col3 (type: float) + key expressions: _col4 (type: tinyint), '_bucket_number' (type: string), _col3 (type: float) sort order: +++ Map-reduce partition columns: _col4 (type: tinyint) Statistics: Num rows: 4442 Data size: 106611 Basic stats: COMPLETE Column stats: NONE - value expressions: _col0 (type: smallint), _col1 (type: int), _col2 (type: bigint), _col3 (type: float), _col4 (type: tinyint) + value expressions: _col0 (type: smallint), _col1 (type: int), _col2 (type: bigint), _col3 (type: float), _col4 (type: tinyint), '_bucket_number' (type: string) Reduce Operator Tree: Extract Statistics: Num rows: 4442 Data size: 106611 Basic stats: COMPLETE Column stats: NONE @@ -1962,11 +1962,11 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3, _col4 Statistics: Num rows: 4442 Data size: 106611 Basic stats: COMPLETE Column stats: NONE Reduce Output Operator - key expressions: _col4 (type: tinyint), -1 (type: int), _col3 (type: float) + key expressions: _col4 (type: tinyint), '_bucket_number' (type: string), _col3 (type: float) sort order: +++ Map-reduce partition columns: _col4 (type: tinyint) Statistics: Num rows: 4442 Data size: 106611 Basic stats: COMPLETE Column stats: NONE - value expressions: _col0 (type: smallint), _col1 (type: int), _col2 (type: bigint), _col3 (type: float), _col4 (type: tinyint) + value expressions: _col0 (type: smallint), _col1 (type: int), _col2 (type: bigint), _col3 (type: float), _col4 (type: tinyint), '_bucket_number' (type: string) Reduce Operator Tree: Extract Statistics: Num rows: 4442 Data size: 106611 Basic stats: COMPLETE Column stats: NONE Added: hive/branches/branch-0.14/ql/src/test/results/clientpositive/dynpart_sort_optimization2.q.out URL: http://svn.apache.org/viewvc/hive/branches/branch-0.14/ql/src/test/results/clientpositive/dynpart_sort_optimization2.q.out?rev=1628877&view=auto ============================================================================== --- hive/branches/branch-0.14/ql/src/test/results/clientpositive/dynpart_sort_optimization2.q.out (added) +++ hive/branches/branch-0.14/ql/src/test/results/clientpositive/dynpart_sort_optimization2.q.out Thu Oct 2 01:59:44 2014 @@ -0,0 +1,1782 @@ +PREHOOK: query: drop table ss +PREHOOK: type: DROPTABLE +POSTHOOK: query: drop table ss +POSTHOOK: type: DROPTABLE +PREHOOK: query: drop table ss_orc +PREHOOK: type: DROPTABLE +POSTHOOK: query: drop table ss_orc +POSTHOOK: type: DROPTABLE +PREHOOK: query: drop table ss_part +PREHOOK: type: DROPTABLE +POSTHOOK: query: drop table ss_part +POSTHOOK: type: DROPTABLE +PREHOOK: query: drop table ss_part_orc +PREHOOK: type: DROPTABLE +POSTHOOK: query: drop table ss_part_orc +POSTHOOK: type: DROPTABLE +PREHOOK: query: create table ss ( +ss_sold_date_sk int, +ss_net_paid_inc_tax float, +ss_net_profit float) +PREHOOK: type: CREATETABLE +PREHOOK: Output: database:default +PREHOOK: Output: default@ss +POSTHOOK: query: create table ss ( +ss_sold_date_sk int, +ss_net_paid_inc_tax float, +ss_net_profit float) +POSTHOOK: type: CREATETABLE +POSTHOOK: Output: database:default +POSTHOOK: Output: default@ss +PREHOOK: query: create table ss_part ( +ss_net_paid_inc_tax float, +ss_net_profit float) +partitioned by (ss_sold_date_sk int) +PREHOOK: type: CREATETABLE +PREHOOK: Output: database:default +PREHOOK: Output: default@ss_part +POSTHOOK: query: create table ss_part ( +ss_net_paid_inc_tax float, +ss_net_profit float) +partitioned by (ss_sold_date_sk int) +POSTHOOK: type: CREATETABLE +POSTHOOK: Output: database:default +POSTHOOK: Output: default@ss_part +PREHOOK: query: load data local inpath '../../data/files/dynpart_test.txt' overwrite into table ss +PREHOOK: type: LOAD +#### A masked pattern was here #### +PREHOOK: Output: default@ss +POSTHOOK: query: load data local inpath '../../data/files/dynpart_test.txt' overwrite into table ss +POSTHOOK: type: LOAD +#### A masked pattern was here #### +POSTHOOK: Output: default@ss +PREHOOK: query: explain insert overwrite table ss_part partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + group by ss_sold_date_sk, + ss_net_paid_inc_tax, + ss_net_profit + distribute by ss_sold_date_sk +PREHOOK: type: QUERY +POSTHOOK: query: explain insert overwrite table ss_part partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + group by ss_sold_date_sk, + ss_net_paid_inc_tax, + ss_net_profit + distribute by ss_sold_date_sk +POSTHOOK: type: QUERY +STAGE DEPENDENCIES: + Stage-1 is a root stage + Stage-0 depends on stages: Stage-1 + Stage-2 depends on stages: Stage-0 + +STAGE PLANS: + Stage: Stage-1 + Map Reduce + Map Operator Tree: + TableScan + alias: ss + Statistics: Num rows: 46 Data size: 553 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: ((ss_sold_date_sk >= 2452617) and (ss_sold_date_sk <= 2452638)) (type: boolean) + Statistics: Num rows: 5 Data size: 60 Basic stats: COMPLETE Column stats: NONE + Select Operator + expressions: ss_sold_date_sk (type: int), ss_net_paid_inc_tax (type: float), ss_net_profit (type: float) + outputColumnNames: ss_sold_date_sk, ss_net_paid_inc_tax, ss_net_profit + Statistics: Num rows: 5 Data size: 60 Basic stats: COMPLETE Column stats: NONE + Group By Operator + keys: ss_sold_date_sk (type: int), ss_net_paid_inc_tax (type: float), ss_net_profit (type: float) + mode: hash + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 5 Data size: 60 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + key expressions: _col0 (type: int), _col1 (type: float), _col2 (type: float) + sort order: +++ + Map-reduce partition columns: _col0 (type: int) + Statistics: Num rows: 5 Data size: 60 Basic stats: COMPLETE Column stats: NONE + Reduce Operator Tree: + Group By Operator + keys: KEY._col0 (type: int), KEY._col1 (type: float), KEY._col2 (type: float) + mode: mergepartial + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 2 Data size: 24 Basic stats: COMPLETE Column stats: NONE + Select Operator + expressions: _col1 (type: float), _col2 (type: float), _col0 (type: int) + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 2 Data size: 24 Basic stats: COMPLETE Column stats: NONE + File Output Operator + compressed: false + Statistics: Num rows: 2 Data size: 24 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.ss_part + + Stage: Stage-0 + Move Operator + tables: + partition: + ss_sold_date_sk + replace: true + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.ss_part + + Stage: Stage-2 + Stats-Aggr Operator + +PREHOOK: query: insert overwrite table ss_part partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + group by ss_sold_date_sk, + ss_net_paid_inc_tax, + ss_net_profit + distribute by ss_sold_date_sk +PREHOOK: type: QUERY +PREHOOK: Input: default@ss +PREHOOK: Output: default@ss_part +POSTHOOK: query: insert overwrite table ss_part partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + group by ss_sold_date_sk, + ss_net_paid_inc_tax, + ss_net_profit + distribute by ss_sold_date_sk +POSTHOOK: type: QUERY +POSTHOOK: Input: default@ss +POSTHOOK: Output: default@ss_part@ss_sold_date_sk=2452617 +POSTHOOK: Output: default@ss_part@ss_sold_date_sk=2452638 +POSTHOOK: Lineage: ss_part PARTITION(ss_sold_date_sk=2452617).ss_net_paid_inc_tax SIMPLE [(ss)ss.FieldSchema(name:ss_net_paid_inc_tax, type:float, comment:null), ] +POSTHOOK: Lineage: ss_part PARTITION(ss_sold_date_sk=2452617).ss_net_profit SIMPLE [(ss)ss.FieldSchema(name:ss_net_profit, type:float, comment:null), ] +POSTHOOK: Lineage: ss_part PARTITION(ss_sold_date_sk=2452638).ss_net_paid_inc_tax SIMPLE [(ss)ss.FieldSchema(name:ss_net_paid_inc_tax, type:float, comment:null), ] +POSTHOOK: Lineage: ss_part PARTITION(ss_sold_date_sk=2452638).ss_net_profit SIMPLE [(ss)ss.FieldSchema(name:ss_net_profit, type:float, comment:null), ] +PREHOOK: query: desc formatted ss_part partition(ss_sold_date_sk=2452617) +PREHOOK: type: DESCTABLE +PREHOOK: Input: default@ss_part +POSTHOOK: query: desc formatted ss_part partition(ss_sold_date_sk=2452617) +POSTHOOK: type: DESCTABLE +POSTHOOK: Input: default@ss_part +# col_name data_type comment + +ss_net_paid_inc_tax float +ss_net_profit float + +# Partition Information +# col_name data_type comment + +ss_sold_date_sk int + +# Detailed Partition Information +Partition Value: [2452617] +Database: default +Table: ss_part +#### A masked pattern was here #### +Protect Mode: None +#### A masked pattern was here #### +Partition Parameters: + COLUMN_STATS_ACCURATE true + numFiles 1 + numRows 11 + rawDataSize 151 + totalSize 162 +#### A masked pattern was here #### + +# Storage Information +SerDe Library: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe +InputFormat: org.apache.hadoop.mapred.TextInputFormat +OutputFormat: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat +Compressed: No +Num Buckets: -1 +Bucket Columns: [] +Sort Columns: [] +Storage Desc Params: + serialization.format 1 +PREHOOK: query: select * from ss_part where ss_sold_date_sk=2452617 +PREHOOK: type: QUERY +PREHOOK: Input: default@ss_part +PREHOOK: Input: default@ss_part@ss_sold_date_sk=2452617 +#### A masked pattern was here #### +POSTHOOK: query: select * from ss_part where ss_sold_date_sk=2452617 +POSTHOOK: type: QUERY +POSTHOOK: Input: default@ss_part +POSTHOOK: Input: default@ss_part@ss_sold_date_sk=2452617 +#### A masked pattern was here #### +2.1 -2026.3 2452617 +2.99 -11.32 2452617 +85.8 25.61 2452617 +552.96 -1363.84 2452617 +565.92 196.48 2452617 +879.07 -2185.76 2452617 +1765.07 -4648.8 2452617 +3423.95 -3164.07 2452617 +5362.01 -600.28 2452617 +7412.83 2071.68 2452617 +10022.63 3952.8 2452617 +PREHOOK: query: desc formatted ss_part partition(ss_sold_date_sk=2452638) +PREHOOK: type: DESCTABLE +PREHOOK: Input: default@ss_part +POSTHOOK: query: desc formatted ss_part partition(ss_sold_date_sk=2452638) +POSTHOOK: type: DESCTABLE +POSTHOOK: Input: default@ss_part +# col_name data_type comment + +ss_net_paid_inc_tax float +ss_net_profit float + +# Partition Information +# col_name data_type comment + +ss_sold_date_sk int + +# Detailed Partition Information +Partition Value: [2452638] +Database: default +Table: ss_part +#### A masked pattern was here #### +Protect Mode: None +#### A masked pattern was here #### +Partition Parameters: + COLUMN_STATS_ACCURATE true + numFiles 1 + numRows 13 + rawDataSize 186 + totalSize 199 +#### A masked pattern was here #### + +# Storage Information +SerDe Library: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe +InputFormat: org.apache.hadoop.mapred.TextInputFormat +OutputFormat: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat +Compressed: No +Num Buckets: -1 +Bucket Columns: [] +Sort Columns: [] +Storage Desc Params: + serialization.format 1 +PREHOOK: query: select * from ss_part where ss_sold_date_sk=2452638 +PREHOOK: type: QUERY +PREHOOK: Input: default@ss_part +PREHOOK: Input: default@ss_part@ss_sold_date_sk=2452638 +#### A masked pattern was here #### +POSTHOOK: query: select * from ss_part where ss_sold_date_sk=2452638 +POSTHOOK: type: QUERY +POSTHOOK: Input: default@ss_part +POSTHOOK: Input: default@ss_part@ss_sold_date_sk=2452638 +#### A masked pattern was here #### +0.15 -241.22 2452638 +150.39 -162.12 2452638 +156.67 -4626.56 2452638 +181.03 -207.24 2452638 +267.01 -3266.36 2452638 +317.87 -3775.38 2452638 +1327.08 57.97 2452638 +1413.19 178.08 2452638 +1524.33 494.37 2452638 +1971.35 -488.25 2452638 +4133.98 -775.72 2452638 +4329.49 -4000.51 2452638 +10171.1 660.48 2452638 +PREHOOK: query: explain insert overwrite table ss_part partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + distribute by ss_sold_date_sk +PREHOOK: type: QUERY +POSTHOOK: query: explain insert overwrite table ss_part partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + distribute by ss_sold_date_sk +POSTHOOK: type: QUERY +STAGE DEPENDENCIES: + Stage-1 is a root stage + Stage-0 depends on stages: Stage-1 + Stage-2 depends on stages: Stage-0 + +STAGE PLANS: + Stage: Stage-1 + Map Reduce + Map Operator Tree: + TableScan + alias: ss + Statistics: Num rows: 46 Data size: 553 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: ((ss_sold_date_sk >= 2452617) and (ss_sold_date_sk <= 2452638)) (type: boolean) + Statistics: Num rows: 5 Data size: 60 Basic stats: COMPLETE Column stats: NONE + Select Operator + expressions: ss_net_paid_inc_tax (type: float), ss_net_profit (type: float), ss_sold_date_sk (type: int) + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 5 Data size: 60 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + key expressions: _col2 (type: int) + sort order: + + Map-reduce partition columns: _col2 (type: int) + Statistics: Num rows: 5 Data size: 60 Basic stats: COMPLETE Column stats: NONE + value expressions: _col0 (type: float), _col1 (type: float), _col2 (type: int) + Reduce Operator Tree: + Select Operator + expressions: VALUE._col0 (type: float), VALUE._col1 (type: float), VALUE._col2 (type: int) + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 5 Data size: 60 Basic stats: COMPLETE Column stats: NONE + File Output Operator + compressed: false + Statistics: Num rows: 5 Data size: 60 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.ss_part + + Stage: Stage-0 + Move Operator + tables: + partition: + ss_sold_date_sk + replace: true + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.ss_part + + Stage: Stage-2 + Stats-Aggr Operator + +PREHOOK: query: insert overwrite table ss_part partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + distribute by ss_sold_date_sk +PREHOOK: type: QUERY +PREHOOK: Input: default@ss +PREHOOK: Output: default@ss_part +POSTHOOK: query: insert overwrite table ss_part partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + distribute by ss_sold_date_sk +POSTHOOK: type: QUERY +POSTHOOK: Input: default@ss +POSTHOOK: Output: default@ss_part@ss_sold_date_sk=2452617 +POSTHOOK: Output: default@ss_part@ss_sold_date_sk=2452638 +POSTHOOK: Lineage: ss_part PARTITION(ss_sold_date_sk=2452617).ss_net_paid_inc_tax SIMPLE [(ss)ss.FieldSchema(name:ss_net_paid_inc_tax, type:float, comment:null), ] +POSTHOOK: Lineage: ss_part PARTITION(ss_sold_date_sk=2452617).ss_net_profit SIMPLE [(ss)ss.FieldSchema(name:ss_net_profit, type:float, comment:null), ] +POSTHOOK: Lineage: ss_part PARTITION(ss_sold_date_sk=2452638).ss_net_paid_inc_tax SIMPLE [(ss)ss.FieldSchema(name:ss_net_paid_inc_tax, type:float, comment:null), ] +POSTHOOK: Lineage: ss_part PARTITION(ss_sold_date_sk=2452638).ss_net_profit SIMPLE [(ss)ss.FieldSchema(name:ss_net_profit, type:float, comment:null), ] +PREHOOK: query: desc formatted ss_part partition(ss_sold_date_sk=2452617) +PREHOOK: type: DESCTABLE +PREHOOK: Input: default@ss_part +POSTHOOK: query: desc formatted ss_part partition(ss_sold_date_sk=2452617) +POSTHOOK: type: DESCTABLE +POSTHOOK: Input: default@ss_part +# col_name data_type comment + +ss_net_paid_inc_tax float +ss_net_profit float + +# Partition Information +# col_name data_type comment + +ss_sold_date_sk int + +# Detailed Partition Information +Partition Value: [2452617] +Database: default +Table: ss_part +#### A masked pattern was here #### +Protect Mode: None +#### A masked pattern was here #### +Partition Parameters: + COLUMN_STATS_ACCURATE true + numFiles 1 + numRows 11 + rawDataSize 151 + totalSize 162 +#### A masked pattern was here #### + +# Storage Information +SerDe Library: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe +InputFormat: org.apache.hadoop.mapred.TextInputFormat +OutputFormat: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat +Compressed: No +Num Buckets: -1 +Bucket Columns: [] +Sort Columns: [] +Storage Desc Params: + serialization.format 1 +PREHOOK: query: select * from ss_part where ss_sold_date_sk=2452617 +PREHOOK: type: QUERY +PREHOOK: Input: default@ss_part +PREHOOK: Input: default@ss_part@ss_sold_date_sk=2452617 +#### A masked pattern was here #### +POSTHOOK: query: select * from ss_part where ss_sold_date_sk=2452617 +POSTHOOK: type: QUERY +POSTHOOK: Input: default@ss_part +POSTHOOK: Input: default@ss_part@ss_sold_date_sk=2452617 +#### A masked pattern was here #### +10022.63 3952.8 2452617 +2.99 -11.32 2452617 +3423.95 -3164.07 2452617 +5362.01 -600.28 2452617 +565.92 196.48 2452617 +85.8 25.61 2452617 +7412.83 2071.68 2452617 +879.07 -2185.76 2452617 +1765.07 -4648.8 2452617 +552.96 -1363.84 2452617 +2.1 -2026.3 2452617 +PREHOOK: query: desc formatted ss_part partition(ss_sold_date_sk=2452638) +PREHOOK: type: DESCTABLE +PREHOOK: Input: default@ss_part +POSTHOOK: query: desc formatted ss_part partition(ss_sold_date_sk=2452638) +POSTHOOK: type: DESCTABLE +POSTHOOK: Input: default@ss_part +# col_name data_type comment + +ss_net_paid_inc_tax float +ss_net_profit float + +# Partition Information +# col_name data_type comment + +ss_sold_date_sk int + +# Detailed Partition Information +Partition Value: [2452638] +Database: default +Table: ss_part +#### A masked pattern was here #### +Protect Mode: None +#### A masked pattern was here #### +Partition Parameters: + COLUMN_STATS_ACCURATE true + numFiles 1 + numRows 13 + rawDataSize 186 + totalSize 199 +#### A masked pattern was here #### + +# Storage Information +SerDe Library: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe +InputFormat: org.apache.hadoop.mapred.TextInputFormat +OutputFormat: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat +Compressed: No +Num Buckets: -1 +Bucket Columns: [] +Sort Columns: [] +Storage Desc Params: + serialization.format 1 +PREHOOK: query: select * from ss_part where ss_sold_date_sk=2452638 +PREHOOK: type: QUERY +PREHOOK: Input: default@ss_part +PREHOOK: Input: default@ss_part@ss_sold_date_sk=2452638 +#### A masked pattern was here #### +POSTHOOK: query: select * from ss_part where ss_sold_date_sk=2452638 +POSTHOOK: type: QUERY +POSTHOOK: Input: default@ss_part +POSTHOOK: Input: default@ss_part@ss_sold_date_sk=2452638 +#### A masked pattern was here #### +4329.49 -4000.51 2452638 +1413.19 178.08 2452638 +150.39 -162.12 2452638 +1524.33 494.37 2452638 +0.15 -241.22 2452638 +267.01 -3266.36 2452638 +181.03 -207.24 2452638 +1971.35 -488.25 2452638 +1327.08 57.97 2452638 +156.67 -4626.56 2452638 +317.87 -3775.38 2452638 +10171.1 660.48 2452638 +4133.98 -775.72 2452638 +PREHOOK: query: -- SORT DYNAMIC PARTITION DISABLED + +explain insert overwrite table ss_part partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + group by ss_sold_date_sk, + ss_net_paid_inc_tax, + ss_net_profit + distribute by ss_sold_date_sk +PREHOOK: type: QUERY +POSTHOOK: query: -- SORT DYNAMIC PARTITION DISABLED + +explain insert overwrite table ss_part partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + group by ss_sold_date_sk, + ss_net_paid_inc_tax, + ss_net_profit + distribute by ss_sold_date_sk +POSTHOOK: type: QUERY +STAGE DEPENDENCIES: + Stage-1 is a root stage + Stage-0 depends on stages: Stage-1 + Stage-2 depends on stages: Stage-0 + +STAGE PLANS: + Stage: Stage-1 + Map Reduce + Map Operator Tree: + TableScan + alias: ss + Statistics: Num rows: 46 Data size: 553 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: ((ss_sold_date_sk >= 2452617) and (ss_sold_date_sk <= 2452638)) (type: boolean) + Statistics: Num rows: 5 Data size: 60 Basic stats: COMPLETE Column stats: NONE + Select Operator + expressions: ss_sold_date_sk (type: int), ss_net_paid_inc_tax (type: float), ss_net_profit (type: float) + outputColumnNames: ss_sold_date_sk, ss_net_paid_inc_tax, ss_net_profit + Statistics: Num rows: 5 Data size: 60 Basic stats: COMPLETE Column stats: NONE + Group By Operator + keys: ss_sold_date_sk (type: int), ss_net_paid_inc_tax (type: float), ss_net_profit (type: float) + mode: hash + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 5 Data size: 60 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + key expressions: _col0 (type: int), _col1 (type: float), _col2 (type: float) + sort order: +++ + Map-reduce partition columns: _col0 (type: int) + Statistics: Num rows: 5 Data size: 60 Basic stats: COMPLETE Column stats: NONE + Reduce Operator Tree: + Group By Operator + keys: KEY._col0 (type: int), KEY._col1 (type: float), KEY._col2 (type: float) + mode: mergepartial + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 2 Data size: 24 Basic stats: COMPLETE Column stats: NONE + Select Operator + expressions: _col1 (type: float), _col2 (type: float), _col0 (type: int) + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 2 Data size: 24 Basic stats: COMPLETE Column stats: NONE + File Output Operator + compressed: false + Statistics: Num rows: 2 Data size: 24 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.ss_part + + Stage: Stage-0 + Move Operator + tables: + partition: + ss_sold_date_sk + replace: true + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.ss_part + + Stage: Stage-2 + Stats-Aggr Operator + +PREHOOK: query: insert overwrite table ss_part partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + group by ss_sold_date_sk, + ss_net_paid_inc_tax, + ss_net_profit + distribute by ss_sold_date_sk +PREHOOK: type: QUERY +PREHOOK: Input: default@ss +PREHOOK: Output: default@ss_part +POSTHOOK: query: insert overwrite table ss_part partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + group by ss_sold_date_sk, + ss_net_paid_inc_tax, + ss_net_profit + distribute by ss_sold_date_sk +POSTHOOK: type: QUERY +POSTHOOK: Input: default@ss +POSTHOOK: Output: default@ss_part@ss_sold_date_sk=2452617 +POSTHOOK: Output: default@ss_part@ss_sold_date_sk=2452638 +POSTHOOK: Lineage: ss_part PARTITION(ss_sold_date_sk=2452617).ss_net_paid_inc_tax SIMPLE [(ss)ss.FieldSchema(name:ss_net_paid_inc_tax, type:float, comment:null), ] +POSTHOOK: Lineage: ss_part PARTITION(ss_sold_date_sk=2452617).ss_net_profit SIMPLE [(ss)ss.FieldSchema(name:ss_net_profit, type:float, comment:null), ] +POSTHOOK: Lineage: ss_part PARTITION(ss_sold_date_sk=2452638).ss_net_paid_inc_tax SIMPLE [(ss)ss.FieldSchema(name:ss_net_paid_inc_tax, type:float, comment:null), ] +POSTHOOK: Lineage: ss_part PARTITION(ss_sold_date_sk=2452638).ss_net_profit SIMPLE [(ss)ss.FieldSchema(name:ss_net_profit, type:float, comment:null), ] +PREHOOK: query: desc formatted ss_part partition(ss_sold_date_sk=2452617) +PREHOOK: type: DESCTABLE +PREHOOK: Input: default@ss_part +POSTHOOK: query: desc formatted ss_part partition(ss_sold_date_sk=2452617) +POSTHOOK: type: DESCTABLE +POSTHOOK: Input: default@ss_part +# col_name data_type comment + +ss_net_paid_inc_tax float +ss_net_profit float + +# Partition Information +# col_name data_type comment + +ss_sold_date_sk int + +# Detailed Partition Information +Partition Value: [2452617] +Database: default +Table: ss_part +#### A masked pattern was here #### +Protect Mode: None +#### A masked pattern was here #### +Partition Parameters: + COLUMN_STATS_ACCURATE true + numFiles 1 + numRows 11 + rawDataSize 151 + totalSize 162 +#### A masked pattern was here #### + +# Storage Information +SerDe Library: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe +InputFormat: org.apache.hadoop.mapred.TextInputFormat +OutputFormat: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat +Compressed: No +Num Buckets: -1 +Bucket Columns: [] +Sort Columns: [] +Storage Desc Params: + serialization.format 1 +PREHOOK: query: select * from ss_part where ss_sold_date_sk=2452617 +PREHOOK: type: QUERY +PREHOOK: Input: default@ss_part +PREHOOK: Input: default@ss_part@ss_sold_date_sk=2452617 +#### A masked pattern was here #### +POSTHOOK: query: select * from ss_part where ss_sold_date_sk=2452617 +POSTHOOK: type: QUERY +POSTHOOK: Input: default@ss_part +POSTHOOK: Input: default@ss_part@ss_sold_date_sk=2452617 +#### A masked pattern was here #### +2.1 -2026.3 2452617 +2.99 -11.32 2452617 +85.8 25.61 2452617 +552.96 -1363.84 2452617 +565.92 196.48 2452617 +879.07 -2185.76 2452617 +1765.07 -4648.8 2452617 +3423.95 -3164.07 2452617 +5362.01 -600.28 2452617 +7412.83 2071.68 2452617 +10022.63 3952.8 2452617 +PREHOOK: query: desc formatted ss_part partition(ss_sold_date_sk=2452638) +PREHOOK: type: DESCTABLE +PREHOOK: Input: default@ss_part +POSTHOOK: query: desc formatted ss_part partition(ss_sold_date_sk=2452638) +POSTHOOK: type: DESCTABLE +POSTHOOK: Input: default@ss_part +# col_name data_type comment + +ss_net_paid_inc_tax float +ss_net_profit float + +# Partition Information +# col_name data_type comment + +ss_sold_date_sk int + +# Detailed Partition Information +Partition Value: [2452638] +Database: default +Table: ss_part +#### A masked pattern was here #### +Protect Mode: None +#### A masked pattern was here #### +Partition Parameters: + COLUMN_STATS_ACCURATE true + numFiles 1 + numRows 13 + rawDataSize 186 + totalSize 199 +#### A masked pattern was here #### + +# Storage Information +SerDe Library: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe +InputFormat: org.apache.hadoop.mapred.TextInputFormat +OutputFormat: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat +Compressed: No +Num Buckets: -1 +Bucket Columns: [] +Sort Columns: [] +Storage Desc Params: + serialization.format 1 +PREHOOK: query: select * from ss_part where ss_sold_date_sk=2452638 +PREHOOK: type: QUERY +PREHOOK: Input: default@ss_part +PREHOOK: Input: default@ss_part@ss_sold_date_sk=2452638 +#### A masked pattern was here #### +POSTHOOK: query: select * from ss_part where ss_sold_date_sk=2452638 +POSTHOOK: type: QUERY +POSTHOOK: Input: default@ss_part +POSTHOOK: Input: default@ss_part@ss_sold_date_sk=2452638 +#### A masked pattern was here #### +0.15 -241.22 2452638 +150.39 -162.12 2452638 +156.67 -4626.56 2452638 +181.03 -207.24 2452638 +267.01 -3266.36 2452638 +317.87 -3775.38 2452638 +1327.08 57.97 2452638 +1413.19 178.08 2452638 +1524.33 494.37 2452638 +1971.35 -488.25 2452638 +4133.98 -775.72 2452638 +4329.49 -4000.51 2452638 +10171.1 660.48 2452638 +PREHOOK: query: explain insert overwrite table ss_part partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + distribute by ss_sold_date_sk +PREHOOK: type: QUERY +POSTHOOK: query: explain insert overwrite table ss_part partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + distribute by ss_sold_date_sk +POSTHOOK: type: QUERY +STAGE DEPENDENCIES: + Stage-1 is a root stage + Stage-0 depends on stages: Stage-1 + Stage-2 depends on stages: Stage-0 + +STAGE PLANS: + Stage: Stage-1 + Map Reduce + Map Operator Tree: + TableScan + alias: ss + Statistics: Num rows: 46 Data size: 553 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: ((ss_sold_date_sk >= 2452617) and (ss_sold_date_sk <= 2452638)) (type: boolean) + Statistics: Num rows: 5 Data size: 60 Basic stats: COMPLETE Column stats: NONE + Select Operator + expressions: ss_net_paid_inc_tax (type: float), ss_net_profit (type: float), ss_sold_date_sk (type: int) + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 5 Data size: 60 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + sort order: + Map-reduce partition columns: _col2 (type: int) + Statistics: Num rows: 5 Data size: 60 Basic stats: COMPLETE Column stats: NONE + value expressions: _col0 (type: float), _col1 (type: float), _col2 (type: int) + Reduce Operator Tree: + Select Operator + expressions: VALUE._col0 (type: float), VALUE._col1 (type: float), VALUE._col2 (type: int) + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 5 Data size: 60 Basic stats: COMPLETE Column stats: NONE + File Output Operator + compressed: false + Statistics: Num rows: 5 Data size: 60 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.ss_part + + Stage: Stage-0 + Move Operator + tables: + partition: + ss_sold_date_sk + replace: true + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.ss_part + + Stage: Stage-2 + Stats-Aggr Operator + +PREHOOK: query: insert overwrite table ss_part partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + distribute by ss_sold_date_sk +PREHOOK: type: QUERY +PREHOOK: Input: default@ss +PREHOOK: Output: default@ss_part +POSTHOOK: query: insert overwrite table ss_part partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + distribute by ss_sold_date_sk +POSTHOOK: type: QUERY +POSTHOOK: Input: default@ss +POSTHOOK: Output: default@ss_part@ss_sold_date_sk=2452617 +POSTHOOK: Output: default@ss_part@ss_sold_date_sk=2452638 +POSTHOOK: Lineage: ss_part PARTITION(ss_sold_date_sk=2452617).ss_net_paid_inc_tax SIMPLE [(ss)ss.FieldSchema(name:ss_net_paid_inc_tax, type:float, comment:null), ] +POSTHOOK: Lineage: ss_part PARTITION(ss_sold_date_sk=2452617).ss_net_profit SIMPLE [(ss)ss.FieldSchema(name:ss_net_profit, type:float, comment:null), ] +POSTHOOK: Lineage: ss_part PARTITION(ss_sold_date_sk=2452638).ss_net_paid_inc_tax SIMPLE [(ss)ss.FieldSchema(name:ss_net_paid_inc_tax, type:float, comment:null), ] +POSTHOOK: Lineage: ss_part PARTITION(ss_sold_date_sk=2452638).ss_net_profit SIMPLE [(ss)ss.FieldSchema(name:ss_net_profit, type:float, comment:null), ] +PREHOOK: query: desc formatted ss_part partition(ss_sold_date_sk=2452617) +PREHOOK: type: DESCTABLE +PREHOOK: Input: default@ss_part +POSTHOOK: query: desc formatted ss_part partition(ss_sold_date_sk=2452617) +POSTHOOK: type: DESCTABLE +POSTHOOK: Input: default@ss_part +# col_name data_type comment + +ss_net_paid_inc_tax float +ss_net_profit float + +# Partition Information +# col_name data_type comment + +ss_sold_date_sk int + +# Detailed Partition Information +Partition Value: [2452617] +Database: default +Table: ss_part +#### A masked pattern was here #### +Protect Mode: None +#### A masked pattern was here #### +Partition Parameters: + COLUMN_STATS_ACCURATE true + numFiles 1 + numRows 11 + rawDataSize 151 + totalSize 162 +#### A masked pattern was here #### + +# Storage Information +SerDe Library: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe +InputFormat: org.apache.hadoop.mapred.TextInputFormat +OutputFormat: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat +Compressed: No +Num Buckets: -1 +Bucket Columns: [] +Sort Columns: [] +Storage Desc Params: + serialization.format 1 +PREHOOK: query: select * from ss_part where ss_sold_date_sk=2452617 +PREHOOK: type: QUERY +PREHOOK: Input: default@ss_part +PREHOOK: Input: default@ss_part@ss_sold_date_sk=2452617 +#### A masked pattern was here #### +POSTHOOK: query: select * from ss_part where ss_sold_date_sk=2452617 +POSTHOOK: type: QUERY +POSTHOOK: Input: default@ss_part +POSTHOOK: Input: default@ss_part@ss_sold_date_sk=2452617 +#### A masked pattern was here #### +3423.95 -3164.07 2452617 +5362.01 -600.28 2452617 +565.92 196.48 2452617 +85.8 25.61 2452617 +7412.83 2071.68 2452617 +879.07 -2185.76 2452617 +1765.07 -4648.8 2452617 +552.96 -1363.84 2452617 +2.1 -2026.3 2452617 +10022.63 3952.8 2452617 +2.99 -11.32 2452617 +PREHOOK: query: desc formatted ss_part partition(ss_sold_date_sk=2452638) +PREHOOK: type: DESCTABLE +PREHOOK: Input: default@ss_part +POSTHOOK: query: desc formatted ss_part partition(ss_sold_date_sk=2452638) +POSTHOOK: type: DESCTABLE +POSTHOOK: Input: default@ss_part +# col_name data_type comment + +ss_net_paid_inc_tax float +ss_net_profit float + +# Partition Information +# col_name data_type comment + +ss_sold_date_sk int + +# Detailed Partition Information +Partition Value: [2452638] +Database: default +Table: ss_part +#### A masked pattern was here #### +Protect Mode: None +#### A masked pattern was here #### +Partition Parameters: + COLUMN_STATS_ACCURATE true + numFiles 1 + numRows 13 + rawDataSize 186 + totalSize 199 +#### A masked pattern was here #### + +# Storage Information +SerDe Library: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe +InputFormat: org.apache.hadoop.mapred.TextInputFormat +OutputFormat: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat +Compressed: No +Num Buckets: -1 +Bucket Columns: [] +Sort Columns: [] +Storage Desc Params: + serialization.format 1 +PREHOOK: query: select * from ss_part where ss_sold_date_sk=2452638 +PREHOOK: type: QUERY +PREHOOK: Input: default@ss_part +PREHOOK: Input: default@ss_part@ss_sold_date_sk=2452638 +#### A masked pattern was here #### +POSTHOOK: query: select * from ss_part where ss_sold_date_sk=2452638 +POSTHOOK: type: QUERY +POSTHOOK: Input: default@ss_part +POSTHOOK: Input: default@ss_part@ss_sold_date_sk=2452638 +#### A masked pattern was here #### +4329.49 -4000.51 2452638 +1413.19 178.08 2452638 +150.39 -162.12 2452638 +1524.33 494.37 2452638 +0.15 -241.22 2452638 +267.01 -3266.36 2452638 +181.03 -207.24 2452638 +1971.35 -488.25 2452638 +1327.08 57.97 2452638 +156.67 -4626.56 2452638 +317.87 -3775.38 2452638 +10171.1 660.48 2452638 +4133.98 -775.72 2452638 +PREHOOK: query: -- VECTORIZATION IS ENABLED + +create table ss_orc ( +ss_sold_date_sk int, +ss_net_paid_inc_tax float, +ss_net_profit float) stored as orc +PREHOOK: type: CREATETABLE +PREHOOK: Output: database:default +PREHOOK: Output: default@ss_orc +POSTHOOK: query: -- VECTORIZATION IS ENABLED + +create table ss_orc ( +ss_sold_date_sk int, +ss_net_paid_inc_tax float, +ss_net_profit float) stored as orc +POSTHOOK: type: CREATETABLE +POSTHOOK: Output: database:default +POSTHOOK: Output: default@ss_orc +PREHOOK: query: create table ss_part_orc ( +ss_net_paid_inc_tax float, +ss_net_profit float) +partitioned by (ss_sold_date_sk int) stored as orc +PREHOOK: type: CREATETABLE +PREHOOK: Output: database:default +PREHOOK: Output: default@ss_part_orc +POSTHOOK: query: create table ss_part_orc ( +ss_net_paid_inc_tax float, +ss_net_profit float) +partitioned by (ss_sold_date_sk int) stored as orc +POSTHOOK: type: CREATETABLE +POSTHOOK: Output: database:default +POSTHOOK: Output: default@ss_part_orc +PREHOOK: query: insert overwrite table ss_orc select * from ss +PREHOOK: type: QUERY +PREHOOK: Input: default@ss +PREHOOK: Output: default@ss_orc +POSTHOOK: query: insert overwrite table ss_orc select * from ss +POSTHOOK: type: QUERY +POSTHOOK: Input: default@ss +POSTHOOK: Output: default@ss_orc +POSTHOOK: Lineage: ss_orc.ss_net_paid_inc_tax SIMPLE [(ss)ss.FieldSchema(name:ss_net_paid_inc_tax, type:float, comment:null), ] +POSTHOOK: Lineage: ss_orc.ss_net_profit SIMPLE [(ss)ss.FieldSchema(name:ss_net_profit, type:float, comment:null), ] +POSTHOOK: Lineage: ss_orc.ss_sold_date_sk SIMPLE [(ss)ss.FieldSchema(name:ss_sold_date_sk, type:int, comment:null), ] +PREHOOK: query: drop table ss +PREHOOK: type: DROPTABLE +PREHOOK: Input: default@ss +PREHOOK: Output: default@ss +POSTHOOK: query: drop table ss +POSTHOOK: type: DROPTABLE +POSTHOOK: Input: default@ss +POSTHOOK: Output: default@ss +PREHOOK: query: drop table ss_part +PREHOOK: type: DROPTABLE +PREHOOK: Input: default@ss_part +PREHOOK: Output: default@ss_part +POSTHOOK: query: drop table ss_part +POSTHOOK: type: DROPTABLE +POSTHOOK: Input: default@ss_part +POSTHOOK: Output: default@ss_part +PREHOOK: query: explain insert overwrite table ss_part_orc partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss_orc + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + group by ss_sold_date_sk, + ss_net_paid_inc_tax, + ss_net_profit + distribute by ss_sold_date_sk +PREHOOK: type: QUERY +POSTHOOK: query: explain insert overwrite table ss_part_orc partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss_orc + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + group by ss_sold_date_sk, + ss_net_paid_inc_tax, + ss_net_profit + distribute by ss_sold_date_sk +POSTHOOK: type: QUERY +STAGE DEPENDENCIES: + Stage-1 is a root stage + Stage-0 depends on stages: Stage-1 + Stage-2 depends on stages: Stage-0 + +STAGE PLANS: + Stage: Stage-1 + Map Reduce + Map Operator Tree: + TableScan + alias: ss_orc + Statistics: Num rows: 24 Data size: 288 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: ((ss_sold_date_sk >= 2452617) and (ss_sold_date_sk <= 2452638)) (type: boolean) + Statistics: Num rows: 2 Data size: 24 Basic stats: COMPLETE Column stats: NONE + Select Operator + expressions: ss_sold_date_sk (type: int), ss_net_paid_inc_tax (type: float), ss_net_profit (type: float) + outputColumnNames: ss_sold_date_sk, ss_net_paid_inc_tax, ss_net_profit + Statistics: Num rows: 2 Data size: 24 Basic stats: COMPLETE Column stats: NONE + Group By Operator + keys: ss_sold_date_sk (type: int), ss_net_paid_inc_tax (type: float), ss_net_profit (type: float) + mode: hash + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 2 Data size: 24 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + key expressions: _col0 (type: int), _col1 (type: float), _col2 (type: float) + sort order: +++ + Map-reduce partition columns: _col0 (type: int) + Statistics: Num rows: 2 Data size: 24 Basic stats: COMPLETE Column stats: NONE + Execution mode: vectorized + Reduce Operator Tree: + Group By Operator + keys: KEY._col0 (type: int), KEY._col1 (type: float), KEY._col2 (type: float) + mode: mergepartial + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 1 Data size: 12 Basic stats: COMPLETE Column stats: NONE + Select Operator + expressions: _col1 (type: float), _col2 (type: float), _col0 (type: int) + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 1 Data size: 12 Basic stats: COMPLETE Column stats: NONE + File Output Operator + compressed: false + Statistics: Num rows: 1 Data size: 12 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat + output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat + serde: org.apache.hadoop.hive.ql.io.orc.OrcSerde + name: default.ss_part_orc + + Stage: Stage-0 + Move Operator + tables: + partition: + ss_sold_date_sk + replace: true + table: + input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat + output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat + serde: org.apache.hadoop.hive.ql.io.orc.OrcSerde + name: default.ss_part_orc + + Stage: Stage-2 + Stats-Aggr Operator + +PREHOOK: query: insert overwrite table ss_part_orc partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss_orc + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + group by ss_sold_date_sk, + ss_net_paid_inc_tax, + ss_net_profit + distribute by ss_sold_date_sk +PREHOOK: type: QUERY +PREHOOK: Input: default@ss_orc +PREHOOK: Output: default@ss_part_orc +POSTHOOK: query: insert overwrite table ss_part_orc partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss_orc + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + group by ss_sold_date_sk, + ss_net_paid_inc_tax, + ss_net_profit + distribute by ss_sold_date_sk +POSTHOOK: type: QUERY +POSTHOOK: Input: default@ss_orc +POSTHOOK: Output: default@ss_part_orc@ss_sold_date_sk=2452617 +POSTHOOK: Output: default@ss_part_orc@ss_sold_date_sk=2452638 +POSTHOOK: Lineage: ss_part_orc PARTITION(ss_sold_date_sk=2452617).ss_net_paid_inc_tax SIMPLE [(ss_orc)ss_orc.FieldSchema(name:ss_net_paid_inc_tax, type:float, comment:null), ] +POSTHOOK: Lineage: ss_part_orc PARTITION(ss_sold_date_sk=2452617).ss_net_profit SIMPLE [(ss_orc)ss_orc.FieldSchema(name:ss_net_profit, type:float, comment:null), ] +POSTHOOK: Lineage: ss_part_orc PARTITION(ss_sold_date_sk=2452638).ss_net_paid_inc_tax SIMPLE [(ss_orc)ss_orc.FieldSchema(name:ss_net_paid_inc_tax, type:float, comment:null), ] +POSTHOOK: Lineage: ss_part_orc PARTITION(ss_sold_date_sk=2452638).ss_net_profit SIMPLE [(ss_orc)ss_orc.FieldSchema(name:ss_net_profit, type:float, comment:null), ] +PREHOOK: query: desc formatted ss_part_orc partition(ss_sold_date_sk=2452617) +PREHOOK: type: DESCTABLE +PREHOOK: Input: default@ss_part_orc +POSTHOOK: query: desc formatted ss_part_orc partition(ss_sold_date_sk=2452617) +POSTHOOK: type: DESCTABLE +POSTHOOK: Input: default@ss_part_orc +# col_name data_type comment + +ss_net_paid_inc_tax float +ss_net_profit float + +# Partition Information +# col_name data_type comment + +ss_sold_date_sk int + +# Detailed Partition Information +Partition Value: [2452617] +Database: default +Table: ss_part_orc +#### A masked pattern was here #### +Protect Mode: None +#### A masked pattern was here #### +Partition Parameters: + COLUMN_STATS_ACCURATE true + numFiles 1 + numRows 11 + rawDataSize 88 + totalSize 417 +#### A masked pattern was here #### + +# Storage Information +SerDe Library: org.apache.hadoop.hive.ql.io.orc.OrcSerde +InputFormat: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat +OutputFormat: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat +Compressed: No +Num Buckets: -1 +Bucket Columns: [] +Sort Columns: [] +Storage Desc Params: + serialization.format 1 +PREHOOK: query: select * from ss_part_orc where ss_sold_date_sk=2452617 +PREHOOK: type: QUERY +PREHOOK: Input: default@ss_part_orc +PREHOOK: Input: default@ss_part_orc@ss_sold_date_sk=2452617 +#### A masked pattern was here #### +POSTHOOK: query: select * from ss_part_orc where ss_sold_date_sk=2452617 +POSTHOOK: type: QUERY +POSTHOOK: Input: default@ss_part_orc +POSTHOOK: Input: default@ss_part_orc@ss_sold_date_sk=2452617 +#### A masked pattern was here #### +2.1 -2026.3 2452617 +2.99 -11.32 2452617 +85.8 25.61 2452617 +552.96 -1363.84 2452617 +565.92 196.48 2452617 +879.07 -2185.76 2452617 +1765.07 -4648.8 2452617 +3423.95 -3164.07 2452617 +5362.01 -600.28 2452617 +7412.83 2071.68 2452617 +10022.63 3952.8 2452617 +PREHOOK: query: desc formatted ss_part_orc partition(ss_sold_date_sk=2452638) +PREHOOK: type: DESCTABLE +PREHOOK: Input: default@ss_part_orc +POSTHOOK: query: desc formatted ss_part_orc partition(ss_sold_date_sk=2452638) +POSTHOOK: type: DESCTABLE +POSTHOOK: Input: default@ss_part_orc +# col_name data_type comment + +ss_net_paid_inc_tax float +ss_net_profit float + +# Partition Information +# col_name data_type comment + +ss_sold_date_sk int + +# Detailed Partition Information +Partition Value: [2452638] +Database: default +Table: ss_part_orc +#### A masked pattern was here #### +Protect Mode: None +#### A masked pattern was here #### +Partition Parameters: + COLUMN_STATS_ACCURATE true + numFiles 1 + numRows 13 + rawDataSize 104 + totalSize 440 +#### A masked pattern was here #### + +# Storage Information +SerDe Library: org.apache.hadoop.hive.ql.io.orc.OrcSerde +InputFormat: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat +OutputFormat: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat +Compressed: No +Num Buckets: -1 +Bucket Columns: [] +Sort Columns: [] +Storage Desc Params: + serialization.format 1 +PREHOOK: query: select * from ss_part_orc where ss_sold_date_sk=2452638 +PREHOOK: type: QUERY +PREHOOK: Input: default@ss_part_orc +PREHOOK: Input: default@ss_part_orc@ss_sold_date_sk=2452638 +#### A masked pattern was here #### +POSTHOOK: query: select * from ss_part_orc where ss_sold_date_sk=2452638 +POSTHOOK: type: QUERY +POSTHOOK: Input: default@ss_part_orc +POSTHOOK: Input: default@ss_part_orc@ss_sold_date_sk=2452638 +#### A masked pattern was here #### +0.15 -241.22 2452638 +150.39 -162.12 2452638 +156.67 -4626.56 2452638 +181.03 -207.24 2452638 +267.01 -3266.36 2452638 +317.87 -3775.38 2452638 +1327.08 57.97 2452638 +1413.19 178.08 2452638 +1524.33 494.37 2452638 +1971.35 -488.25 2452638 +4133.98 -775.72 2452638 +4329.49 -4000.51 2452638 +10171.1 660.48 2452638 +PREHOOK: query: explain insert overwrite table ss_part_orc partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss_orc + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + distribute by ss_sold_date_sk +PREHOOK: type: QUERY +POSTHOOK: query: explain insert overwrite table ss_part_orc partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss_orc + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + distribute by ss_sold_date_sk +POSTHOOK: type: QUERY +STAGE DEPENDENCIES: + Stage-1 is a root stage + Stage-0 depends on stages: Stage-1 + Stage-2 depends on stages: Stage-0 + +STAGE PLANS: + Stage: Stage-1 + Map Reduce + Map Operator Tree: + TableScan + alias: ss_orc + Statistics: Num rows: 24 Data size: 288 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: ((ss_sold_date_sk >= 2452617) and (ss_sold_date_sk <= 2452638)) (type: boolean) + Statistics: Num rows: 2 Data size: 24 Basic stats: COMPLETE Column stats: NONE + Select Operator + expressions: ss_net_paid_inc_tax (type: float), ss_net_profit (type: float), ss_sold_date_sk (type: int) + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 2 Data size: 24 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + sort order: + Map-reduce partition columns: _col2 (type: int) + Statistics: Num rows: 2 Data size: 24 Basic stats: COMPLETE Column stats: NONE + value expressions: _col0 (type: float), _col1 (type: float), _col2 (type: int) + Execution mode: vectorized + Reduce Operator Tree: + Select Operator + expressions: VALUE._col0 (type: float), VALUE._col1 (type: float), VALUE._col2 (type: int) + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 2 Data size: 24 Basic stats: COMPLETE Column stats: NONE + File Output Operator + compressed: false + Statistics: Num rows: 2 Data size: 24 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat + output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat + serde: org.apache.hadoop.hive.ql.io.orc.OrcSerde + name: default.ss_part_orc + + Stage: Stage-0 + Move Operator + tables: + partition: + ss_sold_date_sk + replace: true + table: + input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat + output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat + serde: org.apache.hadoop.hive.ql.io.orc.OrcSerde + name: default.ss_part_orc + + Stage: Stage-2 + Stats-Aggr Operator + +PREHOOK: query: insert overwrite table ss_part_orc partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss_orc + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + distribute by ss_sold_date_sk +PREHOOK: type: QUERY +PREHOOK: Input: default@ss_orc +PREHOOK: Output: default@ss_part_orc +POSTHOOK: query: insert overwrite table ss_part_orc partition (ss_sold_date_sk) +select ss_net_paid_inc_tax, + ss_net_profit, + ss_sold_date_sk + from ss_orc + where ss_sold_date_sk>=2452617 and ss_sold_date_sk<=2452638 + distribute by ss_sold_date_sk +POSTHOOK: type: QUERY +POSTHOOK: Input: default@ss_orc +POSTHOOK: Output: default@ss_part_orc@ss_sold_date_sk=2452617 +POSTHOOK: Output: default@ss_part_orc@ss_sold_date_sk=2452638 +POSTHOOK: Lineage: ss_part_orc PARTITION(ss_sold_date_sk=2452617).ss_net_paid_inc_tax SIMPLE [(ss_orc)ss_orc.FieldSchema(name:ss_net_paid_inc_tax, type:float, comment:null), ] +POSTHOOK: Lineage: ss_part_orc PARTITION(ss_sold_date_sk=2452617).ss_net_profit SIMPLE [(ss_orc)ss_orc.FieldSchema(name:ss_net_profit, type:float, comment:null), ] +POSTHOOK: Lineage: ss_part_orc PARTITION(ss_sold_date_sk=2452638).ss_net_paid_inc_tax SIMPLE [(ss_orc)ss_orc.FieldSchema(name:ss_net_paid_inc_tax, type:float, comment:null), ] +POSTHOOK: Lineage: ss_part_orc PARTITION(ss_sold_date_sk=2452638).ss_net_profit SIMPLE [(ss_orc)ss_orc.FieldSchema(name:ss_net_profit, type:float, comment:null), ] +PREHOOK: query: desc formatted ss_part_orc partition(ss_sold_date_sk=2452617) +PREHOOK: type: DESCTABLE +PREHOOK: Input: default@ss_part_orc +POSTHOOK: query: desc formatted ss_part_orc partition(ss_sold_date_sk=2452617) +POSTHOOK: type: DESCTABLE +POSTHOOK: Input: default@ss_part_orc +# col_name data_type comment + +ss_net_paid_inc_tax float +ss_net_profit float + +# Partition Information +# col_name data_type comment + +ss_sold_date_sk int + +# Detailed Partition Information +Partition Value: [2452617] +Database: default +Table: ss_part_orc +#### A masked pattern was here #### +Protect Mode: None +#### A masked pattern was here #### +Partition Parameters: + COLUMN_STATS_ACCURATE true + numFiles 1 + numRows 11 + rawDataSize 88 + totalSize 417 +#### A masked pattern was here #### + +# Storage Information +SerDe Library: org.apache.hadoop.hive.ql.io.orc.OrcSerde +InputFormat: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat +OutputFormat: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat +Compressed: No +Num Buckets: -1 +Bucket Columns: [] +Sort Columns: [] +Storage Desc Params: + serialization.format 1 +PREHOOK: query: select * from ss_part_orc where ss_sold_date_sk=2452617 +PREHOOK: type: QUERY +PREHOOK: Input: default@ss_part_orc +PREHOOK: Input: default@ss_part_orc@ss_sold_date_sk=2452617 +#### A masked pattern was here #### +POSTHOOK: query: select * from ss_part_orc where ss_sold_date_sk=2452617 +POSTHOOK: type: QUERY +POSTHOOK: Input: default@ss_part_orc +POSTHOOK: Input: default@ss_part_orc@ss_sold_date_sk=2452617 +#### A masked pattern was here #### +3423.95 -3164.07 2452617 +5362.01 -600.28 2452617 +565.92 196.48 2452617 +85.8 25.61 2452617 +7412.83 2071.68 2452617 +879.07 -2185.76 2452617 +1765.07 -4648.8 2452617 +552.96 -1363.84 2452617 +2.1 -2026.3 2452617 +10022.63 3952.8 2452617 +2.99 -11.32 2452617 +PREHOOK: query: desc formatted ss_part_orc partition(ss_sold_date_sk=2452638) +PREHOOK: type: DESCTABLE +PREHOOK: Input: default@ss_part_orc +POSTHOOK: query: desc formatted ss_part_orc partition(ss_sold_date_sk=2452638) +POSTHOOK: type: DESCTABLE +POSTHOOK: Input: default@ss_part_orc +# col_name data_type comment + +ss_net_paid_inc_tax float +ss_net_profit float + +# Partition Information +# col_name data_type comment + +ss_sold_date_sk int + +# Detailed Partition Information +Partition Value: [2452638] +Database: default +Table: ss_part_orc +#### A masked pattern was here #### +Protect Mode: None +#### A masked pattern was here #### +Partition Parameters: + COLUMN_STATS_ACCURATE true + numFiles 1 + numRows 13 + rawDataSize 104 + totalSize 440 +#### A masked pattern was here #### + +# Storage Information +SerDe Library: org.apache.hadoop.hive.ql.io.orc.OrcSerde +InputFormat: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat +OutputFormat: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat +Compressed: No +Num Buckets: -1 +Bucket Columns: [] +Sort Columns: [] +Storage Desc Params: + serialization.format 1 +PREHOOK: query: select * from ss_part_orc where ss_sold_date_sk=2452638 +PREHOOK: type: QUERY +PREHOOK: Input: default@ss_part_orc +PREHOOK: Input: default@ss_part_orc@ss_sold_date_sk=2452638 +#### A masked pattern was here #### +POSTHOOK: query: select * from ss_part_orc where ss_sold_date_sk=2452638 +POSTHOOK: type: QUERY +POSTHOOK: Input: default@ss_part_orc +POSTHOOK: Input: default@ss_part_orc@ss_sold_date_sk=2452638 +#### A masked pattern was here #### +4329.49 -4000.51 2452638 +1413.19 178.08 2452638 +150.39 -162.12 2452638 +1524.33 494.37 2452638 +0.15 -241.22 2452638 +267.01 -3266.36 2452638 +181.03 -207.24 2452638 +1971.35 -488.25 2452638 +1327.08 57.97 2452638 +156.67 -4626.56 2452638 +317.87 -3775.38 2452638 +10171.1 660.48 2452638 +4133.98 -775.72 2452638 +PREHOOK: query: drop table ss_orc +PREHOOK: type: DROPTABLE +PREHOOK: Input: default@ss_orc +PREHOOK: Output: default@ss_orc +POSTHOOK: query: drop table ss_orc +POSTHOOK: type: DROPTABLE +POSTHOOK: Input: default@ss_orc +POSTHOOK: Output: default@ss_orc +PREHOOK: query: drop table ss_part_orc +PREHOOK: type: DROPTABLE +PREHOOK: Input: default@ss_part_orc +PREHOOK: Output: default@ss_part_orc +POSTHOOK: query: drop table ss_part_orc +POSTHOOK: type: DROPTABLE +POSTHOOK: Input: default@ss_part_orc +POSTHOOK: Output: default@ss_part_orc +PREHOOK: query: drop table if exists hive13_dp1 +PREHOOK: type: DROPTABLE +POSTHOOK: query: drop table if exists hive13_dp1 +POSTHOOK: type: DROPTABLE +PREHOOK: query: create table if not exists hive13_dp1 ( + k1 int, + k2 int +) +PARTITIONED BY(`day` string) +STORED AS ORC +PREHOOK: type: CREATETABLE +PREHOOK: Output: database:default +PREHOOK: Output: default@hive13_dp1 +POSTHOOK: query: create table if not exists hive13_dp1 ( + k1 int, + k2 int +) +PARTITIONED BY(`day` string) +STORED AS ORC +POSTHOOK: type: CREATETABLE +POSTHOOK: Output: database:default +POSTHOOK: Output: default@hive13_dp1 +PREHOOK: query: explain insert overwrite table `hive13_dp1` partition(`day`) +select + key k1, + count(value) k2, + "day" `day` +from src +group by "day", key +PREHOOK: type: QUERY +POSTHOOK: query: explain insert overwrite table `hive13_dp1` partition(`day`) +select + key k1, + count(value) k2, + "day" `day` +from src +group by "day", key +POSTHOOK: type: QUERY +STAGE DEPENDENCIES: + Stage-1 is a root stage + Stage-0 depends on stages: Stage-1 + Stage-2 depends on stages: Stage-0 + +STAGE PLANS: + Stage: Stage-1 + Map Reduce + Map Operator Tree: + TableScan + alias: src + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Select Operator + expressions: key (type: string), value (type: string) + outputColumnNames: key, value + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Group By Operator + aggregations: count(value) + keys: 'day' (type: string), key (type: string) + mode: hash + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + key expressions: _col0 (type: string), _col1 (type: string) + sort order: ++ + Map-reduce partition columns: _col0 (type: string), _col1 (type: string) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + value expressions: _col2 (type: bigint) + Reduce Operator Tree: + Group By Operator + aggregations: count(VALUE._col0) + keys: KEY._col0 (type: string), KEY._col1 (type: string) + mode: mergepartial + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE + Select Operator + expressions: UDFToInteger(_col1) (type: int), UDFToInteger(_col2) (type: int), _col0 (type: string) + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE + File Output Operator + compressed: false + Statistics: Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat + output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat + serde: org.apache.hadoop.hive.ql.io.orc.OrcSerde + name: default.hive13_dp1 + + Stage: Stage-0 + Move Operator + tables: + partition: + day + replace: true + table: + input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat + output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat + serde: org.apache.hadoop.hive.ql.io.orc.OrcSerde + name: default.hive13_dp1 + + Stage: Stage-2 + Stats-Aggr Operator + +PREHOOK: query: insert overwrite table `hive13_dp1` partition(`day`) +select + key k1, + count(value) k2, + "day" `day` +from src +group by "day", key +PREHOOK: type: QUERY +PREHOOK: Input: default@src +PREHOOK: Output: default@hive13_dp1 +POSTHOOK: query: insert overwrite table `hive13_dp1` partition(`day`) +select + key k1, + count(value) k2, + "day" `day` +from src +group by "day", key +POSTHOOK: type: QUERY +POSTHOOK: Input: default@src +POSTHOOK: Output: default@hive13_dp1@day=day +POSTHOOK: Lineage: hive13_dp1 PARTITION(day=day).k1 EXPRESSION [(src)src.FieldSchema(name:key, type:string, comment:default), ] +POSTHOOK: Lineage: hive13_dp1 PARTITION(day=day).k2 EXPRESSION [(src)src.FieldSchema(name:value, type:string, comment:default), ] +PREHOOK: query: select * from hive13_dp1 limit 5 +PREHOOK: type: QUERY +PREHOOK: Input: default@hive13_dp1 +PREHOOK: Input: default@hive13_dp1@day=day +#### A masked pattern was here #### +POSTHOOK: query: select * from hive13_dp1 limit 5 +POSTHOOK: type: QUERY +POSTHOOK: Input: default@hive13_dp1 +POSTHOOK: Input: default@hive13_dp1@day=day +#### A masked pattern was here #### +0 3 day +10 1 day +100 2 day +103 2 day +104 2 day +PREHOOK: query: explain insert overwrite table `hive13_dp1` partition(`day`) +select + key k1, + count(value) k2, + "day" `day` +from src +group by "day", key +PREHOOK: type: QUERY +POSTHOOK: query: explain insert overwrite table `hive13_dp1` partition(`day`) +select + key k1, + count(value) k2, + "day" `day` +from src +group by "day", key +POSTHOOK: type: QUERY +STAGE DEPENDENCIES: + Stage-1 is a root stage + Stage-0 depends on stages: Stage-1 + Stage-2 depends on stages: Stage-0 + +STAGE PLANS: + Stage: Stage-1 + Map Reduce + Map Operator Tree: + TableScan + alias: src + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Select Operator + expressions: key (type: string), value (type: string) + outputColumnNames: key, value + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Group By Operator + aggregations: count(value) + keys: 'day' (type: string), key (type: string) + mode: hash + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + key expressions: _col0 (type: string), _col1 (type: string) + sort order: ++ + Map-reduce partition columns: _col0 (type: string) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + value expressions: _col2 (type: bigint) + Reduce Operator Tree: + Group By Operator + aggregations: count(VALUE._col0) + keys: KEY._col0 (type: string), KEY._col1 (type: string) + mode: mergepartial + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE + Select Operator + expressions: UDFToInteger(_col1) (type: int), UDFToInteger(_col2) (type: int), _col0 (type: string) + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE + File Output Operator + compressed: false + Statistics: Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat + output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat + serde: org.apache.hadoop.hive.ql.io.orc.OrcSerde + name: default.hive13_dp1 + + Stage: Stage-0 + Move Operator + tables: + partition: + day + replace: true + table: + input format: org.apache.hadoop.hive.ql.io.orc.OrcInputFormat + output format: org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat + serde: org.apache.hadoop.hive.ql.io.orc.OrcSerde + name: default.hive13_dp1 + + Stage: Stage-2 + Stats-Aggr Operator + +PREHOOK: query: insert overwrite table `hive13_dp1` partition(`day`) +select + key k1, + count(value) k2, + "day" `day` +from src +group by "day", key +PREHOOK: type: QUERY +PREHOOK: Input: default@src +PREHOOK: Output: default@hive13_dp1 +POSTHOOK: query: insert overwrite table `hive13_dp1` partition(`day`) +select + key k1, + count(value) k2, + "day" `day` +from src +group by "day", key +POSTHOOK: type: QUERY +POSTHOOK: Input: default@src +POSTHOOK: Output: default@hive13_dp1@day=day +POSTHOOK: Lineage: hive13_dp1 PARTITION(day=day).k1 EXPRESSION [(src)src.FieldSchema(name:key, type:string, comment:default), ] +POSTHOOK: Lineage: hive13_dp1 PARTITION(day=day).k2 EXPRESSION [(src)src.FieldSchema(name:value, type:string, comment:default), ] +PREHOOK: query: select * from hive13_dp1 limit 5 +PREHOOK: type: QUERY +PREHOOK: Input: default@hive13_dp1 +PREHOOK: Input: default@hive13_dp1@day=day +#### A masked pattern was here #### +POSTHOOK: query: select * from hive13_dp1 limit 5 +POSTHOOK: type: QUERY +POSTHOOK: Input: default@hive13_dp1 +POSTHOOK: Input: default@hive13_dp1@day=day +#### A masked pattern was here #### +0 3 day +10 1 day +100 2 day +103 2 day +104 2 day +PREHOOK: query: drop table hive13_dp1 +PREHOOK: type: DROPTABLE +PREHOOK: Input: default@hive13_dp1 +PREHOOK: Output: default@hive13_dp1 +POSTHOOK: query: drop table hive13_dp1 +POSTHOOK: type: DROPTABLE +POSTHOOK: Input: default@hive13_dp1 +POSTHOOK: Output: default@hive13_dp1 Modified: hive/branches/branch-0.14/ql/src/test/results/clientpositive/extrapolate_part_stats_partial.q.out URL: http://svn.apache.org/viewvc/hive/branches/branch-0.14/ql/src/test/results/clientpositive/extrapolate_part_stats_partial.q.out?rev=1628877&r1=1628876&r2=1628877&view=diff ============================================================================== Files hive/branches/branch-0.14/ql/src/test/results/clientpositive/extrapolate_part_stats_partial.q.out (original) and hive/branches/branch-0.14/ql/src/test/results/clientpositive/extrapolate_part_stats_partial.q.out Thu Oct 2 01:59:44 2014 differ Modified: hive/branches/branch-0.14/ql/src/test/results/clientpositive/groupby4_map.q.out URL: http://svn.apache.org/viewvc/hive/branches/branch-0.14/ql/src/test/results/clientpositive/groupby4_map.q.out?rev=1628877&r1=1628876&r2=1628877&view=diff ============================================================================== --- hive/branches/branch-0.14/ql/src/test/results/clientpositive/groupby4_map.q.out (original) +++ hive/branches/branch-0.14/ql/src/test/results/clientpositive/groupby4_map.q.out Thu Oct 2 01:59:44 2014 @@ -44,10 +44,10 @@ STAGE PLANS: Select Operator expressions: UDFToInteger(_col0) (type: int) outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1 Data size: 4 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1 Data size: 4 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.TextInputFormat output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat Modified: hive/branches/branch-0.14/ql/src/test/results/clientpositive/groupby4_map_skew.q.out URL: http://svn.apache.org/viewvc/hive/branches/branch-0.14/ql/src/test/results/clientpositive/groupby4_map_skew.q.out?rev=1628877&r1=1628876&r2=1628877&view=diff ============================================================================== --- hive/branches/branch-0.14/ql/src/test/results/clientpositive/groupby4_map_skew.q.out (original) +++ hive/branches/branch-0.14/ql/src/test/results/clientpositive/groupby4_map_skew.q.out Thu Oct 2 01:59:44 2014 @@ -44,10 +44,10 @@ STAGE PLANS: Select Operator expressions: UDFToInteger(_col0) (type: int) outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1 Data size: 4 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1 Data size: 4 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.TextInputFormat output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
