http://git-wip-us.apache.org/repos/asf/hive/blob/0f7163fa/ql/src/test/results/clientpositive/perf/tez/query50.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query50.q.out
b/ql/src/test/results/clientpositive/perf/tez/query50.q.out
index efbae5c..cdbaad7 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query50.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query50.q.out
@@ -117,157 +117,157 @@ POSTHOOK: type: QUERY
Plan optimized by CBO.
Vertex dependency in root stage
-Map 12 <- Reducer 10 (BROADCAST_EDGE), Reducer 14 (BROADCAST_EDGE), Reducer 16
(BROADCAST_EDGE), Reducer 8 (BROADCAST_EDGE), Reducer 9 (BROADCAST_EDGE)
-Reducer 10 <- Reducer 2 (CUSTOM_SIMPLE_EDGE)
+Map 1 <- Reducer 10 (BROADCAST_EDGE), Reducer 11 (BROADCAST_EDGE), Reducer 14
(BROADCAST_EDGE), Reducer 16 (BROADCAST_EDGE), Reducer 9 (BROADCAST_EDGE)
+Reducer 10 <- Map 8 (CUSTOM_SIMPLE_EDGE)
+Reducer 11 <- Map 8 (CUSTOM_SIMPLE_EDGE)
Reducer 14 <- Map 13 (CUSTOM_SIMPLE_EDGE)
Reducer 16 <- Map 15 (CUSTOM_SIMPLE_EDGE)
-Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 11 (SIMPLE_EDGE)
+Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 8 (SIMPLE_EDGE)
Reducer 3 <- Map 12 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE)
Reducer 4 <- Map 13 (SIMPLE_EDGE), Reducer 3 (SIMPLE_EDGE)
Reducer 5 <- Map 15 (SIMPLE_EDGE), Reducer 4 (SIMPLE_EDGE)
Reducer 6 <- Reducer 5 (SIMPLE_EDGE)
Reducer 7 <- Reducer 6 (SIMPLE_EDGE)
-Reducer 8 <- Reducer 2 (CUSTOM_SIMPLE_EDGE)
-Reducer 9 <- Reducer 2 (CUSTOM_SIMPLE_EDGE)
+Reducer 9 <- Map 8 (CUSTOM_SIMPLE_EDGE)
Stage-0
Fetch Operator
limit:100
Stage-1
Reducer 7 vectorized
- File Output Operator [FS_156]
- Limit [LIM_155] (rows=100 width=88)
+ File Output Operator [FS_165]
+ Limit [LIM_164] (rows=100 width=88)
Number of rows:100
- Select Operator [SEL_154] (rows=383325119 width=88)
+ Select Operator [SEL_163] (rows=421657640 width=88)
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"]
<-Reducer 6 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_153]
- Group By Operator [GBY_152] (rows=383325119 width=88)
+ SHUFFLE [RS_162]
+ Group By Operator [GBY_161] (rows=421657640 width=88)
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)","sum(VALUE._col3)","sum(VALUE._col4)"],keys:KEY._col0,
KEY._col1, KEY._col2, KEY._col3, KEY._col4, KEY._col5, KEY._col6, KEY._col7,
KEY._col8, KEY._col9
<-Reducer 5 [SIMPLE_EDGE]
SHUFFLE [RS_30]
PartitionCols:_col0, _col1, _col2, _col3, _col4, _col5,
_col6, _col7, _col8, _col9
- Group By Operator [GBY_29] (rows=766650239 width=88)
+ Group By Operator [GBY_29] (rows=843315281 width=88)
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"],aggregations:["sum(_col10)","sum(_col11)","sum(_col12)","sum(_col13)","sum(_col14)"],keys:_col0,
_col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9
- Top N Key Operator [TNK_56] (rows=766650239 width=88)
+ Top N Key Operator [TNK_56] (rows=843315281 width=88)
keys:_col0, _col1, _col2, _col3, _col4, _col5, _col6,
_col7, _col8, _col9,sort order:++++++++++,top n:100
- Select Operator [SEL_27] (rows=766650239 width=88)
+ Select Operator [SEL_27] (rows=843315281 width=88)
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"]
- Merge Join Operator [MERGEJOIN_120] (rows=766650239
width=88)
-
Conds:RS_24._col10=RS_143._col0(Inner),Output:["_col0","_col7","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23"]
+ Merge Join Operator [MERGEJOIN_120] (rows=843315281
width=88)
+
Conds:RS_24._col3=RS_149._col0(Inner),Output:["_col0","_col5","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23"]
<-Map 15 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_143]
+ SHUFFLE [RS_149]
PartitionCols:_col0
- Select Operator [SEL_142] (rows=1704 width=1910)
+ Select Operator [SEL_148] (rows=1704 width=1910)
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10"]
- Filter Operator [FIL_141] (rows=1704 width=1910)
+ Filter Operator [FIL_147] (rows=1704 width=1910)
predicate:s_store_sk is not null
TableScan [TS_12] (rows=1704 width=1910)
default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_name","s_company_id","s_street_number","s_street_name","s_street_type","s_suite_number","s_city","s_county","s_state","s_zip"]
<-Reducer 4 [SIMPLE_EDGE]
SHUFFLE [RS_24]
- PartitionCols:_col10
- Merge Join Operator [MERGEJOIN_119]
(rows=696954748 width=88)
-
Conds:RS_21._col7=RS_135._col0(Inner),Output:["_col0","_col7","_col10"]
+ PartitionCols:_col3
+ Merge Join Operator [MERGEJOIN_119]
(rows=766650239 width=88)
+
Conds:RS_21._col0=RS_141._col0(Inner),Output:["_col0","_col3","_col5"]
<-Map 13 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_135]
+ SHUFFLE [RS_141]
PartitionCols:_col0
- Select Operator [SEL_134] (rows=73049
width=1119)
+ Select Operator [SEL_140] (rows=73049
width=1119)
Output:["_col0"]
- Filter Operator [FIL_133] (rows=73049
width=1119)
+ Filter Operator [FIL_139] (rows=73049
width=1119)
predicate:d_date_sk is not null
TableScan [TS_9] (rows=73049 width=1119)
default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk"]
<-Reducer 3 [SIMPLE_EDGE]
SHUFFLE [RS_21]
- PartitionCols:_col7
- Merge Join Operator [MERGEJOIN_118]
(rows=633595212 width=88)
- Conds:RS_18._col1, _col2,
_col3=RS_151._col1, _col2, _col4(Inner),Output:["_col0","_col7","_col10"]
+ PartitionCols:_col0
+ Merge Join Operator [MERGEJOIN_118]
(rows=696954748 width=88)
+
Conds:RS_18._col5=RS_160._col0(Inner),Output:["_col0","_col3","_col5"]
+ <-Map 12 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_160]
+ PartitionCols:_col0
+ Select Operator [SEL_159] (rows=18262
width=1119)
+ Output:["_col0"]
+ Filter Operator [FIL_158] (rows=18262
width=1119)
+ predicate:((d_moy = 9) and (d_year =
2000) and d_date_sk is not null)
+ TableScan [TS_6] (rows=73049
width=1119)
+
default@date_dim,d2,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"]
<-Reducer 2 [SIMPLE_EDGE]
- PARTITION_ONLY_SHUFFLE [RS_18]
- PartitionCols:_col1, _col2, _col3
- Merge Join Operator [MERGEJOIN_117]
(rows=63350266 width=77)
-
Conds:RS_123._col0=RS_126._col0(Inner),Output:["_col0","_col1","_col2","_col3"]
- <-Map 1 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_123]
- PartitionCols:_col0
+ SHUFFLE [RS_18]
+ PartitionCols:_col5
+ Merge Join Operator [MERGEJOIN_117]
(rows=633595212 width=88)
+ Conds:RS_157._col1, _col2,
_col4=RS_123._col1, _col2, _col3(Inner),Output:["_col0","_col3","_col5"]
+ <-Map 8 [SIMPLE_EDGE] vectorized
+ PARTITION_ONLY_SHUFFLE [RS_123]
+ PartitionCols:_col1, _col2, _col3
Select Operator [SEL_122]
(rows=57591150 width=77)
Output:["_col0","_col1","_col2","_col3"]
Filter Operator [FIL_121]
(rows=57591150 width=77)
predicate:(sr_customer_sk is not
null and sr_item_sk is not null and sr_returned_date_sk is not null and
sr_ticket_number is not null)
- TableScan [TS_0] (rows=57591150
width=77)
+ TableScan [TS_3] (rows=57591150
width=77)
default@store_returns,store_returns,Tbl:COMPLETE,Col:NONE,Output:["sr_returned_date_sk","sr_item_sk","sr_customer_sk","sr_ticket_number"]
- <-Map 11 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_126]
- PartitionCols:_col0
- Select Operator [SEL_125] (rows=18262
width=1119)
- Output:["_col0"]
- Filter Operator [FIL_124]
(rows=18262 width=1119)
- predicate:((d_moy = 9) and (d_year
= 2000) and d_date_sk is not null)
- TableScan [TS_3] (rows=73049
width=1119)
-
default@date_dim,d2,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"]
- <-Map 12 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_151]
- PartitionCols:_col1, _col2, _col4
- Select Operator [SEL_150] (rows=575995635
width=88)
-
Output:["_col0","_col1","_col2","_col3","_col4"]
- Filter Operator [FIL_149]
(rows=575995635 width=88)
- predicate:((ss_customer_sk BETWEEN
DynamicValue(RS_18_store_returns_sr_customer_sk_min) AND
DynamicValue(RS_18_store_returns_sr_customer_sk_max) and
in_bloom_filter(ss_customer_sk,
DynamicValue(RS_18_store_returns_sr_customer_sk_bloom_filter))) and (ss_item_sk
BETWEEN DynamicValue(RS_18_store_returns_sr_item_sk_min) AND
DynamicValue(RS_18_store_returns_sr_item_sk_max) and
in_bloom_filter(ss_item_sk,
DynamicValue(RS_18_store_returns_sr_item_sk_bloom_filter))) and
(ss_sold_date_sk BETWEEN DynamicValue(RS_22_d1_d_date_sk_min) AND
DynamicValue(RS_22_d1_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk,
DynamicValue(RS_22_d1_d_date_sk_bloom_filter))) and (ss_store_sk BETWEEN
DynamicValue(RS_25_store_s_store_sk_min) AND
DynamicValue(RS_25_store_s_store_sk_max) and in_bloom_filter(ss_store_sk,
DynamicValue(RS_25_store_s_store_sk_bloom_filter))) and (ss_ticket_number
BETWEEN DynamicValue(RS_18_store_returns_sr_ticket_number_min) AND
DynamicValue(RS_1
8_store_returns_sr_ticket_number_max) and in_bloom_filter(ss_ticket_number,
DynamicValue(RS_18_store_returns_sr_ticket_number_bloom_filter))) and
ss_customer_sk is not null and ss_item_sk is not null and ss_sold_date_sk is
not null and ss_store_sk is not null and ss_ticket_number is not null)
- TableScan [TS_6] (rows=575995635
width=88)
-
default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_customer_sk","ss_store_sk","ss_ticket_number"]
- <-Reducer 10 [BROADCAST_EDGE]
vectorized
- BROADCAST [RS_132]
- Group By Operator [GBY_131]
(rows=1 width=12)
-
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2,
expectedEntries=63350264)"]
- <-Reducer 2 [CUSTOM_SIMPLE_EDGE]
- PARTITION_ONLY_SHUFFLE [RS_94]
- Group By Operator [GBY_93]
(rows=1 width=12)
-
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0,
expectedEntries=63350264)"]
- Select Operator [SEL_92]
(rows=63350266 width=77)
- Output:["_col0"]
- Please refer to the
previous Merge Join Operator [MERGEJOIN_117]
- <-Reducer 14 [BROADCAST_EDGE]
vectorized
- BROADCAST [RS_140]
- Group By Operator [GBY_139]
(rows=1 width=12)
-
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2,
expectedEntries=1000000)"]
- <-Map 13 [CUSTOM_SIMPLE_EDGE]
vectorized
- SHUFFLE [RS_138]
+ <-Map 1 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_157]
+ PartitionCols:_col1, _col2, _col4
+ Select Operator [SEL_156]
(rows=575995635 width=88)
+
Output:["_col0","_col1","_col2","_col3","_col4"]
+ Filter Operator [FIL_155]
(rows=575995635 width=88)
+ predicate:((ss_customer_sk BETWEEN
DynamicValue(RS_16_store_returns_sr_customer_sk_min) AND
DynamicValue(RS_16_store_returns_sr_customer_sk_max) and
in_bloom_filter(ss_customer_sk,
DynamicValue(RS_16_store_returns_sr_customer_sk_bloom_filter))) and (ss_item_sk
BETWEEN DynamicValue(RS_16_store_returns_sr_item_sk_min) AND
DynamicValue(RS_16_store_returns_sr_item_sk_max) and
in_bloom_filter(ss_item_sk,
DynamicValue(RS_16_store_returns_sr_item_sk_bloom_filter))) and
(ss_sold_date_sk BETWEEN DynamicValue(RS_22_d1_d_date_sk_min) AND
DynamicValue(RS_22_d1_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk,
DynamicValue(RS_22_d1_d_date_sk_bloom_filter))) and (ss_store_sk BETWEEN
DynamicValue(RS_25_store_s_store_sk_min) AND
DynamicValue(RS_25_store_s_store_sk_max) and in_bloom_filter(ss_store_sk,
DynamicValue(RS_25_store_s_store_sk_bloom_filter))) and (ss_ticket_number
BETWEEN DynamicValue(RS_16_store_returns_sr_ticket_number_min) AND DynamicValue(
RS_16_store_returns_sr_ticket_number_max) and
in_bloom_filter(ss_ticket_number,
DynamicValue(RS_16_store_returns_sr_ticket_number_bloom_filter))) and
ss_customer_sk is not null and ss_item_sk is not null and ss_sold_date_sk is
not null and ss_store_sk is not null and ss_ticket_number is not null)
+ TableScan [TS_0] (rows=575995635
width=88)
+
default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_customer_sk","ss_store_sk","ss_ticket_number"]
+ <-Reducer 10 [BROADCAST_EDGE]
vectorized
+ BROADCAST [RS_136]
+ Group By Operator [GBY_135]
(rows=1 width=12)
+
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2,
expectedEntries=57591152)"]
+ <-Map 8 [CUSTOM_SIMPLE_EDGE]
vectorized
+ PARTITION_ONLY_SHUFFLE
[RS_131]
+ Group By Operator
[GBY_128] (rows=1 width=12)
+
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0,
expectedEntries=57591152)"]
+ Select Operator
[SEL_125] (rows=57591150 width=77)
+ Output:["_col0"]
+ Please refer to the
previous Select Operator [SEL_122]
+ <-Reducer 11 [BROADCAST_EDGE]
vectorized
+ BROADCAST [RS_138]
Group By Operator [GBY_137]
(rows=1 width=12)
-
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0,
expectedEntries=1000000)"]
- Select Operator [SEL_136]
(rows=73049 width=1119)
- Output:["_col0"]
- Please refer to the
previous Select Operator [SEL_134]
- <-Reducer 16 [BROADCAST_EDGE]
vectorized
- BROADCAST [RS_148]
- Group By Operator [GBY_147]
(rows=1 width=12)
-
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2,
expectedEntries=1000000)"]
- <-Map 15 [CUSTOM_SIMPLE_EDGE]
vectorized
- SHUFFLE [RS_146]
+
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2,
expectedEntries=57591152)"]
+ <-Map 8 [CUSTOM_SIMPLE_EDGE]
vectorized
+ PARTITION_ONLY_SHUFFLE
[RS_132]
+ Group By Operator
[GBY_129] (rows=1 width=12)
+
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0,
expectedEntries=57591152)"]
+ Select Operator
[SEL_126] (rows=57591150 width=77)
+ Output:["_col0"]
+ Please refer to the
previous Select Operator [SEL_122]
+ <-Reducer 14 [BROADCAST_EDGE]
vectorized
+ BROADCAST [RS_146]
Group By Operator [GBY_145]
(rows=1 width=12)
-
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0,
expectedEntries=1000000)"]
- Select Operator [SEL_144]
(rows=1704 width=1910)
- Output:["_col0"]
- Please refer to the
previous Select Operator [SEL_142]
- <-Reducer 8 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_128]
- Group By Operator [GBY_127]
(rows=1 width=12)
-
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2,
expectedEntries=63350264)"]
- <-Reducer 2 [CUSTOM_SIMPLE_EDGE]
- PARTITION_ONLY_SHUFFLE [RS_84]
- Group By Operator [GBY_83]
(rows=1 width=12)
-
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0,
expectedEntries=63350264)"]
- Select Operator [SEL_82]
(rows=63350266 width=77)
- Output:["_col0"]
- Please refer to the
previous Merge Join Operator [MERGEJOIN_117]
- <-Reducer 9 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_130]
- Group By Operator [GBY_129]
(rows=1 width=12)
-
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2,
expectedEntries=63350264)"]
- <-Reducer 2 [CUSTOM_SIMPLE_EDGE]
- PARTITION_ONLY_SHUFFLE [RS_89]
- Group By Operator [GBY_88]
(rows=1 width=12)
-
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0,
expectedEntries=63350264)"]
- Select Operator [SEL_87]
(rows=63350266 width=77)
- Output:["_col0"]
- Please refer to the
previous Merge Join Operator [MERGEJOIN_117]
+
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2,
expectedEntries=1000000)"]
+ <-Map 13 [CUSTOM_SIMPLE_EDGE]
vectorized
+ SHUFFLE [RS_144]
+ Group By Operator
[GBY_143] (rows=1 width=12)
+
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0,
expectedEntries=1000000)"]
+ Select Operator
[SEL_142] (rows=73049 width=1119)
+ Output:["_col0"]
+ Please refer to the
previous Select Operator [SEL_140]
+ <-Reducer 16 [BROADCAST_EDGE]
vectorized
+ BROADCAST [RS_154]
+ Group By Operator [GBY_153]
(rows=1 width=12)
+
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2,
expectedEntries=1000000)"]
+ <-Map 15 [CUSTOM_SIMPLE_EDGE]
vectorized
+ SHUFFLE [RS_152]
+ Group By Operator
[GBY_151] (rows=1 width=12)
+
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0,
expectedEntries=1000000)"]
+ Select Operator
[SEL_150] (rows=1704 width=1910)
+ Output:["_col0"]
+ Please refer to the
previous Select Operator [SEL_148]
+ <-Reducer 9 [BROADCAST_EDGE]
vectorized
+ BROADCAST [RS_134]
+ Group By Operator [GBY_133]
(rows=1 width=12)
+
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2,
expectedEntries=57591152)"]
+ <-Map 8 [CUSTOM_SIMPLE_EDGE]
vectorized
+ PARTITION_ONLY_SHUFFLE
[RS_130]
+ Group By Operator
[GBY_127] (rows=1 width=12)
+
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0,
expectedEntries=57591152)"]
+ Select Operator
[SEL_124] (rows=57591150 width=77)
+ Output:["_col0"]
+ Please refer to the
previous Select Operator [SEL_122]