http://git-wip-us.apache.org/repos/asf/hive/blob/ab9e954d/ql/src/test/results/clientpositive/perf/tez/query16.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/perf/tez/query16.q.out b/ql/src/test/results/clientpositive/perf/tez/query16.q.out index 0b64c55..5652f3b 100644 --- a/ql/src/test/results/clientpositive/perf/tez/query16.q.out +++ b/ql/src/test/results/clientpositive/perf/tez/query16.q.out @@ -80,22 +80,22 @@ Stage-0 limit:-1 Stage-1 Reducer 9 vectorized - File Output Operator [FS_174] - Limit [LIM_173] (rows=1 width=344) + File Output Operator [FS_176] + Limit [LIM_175] (rows=1 width=344) Number of rows:100 - Select Operator [SEL_172] (rows=1 width=344) + Select Operator [SEL_174] (rows=1 width=344) Output:["_col0","_col1","_col2"] <-Reducer 8 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_171] - Select Operator [SEL_170] (rows=1 width=344) + SHUFFLE [RS_173] + Select Operator [SEL_172] (rows=1 width=344) Output:["_col1","_col2","_col3"] - Group By Operator [GBY_169] (rows=1 width=344) + Group By Operator [GBY_171] (rows=1 width=344) Output:["_col0","_col1","_col2"],aggregations:["count(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] <-Reducer 7 [CUSTOM_SIMPLE_EDGE] vectorized - PARTITION_ONLY_SHUFFLE [RS_168] - Group By Operator [GBY_167] (rows=1 width=344) + PARTITION_ONLY_SHUFFLE [RS_170] + Group By Operator [GBY_169] (rows=1 width=344) Output:["_col0","_col1","_col2"],aggregations:["count(_col0)","sum(_col1)","sum(_col2)"] - Group By Operator [GBY_166] (rows=231905279 width=135) + Group By Operator [GBY_168] (rows=231905279 width=135) Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"],keys:KEY._col0 <-Reducer 6 [SIMPLE_EDGE] SHUFFLE [RS_74] @@ -106,21 +106,21 @@ Stage-0 Output:["_col4","_col5","_col6"] Filter Operator [FIL_41] (rows=231905279 width=135) predicate:_col14 is null - Merge Join Operator [MERGEJOIN_128] (rows=463810558 width=135) - Conds:RS_38._col4=RS_165._col0(Left Outer),Output:["_col4","_col5","_col6","_col14"] + Merge Join Operator [MERGEJOIN_130] (rows=463810558 width=135) + Conds:RS_38._col4=RS_167._col0(Left Outer),Output:["_col4","_col5","_col6","_col14"] <-Reducer 18 [ONE_TO_ONE_EDGE] vectorized - FORWARD [RS_165] + FORWARD [RS_167] PartitionCols:_col0 - Select Operator [SEL_164] (rows=14399440 width=106) + Select Operator [SEL_166] (rows=14399440 width=106) Output:["_col0","_col1"] - Group By Operator [GBY_163] (rows=14399440 width=106) + Group By Operator [GBY_165] (rows=14399440 width=106) Output:["_col0"],keys:KEY._col0 <-Map 17 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_162] + SHUFFLE [RS_164] PartitionCols:_col0 - Group By Operator [GBY_161] (rows=28798881 width=106) + Group By Operator [GBY_163] (rows=28798881 width=106) Output:["_col0"],keys:cr_order_number - Filter Operator [FIL_160] (rows=28798881 width=106) + Filter Operator [FIL_162] (rows=28798881 width=106) predicate:cr_order_number is not null TableScan [TS_25] (rows=28798881 width=106) default@catalog_returns,cr1,Tbl:COMPLETE,Col:NONE,Output:["cr_order_number"] @@ -129,101 +129,101 @@ Stage-0 PartitionCols:_col4 Select Operator [SEL_37] (rows=421645953 width=135) Output:["_col4","_col5","_col6"] - Merge Join Operator [MERGEJOIN_127] (rows=421645953 width=135) - Conds:RS_34._col4=RS_159._col0(Left Semi),Output:["_col3","_col4","_col5","_col6","_col14"],residual filter predicates:{(_col3 <> _col14)} + Merge Join Operator [MERGEJOIN_129] (rows=421645953 width=135) + Conds:RS_34._col4=RS_161._col0(Left Semi),Output:["_col3","_col4","_col5","_col6","_col14"],residual filter predicates:{(_col3 <> _col14)} <-Map 16 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_159] + SHUFFLE [RS_161] PartitionCols:_col0 - Group By Operator [GBY_158] (rows=287989836 width=135) + Group By Operator [GBY_160] (rows=287989836 width=135) Output:["_col0","_col1"],keys:_col0, _col1 - Select Operator [SEL_157] (rows=287989836 width=135) + Select Operator [SEL_159] (rows=287989836 width=135) Output:["_col0","_col1"] - Filter Operator [FIL_156] (rows=287989836 width=135) + Filter Operator [FIL_158] (rows=287989836 width=135) predicate:(cs_order_number is not null and cs_warehouse_sk is not null) TableScan [TS_22] (rows=287989836 width=135) default@catalog_sales,cs2,Tbl:COMPLETE,Col:NONE,Output:["cs_warehouse_sk","cs_order_number"] <-Reducer 4 [SIMPLE_EDGE] SHUFFLE [RS_34] PartitionCols:_col4 - Merge Join Operator [MERGEJOIN_126] (rows=383314495 width=135) - Conds:RS_18._col2=RS_147._col0(Inner),Output:["_col3","_col4","_col5","_col6"] + Merge Join Operator [MERGEJOIN_128] (rows=383314495 width=135) + Conds:RS_18._col2=RS_149._col0(Inner),Output:["_col3","_col4","_col5","_col6"] <-Map 14 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_147] + SHUFFLE [RS_149] PartitionCols:_col0 - Select Operator [SEL_146] (rows=30 width=2045) + Select Operator [SEL_148] (rows=30 width=2045) Output:["_col0"] - Filter Operator [FIL_145] (rows=30 width=2045) + Filter Operator [FIL_147] (rows=30 width=2045) predicate:((cc_county) IN ('Ziebach County', 'Levy County', 'Huron County', 'Franklin Parish', 'Daviess County') and cc_call_center_sk is not null) TableScan [TS_9] (rows=60 width=2045) default@call_center,call_center,Tbl:COMPLETE,Col:NONE,Output:["cc_call_center_sk","cc_county"] <-Reducer 3 [SIMPLE_EDGE] SHUFFLE [RS_18] PartitionCols:_col2 - Merge Join Operator [MERGEJOIN_125] (rows=348467716 width=135) - Conds:RS_15._col1=RS_139._col0(Inner),Output:["_col2","_col3","_col4","_col5","_col6"] + Merge Join Operator [MERGEJOIN_127] (rows=348467716 width=135) + Conds:RS_15._col1=RS_141._col0(Inner),Output:["_col2","_col3","_col4","_col5","_col6"] <-Map 12 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_139] + SHUFFLE [RS_141] PartitionCols:_col0 - Select Operator [SEL_138] (rows=20000000 width=1014) + Select Operator [SEL_140] (rows=20000000 width=1014) Output:["_col0"] - Filter Operator [FIL_137] (rows=20000000 width=1014) + Filter Operator [FIL_139] (rows=20000000 width=1014) predicate:((ca_state = 'NY') and ca_address_sk is not null) TableScan [TS_6] (rows=40000000 width=1014) default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_state"] <-Reducer 2 [SIMPLE_EDGE] SHUFFLE [RS_15] PartitionCols:_col1 - Merge Join Operator [MERGEJOIN_124] (rows=316788826 width=135) - Conds:RS_155._col0=RS_131._col0(Inner),Output:["_col1","_col2","_col3","_col4","_col5","_col6"] + Merge Join Operator [MERGEJOIN_126] (rows=316788826 width=135) + Conds:RS_157._col0=RS_133._col0(Inner),Output:["_col1","_col2","_col3","_col4","_col5","_col6"] <-Map 10 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_131] + SHUFFLE [RS_133] PartitionCols:_col0 - Select Operator [SEL_130] (rows=8116 width=1119) + Select Operator [SEL_132] (rows=8116 width=1119) Output:["_col0"] - Filter Operator [FIL_129] (rows=8116 width=1119) + Filter Operator [FIL_131] (rows=8116 width=1119) predicate:(CAST( d_date AS TIMESTAMP) BETWEEN TIMESTAMP'2001-04-01 00:00:00' AND TIMESTAMP'2001-05-31 00:00:00' and d_date_sk is not null) TableScan [TS_3] (rows=73049 width=1119) default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date"] <-Map 1 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_155] + SHUFFLE [RS_157] PartitionCols:_col0 - Select Operator [SEL_154] (rows=287989836 width=135) + Select Operator [SEL_156] (rows=287989836 width=135) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - Filter Operator [FIL_153] (rows=287989836 width=135) + Filter Operator [FIL_155] (rows=287989836 width=135) predicate:((cs_call_center_sk BETWEEN DynamicValue(RS_19_call_center_cc_call_center_sk_min) AND DynamicValue(RS_19_call_center_cc_call_center_sk_max) and in_bloom_filter(cs_call_center_sk, DynamicValue(RS_19_call_center_cc_call_center_sk_bloom_filter))) and (cs_ship_addr_sk BETWEEN DynamicValue(RS_16_customer_address_ca_address_sk_min) AND DynamicValue(RS_16_customer_address_ca_address_sk_max) and in_bloom_filter(cs_ship_addr_sk, DynamicValue(RS_16_customer_address_ca_address_sk_bloom_filter))) and (cs_ship_date_sk BETWEEN DynamicValue(RS_13_date_dim_d_date_sk_min) AND DynamicValue(RS_13_date_dim_d_date_sk_max) and in_bloom_filter(cs_ship_date_sk, DynamicValue(RS_13_date_dim_d_date_sk_bloom_filter))) and cs_call_center_sk is not null and cs_order_number is not null and cs_ship_addr_sk is not null and cs_ship_date_sk is not null) TableScan [TS_0] (rows=287989836 width=135) default@catalog_sales,cs1,Tbl:COMPLETE,Col:NONE,Output:["cs_ship_date_sk","cs_ship_addr_sk","cs_call_center_sk","cs_warehouse_sk","cs_order_number","cs_ext_ship_cost","cs_net_profit"] <-Reducer 11 [BROADCAST_EDGE] vectorized - BROADCAST [RS_136] - Group By Operator [GBY_135] (rows=1 width=12) + BROADCAST [RS_138] + Group By Operator [GBY_137] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] <-Map 10 [CUSTOM_SIMPLE_EDGE] vectorized - SHUFFLE [RS_134] - Group By Operator [GBY_133] (rows=1 width=12) + SHUFFLE [RS_136] + Group By Operator [GBY_135] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] - Select Operator [SEL_132] (rows=8116 width=1119) + Select Operator [SEL_134] (rows=8116 width=1119) Output:["_col0"] - Please refer to the previous Select Operator [SEL_130] + Please refer to the previous Select Operator [SEL_132] <-Reducer 13 [BROADCAST_EDGE] vectorized - BROADCAST [RS_144] - Group By Operator [GBY_143] (rows=1 width=12) + BROADCAST [RS_146] + Group By Operator [GBY_145] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=20000000)"] <-Map 12 [CUSTOM_SIMPLE_EDGE] vectorized - SHUFFLE [RS_142] - Group By Operator [GBY_141] (rows=1 width=12) + SHUFFLE [RS_144] + Group By Operator [GBY_143] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=20000000)"] - Select Operator [SEL_140] (rows=20000000 width=1014) + Select Operator [SEL_142] (rows=20000000 width=1014) Output:["_col0"] - Please refer to the previous Select Operator [SEL_138] + Please refer to the previous Select Operator [SEL_140] <-Reducer 15 [BROADCAST_EDGE] vectorized - BROADCAST [RS_152] - Group By Operator [GBY_151] (rows=1 width=12) + BROADCAST [RS_154] + Group By Operator [GBY_153] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] <-Map 14 [CUSTOM_SIMPLE_EDGE] vectorized - SHUFFLE [RS_150] - Group By Operator [GBY_149] (rows=1 width=12) + SHUFFLE [RS_152] + Group By Operator [GBY_151] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] - Select Operator [SEL_148] (rows=30 width=2045) + Select Operator [SEL_150] (rows=30 width=2045) Output:["_col0"] - Please refer to the previous Select Operator [SEL_146] + Please refer to the previous Select Operator [SEL_148]
http://git-wip-us.apache.org/repos/asf/hive/blob/ab9e954d/ql/src/test/results/clientpositive/perf/tez/query17.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/perf/tez/query17.q.out b/ql/src/test/results/clientpositive/perf/tez/query17.q.out index 2e5e254..620d88a 100644 --- a/ql/src/test/results/clientpositive/perf/tez/query17.q.out +++ b/ql/src/test/results/clientpositive/perf/tez/query17.q.out @@ -89,8 +89,8 @@ POSTHOOK: type: QUERY Plan optimized by CBO. Vertex dependency in root stage -Map 1 <- Reducer 17 (BROADCAST_EDGE), Reducer 21 (BROADCAST_EDGE), Reducer 9 (BROADCAST_EDGE) -Map 18 <- Reducer 12 (BROADCAST_EDGE), Reducer 14 (BROADCAST_EDGE), Reducer 15 (BROADCAST_EDGE) +Map 1 <- Reducer 14 (BROADCAST_EDGE), Reducer 15 (BROADCAST_EDGE), Reducer 17 (BROADCAST_EDGE), Reducer 21 (BROADCAST_EDGE), Reducer 9 (BROADCAST_EDGE) +Map 18 <- Reducer 12 (BROADCAST_EDGE), Reducer 14 (BROADCAST_EDGE), Reducer 15 (BROADCAST_EDGE), Reducer 17 (BROADCAST_EDGE) Reducer 10 <- Map 18 (SIMPLE_EDGE), Map 8 (SIMPLE_EDGE) Reducer 11 <- Reducer 10 (SIMPLE_EDGE), Reducer 13 (SIMPLE_EDGE) Reducer 12 <- Map 8 (CUSTOM_SIMPLE_EDGE) @@ -112,16 +112,16 @@ Stage-0 limit:100 Stage-1 Reducer 7 vectorized - File Output Operator [FS_256] - Limit [LIM_255] (rows=100 width=88) + File Output Operator [FS_269] + Limit [LIM_268] (rows=100 width=88) Number of rows:100 - Select Operator [SEL_254] (rows=421657640 width=88) + Select Operator [SEL_267] (rows=421657640 width=88) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"] <-Reducer 6 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_253] - Select Operator [SEL_252] (rows=421657640 width=88) + SHUFFLE [RS_266] + Select Operator [SEL_265] (rows=421657640 width=88) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13"] - Group By Operator [GBY_251] (rows=421657640 width=88) + Group By Operator [GBY_264] (rows=421657640 width=88) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"],aggregations:["count(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)","sum(VALUE._col3)","count(VALUE._col4)","sum(VALUE._col5)","sum(VALUE._col6)","sum(VALUE._col7)","count(VALUE._col8)","sum(VALUE._col9)","sum(VALUE._col10)","sum(VALUE._col11)"],keys:KEY._col0, KEY._col1, KEY._col2 <-Reducer 5 [SIMPLE_EDGE] SHUFFLE [RS_50] @@ -130,172 +130,181 @@ Stage-0 Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"],aggregations:["count(_col3)","sum(_col3)","sum(_col7)","sum(_col6)","count(_col4)","sum(_col4)","sum(_col9)","sum(_col8)","count(_col5)","sum(_col5)","sum(_col11)","sum(_col10)"],keys:_col0, _col1, _col2 Select Operator [SEL_47] (rows=843315281 width=88) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11"] - Merge Join Operator [MERGEJOIN_202] (rows=843315281 width=88) - Conds:RS_44._col3=RS_230._col0(Inner),Output:["_col5","_col9","_col10","_col14","_col21","_col25"] + Merge Join Operator [MERGEJOIN_212] (rows=843315281 width=88) + Conds:RS_44._col3=RS_250._col0(Inner),Output:["_col5","_col9","_col10","_col14","_col21","_col25"] <-Map 20 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_230] + SHUFFLE [RS_250] PartitionCols:_col0 - Select Operator [SEL_229] (rows=1704 width=1910) + Select Operator [SEL_249] (rows=1704 width=1910) Output:["_col0","_col1"] - Filter Operator [FIL_228] (rows=1704 width=1910) + Filter Operator [FIL_248] (rows=1704 width=1910) predicate:s_store_sk is not null TableScan [TS_32] (rows=1704 width=1910) default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_state"] <-Reducer 4 [SIMPLE_EDGE] SHUFFLE [RS_44] PartitionCols:_col3 - Merge Join Operator [MERGEJOIN_201] (rows=766650239 width=88) + Merge Join Operator [MERGEJOIN_211] (rows=766650239 width=88) Conds:RS_41._col1, _col2, _col4=RS_42._col7, _col8, _col9(Inner),Output:["_col3","_col5","_col9","_col10","_col14","_col21"] <-Reducer 11 [SIMPLE_EDGE] SHUFFLE [RS_42] PartitionCols:_col7, _col8, _col9 - Merge Join Operator [MERGEJOIN_200] (rows=348467716 width=135) + Merge Join Operator [MERGEJOIN_210] (rows=348467716 width=135) Conds:RS_28._col2, _col1=RS_29._col1, _col2(Inner),Output:["_col3","_col7","_col8","_col9","_col10"] <-Reducer 13 [SIMPLE_EDGE] PARTITION_ONLY_SHUFFLE [RS_29] PartitionCols:_col1, _col2 - Merge Join Operator [MERGEJOIN_199] (rows=63350266 width=77) - Conds:RS_243._col0=RS_213._col0(Inner),Output:["_col1","_col2","_col3","_col4"] + Merge Join Operator [MERGEJOIN_209] (rows=63350266 width=77) + Conds:RS_241._col0=RS_223._col0(Inner),Output:["_col1","_col2","_col3","_col4"] <-Map 8 [SIMPLE_EDGE] vectorized - PARTITION_ONLY_SHUFFLE [RS_213] + PARTITION_ONLY_SHUFFLE [RS_223] PartitionCols:_col0 - Select Operator [SEL_208] (rows=36525 width=1119) + Select Operator [SEL_218] (rows=36525 width=1119) Output:["_col0"] - Filter Operator [FIL_205] (rows=36525 width=1119) + Filter Operator [FIL_215] (rows=36525 width=1119) predicate:((d_quarter_name) IN ('2000Q1', '2000Q2', '2000Q3') and d_date_sk is not null) TableScan [TS_3] (rows=73049 width=1119) default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_quarter_name"] <-Map 19 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_243] + SHUFFLE [RS_241] PartitionCols:_col0 - Select Operator [SEL_242] (rows=57591150 width=77) + Select Operator [SEL_240] (rows=57591150 width=77) Output:["_col0","_col1","_col2","_col3","_col4"] - Filter Operator [FIL_241] (rows=57591150 width=77) + Filter Operator [FIL_239] (rows=57591150 width=77) predicate:(sr_customer_sk is not null and sr_item_sk is not null and sr_returned_date_sk is not null and sr_ticket_number is not null) TableScan [TS_15] (rows=57591150 width=77) default@store_returns,store_returns,Tbl:COMPLETE,Col:NONE,Output:["sr_returned_date_sk","sr_item_sk","sr_customer_sk","sr_ticket_number","sr_return_quantity"] <-Reducer 10 [SIMPLE_EDGE] SHUFFLE [RS_28] PartitionCols:_col2, _col1 - Merge Join Operator [MERGEJOIN_198] (rows=316788826 width=135) - Conds:RS_250._col0=RS_211._col0(Inner),Output:["_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_208] (rows=316788826 width=135) + Conds:RS_263._col0=RS_221._col0(Inner),Output:["_col1","_col2","_col3"] <-Map 8 [SIMPLE_EDGE] vectorized - PARTITION_ONLY_SHUFFLE [RS_211] + PARTITION_ONLY_SHUFFLE [RS_221] PartitionCols:_col0 - Select Operator [SEL_207] (rows=36525 width=1119) + Select Operator [SEL_217] (rows=36525 width=1119) Output:["_col0"] - Filter Operator [FIL_204] (rows=36525 width=1119) + Filter Operator [FIL_214] (rows=36525 width=1119) predicate:((d_quarter_name) IN ('2000Q1', '2000Q2', '2000Q3') and d_date_sk is not null) Please refer to the previous TableScan [TS_3] <-Map 18 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_250] + SHUFFLE [RS_263] PartitionCols:_col0 - Select Operator [SEL_249] (rows=287989836 width=135) + Select Operator [SEL_262] (rows=287989836 width=135) Output:["_col0","_col1","_col2","_col3"] - Filter Operator [FIL_248] (rows=287989836 width=135) - predicate:((cs_bill_customer_sk BETWEEN DynamicValue(RS_29_store_returns_sr_customer_sk_min) AND DynamicValue(RS_29_store_returns_sr_customer_sk_max) and in_bloom_filter(cs_bill_customer_sk, DynamicValue(RS_29_store_returns_sr_customer_sk_bloom_filter))) and (cs_item_sk BETWEEN DynamicValue(RS_29_store_returns_sr_item_sk_min) AND DynamicValue(RS_29_store_returns_sr_item_sk_max) and in_bloom_filter(cs_item_sk, DynamicValue(RS_29_store_returns_sr_item_sk_bloom_filter))) and (cs_sold_date_sk BETWEEN DynamicValue(RS_26_d3_d_date_sk_min) AND DynamicValue(RS_26_d3_d_date_sk_max) and in_bloom_filter(cs_sold_date_sk, DynamicValue(RS_26_d3_d_date_sk_bloom_filter))) and cs_bill_customer_sk is not null and cs_item_sk is not null and cs_sold_date_sk is not null) + Filter Operator [FIL_261] (rows=287989836 width=135) + predicate:((cs_bill_customer_sk BETWEEN DynamicValue(RS_29_store_returns_sr_customer_sk_min) AND DynamicValue(RS_29_store_returns_sr_customer_sk_max) and in_bloom_filter(cs_bill_customer_sk, DynamicValue(RS_29_store_returns_sr_customer_sk_bloom_filter))) and (cs_item_sk BETWEEN DynamicValue(RS_29_store_returns_sr_item_sk_min) AND DynamicValue(RS_29_store_returns_sr_item_sk_max) and in_bloom_filter(cs_item_sk, DynamicValue(RS_29_store_returns_sr_item_sk_bloom_filter))) and (cs_item_sk BETWEEN DynamicValue(RS_39_item_i_item_sk_min) AND DynamicValue(RS_39_item_i_item_sk_max) and in_bloom_filter(cs_item_sk, DynamicValue(RS_39_item_i_item_sk_bloom_filter))) and (cs_sold_date_sk BETWEEN DynamicValue(RS_26_d3_d_date_sk_min) AND DynamicValue(RS_26_d3_d_date_sk_max) and in_bloom_filter(cs_sold_date_sk, DynamicValue(RS_26_d3_d_date_sk_bloom_filter))) and cs_bill_customer_sk is not null and cs_item_sk is not null and cs_sold_date_sk is not null) TableScan [TS_9] (rows=287989836 width=135) default@catalog_sales,catalog_sales,Tbl:COMPLETE,Col:NONE,Output:["cs_sold_date_sk","cs_bill_customer_sk","cs_item_sk","cs_quantity"] - <-Reducer 12 [BROADCAST_EDGE] vectorized - BROADCAST [RS_240] - Group By Operator [GBY_239] (rows=1 width=12) - Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] - <-Map 8 [CUSTOM_SIMPLE_EDGE] vectorized - PARTITION_ONLY_SHUFFLE [RS_217] - Group By Operator [GBY_215] (rows=1 width=12) - Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] - Select Operator [SEL_212] (rows=36525 width=1119) - Output:["_col0"] - Please refer to the previous Select Operator [SEL_207] <-Reducer 14 [BROADCAST_EDGE] vectorized - BROADCAST [RS_245] - Group By Operator [GBY_244] (rows=1 width=12) + BROADCAST [RS_244] + Group By Operator [GBY_242] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=63350264)"] <-Reducer 13 [CUSTOM_SIMPLE_EDGE] - PARTITION_ONLY_SHUFFLE [RS_141] - Group By Operator [GBY_140] (rows=1 width=12) + PARTITION_ONLY_SHUFFLE [RS_110] + Group By Operator [GBY_109] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=63350264)"] - Select Operator [SEL_139] (rows=63350266 width=77) + Select Operator [SEL_108] (rows=63350266 width=77) Output:["_col0"] - Please refer to the previous Merge Join Operator [MERGEJOIN_199] + Please refer to the previous Merge Join Operator [MERGEJOIN_209] <-Reducer 15 [BROADCAST_EDGE] vectorized BROADCAST [RS_247] - Group By Operator [GBY_246] (rows=1 width=12) + Group By Operator [GBY_245] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=63350264)"] <-Reducer 13 [CUSTOM_SIMPLE_EDGE] - PARTITION_ONLY_SHUFFLE [RS_146] - Group By Operator [GBY_145] (rows=1 width=12) + PARTITION_ONLY_SHUFFLE [RS_125] + Group By Operator [GBY_124] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=63350264)"] - Select Operator [SEL_144] (rows=63350266 width=77) + Select Operator [SEL_123] (rows=63350266 width=77) + Output:["_col0"] + Please refer to the previous Merge Join Operator [MERGEJOIN_209] + <-Reducer 17 [BROADCAST_EDGE] vectorized + BROADCAST [RS_238] + Group By Operator [GBY_236] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 16 [CUSTOM_SIMPLE_EDGE] vectorized + SHUFFLE [RS_235] + Group By Operator [GBY_234] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_233] (rows=462000 width=1436) Output:["_col0"] - Please refer to the previous Merge Join Operator [MERGEJOIN_199] + Select Operator [SEL_231] (rows=462000 width=1436) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_230] (rows=462000 width=1436) + predicate:i_item_sk is not null + TableScan [TS_6] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id","i_item_desc"] + <-Reducer 12 [BROADCAST_EDGE] vectorized + BROADCAST [RS_260] + Group By Operator [GBY_259] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 8 [CUSTOM_SIMPLE_EDGE] vectorized + PARTITION_ONLY_SHUFFLE [RS_227] + Group By Operator [GBY_225] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_222] (rows=36525 width=1119) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_217] <-Reducer 3 [SIMPLE_EDGE] SHUFFLE [RS_41] PartitionCols:_col1, _col2, _col4 - Merge Join Operator [MERGEJOIN_197] (rows=696954748 width=88) - Conds:RS_38._col1=RS_222._col0(Inner),Output:["_col1","_col2","_col3","_col4","_col5","_col9","_col10"] + Merge Join Operator [MERGEJOIN_207] (rows=696954748 width=88) + Conds:RS_38._col1=RS_232._col0(Inner),Output:["_col1","_col2","_col3","_col4","_col5","_col9","_col10"] <-Map 16 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_222] + SHUFFLE [RS_232] PartitionCols:_col0 - Select Operator [SEL_221] (rows=462000 width=1436) - Output:["_col0","_col1","_col2"] - Filter Operator [FIL_220] (rows=462000 width=1436) - predicate:i_item_sk is not null - TableScan [TS_6] (rows=462000 width=1436) - default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id","i_item_desc"] + Please refer to the previous Select Operator [SEL_231] <-Reducer 2 [SIMPLE_EDGE] SHUFFLE [RS_38] PartitionCols:_col1 - Merge Join Operator [MERGEJOIN_196] (rows=633595212 width=88) - Conds:RS_238._col0=RS_209._col0(Inner),Output:["_col1","_col2","_col3","_col4","_col5"] + Merge Join Operator [MERGEJOIN_206] (rows=633595212 width=88) + Conds:RS_258._col0=RS_219._col0(Inner),Output:["_col1","_col2","_col3","_col4","_col5"] <-Map 8 [SIMPLE_EDGE] vectorized - PARTITION_ONLY_SHUFFLE [RS_209] + PARTITION_ONLY_SHUFFLE [RS_219] PartitionCols:_col0 - Select Operator [SEL_206] (rows=36524 width=1119) + Select Operator [SEL_216] (rows=36524 width=1119) Output:["_col0"] - Filter Operator [FIL_203] (rows=36524 width=1119) + Filter Operator [FIL_213] (rows=36524 width=1119) predicate:((d_quarter_name = '2000Q1') and d_date_sk is not null) Please refer to the previous TableScan [TS_3] <-Map 1 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_238] + SHUFFLE [RS_258] PartitionCols:_col0 - Select Operator [SEL_237] (rows=575995635 width=88) + Select Operator [SEL_257] (rows=575995635 width=88) Output:["_col0","_col1","_col2","_col3","_col4","_col5"] - Filter Operator [FIL_236] (rows=575995635 width=88) - predicate:((ss_item_sk BETWEEN DynamicValue(RS_39_item_i_item_sk_min) AND DynamicValue(RS_39_item_i_item_sk_max) and in_bloom_filter(ss_item_sk, DynamicValue(RS_39_item_i_item_sk_bloom_filter))) and (ss_sold_date_sk BETWEEN DynamicValue(RS_36_d1_d_date_sk_min) AND DynamicValue(RS_36_d1_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk, DynamicValue(RS_36_d1_d_date_sk_bloom_filter))) and (ss_store_sk BETWEEN DynamicValue(RS_45_store_s_store_sk_min) AND DynamicValue(RS_45_store_s_store_sk_max) and in_bloom_filter(ss_store_sk, DynamicValue(RS_45_store_s_store_sk_bloom_filter))) and ss_customer_sk is not null and ss_item_sk is not null and ss_sold_date_sk is not null and ss_store_sk is not null and ss_ticket_number is not null) + Filter Operator [FIL_256] (rows=575995635 width=88) + predicate:((ss_customer_sk BETWEEN DynamicValue(RS_29_store_returns_sr_customer_sk_min) AND DynamicValue(RS_29_store_returns_sr_customer_sk_max) and in_bloom_filter(ss_customer_sk, DynamicValue(RS_29_store_returns_sr_customer_sk_bloom_filter))) and (ss_item_sk BETWEEN DynamicValue(RS_29_store_returns_sr_item_sk_min) AND DynamicValue(RS_29_store_returns_sr_item_sk_max) and in_bloom_filter(ss_item_sk, DynamicValue(RS_29_store_returns_sr_item_sk_bloom_filter))) and (ss_item_sk BETWEEN DynamicValue(RS_39_item_i_item_sk_min) AND DynamicValue(RS_39_item_i_item_sk_max) and in_bloom_filter(ss_item_sk, DynamicValue(RS_39_item_i_item_sk_bloom_filter))) and (ss_sold_date_sk BETWEEN DynamicValue(RS_36_d1_d_date_sk_min) AND DynamicValue(RS_36_d1_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk, DynamicValue(RS_36_d1_d_date_sk_bloom_filter))) and (ss_store_sk BETWEEN DynamicValue(RS_45_store_s_store_sk_min) AND DynamicValue(RS_45_store_s_store_sk_max) and in_bloom_filter(ss_store_sk, DynamicValue(RS_45_store_s_store_sk_bloom_filter))) and ss_customer_sk is not null and ss_item_sk is not null and ss_sold_date_sk is not null and ss_store_sk is not null and ss_ticket_number is not null) TableScan [TS_0] (rows=575995635 width=88) default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_customer_sk","ss_store_sk","ss_ticket_number","ss_quantity"] + <-Reducer 14 [BROADCAST_EDGE] vectorized + BROADCAST [RS_243] + Please refer to the previous Group By Operator [GBY_242] + <-Reducer 15 [BROADCAST_EDGE] vectorized + BROADCAST [RS_246] + Please refer to the previous Group By Operator [GBY_245] <-Reducer 17 [BROADCAST_EDGE] vectorized - BROADCAST [RS_227] - Group By Operator [GBY_226] (rows=1 width=12) - Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] - <-Map 16 [CUSTOM_SIMPLE_EDGE] vectorized - SHUFFLE [RS_225] - Group By Operator [GBY_224] (rows=1 width=12) - Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] - Select Operator [SEL_223] (rows=462000 width=1436) - Output:["_col0"] - Please refer to the previous Select Operator [SEL_221] + BROADCAST [RS_237] + Please refer to the previous Group By Operator [GBY_236] <-Reducer 21 [BROADCAST_EDGE] vectorized - BROADCAST [RS_235] - Group By Operator [GBY_234] (rows=1 width=12) + BROADCAST [RS_255] + Group By Operator [GBY_254] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] <-Map 20 [CUSTOM_SIMPLE_EDGE] vectorized - SHUFFLE [RS_233] - Group By Operator [GBY_232] (rows=1 width=12) + SHUFFLE [RS_253] + Group By Operator [GBY_252] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] - Select Operator [SEL_231] (rows=1704 width=1910) + Select Operator [SEL_251] (rows=1704 width=1910) Output:["_col0"] - Please refer to the previous Select Operator [SEL_229] + Please refer to the previous Select Operator [SEL_249] <-Reducer 9 [BROADCAST_EDGE] vectorized - BROADCAST [RS_219] - Group By Operator [GBY_218] (rows=1 width=12) + BROADCAST [RS_229] + Group By Operator [GBY_228] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] <-Map 8 [CUSTOM_SIMPLE_EDGE] vectorized - PARTITION_ONLY_SHUFFLE [RS_216] - Group By Operator [GBY_214] (rows=1 width=12) + PARTITION_ONLY_SHUFFLE [RS_226] + Group By Operator [GBY_224] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] - Select Operator [SEL_210] (rows=36524 width=1119) + Select Operator [SEL_220] (rows=36524 width=1119) Output:["_col0"] - Please refer to the previous Select Operator [SEL_206] + Please refer to the previous Select Operator [SEL_216] http://git-wip-us.apache.org/repos/asf/hive/blob/ab9e954d/ql/src/test/results/clientpositive/perf/tez/query18.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/perf/tez/query18.q.out b/ql/src/test/results/clientpositive/perf/tez/query18.q.out index e858527..1b9b2fb 100644 --- a/ql/src/test/results/clientpositive/perf/tez/query18.q.out +++ b/ql/src/test/results/clientpositive/perf/tez/query18.q.out @@ -86,16 +86,16 @@ Stage-0 limit:100 Stage-1 Reducer 6 vectorized - File Output Operator [FS_187] - Limit [LIM_186] (rows=100 width=135) + File Output Operator [FS_189] + Limit [LIM_188] (rows=100 width=135) Number of rows:100 - Select Operator [SEL_185] (rows=1054114882 width=135) + Select Operator [SEL_187] (rows=1054114882 width=135) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10"] <-Reducer 5 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_184] - Select Operator [SEL_183] (rows=1054114882 width=135) + SHUFFLE [RS_186] + Select Operator [SEL_185] (rows=1054114882 width=135) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10"] - Group By Operator [GBY_182] (rows=1054114882 width=135) + Group By Operator [GBY_184] (rows=1054114882 width=135) Output:["_col0","_col1","_col2","_col3","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18"],aggregations:["sum(VALUE._col0)","count(VALUE._col1)","sum(VALUE._col2)","count(VALUE._col3)","sum(VALUE._col4)","count(VALUE._col5)","sum(VALUE._col6)","count(VALUE._col7)","sum(VALUE._col8)","count(VALUE._col9)","sum(VALUE._col10)","count(VALUE._col11)","sum(VALUE._col12)","count(VALUE._col13)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4 <-Reducer 4 [SIMPLE_EDGE] SHUFFLE [RS_43] @@ -104,42 +104,42 @@ Stage-0 Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18"],aggregations:["sum(_col4)","count(_col4)","sum(_col5)","count(_col5)","sum(_col6)","count(_col6)","sum(_col7)","count(_col7)","sum(_col8)","count(_col8)","sum(_col9)","count(_col9)","sum(_col10)","count(_col10)"],keys:_col0, _col1, _col2, _col3, 0L Select Operator [SEL_40] (rows=421645953 width=135) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10"] - Merge Join Operator [MERGEJOIN_143] (rows=421645953 width=135) + Merge Join Operator [MERGEJOIN_145] (rows=421645953 width=135) Conds:RS_37._col0=RS_38._col3(Inner),Output:["_col4","_col6","_col7","_col8","_col11","_col16","_col17","_col18","_col19","_col20","_col26"] <-Reducer 3 [SIMPLE_EDGE] PARTITION_ONLY_SHUFFLE [RS_37] PartitionCols:_col0 - Merge Join Operator [MERGEJOIN_139] (rows=48400001 width=860) - Conds:RS_34._col1=RS_152._col0(Inner),Output:["_col0","_col4","_col6","_col7","_col8"] + Merge Join Operator [MERGEJOIN_141] (rows=48400001 width=860) + Conds:RS_34._col1=RS_154._col0(Inner),Output:["_col0","_col4","_col6","_col7","_col8"] <-Map 9 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_152] + SHUFFLE [RS_154] PartitionCols:_col0 - Select Operator [SEL_151] (rows=1861800 width=385) + Select Operator [SEL_153] (rows=1861800 width=385) Output:["_col0"] - Filter Operator [FIL_150] (rows=1861800 width=385) + Filter Operator [FIL_152] (rows=1861800 width=385) predicate:cd_demo_sk is not null TableScan [TS_6] (rows=1861800 width=385) default@customer_demographics,cd2,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk"] <-Reducer 2 [SIMPLE_EDGE] SHUFFLE [RS_34] PartitionCols:_col1 - Merge Join Operator [MERGEJOIN_138] (rows=44000000 width=860) - Conds:RS_146._col2=RS_149._col0(Inner),Output:["_col0","_col1","_col4","_col6","_col7","_col8"] + Merge Join Operator [MERGEJOIN_140] (rows=44000000 width=860) + Conds:RS_148._col2=RS_151._col0(Inner),Output:["_col0","_col1","_col4","_col6","_col7","_col8"] <-Map 1 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_146] + SHUFFLE [RS_148] PartitionCols:_col2 - Select Operator [SEL_145] (rows=40000000 width=860) + Select Operator [SEL_147] (rows=40000000 width=860) Output:["_col0","_col1","_col2","_col4"] - Filter Operator [FIL_144] (rows=40000000 width=860) + Filter Operator [FIL_146] (rows=40000000 width=860) predicate:((c_birth_month) IN (9, 5, 12, 4, 1, 10) and c_current_addr_sk is not null and c_current_cdemo_sk is not null and c_customer_sk is not null) TableScan [TS_0] (rows=80000000 width=860) default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_current_cdemo_sk","c_current_addr_sk","c_birth_month","c_birth_year"] <-Map 8 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_149] + SHUFFLE [RS_151] PartitionCols:_col0 - Select Operator [SEL_148] (rows=20000000 width=1014) + Select Operator [SEL_150] (rows=20000000 width=1014) Output:["_col0","_col1","_col2","_col3"] - Filter Operator [FIL_147] (rows=20000000 width=1014) + Filter Operator [FIL_149] (rows=20000000 width=1014) predicate:((ca_state) IN ('ND', 'WI', 'AL', 'NC', 'OK', 'MS', 'TN') and ca_address_sk is not null) TableScan [TS_3] (rows=40000000 width=1014) default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_county","ca_state","ca_country"] @@ -148,96 +148,96 @@ Stage-0 PartitionCols:_col3 Select Operator [SEL_30] (rows=383314495 width=135) Output:["_col1","_col3","_col6","_col7","_col8","_col9","_col10","_col16"] - Merge Join Operator [MERGEJOIN_142] (rows=383314495 width=135) - Conds:RS_27._col3=RS_171._col0(Inner),Output:["_col1","_col4","_col5","_col6","_col7","_col8","_col14","_col16"] + Merge Join Operator [MERGEJOIN_144] (rows=383314495 width=135) + Conds:RS_27._col3=RS_173._col0(Inner),Output:["_col1","_col4","_col5","_col6","_col7","_col8","_col14","_col16"] <-Map 18 [SIMPLE_EDGE] vectorized - PARTITION_ONLY_SHUFFLE [RS_171] + PARTITION_ONLY_SHUFFLE [RS_173] PartitionCols:_col0 - Select Operator [SEL_170] (rows=462000 width=1436) + Select Operator [SEL_172] (rows=462000 width=1436) Output:["_col0","_col1"] - Filter Operator [FIL_169] (rows=462000 width=1436) + Filter Operator [FIL_171] (rows=462000 width=1436) predicate:i_item_sk is not null TableScan [TS_18] (rows=462000 width=1436) default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id"] <-Reducer 12 [SIMPLE_EDGE] SHUFFLE [RS_27] PartitionCols:_col3 - Merge Join Operator [MERGEJOIN_141] (rows=348467716 width=135) - Conds:RS_24._col2=RS_163._col0(Inner),Output:["_col1","_col3","_col4","_col5","_col6","_col7","_col8","_col14"] + Merge Join Operator [MERGEJOIN_143] (rows=348467716 width=135) + Conds:RS_24._col2=RS_165._col0(Inner),Output:["_col1","_col3","_col4","_col5","_col6","_col7","_col8","_col14"] <-Map 16 [SIMPLE_EDGE] vectorized - PARTITION_ONLY_SHUFFLE [RS_163] + PARTITION_ONLY_SHUFFLE [RS_165] PartitionCols:_col0 - Select Operator [SEL_162] (rows=465450 width=385) + Select Operator [SEL_164] (rows=465450 width=385) Output:["_col0","_col3"] - Filter Operator [FIL_161] (rows=465450 width=385) + Filter Operator [FIL_163] (rows=465450 width=385) predicate:((cd_education_status = 'College') and (cd_gender = 'M') and cd_demo_sk is not null) TableScan [TS_15] (rows=1861800 width=385) default@customer_demographics,cd1,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_gender","cd_education_status","cd_dep_count"] <-Reducer 11 [SIMPLE_EDGE] SHUFFLE [RS_24] PartitionCols:_col2 - Merge Join Operator [MERGEJOIN_140] (rows=316788826 width=135) - Conds:RS_181._col0=RS_155._col0(Inner),Output:["_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] + Merge Join Operator [MERGEJOIN_142] (rows=316788826 width=135) + Conds:RS_183._col0=RS_157._col0(Inner),Output:["_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] <-Map 14 [SIMPLE_EDGE] vectorized - PARTITION_ONLY_SHUFFLE [RS_155] + PARTITION_ONLY_SHUFFLE [RS_157] PartitionCols:_col0 - Select Operator [SEL_154] (rows=36524 width=1119) + Select Operator [SEL_156] (rows=36524 width=1119) Output:["_col0"] - Filter Operator [FIL_153] (rows=36524 width=1119) + Filter Operator [FIL_155] (rows=36524 width=1119) predicate:((d_year = 2001) and d_date_sk is not null) TableScan [TS_12] (rows=73049 width=1119) default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] <-Map 10 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_181] + SHUFFLE [RS_183] PartitionCols:_col0 - Select Operator [SEL_180] (rows=287989836 width=135) + Select Operator [SEL_182] (rows=287989836 width=135) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] - Filter Operator [FIL_179] (rows=287989836 width=135) + Filter Operator [FIL_181] (rows=287989836 width=135) predicate:((cs_bill_cdemo_sk BETWEEN DynamicValue(RS_25_cd1_cd_demo_sk_min) AND DynamicValue(RS_25_cd1_cd_demo_sk_max) and in_bloom_filter(cs_bill_cdemo_sk, DynamicValue(RS_25_cd1_cd_demo_sk_bloom_filter))) and (cs_bill_customer_sk BETWEEN DynamicValue(RS_37_customer_c_customer_sk_min) AND DynamicValue(RS_37_customer_c_customer_sk_max) and in_bloom_filter(cs_bill_customer_sk, DynamicValue(RS_37_customer_c_customer_sk_bloom_filter))) and (cs_item_sk BETWEEN DynamicValue(RS_28_item_i_item_sk_min) AND DynamicValue(RS_28_item_i_item_sk_max) and in_bloom_filter(cs_item_sk, DynamicValue(RS_28_item_i_item_sk_bloom_filter))) and (cs_sold_date_sk BETWEEN DynamicValue(RS_22_date_dim_d_date_sk_min) AND DynamicValue(RS_22_date_dim_d_date_sk_max) and in_bloom_filter(cs_sold_date_sk, DynamicValue(RS_22_date_dim_d_date_sk_bloom_filter))) and cs_bill_cdemo_sk is not null and cs_bill_customer_sk is not null and cs_item_sk is not null and cs_sold_date_sk is not null) TableScan [TS_9] (rows=287989836 width=135) default@catalog_sales,catalog_sales,Tbl:COMPLETE,Col:NONE,Output:["cs_sold_date_sk","cs_bill_customer_sk","cs_bill_cdemo_sk","cs_item_sk","cs_quantity","cs_list_price","cs_sales_price","cs_coupon_amt","cs_net_profit"] <-Reducer 15 [BROADCAST_EDGE] vectorized - BROADCAST [RS_160] - Group By Operator [GBY_159] (rows=1 width=12) + BROADCAST [RS_162] + Group By Operator [GBY_161] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] <-Map 14 [CUSTOM_SIMPLE_EDGE] vectorized - PARTITION_ONLY_SHUFFLE [RS_158] - Group By Operator [GBY_157] (rows=1 width=12) + PARTITION_ONLY_SHUFFLE [RS_160] + Group By Operator [GBY_159] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] - Select Operator [SEL_156] (rows=36524 width=1119) + Select Operator [SEL_158] (rows=36524 width=1119) Output:["_col0"] - Please refer to the previous Select Operator [SEL_154] + Please refer to the previous Select Operator [SEL_156] <-Reducer 17 [BROADCAST_EDGE] vectorized - BROADCAST [RS_168] - Group By Operator [GBY_167] (rows=1 width=12) + BROADCAST [RS_170] + Group By Operator [GBY_169] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] <-Map 16 [CUSTOM_SIMPLE_EDGE] vectorized - PARTITION_ONLY_SHUFFLE [RS_166] - Group By Operator [GBY_165] (rows=1 width=12) + PARTITION_ONLY_SHUFFLE [RS_168] + Group By Operator [GBY_167] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] - Select Operator [SEL_164] (rows=465450 width=385) + Select Operator [SEL_166] (rows=465450 width=385) Output:["_col0"] - Please refer to the previous Select Operator [SEL_162] + Please refer to the previous Select Operator [SEL_164] <-Reducer 19 [BROADCAST_EDGE] vectorized - BROADCAST [RS_176] - Group By Operator [GBY_175] (rows=1 width=12) + BROADCAST [RS_178] + Group By Operator [GBY_177] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] <-Map 18 [CUSTOM_SIMPLE_EDGE] vectorized - PARTITION_ONLY_SHUFFLE [RS_174] - Group By Operator [GBY_173] (rows=1 width=12) + PARTITION_ONLY_SHUFFLE [RS_176] + Group By Operator [GBY_175] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] - Select Operator [SEL_172] (rows=462000 width=1436) + Select Operator [SEL_174] (rows=462000 width=1436) Output:["_col0"] - Please refer to the previous Select Operator [SEL_170] + Please refer to the previous Select Operator [SEL_172] <-Reducer 7 [BROADCAST_EDGE] vectorized - BROADCAST [RS_178] - Group By Operator [GBY_177] (rows=1 width=12) + BROADCAST [RS_180] + Group By Operator [GBY_179] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=48400000)"] <-Reducer 3 [CUSTOM_SIMPLE_EDGE] - PARTITION_ONLY_SHUFFLE [RS_120] - Group By Operator [GBY_119] (rows=1 width=12) + PARTITION_ONLY_SHUFFLE [RS_126] + Group By Operator [GBY_125] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=48400000)"] - Select Operator [SEL_118] (rows=48400001 width=860) + Select Operator [SEL_124] (rows=48400001 width=860) Output:["_col0"] - Please refer to the previous Merge Join Operator [MERGEJOIN_139] + Please refer to the previous Merge Join Operator [MERGEJOIN_141]