http://git-wip-us.apache.org/repos/asf/hive/blob/f2c4f319/ql/src/test/results/clientpositive/perf/tez/query27.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/perf/tez/query27.q.out b/ql/src/test/results/clientpositive/perf/tez/query27.q.out index 0839118..df1e15f 100644 --- a/ql/src/test/results/clientpositive/perf/tez/query27.q.out +++ b/ql/src/test/results/clientpositive/perf/tez/query27.q.out @@ -45,28 +45,33 @@ POSTHOOK: type: QUERY Plan optimized by CBO. Vertex dependency in root stage +Map 1 <- Reducer 11 (BROADCAST_EDGE), Reducer 13 (BROADCAST_EDGE), Reducer 15 (BROADCAST_EDGE), Reducer 9 (BROADCAST_EDGE) +Reducer 11 <- Map 10 (CUSTOM_SIMPLE_EDGE) +Reducer 13 <- Map 12 (CUSTOM_SIMPLE_EDGE) +Reducer 15 <- Map 14 (CUSTOM_SIMPLE_EDGE) Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 8 (SIMPLE_EDGE) -Reducer 3 <- Map 9 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) -Reducer 4 <- Map 10 (SIMPLE_EDGE), Reducer 3 (SIMPLE_EDGE) -Reducer 5 <- Map 11 (SIMPLE_EDGE), Reducer 4 (SIMPLE_EDGE) +Reducer 3 <- Map 10 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) +Reducer 4 <- Map 12 (SIMPLE_EDGE), Reducer 3 (SIMPLE_EDGE) +Reducer 5 <- Map 14 (SIMPLE_EDGE), Reducer 4 (SIMPLE_EDGE) Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Reducer 7 <- Reducer 6 (SIMPLE_EDGE) +Reducer 9 <- Map 8 (CUSTOM_SIMPLE_EDGE) Stage-0 Fetch Operator limit:100 Stage-1 Reducer 7 vectorized - File Output Operator [FS_80] - Limit [LIM_79] (rows=100 width=88) + File Output Operator [FS_140] + Limit [LIM_139] (rows=100 width=88) Number of rows:100 - Select Operator [SEL_78] (rows=1264972921 width=88) + Select Operator [SEL_138] (rows=1264972921 width=88) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] <-Reducer 6 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_77] - Select Operator [SEL_76] (rows=1264972921 width=88) + SHUFFLE [RS_137] + Select Operator [SEL_136] (rows=1264972921 width=88) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - 
Group By Operator [GBY_75] (rows=1264972921 width=88) + Group By Operator [GBY_135] (rows=1264972921 width=88) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10"],aggregations:["sum(VALUE._col0)","count(VALUE._col1)","sum(VALUE._col2)","count(VALUE._col3)","sum(VALUE._col4)","count(VALUE._col5)","sum(VALUE._col6)","count(VALUE._col7)"],keys:KEY._col0, KEY._col1, KEY._col2 <-Reducer 5 [SIMPLE_EDGE] SHUFFLE [RS_30] @@ -75,66 +80,110 @@ Stage-0 Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10"],aggregations:["sum(_col2)","count(_col2)","sum(_col3)","count(_col3)","sum(_col4)","count(_col4)","sum(_col5)","count(_col5)"],keys:_col0, _col1, 0L Select Operator [SEL_27] (rows=843315281 width=88) Output:["_col0","_col1","_col2","_col3","_col4","_col5"] - Merge Join Operator [MERGEJOIN_59] (rows=843315281 width=88) - Conds:RS_24._col1=RS_74._col0(Inner),Output:["_col4","_col5","_col6","_col7","_col15","_col17"] - <-Map 11 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_74] + Merge Join Operator [MERGEJOIN_99] (rows=843315281 width=88) + Conds:RS_24._col1=RS_126._col0(Inner),Output:["_col4","_col5","_col6","_col7","_col15","_col17"] + <-Map 14 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_126] PartitionCols:_col0 - Select Operator [SEL_73] (rows=462000 width=1436) + Select Operator [SEL_125] (rows=462000 width=1436) Output:["_col0","_col1"] - Filter Operator [FIL_72] (rows=462000 width=1436) + Filter Operator [FIL_124] (rows=462000 width=1436) predicate:i_item_sk is not null TableScan [TS_12] (rows=462000 width=1436) default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id"] <-Reducer 4 [SIMPLE_EDGE] SHUFFLE [RS_24] PartitionCols:_col1 - Merge Join Operator [MERGEJOIN_58] (rows=766650239 width=88) - Conds:RS_21._col3=RS_71._col0(Inner),Output:["_col1","_col4","_col5","_col6","_col7","_col15"] - <-Map 10 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_71] + Merge Join Operator [MERGEJOIN_98] 
(rows=766650239 width=88) + Conds:RS_21._col3=RS_118._col0(Inner),Output:["_col1","_col4","_col5","_col6","_col7","_col15"] + <-Map 12 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_118] PartitionCols:_col0 - Select Operator [SEL_70] (rows=852 width=1910) + Select Operator [SEL_117] (rows=852 width=1910) Output:["_col0","_col1"] - Filter Operator [FIL_69] (rows=852 width=1910) + Filter Operator [FIL_116] (rows=852 width=1910) predicate:((s_state) IN ('SD', 'FL', 'MI', 'LA', 'MO', 'SC') and s_store_sk is not null) TableScan [TS_9] (rows=1704 width=1910) default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_state"] <-Reducer 3 [SIMPLE_EDGE] SHUFFLE [RS_21] PartitionCols:_col3 - Merge Join Operator [MERGEJOIN_57] (rows=696954748 width=88) - Conds:RS_18._col0=RS_68._col0(Inner),Output:["_col1","_col3","_col4","_col5","_col6","_col7"] - <-Map 9 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_68] + Merge Join Operator [MERGEJOIN_97] (rows=696954748 width=88) + Conds:RS_18._col0=RS_110._col0(Inner),Output:["_col1","_col3","_col4","_col5","_col6","_col7"] + <-Map 10 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_110] PartitionCols:_col0 - Select Operator [SEL_67] (rows=36524 width=1119) + Select Operator [SEL_109] (rows=36524 width=1119) Output:["_col0"] - Filter Operator [FIL_66] (rows=36524 width=1119) + Filter Operator [FIL_108] (rows=36524 width=1119) predicate:((d_year = 2001) and d_date_sk is not null) TableScan [TS_6] (rows=73049 width=1119) default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] <-Reducer 2 [SIMPLE_EDGE] SHUFFLE [RS_18] PartitionCols:_col0 - Merge Join Operator [MERGEJOIN_56] (rows=633595212 width=88) - Conds:RS_62._col2=RS_65._col0(Inner),Output:["_col0","_col1","_col3","_col4","_col5","_col6","_col7"] - <-Map 1 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_62] - PartitionCols:_col2 - Select Operator [SEL_61] (rows=575995635 width=88) - Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - Filter Operator [FIL_60] 
(rows=575995635 width=88) - predicate:(ss_cdemo_sk is not null and ss_item_sk is not null and ss_sold_date_sk is not null and ss_store_sk is not null) - TableScan [TS_0] (rows=575995635 width=88) - default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_cdemo_sk","ss_store_sk","ss_quantity","ss_list_price","ss_sales_price","ss_coupon_amt"] + Merge Join Operator [MERGEJOIN_96] (rows=633595212 width=88) + Conds:RS_134._col2=RS_102._col0(Inner),Output:["_col0","_col1","_col3","_col4","_col5","_col6","_col7"] <-Map 8 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_65] + PARTITION_ONLY_SHUFFLE [RS_102] PartitionCols:_col0 - Select Operator [SEL_64] (rows=232725 width=385) + Select Operator [SEL_101] (rows=232725 width=385) Output:["_col0"] - Filter Operator [FIL_63] (rows=232725 width=385) + Filter Operator [FIL_100] (rows=232725 width=385) predicate:((cd_education_status = '2 yr Degree') and (cd_gender = 'M') and (cd_marital_status = 'U') and cd_demo_sk is not null) TableScan [TS_3] (rows=1861800 width=385) default@customer_demographics,customer_demographics,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_gender","cd_marital_status","cd_education_status"] + <-Map 1 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_134] + PartitionCols:_col2 + Select Operator [SEL_133] (rows=575995635 width=88) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] + Filter Operator [FIL_132] (rows=575995635 width=88) + predicate:((ss_cdemo_sk BETWEEN DynamicValue(RS_16_customer_demographics_cd_demo_sk_min) AND DynamicValue(RS_16_customer_demographics_cd_demo_sk_max) and in_bloom_filter(ss_cdemo_sk, DynamicValue(RS_16_customer_demographics_cd_demo_sk_bloom_filter))) and (ss_item_sk BETWEEN DynamicValue(RS_25_item_i_item_sk_min) AND DynamicValue(RS_25_item_i_item_sk_max) and in_bloom_filter(ss_item_sk, DynamicValue(RS_25_item_i_item_sk_bloom_filter))) and (ss_sold_date_sk BETWEEN DynamicValue(RS_19_date_dim_d_date_sk_min) AND 
DynamicValue(RS_19_date_dim_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk, DynamicValue(RS_19_date_dim_d_date_sk_bloom_filter))) and (ss_store_sk BETWEEN DynamicValue(RS_22_store_s_store_sk_min) AND DynamicValue(RS_22_store_s_store_sk_max) and in_bloom_filter(ss_store_sk, DynamicValue(RS_22_store_s_store_sk_bloom_filter))) and ss_cdemo_sk is not null and ss_item_sk is not null and ss_sold_date_sk is not null and ss_store_sk is not null) + TableScan [TS_0] (rows=575995635 width=88) + default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_cdemo_sk","ss_store_sk","ss_quantity","ss_list_price","ss_sales_price","ss_coupon_amt"] + <-Reducer 11 [BROADCAST_EDGE] vectorized + BROADCAST [RS_115] + Group By Operator [GBY_114] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 10 [CUSTOM_SIMPLE_EDGE] vectorized + SHUFFLE [RS_113] + Group By Operator [GBY_112] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_111] (rows=36524 width=1119) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_109] + <-Reducer 13 [BROADCAST_EDGE] vectorized + BROADCAST [RS_123] + Group By Operator [GBY_122] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 12 [CUSTOM_SIMPLE_EDGE] vectorized + SHUFFLE [RS_121] + Group By Operator [GBY_120] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_119] (rows=852 width=1910) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_117] + <-Reducer 15 [BROADCAST_EDGE] vectorized + BROADCAST [RS_131] + Group By Operator [GBY_130] 
(rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 14 [CUSTOM_SIMPLE_EDGE] vectorized + SHUFFLE [RS_129] + Group By Operator [GBY_128] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_127] (rows=462000 width=1436) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_125] + <-Reducer 9 [BROADCAST_EDGE] vectorized + BROADCAST [RS_107] + Group By Operator [GBY_106] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 8 [CUSTOM_SIMPLE_EDGE] vectorized + PARTITION_ONLY_SHUFFLE [RS_105] + Group By Operator [GBY_104] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_103] (rows=232725 width=385) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_101]
http://git-wip-us.apache.org/repos/asf/hive/blob/f2c4f319/ql/src/test/results/clientpositive/perf/tez/query29.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/perf/tez/query29.q.out b/ql/src/test/results/clientpositive/perf/tez/query29.q.out index a0e7621..46ff49d 100644 --- a/ql/src/test/results/clientpositive/perf/tez/query29.q.out +++ b/ql/src/test/results/clientpositive/perf/tez/query29.q.out @@ -93,138 +93,224 @@ POSTHOOK: type: QUERY Plan optimized by CBO. Vertex dependency in root stage -Reducer 10 <- Map 15 (SIMPLE_EDGE), Reducer 9 (SIMPLE_EDGE) -Reducer 11 <- Map 16 (SIMPLE_EDGE), Reducer 10 (SIMPLE_EDGE) -Reducer 13 <- Map 12 (SIMPLE_EDGE), Map 14 (SIMPLE_EDGE) +Map 1 <- Reducer 7 (BROADCAST_EDGE) +Map 8 <- Reducer 14 (BROADCAST_EDGE), Reducer 16 (BROADCAST_EDGE), Reducer 17 (BROADCAST_EDGE), Reducer 18 (BROADCAST_EDGE), Reducer 21 (BROADCAST_EDGE), Reducer 23 (BROADCAST_EDGE) +Reducer 10 <- Reducer 15 (SIMPLE_EDGE), Reducer 9 (SIMPLE_EDGE) +Reducer 11 <- Map 20 (SIMPLE_EDGE), Reducer 10 (SIMPLE_EDGE) +Reducer 12 <- Map 22 (SIMPLE_EDGE), Reducer 11 (SIMPLE_EDGE) +Reducer 14 <- Map 13 (CUSTOM_SIMPLE_EDGE) +Reducer 15 <- Map 13 (SIMPLE_EDGE), Map 19 (SIMPLE_EDGE) +Reducer 16 <- Reducer 15 (CUSTOM_SIMPLE_EDGE) +Reducer 17 <- Reducer 15 (CUSTOM_SIMPLE_EDGE) +Reducer 18 <- Reducer 15 (CUSTOM_SIMPLE_EDGE) Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 6 (SIMPLE_EDGE) -Reducer 3 <- Reducer 11 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) +Reducer 21 <- Map 20 (CUSTOM_SIMPLE_EDGE) +Reducer 23 <- Map 22 (CUSTOM_SIMPLE_EDGE) +Reducer 3 <- Reducer 12 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Reducer 5 <- Reducer 4 (SIMPLE_EDGE) -Reducer 8 <- Map 12 (SIMPLE_EDGE), Map 7 (SIMPLE_EDGE) -Reducer 9 <- Reducer 13 (SIMPLE_EDGE), Reducer 8 (SIMPLE_EDGE) +Reducer 7 <- Map 6 (CUSTOM_SIMPLE_EDGE) +Reducer 9 <- Map 13 (SIMPLE_EDGE), Map 8 (SIMPLE_EDGE) Stage-0 Fetch Operator limit:100 
Stage-1 Reducer 5 vectorized - File Output Operator [FS_128] - Limit [LIM_127] (rows=100 width=88) + File Output Operator [FS_257] + Limit [LIM_256] (rows=100 width=88) Number of rows:100 - Select Operator [SEL_126] (rows=463823414 width=88) + Select Operator [SEL_255] (rows=463823414 width=88) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] <-Reducer 4 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_125] - Group By Operator [GBY_124] (rows=463823414 width=88) + SHUFFLE [RS_254] + Group By Operator [GBY_253] (rows=463823414 width=88) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3 <-Reducer 3 [SIMPLE_EDGE] SHUFFLE [RS_49] PartitionCols:_col0, _col1, _col2, _col3 Group By Operator [GBY_48] (rows=927646829 width=88) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],aggregations:["sum(_col14)","sum(_col22)","sum(_col3)"],keys:_col7, _col8, _col27, _col28 - Merge Join Operator [MERGEJOIN_99] (rows=927646829 width=88) + Merge Join Operator [MERGEJOIN_202] (rows=927646829 width=88) Conds:RS_44._col1, _col2=RS_45._col14, _col13(Inner),Output:["_col3","_col7","_col8","_col14","_col22","_col27","_col28"] - <-Reducer 11 [SIMPLE_EDGE] + <-Reducer 12 [SIMPLE_EDGE] SHUFFLE [RS_45] PartitionCols:_col14, _col13 Select Operator [SEL_40] (rows=843315281 width=88) Output:["_col1","_col2","_col8","_col13","_col14","_col16","_col21","_col22"] - Merge Join Operator [MERGEJOIN_98] (rows=843315281 width=88) - Conds:RS_37._col3=RS_123._col0(Inner),Output:["_col5","_col10","_col11","_col13","_col18","_col19","_col21","_col22"] - <-Map 16 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_123] + Merge Join Operator [MERGEJOIN_201] (rows=843315281 width=88) + Conds:RS_37._col3=RS_244._col0(Inner),Output:["_col5","_col10","_col11","_col13","_col18","_col19","_col21","_col22"] + <-Map 22 [SIMPLE_EDGE] vectorized + PARTITION_ONLY_SHUFFLE [RS_244] 
PartitionCols:_col0 - Select Operator [SEL_122] (rows=1704 width=1910) + Select Operator [SEL_243] (rows=1704 width=1910) Output:["_col0","_col1","_col2"] - Filter Operator [FIL_121] (rows=1704 width=1910) + Filter Operator [FIL_242] (rows=1704 width=1910) predicate:s_store_sk is not null TableScan [TS_25] (rows=1704 width=1910) default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_id","s_store_name"] - <-Reducer 10 [SIMPLE_EDGE] + <-Reducer 11 [SIMPLE_EDGE] SHUFFLE [RS_37] PartitionCols:_col3 - Merge Join Operator [MERGEJOIN_97] (rows=766650239 width=88) - Conds:RS_34._col1=RS_120._col0(Inner),Output:["_col3","_col5","_col10","_col11","_col13","_col18","_col19"] - <-Map 15 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_120] + Merge Join Operator [MERGEJOIN_200] (rows=766650239 width=88) + Conds:RS_34._col1=RS_236._col0(Inner),Output:["_col3","_col5","_col10","_col11","_col13","_col18","_col19"] + <-Map 20 [SIMPLE_EDGE] vectorized + PARTITION_ONLY_SHUFFLE [RS_236] PartitionCols:_col0 - Select Operator [SEL_119] (rows=462000 width=1436) + Select Operator [SEL_235] (rows=462000 width=1436) Output:["_col0","_col1","_col2"] - Filter Operator [FIL_118] (rows=462000 width=1436) + Filter Operator [FIL_234] (rows=462000 width=1436) predicate:i_item_sk is not null TableScan [TS_22] (rows=462000 width=1436) default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id","i_item_desc"] - <-Reducer 9 [SIMPLE_EDGE] + <-Reducer 10 [SIMPLE_EDGE] SHUFFLE [RS_34] PartitionCols:_col1 - Merge Join Operator [MERGEJOIN_96] (rows=696954748 width=88) + Merge Join Operator [MERGEJOIN_199] (rows=696954748 width=88) Conds:RS_31._col1, _col2, _col4=RS_32._col1, _col2, _col3(Inner),Output:["_col1","_col3","_col5","_col10","_col11","_col13"] - <-Reducer 13 [SIMPLE_EDGE] - SHUFFLE [RS_32] + <-Reducer 15 [SIMPLE_EDGE] + PARTITION_ONLY_SHUFFLE [RS_32] PartitionCols:_col1, _col2, _col3 - Merge Join Operator [MERGEJOIN_95] (rows=63350266 width=77) - 
Conds:RS_117._col0=RS_114._col0(Inner),Output:["_col1","_col2","_col3","_col4"] - <-Map 12 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_114] + Merge Join Operator [MERGEJOIN_198] (rows=63350266 width=77) + Conds:RS_227._col0=RS_220._col0(Inner),Output:["_col1","_col2","_col3","_col4"] + <-Map 13 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_220] PartitionCols:_col0 - Select Operator [SEL_112] (rows=4058 width=1119) + Select Operator [SEL_217] (rows=4058 width=1119) Output:["_col0"] - Filter Operator [FIL_110] (rows=4058 width=1119) + Filter Operator [FIL_215] (rows=4058 width=1119) predicate:((d_year = 1999) and d_date_sk is not null and d_moy BETWEEN 4 AND 7) TableScan [TS_9] (rows=73049 width=1119) default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] - <-Map 14 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_117] + <-Map 19 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_227] PartitionCols:_col0 - Select Operator [SEL_116] (rows=57591150 width=77) + Select Operator [SEL_226] (rows=57591150 width=77) Output:["_col0","_col1","_col2","_col3","_col4"] - Filter Operator [FIL_115] (rows=57591150 width=77) + Filter Operator [FIL_225] (rows=57591150 width=77) predicate:(sr_customer_sk is not null and sr_item_sk is not null and sr_returned_date_sk is not null and sr_ticket_number is not null) TableScan [TS_12] (rows=57591150 width=77) default@store_returns,store_returns,Tbl:COMPLETE,Col:NONE,Output:["sr_returned_date_sk","sr_item_sk","sr_customer_sk","sr_ticket_number","sr_return_quantity"] - <-Reducer 8 [SIMPLE_EDGE] + <-Reducer 9 [SIMPLE_EDGE] SHUFFLE [RS_31] PartitionCols:_col1, _col2, _col4 - Merge Join Operator [MERGEJOIN_94] (rows=633595212 width=88) - Conds:RS_108._col0=RS_113._col0(Inner),Output:["_col1","_col2","_col3","_col4","_col5"] - <-Map 12 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_113] + Merge Join Operator [MERGEJOIN_197] (rows=633595212 width=88) + Conds:RS_252._col0=RS_218._col0(Inner),Output:["_col1","_col2","_col3","_col4","_col5"] + <-Map 13 [SIMPLE_EDGE] 
vectorized + SHUFFLE [RS_218] PartitionCols:_col0 - Select Operator [SEL_111] (rows=18262 width=1119) + Select Operator [SEL_216] (rows=18262 width=1119) Output:["_col0"] - Filter Operator [FIL_109] (rows=18262 width=1119) + Filter Operator [FIL_214] (rows=18262 width=1119) predicate:((d_moy = 4) and (d_year = 1999) and d_date_sk is not null) Please refer to the previous TableScan [TS_9] - <-Map 7 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_108] + <-Map 8 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_252] PartitionCols:_col0 - Select Operator [SEL_107] (rows=575995635 width=88) + Select Operator [SEL_251] (rows=575995635 width=88) Output:["_col0","_col1","_col2","_col3","_col4","_col5"] - Filter Operator [FIL_106] (rows=575995635 width=88) - predicate:(ss_customer_sk is not null and ss_item_sk is not null and ss_sold_date_sk is not null and ss_store_sk is not null and ss_ticket_number is not null) + Filter Operator [FIL_250] (rows=575995635 width=88) + predicate:((ss_customer_sk BETWEEN DynamicValue(RS_32_store_returns_sr_customer_sk_min) AND DynamicValue(RS_32_store_returns_sr_customer_sk_max) and in_bloom_filter(ss_customer_sk, DynamicValue(RS_32_store_returns_sr_customer_sk_bloom_filter))) and (ss_item_sk BETWEEN DynamicValue(RS_32_store_returns_sr_item_sk_min) AND DynamicValue(RS_32_store_returns_sr_item_sk_max) and in_bloom_filter(ss_item_sk, DynamicValue(RS_32_store_returns_sr_item_sk_bloom_filter))) and (ss_item_sk BETWEEN DynamicValue(RS_35_item_i_item_sk_min) AND DynamicValue(RS_35_item_i_item_sk_max) and in_bloom_filter(ss_item_sk, DynamicValue(RS_35_item_i_item_sk_bloom_filter))) and (ss_sold_date_sk BETWEEN DynamicValue(RS_29_d1_d_date_sk_min) AND DynamicValue(RS_29_d1_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk, DynamicValue(RS_29_d1_d_date_sk_bloom_filter))) and (ss_store_sk BETWEEN DynamicValue(RS_38_store_s_store_sk_min) AND DynamicValue(RS_38_store_s_store_sk_max) and in_bloom_filter(ss_store_sk, DynamicValue(RS_38_store_s_store_sk_bloom_filter))) and 
(ss_ticket_number BETWEEN DynamicValue(RS_32_store_returns_sr_ticket_number_min) AND DynamicValue(RS_32_store_returns_sr_ticket_number_max) and in_bloom_filter(ss_ticket_number, DynamicValue(RS_32_store_returns_sr_ticket_number_bloom_filter))) and ss_customer_sk is not null and ss_item_sk is not null and ss_sold_date_sk is not null and ss_store_sk is not null and ss_ticket_number is not null) TableScan [TS_6] (rows=575995635 width=88) default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_customer_sk","ss_store_sk","ss_ticket_number","ss_quantity"] + <-Reducer 14 [BROADCAST_EDGE] vectorized + BROADCAST [RS_224] + Group By Operator [GBY_223] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 13 [CUSTOM_SIMPLE_EDGE] vectorized + SHUFFLE [RS_222] + Group By Operator [GBY_221] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_219] (rows=18262 width=1119) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_216] + <-Reducer 16 [BROADCAST_EDGE] vectorized + BROADCAST [RS_229] + Group By Operator [GBY_228] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=63350264)"] + <-Reducer 15 [CUSTOM_SIMPLE_EDGE] + PARTITION_ONLY_SHUFFLE [RS_120] + Group By Operator [GBY_119] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=63350264)"] + Select Operator [SEL_118] (rows=63350266 width=77) + Output:["_col0"] + Please refer to the previous Merge Join Operator [MERGEJOIN_198] + <-Reducer 17 [BROADCAST_EDGE] vectorized + BROADCAST [RS_231] + Group By Operator [GBY_230] (rows=1 width=12) + 
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=63350264)"] + <-Reducer 15 [CUSTOM_SIMPLE_EDGE] + PARTITION_ONLY_SHUFFLE [RS_125] + Group By Operator [GBY_124] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=63350264)"] + Select Operator [SEL_123] (rows=63350266 width=77) + Output:["_col0"] + Please refer to the previous Merge Join Operator [MERGEJOIN_198] + <-Reducer 18 [BROADCAST_EDGE] vectorized + BROADCAST [RS_233] + Group By Operator [GBY_232] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=63350264)"] + <-Reducer 15 [CUSTOM_SIMPLE_EDGE] + PARTITION_ONLY_SHUFFLE [RS_130] + Group By Operator [GBY_129] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=63350264)"] + Select Operator [SEL_128] (rows=63350266 width=77) + Output:["_col0"] + Please refer to the previous Merge Join Operator [MERGEJOIN_198] + <-Reducer 21 [BROADCAST_EDGE] vectorized + BROADCAST [RS_241] + Group By Operator [GBY_240] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 20 [CUSTOM_SIMPLE_EDGE] vectorized + PARTITION_ONLY_SHUFFLE [RS_239] + Group By Operator [GBY_238] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_237] (rows=462000 width=1436) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_235] + <-Reducer 23 [BROADCAST_EDGE] vectorized + BROADCAST [RS_249] + Group By Operator [GBY_248] (rows=1 width=12) + 
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 22 [CUSTOM_SIMPLE_EDGE] vectorized + PARTITION_ONLY_SHUFFLE [RS_247] + Group By Operator [GBY_246] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_245] (rows=1704 width=1910) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_243] <-Reducer 2 [SIMPLE_EDGE] SHUFFLE [RS_44] PartitionCols:_col1, _col2 - Merge Join Operator [MERGEJOIN_93] (rows=316788826 width=135) - Conds:RS_102._col0=RS_105._col0(Inner),Output:["_col1","_col2","_col3"] - <-Map 1 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_102] - PartitionCols:_col0 - Select Operator [SEL_101] (rows=287989836 width=135) - Output:["_col0","_col1","_col2","_col3"] - Filter Operator [FIL_100] (rows=287989836 width=135) - predicate:(cs_bill_customer_sk is not null and cs_item_sk is not null and cs_sold_date_sk is not null) - TableScan [TS_0] (rows=287989836 width=135) - default@catalog_sales,catalog_sales,Tbl:COMPLETE,Col:NONE,Output:["cs_sold_date_sk","cs_bill_customer_sk","cs_item_sk","cs_quantity"] + Merge Join Operator [MERGEJOIN_196] (rows=316788826 width=135) + Conds:RS_213._col0=RS_205._col0(Inner),Output:["_col1","_col2","_col3"] <-Map 6 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_105] + PARTITION_ONLY_SHUFFLE [RS_205] PartitionCols:_col0 - Select Operator [SEL_104] (rows=36525 width=1119) + Select Operator [SEL_204] (rows=36525 width=1119) Output:["_col0"] - Filter Operator [FIL_103] (rows=36525 width=1119) + Filter Operator [FIL_203] (rows=36525 width=1119) predicate:((d_year) IN (1999, 2000, 2001) and d_date_sk is not null) TableScan [TS_3] (rows=73049 width=1119) default@date_dim,d3,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] + <-Map 1 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_213] + PartitionCols:_col0 + Select Operator [SEL_212] 
(rows=287989836 width=135) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_211] (rows=287989836 width=135) + predicate:((cs_sold_date_sk BETWEEN DynamicValue(RS_42_d3_d_date_sk_min) AND DynamicValue(RS_42_d3_d_date_sk_max) and in_bloom_filter(cs_sold_date_sk, DynamicValue(RS_42_d3_d_date_sk_bloom_filter))) and cs_bill_customer_sk is not null and cs_item_sk is not null and cs_sold_date_sk is not null) + TableScan [TS_0] (rows=287989836 width=135) + default@catalog_sales,catalog_sales,Tbl:COMPLETE,Col:NONE,Output:["cs_sold_date_sk","cs_bill_customer_sk","cs_item_sk","cs_quantity"] + <-Reducer 7 [BROADCAST_EDGE] vectorized + BROADCAST [RS_210] + Group By Operator [GBY_209] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 6 [CUSTOM_SIMPLE_EDGE] vectorized + PARTITION_ONLY_SHUFFLE [RS_208] + Group By Operator [GBY_207] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_206] (rows=36525 width=1119) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_204] http://git-wip-us.apache.org/repos/asf/hive/blob/f2c4f319/ql/src/test/results/clientpositive/perf/tez/query3.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/perf/tez/query3.q.out b/ql/src/test/results/clientpositive/perf/tez/query3.q.out index c655c1b..801b4f9 100644 --- a/ql/src/test/results/clientpositive/perf/tez/query3.q.out +++ b/ql/src/test/results/clientpositive/perf/tez/query3.q.out @@ -41,62 +41,87 @@ POSTHOOK: type: QUERY Plan optimized by CBO. 
Vertex dependency in root stage +Map 1 <- Reducer 7 (BROADCAST_EDGE), Reducer 9 (BROADCAST_EDGE) Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 6 (SIMPLE_EDGE) -Reducer 3 <- Map 7 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) +Reducer 3 <- Map 8 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Reducer 5 <- Reducer 4 (SIMPLE_EDGE) +Reducer 7 <- Map 6 (CUSTOM_SIMPLE_EDGE) +Reducer 9 <- Map 8 (CUSTOM_SIMPLE_EDGE) Stage-0 Fetch Operator limit:100 Stage-1 Reducer 5 vectorized - File Output Operator [FS_47] - Limit [LIM_46] (rows=100 width=88) + File Output Operator [FS_77] + Limit [LIM_76] (rows=100 width=88) Number of rows:100 - Select Operator [SEL_45] (rows=348477374 width=88) + Select Operator [SEL_75] (rows=348477374 width=88) Output:["_col0","_col1","_col2","_col3"] <-Reducer 4 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_44] - Group By Operator [GBY_43] (rows=348477374 width=88) + SHUFFLE [RS_74] + Group By Operator [GBY_73] (rows=348477374 width=88) Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 <-Reducer 3 [SIMPLE_EDGE] SHUFFLE [RS_17] PartitionCols:_col0, _col1, _col2 Group By Operator [GBY_16] (rows=696954748 width=88) Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(_col2)"],keys:_col8, _col4, _col5 - Merge Join Operator [MERGEJOIN_33] (rows=696954748 width=88) - Conds:RS_12._col0=RS_42._col0(Inner),Output:["_col2","_col4","_col5","_col8"] - <-Map 7 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_42] + Merge Join Operator [MERGEJOIN_53] (rows=696954748 width=88) + Conds:RS_12._col0=RS_64._col0(Inner),Output:["_col2","_col4","_col5","_col8"] + <-Map 8 [SIMPLE_EDGE] vectorized + PARTITION_ONLY_SHUFFLE [RS_64] PartitionCols:_col0 - Select Operator [SEL_41] (rows=36524 width=1119) + Select Operator [SEL_63] (rows=36524 width=1119) Output:["_col0","_col1"] - Filter Operator [FIL_40] (rows=36524 width=1119) + Filter Operator [FIL_62] (rows=36524 width=1119) predicate:((d_moy = 12) and 
d_date_sk is not null) TableScan [TS_6] (rows=73049 width=1119) default@date_dim,dt,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] <-Reducer 2 [SIMPLE_EDGE] SHUFFLE [RS_12] PartitionCols:_col0 - Merge Join Operator [MERGEJOIN_32] (rows=633595212 width=88) - Conds:RS_36._col1=RS_39._col0(Inner),Output:["_col0","_col2","_col4","_col5"] - <-Map 1 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_36] - PartitionCols:_col1 - Select Operator [SEL_35] (rows=575995635 width=88) - Output:["_col0","_col1","_col2"] - Filter Operator [FIL_34] (rows=575995635 width=88) - predicate:(ss_item_sk is not null and ss_sold_date_sk is not null) - TableScan [TS_0] (rows=575995635 width=88) - default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_ext_sales_price"] + Merge Join Operator [MERGEJOIN_52] (rows=633595212 width=88) + Conds:RS_72._col1=RS_56._col0(Inner),Output:["_col0","_col2","_col4","_col5"] <-Map 6 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_39] + PARTITION_ONLY_SHUFFLE [RS_56] PartitionCols:_col0 - Select Operator [SEL_38] (rows=231000 width=1436) + Select Operator [SEL_55] (rows=231000 width=1436) Output:["_col0","_col1","_col2"] - Filter Operator [FIL_37] (rows=231000 width=1436) + Filter Operator [FIL_54] (rows=231000 width=1436) predicate:((i_manufact_id = 436) and i_item_sk is not null) TableScan [TS_3] (rows=462000 width=1436) default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_brand_id","i_brand","i_manufact_id"] + <-Map 1 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_72] + PartitionCols:_col1 + Select Operator [SEL_71] (rows=575995635 width=88) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_70] (rows=575995635 width=88) + predicate:((ss_item_sk BETWEEN DynamicValue(RS_10_item_i_item_sk_min) AND DynamicValue(RS_10_item_i_item_sk_max) and in_bloom_filter(ss_item_sk, DynamicValue(RS_10_item_i_item_sk_bloom_filter))) and (ss_sold_date_sk BETWEEN DynamicValue(RS_13_dt_d_date_sk_min) AND 
DynamicValue(RS_13_dt_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk, DynamicValue(RS_13_dt_d_date_sk_bloom_filter))) and ss_item_sk is not null and ss_sold_date_sk is not null) + TableScan [TS_0] (rows=575995635 width=88) + default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_ext_sales_price"] + <-Reducer 7 [BROADCAST_EDGE] vectorized + BROADCAST [RS_61] + Group By Operator [GBY_60] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 6 [CUSTOM_SIMPLE_EDGE] vectorized + PARTITION_ONLY_SHUFFLE [RS_59] + Group By Operator [GBY_58] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_57] (rows=231000 width=1436) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_55] + <-Reducer 9 [BROADCAST_EDGE] vectorized + BROADCAST [RS_69] + Group By Operator [GBY_68] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 8 [CUSTOM_SIMPLE_EDGE] vectorized + PARTITION_ONLY_SHUFFLE [RS_67] + Group By Operator [GBY_66] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_65] (rows=36524 width=1119) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_63] http://git-wip-us.apache.org/repos/asf/hive/blob/f2c4f319/ql/src/test/results/clientpositive/perf/tez/query30.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/perf/tez/query30.q.out b/ql/src/test/results/clientpositive/perf/tez/query30.q.out index 4d0e2d4..802a6e7 100644 --- a/ql/src/test/results/clientpositive/perf/tez/query30.q.out 
+++ b/ql/src/test/results/clientpositive/perf/tez/query30.q.out @@ -77,37 +77,37 @@ Stage-0 limit:100 Stage-1 Reducer 4 vectorized - File Output Operator [FS_140] - Limit [LIM_139] (rows=100 width=860) + File Output Operator [FS_210] + Limit [LIM_209] (rows=100 width=860) Number of rows:100 - Select Operator [SEL_138] (rows=96800003 width=860) + Select Operator [SEL_208] (rows=96800003 width=860) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12"] <-Reducer 3 [SIMPLE_EDGE] SHUFFLE [RS_63] Select Operator [SEL_62] (rows=96800003 width=860) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12"] - Merge Join Operator [MERGEJOIN_107] (rows=96800003 width=860) + Merge Join Operator [MERGEJOIN_177] (rows=96800003 width=860) Conds:RS_59._col0=RS_60._col0(Inner),Output:["_col1","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col18"] <-Reducer 2 [SIMPLE_EDGE] SHUFFLE [RS_59] PartitionCols:_col0 - Merge Join Operator [MERGEJOIN_101] (rows=88000001 width=860) - Conds:RS_110._col2=RS_117._col0(Inner),Output:["_col0","_col1","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13"] + Merge Join Operator [MERGEJOIN_171] (rows=88000001 width=860) + Conds:RS_180._col2=RS_187._col0(Inner),Output:["_col0","_col1","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13"] <-Map 5 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_117] + SHUFFLE [RS_187] PartitionCols:_col0 - Select Operator [SEL_114] (rows=20000000 width=1014) + Select Operator [SEL_184] (rows=20000000 width=1014) Output:["_col0"] - Filter Operator [FIL_111] (rows=20000000 width=1014) + Filter Operator [FIL_181] (rows=20000000 width=1014) predicate:((ca_state = 'IL') and ca_address_sk is not null) TableScan [TS_3] (rows=40000000 width=1014) 
default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_state"] <-Map 1 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_110] + SHUFFLE [RS_180] PartitionCols:_col2 - Select Operator [SEL_109] (rows=80000000 width=860) + Select Operator [SEL_179] (rows=80000000 width=860) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13"] - Filter Operator [FIL_108] (rows=80000000 width=860) + Filter Operator [FIL_178] (rows=80000000 width=860) predicate:(c_current_addr_sk is not null and c_customer_sk is not null) TableScan [TS_0] (rows=80000000 width=860) default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_customer_id","c_current_addr_sk","c_salutation","c_first_name","c_last_name","c_preferred_cust_flag","c_birth_day","c_birth_month","c_birth_year","c_birth_country","c_login","c_email_address","c_last_review_date"] @@ -118,94 +118,94 @@ Stage-0 Output:["_col0","_col2"] Filter Operator [FIL_54] (rows=8066666 width=1014) predicate:(_col2 > _col3) - Merge Join Operator [MERGEJOIN_106] (rows=24200000 width=1014) - Conds:RS_132._col1=RS_137._col1(Inner),Output:["_col0","_col2","_col3"] + Merge Join Operator [MERGEJOIN_176] (rows=24200000 width=1014) + Conds:RS_202._col1=RS_207._col1(Inner),Output:["_col0","_col2","_col3"] <-Reducer 10 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_137] + SHUFFLE [RS_207] PartitionCols:_col1 - Select Operator [SEL_136] (rows=11000000 width=1014) + Select Operator [SEL_206] (rows=11000000 width=1014) Output:["_col0","_col1"] - Group By Operator [GBY_135] (rows=11000000 width=1014) + Group By Operator [GBY_205] (rows=11000000 width=1014) Output:["_col0","_col1","_col2"],aggregations:["sum(_col2)","count(_col2)"],keys:_col0 - Select Operator [SEL_134] (rows=22000000 width=1014) + Select Operator [SEL_204] (rows=22000000 width=1014) Output:["_col0","_col2"] - Group By Operator [GBY_133] (rows=22000000 width=1014) + Group By Operator [GBY_203] 
(rows=22000000 width=1014) Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1 <-Reducer 9 [SIMPLE_EDGE] SHUFFLE [RS_43] PartitionCols:_col0 Group By Operator [GBY_42] (rows=44000000 width=1014) Output:["_col0","_col1","_col2"],aggregations:["sum(_col3)"],keys:_col7, _col1 - Merge Join Operator [MERGEJOIN_105] (rows=44000000 width=1014) - Conds:RS_38._col2=RS_119._col0(Inner),Output:["_col1","_col3","_col7"] + Merge Join Operator [MERGEJOIN_175] (rows=44000000 width=1014) + Conds:RS_38._col2=RS_189._col0(Inner),Output:["_col1","_col3","_col7"] <-Map 5 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_119] + SHUFFLE [RS_189] PartitionCols:_col0 - Select Operator [SEL_116] (rows=40000000 width=1014) + Select Operator [SEL_186] (rows=40000000 width=1014) Output:["_col0","_col1"] - Filter Operator [FIL_113] (rows=40000000 width=1014) + Filter Operator [FIL_183] (rows=40000000 width=1014) predicate:(ca_address_sk is not null and ca_state is not null) Please refer to the previous TableScan [TS_3] <-Reducer 13 [SIMPLE_EDGE] SHUFFLE [RS_38] PartitionCols:_col2 - Merge Join Operator [MERGEJOIN_104] (rows=15838314 width=92) - Conds:RS_125._col0=RS_129._col0(Inner),Output:["_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_174] (rows=15838314 width=92) + Conds:RS_195._col0=RS_199._col0(Inner),Output:["_col1","_col2","_col3"] <-Map 11 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_125] + SHUFFLE [RS_195] PartitionCols:_col0 - Select Operator [SEL_123] (rows=14398467 width=92) + Select Operator [SEL_193] (rows=14398467 width=92) Output:["_col0","_col1","_col2","_col3"] - Filter Operator [FIL_121] (rows=14398467 width=92) + Filter Operator [FIL_191] (rows=14398467 width=92) predicate:(wr_returned_date_sk is not null and wr_returning_addr_sk is not null) TableScan [TS_6] (rows=14398467 width=92) default@web_returns,web_returns,Tbl:COMPLETE,Col:NONE,Output:["wr_returned_date_sk","wr_returning_customer_sk","wr_returning_addr_sk","wr_return_amt"] <-Map 
14 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_129] + SHUFFLE [RS_199] PartitionCols:_col0 - Select Operator [SEL_127] (rows=36524 width=1119) + Select Operator [SEL_197] (rows=36524 width=1119) Output:["_col0"] - Filter Operator [FIL_126] (rows=36524 width=1119) + Filter Operator [FIL_196] (rows=36524 width=1119) predicate:((d_year = 2002) and d_date_sk is not null) TableScan [TS_9] (rows=73049 width=1119) default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] <-Reducer 7 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_132] + SHUFFLE [RS_202] PartitionCols:_col1 - Select Operator [SEL_131] (rows=22000000 width=1014) + Select Operator [SEL_201] (rows=22000000 width=1014) Output:["_col0","_col1","_col2"] - Group By Operator [GBY_130] (rows=22000000 width=1014) + Group By Operator [GBY_200] (rows=22000000 width=1014) Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1 <-Reducer 6 [SIMPLE_EDGE] SHUFFLE [RS_23] PartitionCols:_col0, _col1 Group By Operator [GBY_22] (rows=44000000 width=1014) Output:["_col0","_col1","_col2"],aggregations:["sum(_col3)"],keys:_col7, _col1 - Merge Join Operator [MERGEJOIN_103] (rows=44000000 width=1014) - Conds:RS_18._col2=RS_118._col0(Inner),Output:["_col1","_col3","_col7"] + Merge Join Operator [MERGEJOIN_173] (rows=44000000 width=1014) + Conds:RS_18._col2=RS_188._col0(Inner),Output:["_col1","_col3","_col7"] <-Map 5 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_118] + SHUFFLE [RS_188] PartitionCols:_col0 - Select Operator [SEL_115] (rows=40000000 width=1014) + Select Operator [SEL_185] (rows=40000000 width=1014) Output:["_col0","_col1"] - Filter Operator [FIL_112] (rows=40000000 width=1014) + Filter Operator [FIL_182] (rows=40000000 width=1014) predicate:(ca_address_sk is not null and ca_state is not null) Please refer to the previous TableScan [TS_3] <-Reducer 12 [SIMPLE_EDGE] SHUFFLE [RS_18] PartitionCols:_col2 - Merge Join Operator [MERGEJOIN_102] (rows=15838314 width=92) - 
Conds:RS_124._col0=RS_128._col0(Inner),Output:["_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_172] (rows=15838314 width=92) + Conds:RS_194._col0=RS_198._col0(Inner),Output:["_col1","_col2","_col3"] <-Map 11 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_124] + SHUFFLE [RS_194] PartitionCols:_col0 - Select Operator [SEL_122] (rows=14398467 width=92) + Select Operator [SEL_192] (rows=14398467 width=92) Output:["_col0","_col1","_col2","_col3"] - Filter Operator [FIL_120] (rows=14398467 width=92) + Filter Operator [FIL_190] (rows=14398467 width=92) predicate:(wr_returned_date_sk is not null and wr_returning_addr_sk is not null and wr_returning_customer_sk is not null) Please refer to the previous TableScan [TS_6] <-Map 14 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_128] + SHUFFLE [RS_198] PartitionCols:_col0 - Please refer to the previous Select Operator [SEL_127] + Please refer to the previous Select Operator [SEL_197]
