http://git-wip-us.apache.org/repos/asf/hive/blob/f2c4f319/ql/src/test/results/clientpositive/perf/spark/query95.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/perf/spark/query95.q.out b/ql/src/test/results/clientpositive/perf/spark/query95.q.out index b0df142..abb95f9 100644 --- a/ql/src/test/results/clientpositive/perf/spark/query95.q.out +++ b/ql/src/test/results/clientpositive/perf/spark/query95.q.out @@ -75,6 +75,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: web_site + filterExpr: ((web_company_name = 'pri') and web_site_sk is not null) (type: boolean) Statistics: Num rows: 84 Data size: 155408 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: ((web_company_name = 'pri') and web_site_sk is not null) (type: boolean) @@ -99,6 +100,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: date_dim + filterExpr: (CAST( d_date AS TIMESTAMP) BETWEEN TIMESTAMP'1999-05-01 00:00:00.0' AND TIMESTAMP'1999-06-30 00:00:00.0' and d_date_sk is not null) (type: boolean) Statistics: Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: (CAST( d_date AS TIMESTAMP) BETWEEN TIMESTAMP'1999-05-01 00:00:00.0' AND TIMESTAMP'1999-06-30 00:00:00.0' and d_date_sk is not null) (type: boolean) @@ -134,6 +136,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: ws1 + filterExpr: (ws_order_number is not null and ws_ship_date_sk is not null and ws_ship_addr_sk is not null and ws_web_site_sk is not null) (type: boolean) Statistics: Num rows: 144002668 Data size: 19580198212 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: (ws_order_number is not null and ws_ship_addr_sk is not null and ws_ship_date_sk is not null and ws_web_site_sk is not null) (type: boolean) @@ -165,6 +168,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: ws1 + filterExpr: ws_order_number is not null (type: boolean) Statistics: Num rows: 144002668 Data size: 19580198212 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: ws_order_number is not null (type: boolean) @@ -184,6 +188,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: ws2 + filterExpr: ws_order_number is not null (type: boolean) Statistics: Num rows: 144002668 Data size: 19580198212 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: ws_order_number is not null (type: boolean) @@ -203,6 +208,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: ws1 + filterExpr: ws_order_number is not null (type: boolean) Statistics: Num rows: 144002668 Data size: 19580198212 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: ws_order_number is not null (type: boolean) @@ -222,6 +228,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: ws2 + filterExpr: ws_order_number is not null (type: boolean) Statistics: Num rows: 144002668 Data size: 19580198212 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: ws_order_number is not null (type: boolean) @@ -241,6 +248,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: web_returns + filterExpr: wr_order_number is not null (type: boolean) Statistics: Num rows: 14398467 Data size: 1325194184 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: wr_order_number is not null (type: boolean) @@ -259,6 +267,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: customer_address + filterExpr: ((ca_state = 'TX') and ca_address_sk is not null) (type: boolean) Statistics: Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: ((ca_state = 'TX') and ca_address_sk is not null) (type: boolean)
http://git-wip-us.apache.org/repos/asf/hive/blob/f2c4f319/ql/src/test/results/clientpositive/perf/spark/query96.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/perf/spark/query96.q.out b/ql/src/test/results/clientpositive/perf/spark/query96.q.out index 68af7a4..ba41c76 100644 --- a/ql/src/test/results/clientpositive/perf/spark/query96.q.out +++ b/ql/src/test/results/clientpositive/perf/spark/query96.q.out @@ -42,6 +42,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: time_dim + filterExpr: ((t_hour = 8) and (t_minute >= 30) and t_time_sk is not null) (type: boolean) Statistics: Num rows: 86400 Data size: 40694400 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: ((t_hour = 8) and (t_minute >= 30) and t_time_sk is not null) (type: boolean) @@ -61,6 +62,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: household_demographics + filterExpr: ((hd_dep_count = 5) and hd_demo_sk is not null) (type: boolean) Statistics: Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: ((hd_dep_count = 5) and hd_demo_sk is not null) (type: boolean) @@ -80,6 +82,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: store + filterExpr: ((s_store_name = 'ese') and s_store_sk is not null) (type: boolean) Statistics: Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: ((s_store_name = 'ese') and s_store_sk is not null) (type: boolean) @@ -107,6 +110,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: store_sales + filterExpr: (ss_hdemo_sk is not null and ss_sold_time_sk is not null and ss_store_sk is not null) (type: boolean) Statistics: Num rows: 575995635 Data size: 50814502088 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: (ss_hdemo_sk is not null and ss_sold_time_sk is not null and ss_store_sk is not null) (type: boolean) http://git-wip-us.apache.org/repos/asf/hive/blob/f2c4f319/ql/src/test/results/clientpositive/perf/spark/query97.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/perf/spark/query97.q.out b/ql/src/test/results/clientpositive/perf/spark/query97.q.out index 1908e48..c4f4804 100644 --- a/ql/src/test/results/clientpositive/perf/spark/query97.q.out +++ b/ql/src/test/results/clientpositive/perf/spark/query97.q.out @@ -61,6 +61,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: date_dim + filterExpr: (d_month_seq BETWEEN 1212 AND 1223 and d_date_sk is not null) (type: boolean) Statistics: Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: (d_date_sk is not null and d_month_seq BETWEEN 1212 AND 1223) (type: boolean) @@ -85,6 +86,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: date_dim + filterExpr: (d_month_seq BETWEEN 1212 AND 1223 and d_date_sk is not null) (type: boolean) Statistics: Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: (d_date_sk is not null and d_month_seq BETWEEN 1212 AND 1223) (type: boolean) @@ -114,6 +116,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: store_sales + filterExpr: ss_sold_date_sk is not null (type: boolean) Statistics: Num rows: 575995635 Data size: 50814502088 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: ss_sold_date_sk is not null (type: boolean) @@ -149,6 +152,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: catalog_sales + filterExpr: cs_sold_date_sk is not null (type: boolean) Statistics: Num rows: 287989836 Data size: 38999608952 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: cs_sold_date_sk is not null (type: boolean) http://git-wip-us.apache.org/repos/asf/hive/blob/f2c4f319/ql/src/test/results/clientpositive/perf/spark/query98.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/perf/spark/query98.q.out b/ql/src/test/results/clientpositive/perf/spark/query98.q.out index c69032b..d3f6670 100644 --- a/ql/src/test/results/clientpositive/perf/spark/query98.q.out +++ b/ql/src/test/results/clientpositive/perf/spark/query98.q.out @@ -74,6 +74,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: date_dim + filterExpr: (CAST( d_date AS TIMESTAMP) BETWEEN TIMESTAMP'2001-01-12 00:00:00.0' AND TIMESTAMP'2001-02-11 00:00:00.0' and d_date_sk is not null) (type: boolean) Statistics: Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: (CAST( d_date AS TIMESTAMP) BETWEEN TIMESTAMP'2001-01-12 00:00:00.0' AND TIMESTAMP'2001-02-11 00:00:00.0' and d_date_sk is not null) (type: boolean) @@ -103,6 +104,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: store_sales + filterExpr: (ss_item_sk is not null and ss_sold_date_sk is not null) (type: boolean) Statistics: Num rows: 575995635 Data size: 50814502088 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: (ss_item_sk is not null and ss_sold_date_sk is not null) (type: boolean) @@ -134,6 +136,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: item + filterExpr: ((i_category) IN ('Jewelry', 'Sports', 'Books') and i_item_sk is not null) (type: boolean) Statistics: Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: ((i_category) IN ('Jewelry', 'Sports', 'Books') and i_item_sk is not null) (type: boolean) http://git-wip-us.apache.org/repos/asf/hive/blob/f2c4f319/ql/src/test/results/clientpositive/perf/spark/query99.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/perf/spark/query99.q.out b/ql/src/test/results/clientpositive/perf/spark/query99.q.out index 1e584ae..f541da8 100644 --- a/ql/src/test/results/clientpositive/perf/spark/query99.q.out +++ b/ql/src/test/results/clientpositive/perf/spark/query99.q.out @@ -80,6 +80,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: date_dim + filterExpr: (d_month_seq BETWEEN 1212 AND 1223 and d_date_sk is not null) (type: boolean) Statistics: Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: (d_date_sk is not null and d_month_seq BETWEEN 1212 AND 1223) (type: boolean) @@ -99,6 +100,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: call_center + filterExpr: cc_call_center_sk is not null (type: boolean) Statistics: Num rows: 60 Data size: 122700 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: cc_call_center_sk is not null (type: boolean) @@ -118,6 +120,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: warehouse + filterExpr: w_warehouse_sk is not null (type: boolean) Statistics: Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: w_warehouse_sk is not null (type: boolean) @@ -137,6 +140,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: ship_mode + filterExpr: sm_ship_mode_sk is not null (type: boolean) Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE Filter Operator predicate: sm_ship_mode_sk is not null (type: boolean) @@ -164,6 +168,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: catalog_sales + filterExpr: (cs_warehouse_sk is not null and cs_ship_mode_sk is not null and cs_call_center_sk is not null and cs_ship_date_sk is not null) (type: boolean) Statistics: Num rows: 287989836 Data size: 38999608952 Basic stats: COMPLETE Column stats: NONE Filter Operator predicate: (cs_call_center_sk is not null and cs_ship_date_sk is not null and cs_ship_mode_sk is not null and cs_warehouse_sk is not null) (type: boolean) http://git-wip-us.apache.org/repos/asf/hive/blob/f2c4f319/ql/src/test/results/clientpositive/perf/tez/query1.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/perf/tez/query1.q.out b/ql/src/test/results/clientpositive/perf/tez/query1.q.out index ea6e0da..579940c 100644 --- a/ql/src/test/results/clientpositive/perf/tez/query1.q.out +++ b/ql/src/test/results/clientpositive/perf/tez/query1.q.out @@ -63,10 +63,10 @@ Stage-0 limit:100 Stage-1 Reducer 7 vectorized - File Output Operator [FS_108] - Limit [LIM_107] (rows=100 width=860) + File Output Operator [FS_159] + Limit [LIM_158] (rows=100 width=860) Number of rows:100 - Select Operator [SEL_106] (rows=32266667 width=860) + Select Operator [SEL_157] (rows=32266667 width=860) Output:["_col0"] <-Reducer 6 [SIMPLE_EDGE] SHUFFLE [RS_50] @@ -74,96 +74,96 @@ Stage-0 Output:["_col0"] Filter Operator [FIL_48] (rows=32266667 width=860) predicate:(_col2 > _col7) - Merge Join Operator [MERGEJOIN_81] (rows=96800003 width=860) - Conds:RS_45._col1=RS_105._col1(Inner),Output:["_col2","_col6","_col7"] + Merge Join Operator [MERGEJOIN_132] (rows=96800003 width=860) + Conds:RS_45._col1=RS_156._col1(Inner),Output:["_col2","_col6","_col7"] <-Reducer 5 [SIMPLE_EDGE] SHUFFLE [RS_45] PartitionCols:_col1 - Merge Join Operator [MERGEJOIN_79] (rows=88000001 width=860) - Conds:RS_42._col0=RS_100._col0(Inner),Output:["_col1","_col2","_col6"] + Merge Join Operator [MERGEJOIN_130] (rows=88000001 width=860) + Conds:RS_42._col0=RS_151._col0(Inner),Output:["_col1","_col2","_col6"] <-Map 12 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_100] + SHUFFLE [RS_151] PartitionCols:_col0 - Select Operator [SEL_99] (rows=80000000 width=860) + Select Operator [SEL_150] (rows=80000000 width=860) Output:["_col0","_col1"] - Filter Operator [FIL_98] (rows=80000000 width=860) + Filter Operator [FIL_149] (rows=80000000 width=860) predicate:c_customer_sk is not null TableScan [TS_17] (rows=80000000 width=860) default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_customer_id"] <-Reducer 4 [SIMPLE_EDGE] SHUFFLE [RS_42] PartitionCols:_col0 - Merge Join Operator [MERGEJOIN_78] (rows=34842647 width=77) - Conds:RS_94._col1=RS_97._col0(Inner),Output:["_col0","_col1","_col2"] + Merge Join Operator [MERGEJOIN_129] (rows=34842647 width=77) + Conds:RS_145._col1=RS_148._col0(Inner),Output:["_col0","_col1","_col2"] <-Map 11 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_97] + SHUFFLE [RS_148] PartitionCols:_col0 - Select Operator [SEL_96] (rows=852 width=1910) + Select Operator [SEL_147] (rows=852 width=1910) Output:["_col0"] - Filter Operator [FIL_95] (rows=852 width=1910) + Filter Operator [FIL_146] (rows=852 width=1910) predicate:((s_state = 'NM') and s_store_sk is not null) TableScan [TS_14] (rows=1704 width=1910) default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_state"] <-Reducer 3 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_94] + SHUFFLE [RS_145] PartitionCols:_col1 - Select Operator [SEL_93] (rows=31675133 width=77) + Select Operator [SEL_144] (rows=31675133 width=77) Output:["_col0","_col1","_col2"] - Group By Operator [GBY_92] (rows=31675133 width=77) + Group By Operator [GBY_143] (rows=31675133 width=77) Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1 <-Reducer 2 [SIMPLE_EDGE] SHUFFLE [RS_11] PartitionCols:_col0, _col1 Group By Operator [GBY_10] (rows=63350266 width=77) Output:["_col0","_col1","_col2"],aggregations:["sum(_col3)"],keys:_col2, _col1 - Merge Join Operator [MERGEJOIN_77] (rows=63350266 width=77) - Conds:RS_86._col0=RS_90._col0(Inner),Output:["_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_128] (rows=63350266 width=77) + Conds:RS_137._col0=RS_141._col0(Inner),Output:["_col1","_col2","_col3"] <-Map 1 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_86] + SHUFFLE [RS_137] PartitionCols:_col0 - Select Operator [SEL_84] (rows=57591150 width=77) + Select Operator [SEL_135] (rows=57591150 width=77) Output:["_col0","_col1","_col2","_col3"] - Filter Operator [FIL_82] (rows=57591150 width=77) + Filter Operator [FIL_133] (rows=57591150 width=77) predicate:(sr_customer_sk is not null and sr_returned_date_sk is not null and sr_store_sk is not null) TableScan [TS_0] (rows=57591150 width=77) default@store_returns,store_returns,Tbl:COMPLETE,Col:NONE,Output:["sr_returned_date_sk","sr_customer_sk","sr_store_sk","sr_fee"] <-Map 10 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_90] + SHUFFLE [RS_141] PartitionCols:_col0 - Select Operator [SEL_89] (rows=36524 width=1119) + Select Operator [SEL_140] (rows=36524 width=1119) Output:["_col0"] - Filter Operator [FIL_88] (rows=36524 width=1119) + Filter Operator [FIL_139] (rows=36524 width=1119) predicate:((d_year = 2000) and d_date_sk is not null) TableScan [TS_3] (rows=73049 width=1119) default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] <-Reducer 9 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_105] + SHUFFLE [RS_156] PartitionCols:_col1 - Select Operator [SEL_104] (rows=15837566 width=77) + Select Operator [SEL_155] (rows=15837566 width=77) Output:["_col0","_col1"] - Group By Operator [GBY_103] (rows=15837566 width=77) + Group By Operator [GBY_154] (rows=15837566 width=77) Output:["_col0","_col1","_col2"],aggregations:["sum(_col2)","count(_col2)"],keys:_col1 - Select Operator [SEL_102] (rows=31675133 width=77) + Select Operator [SEL_153] (rows=31675133 width=77) Output:["_col1","_col2"] - Group By Operator [GBY_101] (rows=31675133 width=77) + Group By Operator [GBY_152] (rows=31675133 width=77) Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1 <-Reducer 8 [SIMPLE_EDGE] SHUFFLE [RS_31] PartitionCols:_col0 Group By Operator [GBY_30] (rows=63350266 width=77) Output:["_col0","_col1","_col2"],aggregations:["sum(_col3)"],keys:_col2, _col1 - Merge Join Operator [MERGEJOIN_80] (rows=63350266 width=77) - Conds:RS_87._col0=RS_91._col0(Inner),Output:["_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_131] (rows=63350266 width=77) + Conds:RS_138._col0=RS_142._col0(Inner),Output:["_col1","_col2","_col3"] <-Map 1 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_87] + SHUFFLE [RS_138] PartitionCols:_col0 - Select Operator [SEL_85] (rows=57591150 width=77) + Select Operator [SEL_136] (rows=57591150 width=77) Output:["_col0","_col1","_col2","_col3"] - Filter Operator [FIL_83] (rows=57591150 width=77) + Filter Operator [FIL_134] (rows=57591150 width=77) predicate:(sr_returned_date_sk is not null and sr_store_sk is not null) Please refer to the previous TableScan [TS_0] <-Map 10 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_91] + SHUFFLE [RS_142] PartitionCols:_col0 - Please refer to the previous Select Operator [SEL_89] + Please refer to the previous Select Operator [SEL_140] http://git-wip-us.apache.org/repos/asf/hive/blob/f2c4f319/ql/src/test/results/clientpositive/perf/tez/query10.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/perf/tez/query10.q.out b/ql/src/test/results/clientpositive/perf/tez/query10.q.out index a88b7e1..1b6adee 100644 --- a/ql/src/test/results/clientpositive/perf/tez/query10.q.out +++ b/ql/src/test/results/clientpositive/perf/tez/query10.q.out @@ -117,32 +117,39 @@ POSTHOOK: type: QUERY Plan optimized by CBO. Vertex dependency in root stage -Reducer 10 <- Map 11 (SIMPLE_EDGE), Map 9 (SIMPLE_EDGE) -Reducer 12 <- Map 11 (SIMPLE_EDGE), Map 16 (SIMPLE_EDGE) -Reducer 13 <- Reducer 12 (SIMPLE_EDGE) -Reducer 14 <- Map 11 (SIMPLE_EDGE), Map 17 (SIMPLE_EDGE) +Map 10 <- Reducer 13 (BROADCAST_EDGE), Reducer 7 (BROADCAST_EDGE) +Map 20 <- Reducer 16 (BROADCAST_EDGE) +Map 21 <- Reducer 19 (BROADCAST_EDGE) +Reducer 11 <- Map 10 (SIMPLE_EDGE), Map 12 (SIMPLE_EDGE) +Reducer 13 <- Map 12 (CUSTOM_SIMPLE_EDGE) +Reducer 14 <- Map 12 (SIMPLE_EDGE), Map 20 (SIMPLE_EDGE) Reducer 15 <- Reducer 14 (SIMPLE_EDGE) -Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 7 (SIMPLE_EDGE) -Reducer 3 <- Map 8 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) -Reducer 4 <- Reducer 10 (SIMPLE_EDGE), Reducer 13 (ONE_TO_ONE_EDGE), Reducer 15 (ONE_TO_ONE_EDGE), Reducer 3 (SIMPLE_EDGE) +Reducer 16 <- Map 12 (CUSTOM_SIMPLE_EDGE) +Reducer 17 <- Map 12 (SIMPLE_EDGE), Map 21 (SIMPLE_EDGE) +Reducer 18 <- Reducer 17 (SIMPLE_EDGE) +Reducer 19 <- Map 12 (CUSTOM_SIMPLE_EDGE) +Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 8 (SIMPLE_EDGE) +Reducer 3 <- Map 9 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) +Reducer 4 <- Reducer 11 (SIMPLE_EDGE), Reducer 15 (ONE_TO_ONE_EDGE), Reducer 18 (ONE_TO_ONE_EDGE), Reducer 3 (SIMPLE_EDGE) Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Reducer 6 <- Reducer 5 (SIMPLE_EDGE) +Reducer 7 <- Reducer 3 (CUSTOM_SIMPLE_EDGE) Stage-0 Fetch Operator limit:100 Stage-1 Reducer 6 vectorized - File Output Operator [FS_143] - Limit [LIM_142] (rows=100 width=88) + File Output Operator [FS_224] + Limit [LIM_223] (rows=100 width=88) Number of rows:100 - Select Operator [SEL_141] (rows=1045432122 width=88) + Select Operator [SEL_222] (rows=1045432122 width=88) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13"] <-Reducer 5 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_140] - Select Operator [SEL_139] (rows=1045432122 width=88) + SHUFFLE [RS_221] + Select Operator [SEL_220] (rows=1045432122 width=88) Output:["_col0","_col1","_col2","_col3","_col4","_col6","_col8","_col10","_col12"] - Group By Operator [GBY_138] (rows=1045432122 width=88) + Group By Operator [GBY_219] (rows=1045432122 width=88) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"],aggregations:["count(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4, KEY._col5, KEY._col6, KEY._col7 <-Reducer 4 [SIMPLE_EDGE] SHUFFLE [RS_63] @@ -153,124 +160,168 @@ Stage-0 Output:["_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13"] Filter Operator [FIL_60] (rows=2090864244 width=88) predicate:(_col15 is not null or _col17 is not null) - Merge Join Operator [MERGEJOIN_108] (rows=2090864244 width=88) - Conds:RS_55._col0=RS_56._col0(Left Semi),RS_55._col0=RS_131._col0(Left Outer),RS_55._col0=RS_137._col0(Left Outer),Output:["_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col15","_col17"] - <-Reducer 10 [SIMPLE_EDGE] + Merge Join Operator [MERGEJOIN_172] (rows=2090864244 width=88) + Conds:RS_55._col0=RS_56._col0(Left Semi),RS_55._col0=RS_210._col0(Left Outer),RS_55._col0=RS_218._col0(Left Outer),Output:["_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col15","_col17"] + <-Reducer 3 [SIMPLE_EDGE] + PARTITION_ONLY_SHUFFLE [RS_55] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_168] (rows=96800003 width=860) + Conds:RS_50._col1=RS_181._col0(Inner),Output:["_col0","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13"] + <-Map 9 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_181] + PartitionCols:_col0 + Select Operator [SEL_180] (rows=1861800 width=385) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] + Filter Operator [FIL_179] (rows=1861800 width=385) + predicate:cd_demo_sk is not null + TableScan [TS_6] (rows=1861800 width=385) + default@customer_demographics,customer_demographics,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_gender","cd_marital_status","cd_education_status","cd_purchase_estimate","cd_credit_rating","cd_dep_count","cd_dep_employed_count","cd_dep_college_count"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_50] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_167] (rows=88000001 width=860) + Conds:RS_175._col2=RS_178._col0(Inner),Output:["_col0","_col1"] + <-Map 1 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_175] + PartitionCols:_col2 + Select Operator [SEL_174] (rows=80000000 width=860) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_173] (rows=80000000 width=860) + predicate:(c_current_addr_sk is not null and c_current_cdemo_sk is not null and c_customer_sk is not null) + TableScan [TS_0] (rows=80000000 width=860) + default@customer,c,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_current_cdemo_sk","c_current_addr_sk"] + <-Map 8 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_178] + PartitionCols:_col0 + Select Operator [SEL_177] (rows=20000000 width=1014) + Output:["_col0"] + Filter Operator [FIL_176] (rows=20000000 width=1014) + predicate:((ca_county) IN ('Walker County', 'Richland County', 'Gaines County', 'Douglas County', 'Dona Ana County') and ca_address_sk is not null) + TableScan [TS_3] (rows=40000000 width=1014) + default@customer_address,ca,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_county"] + <-Reducer 11 [SIMPLE_EDGE] SHUFFLE [RS_56] PartitionCols:_col0 Group By Operator [GBY_54] (rows=633595212 width=88) Output:["_col0"],keys:_col0 Select Operator [SEL_18] (rows=633595212 width=88) Output:["_col0"] - Merge Join Operator [MERGEJOIN_105] (rows=633595212 width=88) - Conds:RS_120._col0=RS_123._col0(Inner),Output:["_col1"] - <-Map 11 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_123] + Merge Join Operator [MERGEJOIN_169] (rows=633595212 width=88) + Conds:RS_202._col0=RS_184._col0(Inner),Output:["_col1"] + <-Map 12 [SIMPLE_EDGE] vectorized + PARTITION_ONLY_SHUFFLE [RS_184] PartitionCols:_col0 - Select Operator [SEL_122] (rows=4058 width=1119) + Select Operator [SEL_183] (rows=4058 width=1119) Output:["_col0"] - Filter Operator [FIL_121] (rows=4058 width=1119) + Filter Operator [FIL_182] (rows=4058 width=1119) predicate:((d_year = 2002) and d_date_sk is not null and d_moy BETWEEN 4 AND 7) TableScan [TS_12] (rows=73049 width=1119) default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] - <-Map 9 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_120] + <-Map 10 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_202] PartitionCols:_col0 - Select Operator [SEL_119] (rows=575995635 width=88) + Select Operator [SEL_201] (rows=575995635 width=88) Output:["_col0","_col1"] - Filter Operator [FIL_118] (rows=575995635 width=88) - predicate:(ss_customer_sk is not null and ss_sold_date_sk is not null) + Filter Operator [FIL_200] (rows=575995635 width=88) + predicate:((ss_customer_sk BETWEEN DynamicValue(RS_55_c_c_customer_sk_min) AND DynamicValue(RS_55_c_c_customer_sk_max) and in_bloom_filter(ss_customer_sk, DynamicValue(RS_55_c_c_customer_sk_bloom_filter))) and (ss_sold_date_sk BETWEEN DynamicValue(RS_16_date_dim_d_date_sk_min) AND DynamicValue(RS_16_date_dim_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk, DynamicValue(RS_16_date_dim_d_date_sk_bloom_filter))) and ss_customer_sk is not null and ss_sold_date_sk is not null) TableScan [TS_9] (rows=575995635 width=88) default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_customer_sk"] - <-Reducer 13 [ONE_TO_ONE_EDGE] vectorized - FORWARD [RS_131] + <-Reducer 13 [BROADCAST_EDGE] vectorized + BROADCAST [RS_197] + Group By Operator [GBY_196] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 12 [CUSTOM_SIMPLE_EDGE] vectorized + PARTITION_ONLY_SHUFFLE [RS_193] + Group By Operator [GBY_190] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_185] (rows=4058 width=1119) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_183] + <-Reducer 7 [BROADCAST_EDGE] vectorized + BROADCAST [RS_199] + Group By Operator [GBY_198] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=96800000)"] + <-Reducer 3 [CUSTOM_SIMPLE_EDGE] + PARTITION_ONLY_SHUFFLE [RS_135] + Group By Operator [GBY_134] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=96800000)"] + Select Operator [SEL_133] (rows=96800003 width=860) + Output:["_col0"] + Please refer to the previous Merge Join Operator [MERGEJOIN_168] + <-Reducer 15 [ONE_TO_ONE_EDGE] vectorized + FORWARD [RS_210] PartitionCols:_col0 - Select Operator [SEL_130] (rows=79201469 width=135) + Select Operator [SEL_209] (rows=79201469 width=135) Output:["_col0","_col1"] - Group By Operator [GBY_129] (rows=79201469 width=135) + Group By Operator [GBY_208] (rows=79201469 width=135) Output:["_col0"],keys:KEY._col0 - <-Reducer 12 [SIMPLE_EDGE] + <-Reducer 14 [SIMPLE_EDGE] SHUFFLE [RS_30] PartitionCols:_col0 Group By Operator [GBY_29] (rows=158402938 width=135) Output:["_col0"],keys:_col1 - Merge Join Operator [MERGEJOIN_106] (rows=158402938 width=135) - Conds:RS_128._col0=RS_124._col0(Inner),Output:["_col1"] - <-Map 11 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_124] + Merge Join Operator [MERGEJOIN_170] (rows=158402938 width=135) + Conds:RS_207._col0=RS_186._col0(Inner),Output:["_col1"] + <-Map 12 [SIMPLE_EDGE] vectorized + PARTITION_ONLY_SHUFFLE [RS_186] PartitionCols:_col0 - Please refer to the previous Select Operator [SEL_122] - <-Map 16 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_128] + Please refer to the previous Select Operator [SEL_183] + <-Map 20 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_207] PartitionCols:_col0 - Select Operator [SEL_127] (rows=144002668 width=135) + Select Operator [SEL_206] (rows=144002668 width=135) Output:["_col0","_col1"] - Filter Operator [FIL_126] (rows=144002668 width=135) - predicate:(ws_bill_customer_sk is not null and ws_sold_date_sk is not null) + Filter Operator [FIL_205] (rows=144002668 width=135) + predicate:((ws_sold_date_sk BETWEEN DynamicValue(RS_26_date_dim_d_date_sk_min) AND DynamicValue(RS_26_date_dim_d_date_sk_max) and in_bloom_filter(ws_sold_date_sk, DynamicValue(RS_26_date_dim_d_date_sk_bloom_filter))) and ws_bill_customer_sk is not null and ws_sold_date_sk is not null) TableScan [TS_19] (rows=144002668 width=135) default@web_sales,web_sales,Tbl:COMPLETE,Col:NONE,Output:["ws_sold_date_sk","ws_bill_customer_sk"] - <-Reducer 15 [ONE_TO_ONE_EDGE] vectorized - FORWARD [RS_137] + <-Reducer 16 [BROADCAST_EDGE] vectorized + BROADCAST [RS_204] + Group By Operator [GBY_203] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 12 [CUSTOM_SIMPLE_EDGE] vectorized + PARTITION_ONLY_SHUFFLE [RS_194] + Group By Operator [GBY_191] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_187] (rows=4058 width=1119) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_183] + <-Reducer 18 [ONE_TO_ONE_EDGE] vectorized + FORWARD [RS_218] PartitionCols:_col0 - Select Operator [SEL_136] (rows=158394413 width=135) + Select Operator [SEL_217] (rows=158394413 width=135) Output:["_col0","_col1"] - Group By Operator [GBY_135] (rows=158394413 width=135) + Group By Operator [GBY_216] (rows=158394413 width=135) Output:["_col0"],keys:KEY._col0 - <-Reducer 14 [SIMPLE_EDGE] + <-Reducer 17 [SIMPLE_EDGE] SHUFFLE [RS_44] PartitionCols:_col0 Group By Operator [GBY_43] (rows=316788826 width=135) Output:["_col0"],keys:_col1 - Merge Join Operator [MERGEJOIN_107] (rows=316788826 width=135) - Conds:RS_134._col0=RS_125._col0(Inner),Output:["_col1"] - <-Map 11 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_125] + Merge Join Operator [MERGEJOIN_171] (rows=316788826 width=135) + Conds:RS_215._col0=RS_188._col0(Inner),Output:["_col1"] + <-Map 12 [SIMPLE_EDGE] vectorized + PARTITION_ONLY_SHUFFLE [RS_188] PartitionCols:_col0 - Please refer to the previous Select Operator [SEL_122] - <-Map 17 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_134] + Please refer to the previous Select Operator [SEL_183] + <-Map 21 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_215] PartitionCols:_col0 - Select Operator [SEL_133] (rows=287989836 width=135) + Select Operator [SEL_214] (rows=287989836 width=135) Output:["_col0","_col1"] - Filter Operator [FIL_132] (rows=287989836 width=135) - predicate:(cs_ship_customer_sk is not null and cs_sold_date_sk is not null) + Filter Operator [FIL_213] (rows=287989836 width=135) + predicate:((cs_sold_date_sk BETWEEN DynamicValue(RS_40_date_dim_d_date_sk_min) AND DynamicValue(RS_40_date_dim_d_date_sk_max) and in_bloom_filter(cs_sold_date_sk, DynamicValue(RS_40_date_dim_d_date_sk_bloom_filter))) and cs_ship_customer_sk is not null and cs_sold_date_sk is not null) TableScan [TS_33] (rows=287989836 width=135) default@catalog_sales,catalog_sales,Tbl:COMPLETE,Col:NONE,Output:["cs_sold_date_sk","cs_ship_customer_sk"] - <-Reducer 3 [SIMPLE_EDGE] - SHUFFLE [RS_55] - PartitionCols:_col0 - Merge Join Operator [MERGEJOIN_104] (rows=96800003 width=860) - Conds:RS_50._col1=RS_117._col0(Inner),Output:["_col0","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13"] - <-Map 8 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_117] - PartitionCols:_col0 - Select Operator [SEL_116] (rows=1861800 width=385) - Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] - Filter Operator [FIL_115] (rows=1861800 width=385) - predicate:cd_demo_sk is not null - TableScan [TS_6] (rows=1861800 width=385) - default@customer_demographics,customer_demographics,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_gender","cd_marital_status","cd_education_status","cd_purchase_estimate","cd_credit_rating","cd_dep_count","cd_dep_employed_count","cd_dep_college_count"] - <-Reducer 2 [SIMPLE_EDGE] - SHUFFLE [RS_50] - PartitionCols:_col1 - Merge Join Operator [MERGEJOIN_103] (rows=88000001 width=860) - Conds:RS_111._col2=RS_114._col0(Inner),Output:["_col0","_col1"] - <-Map 1 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_111] - PartitionCols:_col2 - Select Operator [SEL_110] (rows=80000000 width=860) - Output:["_col0","_col1","_col2"] - Filter Operator [FIL_109] (rows=80000000 width=860) - predicate:(c_current_addr_sk is not null and c_current_cdemo_sk is not null and c_customer_sk is not null) - TableScan [TS_0] (rows=80000000 width=860) - default@customer,c,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_current_cdemo_sk","c_current_addr_sk"] - <-Map 7 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_114] - PartitionCols:_col0 - Select Operator [SEL_113] (rows=20000000 width=1014) - Output:["_col0"] - Filter Operator [FIL_112] (rows=20000000 width=1014) - predicate:((ca_county) IN ('Walker County', 'Richland County', 'Gaines County', 'Douglas County', 'Dona Ana County') and ca_address_sk is not null) - TableScan [TS_3] (rows=40000000 width=1014) - default@customer_address,ca,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_county"] + <-Reducer 19 [BROADCAST_EDGE] vectorized + BROADCAST [RS_212] + Group By Operator [GBY_211] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 12 [CUSTOM_SIMPLE_EDGE] vectorized + PARTITION_ONLY_SHUFFLE [RS_195] + Group By Operator [GBY_192] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_189] (rows=4058 width=1119) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_183] http://git-wip-us.apache.org/repos/asf/hive/blob/f2c4f319/ql/src/test/results/clientpositive/perf/tez/query11.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/perf/tez/query11.q.out b/ql/src/test/results/clientpositive/perf/tez/query11.q.out index 2599621..bf454a0 100644 --- a/ql/src/test/results/clientpositive/perf/tez/query11.q.out +++ b/ql/src/test/results/clientpositive/perf/tez/query11.q.out @@ -149,30 +149,40 @@ POSTHOOK: type: QUERY Plan optimized by CBO. Vertex dependency in root stage -Reducer 11 <- Map 10 (SIMPLE_EDGE), Map 17 (SIMPLE_EDGE) -Reducer 12 <- Map 18 (SIMPLE_EDGE), Reducer 11 (SIMPLE_EDGE) -Reducer 13 <- Reducer 12 (SIMPLE_EDGE) -Reducer 14 <- Map 10 (SIMPLE_EDGE), Map 17 (SIMPLE_EDGE) -Reducer 15 <- Map 18 (SIMPLE_EDGE), Reducer 14 (SIMPLE_EDGE) -Reducer 16 <- Reducer 15 (SIMPLE_EDGE) -Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 17 (SIMPLE_EDGE) -Reducer 3 <- Map 18 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) +Map 1 <- Reducer 17 (BROADCAST_EDGE) +Map 11 <- Reducer 16 (BROADCAST_EDGE), Reducer 24 (BROADCAST_EDGE) +Map 26 <- Reducer 22 (BROADCAST_EDGE) +Map 7 <- Reducer 18 (BROADCAST_EDGE), Reducer 25 (BROADCAST_EDGE) +Reducer 10 <- Reducer 9 (SIMPLE_EDGE) +Reducer 12 <- Map 11 (SIMPLE_EDGE), Map 15 (SIMPLE_EDGE) +Reducer 13 <- Map 23 (SIMPLE_EDGE), Reducer 12 (SIMPLE_EDGE) +Reducer 14 <- Reducer 13 (SIMPLE_EDGE) +Reducer 16 <- Map 15 (CUSTOM_SIMPLE_EDGE) +Reducer 17 <- Map 15 (CUSTOM_SIMPLE_EDGE) +Reducer 18 <- Map 15 (CUSTOM_SIMPLE_EDGE) +Reducer 19 <- Map 15 (SIMPLE_EDGE), Map 26 (SIMPLE_EDGE) +Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 15 (SIMPLE_EDGE) +Reducer 20 <- Map 23 (SIMPLE_EDGE), Reducer 19 (SIMPLE_EDGE) +Reducer 21 <- Reducer 20 (SIMPLE_EDGE) +Reducer 22 <- Map 15 (CUSTOM_SIMPLE_EDGE) +Reducer 24 <- Map 23 (CUSTOM_SIMPLE_EDGE) +Reducer 25 <- Map 23 (CUSTOM_SIMPLE_EDGE) +Reducer 3 <- Map 23 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) Reducer 4 <- Reducer 3 (SIMPLE_EDGE) -Reducer 5 <- Reducer 13 (SIMPLE_EDGE), Reducer 16 (SIMPLE_EDGE), Reducer 4 (SIMPLE_EDGE), Reducer 9 (SIMPLE_EDGE) +Reducer 5 <- Reducer 10 (SIMPLE_EDGE), Reducer 14 (SIMPLE_EDGE), Reducer 21 (SIMPLE_EDGE), Reducer 4 (SIMPLE_EDGE) Reducer 6 <- Reducer 5 (SIMPLE_EDGE) -Reducer 7 <- Map 1 (SIMPLE_EDGE), Map 17 (SIMPLE_EDGE) -Reducer 8 <- Map 18 (SIMPLE_EDGE), Reducer 7 (SIMPLE_EDGE) -Reducer 9 <- Reducer 8 (SIMPLE_EDGE) +Reducer 8 <- Map 15 (SIMPLE_EDGE), Map 7 (SIMPLE_EDGE) +Reducer 9 <- Map 23 (SIMPLE_EDGE), Reducer 8 (SIMPLE_EDGE) Stage-0 Fetch Operator limit:100 Stage-1 Reducer 6 vectorized - File Output Operator [FS_218] - Limit [LIM_217] (rows=100 width=88) + File Output Operator [FS_360] + Limit [LIM_359] (rows=100 width=88) Number of rows:100 - Select Operator [SEL_216] (rows=383325119 width=88) + Select Operator [SEL_358] (rows=383325119 width=88) Output:["_col0"] <-Reducer 5 [SIMPLE_EDGE] SHUFFLE [RS_93] @@ -180,103 +190,209 @@ Stage-0 Output:["_col0"] Filter Operator [FIL_91] (rows=383325119 width=88) predicate:((_col1 / _col8) > (_col6 / _col3)) - Merge Join Operator [MERGEJOIN_175] (rows=1149975359 width=88) - Conds:RS_198._col0=RS_215._col0(Inner),RS_215._col0=RS_210._col0(Inner),RS_215._col0=RS_203._col0(Inner),Output:["_col1","_col3","_col5","_col6","_col8"] - <-Reducer 13 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_210] + Merge Join Operator [MERGEJOIN_283] (rows=1149975359 width=88) + Conds:RS_325._col0=RS_337._col0(Inner),RS_337._col0=RS_347._col0(Inner),RS_337._col0=RS_357._col0(Inner),Output:["_col1","_col3","_col5","_col6","_col8"] + <-Reducer 10 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_337] PartitionCols:_col0 - Select Operator [SEL_209] (rows=348477374 width=88) + Select Operator [SEL_336] (rows=116159124 width=88) + Output:["_col0","_col1"] + Filter Operator [FIL_335] (rows=116159124 width=88) + predicate:(_col7 > 0) + Select Operator [SEL_334] (rows=348477374 width=88) + Output:["_col0","_col7"] + Group By Operator [GBY_333] (rows=348477374 width=88) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4, KEY._col5, KEY._col6 + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_39] + PartitionCols:_col0, _col1, _col2, _col3, _col4, _col5, _col6 + Group By Operator [GBY_38] (rows=696954748 width=88) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"],aggregations:["sum(_col7)"],keys:_col0, _col1, _col2, _col3, _col4, _col5, _col6 + Select Operator [SEL_36] (rows=696954748 width=88) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] + Merge Join Operator [MERGEJOIN_278] (rows=696954748 width=88) + Conds:RS_33._col1=RS_316._col0(Inner),Output:["_col2","_col3","_col7","_col8","_col9","_col10","_col11","_col12","_col13"] + <-Map 23 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_316] + PartitionCols:_col0 + Select Operator [SEL_312] (rows=80000000 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] + Filter Operator [FIL_311] (rows=80000000 width=860) + predicate:(c_customer_id is not null and c_customer_sk is not null) + TableScan [TS_49] (rows=80000000 width=860) + default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_customer_id","c_first_name","c_last_name","c_preferred_cust_flag","c_birth_country","c_login","c_email_address"] + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_33] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_277] (rows=633595212 width=88) + Conds:RS_332._col0=RS_294._col0(Inner),Output:["_col1","_col2","_col3"] + <-Map 15 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_294] + PartitionCols:_col0 + Select Operator [SEL_288] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_285] (rows=36524 width=1119) + predicate:((d_year = 2001) and d_date_sk is not null) + TableScan [TS_46] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] + <-Map 7 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_332] + PartitionCols:_col0 + Select Operator [SEL_331] (rows=575995635 width=88) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_330] (rows=575995635 width=88) + predicate:((ss_customer_sk BETWEEN DynamicValue(RS_34_customer_c_customer_sk_min) AND DynamicValue(RS_34_customer_c_customer_sk_max) and in_bloom_filter(ss_customer_sk, DynamicValue(RS_34_customer_c_customer_sk_bloom_filter))) and (ss_sold_date_sk BETWEEN DynamicValue(RS_31_date_dim_d_date_sk_min) AND DynamicValue(RS_31_date_dim_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk, DynamicValue(RS_31_date_dim_d_date_sk_bloom_filter))) and ss_customer_sk is not null and ss_sold_date_sk is not null) + TableScan [TS_21] (rows=575995635 width=88) + default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_customer_sk","ss_ext_discount_amt","ss_ext_list_price"] + <-Reducer 18 [BROADCAST_EDGE] vectorized + BROADCAST [RS_327] + Group By Operator [GBY_326] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 15 [CUSTOM_SIMPLE_EDGE] vectorized + SHUFFLE [RS_304] + Group By Operator [GBY_300] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_295] (rows=36524 width=1119) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_288] + <-Reducer 25 [BROADCAST_EDGE] vectorized + BROADCAST [RS_329] + Group By Operator [GBY_328] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=80000000)"] + <-Map 23 [CUSTOM_SIMPLE_EDGE] vectorized + SHUFFLE [RS_322] + Group By Operator [GBY_320] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=80000000)"] + Select Operator [SEL_317] (rows=80000000 width=860) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_312] + <-Reducer 14 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_347] + PartitionCols:_col0 + Select Operator [SEL_346] (rows=348477374 width=88) Output:["_col0","_col1","_col2"] - Group By Operator [GBY_208] (rows=348477374 width=88) + Group By Operator [GBY_345] (rows=348477374 width=88) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4, KEY._col5, KEY._col6 - <-Reducer 12 [SIMPLE_EDGE] + <-Reducer 13 [SIMPLE_EDGE] SHUFFLE [RS_61] PartitionCols:_col0, _col1, _col2, _col3, _col4, _col5, _col6 Group By Operator [GBY_60] (rows=696954748 width=88) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"],aggregations:["sum(_col7)"],keys:_col0, _col1, _col2, _col3, _col4, _col5, _col6 Select Operator [SEL_58] (rows=696954748 width=88) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - Merge Join Operator [MERGEJOIN_172] (rows=696954748 width=88) - Conds:RS_55._col1=RS_192._col0(Inner),Output:["_col2","_col3","_col7","_col8","_col9","_col10","_col11","_col12","_col13"] - <-Map 18 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_192] + Merge Join Operator [MERGEJOIN_280] (rows=696954748 width=88) + Conds:RS_55._col1=RS_313._col0(Inner),Output:["_col2","_col3","_col7","_col8","_col9","_col10","_col11","_col12","_col13"] + <-Map 23 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_313] PartitionCols:_col0 - Select Operator [SEL_191] (rows=80000000 width=860) - Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - Filter Operator [FIL_190] (rows=80000000 width=860) - predicate:(c_customer_id is not null and c_customer_sk is not null) - TableScan [TS_49] (rows=80000000 width=860) - default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_customer_id","c_first_name","c_last_name","c_preferred_cust_flag","c_birth_country","c_login","c_email_address"] - <-Reducer 11 [SIMPLE_EDGE] + Please refer to the previous Select Operator [SEL_312] + <-Reducer 12 [SIMPLE_EDGE] SHUFFLE [RS_55] PartitionCols:_col1 - Merge Join Operator [MERGEJOIN_171] (rows=633595212 width=88) - Conds:RS_206._col0=RS_186._col0(Inner),Output:["_col1","_col2","_col3"] - <-Map 17 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_186] + Merge Join Operator [MERGEJOIN_279] (rows=633595212 width=88) + Conds:RS_344._col0=RS_290._col0(Inner),Output:["_col1","_col2","_col3"] + <-Map 15 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_290] PartitionCols:_col0 - Select Operator [SEL_183] (rows=36524 width=1119) + Select Operator [SEL_287] (rows=36524 width=1119) Output:["_col0"] - Filter Operator [FIL_180] (rows=36524 width=1119) + Filter Operator [FIL_284] (rows=36524 width=1119) predicate:((d_year = 2002) and d_date_sk is not null) - TableScan [TS_46] (rows=73049 width=1119) - default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] - <-Map 10 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_206] + Please refer to the previous TableScan [TS_46] + <-Map 11 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_344] PartitionCols:_col0 - Select Operator [SEL_205] (rows=575995635 width=88) + Select Operator [SEL_343] (rows=575995635 width=88) Output:["_col0","_col1","_col2","_col3"] - Filter Operator [FIL_204] (rows=575995635 width=88) - predicate:(ss_customer_sk is not null and ss_sold_date_sk is not null) + Filter Operator [FIL_342] (rows=575995635 width=88) + predicate:((ss_customer_sk BETWEEN DynamicValue(RS_56_customer_c_customer_sk_min) AND DynamicValue(RS_56_customer_c_customer_sk_max) and in_bloom_filter(ss_customer_sk, DynamicValue(RS_56_customer_c_customer_sk_bloom_filter))) and (ss_sold_date_sk BETWEEN DynamicValue(RS_53_date_dim_d_date_sk_min) AND DynamicValue(RS_53_date_dim_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk, DynamicValue(RS_53_date_dim_d_date_sk_bloom_filter))) and ss_customer_sk is not null and ss_sold_date_sk is not null) TableScan [TS_43] (rows=575995635 width=88) default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_customer_sk","ss_ext_discount_amt","ss_ext_list_price"] - <-Reducer 16 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_215] + <-Reducer 16 [BROADCAST_EDGE] vectorized + BROADCAST [RS_339] + Group By Operator [GBY_338] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 15 [CUSTOM_SIMPLE_EDGE] vectorized + SHUFFLE [RS_302] + Group By Operator [GBY_298] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_291] (rows=36524 width=1119) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_287] + <-Reducer 24 [BROADCAST_EDGE] vectorized + BROADCAST [RS_341] + Group By Operator [GBY_340] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=80000000)"] + <-Map 23 [CUSTOM_SIMPLE_EDGE] vectorized + SHUFFLE [RS_321] + Group By Operator [GBY_319] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=80000000)"] + Select Operator [SEL_314] (rows=80000000 width=860) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_312] + <-Reducer 21 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_357] PartitionCols:_col0 - Select Operator [SEL_214] (rows=116159124 width=88) + Select Operator [SEL_356] (rows=29040539 width=135) Output:["_col0","_col1"] - Filter Operator [FIL_213] (rows=116159124 width=88) + Filter Operator [FIL_355] (rows=29040539 width=135) predicate:(_col7 > 0) - Select Operator [SEL_212] (rows=348477374 width=88) + Select Operator [SEL_354] (rows=87121617 width=135) Output:["_col0","_col7"] - Group By Operator [GBY_211] (rows=348477374 width=88) + Group By Operator [GBY_353] (rows=87121617 width=135) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4, KEY._col5, KEY._col6 - <-Reducer 15 [SIMPLE_EDGE] - SHUFFLE [RS_39] + <-Reducer 20 [SIMPLE_EDGE] + SHUFFLE [RS_82] PartitionCols:_col0, _col1, _col2, _col3, _col4, _col5, _col6 - Group By Operator [GBY_38] (rows=696954748 width=88) + Group By Operator [GBY_81] (rows=174243235 width=135) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"],aggregations:["sum(_col7)"],keys:_col0, _col1, _col2, _col3, _col4, _col5, _col6 - Select Operator [SEL_36] (rows=696954748 width=88) + Select Operator [SEL_79] (rows=174243235 width=135) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - Merge Join Operator [MERGEJOIN_170] (rows=696954748 width=88) - Conds:RS_33._col1=RS_194._col0(Inner),Output:["_col2","_col3","_col7","_col8","_col9","_col10","_col11","_col12","_col13"] - <-Map 18 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_194] + Merge Join Operator [MERGEJOIN_282] (rows=174243235 width=135) + Conds:RS_76._col1=RS_318._col0(Inner),Output:["_col2","_col3","_col7","_col8","_col9","_col10","_col11","_col12","_col13"] + <-Map 23 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_318] PartitionCols:_col0 - Please refer to the previous Select Operator [SEL_191] - <-Reducer 14 [SIMPLE_EDGE] - SHUFFLE [RS_33] + Please refer to the previous Select Operator [SEL_312] + <-Reducer 19 [SIMPLE_EDGE] + SHUFFLE [RS_76] PartitionCols:_col1 - Merge Join Operator [MERGEJOIN_169] (rows=633595212 width=88) - Conds:RS_207._col0=RS_188._col0(Inner),Output:["_col1","_col2","_col3"] - <-Map 17 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_188] + Merge Join Operator [MERGEJOIN_281] (rows=158402938 width=135) + Conds:RS_352._col0=RS_296._col0(Inner),Output:["_col1","_col2","_col3"] + <-Map 15 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_296] PartitionCols:_col0 - Select Operator [SEL_184] (rows=36524 width=1119) + Select Operator [SEL_289] (rows=36524 width=1119) Output:["_col0"] - Filter Operator [FIL_181] (rows=36524 width=1119) + Filter Operator [FIL_286] (rows=36524 width=1119) predicate:((d_year = 2001) and d_date_sk is not null) Please refer to the previous TableScan [TS_46] - <-Map 10 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_207] + <-Map 26 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_352] PartitionCols:_col0 - Please refer to the previous Select Operator [SEL_205] + Select Operator [SEL_351] (rows=144002668 width=135) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_350] (rows=144002668 width=135) + predicate:((ws_sold_date_sk BETWEEN DynamicValue(RS_74_date_dim_d_date_sk_min) AND DynamicValue(RS_74_date_dim_d_date_sk_max) and in_bloom_filter(ws_sold_date_sk, DynamicValue(RS_74_date_dim_d_date_sk_bloom_filter))) and ws_bill_customer_sk is not null and ws_sold_date_sk is not null) + TableScan [TS_64] (rows=144002668 width=135) + default@web_sales,web_sales,Tbl:COMPLETE,Col:NONE,Output:["ws_sold_date_sk","ws_bill_customer_sk","ws_ext_discount_amt","ws_ext_list_price"] + <-Reducer 22 [BROADCAST_EDGE] vectorized + BROADCAST [RS_349] + Group By Operator [GBY_348] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 15 [CUSTOM_SIMPLE_EDGE] vectorized + SHUFFLE [RS_305] + Group By Operator [GBY_301] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_297] (rows=36524 width=1119) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_289] <-Reducer 4 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_198] + SHUFFLE [RS_325] PartitionCols:_col0 - Select Operator [SEL_197] (rows=87121617 width=135) + Select Operator [SEL_324] (rows=87121617 width=135) Output:["_col0","_col1"] - Group By Operator [GBY_196] (rows=87121617 width=135) + Group By Operator [GBY_323] (rows=87121617 width=135) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4, KEY._col5, KEY._col6 <-Reducer 3 [SIMPLE_EDGE] SHUFFLE [RS_18] @@ -285,69 +401,39 @@ Stage-0 Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"],aggregations:["sum(_col7)"],keys:_col0, _col1, _col2, _col3, _col4, _col5, _col6 Select Operator [SEL_15] (rows=174243235 width=135) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - Merge Join Operator [MERGEJOIN_168] (rows=174243235 width=135) - Conds:RS_12._col1=RS_193._col0(Inner),Output:["_col2","_col3","_col7","_col8","_col9","_col10","_col11","_col12","_col13"] - <-Map 18 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_193] + Merge Join Operator [MERGEJOIN_276] (rows=174243235 width=135) + Conds:RS_12._col1=RS_315._col0(Inner),Output:["_col2","_col3","_col7","_col8","_col9","_col10","_col11","_col12","_col13"] + <-Map 23 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_315] PartitionCols:_col0 - Please refer to the previous Select Operator [SEL_191] + Please refer to the previous Select Operator [SEL_312] <-Reducer 2 [SIMPLE_EDGE] SHUFFLE [RS_12] PartitionCols:_col1 - Merge Join Operator [MERGEJOIN_167] (rows=158402938 width=135) - Conds:RS_178._col0=RS_187._col0(Inner),Output:["_col1","_col2","_col3"] - <-Map 17 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_187] + Merge Join Operator [MERGEJOIN_275] (rows=158402938 width=135) + Conds:RS_310._col0=RS_292._col0(Inner),Output:["_col1","_col2","_col3"] + <-Map 15 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_292] PartitionCols:_col0 - Please refer to the previous Select Operator [SEL_183] + Please refer to the previous Select Operator [SEL_287] <-Map 1 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_178] + SHUFFLE [RS_310] PartitionCols:_col0 - Select Operator [SEL_177] (rows=144002668 width=135) + Select Operator [SEL_309] (rows=144002668 width=135) Output:["_col0","_col1","_col2","_col3"] - Filter Operator [FIL_176] (rows=144002668 width=135) - predicate:(ws_bill_customer_sk is not null and ws_sold_date_sk is not null) + Filter Operator [FIL_308] (rows=144002668 width=135) + predicate:((ws_sold_date_sk BETWEEN DynamicValue(RS_10_date_dim_d_date_sk_min) AND DynamicValue(RS_10_date_dim_d_date_sk_max) and in_bloom_filter(ws_sold_date_sk, DynamicValue(RS_10_date_dim_d_date_sk_bloom_filter))) and ws_bill_customer_sk is not null and ws_sold_date_sk is not null) TableScan [TS_0] (rows=144002668 width=135) default@web_sales,web_sales,Tbl:COMPLETE,Col:NONE,Output:["ws_sold_date_sk","ws_bill_customer_sk","ws_ext_discount_amt","ws_ext_list_price"] - <-Reducer 9 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_203] - PartitionCols:_col0 - Select Operator [SEL_202] (rows=29040539 width=135) - Output:["_col0","_col1"] - Filter Operator [FIL_201] (rows=29040539 width=135) - predicate:(_col7 > 0) - Select Operator [SEL_200] (rows=87121617 width=135) - Output:["_col0","_col7"] - Group By Operator [GBY_199] (rows=87121617 width=135) - Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4, KEY._col5, KEY._col6 - <-Reducer 8 [SIMPLE_EDGE] - SHUFFLE [RS_82] - PartitionCols:_col0, _col1, _col2, _col3, _col4, _col5, _col6 - Group By Operator [GBY_81] (rows=174243235 width=135) - Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"],aggregations:["sum(_col7)"],keys:_col0, _col1, _col2, _col3, _col4, _col5, _col6 - Select Operator [SEL_79] (rows=174243235 width=135) - Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - Merge Join Operator [MERGEJOIN_174] (rows=174243235 width=135) - Conds:RS_76._col1=RS_195._col0(Inner),Output:["_col2","_col3","_col7","_col8","_col9","_col10","_col11","_col12","_col13"] - <-Map 18 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_195] - PartitionCols:_col0 - Please refer to the previous Select Operator [SEL_191] - <-Reducer 7 [SIMPLE_EDGE] - SHUFFLE [RS_76] - PartitionCols:_col1 - Merge Join Operator [MERGEJOIN_173] (rows=158402938 width=135) - Conds:RS_179._col0=RS_189._col0(Inner),Output:["_col1","_col2","_col3"] - <-Map 17 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_189] - PartitionCols:_col0 - Select Operator [SEL_185] (rows=36524 width=1119) - Output:["_col0"] - Filter Operator [FIL_182] (rows=36524 width=1119) - predicate:((d_year = 2001) and d_date_sk is not null) - Please refer to the previous TableScan [TS_46] - <-Map 1 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_179] - PartitionCols:_col0 - Please refer to the previous Select Operator [SEL_177] + <-Reducer 17 [BROADCAST_EDGE] vectorized + BROADCAST [RS_307] + Group By Operator [GBY_306] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 15 [CUSTOM_SIMPLE_EDGE] vectorized + SHUFFLE [RS_303] + Group By Operator [GBY_299] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_293] (rows=36524 width=1119) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_287]
