http://git-wip-us.apache.org/repos/asf/hive/blob/f2c4f319/ql/src/test/results/clientpositive/perf/tez/query48.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/perf/tez/query48.q.out b/ql/src/test/results/clientpositive/perf/tez/query48.q.out index 56eb93f..1cf8d5c 100644 --- a/ql/src/test/results/clientpositive/perf/tez/query48.q.out +++ b/ql/src/test/results/clientpositive/perf/tez/query48.q.out @@ -131,19 +131,24 @@ POSTHOOK: type: QUERY Plan optimized by CBO. Vertex dependency in root stage -Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 7 (SIMPLE_EDGE) -Reducer 3 <- Map 8 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) -Reducer 4 <- Map 9 (SIMPLE_EDGE), Reducer 3 (SIMPLE_EDGE) -Reducer 5 <- Map 10 (SIMPLE_EDGE), Reducer 4 (SIMPLE_EDGE) +Map 8 <- Reducer 10 (BROADCAST_EDGE), Reducer 12 (BROADCAST_EDGE), Reducer 14 (BROADCAST_EDGE), Reducer 7 (BROADCAST_EDGE) +Reducer 10 <- Map 9 (CUSTOM_SIMPLE_EDGE) +Reducer 12 <- Map 11 (CUSTOM_SIMPLE_EDGE) +Reducer 14 <- Map 13 (CUSTOM_SIMPLE_EDGE) +Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 8 (SIMPLE_EDGE) +Reducer 3 <- Map 9 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) +Reducer 4 <- Map 11 (SIMPLE_EDGE), Reducer 3 (SIMPLE_EDGE) +Reducer 5 <- Map 13 (SIMPLE_EDGE), Reducer 4 (SIMPLE_EDGE) Reducer 6 <- Reducer 5 (CUSTOM_SIMPLE_EDGE) +Reducer 7 <- Map 1 (CUSTOM_SIMPLE_EDGE) Stage-0 Fetch Operator limit:-1 Stage-1 Reducer 6 vectorized - File Output Operator [FS_73] - Group By Operator [GBY_72] (rows=1 width=8) + File Output Operator [FS_133] + Group By Operator [GBY_132] (rows=1 width=8) Output:["_col0"],aggregations:["sum(VALUE._col0)"] <-Reducer 5 [CUSTOM_SIMPLE_EDGE] PARTITION_ONLY_SHUFFLE [RS_30] @@ -153,66 +158,110 @@ Stage-0 Output:["_col5"] Filter Operator [FIL_27] (rows=15616947 width=88) predicate:(((_col14) IN ('KY', 'GA', 'NM') and _col7 BETWEEN 0 AND 2000) or ((_col14) IN ('MT', 'OR', 'IN') and _col7 BETWEEN 150 AND 3000) or ((_col14) IN ('WI', 'MO', 'WV') and _col7 
BETWEEN 50 AND 25000)) - Merge Join Operator [MERGEJOIN_56] (rows=93701693 width=88) - Conds:RS_24._col3=RS_71._col0(Inner),Output:["_col5","_col7","_col14"] - <-Map 10 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_71] + Merge Join Operator [MERGEJOIN_96] (rows=93701693 width=88) + Conds:RS_24._col3=RS_123._col0(Inner),Output:["_col5","_col7","_col14"] + <-Map 13 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_123] PartitionCols:_col0 - Select Operator [SEL_70] (rows=10000000 width=1014) + Select Operator [SEL_122] (rows=10000000 width=1014) Output:["_col0","_col1"] - Filter Operator [FIL_69] (rows=10000000 width=1014) + Filter Operator [FIL_121] (rows=10000000 width=1014) predicate:((ca_country = 'United States') and (ca_state) IN ('KY', 'GA', 'NM', 'MT', 'OR', 'IN', 'WI', 'MO', 'WV') and ca_address_sk is not null) TableScan [TS_12] (rows=40000000 width=1014) default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_state","ca_country"] <-Reducer 4 [SIMPLE_EDGE] SHUFFLE [RS_24] PartitionCols:_col3 - Merge Join Operator [MERGEJOIN_55] (rows=85183356 width=88) - Conds:RS_21._col2=RS_68._col0(Inner),Output:["_col3","_col5","_col7"] - <-Map 9 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_68] + Merge Join Operator [MERGEJOIN_95] (rows=85183356 width=88) + Conds:RS_21._col2=RS_115._col0(Inner),Output:["_col3","_col5","_col7"] + <-Map 11 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_115] PartitionCols:_col0 - Select Operator [SEL_67] (rows=465450 width=385) + Select Operator [SEL_114] (rows=465450 width=385) Output:["_col0"] - Filter Operator [FIL_66] (rows=465450 width=385) + Filter Operator [FIL_113] (rows=465450 width=385) predicate:((cd_education_status = '4 yr Degree') and (cd_marital_status = 'M') and cd_demo_sk is not null) TableScan [TS_9] (rows=1861800 width=385) default@customer_demographics,customer_demographics,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_marital_status","cd_education_status"] <-Reducer 3 [SIMPLE_EDGE] SHUFFLE [RS_21] 
PartitionCols:_col2 - Merge Join Operator [MERGEJOIN_54] (rows=77439413 width=88) - Conds:RS_18._col1=RS_65._col0(Inner),Output:["_col2","_col3","_col5","_col7"] - <-Map 8 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_65] + Merge Join Operator [MERGEJOIN_94] (rows=77439413 width=88) + Conds:RS_18._col1=RS_107._col0(Inner),Output:["_col2","_col3","_col5","_col7"] + <-Map 9 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_107] PartitionCols:_col0 - Select Operator [SEL_64] (rows=36524 width=1119) + Select Operator [SEL_106] (rows=36524 width=1119) Output:["_col0"] - Filter Operator [FIL_63] (rows=36524 width=1119) + Filter Operator [FIL_105] (rows=36524 width=1119) predicate:((d_year = 1998) and d_date_sk is not null) TableScan [TS_6] (rows=73049 width=1119) default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] <-Reducer 2 [SIMPLE_EDGE] SHUFFLE [RS_18] PartitionCols:_col1 - Merge Join Operator [MERGEJOIN_53] (rows=70399465 width=88) - Conds:RS_59._col0=RS_62._col3(Inner),Output:["_col1","_col2","_col3","_col5","_col7"] + Merge Join Operator [MERGEJOIN_93] (rows=70399465 width=88) + Conds:RS_99._col0=RS_131._col3(Inner),Output:["_col1","_col2","_col3","_col5","_col7"] <-Map 1 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_59] + PARTITION_ONLY_SHUFFLE [RS_99] PartitionCols:_col0 - Select Operator [SEL_58] (rows=1704 width=1910) + Select Operator [SEL_98] (rows=1704 width=1910) Output:["_col0"] - Filter Operator [FIL_57] (rows=1704 width=1910) + Filter Operator [FIL_97] (rows=1704 width=1910) predicate:s_store_sk is not null TableScan [TS_0] (rows=1704 width=1910) default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk"] - <-Map 7 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_62] + <-Map 8 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_131] PartitionCols:_col3 - Select Operator [SEL_61] (rows=63999513 width=88) + Select Operator [SEL_130] (rows=63999513 width=88) Output:["_col0","_col1","_col2","_col3","_col4","_col6"] - Filter Operator [FIL_60] (rows=63999513 width=88) - 
predicate:((ss_net_profit BETWEEN 0 AND 2000 or ss_net_profit BETWEEN 150 AND 3000 or ss_net_profit BETWEEN 50 AND 25000) and (ss_sales_price BETWEEN 100 AND 150 or ss_sales_price BETWEEN 50 AND 100 or ss_sales_price BETWEEN 150 AND 200) and ss_addr_sk is not null and ss_cdemo_sk is not null and ss_sold_date_sk is not null and ss_store_sk is not null) + Filter Operator [FIL_129] (rows=63999513 width=88) + predicate:((ss_addr_sk BETWEEN DynamicValue(RS_25_customer_address_ca_address_sk_min) AND DynamicValue(RS_25_customer_address_ca_address_sk_max) and in_bloom_filter(ss_addr_sk, DynamicValue(RS_25_customer_address_ca_address_sk_bloom_filter))) and (ss_cdemo_sk BETWEEN DynamicValue(RS_22_customer_demographics_cd_demo_sk_min) AND DynamicValue(RS_22_customer_demographics_cd_demo_sk_max) and in_bloom_filter(ss_cdemo_sk, DynamicValue(RS_22_customer_demographics_cd_demo_sk_bloom_filter))) and (ss_net_profit BETWEEN 0 AND 2000 or ss_net_profit BETWEEN 150 AND 3000 or ss_net_profit BETWEEN 50 AND 25000) and (ss_sales_price BETWEEN 100 AND 150 or ss_sales_price BETWEEN 50 AND 100 or ss_sales_price BETWEEN 150 AND 200) and (ss_sold_date_sk BETWEEN DynamicValue(RS_19_date_dim_d_date_sk_min) AND DynamicValue(RS_19_date_dim_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk, DynamicValue(RS_19_date_dim_d_date_sk_bloom_filter))) and (ss_store_sk BETWEEN DynamicValue(RS_15_store_s_store_sk_min) AND DynamicValue(RS_15_store_s_store_sk_max) and in_bloom_filter(ss_store_sk, DynamicValue(RS_15_store_s_store_sk_bloom_filter))) and ss_addr_sk is not null and ss_cdemo_sk is not null and ss_sold_date_sk is not null and ss_store_sk is not null) TableScan [TS_3] (rows=575995635 width=88) default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_cdemo_sk","ss_addr_sk","ss_store_sk","ss_quantity","ss_sales_price","ss_net_profit"] + <-Reducer 10 [BROADCAST_EDGE] vectorized + BROADCAST [RS_112] + Group By Operator [GBY_111] (rows=1 width=12) + 
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 9 [CUSTOM_SIMPLE_EDGE] vectorized + SHUFFLE [RS_110] + Group By Operator [GBY_109] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_108] (rows=36524 width=1119) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_106] + <-Reducer 12 [BROADCAST_EDGE] vectorized + BROADCAST [RS_120] + Group By Operator [GBY_119] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 11 [CUSTOM_SIMPLE_EDGE] vectorized + SHUFFLE [RS_118] + Group By Operator [GBY_117] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_116] (rows=465450 width=385) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_114] + <-Reducer 14 [BROADCAST_EDGE] vectorized + BROADCAST [RS_128] + Group By Operator [GBY_127] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=10000000)"] + <-Map 13 [CUSTOM_SIMPLE_EDGE] vectorized + SHUFFLE [RS_126] + Group By Operator [GBY_125] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=10000000)"] + Select Operator [SEL_124] (rows=10000000 width=1014) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_122] + <-Reducer 7 [BROADCAST_EDGE] vectorized + BROADCAST [RS_104] + Group By Operator [GBY_103] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 1 
[CUSTOM_SIMPLE_EDGE] vectorized + PARTITION_ONLY_SHUFFLE [RS_102] + Group By Operator [GBY_101] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_100] (rows=1704 width=1910) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_98]
http://git-wip-us.apache.org/repos/asf/hive/blob/f2c4f319/ql/src/test/results/clientpositive/perf/tez/query49.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/perf/tez/query49.q.out b/ql/src/test/results/clientpositive/perf/tez/query49.q.out index 47f37a2..434ed16 100644 --- a/ql/src/test/results/clientpositive/perf/tez/query49.q.out +++ b/ql/src/test/results/clientpositive/perf/tez/query49.q.out @@ -253,20 +253,26 @@ POSTHOOK: type: QUERY Plan optimized by CBO. Vertex dependency in root stage +Map 1 <- Reducer 13 (BROADCAST_EDGE) +Map 27 <- Reducer 19 (BROADCAST_EDGE) +Map 29 <- Reducer 25 (BROADCAST_EDGE) Reducer 10 <- Union 9 (SIMPLE_EDGE) Reducer 11 <- Reducer 10 (SIMPLE_EDGE) -Reducer 13 <- Map 12 (SIMPLE_EDGE), Map 24 (SIMPLE_EDGE) -Reducer 14 <- Map 25 (SIMPLE_EDGE), Reducer 13 (SIMPLE_EDGE) -Reducer 15 <- Reducer 14 (SIMPLE_EDGE) +Reducer 13 <- Map 12 (CUSTOM_SIMPLE_EDGE) +Reducer 14 <- Map 12 (SIMPLE_EDGE), Map 27 (SIMPLE_EDGE) +Reducer 15 <- Map 28 (SIMPLE_EDGE), Reducer 14 (SIMPLE_EDGE) Reducer 16 <- Reducer 15 (SIMPLE_EDGE) -Reducer 17 <- Reducer 16 (SIMPLE_EDGE), Union 7 (CONTAINS) -Reducer 18 <- Map 12 (SIMPLE_EDGE), Map 26 (SIMPLE_EDGE) -Reducer 19 <- Map 27 (SIMPLE_EDGE), Reducer 18 (SIMPLE_EDGE) +Reducer 17 <- Reducer 16 (SIMPLE_EDGE) +Reducer 18 <- Reducer 17 (SIMPLE_EDGE), Union 7 (CONTAINS) +Reducer 19 <- Map 12 (CUSTOM_SIMPLE_EDGE) Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 12 (SIMPLE_EDGE) -Reducer 20 <- Reducer 19 (SIMPLE_EDGE) -Reducer 21 <- Reducer 20 (SIMPLE_EDGE) -Reducer 22 <- Reducer 21 (SIMPLE_EDGE), Union 9 (CONTAINS) -Reducer 3 <- Map 23 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) +Reducer 20 <- Map 12 (SIMPLE_EDGE), Map 29 (SIMPLE_EDGE) +Reducer 21 <- Map 30 (SIMPLE_EDGE), Reducer 20 (SIMPLE_EDGE) +Reducer 22 <- Reducer 21 (SIMPLE_EDGE) +Reducer 23 <- Reducer 22 (SIMPLE_EDGE) +Reducer 24 <- Reducer 23 (SIMPLE_EDGE), Union 9 (CONTAINS) +Reducer 25 <- Map 12 
(CUSTOM_SIMPLE_EDGE) +Reducer 3 <- Map 26 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Reducer 6 <- Reducer 5 (SIMPLE_EDGE), Union 7 (CONTAINS) @@ -277,185 +283,207 @@ Stage-0 limit:100 Stage-1 Reducer 11 vectorized - File Output Operator [FS_205] - Limit [LIM_204] (rows=100 width=101) + File Output Operator [FS_306] + Limit [LIM_305] (rows=100 width=101) Number of rows:100 - Select Operator [SEL_203] (rows=5915494 width=101) + Select Operator [SEL_304] (rows=5915494 width=101) Output:["_col0","_col1","_col2","_col3","_col4"] <-Reducer 10 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_202] - Select Operator [SEL_201] (rows=5915494 width=101) + SHUFFLE [RS_303] + Select Operator [SEL_302] (rows=5915494 width=101) Output:["_col0","_col1","_col2","_col3","_col4"] - Group By Operator [GBY_200] (rows=5915494 width=101) + Group By Operator [GBY_301] (rows=5915494 width=101) Output:["_col0","_col1","_col2","_col3","_col4"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4 <-Union 9 [SIMPLE_EDGE] - <-Reducer 22 [CONTAINS] vectorized - Reduce Output Operator [RS_241] + <-Reducer 24 [CONTAINS] vectorized + Reduce Output Operator [RS_346] PartitionCols:_col0, _col1, _col2, _col3, _col4 - Group By Operator [GBY_240] (rows=11830988 width=101) + Group By Operator [GBY_345] (rows=11830988 width=101) Output:["_col0","_col1","_col2","_col3","_col4"],keys:_col0, _col3, _col4, _col1, _col2 - Select Operator [SEL_239] (rows=8604378 width=88) + Select Operator [SEL_344] (rows=8604378 width=88) Output:["_col0","_col1","_col2","_col3","_col4"] - Filter Operator [FIL_238] (rows=8604378 width=88) + Filter Operator [FIL_343] (rows=8604378 width=88) predicate:((_col0 <= 10) or (rank_window_1 <= 10)) - PTF Operator [PTF_237] (rows=12906568 width=88) + PTF Operator [PTF_342] (rows=12906568 width=88) Function definitions:[{},{"name:":"windowingtablefunction","order by:":"(CAST( _col4 AS decimal(15,4)) / CAST( _col5 AS 
decimal(15,4))) ASC NULLS FIRST","partition by:":"0"}] - Select Operator [SEL_236] (rows=12906568 width=88) + Select Operator [SEL_341] (rows=12906568 width=88) Output:["_col0","_col1","_col2","_col3","_col4","_col5"] - <-Reducer 21 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_235] + <-Reducer 23 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_340] PartitionCols:0 - Select Operator [SEL_234] (rows=12906568 width=88) + Select Operator [SEL_339] (rows=12906568 width=88) Output:["rank_window_0","_col0","_col1","_col2","_col3","_col4"] - PTF Operator [PTF_233] (rows=12906568 width=88) + PTF Operator [PTF_338] (rows=12906568 width=88) Function definitions:[{},{"name:":"windowingtablefunction","order by:":"(CAST( _col1 AS decimal(15,4)) / CAST( _col2 AS decimal(15,4))) ASC NULLS FIRST","partition by:":"0"}] - Select Operator [SEL_232] (rows=12906568 width=88) + Select Operator [SEL_337] (rows=12906568 width=88) Output:["_col0","_col1","_col2","_col3","_col4"] - <-Reducer 20 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_231] + <-Reducer 22 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_336] PartitionCols:0 - Group By Operator [GBY_230] (rows=12906568 width=88) + Group By Operator [GBY_335] (rows=12906568 width=88) Output:["_col0","_col1","_col2","_col3","_col4"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)","sum(VALUE._col3)"],keys:KEY._col0 - <-Reducer 19 [SIMPLE_EDGE] + <-Reducer 21 [SIMPLE_EDGE] SHUFFLE [RS_89] PartitionCols:_col0 Group By Operator [GBY_88] (rows=25813137 width=88) Output:["_col0","_col1","_col2","_col3","_col4"],aggregations:["sum(_col1)","sum(_col2)","sum(_col3)","sum(_col4)"],keys:_col0 Select Operator [SEL_86] (rows=25813137 width=88) Output:["_col0","_col1","_col2","_col3","_col4"] - Merge Join Operator [MERGEJOIN_146] (rows=25813137 width=88) - Conds:RS_83._col1, _col2=RS_229._col0, _col1(Inner),Output:["_col1","_col3","_col4","_col11","_col12"] - <-Map 27 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_229] + Merge Join Operator [MERGEJOIN_236] (rows=25813137 
width=88) + Conds:RS_83._col1, _col2=RS_334._col0, _col1(Inner),Output:["_col1","_col3","_col4","_col11","_col12"] + <-Map 30 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_334] PartitionCols:_col0, _col1 - Select Operator [SEL_228] (rows=19197050 width=77) + Select Operator [SEL_333] (rows=19197050 width=77) Output:["_col0","_col1","_col2","_col3"] - Filter Operator [FIL_227] (rows=19197050 width=77) + Filter Operator [FIL_332] (rows=19197050 width=77) predicate:((sr_return_amt > 10000) and sr_item_sk is not null and sr_ticket_number is not null) TableScan [TS_77] (rows=57591150 width=77) default@store_returns,sr,Tbl:COMPLETE,Col:NONE,Output:["sr_item_sk","sr_ticket_number","sr_return_quantity","sr_return_amt"] - <-Reducer 18 [SIMPLE_EDGE] + <-Reducer 20 [SIMPLE_EDGE] SHUFFLE [RS_83] PartitionCols:_col1, _col2 - Merge Join Operator [MERGEJOIN_145] (rows=23466488 width=88) - Conds:RS_226._col0=RS_180._col0(Inner),Output:["_col1","_col2","_col3","_col4"] + Merge Join Operator [MERGEJOIN_235] (rows=23466488 width=88) + Conds:RS_331._col0=RS_269._col0(Inner),Output:["_col1","_col2","_col3","_col4"] <-Map 12 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_180] + PARTITION_ONLY_SHUFFLE [RS_269] PartitionCols:_col0 - Select Operator [SEL_177] (rows=18262 width=1119) + Select Operator [SEL_264] (rows=18262 width=1119) Output:["_col0"] - Filter Operator [FIL_176] (rows=18262 width=1119) + Filter Operator [FIL_263] (rows=18262 width=1119) predicate:((d_moy = 12) and (d_year = 2000) and d_date_sk is not null) TableScan [TS_3] (rows=73049 width=1119) default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] - <-Map 26 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_226] + <-Map 29 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_331] PartitionCols:_col0 - Select Operator [SEL_225] (rows=21333171 width=88) + Select Operator [SEL_330] (rows=21333171 width=88) Output:["_col0","_col1","_col2","_col3","_col4"] - Filter Operator [FIL_224] (rows=21333171 width=88) - predicate:((ss_net_paid 
> 0) and (ss_net_profit > 1) and (ss_quantity > 0) and ss_item_sk is not null and ss_sold_date_sk is not null and ss_ticket_number is not null) + Filter Operator [FIL_329] (rows=21333171 width=88) + predicate:((ss_net_paid > 0) and (ss_net_profit > 1) and (ss_quantity > 0) and (ss_sold_date_sk BETWEEN DynamicValue(RS_81_date_dim_d_date_sk_min) AND DynamicValue(RS_81_date_dim_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk, DynamicValue(RS_81_date_dim_d_date_sk_bloom_filter))) and ss_item_sk is not null and ss_sold_date_sk is not null and ss_ticket_number is not null) TableScan [TS_71] (rows=575995635 width=88) default@store_sales,sts,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_ticket_number","ss_quantity","ss_net_paid","ss_net_profit"] + <-Reducer 25 [BROADCAST_EDGE] vectorized + BROADCAST [RS_328] + Group By Operator [GBY_327] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 12 [CUSTOM_SIMPLE_EDGE] vectorized + PARTITION_ONLY_SHUFFLE [RS_276] + Group By Operator [GBY_273] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_270] (rows=18262 width=1119) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_264] <-Reducer 8 [CONTAINS] vectorized - Reduce Output Operator [RS_199] + Reduce Output Operator [RS_300] PartitionCols:_col0, _col1, _col2, _col3, _col4 - Group By Operator [GBY_198] (rows=11830988 width=101) + Group By Operator [GBY_299] (rows=11830988 width=101) Output:["_col0","_col1","_col2","_col3","_col4"],keys:_col0, _col3, _col4, _col1, _col2 - Select Operator [SEL_197] (rows=3226610 width=135) + Select Operator [SEL_298] (rows=3226610 width=135) Output:["_col0","_col1","_col2","_col3","_col4"] - Group By Operator [GBY_196] (rows=3226610 width=135) + Group By Operator [GBY_297] 
(rows=3226610 width=135) Output:["_col0","_col1","_col2","_col3","_col4"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4 <-Union 7 [SIMPLE_EDGE] - <-Reducer 17 [CONTAINS] vectorized - Reduce Output Operator [RS_223] + <-Reducer 18 [CONTAINS] vectorized + Reduce Output Operator [RS_326] PartitionCols:_col0, _col1, _col2, _col3, _col4 - Group By Operator [GBY_222] (rows=6453220 width=135) + Group By Operator [GBY_325] (rows=6453220 width=135) Output:["_col0","_col1","_col2","_col3","_col4"],keys:_col0, _col3, _col4, _col1, _col2 - Select Operator [SEL_221] (rows=4302070 width=135) + Select Operator [SEL_324] (rows=4302070 width=135) Output:["_col0","_col1","_col2","_col3","_col4"] - Filter Operator [FIL_220] (rows=4302070 width=135) + Filter Operator [FIL_323] (rows=4302070 width=135) predicate:((_col0 <= 10) or (rank_window_1 <= 10)) - PTF Operator [PTF_219] (rows=6453105 width=135) + PTF Operator [PTF_322] (rows=6453105 width=135) Function definitions:[{},{"name:":"windowingtablefunction","order by:":"(CAST( _col4 AS decimal(15,4)) / CAST( _col5 AS decimal(15,4))) ASC NULLS FIRST","partition by:":"0"}] - Select Operator [SEL_218] (rows=6453105 width=135) + Select Operator [SEL_321] (rows=6453105 width=135) Output:["_col0","_col1","_col2","_col3","_col4","_col5"] - <-Reducer 16 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_217] + <-Reducer 17 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_320] PartitionCols:0 - Select Operator [SEL_216] (rows=6453105 width=135) + Select Operator [SEL_319] (rows=6453105 width=135) Output:["rank_window_0","_col0","_col1","_col2","_col3","_col4"] - PTF Operator [PTF_215] (rows=6453105 width=135) + PTF Operator [PTF_318] (rows=6453105 width=135) Function definitions:[{},{"name:":"windowingtablefunction","order by:":"(CAST( _col1 AS decimal(15,4)) / CAST( _col2 AS decimal(15,4))) ASC NULLS FIRST","partition by:":"0"}] - Select Operator [SEL_214] (rows=6453105 width=135) + Select Operator [SEL_317] (rows=6453105 width=135) 
Output:["_col0","_col1","_col2","_col3","_col4"] - <-Reducer 15 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_213] + <-Reducer 16 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_316] PartitionCols:0 - Group By Operator [GBY_212] (rows=6453105 width=135) + Group By Operator [GBY_315] (rows=6453105 width=135) Output:["_col0","_col1","_col2","_col3","_col4"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)","sum(VALUE._col3)"],keys:KEY._col0 - <-Reducer 14 [SIMPLE_EDGE] + <-Reducer 15 [SIMPLE_EDGE] SHUFFLE [RS_50] PartitionCols:_col0 Group By Operator [GBY_49] (rows=12906211 width=135) Output:["_col0","_col1","_col2","_col3","_col4"],aggregations:["sum(_col1)","sum(_col2)","sum(_col3)","sum(_col4)"],keys:_col0 Select Operator [SEL_47] (rows=12906211 width=135) Output:["_col0","_col1","_col2","_col3","_col4"] - Merge Join Operator [MERGEJOIN_144] (rows=12906211 width=135) - Conds:RS_44._col1, _col2=RS_211._col0, _col1(Inner),Output:["_col1","_col3","_col4","_col11","_col12"] - <-Map 25 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_211] + Merge Join Operator [MERGEJOIN_234] (rows=12906211 width=135) + Conds:RS_44._col1, _col2=RS_314._col0, _col1(Inner),Output:["_col1","_col3","_col4","_col11","_col12"] + <-Map 28 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_314] PartitionCols:_col0, _col1 - Select Operator [SEL_210] (rows=9599627 width=106) + Select Operator [SEL_313] (rows=9599627 width=106) Output:["_col0","_col1","_col2","_col3"] - Filter Operator [FIL_209] (rows=9599627 width=106) + Filter Operator [FIL_312] (rows=9599627 width=106) predicate:((cr_return_amount > 10000) and cr_item_sk is not null and cr_order_number is not null) TableScan [TS_38] (rows=28798881 width=106) default@catalog_returns,cr,Tbl:COMPLETE,Col:NONE,Output:["cr_item_sk","cr_order_number","cr_return_quantity","cr_return_amount"] - <-Reducer 13 [SIMPLE_EDGE] + <-Reducer 14 [SIMPLE_EDGE] SHUFFLE [RS_44] PartitionCols:_col1, _col2 - Merge Join Operator [MERGEJOIN_143] (rows=11732919 width=135) - 
Conds:RS_208._col0=RS_179._col0(Inner),Output:["_col1","_col2","_col3","_col4"] + Merge Join Operator [MERGEJOIN_233] (rows=11732919 width=135) + Conds:RS_311._col0=RS_267._col0(Inner),Output:["_col1","_col2","_col3","_col4"] <-Map 12 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_179] + PARTITION_ONLY_SHUFFLE [RS_267] PartitionCols:_col0 - Please refer to the previous Select Operator [SEL_177] - <-Map 24 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_208] + Please refer to the previous Select Operator [SEL_264] + <-Map 27 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_311] PartitionCols:_col0 - Select Operator [SEL_207] (rows=10666290 width=135) + Select Operator [SEL_310] (rows=10666290 width=135) Output:["_col0","_col1","_col2","_col3","_col4"] - Filter Operator [FIL_206] (rows=10666290 width=135) - predicate:((cs_net_paid > 0) and (cs_net_profit > 1) and (cs_quantity > 0) and cs_item_sk is not null and cs_order_number is not null and cs_sold_date_sk is not null) + Filter Operator [FIL_309] (rows=10666290 width=135) + predicate:((cs_net_paid > 0) and (cs_net_profit > 1) and (cs_quantity > 0) and (cs_sold_date_sk BETWEEN DynamicValue(RS_42_date_dim_d_date_sk_min) AND DynamicValue(RS_42_date_dim_d_date_sk_max) and in_bloom_filter(cs_sold_date_sk, DynamicValue(RS_42_date_dim_d_date_sk_bloom_filter))) and cs_item_sk is not null and cs_order_number is not null and cs_sold_date_sk is not null) TableScan [TS_32] (rows=287989836 width=135) default@catalog_sales,cs,Tbl:COMPLETE,Col:NONE,Output:["cs_sold_date_sk","cs_item_sk","cs_order_number","cs_quantity","cs_net_paid","cs_net_profit"] + <-Reducer 19 [BROADCAST_EDGE] vectorized + BROADCAST [RS_308] + Group By Operator [GBY_307] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 12 [CUSTOM_SIMPLE_EDGE] vectorized + PARTITION_ONLY_SHUFFLE [RS_275] + Group By Operator [GBY_272] (rows=1 width=12) + 
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_268] (rows=18262 width=1119) + Output:["_col0"] + Please refer to the previous Select Operator [SEL_264] <-Reducer 6 [CONTAINS] vectorized - Reduce Output Operator [RS_195] + Reduce Output Operator [RS_296] PartitionCols:_col0, _col1, _col2, _col3, _col4 - Group By Operator [GBY_194] (rows=6453220 width=135) + Group By Operator [GBY_295] (rows=6453220 width=135) Output:["_col0","_col1","_col2","_col3","_col4"],keys:_col0, _col3, _col4, _col1, _col2 - Select Operator [SEL_193] (rows=2151150 width=135) + Select Operator [SEL_294] (rows=2151150 width=135) Output:["_col0","_col1","_col2","_col3","_col4"] - Filter Operator [FIL_192] (rows=2151150 width=135) + Filter Operator [FIL_293] (rows=2151150 width=135) predicate:((_col0 <= 10) or (rank_window_1 <= 10)) - PTF Operator [PTF_191] (rows=3226726 width=135) + PTF Operator [PTF_292] (rows=3226726 width=135) Function definitions:[{},{"name:":"windowingtablefunction","order by:":"(CAST( _col4 AS decimal(15,4)) / CAST( _col5 AS decimal(15,4))) ASC NULLS FIRST","partition by:":"0"}] - Select Operator [SEL_190] (rows=3226726 width=135) + Select Operator [SEL_291] (rows=3226726 width=135) Output:["_col0","_col1","_col2","_col3","_col4","_col5"] <-Reducer 5 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_189] + SHUFFLE [RS_290] PartitionCols:0 - Select Operator [SEL_188] (rows=3226726 width=135) + Select Operator [SEL_289] (rows=3226726 width=135) Output:["rank_window_0","_col0","_col1","_col2","_col3","_col4"] - PTF Operator [PTF_187] (rows=3226726 width=135) + PTF Operator [PTF_288] (rows=3226726 width=135) Function definitions:[{},{"name:":"windowingtablefunction","order by:":"(CAST( _col1 AS decimal(15,4)) / CAST( _col2 AS decimal(15,4))) ASC NULLS FIRST","partition by:":"0"}] - Select Operator [SEL_186] (rows=3226726 width=135) + Select Operator [SEL_287] (rows=3226726 width=135) 
Output:["_col0","_col1","_col2","_col3","_col4"] <-Reducer 4 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_185] + SHUFFLE [RS_286] PartitionCols:0 - Group By Operator [GBY_184] (rows=3226726 width=135) + Group By Operator [GBY_285] (rows=3226726 width=135) Output:["_col0","_col1","_col2","_col3","_col4"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)","sum(VALUE._col3)"],keys:KEY._col0 <-Reducer 3 [SIMPLE_EDGE] SHUFFLE [RS_18] @@ -464,33 +492,44 @@ Stage-0 Output:["_col0","_col1","_col2","_col3","_col4"],aggregations:["sum(_col1)","sum(_col2)","sum(_col3)","sum(_col4)"],keys:_col0 Select Operator [SEL_15] (rows=6453452 width=135) Output:["_col0","_col1","_col2","_col3","_col4"] - Merge Join Operator [MERGEJOIN_142] (rows=6453452 width=135) - Conds:RS_12._col1, _col2=RS_183._col0, _col1(Inner),Output:["_col1","_col3","_col4","_col11","_col12"] - <-Map 23 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_183] + Merge Join Operator [MERGEJOIN_232] (rows=6453452 width=135) + Conds:RS_12._col1, _col2=RS_284._col0, _col1(Inner),Output:["_col1","_col3","_col4","_col11","_col12"] + <-Map 26 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_284] PartitionCols:_col0, _col1 - Select Operator [SEL_182] (rows=4799489 width=92) + Select Operator [SEL_283] (rows=4799489 width=92) Output:["_col0","_col1","_col2","_col3"] - Filter Operator [FIL_181] (rows=4799489 width=92) + Filter Operator [FIL_282] (rows=4799489 width=92) predicate:((wr_return_amt > 10000) and wr_item_sk is not null and wr_order_number is not null) TableScan [TS_6] (rows=14398467 width=92) default@web_returns,wr,Tbl:COMPLETE,Col:NONE,Output:["wr_item_sk","wr_order_number","wr_return_quantity","wr_return_amt"] <-Reducer 2 [SIMPLE_EDGE] SHUFFLE [RS_12] PartitionCols:_col1, _col2 - Merge Join Operator [MERGEJOIN_141] (rows=5866775 width=135) - Conds:RS_175._col0=RS_178._col0(Inner),Output:["_col1","_col2","_col3","_col4"] + Merge Join Operator [MERGEJOIN_231] (rows=5866775 width=135) + 
Conds:RS_281._col0=RS_265._col0(Inner),Output:["_col1","_col2","_col3","_col4"] <-Map 12 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_178] + PARTITION_ONLY_SHUFFLE [RS_265] PartitionCols:_col0 - Please refer to the previous Select Operator [SEL_177] + Please refer to the previous Select Operator [SEL_264] <-Map 1 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_175] + SHUFFLE [RS_281] PartitionCols:_col0 - Select Operator [SEL_174] (rows=5333432 width=135) + Select Operator [SEL_280] (rows=5333432 width=135) Output:["_col0","_col1","_col2","_col3","_col4"] - Filter Operator [FIL_173] (rows=5333432 width=135) - predicate:((ws_net_paid > 0) and (ws_net_profit > 1) and (ws_quantity > 0) and ws_item_sk is not null and ws_order_number is not null and ws_sold_date_sk is not null) + Filter Operator [FIL_279] (rows=5333432 width=135) + predicate:((ws_net_paid > 0) and (ws_net_profit > 1) and (ws_quantity > 0) and (ws_sold_date_sk BETWEEN DynamicValue(RS_10_date_dim_d_date_sk_min) AND DynamicValue(RS_10_date_dim_d_date_sk_max) and in_bloom_filter(ws_sold_date_sk, DynamicValue(RS_10_date_dim_d_date_sk_bloom_filter))) and ws_item_sk is not null and ws_order_number is not null and ws_sold_date_sk is not null) TableScan [TS_0] (rows=144002668 width=135) default@web_sales,ws,Tbl:COMPLETE,Col:NONE,Output:["ws_sold_date_sk","ws_item_sk","ws_order_number","ws_quantity","ws_net_paid","ws_net_profit"] + <-Reducer 13 [BROADCAST_EDGE] vectorized + BROADCAST [RS_278] + Group By Operator [GBY_277] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] + <-Map 12 [CUSTOM_SIMPLE_EDGE] vectorized + PARTITION_ONLY_SHUFFLE [RS_274] + Group By Operator [GBY_271] (rows=1 width=12) + Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] + Select Operator [SEL_266] (rows=18262 width=1119) + Output:["_col0"] + Please refer to the previous Select 
Operator [SEL_264]
