http://git-wip-us.apache.org/repos/asf/hive/blob/be9735e1/ql/src/test/results/clientpositive/llap/constprog_dpp.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/llap/constprog_dpp.q.out b/ql/src/test/results/clientpositive/llap/constprog_dpp.q.out index a1addb7..ab0b36c 100644 --- a/ql/src/test/results/clientpositive/llap/constprog_dpp.q.out +++ b/ql/src/test/results/clientpositive/llap/constprog_dpp.q.out @@ -47,70 +47,41 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE), Reducer 5 (SIMPLE_EDGE) Reducer 5 <- Union 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 llap - File Output Operator [FS_17] - compressed:false - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Merge Join Operator [MERGEJOIN_21] - | condition map:[{"":"Left Outer Join0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] llap - | Reduce Output Operator [RS_13] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Select Operator [SEL_1] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:a - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] llap - Reduce Output Operator [RS_14] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: COMPLETE - Limit [LIM_11] - Number of rows:1 - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: COMPLETE - Select Operator [SEL_10] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: COMPLETE - |<-Union 4 [SIMPLE_EDGE] - |<-Map 3 [CONTAINS] llap - | Reduce Output Operator [RS_9] - | sort order: - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: COMPLETE - | value expressions:_col0 (type: int) - | Limit [LIM_8] - | Number of rows:1 - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: COMPLETE - | Select Operator [SEL_3] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_2] - | alias:tb2 - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 6 [CONTAINS] llap - Reduce Output Operator [RS_9] - sort order: - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: COMPLETE - value expressions:_col0 (type: int) - Limit [LIM_8] - Number of rows:1 - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: COMPLETE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: COMPLETE - TableScan [TS_4] - alias:tb2 - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 llap + File Output Operator [FS_17] + Merge Join Operator [MERGEJOIN_21] (rows=1 width=0) + Conds:RS_13._col0=RS_14._col0(Left Outer),Output:["_col0"] + <-Map 1 [SIMPLE_EDGE] llap + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_1] (rows=1 width=0) + Output:["_col0"] + TableScan [TS_0] (rows=1 width=0) + default@tb1,a,Tbl:PARTIAL,Col:NONE,Output:["id"] + <-Reducer 5 [SIMPLE_EDGE] llap + SHUFFLE [RS_14] + PartitionCols:_col0 + Limit [LIM_11] (rows=1 width=0) + Number of rows:1 + Select Operator [SEL_10] (rows=1 width=0) + Output:["_col0"] + <-Union 4 [SIMPLE_EDGE] + <-Map 3 [CONTAINS] llap + Reduce Output Operator [RS_9] + Limit [LIM_8] (rows=1 width=0) + Number of rows:1 + Select Operator [SEL_3] (rows=1 width=0) + Output:["_col0"] + TableScan [TS_2] (rows=1 width=0) + Output:["id"] + <-Map 6 [CONTAINS] llap + Reduce Output Operator [RS_9] + Limit [LIM_8] (rows=1 width=0) + Number of rows:1 + Select Operator [SEL_5] (rows=1 width=0) + Output:["_col0"] + TableScan [TS_4] (rows=1 width=0)
http://git-wip-us.apache.org/repos/asf/hive/blob/be9735e1/ql/src/test/results/clientpositive/perf/query12.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/perf/query12.q.out b/ql/src/test/results/clientpositive/perf/query12.q.out index 648d64d..ce3654a 100644 --- a/ql/src/test/results/clientpositive/perf/query12.q.out +++ b/ql/src/test/results/clientpositive/perf/query12.q.out @@ -12,118 +12,63 @@ Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 6 - File Output Operator [FS_26] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_25] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_24] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 34938 Data size: 50180683 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_23] - key expressions:_col1 (type: string), _col2 (type: string), _col4 (type: string), _col0 (type: string), _col6 (type: decimal(38,23)) - sort order:+++++ - Statistics:Num rows: 34938 Data size: 50180683 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: decimal(7,2)), _col5 (type: decimal(17,2)) - Select Operator [SEL_21] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - Statistics:Num rows: 34938 Data size: 50180683 Basic stats: COMPLETE Column stats: NONE - PTF Operator [PTF_20] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col3","partition by:":"_col3"}] - Statistics:Num rows: 34938 Data size: 50180683 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_19] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 34938 Data size: 50180683 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col3 (type: string) - Map-reduce partition columns:_col3 (type: string) - sort order:+ - Statistics:Num rows: 34938 Data size: 50180683 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col4 (type: decimal(7,2)), _col5 (type: decimal(17,2)) - Group By Operator [GBY_17] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: string), KEY._col3 (type: string), KEY._col4 (type: decimal(7,2)) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 34938 Data size: 50180683 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_16] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: decimal(7,2)) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: decimal(7,2)) - sort order:+++++ - Statistics:Num rows: 69877 Data size: 100362804 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: decimal(17,2)) - Group By Operator [GBY_15] - aggregations:["sum(_col23)"] - keys:_col38 (type: string), _col41 (type: string), _col49 (type: string), _col47 (type: string), _col42 (type: decimal(7,2)) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 69877 Data size: 100362804 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_14] - outputColumnNames:["_col38","_col41","_col49","_col47","_col42","_col23"] - Statistics:Num rows: 69877 Data size: 100362804 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_32] - predicate:((_col3 = _col37) and (_col0 = _col62)) (type: boolean) - Statistics:Num rows: 69877 Data size: 100362804 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_37] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"d_date_sk (type: int)"} - | outputColumnNames:["_col0","_col3","_col23","_col37","_col38","_col41","_col42","_col47","_col49","_col62"] - | Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - | Reduce Output Operator [RS_11] - | key expressions:d_date_sk (type: int) - | Map-reduce partition columns:d_date_sk (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_35] - | predicate:(d_date_sk is not null and d_date BETWEEN '2001-01-12' AND '2001-02-11') (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_2] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_9] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: int), _col23 (type: decimal(7,2)), _col37 (type: int), _col38 (type: string), _col41 (type: string), _col42 (type: decimal(7,2)), _col47 (type: string), _col49 (type: string) - Merge Join Operator [MERGEJOIN_36] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"ws_item_sk (type: int)","1":"i_item_sk (type: int)"} - | outputColumnNames:["_col0","_col3","_col23","_col37","_col38","_col41","_col42","_col47","_col49"] - | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_4] - | key expressions:ws_item_sk (type: int) - | Map-reduce partition columns:ws_item_sk (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:ws_sold_date_sk (type: int), ws_ext_sales_price (type: decimal(7,2)) - | Filter Operator [FIL_33] - | predicate:(ws_item_sk is not null and ws_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:web_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_6] - key expressions:i_item_sk (type: int) - Map-reduce partition columns:i_item_sk (type: int) - sort order:+ - Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - value expressions:i_item_id (type: string), i_item_desc (type: string), i_current_price (type: decimal(7,2)), i_class (type: string), i_category (type: string) - Filter Operator [FIL_34] - predicate:(i_item_sk is not null and (i_category) IN ('Jewelry', 'Sports', 'Books')) (type: boolean) - Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_1] - alias:item - Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 6 + File Output Operator [FS_26] + Limit [LIM_25] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_24] (rows=34938 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_23] + Select Operator [SEL_21] (rows=34938 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + PTF Operator [PTF_20] (rows=34938 width=1436) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col3","partition by:":"_col3"}] + Select Operator [SEL_19] (rows=34938 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col3 + Group By Operator [GBY_17] (rows=34938 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4 + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0, _col1, _col2, _col3, _col4 + Group By Operator [GBY_15] (rows=69877 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["sum(_col23)"],keys:_col38, _col41, _col49, _col47, _col42 + Select Operator [SEL_14] (rows=69877 width=1436) + Output:["_col38","_col41","_col49","_col47","_col42","_col23"] + Filter Operator [FIL_32] (rows=69877 width=1436) + predicate:((_col3 = _col37) and (_col0 = _col62)) + Merge Join Operator [MERGEJOIN_37] (rows=279510 width=1436) + Conds:RS_9._col0=RS_11.d_date_sk(Inner),Output:["_col0","_col3","_col23","_col37","_col38","_col41","_col42","_col47","_col49","_col62"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_11] + PartitionCols:d_date_sk + Filter Operator [FIL_35] (rows=36524 width=1119) + predicate:(d_date_sk is not null and d_date BETWEEN '2001-01-12' AND '2001-02-11') + TableScan [TS_2] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_36] (rows=254100 width=1436) + Conds:RS_4.ws_item_sk=RS_6.i_item_sk(Inner),Output:["_col0","_col3","_col23","_col37","_col38","_col41","_col42","_col47","_col49"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:ws_item_sk + Filter Operator [FIL_33] (rows=1 width=0) + predicate:(ws_item_sk is not null and ws_sold_date_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@web_sales,web_sales,Tbl:PARTIAL,Col:NONE,Output:["ws_sold_date_sk","ws_item_sk","ws_ext_sales_price"] + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_6] + PartitionCols:i_item_sk + Filter Operator [FIL_34] (rows=231000 width=1436) + predicate:(i_item_sk is not null and (i_category) IN ('Jewelry', 'Sports', 'Books')) + TableScan [TS_1] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id","i_item_desc","i_current_price","i_class","i_category"] http://git-wip-us.apache.org/repos/asf/hive/blob/be9735e1/ql/src/test/results/clientpositive/perf/query13.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/perf/query13.q.out b/ql/src/test/results/clientpositive/perf/query13.q.out index b8dc4cc..cc40e79 100644 --- a/ql/src/test/results/clientpositive/perf/query13.q.out +++ b/ql/src/test/results/clientpositive/perf/query13.q.out @@ -117,184 +117,99 @@ Reducer 6 <- Map 12 (SIMPLE_EDGE), Reducer 5 (SIMPLE_EDGE) Reducer 7 <- Reducer 6 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 7 - File Output Operator [FS_42] - compressed:false - Statistics:Num rows: 1 Data size: 344 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_40] - | aggregations:["avg(VALUE._col0)","avg(VALUE._col1)","avg(VALUE._col2)","sum(VALUE._col3)"] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 344 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_39] - sort order: - Statistics:Num rows: 1 Data size: 112 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: struct<count:bigint,sum:double,input:int>), _col1 (type: struct<count:bigint,sum:decimal(17,2),input:decimal(7,2)>), _col2 (type: struct<count:bigint,sum:decimal(17,2),input:decimal(7,2)>), _col3 (type: decimal(17,2)) - Group By Operator [GBY_38] - aggregations:["avg(_col5)","avg(_col7)","avg(_col8)","sum(_col8)"] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 1 Data size: 112 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_73] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col5","_col7","_col8"] - | Statistics:Num rows: 18150000 Data size: 18420070657 Basic stats: COMPLETE Column stats: NONE - |<-Map 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_35] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_33] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_68] - | predicate:((d_year = 2001) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_31] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_34] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 16500000 Data size: 16745518417 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: int), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)) - Select Operator [SEL_30] - outputColumnNames:["_col0","_col5","_col7","_col8"] - Statistics:Num rows: 16500000 Data size: 16745518417 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_29] - predicate:(((_col17) IN ('KY', 'GA', 'NM') and _col9 BETWEEN 100 AND 200) or ((_col17) IN ('MT', 'OR', 'IN') and _col9 BETWEEN 150 AND 300) or ((_col17) IN ('WI', 'MO', 'WV') and _col9 BETWEEN 50 AND 250)) (type: boolean) - Statistics:Num rows: 16500000 Data size: 16745518417 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_72] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col5","_col7","_col8","_col9","_col17"] - | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_27] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_25] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_67] - | predicate:((((ca_state) IN ('KY', 'GA', 'NM') or (ca_state) IN ('MT', 'OR', 'IN') or (ca_state) IN ('WI', 'MO', 'WV')) and (ca_country = 'United States')) and ca_address_sk is not null) (type: boolean) - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_23] - | alias:customer_address - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_26] - key expressions:_col3 (type: int) - Map-reduce partition columns:_col3 (type: int) - sort order:+ - Statistics:Num rows: 4491 Data size: 1626526 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col5 (type: int), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)), _col9 (type: decimal(7,2)) - Select Operator [SEL_22] - outputColumnNames:["_col0","_col3","_col5","_col7","_col8","_col9"] - Statistics:Num rows: 4491 Data size: 1626526 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_21] - predicate:(((_col12 = 'M') and (_col13 = '4 yr Degree') and _col6 BETWEEN 100.0 AND 150.0 and (_col15 = 3)) or ((_col12 = 'D') and (_col13 = 'Primary') and _col6 BETWEEN 50.0 AND 100.0 and (_col15 = 1)) or ((_col12 = 'U') and (_col13 = 'Advanced Degree') and _col6 BETWEEN 150.0 AND 200.0 and (_col15 = 1))) (type: boolean) - Statistics:Num rows: 4491 Data size: 1626526 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_71] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col3","_col5","_col6","_col7","_col8","_col9","_col12","_col13","_col15"] - | Statistics:Num rows: 23958 Data size: 8676981 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int) - | Select Operator [SEL_11] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_66] - | predicate:(((hd_dep_count = 3) or (hd_dep_count = 1)) and hd_demo_sk is not null) (type: boolean) - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:household_demographics - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 21780 Data size: 7888165 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col3 (type: int), _col5 (type: int), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)), _col9 (type: decimal(7,2)), _col12 (type: string), _col13 (type: string) - Merge Join Operator [MERGEJOIN_70] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col3","_col5","_col6","_col7","_col8","_col9","_col12","_col13"] - | Statistics:Num rows: 21780 Data size: 7888165 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_16] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_65] - | predicate:((((cd_marital_status = 'M') or (cd_marital_status = 'D') or (cd_marital_status = 'U')) and ((cd_education_status = '4 yr Degree') or (cd_education_status = 'Primary') or (cd_education_status = 'Advanced Degree'))) and cd_demo_sk is not null) (type: boolean) - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:customer_demographics - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_15] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 1874 Data size: 3581903 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col2 (type: int), _col3 (type: int), _col5 (type: int), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)), _col9 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_69] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col4 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col1","_col2","_col3","_col5","_col6","_col7","_col8","_col9"] - | Statistics:Num rows: 1874 Data size: 3581903 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col4 (type: int) - | Map-reduce partition columns:_col4 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col5 (type: int), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)), _col9 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_63] - | predicate:(((((((ss_sales_price BETWEEN 100.0 AND 150.0 or ss_sales_price BETWEEN 50.0 AND 100.0 or ss_sales_price BETWEEN 150.0 AND 200.0) and (ss_net_profit BETWEEN 100 AND 200 or ss_net_profit BETWEEN 150 AND 300 or ss_net_profit BETWEEN 50 AND 250)) and ss_store_sk is not null) and ss_cdemo_sk is not null) and ss_hdemo_sk is not null) and ss_addr_sk is not null) and ss_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_13] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_64] - predicate:s_store_sk is not null (type: boolean) - Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:store - Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 7 + File Output Operator [FS_42] + Group By Operator [GBY_40] (rows=1 width=344) + Output:["_col0","_col1","_col2","_col3"],aggregations:["avg(VALUE._col0)","avg(VALUE._col1)","avg(VALUE._col2)","sum(VALUE._col3)"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_39] + Group By Operator [GBY_38] (rows=1 width=112) + Output:["_col0","_col1","_col2","_col3"],aggregations:["avg(_col5)","avg(_col7)","avg(_col8)","sum(_col8)"] + Merge Join Operator [MERGEJOIN_73] (rows=18150000 width=1014) + Conds:RS_34._col0=RS_35._col0(Inner),Output:["_col5","_col7","_col8"] + <-Map 12 [SIMPLE_EDGE] + SHUFFLE [RS_35] + PartitionCols:_col0 + Select Operator [SEL_33] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_68] (rows=36524 width=1119) + predicate:((d_year = 2001) and d_date_sk is not null) + TableScan [TS_31] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_34] + PartitionCols:_col0 + Select Operator [SEL_30] (rows=16500000 width=1014) + Output:["_col0","_col5","_col7","_col8"] + Filter Operator [FIL_29] (rows=16500000 width=1014) + predicate:(((_col17) IN ('KY', 'GA', 'NM') and _col9 BETWEEN 100 AND 200) or ((_col17) IN ('MT', 'OR', 'IN') and _col9 BETWEEN 150 AND 300) or ((_col17) IN ('WI', 'MO', 'WV') and _col9 BETWEEN 50 AND 250)) + Merge Join Operator [MERGEJOIN_72] (rows=22000000 width=1014) + Conds:RS_26._col3=RS_27._col0(Inner),Output:["_col0","_col5","_col7","_col8","_col9","_col17"] + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_27] + PartitionCols:_col0 + Select Operator [SEL_25] (rows=20000000 width=1014) + Output:["_col0","_col1"] + Filter Operator [FIL_67] (rows=20000000 width=1014) + predicate:((((ca_state) IN ('KY', 'GA', 'NM') or (ca_state) IN ('MT', 'OR', 'IN') or (ca_state) IN ('WI', 'MO', 'WV')) and (ca_country = 'United States')) and ca_address_sk is not null) + TableScan [TS_23] (rows=40000000 width=1014) + default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_state","ca_country"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_26] + PartitionCols:_col3 + Select Operator [SEL_22] (rows=4491 width=362) + Output:["_col0","_col3","_col5","_col7","_col8","_col9"] + Filter Operator [FIL_21] (rows=4491 width=362) + predicate:(((_col12 = 'M') and (_col13 = '4 yr Degree') and _col6 BETWEEN 100.0 AND 150.0 and (_col15 = 3)) or ((_col12 = 'D') and (_col13 = 'Primary') and _col6 BETWEEN 50.0 AND 100.0 and (_col15 = 1)) or ((_col12 = 'U') and (_col13 = 'Advanced Degree') and _col6 BETWEEN 150.0 AND 200.0 and (_col15 = 1))) + Merge Join Operator [MERGEJOIN_71] (rows=23958 width=362) + Conds:RS_18._col2=RS_19._col0(Inner),Output:["_col0","_col3","_col5","_col6","_col7","_col8","_col9","_col12","_col13","_col15"] + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=7200 width=107) + Output:["_col0","_col1"] + Filter Operator [FIL_66] (rows=7200 width=107) + predicate:(((hd_dep_count = 3) or (hd_dep_count = 1)) and hd_demo_sk is not null) + TableScan [TS_9] (rows=7200 width=107) + default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_dep_count"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_70] (rows=21780 width=362) + Conds:RS_15._col1=RS_16._col0(Inner),Output:["_col0","_col2","_col3","_col5","_col6","_col7","_col8","_col9","_col12","_col13"] + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=19800 width=362) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_65] (rows=19800 width=362) + predicate:((((cd_marital_status = 'M') or (cd_marital_status = 'D') or (cd_marital_status = 'U')) and ((cd_education_status = '4 yr Degree') or (cd_education_status = 'Primary') or (cd_education_status = 'Advanced Degree'))) and cd_demo_sk is not null) + TableScan [TS_6] (rows=19800 width=362) + default@customer_demographics,customer_demographics,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_marital_status","cd_education_status"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_69] (rows=1874 width=1911) + Conds:RS_12._col4=RS_13._col0(Inner),Output:["_col0","_col1","_col2","_col3","_col5","_col6","_col7","_col8","_col9"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col4 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] + Filter Operator [FIL_63] (rows=1 width=0) + predicate:(((((((ss_sales_price BETWEEN 100.0 AND 150.0 or ss_sales_price BETWEEN 50.0 AND 100.0 or ss_sales_price BETWEEN 150.0 AND 200.0) and (ss_net_profit BETWEEN 100 AND 200 or ss_net_profit BETWEEN 150 AND 300 or ss_net_profit BETWEEN 50 AND 250)) and ss_store_sk is not null) and ss_cdemo_sk is not null) and ss_hdemo_sk is not null) and ss_addr_sk is not null) and ss_sold_date_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_cdemo_sk","ss_hdemo_sk","ss_addr_sk","ss_store_sk","ss_quantity","ss_sales_price","ss_ext_sales_price","ss_ext_wholesale_cost","ss_net_profit"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=1704 width=1910) + Output:["_col0"] + Filter Operator [FIL_64] (rows=1704 width=1910) + predicate:s_store_sk is not null + TableScan [TS_3] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk"] http://git-wip-us.apache.org/repos/asf/hive/blob/be9735e1/ql/src/test/results/clientpositive/perf/query15.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/perf/query15.q.out b/ql/src/test/results/clientpositive/perf/query15.q.out index c237828..e8c06ad 100644 --- a/ql/src/test/results/clientpositive/perf/query15.q.out +++ b/ql/src/test/results/clientpositive/perf/query15.q.out @@ -12,142 +12,76 @@ Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 6 - File Output Operator [FS_31] - compressed:false - Statistics:Num rows: 100 Data size: 86000 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_30] - Number of rows:100 - Statistics:Num rows: 100 Data size: 86000 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_29] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 53240002 Data size: 45787477895 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_28] - key expressions:_col0 (type: string) - sort order:+ - Statistics:Num rows: 53240002 Data size: 45787477895 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: decimal(17,2)) - Group By Operator [GBY_26] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 53240002 Data size: 45787477895 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_25] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 106480005 Data size: 91574956652 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: decimal(17,2)) - Group By Operator [GBY_24] - aggregations:["sum(_col2)"] - keys:_col7 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 106480005 Data size: 91574956652 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_23] - outputColumnNames:["_col7","_col2"] - Statistics:Num rows: 106480005 Data size: 91574956652 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_47] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col2","_col7"] - | Statistics:Num rows: 106480005 Data size: 91574956652 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_21] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_19] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_44] - | predicate:(((d_qoy = 2) and (d_year = 2000)) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_17] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_20] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: decimal(7,2)), _col7 (type: string) - Select Operator [SEL_16] - outputColumnNames:["_col0","_col2","_col7"] - Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_15] - predicate:((substr(_col7, 1, 5)) IN ('85669', '86197', '88274', '83405', '86475', '85392', '85460', '80348', '81792') or (_col6) IN ('CA', 'WA', 'GA') or (_col2 > 500)) (type: boolean) - Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_46] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col4 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col6","_col7"] - | Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - | Reduce Output Operator [RS_13] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_43] - | predicate:ca_address_sk is not null (type: boolean) - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:customer_address - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_12] - key expressions:_col4 (type: int) - Map-reduce partition columns:_col4 (type: int) - sort order:+ - Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col2 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_45] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col4"] - | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col2 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_41] - | predicate:(cs_bill_customer_sk is not null and cs_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:catalog_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_42] - predicate:(c_customer_sk is not null and c_current_addr_sk is not null) (type: boolean) - Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:customer - Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 6 + File Output Operator [FS_31] + Limit [LIM_30] (rows=100 width=860) + Number of rows:100 + Select Operator [SEL_29] (rows=53240002 width=860) + Output:["_col0","_col1"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_28] + Group By Operator [GBY_26] (rows=53240002 width=860) + Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0 + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col0 + Group By Operator [GBY_24] (rows=106480005 width=860) + Output:["_col0","_col1"],aggregations:["sum(_col2)"],keys:_col7 + Select Operator [SEL_23] (rows=106480005 width=860) + Output:["_col7","_col2"] + Merge Join Operator [MERGEJOIN_47] (rows=106480005 width=860) + Conds:RS_20._col0=RS_21._col0(Inner),Output:["_col2","_col7"] + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col0 + Select Operator [SEL_19] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_44] (rows=18262 width=1119) + predicate:(((d_qoy = 2) and (d_year = 2000)) and d_date_sk is not null) + TableScan [TS_17] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_qoy"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_20] + PartitionCols:_col0 + Select Operator [SEL_16] (rows=96800003 width=860) + Output:["_col0","_col2","_col7"] + Filter Operator [FIL_15] (rows=96800003 width=860) + predicate:((substr(_col7, 1, 5)) IN ('85669', '86197', '88274', '83405', '86475', '85392', '85460', '80348', '81792') or (_col6) IN ('CA', 'WA', 'GA') or (_col2 > 500)) + Merge Join Operator [MERGEJOIN_46] (rows=96800003 width=860) + Conds:RS_12._col4=RS_13._col0(Inner),Output:["_col0","_col2","_col6","_col7"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=40000000 width=1014) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_43] (rows=40000000 width=1014) + predicate:ca_address_sk is not null + TableScan [TS_6] (rows=40000000 width=1014) + default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_state","ca_zip"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col4 + Merge Join Operator [MERGEJOIN_45] (rows=88000001 width=860) + Conds:RS_9._col1=RS_10._col0(Inner),Output:["_col0","_col2","_col4"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col1 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_41] (rows=1 width=0) + predicate:(cs_bill_customer_sk is not null and cs_sold_date_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@catalog_sales,catalog_sales,Tbl:PARTIAL,Col:NONE,Output:["cs_sold_date_sk","cs_bill_customer_sk","cs_sales_price"] + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=80000000 width=860) + Output:["_col0","_col1"] + Filter Operator [FIL_42] (rows=80000000 width=860) + predicate:(c_customer_sk is not null and c_current_addr_sk is not null) + TableScan [TS_3] (rows=80000000 width=860) + default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_current_addr_sk"]