HIVE-10628: Incorrect result when vectorized native mapjoin is enabled using 
null safe operators <=> (Matt McCline reviewed by Jason Dere)


Project: http://git-wip-us.apache.org/repos/asf/hive/repo
Commit: http://git-wip-us.apache.org/repos/asf/hive/commit/4a2a2bcd
Tree: http://git-wip-us.apache.org/repos/asf/hive/tree/4a2a2bcd
Diff: http://git-wip-us.apache.org/repos/asf/hive/diff/4a2a2bcd

Branch: refs/heads/master
Commit: 4a2a2bcd0202e2b4d3ee5eb2548d288b9c5b6881
Parents: 312711b
Author: Prasanth Jayachandran <j.prasant...@gmail.com>
Authored: Tue May 19 17:12:09 2015 -0700
Committer: Prasanth Jayachandran <j.prasant...@gmail.com>
Committed: Tue May 19 17:12:09 2015 -0700

----------------------------------------------------------------------
 .../test/resources/testconfiguration.properties |    1 +
 .../hive/ql/optimizer/physical/Vectorizer.java  |   12 +-
 .../clientpositive/vector_nullsafe_join.q       |   72 ++
 .../tez/vector_nullsafe_join.q.out              | 1210 ++++++++++++++++++
 .../clientpositive/vector_nullsafe_join.q.out   | 1208 +++++++++++++++++
 5 files changed, 2502 insertions(+), 1 deletion(-)
----------------------------------------------------------------------


http://git-wip-us.apache.org/repos/asf/hive/blob/4a2a2bcd/itests/src/test/resources/testconfiguration.properties
----------------------------------------------------------------------
diff --git a/itests/src/test/resources/testconfiguration.properties 
b/itests/src/test/resources/testconfiguration.properties
index c79c36c..a485408 100644
--- a/itests/src/test/resources/testconfiguration.properties
+++ b/itests/src/test/resources/testconfiguration.properties
@@ -233,6 +233,7 @@ minitez.query.files.shared=alter_merge_2_orc.q,\
   vector_mr_diff_schema_alias.q,\
   vector_multi_insert.q,\
   vector_non_string_partition.q,\
+  vector_nullsafe_join.q,\
   vector_orderby_5.q,\
   vector_outer_join0.q,\
   vector_outer_join1.q,\

http://git-wip-us.apache.org/repos/asf/hive/blob/4a2a2bcd/ql/src/java/org/apache/hadoop/hive/ql/optimizer/physical/Vectorizer.java
----------------------------------------------------------------------
diff --git 
a/ql/src/java/org/apache/hadoop/hive/ql/optimizer/physical/Vectorizer.java 
b/ql/src/java/org/apache/hadoop/hive/ql/optimizer/physical/Vectorizer.java
index 705b185..b429c56 100644
--- a/ql/src/java/org/apache/hadoop/hive/ql/optimizer/physical/Vectorizer.java
+++ b/ql/src/java/org/apache/hadoop/hive/ql/optimizer/physical/Vectorizer.java
@@ -1552,6 +1552,16 @@ public class Vectorizer implements PhysicalPlanResolver {
     return vectorOp;
   }
 
+  private boolean onExpressionHasNullSafes(MapJoinDesc desc) {
+    boolean[] nullSafes = desc.getNullSafes();
+    for (boolean nullSafe : nullSafes) {
+      if (nullSafe) {
+        return true;
+      }
+    }
+    return false;
+  }
+
   private boolean canSpecializeMapJoin(Operator<? extends OperatorDesc> op, 
MapJoinDesc desc,
       boolean isTez) {
 
@@ -1562,7 +1572,7 @@ public class Vectorizer implements PhysicalPlanResolver {
             HiveConf.ConfVars.HIVE_VECTORIZATION_MAPJOIN_NATIVE_ENABLED)) {
 
       // Currently, only under Tez and non-N-way joins.
-      if (isTez && desc.getConds().length == 1) {
+      if (isTez && desc.getConds().length == 1 && 
!onExpressionHasNullSafes(desc)) {
 
         // Ok, all basic restrictions satisfied so far...
         specialize = true;

http://git-wip-us.apache.org/repos/asf/hive/blob/4a2a2bcd/ql/src/test/queries/clientpositive/vector_nullsafe_join.q
----------------------------------------------------------------------
diff --git a/ql/src/test/queries/clientpositive/vector_nullsafe_join.q 
b/ql/src/test/queries/clientpositive/vector_nullsafe_join.q
new file mode 100644
index 0000000..316b2a6
--- /dev/null
+++ b/ql/src/test/queries/clientpositive/vector_nullsafe_join.q
@@ -0,0 +1,72 @@
+SET hive.vectorized.execution.enabled=true;
+SET hive.auto.convert.join=true;
+
+-- SORT_QUERY_RESULTS
+--
+-- We currently do not support null safes (i.e the <=> operator) in native 
vector map join.
+-- The explain output will show vectorized execution for both.  We verify the 
query
+-- results are the same (HIVE-10628 shows native will produce the wrong results
+-- otherwise).
+--
+-- This query for "HIVE-3315 join predicate transitive" triggers HIVE-10640-
+-- explain select * from myinput1 a join myinput1 b on a.key<=>b.value AND 
a.key is NULL;
+-- select * from myinput1 a join myinput1 b on a.key<=>b.value AND a.key is 
NULL;
+--
+CREATE TABLE myinput1_txt(key int, value int);
+LOAD DATA LOCAL INPATH '../../data/files/in8.txt' INTO TABLE myinput1_txt;
+CREATE TABLE myinput1 STORED AS ORC AS SELECT * FROM myinput1_txt;
+
+SET hive.vectorized.execution.mapjoin.native.enabled=false;
+
+-- merging
+explain select * from myinput1 a join myinput1 b on a.key<=>b.value;
+select * from myinput1 a join myinput1 b on a.key<=>b.value;
+
+explain select * from myinput1 a join myinput1 b on a.key<=>b.value join 
myinput1 c on a.key=c.key;
+select * from myinput1 a join myinput1 b on a.key<=>b.value join myinput1 c on 
a.key=c.key;
+
+explain select * from myinput1 a join myinput1 b on a.key<=>b.value join 
myinput1 c on a.key<=>c.key;
+select * from myinput1 a join myinput1 b on a.key<=>b.value join myinput1 c on 
a.key<=>c.key;
+
+explain select * from myinput1 a join myinput1 b on a.key<=>b.value AND 
a.value=b.key join myinput1 c on a.key<=>c.key AND a.value=c.value;
+select * from myinput1 a join myinput1 b on a.key<=>b.value AND a.value=b.key 
join myinput1 c on a.key<=>c.key AND a.value=c.value;
+
+explain select * from myinput1 a join myinput1 b on a.key<=>b.value AND 
a.value<=>b.key join myinput1 c on a.key<=>c.key AND a.value<=>c.value;
+select * from myinput1 a join myinput1 b on a.key<=>b.value AND 
a.value<=>b.key join myinput1 c on a.key<=>c.key AND a.value<=>c.value;
+
+-- outer joins
+SELECT * FROM myinput1 a LEFT OUTER JOIN myinput1 b ON a.key<=>b.value;
+SELECT * FROM myinput1 a RIGHT OUTER JOIN myinput1 b ON a.key<=>b.value;
+SELECT * FROM myinput1 a FULL OUTER JOIN myinput1 b ON a.key<=>b.value;
+
+-- map joins
+SELECT /*+ MAPJOIN(a) */ * FROM myinput1 a JOIN myinput1 b ON a.key<=>b.value;
+SELECT /*+ MAPJOIN(b) */ * FROM myinput1 a JOIN myinput1 b ON a.key<=>b.value;
+
+SET hive.vectorized.execution.mapjoin.native.enabled=true;
+
+-- merging
+explain select * from myinput1 a join myinput1 b on a.key<=>b.value;
+select * from myinput1 a join myinput1 b on a.key<=>b.value;
+
+explain select * from myinput1 a join myinput1 b on a.key<=>b.value join 
myinput1 c on a.key=c.key;
+select * from myinput1 a join myinput1 b on a.key<=>b.value join myinput1 c on 
a.key=c.key;
+
+explain select * from myinput1 a join myinput1 b on a.key<=>b.value join 
myinput1 c on a.key<=>c.key;
+select * from myinput1 a join myinput1 b on a.key<=>b.value join myinput1 c on 
a.key<=>c.key;
+
+explain select * from myinput1 a join myinput1 b on a.key<=>b.value AND 
a.value=b.key join myinput1 c on a.key<=>c.key AND a.value=c.value;
+select * from myinput1 a join myinput1 b on a.key<=>b.value AND a.value=b.key 
join myinput1 c on a.key<=>c.key AND a.value=c.value;
+
+explain select * from myinput1 a join myinput1 b on a.key<=>b.value AND 
a.value<=>b.key join myinput1 c on a.key<=>c.key AND a.value<=>c.value;
+select * from myinput1 a join myinput1 b on a.key<=>b.value AND 
a.value<=>b.key join myinput1 c on a.key<=>c.key AND a.value<=>c.value;
+
+-- outer joins
+SELECT * FROM myinput1 a LEFT OUTER JOIN myinput1 b ON a.key<=>b.value;
+SELECT * FROM myinput1 a RIGHT OUTER JOIN myinput1 b ON a.key<=>b.value;
+SELECT * FROM myinput1 a FULL OUTER JOIN myinput1 b ON a.key<=>b.value;
+
+-- map joins
+SELECT /*+ MAPJOIN(a) */ * FROM myinput1 a JOIN myinput1 b ON a.key<=>b.value;
+SELECT /*+ MAPJOIN(b) */ * FROM myinput1 a JOIN myinput1 b ON a.key<=>b.value;
+

http://git-wip-us.apache.org/repos/asf/hive/blob/4a2a2bcd/ql/src/test/results/clientpositive/tez/vector_nullsafe_join.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/tez/vector_nullsafe_join.q.out 
b/ql/src/test/results/clientpositive/tez/vector_nullsafe_join.q.out
new file mode 100644
index 0000000..db170a9
--- /dev/null
+++ b/ql/src/test/results/clientpositive/tez/vector_nullsafe_join.q.out
@@ -0,0 +1,1210 @@
+PREHOOK: query: -- SORT_QUERY_RESULTS
+--
+-- We currently do not support null safes (i.e the <=> operator) in native 
vector map join.
+-- The explain output will show vectorized execution for both.  We verify the 
query
+-- results are the same (HIVE-10628 shows native will produce the wrong results
+-- otherwise).
+--
+-- This query for "HIVE-3315 join predicate transitive" triggers HIVE-10640-
+-- explain select * from myinput1 a join myinput1 b on a.key<=>b.value AND 
a.key is NULL;
+-- select * from myinput1 a join myinput1 b on a.key<=>b.value AND a.key is 
NULL;
+--
+CREATE TABLE myinput1_txt(key int, value int)
+PREHOOK: type: CREATETABLE
+PREHOOK: Output: database:default
+PREHOOK: Output: default@myinput1_txt
+POSTHOOK: query: -- SORT_QUERY_RESULTS
+--
+-- We currently do not support null safes (i.e the <=> operator) in native 
vector map join.
+-- The explain output will show vectorized execution for both.  We verify the 
query
+-- results are the same (HIVE-10628 shows native will produce the wrong results
+-- otherwise).
+--
+-- This query for "HIVE-3315 join predicate transitive" triggers HIVE-10640-
+-- explain select * from myinput1 a join myinput1 b on a.key<=>b.value AND 
a.key is NULL;
+-- select * from myinput1 a join myinput1 b on a.key<=>b.value AND a.key is 
NULL;
+--
+CREATE TABLE myinput1_txt(key int, value int)
+POSTHOOK: type: CREATETABLE
+POSTHOOK: Output: database:default
+POSTHOOK: Output: default@myinput1_txt
+PREHOOK: query: LOAD DATA LOCAL INPATH '../../data/files/in8.txt' INTO TABLE 
myinput1_txt
+PREHOOK: type: LOAD
+#### A masked pattern was here ####
+PREHOOK: Output: default@myinput1_txt
+POSTHOOK: query: LOAD DATA LOCAL INPATH '../../data/files/in8.txt' INTO TABLE 
myinput1_txt
+POSTHOOK: type: LOAD
+#### A masked pattern was here ####
+POSTHOOK: Output: default@myinput1_txt
+PREHOOK: query: CREATE TABLE myinput1 STORED AS ORC AS SELECT * FROM 
myinput1_txt
+PREHOOK: type: CREATETABLE_AS_SELECT
+PREHOOK: Input: default@myinput1_txt
+PREHOOK: Output: database:default
+PREHOOK: Output: default@myinput1
+POSTHOOK: query: CREATE TABLE myinput1 STORED AS ORC AS SELECT * FROM 
myinput1_txt
+POSTHOOK: type: CREATETABLE_AS_SELECT
+POSTHOOK: Input: default@myinput1_txt
+POSTHOOK: Output: database:default
+POSTHOOK: Output: default@myinput1
+PREHOOK: query: -- merging
+explain select * from myinput1 a join myinput1 b on a.key<=>b.value
+PREHOOK: type: QUERY
+POSTHOOK: query: -- merging
+explain select * from myinput1 a join myinput1 b on a.key<=>b.value
+POSTHOOK: type: QUERY
+STAGE DEPENDENCIES:
+  Stage-1 is a root stage
+  Stage-0 depends on stages: Stage-1
+
+STAGE PLANS:
+  Stage: Stage-1
+    Tez
+      Edges:
+        Map 1 <- Map 2 (BROADCAST_EDGE)
+#### A masked pattern was here ####
+      Vertices:
+        Map 1 
+            Map Operator Tree:
+                TableScan
+                  alias: a
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Map Join Operator
+                    condition map:
+                         Inner Join 0 to 1
+                    keys:
+                      0 key (type: int)
+                      1 value (type: int)
+                    nullSafes: [true]
+                    outputColumnNames: _col0, _col1, _col5, _col6
+                    input vertices:
+                      1 Map 2
+                    Statistics: Num rows: 6 Data size: 26 Basic stats: 
COMPLETE Column stats: NONE
+                    HybridGraceHashJoin: true
+                    Select Operator
+                      expressions: _col0 (type: int), _col1 (type: int), _col5 
(type: int), _col6 (type: int)
+                      outputColumnNames: _col0, _col1, _col2, _col3
+                      Statistics: Num rows: 6 Data size: 26 Basic stats: 
COMPLETE Column stats: NONE
+                      File Output Operator
+                        compressed: false
+                        Statistics: Num rows: 6 Data size: 26 Basic stats: 
COMPLETE Column stats: NONE
+                        table:
+                            input format: 
org.apache.hadoop.mapred.TextInputFormat
+                            output format: 
org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
+                            serde: 
org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+            Execution mode: vectorized
+        Map 2 
+            Map Operator Tree:
+                TableScan
+                  alias: b
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Reduce Output Operator
+                    key expressions: value (type: int)
+                    sort order: +
+                    Map-reduce partition columns: value (type: int)
+                    Statistics: Num rows: 6 Data size: 24 Basic stats: 
COMPLETE Column stats: NONE
+                    value expressions: key (type: int)
+            Execution mode: vectorized
+
+  Stage: Stage-0
+    Fetch Operator
+      limit: -1
+      Processor Tree:
+        ListSink
+
+PREHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10     NULL    NULL    10
+100    100     100     100
+NULL   10      10      NULL
+NULL   10      48      NULL
+NULL   10      NULL    NULL
+NULL   35      10      NULL
+NULL   35      48      NULL
+NULL   35      NULL    NULL
+NULL   NULL    10      NULL
+NULL   NULL    48      NULL
+NULL   NULL    NULL    NULL
+PREHOOK: query: explain select * from myinput1 a join myinput1 b on 
a.key<=>b.value join myinput1 c on a.key=c.key
+PREHOOK: type: QUERY
+POSTHOOK: query: explain select * from myinput1 a join myinput1 b on 
a.key<=>b.value join myinput1 c on a.key=c.key
+POSTHOOK: type: QUERY
+STAGE DEPENDENCIES:
+  Stage-1 is a root stage
+  Stage-0 depends on stages: Stage-1
+
+STAGE PLANS:
+  Stage: Stage-1
+    Tez
+      Edges:
+        Map 1 <- Map 2 (BROADCAST_EDGE), Map 3 (BROADCAST_EDGE)
+#### A masked pattern was here ####
+      Vertices:
+        Map 1 
+            Map Operator Tree:
+                TableScan
+                  alias: a
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Filter Operator
+                    predicate: key is not null (type: boolean)
+                    Statistics: Num rows: 3 Data size: 12 Basic stats: 
COMPLETE Column stats: NONE
+                    Map Join Operator
+                      condition map:
+                           Inner Join 0 to 1
+                           Inner Join 0 to 2
+                      keys:
+                        0 key (type: int)
+                        1 value (type: int)
+                        2 key (type: int)
+                      outputColumnNames: _col0, _col1, _col5, _col6, _col10, 
_col11
+                      input vertices:
+                        1 Map 2
+                        2 Map 3
+                      Statistics: Num rows: 6 Data size: 26 Basic stats: 
COMPLETE Column stats: NONE
+                      HybridGraceHashJoin: true
+                      Select Operator
+                        expressions: _col0 (type: int), _col1 (type: int), 
_col5 (type: int), _col6 (type: int), _col10 (type: int), _col11 (type: int)
+                        outputColumnNames: _col0, _col1, _col2, _col3, _col4, 
_col5
+                        Statistics: Num rows: 6 Data size: 26 Basic stats: 
COMPLETE Column stats: NONE
+                        File Output Operator
+                          compressed: false
+                          Statistics: Num rows: 6 Data size: 26 Basic stats: 
COMPLETE Column stats: NONE
+                          table:
+                              input format: 
org.apache.hadoop.mapred.TextInputFormat
+                              output format: 
org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
+                              serde: 
org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+            Execution mode: vectorized
+        Map 2 
+            Map Operator Tree:
+                TableScan
+                  alias: b
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Filter Operator
+                    predicate: value is not null (type: boolean)
+                    Statistics: Num rows: 3 Data size: 12 Basic stats: 
COMPLETE Column stats: NONE
+                    Reduce Output Operator
+                      key expressions: value (type: int)
+                      sort order: +
+                      Map-reduce partition columns: value (type: int)
+                      Statistics: Num rows: 3 Data size: 12 Basic stats: 
COMPLETE Column stats: NONE
+                      value expressions: key (type: int)
+            Execution mode: vectorized
+        Map 3 
+            Map Operator Tree:
+                TableScan
+                  alias: c
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Filter Operator
+                    predicate: key is not null (type: boolean)
+                    Statistics: Num rows: 3 Data size: 12 Basic stats: 
COMPLETE Column stats: NONE
+                    Reduce Output Operator
+                      key expressions: key (type: int)
+                      sort order: +
+                      Map-reduce partition columns: key (type: int)
+                      Statistics: Num rows: 3 Data size: 12 Basic stats: 
COMPLETE Column stats: NONE
+                      value expressions: value (type: int)
+            Execution mode: vectorized
+
+  Stage: Stage-0
+    Fetch Operator
+      limit: -1
+      Processor Tree:
+        ListSink
+
+PREHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value 
join myinput1 c on a.key=c.key
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value 
join myinput1 c on a.key=c.key
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10     NULL    NULL    10      10      NULL
+100    100     100     100     100     100
+PREHOOK: query: explain select * from myinput1 a join myinput1 b on 
a.key<=>b.value join myinput1 c on a.key<=>c.key
+PREHOOK: type: QUERY
+POSTHOOK: query: explain select * from myinput1 a join myinput1 b on 
a.key<=>b.value join myinput1 c on a.key<=>c.key
+POSTHOOK: type: QUERY
+STAGE DEPENDENCIES:
+  Stage-1 is a root stage
+  Stage-0 depends on stages: Stage-1
+
+STAGE PLANS:
+  Stage: Stage-1
+    Tez
+      Edges:
+        Map 1 <- Map 2 (BROADCAST_EDGE), Map 3 (BROADCAST_EDGE)
+#### A masked pattern was here ####
+      Vertices:
+        Map 1 
+            Map Operator Tree:
+                TableScan
+                  alias: a
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Map Join Operator
+                    condition map:
+                         Inner Join 0 to 1
+                         Inner Join 0 to 2
+                    keys:
+                      0 key (type: int)
+                      1 value (type: int)
+                      2 key (type: int)
+                    nullSafes: [true]
+                    outputColumnNames: _col0, _col1, _col5, _col6, _col10, 
_col11
+                    input vertices:
+                      1 Map 2
+                      2 Map 3
+                    Statistics: Num rows: 13 Data size: 52 Basic stats: 
COMPLETE Column stats: NONE
+                    HybridGraceHashJoin: true
+                    Select Operator
+                      expressions: _col0 (type: int), _col1 (type: int), _col5 
(type: int), _col6 (type: int), _col10 (type: int), _col11 (type: int)
+                      outputColumnNames: _col0, _col1, _col2, _col3, _col4, 
_col5
+                      Statistics: Num rows: 13 Data size: 52 Basic stats: 
COMPLETE Column stats: NONE
+                      File Output Operator
+                        compressed: false
+                        Statistics: Num rows: 13 Data size: 52 Basic stats: 
COMPLETE Column stats: NONE
+                        table:
+                            input format: 
org.apache.hadoop.mapred.TextInputFormat
+                            output format: 
org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
+                            serde: 
org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+            Execution mode: vectorized
+        Map 2 
+            Map Operator Tree:
+                TableScan
+                  alias: b
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Reduce Output Operator
+                    key expressions: value (type: int)
+                    sort order: +
+                    Map-reduce partition columns: value (type: int)
+                    Statistics: Num rows: 6 Data size: 24 Basic stats: 
COMPLETE Column stats: NONE
+                    value expressions: key (type: int)
+            Execution mode: vectorized
+        Map 3 
+            Map Operator Tree:
+                TableScan
+                  alias: c
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Reduce Output Operator
+                    key expressions: key (type: int)
+                    sort order: +
+                    Map-reduce partition columns: key (type: int)
+                    Statistics: Num rows: 6 Data size: 24 Basic stats: 
COMPLETE Column stats: NONE
+                    value expressions: value (type: int)
+            Execution mode: vectorized
+
+  Stage: Stage-0
+    Fetch Operator
+      limit: -1
+      Processor Tree:
+        ListSink
+
+PREHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value 
join myinput1 c on a.key<=>c.key
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value 
join myinput1 c on a.key<=>c.key
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10     NULL    NULL    10      10      NULL
+100    100     100     100     100     100
+NULL   10      10      NULL    NULL    10
+NULL   10      10      NULL    NULL    35
+NULL   10      10      NULL    NULL    NULL
+NULL   10      48      NULL    NULL    10
+NULL   10      48      NULL    NULL    35
+NULL   10      48      NULL    NULL    NULL
+NULL   10      NULL    NULL    NULL    10
+NULL   10      NULL    NULL    NULL    35
+NULL   10      NULL    NULL    NULL    NULL
+NULL   35      10      NULL    NULL    10
+NULL   35      10      NULL    NULL    35
+NULL   35      10      NULL    NULL    NULL
+NULL   35      48      NULL    NULL    10
+NULL   35      48      NULL    NULL    35
+NULL   35      48      NULL    NULL    NULL
+NULL   35      NULL    NULL    NULL    10
+NULL   35      NULL    NULL    NULL    35
+NULL   35      NULL    NULL    NULL    NULL
+NULL   NULL    10      NULL    NULL    10
+NULL   NULL    10      NULL    NULL    35
+NULL   NULL    10      NULL    NULL    NULL
+NULL   NULL    48      NULL    NULL    10
+NULL   NULL    48      NULL    NULL    35
+NULL   NULL    48      NULL    NULL    NULL
+NULL   NULL    NULL    NULL    NULL    10
+NULL   NULL    NULL    NULL    NULL    35
+NULL   NULL    NULL    NULL    NULL    NULL
+PREHOOK: query: explain select * from myinput1 a join myinput1 b on 
a.key<=>b.value AND a.value=b.key join myinput1 c on a.key<=>c.key AND 
a.value=c.value
+PREHOOK: type: QUERY
+POSTHOOK: query: explain select * from myinput1 a join myinput1 b on 
a.key<=>b.value AND a.value=b.key join myinput1 c on a.key<=>c.key AND 
a.value=c.value
+POSTHOOK: type: QUERY
+STAGE DEPENDENCIES:
+  Stage-1 is a root stage
+  Stage-0 depends on stages: Stage-1
+
+STAGE PLANS:
+  Stage: Stage-1
+    Tez
+      Edges:
+        Map 1 <- Map 2 (BROADCAST_EDGE), Map 3 (BROADCAST_EDGE)
+#### A masked pattern was here ####
+      Vertices:
+        Map 1 
+            Map Operator Tree:
+                TableScan
+                  alias: a
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Filter Operator
+                    predicate: value is not null (type: boolean)
+                    Statistics: Num rows: 3 Data size: 12 Basic stats: 
COMPLETE Column stats: NONE
+                    Map Join Operator
+                      condition map:
+                           Inner Join 0 to 1
+                           Inner Join 0 to 2
+                      keys:
+                        0 key (type: int), value (type: int)
+                        1 value (type: int), key (type: int)
+                        2 key (type: int), value (type: int)
+                      nullSafes: [true, false]
+                      outputColumnNames: _col0, _col1, _col5, _col6, _col10, 
_col11
+                      input vertices:
+                        1 Map 2
+                        2 Map 3
+                      Statistics: Num rows: 6 Data size: 26 Basic stats: 
COMPLETE Column stats: NONE
+                      HybridGraceHashJoin: true
+                      Select Operator
+                        expressions: _col0 (type: int), _col1 (type: int), 
_col5 (type: int), _col6 (type: int), _col10 (type: int), _col11 (type: int)
+                        outputColumnNames: _col0, _col1, _col2, _col3, _col4, 
_col5
+                        Statistics: Num rows: 6 Data size: 26 Basic stats: 
COMPLETE Column stats: NONE
+                        File Output Operator
+                          compressed: false
+                          Statistics: Num rows: 6 Data size: 26 Basic stats: 
COMPLETE Column stats: NONE
+                          table:
+                              input format: 
org.apache.hadoop.mapred.TextInputFormat
+                              output format: 
org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
+                              serde: 
org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+            Execution mode: vectorized
+        Map 2 
+            Map Operator Tree:
+                TableScan
+                  alias: b
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Filter Operator
+                    predicate: key is not null (type: boolean)
+                    Statistics: Num rows: 3 Data size: 12 Basic stats: 
COMPLETE Column stats: NONE
+                    Reduce Output Operator
+                      key expressions: value (type: int), key (type: int)
+                      sort order: ++
+                      Map-reduce partition columns: value (type: int), key 
(type: int)
+                      Statistics: Num rows: 3 Data size: 12 Basic stats: 
COMPLETE Column stats: NONE
+            Execution mode: vectorized
+        Map 3 
+            Map Operator Tree:
+                TableScan
+                  alias: c
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Filter Operator
+                    predicate: value is not null (type: boolean)
+                    Statistics: Num rows: 3 Data size: 12 Basic stats: 
COMPLETE Column stats: NONE
+                    Reduce Output Operator
+                      key expressions: key (type: int), value (type: int)
+                      sort order: ++
+                      Map-reduce partition columns: key (type: int), value 
(type: int)
+                      Statistics: Num rows: 3 Data size: 12 Basic stats: 
COMPLETE Column stats: NONE
+            Execution mode: vectorized
+
+  Stage: Stage-0
+    Fetch Operator
+      limit: -1
+      Processor Tree:
+        ListSink
+
+PREHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value 
AND a.value=b.key join myinput1 c on a.key<=>c.key AND a.value=c.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value 
AND a.value=b.key join myinput1 c on a.key<=>c.key AND a.value=c.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+100    100     100     100     100     100
+NULL   10      10      NULL    NULL    10
+PREHOOK: query: explain select * from myinput1 a join myinput1 b on 
a.key<=>b.value AND a.value<=>b.key join myinput1 c on a.key<=>c.key AND 
a.value<=>c.value
+PREHOOK: type: QUERY
+POSTHOOK: query: explain select * from myinput1 a join myinput1 b on 
a.key<=>b.value AND a.value<=>b.key join myinput1 c on a.key<=>c.key AND 
a.value<=>c.value
+POSTHOOK: type: QUERY
+STAGE DEPENDENCIES:
+  Stage-1 is a root stage
+  Stage-0 depends on stages: Stage-1
+
+STAGE PLANS:
+  Stage: Stage-1
+    Tez
+      Edges:
+        Map 1 <- Map 2 (BROADCAST_EDGE), Map 3 (BROADCAST_EDGE)
+#### A masked pattern was here ####
+      Vertices:
+        Map 1 
+            Map Operator Tree:
+                TableScan
+                  alias: a
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Map Join Operator
+                    condition map:
+                         Inner Join 0 to 1
+                         Inner Join 0 to 2
+                    keys:
+                      0 key (type: int), value (type: int)
+                      1 value (type: int), key (type: int)
+                      2 key (type: int), value (type: int)
+                    nullSafes: [true, true]
+                    outputColumnNames: _col0, _col1, _col5, _col6, _col10, 
_col11
+                    input vertices:
+                      1 Map 2
+                      2 Map 3
+                    Statistics: Num rows: 13 Data size: 52 Basic stats: 
COMPLETE Column stats: NONE
+                    HybridGraceHashJoin: true
+                    Select Operator
+                      expressions: _col0 (type: int), _col1 (type: int), _col5 
(type: int), _col6 (type: int), _col10 (type: int), _col11 (type: int)
+                      outputColumnNames: _col0, _col1, _col2, _col3, _col4, 
_col5
+                      Statistics: Num rows: 13 Data size: 52 Basic stats: 
COMPLETE Column stats: NONE
+                      File Output Operator
+                        compressed: false
+                        Statistics: Num rows: 13 Data size: 52 Basic stats: 
COMPLETE Column stats: NONE
+                        table:
+                            input format: 
org.apache.hadoop.mapred.TextInputFormat
+                            output format: 
org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
+                            serde: 
org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+            Execution mode: vectorized
+        Map 2 
+            Map Operator Tree:
+                TableScan
+                  alias: b
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Reduce Output Operator
+                    key expressions: value (type: int), key (type: int)
+                    sort order: ++
+                    Map-reduce partition columns: value (type: int), key 
(type: int)
+                    Statistics: Num rows: 6 Data size: 24 Basic stats: 
COMPLETE Column stats: NONE
+            Execution mode: vectorized
+        Map 3 
+            Map Operator Tree:
+                TableScan
+                  alias: c
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Reduce Output Operator
+                    key expressions: key (type: int), value (type: int)
+                    sort order: ++
+                    Map-reduce partition columns: key (type: int), value 
(type: int)
+                    Statistics: Num rows: 6 Data size: 24 Basic stats: 
COMPLETE Column stats: NONE
+            Execution mode: vectorized
+
+  Stage: Stage-0
+    Fetch Operator
+      limit: -1
+      Processor Tree:
+        ListSink
+
+PREHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value 
AND a.value<=>b.key join myinput1 c on a.key<=>c.key AND a.value<=>c.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value 
AND a.value<=>b.key join myinput1 c on a.key<=>c.key AND a.value<=>c.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10     NULL    NULL    10      10      NULL
+100    100     100     100     100     100
+NULL   10      10      NULL    NULL    10
+NULL   NULL    NULL    NULL    NULL    NULL
+PREHOOK: query: -- outer joins
+SELECT * FROM myinput1 a LEFT OUTER JOIN myinput1 b ON a.key<=>b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: -- outer joins
+SELECT * FROM myinput1 a LEFT OUTER JOIN myinput1 b ON a.key<=>b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10     NULL    NULL    10
+100    100     100     100
+48     NULL    NULL    NULL
+NULL   10      10      NULL
+NULL   10      48      NULL
+NULL   10      NULL    NULL
+NULL   35      10      NULL
+NULL   35      48      NULL
+NULL   35      NULL    NULL
+NULL   NULL    10      NULL
+NULL   NULL    48      NULL
+NULL   NULL    NULL    NULL
+PREHOOK: query: SELECT * FROM myinput1 a RIGHT OUTER JOIN myinput1 b ON 
a.key<=>b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: SELECT * FROM myinput1 a RIGHT OUTER JOIN myinput1 b ON 
a.key<=>b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10     NULL    NULL    10
+100    100     100     100
+NULL   10      10      NULL
+NULL   10      48      NULL
+NULL   10      NULL    NULL
+NULL   35      10      NULL
+NULL   35      48      NULL
+NULL   35      NULL    NULL
+NULL   NULL    10      NULL
+NULL   NULL    48      NULL
+NULL   NULL    NULL    35
+NULL   NULL    NULL    NULL
+PREHOOK: query: SELECT * FROM myinput1 a FULL OUTER JOIN myinput1 b ON 
a.key<=>b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: SELECT * FROM myinput1 a FULL OUTER JOIN myinput1 b ON 
a.key<=>b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10     NULL    NULL    10
+100    100     100     100
+48     NULL    NULL    NULL
+NULL   10      10      NULL
+NULL   10      48      NULL
+NULL   10      NULL    NULL
+NULL   35      10      NULL
+NULL   35      48      NULL
+NULL   35      NULL    NULL
+NULL   NULL    10      NULL
+NULL   NULL    48      NULL
+NULL   NULL    NULL    35
+NULL   NULL    NULL    NULL
+PREHOOK: query: -- map joins
+SELECT /*+ MAPJOIN(a) */ * FROM myinput1 a JOIN myinput1 b ON a.key<=>b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: -- map joins
+SELECT /*+ MAPJOIN(a) */ * FROM myinput1 a JOIN myinput1 b ON a.key<=>b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10     NULL    NULL    10
+100    100     100     100
+NULL   10      10      NULL
+NULL   10      48      NULL
+NULL   10      NULL    NULL
+NULL   35      10      NULL
+NULL   35      48      NULL
+NULL   35      NULL    NULL
+NULL   NULL    10      NULL
+NULL   NULL    48      NULL
+NULL   NULL    NULL    NULL
+PREHOOK: query: SELECT /*+ MAPJOIN(b) */ * FROM myinput1 a JOIN myinput1 b ON 
a.key<=>b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: SELECT /*+ MAPJOIN(b) */ * FROM myinput1 a JOIN myinput1 b ON 
a.key<=>b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10     NULL    NULL    10
+100    100     100     100
+NULL   10      10      NULL
+NULL   10      48      NULL
+NULL   10      NULL    NULL
+NULL   35      10      NULL
+NULL   35      48      NULL
+NULL   35      NULL    NULL
+NULL   NULL    10      NULL
+NULL   NULL    48      NULL
+NULL   NULL    NULL    NULL
+PREHOOK: query: -- merging
+explain select * from myinput1 a join myinput1 b on a.key<=>b.value
+PREHOOK: type: QUERY
+POSTHOOK: query: -- merging
+explain select * from myinput1 a join myinput1 b on a.key<=>b.value
+POSTHOOK: type: QUERY
+STAGE DEPENDENCIES:
+  Stage-1 is a root stage
+  Stage-0 depends on stages: Stage-1
+
+STAGE PLANS:
+  Stage: Stage-1
+    Tez
+      Edges:
+        Map 1 <- Map 2 (BROADCAST_EDGE)
+#### A masked pattern was here ####
+      Vertices:
+        Map 1 
+            Map Operator Tree:
+                TableScan
+                  alias: a
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Map Join Operator
+                    condition map:
+                         Inner Join 0 to 1
+                    keys:
+                      0 key (type: int)
+                      1 value (type: int)
+                    nullSafes: [true]
+                    outputColumnNames: _col0, _col1, _col5, _col6
+                    input vertices:
+                      1 Map 2
+                    Statistics: Num rows: 6 Data size: 26 Basic stats: 
COMPLETE Column stats: NONE
+                    HybridGraceHashJoin: true
+                    Select Operator
+                      expressions: _col0 (type: int), _col1 (type: int), _col5 
(type: int), _col6 (type: int)
+                      outputColumnNames: _col0, _col1, _col2, _col3
+                      Statistics: Num rows: 6 Data size: 26 Basic stats: 
COMPLETE Column stats: NONE
+                      File Output Operator
+                        compressed: false
+                        Statistics: Num rows: 6 Data size: 26 Basic stats: 
COMPLETE Column stats: NONE
+                        table:
+                            input format: 
org.apache.hadoop.mapred.TextInputFormat
+                            output format: 
org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
+                            serde: 
org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+            Execution mode: vectorized
+        Map 2 
+            Map Operator Tree:
+                TableScan
+                  alias: b
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Reduce Output Operator
+                    key expressions: value (type: int)
+                    sort order: +
+                    Map-reduce partition columns: value (type: int)
+                    Statistics: Num rows: 6 Data size: 24 Basic stats: 
COMPLETE Column stats: NONE
+                    value expressions: key (type: int)
+            Execution mode: vectorized
+
+  Stage: Stage-0
+    Fetch Operator
+      limit: -1
+      Processor Tree:
+        ListSink
+
+PREHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10     NULL    NULL    10
+100    100     100     100
+NULL   10      10      NULL
+NULL   10      48      NULL
+NULL   10      NULL    NULL
+NULL   35      10      NULL
+NULL   35      48      NULL
+NULL   35      NULL    NULL
+NULL   NULL    10      NULL
+NULL   NULL    48      NULL
+NULL   NULL    NULL    NULL
+PREHOOK: query: explain select * from myinput1 a join myinput1 b on 
a.key<=>b.value join myinput1 c on a.key=c.key
+PREHOOK: type: QUERY
+POSTHOOK: query: explain select * from myinput1 a join myinput1 b on 
a.key<=>b.value join myinput1 c on a.key=c.key
+POSTHOOK: type: QUERY
+STAGE DEPENDENCIES:
+  Stage-1 is a root stage
+  Stage-0 depends on stages: Stage-1
+
+STAGE PLANS:
+  Stage: Stage-1
+    Tez
+      Edges:
+        Map 1 <- Map 2 (BROADCAST_EDGE), Map 3 (BROADCAST_EDGE)
+#### A masked pattern was here ####
+      Vertices:
+        Map 1 
+            Map Operator Tree:
+                TableScan
+                  alias: a
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Filter Operator
+                    predicate: key is not null (type: boolean)
+                    Statistics: Num rows: 3 Data size: 12 Basic stats: 
COMPLETE Column stats: NONE
+                    Map Join Operator
+                      condition map:
+                           Inner Join 0 to 1
+                           Inner Join 0 to 2
+                      keys:
+                        0 key (type: int)
+                        1 value (type: int)
+                        2 key (type: int)
+                      outputColumnNames: _col0, _col1, _col5, _col6, _col10, 
_col11
+                      input vertices:
+                        1 Map 2
+                        2 Map 3
+                      Statistics: Num rows: 6 Data size: 26 Basic stats: 
COMPLETE Column stats: NONE
+                      HybridGraceHashJoin: true
+                      Select Operator
+                        expressions: _col0 (type: int), _col1 (type: int), 
_col5 (type: int), _col6 (type: int), _col10 (type: int), _col11 (type: int)
+                        outputColumnNames: _col0, _col1, _col2, _col3, _col4, 
_col5
+                        Statistics: Num rows: 6 Data size: 26 Basic stats: 
COMPLETE Column stats: NONE
+                        File Output Operator
+                          compressed: false
+                          Statistics: Num rows: 6 Data size: 26 Basic stats: 
COMPLETE Column stats: NONE
+                          table:
+                              input format: 
org.apache.hadoop.mapred.TextInputFormat
+                              output format: 
org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
+                              serde: 
org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+            Execution mode: vectorized
+        Map 2 
+            Map Operator Tree:
+                TableScan
+                  alias: b
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Filter Operator
+                    predicate: value is not null (type: boolean)
+                    Statistics: Num rows: 3 Data size: 12 Basic stats: 
COMPLETE Column stats: NONE
+                    Reduce Output Operator
+                      key expressions: value (type: int)
+                      sort order: +
+                      Map-reduce partition columns: value (type: int)
+                      Statistics: Num rows: 3 Data size: 12 Basic stats: 
COMPLETE Column stats: NONE
+                      value expressions: key (type: int)
+            Execution mode: vectorized
+        Map 3 
+            Map Operator Tree:
+                TableScan
+                  alias: c
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Filter Operator
+                    predicate: key is not null (type: boolean)
+                    Statistics: Num rows: 3 Data size: 12 Basic stats: 
COMPLETE Column stats: NONE
+                    Reduce Output Operator
+                      key expressions: key (type: int)
+                      sort order: +
+                      Map-reduce partition columns: key (type: int)
+                      Statistics: Num rows: 3 Data size: 12 Basic stats: 
COMPLETE Column stats: NONE
+                      value expressions: value (type: int)
+            Execution mode: vectorized
+
+  Stage: Stage-0
+    Fetch Operator
+      limit: -1
+      Processor Tree:
+        ListSink
+
+PREHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value 
join myinput1 c on a.key=c.key
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value 
join myinput1 c on a.key=c.key
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10     NULL    NULL    10      10      NULL
+100    100     100     100     100     100
+PREHOOK: query: explain select * from myinput1 a join myinput1 b on 
a.key<=>b.value join myinput1 c on a.key<=>c.key
+PREHOOK: type: QUERY
+POSTHOOK: query: explain select * from myinput1 a join myinput1 b on 
a.key<=>b.value join myinput1 c on a.key<=>c.key
+POSTHOOK: type: QUERY
+STAGE DEPENDENCIES:
+  Stage-1 is a root stage
+  Stage-0 depends on stages: Stage-1
+
+STAGE PLANS:
+  Stage: Stage-1
+    Tez
+      Edges:
+        Map 1 <- Map 2 (BROADCAST_EDGE), Map 3 (BROADCAST_EDGE)
+#### A masked pattern was here ####
+      Vertices:
+        Map 1 
+            Map Operator Tree:
+                TableScan
+                  alias: a
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Map Join Operator
+                    condition map:
+                         Inner Join 0 to 1
+                         Inner Join 0 to 2
+                    keys:
+                      0 key (type: int)
+                      1 value (type: int)
+                      2 key (type: int)
+                    nullSafes: [true]
+                    outputColumnNames: _col0, _col1, _col5, _col6, _col10, 
_col11
+                    input vertices:
+                      1 Map 2
+                      2 Map 3
+                    Statistics: Num rows: 13 Data size: 52 Basic stats: 
COMPLETE Column stats: NONE
+                    HybridGraceHashJoin: true
+                    Select Operator
+                      expressions: _col0 (type: int), _col1 (type: int), _col5 
(type: int), _col6 (type: int), _col10 (type: int), _col11 (type: int)
+                      outputColumnNames: _col0, _col1, _col2, _col3, _col4, 
_col5
+                      Statistics: Num rows: 13 Data size: 52 Basic stats: 
COMPLETE Column stats: NONE
+                      File Output Operator
+                        compressed: false
+                        Statistics: Num rows: 13 Data size: 52 Basic stats: 
COMPLETE Column stats: NONE
+                        table:
+                            input format: 
org.apache.hadoop.mapred.TextInputFormat
+                            output format: 
org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
+                            serde: 
org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+            Execution mode: vectorized
+        Map 2 
+            Map Operator Tree:
+                TableScan
+                  alias: b
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Reduce Output Operator
+                    key expressions: value (type: int)
+                    sort order: +
+                    Map-reduce partition columns: value (type: int)
+                    Statistics: Num rows: 6 Data size: 24 Basic stats: 
COMPLETE Column stats: NONE
+                    value expressions: key (type: int)
+            Execution mode: vectorized
+        Map 3 
+            Map Operator Tree:
+                TableScan
+                  alias: c
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Reduce Output Operator
+                    key expressions: key (type: int)
+                    sort order: +
+                    Map-reduce partition columns: key (type: int)
+                    Statistics: Num rows: 6 Data size: 24 Basic stats: 
COMPLETE Column stats: NONE
+                    value expressions: value (type: int)
+            Execution mode: vectorized
+
+  Stage: Stage-0
+    Fetch Operator
+      limit: -1
+      Processor Tree:
+        ListSink
+
+PREHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value 
join myinput1 c on a.key<=>c.key
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value 
join myinput1 c on a.key<=>c.key
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10     NULL    NULL    10      10      NULL
+100    100     100     100     100     100
+NULL   10      10      NULL    NULL    10
+NULL   10      10      NULL    NULL    35
+NULL   10      10      NULL    NULL    NULL
+NULL   10      48      NULL    NULL    10
+NULL   10      48      NULL    NULL    35
+NULL   10      48      NULL    NULL    NULL
+NULL   10      NULL    NULL    NULL    10
+NULL   10      NULL    NULL    NULL    35
+NULL   10      NULL    NULL    NULL    NULL
+NULL   35      10      NULL    NULL    10
+NULL   35      10      NULL    NULL    35
+NULL   35      10      NULL    NULL    NULL
+NULL   35      48      NULL    NULL    10
+NULL   35      48      NULL    NULL    35
+NULL   35      48      NULL    NULL    NULL
+NULL   35      NULL    NULL    NULL    10
+NULL   35      NULL    NULL    NULL    35
+NULL   35      NULL    NULL    NULL    NULL
+NULL   NULL    10      NULL    NULL    10
+NULL   NULL    10      NULL    NULL    35
+NULL   NULL    10      NULL    NULL    NULL
+NULL   NULL    48      NULL    NULL    10
+NULL   NULL    48      NULL    NULL    35
+NULL   NULL    48      NULL    NULL    NULL
+NULL   NULL    NULL    NULL    NULL    10
+NULL   NULL    NULL    NULL    NULL    35
+NULL   NULL    NULL    NULL    NULL    NULL
+PREHOOK: query: explain select * from myinput1 a join myinput1 b on 
a.key<=>b.value AND a.value=b.key join myinput1 c on a.key<=>c.key AND 
a.value=c.value
+PREHOOK: type: QUERY
+POSTHOOK: query: explain select * from myinput1 a join myinput1 b on 
a.key<=>b.value AND a.value=b.key join myinput1 c on a.key<=>c.key AND 
a.value=c.value
+POSTHOOK: type: QUERY
+STAGE DEPENDENCIES:
+  Stage-1 is a root stage
+  Stage-0 depends on stages: Stage-1
+
+STAGE PLANS:
+  Stage: Stage-1
+    Tez
+      Edges:
+        Map 1 <- Map 2 (BROADCAST_EDGE), Map 3 (BROADCAST_EDGE)
+#### A masked pattern was here ####
+      Vertices:
+        Map 1 
+            Map Operator Tree:
+                TableScan
+                  alias: a
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Filter Operator
+                    predicate: value is not null (type: boolean)
+                    Statistics: Num rows: 3 Data size: 12 Basic stats: 
COMPLETE Column stats: NONE
+                    Map Join Operator
+                      condition map:
+                           Inner Join 0 to 1
+                           Inner Join 0 to 2
+                      keys:
+                        0 key (type: int), value (type: int)
+                        1 value (type: int), key (type: int)
+                        2 key (type: int), value (type: int)
+                      nullSafes: [true, false]
+                      outputColumnNames: _col0, _col1, _col5, _col6, _col10, 
_col11
+                      input vertices:
+                        1 Map 2
+                        2 Map 3
+                      Statistics: Num rows: 6 Data size: 26 Basic stats: 
COMPLETE Column stats: NONE
+                      HybridGraceHashJoin: true
+                      Select Operator
+                        expressions: _col0 (type: int), _col1 (type: int), 
_col5 (type: int), _col6 (type: int), _col10 (type: int), _col11 (type: int)
+                        outputColumnNames: _col0, _col1, _col2, _col3, _col4, 
_col5
+                        Statistics: Num rows: 6 Data size: 26 Basic stats: 
COMPLETE Column stats: NONE
+                        File Output Operator
+                          compressed: false
+                          Statistics: Num rows: 6 Data size: 26 Basic stats: 
COMPLETE Column stats: NONE
+                          table:
+                              input format: 
org.apache.hadoop.mapred.TextInputFormat
+                              output format: 
org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
+                              serde: 
org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+            Execution mode: vectorized
+        Map 2 
+            Map Operator Tree:
+                TableScan
+                  alias: b
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Filter Operator
+                    predicate: key is not null (type: boolean)
+                    Statistics: Num rows: 3 Data size: 12 Basic stats: 
COMPLETE Column stats: NONE
+                    Reduce Output Operator
+                      key expressions: value (type: int), key (type: int)
+                      sort order: ++
+                      Map-reduce partition columns: value (type: int), key 
(type: int)
+                      Statistics: Num rows: 3 Data size: 12 Basic stats: 
COMPLETE Column stats: NONE
+            Execution mode: vectorized
+        Map 3 
+            Map Operator Tree:
+                TableScan
+                  alias: c
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Filter Operator
+                    predicate: value is not null (type: boolean)
+                    Statistics: Num rows: 3 Data size: 12 Basic stats: 
COMPLETE Column stats: NONE
+                    Reduce Output Operator
+                      key expressions: key (type: int), value (type: int)
+                      sort order: ++
+                      Map-reduce partition columns: key (type: int), value 
(type: int)
+                      Statistics: Num rows: 3 Data size: 12 Basic stats: 
COMPLETE Column stats: NONE
+            Execution mode: vectorized
+
+  Stage: Stage-0
+    Fetch Operator
+      limit: -1
+      Processor Tree:
+        ListSink
+
+PREHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value 
AND a.value=b.key join myinput1 c on a.key<=>c.key AND a.value=c.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value 
AND a.value=b.key join myinput1 c on a.key<=>c.key AND a.value=c.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+100    100     100     100     100     100
+NULL   10      10      NULL    NULL    10
+PREHOOK: query: explain select * from myinput1 a join myinput1 b on 
a.key<=>b.value AND a.value<=>b.key join myinput1 c on a.key<=>c.key AND 
a.value<=>c.value
+PREHOOK: type: QUERY
+POSTHOOK: query: explain select * from myinput1 a join myinput1 b on 
a.key<=>b.value AND a.value<=>b.key join myinput1 c on a.key<=>c.key AND 
a.value<=>c.value
+POSTHOOK: type: QUERY
+STAGE DEPENDENCIES:
+  Stage-1 is a root stage
+  Stage-0 depends on stages: Stage-1
+
+STAGE PLANS:
+  Stage: Stage-1
+    Tez
+      Edges:
+        Map 1 <- Map 2 (BROADCAST_EDGE), Map 3 (BROADCAST_EDGE)
+#### A masked pattern was here ####
+      Vertices:
+        Map 1 
+            Map Operator Tree:
+                TableScan
+                  alias: a
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Map Join Operator
+                    condition map:
+                         Inner Join 0 to 1
+                         Inner Join 0 to 2
+                    keys:
+                      0 key (type: int), value (type: int)
+                      1 value (type: int), key (type: int)
+                      2 key (type: int), value (type: int)
+                    nullSafes: [true, true]
+                    outputColumnNames: _col0, _col1, _col5, _col6, _col10, 
_col11
+                    input vertices:
+                      1 Map 2
+                      2 Map 3
+                    Statistics: Num rows: 13 Data size: 52 Basic stats: 
COMPLETE Column stats: NONE
+                    HybridGraceHashJoin: true
+                    Select Operator
+                      expressions: _col0 (type: int), _col1 (type: int), _col5 
(type: int), _col6 (type: int), _col10 (type: int), _col11 (type: int)
+                      outputColumnNames: _col0, _col1, _col2, _col3, _col4, 
_col5
+                      Statistics: Num rows: 13 Data size: 52 Basic stats: 
COMPLETE Column stats: NONE
+                      File Output Operator
+                        compressed: false
+                        Statistics: Num rows: 13 Data size: 52 Basic stats: 
COMPLETE Column stats: NONE
+                        table:
+                            input format: 
org.apache.hadoop.mapred.TextInputFormat
+                            output format: 
org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
+                            serde: 
org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+            Execution mode: vectorized
+        Map 2 
+            Map Operator Tree:
+                TableScan
+                  alias: b
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Reduce Output Operator
+                    key expressions: value (type: int), key (type: int)
+                    sort order: ++
+                    Map-reduce partition columns: value (type: int), key 
(type: int)
+                    Statistics: Num rows: 6 Data size: 24 Basic stats: 
COMPLETE Column stats: NONE
+            Execution mode: vectorized
+        Map 3 
+            Map Operator Tree:
+                TableScan
+                  alias: c
+                  Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE 
Column stats: NONE
+                  Reduce Output Operator
+                    key expressions: key (type: int), value (type: int)
+                    sort order: ++
+                    Map-reduce partition columns: key (type: int), value 
(type: int)
+                    Statistics: Num rows: 6 Data size: 24 Basic stats: 
COMPLETE Column stats: NONE
+            Execution mode: vectorized
+
+  Stage: Stage-0
+    Fetch Operator
+      limit: -1
+      Processor Tree:
+        ListSink
+
+PREHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value 
AND a.value<=>b.key join myinput1 c on a.key<=>c.key AND a.value<=>c.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value 
AND a.value<=>b.key join myinput1 c on a.key<=>c.key AND a.value<=>c.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10     NULL    NULL    10      10      NULL
+100    100     100     100     100     100
+NULL   10      10      NULL    NULL    10
+NULL   NULL    NULL    NULL    NULL    NULL
+PREHOOK: query: -- outer joins
+SELECT * FROM myinput1 a LEFT OUTER JOIN myinput1 b ON a.key<=>b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: -- outer joins
+SELECT * FROM myinput1 a LEFT OUTER JOIN myinput1 b ON a.key<=>b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10     NULL    NULL    10
+100    100     100     100
+48     NULL    NULL    NULL
+NULL   10      10      NULL
+NULL   10      48      NULL
+NULL   10      NULL    NULL
+NULL   35      10      NULL
+NULL   35      48      NULL
+NULL   35      NULL    NULL
+NULL   NULL    10      NULL
+NULL   NULL    48      NULL
+NULL   NULL    NULL    NULL
+PREHOOK: query: SELECT * FROM myinput1 a RIGHT OUTER JOIN myinput1 b ON 
a.key<=>b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: SELECT * FROM myinput1 a RIGHT OUTER JOIN myinput1 b ON 
a.key<=>b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10     NULL    NULL    10
+100    100     100     100
+NULL   10      10      NULL
+NULL   10      48      NULL
+NULL   10      NULL    NULL
+NULL   35      10      NULL
+NULL   35      48      NULL
+NULL   35      NULL    NULL
+NULL   NULL    10      NULL
+NULL   NULL    48      NULL
+NULL   NULL    NULL    35
+NULL   NULL    NULL    NULL
+PREHOOK: query: SELECT * FROM myinput1 a FULL OUTER JOIN myinput1 b ON 
a.key<=>b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: SELECT * FROM myinput1 a FULL OUTER JOIN myinput1 b ON 
a.key<=>b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10     NULL    NULL    10
+100    100     100     100
+48     NULL    NULL    NULL
+NULL   10      10      NULL
+NULL   10      48      NULL
+NULL   10      NULL    NULL
+NULL   35      10      NULL
+NULL   35      48      NULL
+NULL   35      NULL    NULL
+NULL   NULL    10      NULL
+NULL   NULL    48      NULL
+NULL   NULL    NULL    35
+NULL   NULL    NULL    NULL
+PREHOOK: query: -- map joins
+SELECT /*+ MAPJOIN(a) */ * FROM myinput1 a JOIN myinput1 b ON a.key<=>b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: -- map joins
+SELECT /*+ MAPJOIN(a) */ * FROM myinput1 a JOIN myinput1 b ON a.key<=>b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10     NULL    NULL    10
+100    100     100     100
+NULL   10      10      NULL
+NULL   10      48      NULL
+NULL   10      NULL    NULL
+NULL   35      10      NULL
+NULL   35      48      NULL
+NULL   35      NULL    NULL
+NULL   NULL    10      NULL
+NULL   NULL    48      NULL
+NULL   NULL    NULL    NULL
+PREHOOK: query: SELECT /*+ MAPJOIN(b) */ * FROM myinput1 a JOIN myinput1 b ON 
a.key<=>b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: SELECT /*+ MAPJOIN(b) */ * FROM myinput1 a JOIN myinput1 b ON 
a.key<=>b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10     NULL    NULL    10
+100    100     100     100
+NULL   10      10      NULL
+NULL   10      48      NULL
+NULL   10      NULL    NULL
+NULL   35      10      NULL
+NULL   35      48      NULL
+NULL   35      NULL    NULL
+NULL   NULL    10      NULL
+NULL   NULL    48      NULL
+NULL   NULL    NULL    NULL

Reply via email to