You are viewing a plain text version of this content. The canonical link (a hyperlink in the original archive page) was not preserved in this plain-text copy.
Posted to commits@hive.apache.org by gu...@apache.org on 2014/11/08 01:00:19 UTC

svn commit: r1637489 - in /hive/trunk: itests/src/test/resources/ ql/src/java/org/apache/hadoop/hive/ql/exec/ ql/src/java/org/apache/hadoop/hive/ql/optimizer/ ql/src/test/results/clientpositive/tez/

Author: gunther
Date: Sat Nov  8 00:00:19 2014
New Revision: 1637489

URL: http://svn.apache.org/r1637489
Log:
HIVE-8781: Nullsafe joins are busted on Tez (Gunther Hagleitner, reviewed by Prasanth J)

Added:
    hive/trunk/ql/src/test/results/clientpositive/tez/join_nullsafe.q.out
Modified:
    hive/trunk/itests/src/test/resources/testconfiguration.properties
    hive/trunk/ql/src/java/org/apache/hadoop/hive/ql/exec/CommonMergeJoinOperator.java
    hive/trunk/ql/src/java/org/apache/hadoop/hive/ql/optimizer/ConvertJoinMapJoin.java
    hive/trunk/ql/src/test/results/clientpositive/tez/tez_union_group_by.q.out

Modified: hive/trunk/itests/src/test/resources/testconfiguration.properties
URL: http://svn.apache.org/viewvc/hive/trunk/itests/src/test/resources/testconfiguration.properties?rev=1637489&r1=1637488&r2=1637489&view=diff
==============================================================================
--- hive/trunk/itests/src/test/resources/testconfiguration.properties (original)
+++ hive/trunk/itests/src/test/resources/testconfiguration.properties Sat Nov  8 00:00:19 2014
@@ -108,6 +108,7 @@ minitez.query.files.shared=alter_merge_2
   insert_update_delete.q,\
   join0.q,\
   join1.q,\
+  join_nullsafe.q,\
   leftsemijoin.q,\
   limit_pushdown.q,\
   load_dyn_part1.q,\

Modified: hive/trunk/ql/src/java/org/apache/hadoop/hive/ql/exec/CommonMergeJoinOperator.java
URL: http://svn.apache.org/viewvc/hive/trunk/ql/src/java/org/apache/hadoop/hive/ql/exec/CommonMergeJoinOperator.java?rev=1637489&r1=1637488&r2=1637489&view=diff
==============================================================================
--- hive/trunk/ql/src/java/org/apache/hadoop/hive/ql/exec/CommonMergeJoinOperator.java (original)
+++ hive/trunk/ql/src/java/org/apache/hadoop/hive/ql/exec/CommonMergeJoinOperator.java Sat Nov  8 00:00:19 2014
@@ -438,8 +438,11 @@ public class CommonMergeJoinOperator ext
       WritableComparable key_1 = (WritableComparable) k1.get(i);
       WritableComparable key_2 = (WritableComparable) k2.get(i);
       if (key_1 == null && key_2 == null) {
-        return nullsafes != null && nullsafes[i] ? 0 : -1; // just return k1 is
-                                                           // smaller than k2
+        if (nullsafes != null && nullsafes[i]) {
+          continue;
+        } else {
+          return -1;
+        }
       } else if (key_1 == null) {
         return -1;
       } else if (key_2 == null) {

Modified: hive/trunk/ql/src/java/org/apache/hadoop/hive/ql/optimizer/ConvertJoinMapJoin.java
URL: http://svn.apache.org/viewvc/hive/trunk/ql/src/java/org/apache/hadoop/hive/ql/optimizer/ConvertJoinMapJoin.java?rev=1637489&r1=1637488&r2=1637489&view=diff
==============================================================================
--- hive/trunk/ql/src/java/org/apache/hadoop/hive/ql/optimizer/ConvertJoinMapJoin.java (original)
+++ hive/trunk/ql/src/java/org/apache/hadoop/hive/ql/optimizer/ConvertJoinMapJoin.java Sat Nov  8 00:00:19 2014
@@ -240,6 +240,9 @@ public class ConvertJoinMapJoin implemen
           new MapJoinDesc(null, null, joinDesc.getExprs(), null, null,
               joinDesc.getOutputColumnNames(), mapJoinConversionPos, joinDesc.getConds(),
               joinDesc.getFilters(), joinDesc.getNoOuterJoin(), null);
+      mapJoinDesc.setNullSafes(joinDesc.getNullSafes());
+      mapJoinDesc.setFilterMap(joinDesc.getFilterMap());
+      mapJoinDesc.resetOrder();
     }
 
     @SuppressWarnings("unchecked")

Added: hive/trunk/ql/src/test/results/clientpositive/tez/join_nullsafe.q.out
URL: http://svn.apache.org/viewvc/hive/trunk/ql/src/test/results/clientpositive/tez/join_nullsafe.q.out?rev=1637489&view=auto
==============================================================================
--- hive/trunk/ql/src/test/results/clientpositive/tez/join_nullsafe.q.out (added)
+++ hive/trunk/ql/src/test/results/clientpositive/tez/join_nullsafe.q.out Sat Nov  8 00:00:19 2014
@@ -0,0 +1,1641 @@
+PREHOOK: query: -- SORT_QUERY_RESULTS
+
+CREATE TABLE myinput1(key int, value int)
+PREHOOK: type: CREATETABLE
+PREHOOK: Output: database:default
+PREHOOK: Output: default@myinput1
+POSTHOOK: query: -- SORT_QUERY_RESULTS
+
+CREATE TABLE myinput1(key int, value int)
+POSTHOOK: type: CREATETABLE
+POSTHOOK: Output: database:default
+POSTHOOK: Output: default@myinput1
+PREHOOK: query: LOAD DATA LOCAL INPATH '../../data/files/in8.txt' INTO TABLE myinput1
+PREHOOK: type: LOAD
+#### A masked pattern was here ####
+PREHOOK: Output: default@myinput1
+POSTHOOK: query: LOAD DATA LOCAL INPATH '../../data/files/in8.txt' INTO TABLE myinput1
+POSTHOOK: type: LOAD
+#### A masked pattern was here ####
+POSTHOOK: Output: default@myinput1
+PREHOOK: query: -- merging
+explain select * from myinput1 a join myinput1 b on a.key<=>b.value
+PREHOOK: type: QUERY
+POSTHOOK: query: -- merging
+explain select * from myinput1 a join myinput1 b on a.key<=>b.value
+POSTHOOK: type: QUERY
+STAGE DEPENDENCIES:
+  Stage-1 is a root stage
+  Stage-0 depends on stages: Stage-1
+
+STAGE PLANS:
+  Stage: Stage-1
+    Tez
+      Edges:
+        Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE)
+#### A masked pattern was here ####
+      Vertices:
+        Map 1 
+            Map Operator Tree:
+                TableScan
+                  alias: b
+                  Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+                  Reduce Output Operator
+                    key expressions: value (type: int)
+                    sort order: +
+                    Map-reduce partition columns: value (type: int)
+                    Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+                    value expressions: key (type: int)
+        Map 3 
+            Map Operator Tree:
+                TableScan
+                  alias: a
+                  Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+                  Reduce Output Operator
+                    key expressions: key (type: int)
+                    sort order: +
+                    Map-reduce partition columns: key (type: int)
+                    Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+                    value expressions: value (type: int)
+        Reducer 2 
+            Reduce Operator Tree:
+              Merge Join Operator
+                condition map:
+                     Inner Join 0 to 1
+                condition expressions:
+                  0 {KEY.reducesinkkey0} {VALUE._col0}
+                  1 {VALUE._col0} {KEY.reducesinkkey0}
+                nullSafes: [true]
+                outputColumnNames: _col0, _col1, _col5, _col6
+                Statistics: Num rows: 3 Data size: 28 Basic stats: COMPLETE Column stats: NONE
+                Select Operator
+                  expressions: _col0 (type: int), _col1 (type: int), _col5 (type: int), _col6 (type: int)
+                  outputColumnNames: _col0, _col1, _col2, _col3
+                  Statistics: Num rows: 3 Data size: 28 Basic stats: COMPLETE Column stats: NONE
+                  File Output Operator
+                    compressed: false
+                    Statistics: Num rows: 3 Data size: 28 Basic stats: COMPLETE Column stats: NONE
+                    table:
+                        input format: org.apache.hadoop.mapred.TextInputFormat
+                        output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
+                        serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+
+  Stage: Stage-0
+    Fetch Operator
+      limit: -1
+      Processor Tree:
+        ListSink
+
+PREHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10	NULL	NULL	10
+100	100	100	100
+NULL	10	10	NULL
+NULL	10	48	NULL
+NULL	10	NULL	NULL
+NULL	35	10	NULL
+NULL	35	48	NULL
+NULL	35	NULL	NULL
+NULL	NULL	10	NULL
+NULL	NULL	48	NULL
+NULL	NULL	NULL	NULL
+PREHOOK: query: explain select * from myinput1 a join myinput1 b on a.key<=>b.value join myinput1 c on a.key=c.key
+PREHOOK: type: QUERY
+POSTHOOK: query: explain select * from myinput1 a join myinput1 b on a.key<=>b.value join myinput1 c on a.key=c.key
+POSTHOOK: type: QUERY
+STAGE DEPENDENCIES:
+  Stage-1 is a root stage
+  Stage-0 depends on stages: Stage-1
+
+STAGE PLANS:
+  Stage: Stage-1
+    Tez
+      Edges:
+        Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE)
+#### A masked pattern was here ####
+      Vertices:
+        Map 1 
+            Map Operator Tree:
+                TableScan
+                  alias: b
+                  Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+                  Filter Operator
+                    predicate: value is not null (type: boolean)
+                    Statistics: Num rows: 2 Data size: 17 Basic stats: COMPLETE Column stats: NONE
+                    Reduce Output Operator
+                      key expressions: value (type: int)
+                      sort order: +
+                      Map-reduce partition columns: value (type: int)
+                      Statistics: Num rows: 2 Data size: 17 Basic stats: COMPLETE Column stats: NONE
+                      value expressions: key (type: int)
+        Map 3 
+            Map Operator Tree:
+                TableScan
+                  alias: c
+                  Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+                  Filter Operator
+                    predicate: key is not null (type: boolean)
+                    Statistics: Num rows: 2 Data size: 17 Basic stats: COMPLETE Column stats: NONE
+                    Reduce Output Operator
+                      key expressions: key (type: int)
+                      sort order: +
+                      Map-reduce partition columns: key (type: int)
+                      Statistics: Num rows: 2 Data size: 17 Basic stats: COMPLETE Column stats: NONE
+                      value expressions: value (type: int)
+        Map 4 
+            Map Operator Tree:
+                TableScan
+                  alias: a
+                  Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+                  Filter Operator
+                    predicate: key is not null (type: boolean)
+                    Statistics: Num rows: 2 Data size: 17 Basic stats: COMPLETE Column stats: NONE
+                    Reduce Output Operator
+                      key expressions: key (type: int)
+                      sort order: +
+                      Map-reduce partition columns: key (type: int)
+                      Statistics: Num rows: 2 Data size: 17 Basic stats: COMPLETE Column stats: NONE
+                      value expressions: value (type: int)
+        Reducer 2 
+            Reduce Operator Tree:
+              Merge Join Operator
+                condition map:
+                     Inner Join 0 to 1
+                     Inner Join 0 to 2
+                condition expressions:
+                  0 {KEY.reducesinkkey0} {VALUE._col0}
+                  1 {VALUE._col0} {KEY.reducesinkkey0}
+                  2 {KEY.reducesinkkey0} {VALUE._col0}
+                outputColumnNames: _col0, _col1, _col5, _col6, _col10, _col11
+                Statistics: Num rows: 4 Data size: 37 Basic stats: COMPLETE Column stats: NONE
+                Select Operator
+                  expressions: _col0 (type: int), _col1 (type: int), _col5 (type: int), _col6 (type: int), _col10 (type: int), _col11 (type: int)
+                  outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
+                  Statistics: Num rows: 4 Data size: 37 Basic stats: COMPLETE Column stats: NONE
+                  File Output Operator
+                    compressed: false
+                    Statistics: Num rows: 4 Data size: 37 Basic stats: COMPLETE Column stats: NONE
+                    table:
+                        input format: org.apache.hadoop.mapred.TextInputFormat
+                        output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
+                        serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+
+  Stage: Stage-0
+    Fetch Operator
+      limit: -1
+      Processor Tree:
+        ListSink
+
+PREHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value join myinput1 c on a.key=c.key
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value join myinput1 c on a.key=c.key
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10	NULL	NULL	10	10	NULL
+100	100	100	100	100	100
+PREHOOK: query: explain select * from myinput1 a join myinput1 b on a.key<=>b.value join myinput1 c on a.key<=>c.key
+PREHOOK: type: QUERY
+POSTHOOK: query: explain select * from myinput1 a join myinput1 b on a.key<=>b.value join myinput1 c on a.key<=>c.key
+POSTHOOK: type: QUERY
+STAGE DEPENDENCIES:
+  Stage-1 is a root stage
+  Stage-0 depends on stages: Stage-1
+
+STAGE PLANS:
+  Stage: Stage-1
+    Tez
+      Edges:
+        Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE)
+#### A masked pattern was here ####
+      Vertices:
+        Map 1 
+            Map Operator Tree:
+                TableScan
+                  alias: b
+                  Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+                  Reduce Output Operator
+                    key expressions: value (type: int)
+                    sort order: +
+                    Map-reduce partition columns: value (type: int)
+                    Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+                    value expressions: key (type: int)
+        Map 3 
+            Map Operator Tree:
+                TableScan
+                  alias: c
+                  Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+                  Reduce Output Operator
+                    key expressions: key (type: int)
+                    sort order: +
+                    Map-reduce partition columns: key (type: int)
+                    Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+                    value expressions: value (type: int)
+        Map 4 
+            Map Operator Tree:
+                TableScan
+                  alias: a
+                  Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+                  Reduce Output Operator
+                    key expressions: key (type: int)
+                    sort order: +
+                    Map-reduce partition columns: key (type: int)
+                    Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+                    value expressions: value (type: int)
+        Reducer 2 
+            Reduce Operator Tree:
+              Merge Join Operator
+                condition map:
+                     Inner Join 0 to 1
+                     Inner Join 0 to 2
+                condition expressions:
+                  0 {KEY.reducesinkkey0} {VALUE._col0}
+                  1 {VALUE._col0} {KEY.reducesinkkey0}
+                  2 {KEY.reducesinkkey0} {VALUE._col0}
+                nullSafes: [true]
+                outputColumnNames: _col0, _col1, _col5, _col6, _col10, _col11
+                Statistics: Num rows: 6 Data size: 57 Basic stats: COMPLETE Column stats: NONE
+                Select Operator
+                  expressions: _col0 (type: int), _col1 (type: int), _col5 (type: int), _col6 (type: int), _col10 (type: int), _col11 (type: int)
+                  outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
+                  Statistics: Num rows: 6 Data size: 57 Basic stats: COMPLETE Column stats: NONE
+                  File Output Operator
+                    compressed: false
+                    Statistics: Num rows: 6 Data size: 57 Basic stats: COMPLETE Column stats: NONE
+                    table:
+                        input format: org.apache.hadoop.mapred.TextInputFormat
+                        output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
+                        serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+
+  Stage: Stage-0
+    Fetch Operator
+      limit: -1
+      Processor Tree:
+        ListSink
+
+PREHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value join myinput1 c on a.key<=>c.key
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value join myinput1 c on a.key<=>c.key
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10	NULL	NULL	10	10	NULL
+100	100	100	100	100	100
+NULL	10	10	NULL	NULL	10
+NULL	10	10	NULL	NULL	35
+NULL	10	10	NULL	NULL	NULL
+NULL	10	48	NULL	NULL	10
+NULL	10	48	NULL	NULL	35
+NULL	10	48	NULL	NULL	NULL
+NULL	10	NULL	NULL	NULL	10
+NULL	10	NULL	NULL	NULL	35
+NULL	10	NULL	NULL	NULL	NULL
+NULL	35	10	NULL	NULL	10
+NULL	35	10	NULL	NULL	35
+NULL	35	10	NULL	NULL	NULL
+NULL	35	48	NULL	NULL	10
+NULL	35	48	NULL	NULL	35
+NULL	35	48	NULL	NULL	NULL
+NULL	35	NULL	NULL	NULL	10
+NULL	35	NULL	NULL	NULL	35
+NULL	35	NULL	NULL	NULL	NULL
+NULL	NULL	10	NULL	NULL	10
+NULL	NULL	10	NULL	NULL	35
+NULL	NULL	10	NULL	NULL	NULL
+NULL	NULL	48	NULL	NULL	10
+NULL	NULL	48	NULL	NULL	35
+NULL	NULL	48	NULL	NULL	NULL
+NULL	NULL	NULL	NULL	NULL	10
+NULL	NULL	NULL	NULL	NULL	35
+NULL	NULL	NULL	NULL	NULL	NULL
+PREHOOK: query: explain select * from myinput1 a join myinput1 b on a.key<=>b.value AND a.value=b.key join myinput1 c on a.key<=>c.key AND a.value=c.value
+PREHOOK: type: QUERY
+POSTHOOK: query: explain select * from myinput1 a join myinput1 b on a.key<=>b.value AND a.value=b.key join myinput1 c on a.key<=>c.key AND a.value=c.value
+POSTHOOK: type: QUERY
+STAGE DEPENDENCIES:
+  Stage-1 is a root stage
+  Stage-0 depends on stages: Stage-1
+
+STAGE PLANS:
+  Stage: Stage-1
+    Tez
+      Edges:
+        Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE)
+#### A masked pattern was here ####
+      Vertices:
+        Map 1 
+            Map Operator Tree:
+                TableScan
+                  alias: b
+                  Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+                  Filter Operator
+                    predicate: key is not null (type: boolean)
+                    Statistics: Num rows: 2 Data size: 17 Basic stats: COMPLETE Column stats: NONE
+                    Reduce Output Operator
+                      key expressions: value (type: int), key (type: int)
+                      sort order: ++
+                      Map-reduce partition columns: value (type: int), key (type: int)
+                      Statistics: Num rows: 2 Data size: 17 Basic stats: COMPLETE Column stats: NONE
+        Map 3 
+            Map Operator Tree:
+                TableScan
+                  alias: c
+                  Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+                  Filter Operator
+                    predicate: value is not null (type: boolean)
+                    Statistics: Num rows: 2 Data size: 17 Basic stats: COMPLETE Column stats: NONE
+                    Reduce Output Operator
+                      key expressions: key (type: int), value (type: int)
+                      sort order: ++
+                      Map-reduce partition columns: key (type: int), value (type: int)
+                      Statistics: Num rows: 2 Data size: 17 Basic stats: COMPLETE Column stats: NONE
+        Map 4 
+            Map Operator Tree:
+                TableScan
+                  alias: a
+                  Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+                  Filter Operator
+                    predicate: value is not null (type: boolean)
+                    Statistics: Num rows: 2 Data size: 17 Basic stats: COMPLETE Column stats: NONE
+                    Reduce Output Operator
+                      key expressions: key (type: int), value (type: int)
+                      sort order: ++
+                      Map-reduce partition columns: key (type: int), value (type: int)
+                      Statistics: Num rows: 2 Data size: 17 Basic stats: COMPLETE Column stats: NONE
+        Reducer 2 
+            Reduce Operator Tree:
+              Merge Join Operator
+                condition map:
+                     Inner Join 0 to 1
+                     Inner Join 0 to 2
+                condition expressions:
+                  0 {KEY.reducesinkkey0} {KEY.reducesinkkey1}
+                  1 {KEY.reducesinkkey1} {KEY.reducesinkkey0}
+                  2 {KEY.reducesinkkey0} {KEY.reducesinkkey1}
+                nullSafes: [true, false]
+                outputColumnNames: _col0, _col1, _col5, _col6, _col10, _col11
+                Statistics: Num rows: 4 Data size: 37 Basic stats: COMPLETE Column stats: NONE
+                Select Operator
+                  expressions: _col0 (type: int), _col1 (type: int), _col5 (type: int), _col6 (type: int), _col10 (type: int), _col11 (type: int)
+                  outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
+                  Statistics: Num rows: 4 Data size: 37 Basic stats: COMPLETE Column stats: NONE
+                  File Output Operator
+                    compressed: false
+                    Statistics: Num rows: 4 Data size: 37 Basic stats: COMPLETE Column stats: NONE
+                    table:
+                        input format: org.apache.hadoop.mapred.TextInputFormat
+                        output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
+                        serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+
+  Stage: Stage-0
+    Fetch Operator
+      limit: -1
+      Processor Tree:
+        ListSink
+
+PREHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value AND a.value=b.key join myinput1 c on a.key<=>c.key AND a.value=c.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value AND a.value=b.key join myinput1 c on a.key<=>c.key AND a.value=c.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+100	100	100	100	100	100
+NULL	10	10	NULL	NULL	10
+PREHOOK: query: explain select * from myinput1 a join myinput1 b on a.key<=>b.value AND a.value<=>b.key join myinput1 c on a.key<=>c.key AND a.value<=>c.value
+PREHOOK: type: QUERY
+POSTHOOK: query: explain select * from myinput1 a join myinput1 b on a.key<=>b.value AND a.value<=>b.key join myinput1 c on a.key<=>c.key AND a.value<=>c.value
+POSTHOOK: type: QUERY
+STAGE DEPENDENCIES:
+  Stage-1 is a root stage
+  Stage-0 depends on stages: Stage-1
+
+STAGE PLANS:
+  Stage: Stage-1
+    Tez
+      Edges:
+        Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE)
+#### A masked pattern was here ####
+      Vertices:
+        Map 1 
+            Map Operator Tree:
+                TableScan
+                  alias: b
+                  Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+                  Reduce Output Operator
+                    key expressions: value (type: int), key (type: int)
+                    sort order: ++
+                    Map-reduce partition columns: value (type: int), key (type: int)
+                    Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+        Map 3 
+            Map Operator Tree:
+                TableScan
+                  alias: c
+                  Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+                  Reduce Output Operator
+                    key expressions: key (type: int), value (type: int)
+                    sort order: ++
+                    Map-reduce partition columns: key (type: int), value (type: int)
+                    Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+        Map 4 
+            Map Operator Tree:
+                TableScan
+                  alias: a
+                  Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+                  Reduce Output Operator
+                    key expressions: key (type: int), value (type: int)
+                    sort order: ++
+                    Map-reduce partition columns: key (type: int), value (type: int)
+                    Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+        Reducer 2 
+            Reduce Operator Tree:
+              Merge Join Operator
+                condition map:
+                     Inner Join 0 to 1
+                     Inner Join 0 to 2
+                condition expressions:
+                  0 {KEY.reducesinkkey0} {KEY.reducesinkkey1}
+                  1 {KEY.reducesinkkey1} {KEY.reducesinkkey0}
+                  2 {KEY.reducesinkkey0} {KEY.reducesinkkey1}
+                nullSafes: [true, true]
+                outputColumnNames: _col0, _col1, _col5, _col6, _col10, _col11
+                Statistics: Num rows: 6 Data size: 57 Basic stats: COMPLETE Column stats: NONE
+                Select Operator
+                  expressions: _col0 (type: int), _col1 (type: int), _col5 (type: int), _col6 (type: int), _col10 (type: int), _col11 (type: int)
+                  outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5
+                  Statistics: Num rows: 6 Data size: 57 Basic stats: COMPLETE Column stats: NONE
+                  File Output Operator
+                    compressed: false
+                    Statistics: Num rows: 6 Data size: 57 Basic stats: COMPLETE Column stats: NONE
+                    table:
+                        input format: org.apache.hadoop.mapred.TextInputFormat
+                        output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
+                        serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+
+  Stage: Stage-0
+    Fetch Operator
+      limit: -1
+      Processor Tree:
+        ListSink
+
+PREHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value AND a.value<=>b.key join myinput1 c on a.key<=>c.key AND a.value<=>c.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value AND a.value<=>b.key join myinput1 c on a.key<=>c.key AND a.value<=>c.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10	NULL	NULL	10	10	NULL
+100	100	100	100	100	100
+NULL	10	10	NULL	NULL	10
+NULL	NULL	NULL	NULL	NULL	NULL
+PREHOOK: query: -- outer joins
+SELECT * FROM myinput1 a LEFT OUTER JOIN myinput1 b ON a.key<=>b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: -- outer joins
+SELECT * FROM myinput1 a LEFT OUTER JOIN myinput1 b ON a.key<=>b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10	NULL	NULL	10
+100	100	100	100
+48	NULL	NULL	NULL
+NULL	10	10	NULL
+NULL	10	48	NULL
+NULL	10	NULL	NULL
+NULL	35	10	NULL
+NULL	35	48	NULL
+NULL	35	NULL	NULL
+NULL	NULL	10	NULL
+NULL	NULL	48	NULL
+NULL	NULL	NULL	NULL
+PREHOOK: query: SELECT * FROM myinput1 a RIGHT OUTER JOIN myinput1 b ON a.key<=>b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: SELECT * FROM myinput1 a RIGHT OUTER JOIN myinput1 b ON a.key<=>b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10	NULL	NULL	10
+100	100	100	100
+NULL	10	10	NULL
+NULL	10	48	NULL
+NULL	10	NULL	NULL
+NULL	35	10	NULL
+NULL	35	48	NULL
+NULL	35	NULL	NULL
+NULL	NULL	10	NULL
+NULL	NULL	48	NULL
+NULL	NULL	NULL	35
+NULL	NULL	NULL	NULL
+PREHOOK: query: SELECT * FROM myinput1 a FULL OUTER JOIN myinput1 b ON a.key<=>b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: SELECT * FROM myinput1 a FULL OUTER JOIN myinput1 b ON a.key<=>b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10	NULL	NULL	10
+100	100	100	100
+48	NULL	NULL	NULL
+NULL	10	10	NULL
+NULL	10	48	NULL
+NULL	10	NULL	NULL
+NULL	35	10	NULL
+NULL	35	48	NULL
+NULL	35	NULL	NULL
+NULL	NULL	10	NULL
+NULL	NULL	48	NULL
+NULL	NULL	NULL	35
+NULL	NULL	NULL	NULL
+PREHOOK: query: -- map joins
+SELECT /*+ MAPJOIN(a) */ * FROM myinput1 a JOIN myinput1 b ON a.key<=>b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: -- map joins
+SELECT /*+ MAPJOIN(a) */ * FROM myinput1 a JOIN myinput1 b ON a.key<=>b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10	NULL	NULL	10
+100	100	100	100
+NULL	10	10	NULL
+NULL	10	48	NULL
+NULL	10	NULL	NULL
+NULL	35	10	NULL
+NULL	35	48	NULL
+NULL	35	NULL	NULL
+NULL	NULL	10	NULL
+NULL	NULL	48	NULL
+NULL	NULL	NULL	NULL
+PREHOOK: query: SELECT /*+ MAPJOIN(b) */ * FROM myinput1 a JOIN myinput1 b ON a.key<=>b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: SELECT /*+ MAPJOIN(b) */ * FROM myinput1 a JOIN myinput1 b ON a.key<=>b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+10	NULL	NULL	10
+100	100	100	100
+NULL	10	10	NULL
+NULL	10	48	NULL
+NULL	10	NULL	NULL
+NULL	35	10	NULL
+NULL	35	48	NULL
+NULL	35	NULL	NULL
+NULL	NULL	10	NULL
+NULL	NULL	48	NULL
+NULL	NULL	NULL	NULL
+PREHOOK: query: CREATE TABLE smb_input(key int, value int)
+PREHOOK: type: CREATETABLE
+PREHOOK: Output: database:default
+PREHOOK: Output: default@smb_input
+POSTHOOK: query: CREATE TABLE smb_input(key int, value int)
+POSTHOOK: type: CREATETABLE
+POSTHOOK: Output: database:default
+POSTHOOK: Output: default@smb_input
+PREHOOK: query: LOAD DATA LOCAL INPATH '../../data/files/in4.txt' into table smb_input
+PREHOOK: type: LOAD
+#### A masked pattern was here ####
+PREHOOK: Output: default@smb_input
+POSTHOOK: query: LOAD DATA LOCAL INPATH '../../data/files/in4.txt' into table smb_input
+POSTHOOK: type: LOAD
+#### A masked pattern was here ####
+POSTHOOK: Output: default@smb_input
+PREHOOK: query: LOAD DATA LOCAL INPATH '../../data/files/in5.txt' into table smb_input
+PREHOOK: type: LOAD
+#### A masked pattern was here ####
+PREHOOK: Output: default@smb_input
+POSTHOOK: query: LOAD DATA LOCAL INPATH '../../data/files/in5.txt' into table smb_input
+POSTHOOK: type: LOAD
+#### A masked pattern was here ####
+POSTHOOK: Output: default@smb_input
+PREHOOK: query: -- smbs
+CREATE TABLE smb_input1(key int, value int) CLUSTERED BY (key) SORTED BY (key) INTO 2 BUCKETS
+PREHOOK: type: CREATETABLE
+PREHOOK: Output: database:default
+PREHOOK: Output: default@smb_input1
+POSTHOOK: query: -- smbs
+CREATE TABLE smb_input1(key int, value int) CLUSTERED BY (key) SORTED BY (key) INTO 2 BUCKETS
+POSTHOOK: type: CREATETABLE
+POSTHOOK: Output: database:default
+POSTHOOK: Output: default@smb_input1
+PREHOOK: query: CREATE TABLE smb_input2(key int, value int) CLUSTERED BY (value) SORTED BY (value) INTO 2 BUCKETS
+PREHOOK: type: CREATETABLE
+PREHOOK: Output: database:default
+PREHOOK: Output: default@smb_input2
+POSTHOOK: query: CREATE TABLE smb_input2(key int, value int) CLUSTERED BY (value) SORTED BY (value) INTO 2 BUCKETS
+POSTHOOK: type: CREATETABLE
+POSTHOOK: Output: database:default
+POSTHOOK: Output: default@smb_input2
+PREHOOK: query: from smb_input
+insert overwrite table smb_input1 select *
+insert overwrite table smb_input2 select *
+PREHOOK: type: QUERY
+PREHOOK: Input: default@smb_input
+PREHOOK: Output: default@smb_input1
+PREHOOK: Output: default@smb_input2
+POSTHOOK: query: from smb_input
+insert overwrite table smb_input1 select *
+insert overwrite table smb_input2 select *
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@smb_input
+POSTHOOK: Output: default@smb_input1
+POSTHOOK: Output: default@smb_input2
+POSTHOOK: Lineage: smb_input1.key SIMPLE [(smb_input)smb_input.FieldSchema(name:key, type:int, comment:null), ]
+POSTHOOK: Lineage: smb_input1.value SIMPLE [(smb_input)smb_input.FieldSchema(name:value, type:int, comment:null), ]
+POSTHOOK: Lineage: smb_input2.key SIMPLE [(smb_input)smb_input.FieldSchema(name:key, type:int, comment:null), ]
+POSTHOOK: Lineage: smb_input2.value SIMPLE [(smb_input)smb_input.FieldSchema(name:value, type:int, comment:null), ]
+PREHOOK: query: SELECT /*+ MAPJOIN(a) */ * FROM smb_input1 a JOIN smb_input1 b ON a.key <=> b.key
+PREHOOK: type: QUERY
+PREHOOK: Input: default@smb_input1
+#### A masked pattern was here ####
+POSTHOOK: query: SELECT /*+ MAPJOIN(a) */ * FROM smb_input1 a JOIN smb_input1 b ON a.key <=> b.key
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@smb_input1
+#### A masked pattern was here ####
+10	100	10	100
+10	100	10	100
+10	100	10	100
+10	100	10	100
+10	100	10	1000
+10	100	10	1000
+10	1000	10	100
+10	1000	10	100
+10	1000	10	1000
+100	100	100	100
+12	100	12	100
+12	100	12	NULL
+12	NULL	12	100
+12	NULL	12	NULL
+15	10015	15	10015
+20	10020	20	10020
+25	10025	25	10025
+30	10030	30	10030
+35	10035	35	10035
+40	10040	40	10040
+40	10040	40	10040
+40	10040	40	10040
+40	10040	40	10040
+5	10005	5	10005
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+60	10040	60	10040
+60	10040	60	10040
+60	10040	60	10040
+60	10040	60	10040
+70	10040	70	10040
+70	10040	70	10040
+70	10040	70	10040
+70	10040	70	10040
+80	10040	80	10040
+80	10040	80	10040
+80	10040	80	10040
+80	10040	80	10040
+NULL	10050	NULL	10050
+NULL	10050	NULL	35
+NULL	10050	NULL	NULL
+NULL	35	NULL	10050
+NULL	35	NULL	35
+NULL	35	NULL	NULL
+NULL	NULL	NULL	10050
+NULL	NULL	NULL	35
+NULL	NULL	NULL	NULL
+PREHOOK: query: SELECT /*+ MAPJOIN(a) */ * FROM smb_input1 a JOIN smb_input1 b ON a.key <=> b.key AND a.value <=> b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@smb_input1
+#### A masked pattern was here ####
+POSTHOOK: query: SELECT /*+ MAPJOIN(a) */ * FROM smb_input1 a JOIN smb_input1 b ON a.key <=> b.key AND a.value <=> b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@smb_input1
+#### A masked pattern was here ####
+10	100	10	100
+10	100	10	100
+10	100	10	100
+10	100	10	100
+10	1000	10	1000
+100	100	100	100
+12	100	12	100
+12	NULL	12	NULL
+15	10015	15	10015
+20	10020	20	10020
+25	10025	25	10025
+30	10030	30	10030
+35	10035	35	10035
+40	10040	40	10040
+40	10040	40	10040
+40	10040	40	10040
+40	10040	40	10040
+5	10005	5	10005
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+60	10040	60	10040
+60	10040	60	10040
+60	10040	60	10040
+60	10040	60	10040
+70	10040	70	10040
+70	10040	70	10040
+70	10040	70	10040
+70	10040	70	10040
+80	10040	80	10040
+80	10040	80	10040
+80	10040	80	10040
+80	10040	80	10040
+NULL	10050	NULL	10050
+NULL	35	NULL	35
+NULL	NULL	NULL	NULL
+PREHOOK: query: SELECT /*+ MAPJOIN(a) */ * FROM smb_input1 a RIGHT OUTER JOIN smb_input1 b ON a.key <=> b.key
+PREHOOK: type: QUERY
+PREHOOK: Input: default@smb_input1
+#### A masked pattern was here ####
+POSTHOOK: query: SELECT /*+ MAPJOIN(a) */ * FROM smb_input1 a RIGHT OUTER JOIN smb_input1 b ON a.key <=> b.key
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@smb_input1
+#### A masked pattern was here ####
+10	100	10	100
+10	100	10	100
+10	100	10	100
+10	100	10	100
+10	100	10	1000
+10	100	10	1000
+10	1000	10	100
+10	1000	10	100
+10	1000	10	1000
+100	100	100	100
+12	100	12	100
+12	100	12	NULL
+12	NULL	12	100
+12	NULL	12	NULL
+15	10015	15	10015
+20	10020	20	10020
+25	10025	25	10025
+30	10030	30	10030
+35	10035	35	10035
+40	10040	40	10040
+40	10040	40	10040
+40	10040	40	10040
+40	10040	40	10040
+5	10005	5	10005
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+60	10040	60	10040
+60	10040	60	10040
+60	10040	60	10040
+60	10040	60	10040
+70	10040	70	10040
+70	10040	70	10040
+70	10040	70	10040
+70	10040	70	10040
+80	10040	80	10040
+80	10040	80	10040
+80	10040	80	10040
+80	10040	80	10040
+NULL	10050	NULL	10050
+NULL	10050	NULL	35
+NULL	10050	NULL	NULL
+NULL	35	NULL	10050
+NULL	35	NULL	35
+NULL	35	NULL	NULL
+NULL	NULL	NULL	10050
+NULL	NULL	NULL	35
+NULL	NULL	NULL	NULL
+PREHOOK: query: SELECT /*+ MAPJOIN(b) */ * FROM smb_input1 a JOIN smb_input1 b ON a.key <=> b.key
+PREHOOK: type: QUERY
+PREHOOK: Input: default@smb_input1
+#### A masked pattern was here ####
+POSTHOOK: query: SELECT /*+ MAPJOIN(b) */ * FROM smb_input1 a JOIN smb_input1 b ON a.key <=> b.key
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@smb_input1
+#### A masked pattern was here ####
+10	100	10	100
+10	100	10	100
+10	100	10	100
+10	100	10	100
+10	100	10	1000
+10	100	10	1000
+10	1000	10	100
+10	1000	10	100
+10	1000	10	1000
+100	100	100	100
+12	100	12	100
+12	100	12	NULL
+12	NULL	12	100
+12	NULL	12	NULL
+15	10015	15	10015
+20	10020	20	10020
+25	10025	25	10025
+30	10030	30	10030
+35	10035	35	10035
+40	10040	40	10040
+40	10040	40	10040
+40	10040	40	10040
+40	10040	40	10040
+5	10005	5	10005
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+60	10040	60	10040
+60	10040	60	10040
+60	10040	60	10040
+60	10040	60	10040
+70	10040	70	10040
+70	10040	70	10040
+70	10040	70	10040
+70	10040	70	10040
+80	10040	80	10040
+80	10040	80	10040
+80	10040	80	10040
+80	10040	80	10040
+NULL	10050	NULL	10050
+NULL	10050	NULL	35
+NULL	10050	NULL	NULL
+NULL	35	NULL	10050
+NULL	35	NULL	35
+NULL	35	NULL	NULL
+NULL	NULL	NULL	10050
+NULL	NULL	NULL	35
+NULL	NULL	NULL	NULL
+PREHOOK: query: SELECT /*+ MAPJOIN(b) */ * FROM smb_input1 a LEFT OUTER JOIN smb_input1 b ON a.key <=> b.key
+PREHOOK: type: QUERY
+PREHOOK: Input: default@smb_input1
+#### A masked pattern was here ####
+POSTHOOK: query: SELECT /*+ MAPJOIN(b) */ * FROM smb_input1 a LEFT OUTER JOIN smb_input1 b ON a.key <=> b.key
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@smb_input1
+#### A masked pattern was here ####
+10	100	10	100
+10	100	10	100
+10	100	10	100
+10	100	10	100
+10	100	10	1000
+10	100	10	1000
+10	1000	10	100
+10	1000	10	100
+10	1000	10	1000
+100	100	100	100
+12	100	12	100
+12	100	12	NULL
+12	NULL	12	100
+12	NULL	12	NULL
+15	10015	15	10015
+20	10020	20	10020
+25	10025	25	10025
+30	10030	30	10030
+35	10035	35	10035
+40	10040	40	10040
+40	10040	40	10040
+40	10040	40	10040
+40	10040	40	10040
+5	10005	5	10005
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+60	10040	60	10040
+60	10040	60	10040
+60	10040	60	10040
+60	10040	60	10040
+70	10040	70	10040
+70	10040	70	10040
+70	10040	70	10040
+70	10040	70	10040
+80	10040	80	10040
+80	10040	80	10040
+80	10040	80	10040
+80	10040	80	10040
+NULL	10050	NULL	10050
+NULL	10050	NULL	35
+NULL	10050	NULL	NULL
+NULL	35	NULL	10050
+NULL	35	NULL	35
+NULL	35	NULL	NULL
+NULL	NULL	NULL	10050
+NULL	NULL	NULL	35
+NULL	NULL	NULL	NULL
+PREHOOK: query: SELECT /*+ MAPJOIN(a) */ * FROM smb_input1 a JOIN smb_input2 b ON a.key <=> b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@smb_input1
+PREHOOK: Input: default@smb_input2
+#### A masked pattern was here ####
+POSTHOOK: query: SELECT /*+ MAPJOIN(a) */ * FROM smb_input1 a JOIN smb_input2 b ON a.key <=> b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@smb_input1
+POSTHOOK: Input: default@smb_input2
+#### A masked pattern was here ####
+100	100	10	100
+100	100	10	100
+100	100	100	100
+100	100	12	100
+35	10035	NULL	35
+NULL	10050	12	NULL
+NULL	10050	NULL	NULL
+NULL	35	12	NULL
+NULL	35	NULL	NULL
+NULL	NULL	12	NULL
+NULL	NULL	NULL	NULL
+PREHOOK: query: SELECT /*+ MAPJOIN(b) */ * FROM smb_input1 a JOIN smb_input2 b ON a.key <=> b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@smb_input1
+PREHOOK: Input: default@smb_input2
+#### A masked pattern was here ####
+POSTHOOK: query: SELECT /*+ MAPJOIN(b) */ * FROM smb_input1 a JOIN smb_input2 b ON a.key <=> b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@smb_input1
+POSTHOOK: Input: default@smb_input2
+#### A masked pattern was here ####
+100	100	10	100
+100	100	10	100
+100	100	100	100
+100	100	12	100
+35	10035	NULL	35
+NULL	10050	12	NULL
+NULL	10050	NULL	NULL
+NULL	35	12	NULL
+NULL	35	NULL	NULL
+NULL	NULL	12	NULL
+NULL	NULL	NULL	NULL
+PREHOOK: query: SELECT /*+ MAPJOIN(b) */ * FROM smb_input1 a LEFT OUTER JOIN smb_input2 b ON a.key <=> b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@smb_input1
+PREHOOK: Input: default@smb_input2
+#### A masked pattern was here ####
+POSTHOOK: query: SELECT /*+ MAPJOIN(b) */ * FROM smb_input1 a LEFT OUTER JOIN smb_input2 b ON a.key <=> b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@smb_input1
+POSTHOOK: Input: default@smb_input2
+#### A masked pattern was here ####
+10	100	NULL	NULL
+10	100	NULL	NULL
+10	1000	NULL	NULL
+100	100	10	100
+100	100	10	100
+100	100	100	100
+100	100	12	100
+12	100	NULL	NULL
+12	NULL	NULL	NULL
+15	10015	NULL	NULL
+20	10020	NULL	NULL
+25	10025	NULL	NULL
+30	10030	NULL	NULL
+35	10035	NULL	35
+40	10040	NULL	NULL
+40	10040	NULL	NULL
+5	10005	NULL	NULL
+50	10050	NULL	NULL
+50	10050	NULL	NULL
+50	10050	NULL	NULL
+60	10040	NULL	NULL
+60	10040	NULL	NULL
+70	10040	NULL	NULL
+70	10040	NULL	NULL
+80	10040	NULL	NULL
+80	10040	NULL	NULL
+NULL	10050	12	NULL
+NULL	10050	NULL	NULL
+NULL	35	12	NULL
+NULL	35	NULL	NULL
+NULL	NULL	12	NULL
+NULL	NULL	NULL	NULL
+PREHOOK: query: SELECT /*+ MAPJOIN(a) */ * FROM smb_input1 a RIGHT OUTER JOIN smb_input2 b ON a.key <=> b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@smb_input1
+PREHOOK: Input: default@smb_input2
+#### A masked pattern was here ####
+POSTHOOK: query: SELECT /*+ MAPJOIN(a) */ * FROM smb_input1 a RIGHT OUTER JOIN smb_input2 b ON a.key <=> b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@smb_input1
+POSTHOOK: Input: default@smb_input2
+#### A masked pattern was here ####
+100	100	10	100
+100	100	10	100
+100	100	100	100
+100	100	12	100
+35	10035	NULL	35
+NULL	10050	12	NULL
+NULL	10050	NULL	NULL
+NULL	35	12	NULL
+NULL	35	NULL	NULL
+NULL	NULL	10	1000
+NULL	NULL	12	NULL
+NULL	NULL	15	10015
+NULL	NULL	20	10020
+NULL	NULL	25	10025
+NULL	NULL	30	10030
+NULL	NULL	35	10035
+NULL	NULL	40	10040
+NULL	NULL	40	10040
+NULL	NULL	5	10005
+NULL	NULL	50	10050
+NULL	NULL	50	10050
+NULL	NULL	50	10050
+NULL	NULL	60	10040
+NULL	NULL	60	10040
+NULL	NULL	70	10040
+NULL	NULL	70	10040
+NULL	NULL	80	10040
+NULL	NULL	80	10040
+NULL	NULL	NULL	10050
+NULL	NULL	NULL	NULL
+PREHOOK: query: SELECT /*+ MAPJOIN(a) */ * FROM smb_input2 a JOIN smb_input2 b ON a.value <=> b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@smb_input2
+#### A masked pattern was here ####
+POSTHOOK: query: SELECT /*+ MAPJOIN(a) */ * FROM smb_input2 a JOIN smb_input2 b ON a.value <=> b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@smb_input2
+#### A masked pattern was here ####
+10	100	10	100
+10	100	10	100
+10	100	10	100
+10	100	10	100
+10	100	100	100
+10	100	100	100
+10	100	12	100
+10	100	12	100
+10	1000	10	1000
+100	100	10	100
+100	100	10	100
+100	100	100	100
+100	100	12	100
+12	100	10	100
+12	100	10	100
+12	100	100	100
+12	100	12	100
+12	NULL	12	NULL
+12	NULL	NULL	NULL
+15	10015	15	10015
+20	10020	20	10020
+25	10025	25	10025
+30	10030	30	10030
+35	10035	35	10035
+40	10040	40	10040
+40	10040	40	10040
+40	10040	40	10040
+40	10040	40	10040
+40	10040	60	10040
+40	10040	60	10040
+40	10040	60	10040
+40	10040	60	10040
+40	10040	70	10040
+40	10040	70	10040
+40	10040	70	10040
+40	10040	70	10040
+40	10040	80	10040
+40	10040	80	10040
+40	10040	80	10040
+40	10040	80	10040
+5	10005	5	10005
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	NULL	10050
+50	10050	NULL	10050
+50	10050	NULL	10050
+60	10040	40	10040
+60	10040	40	10040
+60	10040	40	10040
+60	10040	40	10040
+60	10040	60	10040
+60	10040	60	10040
+60	10040	60	10040
+60	10040	60	10040
+60	10040	70	10040
+60	10040	70	10040
+60	10040	70	10040
+60	10040	70	10040
+60	10040	80	10040
+60	10040	80	10040
+60	10040	80	10040
+60	10040	80	10040
+70	10040	40	10040
+70	10040	40	10040
+70	10040	40	10040
+70	10040	40	10040
+70	10040	60	10040
+70	10040	60	10040
+70	10040	60	10040
+70	10040	60	10040
+70	10040	70	10040
+70	10040	70	10040
+70	10040	70	10040
+70	10040	70	10040
+70	10040	80	10040
+70	10040	80	10040
+70	10040	80	10040
+70	10040	80	10040
+80	10040	40	10040
+80	10040	40	10040
+80	10040	40	10040
+80	10040	40	10040
+80	10040	60	10040
+80	10040	60	10040
+80	10040	60	10040
+80	10040	60	10040
+80	10040	70	10040
+80	10040	70	10040
+80	10040	70	10040
+80	10040	70	10040
+80	10040	80	10040
+80	10040	80	10040
+80	10040	80	10040
+80	10040	80	10040
+NULL	10050	50	10050
+NULL	10050	50	10050
+NULL	10050	50	10050
+NULL	10050	NULL	10050
+NULL	35	NULL	35
+NULL	NULL	12	NULL
+NULL	NULL	NULL	NULL
+PREHOOK: query: SELECT /*+ MAPJOIN(a) */ * FROM smb_input2 a RIGHT OUTER JOIN smb_input2 b ON a.value <=> b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@smb_input2
+#### A masked pattern was here ####
+POSTHOOK: query: SELECT /*+ MAPJOIN(a) */ * FROM smb_input2 a RIGHT OUTER JOIN smb_input2 b ON a.value <=> b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@smb_input2
+#### A masked pattern was here ####
+10	100	10	100
+10	100	10	100
+10	100	10	100
+10	100	10	100
+10	100	100	100
+10	100	100	100
+10	100	12	100
+10	100	12	100
+10	1000	10	1000
+100	100	10	100
+100	100	10	100
+100	100	100	100
+100	100	12	100
+12	100	10	100
+12	100	10	100
+12	100	100	100
+12	100	12	100
+12	NULL	12	NULL
+12	NULL	NULL	NULL
+15	10015	15	10015
+20	10020	20	10020
+25	10025	25	10025
+30	10030	30	10030
+35	10035	35	10035
+40	10040	40	10040
+40	10040	40	10040
+40	10040	40	10040
+40	10040	40	10040
+40	10040	60	10040
+40	10040	60	10040
+40	10040	60	10040
+40	10040	60	10040
+40	10040	70	10040
+40	10040	70	10040
+40	10040	70	10040
+40	10040	70	10040
+40	10040	80	10040
+40	10040	80	10040
+40	10040	80	10040
+40	10040	80	10040
+5	10005	5	10005
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	NULL	10050
+50	10050	NULL	10050
+50	10050	NULL	10050
+60	10040	40	10040
+60	10040	40	10040
+60	10040	40	10040
+60	10040	40	10040
+60	10040	60	10040
+60	10040	60	10040
+60	10040	60	10040
+60	10040	60	10040
+60	10040	70	10040
+60	10040	70	10040
+60	10040	70	10040
+60	10040	70	10040
+60	10040	80	10040
+60	10040	80	10040
+60	10040	80	10040
+60	10040	80	10040
+70	10040	40	10040
+70	10040	40	10040
+70	10040	40	10040
+70	10040	40	10040
+70	10040	60	10040
+70	10040	60	10040
+70	10040	60	10040
+70	10040	60	10040
+70	10040	70	10040
+70	10040	70	10040
+70	10040	70	10040
+70	10040	70	10040
+70	10040	80	10040
+70	10040	80	10040
+70	10040	80	10040
+70	10040	80	10040
+80	10040	40	10040
+80	10040	40	10040
+80	10040	40	10040
+80	10040	40	10040
+80	10040	60	10040
+80	10040	60	10040
+80	10040	60	10040
+80	10040	60	10040
+80	10040	70	10040
+80	10040	70	10040
+80	10040	70	10040
+80	10040	70	10040
+80	10040	80	10040
+80	10040	80	10040
+80	10040	80	10040
+80	10040	80	10040
+NULL	10050	50	10050
+NULL	10050	50	10050
+NULL	10050	50	10050
+NULL	10050	NULL	10050
+NULL	35	NULL	35
+NULL	NULL	12	NULL
+NULL	NULL	NULL	NULL
+PREHOOK: query: SELECT /*+ MAPJOIN(b) */ * FROM smb_input2 a JOIN smb_input2 b ON a.value <=> b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@smb_input2
+#### A masked pattern was here ####
+POSTHOOK: query: SELECT /*+ MAPJOIN(b) */ * FROM smb_input2 a JOIN smb_input2 b ON a.value <=> b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@smb_input2
+#### A masked pattern was here ####
+10	100	10	100
+10	100	10	100
+10	100	10	100
+10	100	10	100
+10	100	100	100
+10	100	100	100
+10	100	12	100
+10	100	12	100
+10	1000	10	1000
+100	100	10	100
+100	100	10	100
+100	100	100	100
+100	100	12	100
+12	100	10	100
+12	100	10	100
+12	100	100	100
+12	100	12	100
+12	NULL	12	NULL
+12	NULL	NULL	NULL
+15	10015	15	10015
+20	10020	20	10020
+25	10025	25	10025
+30	10030	30	10030
+35	10035	35	10035
+40	10040	40	10040
+40	10040	40	10040
+40	10040	40	10040
+40	10040	40	10040
+40	10040	60	10040
+40	10040	60	10040
+40	10040	60	10040
+40	10040	60	10040
+40	10040	70	10040
+40	10040	70	10040
+40	10040	70	10040
+40	10040	70	10040
+40	10040	80	10040
+40	10040	80	10040
+40	10040	80	10040
+40	10040	80	10040
+5	10005	5	10005
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	NULL	10050
+50	10050	NULL	10050
+50	10050	NULL	10050
+60	10040	40	10040
+60	10040	40	10040
+60	10040	40	10040
+60	10040	40	10040
+60	10040	60	10040
+60	10040	60	10040
+60	10040	60	10040
+60	10040	60	10040
+60	10040	70	10040
+60	10040	70	10040
+60	10040	70	10040
+60	10040	70	10040
+60	10040	80	10040
+60	10040	80	10040
+60	10040	80	10040
+60	10040	80	10040
+70	10040	40	10040
+70	10040	40	10040
+70	10040	40	10040
+70	10040	40	10040
+70	10040	60	10040
+70	10040	60	10040
+70	10040	60	10040
+70	10040	60	10040
+70	10040	70	10040
+70	10040	70	10040
+70	10040	70	10040
+70	10040	70	10040
+70	10040	80	10040
+70	10040	80	10040
+70	10040	80	10040
+70	10040	80	10040
+80	10040	40	10040
+80	10040	40	10040
+80	10040	40	10040
+80	10040	40	10040
+80	10040	60	10040
+80	10040	60	10040
+80	10040	60	10040
+80	10040	60	10040
+80	10040	70	10040
+80	10040	70	10040
+80	10040	70	10040
+80	10040	70	10040
+80	10040	80	10040
+80	10040	80	10040
+80	10040	80	10040
+80	10040	80	10040
+NULL	10050	50	10050
+NULL	10050	50	10050
+NULL	10050	50	10050
+NULL	10050	NULL	10050
+NULL	35	NULL	35
+NULL	NULL	12	NULL
+NULL	NULL	NULL	NULL
+PREHOOK: query: SELECT /*+ MAPJOIN(b) */ * FROM smb_input2 a LEFT OUTER JOIN smb_input2 b ON a.value <=> b.value
+PREHOOK: type: QUERY
+PREHOOK: Input: default@smb_input2
+#### A masked pattern was here ####
+POSTHOOK: query: SELECT /*+ MAPJOIN(b) */ * FROM smb_input2 a LEFT OUTER JOIN smb_input2 b ON a.value <=> b.value
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@smb_input2
+#### A masked pattern was here ####
+10	100	10	100
+10	100	10	100
+10	100	10	100
+10	100	10	100
+10	100	100	100
+10	100	100	100
+10	100	12	100
+10	100	12	100
+10	1000	10	1000
+100	100	10	100
+100	100	10	100
+100	100	100	100
+100	100	12	100
+12	100	10	100
+12	100	10	100
+12	100	100	100
+12	100	12	100
+12	NULL	12	NULL
+12	NULL	NULL	NULL
+15	10015	15	10015
+20	10020	20	10020
+25	10025	25	10025
+30	10030	30	10030
+35	10035	35	10035
+40	10040	40	10040
+40	10040	40	10040
+40	10040	40	10040
+40	10040	40	10040
+40	10040	60	10040
+40	10040	60	10040
+40	10040	60	10040
+40	10040	60	10040
+40	10040	70	10040
+40	10040	70	10040
+40	10040	70	10040
+40	10040	70	10040
+40	10040	80	10040
+40	10040	80	10040
+40	10040	80	10040
+40	10040	80	10040
+5	10005	5	10005
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	50	10050
+50	10050	NULL	10050
+50	10050	NULL	10050
+50	10050	NULL	10050
+60	10040	40	10040
+60	10040	40	10040
+60	10040	40	10040
+60	10040	40	10040
+60	10040	60	10040
+60	10040	60	10040
+60	10040	60	10040
+60	10040	60	10040
+60	10040	70	10040
+60	10040	70	10040
+60	10040	70	10040
+60	10040	70	10040
+60	10040	80	10040
+60	10040	80	10040
+60	10040	80	10040
+60	10040	80	10040
+70	10040	40	10040
+70	10040	40	10040
+70	10040	40	10040
+70	10040	40	10040
+70	10040	60	10040
+70	10040	60	10040
+70	10040	60	10040
+70	10040	60	10040
+70	10040	70	10040
+70	10040	70	10040
+70	10040	70	10040
+70	10040	70	10040
+70	10040	80	10040
+70	10040	80	10040
+70	10040	80	10040
+70	10040	80	10040
+80	10040	40	10040
+80	10040	40	10040
+80	10040	40	10040
+80	10040	40	10040
+80	10040	60	10040
+80	10040	60	10040
+80	10040	60	10040
+80	10040	60	10040
+80	10040	70	10040
+80	10040	70	10040
+80	10040	70	10040
+80	10040	70	10040
+80	10040	80	10040
+80	10040	80	10040
+80	10040	80	10040
+80	10040	80	10040
+NULL	10050	50	10050
+NULL	10050	50	10050
+NULL	10050	50	10050
+NULL	10050	NULL	10050
+NULL	35	NULL	35
+NULL	NULL	12	NULL
+NULL	NULL	NULL	NULL
+PREHOOK: query: --HIVE-3315 join predicate transitive
+explain select * from myinput1 a join myinput1 b on a.key<=>b.value AND a.key is NULL
+PREHOOK: type: QUERY
+POSTHOOK: query: --HIVE-3315 join predicate transitive
+explain select * from myinput1 a join myinput1 b on a.key<=>b.value AND a.key is NULL
+POSTHOOK: type: QUERY
+STAGE DEPENDENCIES:
+  Stage-1 is a root stage
+  Stage-0 depends on stages: Stage-1
+
+STAGE PLANS:
+  Stage: Stage-1
+    Tez
+      Edges:
+        Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE)
+#### A masked pattern was here ####
+      Vertices:
+        Map 1 
+            Map Operator Tree:
+                TableScan
+                  alias: b
+                  Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+                  Filter Operator
+                    predicate: value is null (type: boolean)
+                    Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
+                    Reduce Output Operator
+                      key expressions: null (type: void)
+                      sort order: +
+                      Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
+                      value expressions: key (type: int)
+        Map 3 
+            Map Operator Tree:
+                TableScan
+                  alias: a
+                  Statistics: Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE
+                  Filter Operator
+                    predicate: key is null (type: boolean)
+                    Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
+                    Reduce Output Operator
+                      key expressions: null (type: void)
+                      sort order: +
+                      Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
+                      value expressions: value (type: int)
+        Reducer 2 
+            Reduce Operator Tree:
+              Merge Join Operator
+                condition map:
+                     Inner Join 0 to 1
+                condition expressions:
+                  0 {VALUE._col0}
+                  1 {VALUE._col0}
+                nullSafes: [true]
+                outputColumnNames: _col1, _col5
+                Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
+                Select Operator
+                  expressions: null (type: void), _col1 (type: int), _col5 (type: int), null (type: void)
+                  outputColumnNames: _col0, _col1, _col2, _col3
+                  Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
+                  File Output Operator
+                    compressed: false
+                    Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
+                    table:
+                        input format: org.apache.hadoop.mapred.TextInputFormat
+                        output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
+                        serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+
+  Stage: Stage-0
+    Fetch Operator
+      limit: -1
+      Processor Tree:
+        ListSink
+
+PREHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value AND a.key is NULL
+PREHOOK: type: QUERY
+PREHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+POSTHOOK: query: select * from myinput1 a join myinput1 b on a.key<=>b.value AND a.key is NULL
+POSTHOOK: type: QUERY
+POSTHOOK: Input: default@myinput1
+#### A masked pattern was here ####
+NULL	10	10	NULL
+NULL	10	48	NULL
+NULL	10	NULL	NULL
+NULL	35	10	NULL
+NULL	35	48	NULL
+NULL	35	NULL	NULL
+NULL	NULL	10	NULL
+NULL	NULL	48	NULL
+NULL	NULL	NULL	NULL

Modified: hive/trunk/ql/src/test/results/clientpositive/tez/tez_union_group_by.q.out
URL: http://svn.apache.org/viewvc/hive/trunk/ql/src/test/results/clientpositive/tez/tez_union_group_by.q.out?rev=1637489&r1=1637488&r2=1637489&view=diff
==============================================================================
--- hive/trunk/ql/src/test/results/clientpositive/tez/tez_union_group_by.q.out (original)
+++ hive/trunk/ql/src/test/results/clientpositive/tez/tez_union_group_by.q.out Sat Nov  8 00:00:19 2014
@@ -180,6 +180,7 @@ STAGE PLANS:
                 condition expressions:
                   0 {VALUE._col0}
                   1 
+                nullSafes: [false, true]
                 outputColumnNames: _col0
                 Statistics: Num rows: 0 Data size: 0 Basic stats: NONE Column stats: NONE
                 Select Operator