You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@hive.apache.org by kg...@apache.org on 2017/12/20 10:40:15 UTC

[14/37] hive git commit: HIVE-18149: Stats: rownum estimation from datasize underestimates in most cases (Zoltan Haindrich, reviewed by Ashutosh Chauhan)

http://git-wip-us.apache.org/repos/asf/hive/blob/e26b9325/ql/src/test/results/clientpositive/spark/smb_mapjoin_2.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/spark/smb_mapjoin_2.q.out b/ql/src/test/results/clientpositive/spark/smb_mapjoin_2.q.out
index ed7c5bf..da419fe 100644
--- a/ql/src/test/results/clientpositive/spark/smb_mapjoin_2.q.out
+++ b/ql/src/test/results/clientpositive/spark/smb_mapjoin_2.q.out
@@ -65,10 +65,10 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: b
-                  Statistics: Num rows: 1 Data size: 222 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2220 Basic stats: COMPLETE Column stats: NONE
                   Filter Operator
                     predicate: key is not null (type: boolean)
-                    Statistics: Num rows: 1 Data size: 222 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2220 Basic stats: COMPLETE Column stats: NONE
                     Sorted Merge Bucket Map Join Operator
                       condition map:
                            Inner Join 0 to 1
@@ -76,14 +76,14 @@ STAGE PLANS:
                         0 key (type: int)
                         1 key (type: int)
                       outputColumnNames: _col0, _col1, _col5, _col6
-                      Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                       Select Operator
                         expressions: _col0 (type: int), _col1 (type: string), _col5 (type: int), _col6 (type: string)
                         outputColumnNames: _col0, _col1, _col2, _col3
-                        Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                         File Output Operator
                           compressed: false
-                          Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                          Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                           table:
                               input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                               output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -126,7 +126,7 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: b
-                  Statistics: Num rows: 1 Data size: 222 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2220 Basic stats: COMPLETE Column stats: NONE
                   Sorted Merge Bucket Map Join Operator
                     condition map:
                          Left Outer Join 0 to 1
@@ -134,14 +134,14 @@ STAGE PLANS:
                       0 key (type: int)
                       1 key (type: int)
                     outputColumnNames: _col0, _col1, _col5, _col6
-                    Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: _col0 (type: int), _col1 (type: string), _col5 (type: int), _col6 (type: string)
                       outputColumnNames: _col0, _col1, _col2, _col3
-                      Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                       File Output Operator
                         compressed: false
-                        Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                         table:
                             input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                             output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -187,7 +187,7 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: b
-                  Statistics: Num rows: 1 Data size: 222 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2220 Basic stats: COMPLETE Column stats: NONE
                   Sorted Merge Bucket Map Join Operator
                     condition map:
                          Right Outer Join 0 to 1
@@ -195,14 +195,14 @@ STAGE PLANS:
                       0 key (type: int)
                       1 key (type: int)
                     outputColumnNames: _col0, _col1, _col5, _col6
-                    Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: _col0 (type: int), _col1 (type: string), _col5 (type: int), _col6 (type: string)
                       outputColumnNames: _col0, _col1, _col2, _col3
-                      Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                       File Output Operator
                         compressed: false
-                        Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                         table:
                             input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                             output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -249,7 +249,7 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: b
-                  Statistics: Num rows: 1 Data size: 222 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2220 Basic stats: COMPLETE Column stats: NONE
                   Sorted Merge Bucket Map Join Operator
                     condition map:
                          Outer Join 0 to 1
@@ -257,14 +257,14 @@ STAGE PLANS:
                       0 key (type: int)
                       1 key (type: int)
                     outputColumnNames: _col0, _col1, _col5, _col6
-                    Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: _col0 (type: int), _col1 (type: string), _col5 (type: int), _col6 (type: string)
                       outputColumnNames: _col0, _col1, _col2, _col3
-                      Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                       File Output Operator
                         compressed: false
-                        Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                         table:
                             input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                             output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -314,10 +314,10 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: a
-                  Statistics: Num rows: 1 Data size: 208 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2080 Basic stats: COMPLETE Column stats: NONE
                   Filter Operator
                     predicate: key is not null (type: boolean)
-                    Statistics: Num rows: 1 Data size: 208 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2080 Basic stats: COMPLETE Column stats: NONE
                     Sorted Merge Bucket Map Join Operator
                       condition map:
                            Inner Join 0 to 1
@@ -325,14 +325,14 @@ STAGE PLANS:
                         0 key (type: int)
                         1 key (type: int)
                       outputColumnNames: _col0, _col1, _col5, _col6
-                      Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                       Select Operator
                         expressions: _col0 (type: int), _col1 (type: string), _col5 (type: int), _col6 (type: string)
                         outputColumnNames: _col0, _col1, _col2, _col3
-                        Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                         File Output Operator
                           compressed: false
-                          Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                          Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                           table:
                               input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                               output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -375,7 +375,7 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: a
-                  Statistics: Num rows: 1 Data size: 208 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2080 Basic stats: COMPLETE Column stats: NONE
                   Sorted Merge Bucket Map Join Operator
                     condition map:
                          Left Outer Join 0 to 1
@@ -383,14 +383,14 @@ STAGE PLANS:
                       0 key (type: int)
                       1 key (type: int)
                     outputColumnNames: _col0, _col1, _col5, _col6
-                    Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: _col0 (type: int), _col1 (type: string), _col5 (type: int), _col6 (type: string)
                       outputColumnNames: _col0, _col1, _col2, _col3
-                      Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                       File Output Operator
                         compressed: false
-                        Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                         table:
                             input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                             output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -436,7 +436,7 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: a
-                  Statistics: Num rows: 1 Data size: 208 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2080 Basic stats: COMPLETE Column stats: NONE
                   Sorted Merge Bucket Map Join Operator
                     condition map:
                          Right Outer Join 0 to 1
@@ -444,14 +444,14 @@ STAGE PLANS:
                       0 key (type: int)
                       1 key (type: int)
                     outputColumnNames: _col0, _col1, _col5, _col6
-                    Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: _col0 (type: int), _col1 (type: string), _col5 (type: int), _col6 (type: string)
                       outputColumnNames: _col0, _col1, _col2, _col3
-                      Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                       File Output Operator
                         compressed: false
-                        Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                         table:
                             input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                             output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -498,7 +498,7 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: a
-                  Statistics: Num rows: 1 Data size: 208 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2080 Basic stats: COMPLETE Column stats: NONE
                   Sorted Merge Bucket Map Join Operator
                     condition map:
                          Outer Join 0 to 1
@@ -506,14 +506,14 @@ STAGE PLANS:
                       0 key (type: int)
                       1 key (type: int)
                     outputColumnNames: _col0, _col1, _col5, _col6
-                    Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: _col0 (type: int), _col1 (type: string), _col5 (type: int), _col6 (type: string)
                       outputColumnNames: _col0, _col1, _col2, _col3
-                      Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                       File Output Operator
                         compressed: false
-                        Statistics: Num rows: 1 Data size: 228 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 1 Data size: 2288 Basic stats: COMPLETE Column stats: NONE
                         table:
                             input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                             output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat

http://git-wip-us.apache.org/repos/asf/hive/blob/e26b9325/ql/src/test/results/clientpositive/spark/smb_mapjoin_25.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/spark/smb_mapjoin_25.q.out b/ql/src/test/results/clientpositive/spark/smb_mapjoin_25.q.out
index 8237bed..e9e837f 100644
--- a/ql/src/test/results/clientpositive/spark/smb_mapjoin_25.q.out
+++ b/ql/src/test/results/clientpositive/spark/smb_mapjoin_25.q.out
@@ -72,54 +72,54 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: a
-                  Statistics: Num rows: 1 Data size: 208 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2080 Basic stats: COMPLETE Column stats: NONE
                   Filter Operator
                     predicate: (key = 5) (type: boolean)
-                    Statistics: Num rows: 1 Data size: 208 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2080 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
-                      Statistics: Num rows: 1 Data size: 208 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2080 Basic stats: COMPLETE Column stats: NONE
                       Reduce Output Operator
                         sort order: 
-                        Statistics: Num rows: 1 Data size: 208 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 1 Data size: 2080 Basic stats: COMPLETE Column stats: NONE
         Map 4 
             Map Operator Tree:
                 TableScan
                   alias: b
-                  Statistics: Num rows: 1 Data size: 206 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2060 Basic stats: COMPLETE Column stats: NONE
                   Filter Operator
                     predicate: (5 = key) (type: boolean)
-                    Statistics: Num rows: 1 Data size: 206 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2060 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
-                      Statistics: Num rows: 1 Data size: 206 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2060 Basic stats: COMPLETE Column stats: NONE
                       Reduce Output Operator
                         sort order: 
-                        Statistics: Num rows: 1 Data size: 206 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 1 Data size: 2060 Basic stats: COMPLETE Column stats: NONE
         Map 5 
             Map Operator Tree:
                 TableScan
                   alias: c
-                  Statistics: Num rows: 1 Data size: 206 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2060 Basic stats: COMPLETE Column stats: NONE
                   Filter Operator
                     predicate: (key = 5) (type: boolean)
-                    Statistics: Num rows: 1 Data size: 206 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2060 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
-                      Statistics: Num rows: 1 Data size: 206 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2060 Basic stats: COMPLETE Column stats: NONE
                       Reduce Output Operator
                         sort order: 
-                        Statistics: Num rows: 1 Data size: 206 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 1 Data size: 2060 Basic stats: COMPLETE Column stats: NONE
         Map 7 
             Map Operator Tree:
                 TableScan
                   alias: d
-                  Statistics: Num rows: 1 Data size: 222 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2220 Basic stats: COMPLETE Column stats: NONE
                   Filter Operator
                     predicate: (5 = key) (type: boolean)
-                    Statistics: Num rows: 1 Data size: 222 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2220 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
-                      Statistics: Num rows: 1 Data size: 222 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2220 Basic stats: COMPLETE Column stats: NONE
                       Reduce Output Operator
                         sort order: 
-                        Statistics: Num rows: 1 Data size: 222 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 1 Data size: 2220 Basic stats: COMPLETE Column stats: NONE
         Reducer 2 
             Reduce Operator Tree:
               Join Operator
@@ -128,10 +128,10 @@ STAGE PLANS:
                 keys:
                   0 
                   1 
-                Statistics: Num rows: 1 Data size: 415 Basic stats: COMPLETE Column stats: NONE
+                Statistics: Num rows: 1 Data size: 4141 Basic stats: COMPLETE Column stats: NONE
                 Reduce Output Operator
                   sort order: 
-                  Statistics: Num rows: 1 Data size: 415 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 4141 Basic stats: COMPLETE Column stats: NONE
         Reducer 3 
             Reduce Operator Tree:
               Join Operator
@@ -140,14 +140,14 @@ STAGE PLANS:
                 keys:
                   0 
                   1 
-                Statistics: Num rows: 1 Data size: 845 Basic stats: COMPLETE Column stats: NONE
+                Statistics: Num rows: 1 Data size: 8423 Basic stats: COMPLETE Column stats: NONE
                 Select Operator
                   expressions: 5 (type: int), 5 (type: int)
                   outputColumnNames: _col0, _col1
-                  Statistics: Num rows: 1 Data size: 845 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 8423 Basic stats: COMPLETE Column stats: NONE
                   File Output Operator
                     compressed: false
-                    Statistics: Num rows: 1 Data size: 845 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 8423 Basic stats: COMPLETE Column stats: NONE
                     table:
                         input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                         output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -160,10 +160,10 @@ STAGE PLANS:
                 keys:
                   0 
                   1 
-                Statistics: Num rows: 1 Data size: 429 Basic stats: COMPLETE Column stats: NONE
+                Statistics: Num rows: 1 Data size: 4281 Basic stats: COMPLETE Column stats: NONE
                 Reduce Output Operator
                   sort order: 
-                  Statistics: Num rows: 1 Data size: 429 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 4281 Basic stats: COMPLETE Column stats: NONE
 
   Stage: Stage-0
     Fetch Operator
@@ -195,12 +195,12 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: b
-                  Statistics: Num rows: 1 Data size: 206 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2060 Basic stats: COMPLETE Column stats: NONE
                   Filter Operator
                     predicate: (5 = key) (type: boolean)
-                    Statistics: Num rows: 1 Data size: 206 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2060 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
-                      Statistics: Num rows: 1 Data size: 206 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2060 Basic stats: COMPLETE Column stats: NONE
                       Spark HashTable Sink Operator
                         keys:
                           0 
@@ -216,12 +216,12 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: a
-                  Statistics: Num rows: 1 Data size: 208 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2080 Basic stats: COMPLETE Column stats: NONE
                   Filter Operator
                     predicate: (key = 5) (type: boolean)
-                    Statistics: Num rows: 1 Data size: 208 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2080 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
-                      Statistics: Num rows: 1 Data size: 208 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2080 Basic stats: COMPLETE Column stats: NONE
                       Map Join Operator
                         condition map:
                              Inner Join 0 to 1
@@ -230,7 +230,7 @@ STAGE PLANS:
                           1 
                         input vertices:
                           1 Map 2
-                        Statistics: Num rows: 1 Data size: 415 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 1 Data size: 4141 Basic stats: COMPLETE Column stats: NONE
                         Spark HashTable Sink Operator
                           keys:
                             0 
@@ -241,12 +241,12 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: c
-                  Statistics: Num rows: 1 Data size: 206 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2060 Basic stats: COMPLETE Column stats: NONE
                   Filter Operator
                     predicate: (key = 5) (type: boolean)
-                    Statistics: Num rows: 1 Data size: 206 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2060 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
-                      Statistics: Num rows: 1 Data size: 206 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2060 Basic stats: COMPLETE Column stats: NONE
                       Spark HashTable Sink Operator
                         keys:
                           0 
@@ -262,12 +262,12 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: d
-                  Statistics: Num rows: 1 Data size: 222 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2220 Basic stats: COMPLETE Column stats: NONE
                   Filter Operator
                     predicate: (5 = key) (type: boolean)
-                    Statistics: Num rows: 1 Data size: 222 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2220 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
-                      Statistics: Num rows: 1 Data size: 222 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2220 Basic stats: COMPLETE Column stats: NONE
                       Map Join Operator
                         condition map:
                              Inner Join 0 to 1
@@ -276,7 +276,7 @@ STAGE PLANS:
                           1 
                         input vertices:
                           0 Map 3
-                        Statistics: Num rows: 1 Data size: 429 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 1 Data size: 4281 Basic stats: COMPLETE Column stats: NONE
                         Map Join Operator
                           condition map:
                                Inner Join 0 to 1
@@ -285,14 +285,14 @@ STAGE PLANS:
                             1 
                           input vertices:
                             0 Map 1
-                          Statistics: Num rows: 1 Data size: 845 Basic stats: COMPLETE Column stats: NONE
+                          Statistics: Num rows: 1 Data size: 8423 Basic stats: COMPLETE Column stats: NONE
                           Select Operator
                             expressions: 5 (type: int), 5 (type: int)
                             outputColumnNames: _col0, _col1
-                            Statistics: Num rows: 1 Data size: 845 Basic stats: COMPLETE Column stats: NONE
+                            Statistics: Num rows: 1 Data size: 8423 Basic stats: COMPLETE Column stats: NONE
                             File Output Operator
                               compressed: false
-                              Statistics: Num rows: 1 Data size: 845 Basic stats: COMPLETE Column stats: NONE
+                              Statistics: Num rows: 1 Data size: 8423 Basic stats: COMPLETE Column stats: NONE
                               table:
                                   input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                                   output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat

http://git-wip-us.apache.org/repos/asf/hive/blob/e26b9325/ql/src/test/results/clientpositive/spark/smb_mapjoin_3.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/spark/smb_mapjoin_3.q.out b/ql/src/test/results/clientpositive/spark/smb_mapjoin_3.q.out
index c63ff7f..9362085 100644
--- a/ql/src/test/results/clientpositive/spark/smb_mapjoin_3.q.out
+++ b/ql/src/test/results/clientpositive/spark/smb_mapjoin_3.q.out
@@ -65,10 +65,10 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: b
-                  Statistics: Num rows: 1 Data size: 222 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2220 Basic stats: COMPLETE Column stats: NONE
                   Filter Operator
                     predicate: key is not null (type: boolean)
-                    Statistics: Num rows: 1 Data size: 222 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2220 Basic stats: COMPLETE Column stats: NONE
                     Sorted Merge Bucket Map Join Operator
                       condition map:
                            Inner Join 0 to 1
@@ -76,14 +76,14 @@ STAGE PLANS:
                         0 key (type: int)
                         1 key (type: int)
                       outputColumnNames: _col0, _col1, _col5, _col6
-                      Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                       Select Operator
                         expressions: _col0 (type: int), _col1 (type: string), _col5 (type: int), _col6 (type: string)
                         outputColumnNames: _col0, _col1, _col2, _col3
-                        Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                         File Output Operator
                           compressed: false
-                          Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                          Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                           table:
                               input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                               output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -126,7 +126,7 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: b
-                  Statistics: Num rows: 1 Data size: 222 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2220 Basic stats: COMPLETE Column stats: NONE
                   Sorted Merge Bucket Map Join Operator
                     condition map:
                          Left Outer Join 0 to 1
@@ -134,14 +134,14 @@ STAGE PLANS:
                       0 key (type: int)
                       1 key (type: int)
                     outputColumnNames: _col0, _col1, _col5, _col6
-                    Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: _col0 (type: int), _col1 (type: string), _col5 (type: int), _col6 (type: string)
                       outputColumnNames: _col0, _col1, _col2, _col3
-                      Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                       File Output Operator
                         compressed: false
-                        Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                         table:
                             input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                             output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -186,7 +186,7 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: b
-                  Statistics: Num rows: 1 Data size: 222 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2220 Basic stats: COMPLETE Column stats: NONE
                   Sorted Merge Bucket Map Join Operator
                     condition map:
                          Right Outer Join 0 to 1
@@ -194,14 +194,14 @@ STAGE PLANS:
                       0 key (type: int)
                       1 key (type: int)
                     outputColumnNames: _col0, _col1, _col5, _col6
-                    Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: _col0 (type: int), _col1 (type: string), _col5 (type: int), _col6 (type: string)
                       outputColumnNames: _col0, _col1, _col2, _col3
-                      Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                       File Output Operator
                         compressed: false
-                        Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                         table:
                             input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                             output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -248,7 +248,7 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: b
-                  Statistics: Num rows: 1 Data size: 222 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2220 Basic stats: COMPLETE Column stats: NONE
                   Sorted Merge Bucket Map Join Operator
                     condition map:
                          Outer Join 0 to 1
@@ -256,14 +256,14 @@ STAGE PLANS:
                       0 key (type: int)
                       1 key (type: int)
                     outputColumnNames: _col0, _col1, _col5, _col6
-                    Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: _col0 (type: int), _col1 (type: string), _col5 (type: int), _col6 (type: string)
                       outputColumnNames: _col0, _col1, _col2, _col3
-                      Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                       File Output Operator
                         compressed: false
-                        Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                         table:
                             input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                             output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -312,10 +312,10 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: a
-                  Statistics: Num rows: 1 Data size: 206 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2060 Basic stats: COMPLETE Column stats: NONE
                   Filter Operator
                     predicate: key is not null (type: boolean)
-                    Statistics: Num rows: 1 Data size: 206 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2060 Basic stats: COMPLETE Column stats: NONE
                     Sorted Merge Bucket Map Join Operator
                       condition map:
                            Inner Join 0 to 1
@@ -323,14 +323,14 @@ STAGE PLANS:
                         0 key (type: int)
                         1 key (type: int)
                       outputColumnNames: _col0, _col1, _col5, _col6
-                      Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                       Select Operator
                         expressions: _col0 (type: int), _col1 (type: string), _col5 (type: int), _col6 (type: string)
                         outputColumnNames: _col0, _col1, _col2, _col3
-                        Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                         File Output Operator
                           compressed: false
-                          Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                          Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                           table:
                               input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                               output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -373,7 +373,7 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: a
-                  Statistics: Num rows: 1 Data size: 206 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2060 Basic stats: COMPLETE Column stats: NONE
                   Sorted Merge Bucket Map Join Operator
                     condition map:
                          Left Outer Join 0 to 1
@@ -381,14 +381,14 @@ STAGE PLANS:
                       0 key (type: int)
                       1 key (type: int)
                     outputColumnNames: _col0, _col1, _col5, _col6
-                    Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: _col0 (type: int), _col1 (type: string), _col5 (type: int), _col6 (type: string)
                       outputColumnNames: _col0, _col1, _col2, _col3
-                      Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                       File Output Operator
                         compressed: false
-                        Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                         table:
                             input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                             output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -433,7 +433,7 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: a
-                  Statistics: Num rows: 1 Data size: 206 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2060 Basic stats: COMPLETE Column stats: NONE
                   Sorted Merge Bucket Map Join Operator
                     condition map:
                          Right Outer Join 0 to 1
@@ -441,14 +441,14 @@ STAGE PLANS:
                       0 key (type: int)
                       1 key (type: int)
                     outputColumnNames: _col0, _col1, _col5, _col6
-                    Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: _col0 (type: int), _col1 (type: string), _col5 (type: int), _col6 (type: string)
                       outputColumnNames: _col0, _col1, _col2, _col3
-                      Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                       File Output Operator
                         compressed: false
-                        Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                         table:
                             input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                             output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -495,7 +495,7 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: a
-                  Statistics: Num rows: 1 Data size: 206 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 2060 Basic stats: COMPLETE Column stats: NONE
                   Sorted Merge Bucket Map Join Operator
                     condition map:
                          Outer Join 0 to 1
@@ -503,14 +503,14 @@ STAGE PLANS:
                       0 key (type: int)
                       1 key (type: int)
                     outputColumnNames: _col0, _col1, _col5, _col6
-                    Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: _col0 (type: int), _col1 (type: string), _col5 (type: int), _col6 (type: string)
                       outputColumnNames: _col0, _col1, _col2, _col3
-                      Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                       File Output Operator
                         compressed: false
-                        Statistics: Num rows: 1 Data size: 226 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 1 Data size: 2266 Basic stats: COMPLETE Column stats: NONE
                         table:
                             input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                             output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat