You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@hive.apache.org by kg...@apache.org on 2018/01/05 10:49:02 UTC

[13/18] hive git commit: HIVE-18108: in case basic stats are missing; rowcount estimation depends on the selected columns size (Zoltan Haindrich, reviewed by Ashutosh Chauhan)

http://git-wip-us.apache.org/repos/asf/hive/blob/d0fa7d55/ql/src/test/results/clientpositive/columnstats_partlvl_dp.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/columnstats_partlvl_dp.q.out b/ql/src/test/results/clientpositive/columnstats_partlvl_dp.q.out
index 524af1c..d055be2 100644
--- a/ql/src/test/results/clientpositive/columnstats_partlvl_dp.q.out
+++ b/ql/src/test/results/clientpositive/columnstats_partlvl_dp.q.out
@@ -82,22 +82,22 @@ STAGE PLANS:
       Map Operator Tree:
           TableScan
             alias: employee_part
-            Statistics: Num rows: 1 Data size: 64 Basic stats: PARTIAL Column stats: NONE
+            Statistics: Num rows: 1 Data size: 640 Basic stats: COMPLETE Column stats: NONE
             Select Operator
               expressions: employeeid (type: int), employeename (type: string), country (type: string)
               outputColumnNames: employeeid, employeename, country
-              Statistics: Num rows: 1 Data size: 64 Basic stats: PARTIAL Column stats: NONE
+              Statistics: Num rows: 1 Data size: 640 Basic stats: COMPLETE Column stats: NONE
               Group By Operator
                 aggregations: compute_stats(employeename, 'hll'), compute_stats(employeeid, 'hll')
                 keys: 4000.0 (type: double), country (type: string)
                 mode: hash
                 outputColumnNames: _col0, _col1, _col2, _col3
-                Statistics: Num rows: 1 Data size: 64 Basic stats: PARTIAL Column stats: NONE
+                Statistics: Num rows: 1 Data size: 640 Basic stats: COMPLETE Column stats: NONE
                 Reduce Output Operator
                   key expressions: 4000.0 (type: double), _col1 (type: string)
                   sort order: ++
                   Map-reduce partition columns: 4000.0 (type: double), _col1 (type: string)
-                  Statistics: Num rows: 1 Data size: 64 Basic stats: PARTIAL Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 640 Basic stats: COMPLETE Column stats: NONE
                   value expressions: _col2 (type: struct<columntype:string,maxlength:bigint,sumlength:bigint,count:bigint,countnulls:bigint,bitvector:binary>), _col3 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,bitvector:binary>)
       Reduce Operator Tree:
         Group By Operator
@@ -105,14 +105,14 @@ STAGE PLANS:
           keys: 4000.0 (type: double), KEY._col1 (type: string)
           mode: mergepartial
           outputColumnNames: _col0, _col1, _col2, _col3
-          Statistics: Num rows: 1 Data size: 64 Basic stats: PARTIAL Column stats: NONE
+          Statistics: Num rows: 1 Data size: 640 Basic stats: COMPLETE Column stats: NONE
           Select Operator
             expressions: _col2 (type: struct<columntype:string,maxlength:bigint,avglength:double,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), _col3 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), 4000.0 (type: double), _col1 (type: string)
             outputColumnNames: _col0, _col1, _col2, _col3
-            Statistics: Num rows: 1 Data size: 64 Basic stats: PARTIAL Column stats: NONE
+            Statistics: Num rows: 1 Data size: 640 Basic stats: COMPLETE Column stats: NONE
             File Output Operator
               compressed: false
-              Statistics: Num rows: 1 Data size: 64 Basic stats: PARTIAL Column stats: NONE
+              Statistics: Num rows: 1 Data size: 640 Basic stats: COMPLETE Column stats: NONE
               table:
                   input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                   output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -213,22 +213,22 @@ STAGE PLANS:
       Map Operator Tree:
           TableScan
             alias: employee_part
-            Statistics: Num rows: 42 Data size: 169 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 3 Data size: 1690 Basic stats: COMPLETE Column stats: NONE
             Select Operator
               expressions: employeeid (type: int), country (type: string)
               outputColumnNames: employeeid, country
-              Statistics: Num rows: 42 Data size: 169 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 3 Data size: 1690 Basic stats: COMPLETE Column stats: NONE
               Group By Operator
                 aggregations: compute_stats(employeeid, 'hll')
                 keys: 2000.0 (type: double), country (type: string)
                 mode: hash
                 outputColumnNames: _col0, _col1, _col2
-                Statistics: Num rows: 42 Data size: 169 Basic stats: COMPLETE Column stats: NONE
+                Statistics: Num rows: 3 Data size: 1690 Basic stats: COMPLETE Column stats: NONE
                 Reduce Output Operator
                   key expressions: 2000.0 (type: double), _col1 (type: string)
                   sort order: ++
                   Map-reduce partition columns: 2000.0 (type: double), _col1 (type: string)
-                  Statistics: Num rows: 42 Data size: 169 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 3 Data size: 1690 Basic stats: COMPLETE Column stats: NONE
                   value expressions: _col2 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,bitvector:binary>)
       Reduce Operator Tree:
         Group By Operator
@@ -236,14 +236,14 @@ STAGE PLANS:
           keys: 2000.0 (type: double), KEY._col1 (type: string)
           mode: mergepartial
           outputColumnNames: _col0, _col1, _col2
-          Statistics: Num rows: 21 Data size: 84 Basic stats: COMPLETE Column stats: NONE
+          Statistics: Num rows: 1 Data size: 563 Basic stats: COMPLETE Column stats: NONE
           Select Operator
             expressions: _col2 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), 2000.0 (type: double), _col1 (type: string)
             outputColumnNames: _col0, _col1, _col2
-            Statistics: Num rows: 21 Data size: 84 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 1 Data size: 563 Basic stats: COMPLETE Column stats: NONE
             File Output Operator
               compressed: false
-              Statistics: Num rows: 21 Data size: 84 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 1 Data size: 563 Basic stats: COMPLETE Column stats: NONE
               table:
                   input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                   output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat

http://git-wip-us.apache.org/repos/asf/hive/blob/d0fa7d55/ql/src/test/results/clientpositive/combine2.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/combine2.q.out b/ql/src/test/results/clientpositive/combine2.q.out
index 6c94c87..d4194c8 100644
--- a/ql/src/test/results/clientpositive/combine2.q.out
+++ b/ql/src/test/results/clientpositive/combine2.q.out
@@ -161,22 +161,22 @@ STAGE PLANS:
       Map Operator Tree:
           TableScan
             alias: srcpart
-            Statistics: Num rows: 2000 Data size: 212480 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 2000 Data size: 21248 Basic stats: COMPLETE Column stats: NONE
             Select Operator
               expressions: ds (type: string)
               outputColumnNames: ds
-              Statistics: Num rows: 2000 Data size: 212480 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 2000 Data size: 21248 Basic stats: COMPLETE Column stats: NONE
               Group By Operator
                 aggregations: count()
                 keys: ds (type: string)
                 mode: hash
                 outputColumnNames: _col0, _col1
-                Statistics: Num rows: 2000 Data size: 212480 Basic stats: COMPLETE Column stats: NONE
+                Statistics: Num rows: 2000 Data size: 21248 Basic stats: COMPLETE Column stats: NONE
                 Reduce Output Operator
                   key expressions: _col0 (type: string)
                   sort order: +
                   Map-reduce partition columns: _col0 (type: string)
-                  Statistics: Num rows: 2000 Data size: 212480 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 2000 Data size: 21248 Basic stats: COMPLETE Column stats: NONE
                   value expressions: _col1 (type: bigint)
       Reduce Operator Tree:
         Group By Operator
@@ -184,10 +184,10 @@ STAGE PLANS:
           keys: KEY._col0 (type: string)
           mode: mergepartial
           outputColumnNames: _col0, _col1
-          Statistics: Num rows: 1000 Data size: 106240 Basic stats: COMPLETE Column stats: NONE
+          Statistics: Num rows: 1000 Data size: 10624 Basic stats: COMPLETE Column stats: NONE
           File Output Operator
             compressed: false
-            Statistics: Num rows: 1000 Data size: 106240 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 1000 Data size: 10624 Basic stats: COMPLETE Column stats: NONE
             table:
                 input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                 output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat

http://git-wip-us.apache.org/repos/asf/hive/blob/d0fa7d55/ql/src/test/results/clientpositive/groupby_sort_11.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/groupby_sort_11.q.out b/ql/src/test/results/clientpositive/groupby_sort_11.q.out
index e1a16e4..23c89f9 100644
--- a/ql/src/test/results/clientpositive/groupby_sort_11.q.out
+++ b/ql/src/test/results/clientpositive/groupby_sort_11.q.out
@@ -387,19 +387,19 @@ STAGE PLANS:
       Map Operator Tree:
           TableScan
             alias: t1
-            Statistics: Num rows: 10 Data size: 700 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 10 Data size: 70 Basic stats: COMPLETE Column stats: NONE
             Select Operator
-              Statistics: Num rows: 10 Data size: 700 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 10 Data size: 70 Basic stats: COMPLETE Column stats: NONE
               Group By Operator
                 aggregations: count(DISTINCT 1)
                 keys: 1 (type: int)
                 mode: hash
                 outputColumnNames: _col0, _col1
-                Statistics: Num rows: 10 Data size: 700 Basic stats: COMPLETE Column stats: NONE
+                Statistics: Num rows: 10 Data size: 70 Basic stats: COMPLETE Column stats: NONE
                 Reduce Output Operator
                   key expressions: _col0 (type: int)
                   sort order: +
-                  Statistics: Num rows: 10 Data size: 700 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 10 Data size: 70 Basic stats: COMPLETE Column stats: NONE
       Reduce Operator Tree:
         Group By Operator
           aggregations: count(DISTINCT KEY._col0:0._col0)

http://git-wip-us.apache.org/repos/asf/hive/blob/d0fa7d55/ql/src/test/results/clientpositive/groupby_sort_6.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/groupby_sort_6.q.out b/ql/src/test/results/clientpositive/groupby_sort_6.q.out
index 871c7b3..97e667a 100644
--- a/ql/src/test/results/clientpositive/groupby_sort_6.q.out
+++ b/ql/src/test/results/clientpositive/groupby_sort_6.q.out
@@ -531,24 +531,24 @@ STAGE PLANS:
       Map Operator Tree:
           TableScan
             alias: t1
-            Statistics: Num rows: 1 Data size: 30 Basic stats: PARTIAL Column stats: NONE
+            Statistics: Num rows: 1 Data size: 300 Basic stats: PARTIAL Column stats: NONE
             GatherStats: false
             Select Operator
               expressions: key (type: string)
               outputColumnNames: key
-              Statistics: Num rows: 1 Data size: 30 Basic stats: PARTIAL Column stats: NONE
+              Statistics: Num rows: 1 Data size: 300 Basic stats: PARTIAL Column stats: NONE
               Group By Operator
                 aggregations: count()
                 keys: key (type: string)
                 mode: hash
                 outputColumnNames: _col0, _col1
-                Statistics: Num rows: 1 Data size: 30 Basic stats: PARTIAL Column stats: NONE
+                Statistics: Num rows: 1 Data size: 300 Basic stats: PARTIAL Column stats: NONE
                 Reduce Output Operator
                   key expressions: _col0 (type: string)
                   null sort order: a
                   sort order: +
                   Map-reduce partition columns: _col0 (type: string)
-                  Statistics: Num rows: 1 Data size: 30 Basic stats: PARTIAL Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 300 Basic stats: PARTIAL Column stats: NONE
                   tag: -1
                   value expressions: _col1 (type: bigint)
                   auto parallelism: false
@@ -610,17 +610,17 @@ STAGE PLANS:
           keys: KEY._col0 (type: string)
           mode: mergepartial
           outputColumnNames: _col0, _col1
-          Statistics: Num rows: 1 Data size: 30 Basic stats: PARTIAL Column stats: NONE
+          Statistics: Num rows: 1 Data size: 300 Basic stats: PARTIAL Column stats: NONE
           Select Operator
             expressions: UDFToInteger(_col0) (type: int), UDFToInteger(_col1) (type: int)
             outputColumnNames: _col0, _col1
-            Statistics: Num rows: 1 Data size: 30 Basic stats: PARTIAL Column stats: NONE
+            Statistics: Num rows: 1 Data size: 300 Basic stats: PARTIAL Column stats: NONE
             File Output Operator
               compressed: false
               GlobalTableId: 1
 #### A masked pattern was here ####
               NumFilesPerFileSink: 1
-              Statistics: Num rows: 1 Data size: 30 Basic stats: PARTIAL Column stats: NONE
+              Statistics: Num rows: 1 Data size: 300 Basic stats: PARTIAL Column stats: NONE
 #### A masked pattern was here ####
               table:
                   input format: org.apache.hadoop.mapred.TextInputFormat
@@ -650,7 +650,7 @@ STAGE PLANS:
             Select Operator
               expressions: _col0 (type: int), _col1 (type: int)
               outputColumnNames: key, cnt
-              Statistics: Num rows: 1 Data size: 30 Basic stats: PARTIAL Column stats: NONE
+              Statistics: Num rows: 1 Data size: 300 Basic stats: PARTIAL Column stats: NONE
               Group By Operator
                 aggregations: compute_stats(key, 'hll'), compute_stats(cnt, 'hll')
                 mode: hash

http://git-wip-us.apache.org/repos/asf/hive/blob/d0fa7d55/ql/src/test/results/clientpositive/infer_bucket_sort_dyn_part.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/infer_bucket_sort_dyn_part.q.out b/ql/src/test/results/clientpositive/infer_bucket_sort_dyn_part.q.out
index 32e4513..03e629d 100644
--- a/ql/src/test/results/clientpositive/infer_bucket_sort_dyn_part.q.out
+++ b/ql/src/test/results/clientpositive/infer_bucket_sort_dyn_part.q.out
@@ -427,22 +427,22 @@ STAGE PLANS:
       Map Operator Tree:
           TableScan
             alias: srcpart
-            Statistics: Num rows: 116 Data size: 11624 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 198 Data size: 116240 Basic stats: COMPLETE Column stats: NONE
             Select Operator
               expressions: key (type: string)
               outputColumnNames: key
-              Statistics: Num rows: 116 Data size: 11624 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 198 Data size: 116240 Basic stats: COMPLETE Column stats: NONE
               Group By Operator
                 aggregations: count()
                 keys: key (type: string)
                 mode: hash
                 outputColumnNames: _col0, _col1
-                Statistics: Num rows: 116 Data size: 11624 Basic stats: COMPLETE Column stats: NONE
+                Statistics: Num rows: 198 Data size: 116240 Basic stats: COMPLETE Column stats: NONE
                 Reduce Output Operator
                   key expressions: _col0 (type: string)
                   sort order: +
                   Map-reduce partition columns: _col0 (type: string)
-                  Statistics: Num rows: 116 Data size: 11624 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 198 Data size: 116240 Basic stats: COMPLETE Column stats: NONE
                   value expressions: _col1 (type: bigint)
       Reduce Operator Tree:
         Group By Operator
@@ -450,14 +450,14 @@ STAGE PLANS:
           keys: KEY._col0 (type: string)
           mode: mergepartial
           outputColumnNames: _col0, _col1
-          Statistics: Num rows: 58 Data size: 5812 Basic stats: COMPLETE Column stats: NONE
+          Statistics: Num rows: 99 Data size: 58120 Basic stats: COMPLETE Column stats: NONE
           Select Operator
             expressions: _col0 (type: string), UDFToString(_col1) (type: string), if(((UDFToDouble(_col0) % 100.0) = 0.0), '11', '12') (type: string)
             outputColumnNames: _col0, _col1, _col2
-            Statistics: Num rows: 58 Data size: 5812 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 99 Data size: 58120 Basic stats: COMPLETE Column stats: NONE
             File Output Operator
               compressed: false
-              Statistics: Num rows: 58 Data size: 5812 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 99 Data size: 58120 Basic stats: COMPLETE Column stats: NONE
               table:
                   input format: org.apache.hadoop.hive.ql.io.RCFileInputFormat
                   output format: org.apache.hadoop.hive.ql.io.RCFileOutputFormat
@@ -466,13 +466,13 @@ STAGE PLANS:
             Select Operator
               expressions: _col0 (type: string), _col1 (type: string), '2008-04-08' (type: string), _col2 (type: string)
               outputColumnNames: key, value, ds, hr
-              Statistics: Num rows: 58 Data size: 5812 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 99 Data size: 58120 Basic stats: COMPLETE Column stats: NONE
               Group By Operator
                 aggregations: compute_stats(key, 'hll'), compute_stats(value, 'hll')
                 keys: ds (type: string), hr (type: string)
                 mode: hash
                 outputColumnNames: _col0, _col1, _col2, _col3
-                Statistics: Num rows: 58 Data size: 5812 Basic stats: COMPLETE Column stats: NONE
+                Statistics: Num rows: 99 Data size: 58120 Basic stats: COMPLETE Column stats: NONE
                 File Output Operator
                   compressed: false
                   table:
@@ -538,7 +538,7 @@ STAGE PLANS:
               key expressions: _col0 (type: string), _col1 (type: string)
               sort order: ++
               Map-reduce partition columns: _col0 (type: string), _col1 (type: string)
-              Statistics: Num rows: 58 Data size: 5812 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 99 Data size: 58120 Basic stats: COMPLETE Column stats: NONE
               value expressions: _col2 (type: struct<columntype:string,maxlength:bigint,sumlength:bigint,count:bigint,countnulls:bigint,bitvector:binary>), _col3 (type: struct<columntype:string,maxlength:bigint,sumlength:bigint,count:bigint,countnulls:bigint,bitvector:binary>)
       Reduce Operator Tree:
         Group By Operator
@@ -546,14 +546,14 @@ STAGE PLANS:
           keys: KEY._col0 (type: string), KEY._col1 (type: string)
           mode: mergepartial
           outputColumnNames: _col0, _col1, _col2, _col3
-          Statistics: Num rows: 29 Data size: 2906 Basic stats: COMPLETE Column stats: NONE
+          Statistics: Num rows: 49 Data size: 28766 Basic stats: COMPLETE Column stats: NONE
           Select Operator
             expressions: _col2 (type: struct<columntype:string,maxlength:bigint,avglength:double,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), _col3 (type: struct<columntype:string,maxlength:bigint,avglength:double,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), _col0 (type: string), _col1 (type: string)
             outputColumnNames: _col0, _col1, _col2, _col3
-            Statistics: Num rows: 29 Data size: 2906 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 49 Data size: 28766 Basic stats: COMPLETE Column stats: NONE
             File Output Operator
               compressed: false
-              Statistics: Num rows: 29 Data size: 2906 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 49 Data size: 28766 Basic stats: COMPLETE Column stats: NONE
               table:
                   input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                   output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat

http://git-wip-us.apache.org/repos/asf/hive/blob/d0fa7d55/ql/src/test/results/clientpositive/infer_bucket_sort_num_buckets.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/infer_bucket_sort_num_buckets.q.out b/ql/src/test/results/clientpositive/infer_bucket_sort_num_buckets.q.out
index cf332e2..7487c98 100644
--- a/ql/src/test/results/clientpositive/infer_bucket_sort_num_buckets.q.out
+++ b/ql/src/test/results/clientpositive/infer_bucket_sort_num_buckets.q.out
@@ -34,24 +34,24 @@ STAGE PLANS:
       Map Operator Tree:
           TableScan
             alias: srcpart
-            Statistics: Num rows: 58 Data size: 11624 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 234 Data size: 116240 Basic stats: COMPLETE Column stats: NONE
             Select Operator
               expressions: if(((key % 3) < 2), 0, 1) (type: int), value (type: string), UDFToInteger((key % 2)) (type: int)
               outputColumnNames: _col0, _col1, _col2
-              Statistics: Num rows: 58 Data size: 11624 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 234 Data size: 116240 Basic stats: COMPLETE Column stats: NONE
               Reduce Output Operator
                 sort order: 
                 Map-reduce partition columns: _col0 (type: int)
-                Statistics: Num rows: 58 Data size: 11624 Basic stats: COMPLETE Column stats: NONE
+                Statistics: Num rows: 234 Data size: 116240 Basic stats: COMPLETE Column stats: NONE
                 value expressions: _col0 (type: int), _col1 (type: string), _col2 (type: int)
       Reduce Operator Tree:
         Select Operator
           expressions: VALUE._col0 (type: int), VALUE._col1 (type: string), VALUE._col2 (type: int)
           outputColumnNames: _col0, _col1, _col2
-          Statistics: Num rows: 58 Data size: 11624 Basic stats: COMPLETE Column stats: NONE
+          Statistics: Num rows: 234 Data size: 116240 Basic stats: COMPLETE Column stats: NONE
           File Output Operator
             compressed: false
-            Statistics: Num rows: 58 Data size: 11624 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 234 Data size: 116240 Basic stats: COMPLETE Column stats: NONE
             table:
                 input format: org.apache.hadoop.mapred.TextInputFormat
                 output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
@@ -60,13 +60,13 @@ STAGE PLANS:
           Select Operator
             expressions: _col0 (type: int), _col1 (type: string), UDFToString(_col2) (type: string)
             outputColumnNames: key, value, hr
-            Statistics: Num rows: 58 Data size: 11624 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 234 Data size: 116240 Basic stats: COMPLETE Column stats: NONE
             Group By Operator
               aggregations: compute_stats(key, 'hll'), compute_stats(value, 'hll')
               keys: '2008-04-08' (type: string), hr (type: string)
               mode: hash
               outputColumnNames: _col0, _col1, _col2, _col3
-              Statistics: Num rows: 58 Data size: 11624 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 234 Data size: 116240 Basic stats: COMPLETE Column stats: NONE
               File Output Operator
                 compressed: false
                 table:
@@ -103,7 +103,7 @@ STAGE PLANS:
               key expressions: '2008-04-08' (type: string), _col1 (type: string)
               sort order: ++
               Map-reduce partition columns: '2008-04-08' (type: string), _col1 (type: string)
-              Statistics: Num rows: 58 Data size: 11624 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 234 Data size: 116240 Basic stats: COMPLETE Column stats: NONE
               value expressions: _col2 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,bitvector:binary>), _col3 (type: struct<columntype:string,maxlength:bigint,sumlength:bigint,count:bigint,countnulls:bigint,bitvector:binary>)
       Reduce Operator Tree:
         Group By Operator
@@ -111,14 +111,14 @@ STAGE PLANS:
           keys: '2008-04-08' (type: string), KEY._col1 (type: string)
           mode: mergepartial
           outputColumnNames: _col0, _col1, _col2, _col3
-          Statistics: Num rows: 29 Data size: 5812 Basic stats: COMPLETE Column stats: NONE
+          Statistics: Num rows: 117 Data size: 58120 Basic stats: COMPLETE Column stats: NONE
           Select Operator
             expressions: _col2 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), _col3 (type: struct<columntype:string,maxlength:bigint,avglength:double,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), '2008-04-08' (type: string), _col1 (type: string)
             outputColumnNames: _col0, _col1, _col2, _col3
-            Statistics: Num rows: 29 Data size: 5812 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 117 Data size: 58120 Basic stats: COMPLETE Column stats: NONE
             File Output Operator
               compressed: false
-              Statistics: Num rows: 29 Data size: 5812 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 117 Data size: 58120 Basic stats: COMPLETE Column stats: NONE
               table:
                   input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                   output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat

http://git-wip-us.apache.org/repos/asf/hive/blob/d0fa7d55/ql/src/test/results/clientpositive/insert1_overwrite_partitions.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/insert1_overwrite_partitions.q.out b/ql/src/test/results/clientpositive/insert1_overwrite_partitions.q.out
index b17bc11..5c85380 100644
--- a/ql/src/test/results/clientpositive/insert1_overwrite_partitions.q.out
+++ b/ql/src/test/results/clientpositive/insert1_overwrite_partitions.q.out
@@ -50,26 +50,26 @@ STAGE PLANS:
       Map Operator Tree:
           TableScan
             alias: sourcetable
-            Statistics: Num rows: 29 Data size: 5812 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 99 Data size: 58120 Basic stats: COMPLETE Column stats: NONE
             Select Operator
               expressions: one (type: string), two (type: string)
               outputColumnNames: _col0, _col1
-              Statistics: Num rows: 29 Data size: 5812 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 99 Data size: 58120 Basic stats: COMPLETE Column stats: NONE
               Reduce Output Operator
                 key expressions: _col0 (type: string), _col1 (type: string)
                 sort order: --
-                Statistics: Num rows: 29 Data size: 5812 Basic stats: COMPLETE Column stats: NONE
+                Statistics: Num rows: 99 Data size: 58120 Basic stats: COMPLETE Column stats: NONE
       Reduce Operator Tree:
         Select Operator
           expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: string)
           outputColumnNames: _col0, _col1
-          Statistics: Num rows: 29 Data size: 5812 Basic stats: COMPLETE Column stats: NONE
+          Statistics: Num rows: 99 Data size: 58120 Basic stats: COMPLETE Column stats: NONE
           Limit
             Number of rows: 5
-            Statistics: Num rows: 5 Data size: 1000 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 5 Data size: 2935 Basic stats: COMPLETE Column stats: NONE
             File Output Operator
               compressed: false
-              Statistics: Num rows: 5 Data size: 1000 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 5 Data size: 2935 Basic stats: COMPLETE Column stats: NONE
               table:
                   input format: org.apache.hadoop.mapred.TextInputFormat
                   output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
@@ -78,13 +78,13 @@ STAGE PLANS:
             Select Operator
               expressions: _col0 (type: string), _col1 (type: string), '2011-11-11' (type: string), '11' (type: string)
               outputColumnNames: one, two, ds, hr
-              Statistics: Num rows: 5 Data size: 1000 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 5 Data size: 2935 Basic stats: COMPLETE Column stats: NONE
               Group By Operator
                 aggregations: compute_stats(one, 'hll'), compute_stats(two, 'hll')
                 keys: ds (type: string), hr (type: string)
                 mode: hash
                 outputColumnNames: _col0, _col1, _col2, _col3
-                Statistics: Num rows: 5 Data size: 1000 Basic stats: COMPLETE Column stats: NONE
+                Statistics: Num rows: 5 Data size: 2935 Basic stats: COMPLETE Column stats: NONE
                 File Output Operator
                   compressed: false
                   table:
@@ -121,7 +121,7 @@ STAGE PLANS:
               key expressions: _col0 (type: string), _col1 (type: string)
               sort order: ++
               Map-reduce partition columns: _col0 (type: string), _col1 (type: string)
-              Statistics: Num rows: 5 Data size: 1000 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 5 Data size: 2935 Basic stats: COMPLETE Column stats: NONE
               value expressions: _col2 (type: struct<columntype:string,maxlength:bigint,sumlength:bigint,count:bigint,countnulls:bigint,bitvector:binary>), _col3 (type: struct<columntype:string,maxlength:bigint,sumlength:bigint,count:bigint,countnulls:bigint,bitvector:binary>)
       Reduce Operator Tree:
         Group By Operator
@@ -129,14 +129,14 @@ STAGE PLANS:
           keys: KEY._col0 (type: string), KEY._col1 (type: string)
           mode: mergepartial
           outputColumnNames: _col0, _col1, _col2, _col3
-          Statistics: Num rows: 2 Data size: 400 Basic stats: COMPLETE Column stats: NONE
+          Statistics: Num rows: 2 Data size: 1174 Basic stats: COMPLETE Column stats: NONE
           Select Operator
             expressions: _col2 (type: struct<columntype:string,maxlength:bigint,avglength:double,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), _col3 (type: struct<columntype:string,maxlength:bigint,avglength:double,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), _col0 (type: string), _col1 (type: string)
             outputColumnNames: _col0, _col1, _col2, _col3
-            Statistics: Num rows: 2 Data size: 400 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 2 Data size: 1174 Basic stats: COMPLETE Column stats: NONE
             File Output Operator
               compressed: false
-              Statistics: Num rows: 2 Data size: 400 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 2 Data size: 1174 Basic stats: COMPLETE Column stats: NONE
               table:
                   input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                   output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -233,26 +233,26 @@ STAGE PLANS:
       Map Operator Tree:
           TableScan
             alias: sourcetable
-            Statistics: Num rows: 29 Data size: 5812 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 99 Data size: 58120 Basic stats: COMPLETE Column stats: NONE
             Select Operator
               expressions: one (type: string), two (type: string)
               outputColumnNames: _col0, _col1
-              Statistics: Num rows: 29 Data size: 5812 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 99 Data size: 58120 Basic stats: COMPLETE Column stats: NONE
               Reduce Output Operator
                 key expressions: _col0 (type: string), _col1 (type: string)
                 sort order: --
-                Statistics: Num rows: 29 Data size: 5812 Basic stats: COMPLETE Column stats: NONE
+                Statistics: Num rows: 99 Data size: 58120 Basic stats: COMPLETE Column stats: NONE
       Reduce Operator Tree:
         Select Operator
           expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: string)
           outputColumnNames: _col0, _col1
-          Statistics: Num rows: 29 Data size: 5812 Basic stats: COMPLETE Column stats: NONE
+          Statistics: Num rows: 99 Data size: 58120 Basic stats: COMPLETE Column stats: NONE
           Limit
             Number of rows: 5
-            Statistics: Num rows: 5 Data size: 1000 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 5 Data size: 2935 Basic stats: COMPLETE Column stats: NONE
             File Output Operator
               compressed: false
-              Statistics: Num rows: 5 Data size: 1000 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 5 Data size: 2935 Basic stats: COMPLETE Column stats: NONE
               table:
                   input format: org.apache.hadoop.mapred.TextInputFormat
                   output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
@@ -261,7 +261,7 @@ STAGE PLANS:
             Select Operator
               expressions: _col0 (type: string), _col1 (type: string)
               outputColumnNames: one, two
-              Statistics: Num rows: 5 Data size: 1000 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 5 Data size: 2935 Basic stats: COMPLETE Column stats: NONE
               Group By Operator
                 aggregations: compute_stats(one, 'hll'), compute_stats(two, 'hll')
                 mode: hash

http://git-wip-us.apache.org/repos/asf/hive/blob/d0fa7d55/ql/src/test/results/clientpositive/insert2_overwrite_partitions.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/insert2_overwrite_partitions.q.out b/ql/src/test/results/clientpositive/insert2_overwrite_partitions.q.out
index 77913f0..14b4c10 100644
--- a/ql/src/test/results/clientpositive/insert2_overwrite_partitions.q.out
+++ b/ql/src/test/results/clientpositive/insert2_overwrite_partitions.q.out
@@ -61,26 +61,26 @@ STAGE PLANS:
       Map Operator Tree:
           TableScan
             alias: sourcetable
-            Statistics: Num rows: 30 Data size: 6028 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 124 Data size: 60280 Basic stats: COMPLETE Column stats: NONE
             Select Operator
               expressions: one (type: string), two (type: string)
               outputColumnNames: _col0, _col1
-              Statistics: Num rows: 30 Data size: 6028 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 124 Data size: 60280 Basic stats: COMPLETE Column stats: NONE
               Reduce Output Operator
                 key expressions: _col0 (type: string), _col1 (type: string)
                 sort order: --
-                Statistics: Num rows: 30 Data size: 6028 Basic stats: COMPLETE Column stats: NONE
+                Statistics: Num rows: 124 Data size: 60280 Basic stats: COMPLETE Column stats: NONE
       Reduce Operator Tree:
         Select Operator
           expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: string)
           outputColumnNames: _col0, _col1
-          Statistics: Num rows: 30 Data size: 6028 Basic stats: COMPLETE Column stats: NONE
+          Statistics: Num rows: 124 Data size: 60280 Basic stats: COMPLETE Column stats: NONE
           Limit
             Number of rows: 5
-            Statistics: Num rows: 5 Data size: 1000 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 5 Data size: 2430 Basic stats: COMPLETE Column stats: NONE
             File Output Operator
               compressed: false
-              Statistics: Num rows: 5 Data size: 1000 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 5 Data size: 2430 Basic stats: COMPLETE Column stats: NONE
               table:
                   input format: org.apache.hadoop.mapred.TextInputFormat
                   output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
@@ -89,13 +89,13 @@ STAGE PLANS:
             Select Operator
               expressions: _col0 (type: string), _col1 (type: string), '2011-11-11' (type: string)
               outputColumnNames: one, two, ds
-              Statistics: Num rows: 5 Data size: 1000 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 5 Data size: 2430 Basic stats: COMPLETE Column stats: NONE
               Group By Operator
                 aggregations: compute_stats(one, 'hll'), compute_stats(two, 'hll')
                 keys: ds (type: string)
                 mode: hash
                 outputColumnNames: _col0, _col1, _col2
-                Statistics: Num rows: 5 Data size: 1000 Basic stats: COMPLETE Column stats: NONE
+                Statistics: Num rows: 5 Data size: 2430 Basic stats: COMPLETE Column stats: NONE
                 File Output Operator
                   compressed: false
                   table:
@@ -131,7 +131,7 @@ STAGE PLANS:
               key expressions: _col0 (type: string)
               sort order: +
               Map-reduce partition columns: _col0 (type: string)
-              Statistics: Num rows: 5 Data size: 1000 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 5 Data size: 2430 Basic stats: COMPLETE Column stats: NONE
               value expressions: _col1 (type: struct<columntype:string,maxlength:bigint,sumlength:bigint,count:bigint,countnulls:bigint,bitvector:binary>), _col2 (type: struct<columntype:string,maxlength:bigint,sumlength:bigint,count:bigint,countnulls:bigint,bitvector:binary>)
       Reduce Operator Tree:
         Group By Operator
@@ -139,14 +139,14 @@ STAGE PLANS:
           keys: KEY._col0 (type: string)
           mode: mergepartial
           outputColumnNames: _col0, _col1, _col2
-          Statistics: Num rows: 2 Data size: 400 Basic stats: COMPLETE Column stats: NONE
+          Statistics: Num rows: 2 Data size: 972 Basic stats: COMPLETE Column stats: NONE
           Select Operator
             expressions: _col1 (type: struct<columntype:string,maxlength:bigint,avglength:double,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), _col2 (type: struct<columntype:string,maxlength:bigint,avglength:double,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), _col0 (type: string)
             outputColumnNames: _col0, _col1, _col2
-            Statistics: Num rows: 2 Data size: 400 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 2 Data size: 972 Basic stats: COMPLETE Column stats: NONE
             File Output Operator
               compressed: false
-              Statistics: Num rows: 2 Data size: 400 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 2 Data size: 972 Basic stats: COMPLETE Column stats: NONE
               table:
                   input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                   output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -199,26 +199,26 @@ STAGE PLANS:
       Map Operator Tree:
           TableScan
             alias: sourcetable
-            Statistics: Num rows: 30 Data size: 6028 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 124 Data size: 60280 Basic stats: COMPLETE Column stats: NONE
             Select Operator
               expressions: one (type: string), two (type: string)
               outputColumnNames: _col0, _col1
-              Statistics: Num rows: 30 Data size: 6028 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 124 Data size: 60280 Basic stats: COMPLETE Column stats: NONE
               Reduce Output Operator
                 key expressions: _col0 (type: string), _col1 (type: string)
                 sort order: --
-                Statistics: Num rows: 30 Data size: 6028 Basic stats: COMPLETE Column stats: NONE
+                Statistics: Num rows: 124 Data size: 60280 Basic stats: COMPLETE Column stats: NONE
       Reduce Operator Tree:
         Select Operator
           expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: string)
           outputColumnNames: _col0, _col1
-          Statistics: Num rows: 30 Data size: 6028 Basic stats: COMPLETE Column stats: NONE
+          Statistics: Num rows: 124 Data size: 60280 Basic stats: COMPLETE Column stats: NONE
           Limit
             Number of rows: 5
-            Statistics: Num rows: 5 Data size: 1000 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 5 Data size: 2430 Basic stats: COMPLETE Column stats: NONE
             File Output Operator
               compressed: false
-              Statistics: Num rows: 5 Data size: 1000 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 5 Data size: 2430 Basic stats: COMPLETE Column stats: NONE
               table:
                   input format: org.apache.hadoop.mapred.TextInputFormat
                   output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
@@ -227,13 +227,13 @@ STAGE PLANS:
             Select Operator
               expressions: _col0 (type: string), _col1 (type: string), '2011-11-11' (type: string)
               outputColumnNames: one, two, ds
-              Statistics: Num rows: 5 Data size: 1000 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 5 Data size: 2430 Basic stats: COMPLETE Column stats: NONE
               Group By Operator
                 aggregations: compute_stats(one, 'hll'), compute_stats(two, 'hll')
                 keys: ds (type: string)
                 mode: hash
                 outputColumnNames: _col0, _col1, _col2
-                Statistics: Num rows: 5 Data size: 1000 Basic stats: COMPLETE Column stats: NONE
+                Statistics: Num rows: 5 Data size: 2430 Basic stats: COMPLETE Column stats: NONE
                 File Output Operator
                   compressed: false
                   table:
@@ -269,7 +269,7 @@ STAGE PLANS:
               key expressions: _col0 (type: string)
               sort order: +
               Map-reduce partition columns: _col0 (type: string)
-              Statistics: Num rows: 5 Data size: 1000 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 5 Data size: 2430 Basic stats: COMPLETE Column stats: NONE
               value expressions: _col1 (type: struct<columntype:string,maxlength:bigint,sumlength:bigint,count:bigint,countnulls:bigint,bitvector:binary>), _col2 (type: struct<columntype:string,maxlength:bigint,sumlength:bigint,count:bigint,countnulls:bigint,bitvector:binary>)
       Reduce Operator Tree:
         Group By Operator
@@ -277,14 +277,14 @@ STAGE PLANS:
           keys: KEY._col0 (type: string)
           mode: mergepartial
           outputColumnNames: _col0, _col1, _col2
-          Statistics: Num rows: 2 Data size: 400 Basic stats: COMPLETE Column stats: NONE
+          Statistics: Num rows: 2 Data size: 972 Basic stats: COMPLETE Column stats: NONE
           Select Operator
             expressions: _col1 (type: struct<columntype:string,maxlength:bigint,avglength:double,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), _col2 (type: struct<columntype:string,maxlength:bigint,avglength:double,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), _col0 (type: string)
             outputColumnNames: _col0, _col1, _col2
-            Statistics: Num rows: 2 Data size: 400 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 2 Data size: 972 Basic stats: COMPLETE Column stats: NONE
             File Output Operator
               compressed: false
-              Statistics: Num rows: 2 Data size: 400 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 2 Data size: 972 Basic stats: COMPLETE Column stats: NONE
               table:
                   input format: org.apache.hadoop.mapred.SequenceFileInputFormat
                   output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat

http://git-wip-us.apache.org/repos/asf/hive/blob/d0fa7d55/ql/src/test/results/clientpositive/insert_into2.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/insert_into2.q.out b/ql/src/test/results/clientpositive/insert_into2.q.out
index 13ad212..efffd53 100644
--- a/ql/src/test/results/clientpositive/insert_into2.q.out
+++ b/ql/src/test/results/clientpositive/insert_into2.q.out
@@ -571,9 +571,9 @@ STAGE PLANS:
       Map Operator Tree:
           TableScan
             alias: insert_into2
-            Statistics: Num rows: 50 Data size: 5300 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 50 Data size: 530 Basic stats: COMPLETE Column stats: NONE
             Select Operator
-              Statistics: Num rows: 50 Data size: 5300 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 50 Data size: 530 Basic stats: COMPLETE Column stats: NONE
               Group By Operator
                 aggregations: count()
                 mode: hash

http://git-wip-us.apache.org/repos/asf/hive/blob/d0fa7d55/ql/src/test/results/clientpositive/list_bucket_query_oneskew_1.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/list_bucket_query_oneskew_1.q.out b/ql/src/test/results/clientpositive/list_bucket_query_oneskew_1.q.out
index 1076df5..bb75940 100644
--- a/ql/src/test/results/clientpositive/list_bucket_query_oneskew_1.q.out
+++ b/ql/src/test/results/clientpositive/list_bucket_query_oneskew_1.q.out
@@ -185,16 +185,16 @@ STAGE PLANS:
       Processor Tree:
         TableScan
           alias: fact_daily
-          Statistics: Num rows: 2 Data size: 8 Basic stats: COMPLETE Column stats: NONE
+          Statistics: Num rows: 1 Data size: 80 Basic stats: PARTIAL Column stats: NONE
           GatherStats: false
           Filter Operator
             isSamplingPred: false
             predicate: (x = 484) (type: boolean)
-            Statistics: Num rows: 1 Data size: 4 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 1 Data size: 80 Basic stats: PARTIAL Column stats: NONE
             Select Operator
               expressions: 484 (type: int)
               outputColumnNames: _col0
-              Statistics: Num rows: 1 Data size: 4 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 1 Data size: 80 Basic stats: PARTIAL Column stats: NONE
               ListSink
 
 PREHOOK: query: SELECT x FROM fact_daily WHERE ds='1' and x=484
@@ -266,16 +266,16 @@ STAGE PLANS:
       Processor Tree:
         TableScan
           alias: fact_daily
-          Statistics: Num rows: 2 Data size: 8 Basic stats: COMPLETE Column stats: NONE
+          Statistics: Num rows: 1 Data size: 80 Basic stats: PARTIAL Column stats: NONE
           GatherStats: false
           Filter Operator
             isSamplingPred: false
             predicate: (x = 495) (type: boolean)
-            Statistics: Num rows: 1 Data size: 4 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 1 Data size: 80 Basic stats: PARTIAL Column stats: NONE
             Select Operator
               expressions: 495 (type: int)
               outputColumnNames: _col0
-              Statistics: Num rows: 1 Data size: 4 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 1 Data size: 80 Basic stats: PARTIAL Column stats: NONE
               ListSink
 
 PREHOOK: query: SELECT x FROM fact_daily WHERE ds='1' and x=495
@@ -347,16 +347,16 @@ STAGE PLANS:
       Processor Tree:
         TableScan
           alias: fact_daily
-          Statistics: Num rows: 2 Data size: 8 Basic stats: COMPLETE Column stats: NONE
+          Statistics: Num rows: 1 Data size: 80 Basic stats: PARTIAL Column stats: NONE
           GatherStats: false
           Filter Operator
             isSamplingPred: false
             predicate: (x = 1) (type: boolean)
-            Statistics: Num rows: 1 Data size: 4 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 1 Data size: 80 Basic stats: PARTIAL Column stats: NONE
             Select Operator
               expressions: 1 (type: int)
               outputColumnNames: _col0
-              Statistics: Num rows: 1 Data size: 4 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 1 Data size: 80 Basic stats: PARTIAL Column stats: NONE
               ListSink
 
 PREHOOK: query: SELECT x FROM fact_daily WHERE ds='1' and x=1

http://git-wip-us.apache.org/repos/asf/hive/blob/d0fa7d55/ql/src/test/results/clientpositive/list_bucket_query_oneskew_2.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/list_bucket_query_oneskew_2.q.out b/ql/src/test/results/clientpositive/list_bucket_query_oneskew_2.q.out
index 3e595fc..54c9b38 100644
--- a/ql/src/test/results/clientpositive/list_bucket_query_oneskew_2.q.out
+++ b/ql/src/test/results/clientpositive/list_bucket_query_oneskew_2.q.out
@@ -188,16 +188,16 @@ STAGE PLANS:
       Processor Tree:
         TableScan
           alias: fact_daily
-          Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE Column stats: NONE
+          Statistics: Num rows: 1 Data size: 240 Basic stats: PARTIAL Column stats: NONE
           GatherStats: false
           Filter Operator
             isSamplingPred: false
             predicate: (x = 484) (type: boolean)
-            Statistics: Num rows: 3 Data size: 12 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 1 Data size: 240 Basic stats: PARTIAL Column stats: NONE
             Select Operator
               expressions: 484 (type: int)
               outputColumnNames: _col0
-              Statistics: Num rows: 3 Data size: 12 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 1 Data size: 240 Basic stats: PARTIAL Column stats: NONE
               ListSink
 
 PREHOOK: query: select x from (select * from fact_daily where ds = '1') subq where x = 484
@@ -269,16 +269,16 @@ STAGE PLANS:
       Processor Tree:
         TableScan
           alias: fact_daily
-          Statistics: Num rows: 1 Data size: 24 Basic stats: PARTIAL Column stats: NONE
+          Statistics: Num rows: 1 Data size: 240 Basic stats: PARTIAL Column stats: NONE
           GatherStats: false
           Filter Operator
             isSamplingPred: false
             predicate: (x = 484) (type: boolean)
-            Statistics: Num rows: 1 Data size: 24 Basic stats: PARTIAL Column stats: NONE
+            Statistics: Num rows: 1 Data size: 240 Basic stats: PARTIAL Column stats: NONE
             Select Operator
               expressions: 484 (type: int), y (type: string)
               outputColumnNames: _col0, _col1
-              Statistics: Num rows: 1 Data size: 24 Basic stats: PARTIAL Column stats: NONE
+              Statistics: Num rows: 1 Data size: 240 Basic stats: PARTIAL Column stats: NONE
               ListSink
 
 PREHOOK: query: select x1, y1 from(select x as x1, y as y1 from fact_daily where ds ='1') subq where x1 = 484
@@ -306,28 +306,28 @@ STAGE PLANS:
       Map Operator Tree:
           TableScan
             alias: fact_daily
-            Statistics: Num rows: 1 Data size: 24 Basic stats: PARTIAL Column stats: NONE
+            Statistics: Num rows: 1 Data size: 240 Basic stats: PARTIAL Column stats: NONE
             GatherStats: false
             Filter Operator
               isSamplingPred: false
               predicate: (x = 484) (type: boolean)
-              Statistics: Num rows: 1 Data size: 24 Basic stats: PARTIAL Column stats: NONE
+              Statistics: Num rows: 1 Data size: 240 Basic stats: PARTIAL Column stats: NONE
               Select Operator
                 expressions: y (type: string)
                 outputColumnNames: y
-                Statistics: Num rows: 1 Data size: 24 Basic stats: PARTIAL Column stats: NONE
+                Statistics: Num rows: 1 Data size: 240 Basic stats: PARTIAL Column stats: NONE
                 Group By Operator
                   aggregations: count()
                   keys: y (type: string)
                   mode: hash
                   outputColumnNames: _col0, _col1
-                  Statistics: Num rows: 1 Data size: 24 Basic stats: PARTIAL Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 240 Basic stats: PARTIAL Column stats: NONE
                   Reduce Output Operator
                     key expressions: _col0 (type: string)
                     null sort order: a
                     sort order: +
                     Map-reduce partition columns: _col0 (type: string)
-                    Statistics: Num rows: 1 Data size: 24 Basic stats: PARTIAL Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 240 Basic stats: PARTIAL Column stats: NONE
                     tag: -1
                     value expressions: _col1 (type: bigint)
                     auto parallelism: false
@@ -388,13 +388,13 @@ STAGE PLANS:
           keys: KEY._col0 (type: string)
           mode: mergepartial
           outputColumnNames: _col0, _col1
-          Statistics: Num rows: 1 Data size: 24 Basic stats: PARTIAL Column stats: NONE
+          Statistics: Num rows: 1 Data size: 240 Basic stats: PARTIAL Column stats: NONE
           File Output Operator
             compressed: false
             GlobalTableId: 0
 #### A masked pattern was here ####
             NumFilesPerFileSink: 1
-            Statistics: Num rows: 1 Data size: 24 Basic stats: PARTIAL Column stats: NONE
+            Statistics: Num rows: 1 Data size: 240 Basic stats: PARTIAL Column stats: NONE
 #### A masked pattern was here ####
             table:
                 input format: org.apache.hadoop.mapred.SequenceFileInputFormat
@@ -443,26 +443,26 @@ STAGE PLANS:
       Map Operator Tree:
           TableScan
             alias: fact_daily
-            Statistics: Num rows: 6 Data size: 24 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 1 Data size: 240 Basic stats: PARTIAL Column stats: NONE
             GatherStats: false
             Filter Operator
               isSamplingPred: false
               predicate: (x = 484) (type: boolean)
-              Statistics: Num rows: 3 Data size: 12 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 1 Data size: 240 Basic stats: PARTIAL Column stats: NONE
               Select Operator
-                Statistics: Num rows: 3 Data size: 12 Basic stats: COMPLETE Column stats: NONE
+                Statistics: Num rows: 1 Data size: 240 Basic stats: PARTIAL Column stats: NONE
                 Group By Operator
                   aggregations: count()
                   keys: 484 (type: int)
                   mode: hash
                   outputColumnNames: _col0, _col1
-                  Statistics: Num rows: 3 Data size: 12 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 1 Data size: 240 Basic stats: PARTIAL Column stats: NONE
                   Reduce Output Operator
                     key expressions: _col0 (type: int)
                     null sort order: a
                     sort order: +
                     Map-reduce partition columns: _col0 (type: int)
-                    Statistics: Num rows: 3 Data size: 12 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 1 Data size: 240 Basic stats: PARTIAL Column stats: NONE
                     tag: -1
                     value expressions: _col1 (type: bigint)
                     auto parallelism: false
@@ -523,17 +523,17 @@ STAGE PLANS:
           keys: KEY._col0 (type: int)
           mode: mergepartial
           outputColumnNames: _col0, _col1
-          Statistics: Num rows: 1 Data size: 4 Basic stats: COMPLETE Column stats: NONE
+          Statistics: Num rows: 1 Data size: 240 Basic stats: PARTIAL Column stats: NONE
           Select Operator
             expressions: 484 (type: int), _col1 (type: bigint)
             outputColumnNames: _col0, _col1
-            Statistics: Num rows: 1 Data size: 4 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 1 Data size: 240 Basic stats: PARTIAL Column stats: NONE
             File Output Operator
               compressed: false
               GlobalTableId: 0
 #### A masked pattern was here ####
               NumFilesPerFileSink: 1
-              Statistics: Num rows: 1 Data size: 4 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 1 Data size: 240 Basic stats: PARTIAL Column stats: NONE
 #### A masked pattern was here ####
               table:
                   input format: org.apache.hadoop.mapred.SequenceFileInputFormat

http://git-wip-us.apache.org/repos/asf/hive/blob/d0fa7d55/ql/src/test/results/clientpositive/list_bucket_query_oneskew_3.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/list_bucket_query_oneskew_3.q.out b/ql/src/test/results/clientpositive/list_bucket_query_oneskew_3.q.out
index 9d30759..cc8d3ce 100644
--- a/ql/src/test/results/clientpositive/list_bucket_query_oneskew_3.q.out
+++ b/ql/src/test/results/clientpositive/list_bucket_query_oneskew_3.q.out
@@ -208,16 +208,16 @@ STAGE PLANS:
       Processor Tree:
         TableScan
           alias: fact_daily
-          Statistics: Num rows: 29 Data size: 117 Basic stats: COMPLETE Column stats: NONE
+          Statistics: Num rows: 2 Data size: 1170 Basic stats: COMPLETE Column stats: NONE
           GatherStats: false
           Filter Operator
             isSamplingPred: false
             predicate: (x <> 86) (type: boolean)
-            Statistics: Num rows: 29 Data size: 117 Basic stats: COMPLETE Column stats: NONE
+            Statistics: Num rows: 2 Data size: 1170 Basic stats: COMPLETE Column stats: NONE
             Select Operator
               expressions: x (type: int)
               outputColumnNames: _col0
-              Statistics: Num rows: 29 Data size: 117 Basic stats: COMPLETE Column stats: NONE
+              Statistics: Num rows: 2 Data size: 1170 Basic stats: COMPLETE Column stats: NONE
               ListSink
 
 PREHOOK: query: SELECT x FROM fact_daily WHERE ds='1' and not (x = 86)

http://git-wip-us.apache.org/repos/asf/hive/blob/d0fa7d55/ql/src/test/results/clientpositive/llap/auto_sortmerge_join_1.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/llap/auto_sortmerge_join_1.q.out b/ql/src/test/results/clientpositive/llap/auto_sortmerge_join_1.q.out
index 8fc43e4..3c3e913 100644
--- a/ql/src/test/results/clientpositive/llap/auto_sortmerge_join_1.q.out
+++ b/ql/src/test/results/clientpositive/llap/auto_sortmerge_join_1.q.out
@@ -119,16 +119,16 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: a
-                  Statistics: Num rows: 1 Data size: 298 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 2 Data size: 1508 Basic stats: COMPLETE Column stats: NONE
                   GatherStats: false
                   Filter Operator
                     isSamplingPred: false
                     predicate: key is not null (type: boolean)
-                    Statistics: Num rows: 1 Data size: 298 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 2 Data size: 1508 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: key (type: string)
                       outputColumnNames: _col0
-                      Statistics: Num rows: 1 Data size: 298 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 2 Data size: 1508 Basic stats: COMPLETE Column stats: NONE
             Path -> Alias:
 #### A masked pattern was here ####
             Path -> Partition:
@@ -185,16 +185,16 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: b
-                  Statistics: Num rows: 116 Data size: 32232 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 240 Data size: 158376 Basic stats: COMPLETE Column stats: NONE
                   GatherStats: false
                   Filter Operator
                     isSamplingPred: false
                     predicate: key is not null (type: boolean)
-                    Statistics: Num rows: 111 Data size: 30842 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 228 Data size: 150457 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: key (type: string)
                       outputColumnNames: _col0
-                      Statistics: Num rows: 111 Data size: 30842 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 228 Data size: 150457 Basic stats: COMPLETE Column stats: NONE
                       Merge Join Operator
                         condition map:
                              Inner Join 0 to 1
@@ -202,7 +202,7 @@ STAGE PLANS:
                           0 _col0 (type: string)
                           1 _col0 (type: string)
                         Position of Big Table: 1
-                        Statistics: Num rows: 122 Data size: 33926 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 250 Data size: 165502 Basic stats: COMPLETE Column stats: NONE
                         Group By Operator
                           aggregations: count()
                           mode: hash
@@ -393,16 +393,16 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: b
-                  Statistics: Num rows: 1 Data size: 298 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 2 Data size: 1508 Basic stats: COMPLETE Column stats: NONE
                   GatherStats: false
                   Filter Operator
                     isSamplingPred: false
                     predicate: key is not null (type: boolean)
-                    Statistics: Num rows: 1 Data size: 298 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 2 Data size: 1508 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: key (type: string)
                       outputColumnNames: _col0
-                      Statistics: Num rows: 1 Data size: 298 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 2 Data size: 1508 Basic stats: COMPLETE Column stats: NONE
             Path -> Alias:
 #### A masked pattern was here ####
             Path -> Partition:
@@ -459,16 +459,16 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: a
-                  Statistics: Num rows: 116 Data size: 32232 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 240 Data size: 158376 Basic stats: COMPLETE Column stats: NONE
                   GatherStats: false
                   Filter Operator
                     isSamplingPred: false
                     predicate: key is not null (type: boolean)
-                    Statistics: Num rows: 111 Data size: 30842 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 228 Data size: 150457 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: key (type: string)
                       outputColumnNames: _col0
-                      Statistics: Num rows: 111 Data size: 30842 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 228 Data size: 150457 Basic stats: COMPLETE Column stats: NONE
                       Merge Join Operator
                         condition map:
                              Inner Join 0 to 1
@@ -476,7 +476,7 @@ STAGE PLANS:
                           0 _col0 (type: string)
                           1 _col0 (type: string)
                         Position of Big Table: 0
-                        Statistics: Num rows: 122 Data size: 33926 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 250 Data size: 165502 Basic stats: COMPLETE Column stats: NONE
                         Group By Operator
                           aggregations: count()
                           mode: hash
@@ -667,16 +667,16 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: b
-                  Statistics: Num rows: 1 Data size: 298 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 2 Data size: 1508 Basic stats: COMPLETE Column stats: NONE
                   GatherStats: false
                   Filter Operator
                     isSamplingPred: false
                     predicate: key is not null (type: boolean)
-                    Statistics: Num rows: 1 Data size: 298 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 2 Data size: 1508 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: key (type: string)
                       outputColumnNames: _col0
-                      Statistics: Num rows: 1 Data size: 298 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 2 Data size: 1508 Basic stats: COMPLETE Column stats: NONE
             Path -> Alias:
 #### A masked pattern was here ####
             Path -> Partition:
@@ -733,16 +733,16 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: a
-                  Statistics: Num rows: 116 Data size: 32232 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 240 Data size: 158376 Basic stats: COMPLETE Column stats: NONE
                   GatherStats: false
                   Filter Operator
                     isSamplingPred: false
                     predicate: key is not null (type: boolean)
-                    Statistics: Num rows: 111 Data size: 30842 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 228 Data size: 150457 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: key (type: string)
                       outputColumnNames: _col0
-                      Statistics: Num rows: 111 Data size: 30842 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 228 Data size: 150457 Basic stats: COMPLETE Column stats: NONE
                       Merge Join Operator
                         condition map:
                              Inner Join 0 to 1
@@ -750,7 +750,7 @@ STAGE PLANS:
                           0 _col0 (type: string)
                           1 _col0 (type: string)
                         Position of Big Table: 0
-                        Statistics: Num rows: 122 Data size: 33926 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 250 Data size: 165502 Basic stats: COMPLETE Column stats: NONE
                         Group By Operator
                           aggregations: count()
                           mode: hash

http://git-wip-us.apache.org/repos/asf/hive/blob/d0fa7d55/ql/src/test/results/clientpositive/llap/auto_sortmerge_join_11.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/llap/auto_sortmerge_join_11.q.out b/ql/src/test/results/clientpositive/llap/auto_sortmerge_join_11.q.out
index 3eb8fde..d6ecf9c 100644
--- a/ql/src/test/results/clientpositive/llap/auto_sortmerge_join_11.q.out
+++ b/ql/src/test/results/clientpositive/llap/auto_sortmerge_join_11.q.out
@@ -118,22 +118,22 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: a
-                  Statistics: Num rows: 1 Data size: 298 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 2 Data size: 1508 Basic stats: COMPLETE Column stats: NONE
                   GatherStats: false
                   Filter Operator
                     isSamplingPred: false
                     predicate: key is not null (type: boolean)
-                    Statistics: Num rows: 1 Data size: 298 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 2 Data size: 1508 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: key (type: string)
                       outputColumnNames: _col0
-                      Statistics: Num rows: 1 Data size: 298 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 2 Data size: 1508 Basic stats: COMPLETE Column stats: NONE
                       Reduce Output Operator
                         key expressions: _col0 (type: string)
                         null sort order: a
                         sort order: +
                         Map-reduce partition columns: _col0 (type: string)
-                        Statistics: Num rows: 1 Data size: 298 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 2 Data size: 1508 Basic stats: COMPLETE Column stats: NONE
                         tag: 0
                         auto parallelism: true
             Execution mode: llap
@@ -196,22 +196,22 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: b
-                  Statistics: Num rows: 116 Data size: 32232 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 240 Data size: 158376 Basic stats: COMPLETE Column stats: NONE
                   GatherStats: false
                   Filter Operator
                     isSamplingPred: false
                     predicate: key is not null (type: boolean)
-                    Statistics: Num rows: 111 Data size: 30842 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 228 Data size: 150457 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: key (type: string)
                       outputColumnNames: _col0
-                      Statistics: Num rows: 111 Data size: 30842 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 228 Data size: 150457 Basic stats: COMPLETE Column stats: NONE
                       Reduce Output Operator
                         key expressions: _col0 (type: string)
                         null sort order: a
                         sort order: +
                         Map-reduce partition columns: _col0 (type: string)
-                        Statistics: Num rows: 111 Data size: 30842 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 228 Data size: 150457 Basic stats: COMPLETE Column stats: NONE
                         tag: 1
                         auto parallelism: true
             Execution mode: llap
@@ -331,7 +331,7 @@ STAGE PLANS:
                   0 _col0 (type: string)
                   1 _col0 (type: string)
                 Position of Big Table: 1
-                Statistics: Num rows: 122 Data size: 33926 Basic stats: COMPLETE Column stats: NONE
+                Statistics: Num rows: 250 Data size: 165502 Basic stats: COMPLETE Column stats: NONE
                 Group By Operator
                   aggregations: count()
                   mode: hash
@@ -419,16 +419,16 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: a
-                  Statistics: Num rows: 1 Data size: 298 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 2 Data size: 1508 Basic stats: COMPLETE Column stats: NONE
                   GatherStats: false
                   Filter Operator
                     isSamplingPred: false
                     predicate: key is not null (type: boolean)
-                    Statistics: Num rows: 1 Data size: 298 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 2 Data size: 1508 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: key (type: string)
                       outputColumnNames: _col0
-                      Statistics: Num rows: 1 Data size: 298 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 2 Data size: 1508 Basic stats: COMPLETE Column stats: NONE
             Path -> Alias:
 #### A masked pattern was here ####
             Path -> Partition:
@@ -485,16 +485,16 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: b
-                  Statistics: Num rows: 116 Data size: 32232 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 240 Data size: 158376 Basic stats: COMPLETE Column stats: NONE
                   GatherStats: false
                   Filter Operator
                     isSamplingPred: false
                     predicate: key is not null (type: boolean)
-                    Statistics: Num rows: 111 Data size: 30842 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 228 Data size: 150457 Basic stats: COMPLETE Column stats: NONE
                     Select Operator
                       expressions: key (type: string)
                       outputColumnNames: _col0
-                      Statistics: Num rows: 111 Data size: 30842 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 228 Data size: 150457 Basic stats: COMPLETE Column stats: NONE
                       Merge Join Operator
                         condition map:
                              Inner Join 0 to 1
@@ -502,7 +502,7 @@ STAGE PLANS:
                           0 _col0 (type: string)
                           1 _col0 (type: string)
                         Position of Big Table: 1
-                        Statistics: Num rows: 122 Data size: 33926 Basic stats: COMPLETE Column stats: NONE
+                        Statistics: Num rows: 250 Data size: 165502 Basic stats: COMPLETE Column stats: NONE
                         Group By Operator
                           aggregations: count()
                           mode: hash
@@ -693,12 +693,12 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: a
-                  Statistics: Num rows: 1 Data size: 298 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 2 Data size: 1508 Basic stats: COMPLETE Column stats: NONE
                   GatherStats: false
                   Filter Operator
                     isSamplingPred: false
                     predicate: key is not null (type: boolean)
-                    Statistics: Num rows: 1 Data size: 298 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 2 Data size: 1508 Basic stats: COMPLETE Column stats: NONE
             Path -> Alias:
 #### A masked pattern was here ####
             Path -> Partition:
@@ -755,12 +755,12 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: b
-                  Statistics: Num rows: 116 Data size: 32232 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 240 Data size: 158376 Basic stats: COMPLETE Column stats: NONE
                   GatherStats: false
                   Filter Operator
                     isSamplingPred: false
                     predicate: key is not null (type: boolean)
-                    Statistics: Num rows: 111 Data size: 30842 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 228 Data size: 150457 Basic stats: COMPLETE Column stats: NONE
                     Merge Join Operator
                       condition map:
                            Inner Join 0 to 1
@@ -768,7 +768,7 @@ STAGE PLANS:
                         0 key (type: string)
                         1 key (type: string)
                       Position of Big Table: 1
-                      Statistics: Num rows: 122 Data size: 33926 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 250 Data size: 165502 Basic stats: COMPLETE Column stats: NONE
                       Group By Operator
                         aggregations: count()
                         mode: hash
@@ -959,12 +959,12 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: a
-                  Statistics: Num rows: 1 Data size: 298 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 2 Data size: 1508 Basic stats: COMPLETE Column stats: NONE
                   GatherStats: false
                   Filter Operator
                     isSamplingPred: false
                     predicate: key is not null (type: boolean)
-                    Statistics: Num rows: 1 Data size: 298 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 2 Data size: 1508 Basic stats: COMPLETE Column stats: NONE
             Path -> Alias:
 #### A masked pattern was here ####
             Path -> Partition:
@@ -1021,12 +1021,12 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: c
-                  Statistics: Num rows: 116 Data size: 32232 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 240 Data size: 158376 Basic stats: COMPLETE Column stats: NONE
                   GatherStats: false
                   Filter Operator
                     isSamplingPred: false
                     predicate: key is not null (type: boolean)
-                    Statistics: Num rows: 111 Data size: 30842 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 228 Data size: 150457 Basic stats: COMPLETE Column stats: NONE
             Path -> Alias:
 #### A masked pattern was here ####
             Path -> Partition:
@@ -1132,12 +1132,12 @@ STAGE PLANS:
             Map Operator Tree:
                 TableScan
                   alias: b
-                  Statistics: Num rows: 116 Data size: 32232 Basic stats: COMPLETE Column stats: NONE
+                  Statistics: Num rows: 240 Data size: 158376 Basic stats: COMPLETE Column stats: NONE
                   GatherStats: false
                   Filter Operator
                     isSamplingPred: false
                     predicate: key is not null (type: boolean)
-                    Statistics: Num rows: 111 Data size: 30842 Basic stats: COMPLETE Column stats: NONE
+                    Statistics: Num rows: 228 Data size: 150457 Basic stats: COMPLETE Column stats: NONE
                     Merge Join Operator
                       condition map:
                            Inner Join 0 to 1
@@ -1147,7 +1147,7 @@ STAGE PLANS:
                         1 key (type: string)
                         2 key (type: string)
                       Position of Big Table: 1
-                      Statistics: Num rows: 244 Data size: 67852 Basic stats: COMPLETE Column stats: NONE
+                      Statistics: Num rows: 501 Data size: 331005 Basic stats: COMPLETE Column stats: NONE
                       Group By Operator
                         aggregations: count()
                         mode: hash