You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@hive.apache.org by kg...@apache.org on 2019/01/23 16:39:09 UTC
[37/51] [partial] hive git commit: HIVE-17084: Turn on
hive.stats.fetch.column.stats configuration flag (Zoltan Haindrich reviewed
by Ashutosh Chauhan)
http://git-wip-us.apache.org/repos/asf/hive/blob/268a6e5a/ql/src/test/results/clientpositive/cbo_rp_join1.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/cbo_rp_join1.q.out b/ql/src/test/results/clientpositive/cbo_rp_join1.q.out
index 93eacf7..78d5e74 100644
--- a/ql/src/test/results/clientpositive/cbo_rp_join1.q.out
+++ b/ql/src/test/results/clientpositive/cbo_rp_join1.q.out
@@ -34,25 +34,25 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: a
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: key (type: int), value (type: int), (key = 40) (type: boolean)
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
Reduce Output Operator
sort order:
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
value expressions: _col0 (type: int), _col1 (type: int), _col2 (type: boolean)
TableScan
alias: b
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: key (type: int), value (type: int), (key = 40) (type: boolean)
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
Reduce Output Operator
sort order:
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
value expressions: _col0 (type: int), _col1 (type: int), _col2 (type: boolean)
Reduce Operator Tree:
Join Operator
@@ -65,11 +65,11 @@ STAGE PLANS:
0
1
outputColumnNames: _col0, _col1, _col3, _col4
- Statistics: Num rows: 1 Data size: 441 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 17 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: hash(_col0,_col1,_col3,_col4) (type: int)
outputColumnNames: _col0
- Statistics: Num rows: 1 Data size: 441 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 17 Basic stats: COMPLETE Column stats: NONE
Group By Operator
aggregations: sum(_col0)
mode: hash
@@ -141,25 +141,25 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: a
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: key (type: int), value (type: int), (key = 40) (type: boolean), (value = 40) (type: boolean)
outputColumnNames: _col0, _col1, _col2, _col3
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
Reduce Output Operator
sort order:
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
value expressions: _col0 (type: int), _col1 (type: int), _col2 (type: boolean), _col3 (type: boolean)
TableScan
alias: b
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: key (type: int), value (type: int), (key = 40) (type: boolean)
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
Reduce Output Operator
sort order:
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
value expressions: _col0 (type: int), _col1 (type: int), _col2 (type: boolean)
Reduce Operator Tree:
Join Operator
@@ -172,11 +172,11 @@ STAGE PLANS:
0
1
outputColumnNames: _col0, _col1, _col4, _col5
- Statistics: Num rows: 1 Data size: 441 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 17 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: hash(_col0,_col1,_col4,_col5) (type: int)
outputColumnNames: _col0
- Statistics: Num rows: 1 Data size: 441 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 17 Basic stats: COMPLETE Column stats: NONE
Group By Operator
aggregations: sum(_col0)
mode: hash
@@ -248,25 +248,25 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: a
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: key (type: int), value (type: int), (key = 40) (type: boolean)
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
Reduce Output Operator
sort order:
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
value expressions: _col0 (type: int), _col1 (type: int), _col2 (type: boolean)
TableScan
alias: b
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: key (type: int), value (type: int), (key = 40) (type: boolean)
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
Reduce Output Operator
sort order:
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
value expressions: _col0 (type: int), _col1 (type: int), _col2 (type: boolean)
Reduce Operator Tree:
Join Operator
@@ -279,11 +279,11 @@ STAGE PLANS:
0
1
outputColumnNames: _col0, _col1, _col3, _col4
- Statistics: Num rows: 1 Data size: 441 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 17 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: hash(_col0,_col1,_col3,_col4) (type: int)
outputColumnNames: _col0
- Statistics: Num rows: 1 Data size: 441 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 17 Basic stats: COMPLETE Column stats: NONE
Group By Operator
aggregations: sum(_col0)
mode: hash
@@ -355,25 +355,25 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: a
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: key (type: int), value (type: int), (key > 40) (type: boolean), (value > 50) (type: boolean), (key = value) (type: boolean)
outputColumnNames: _col0, _col1, _col2, _col3, _col4
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
Reduce Output Operator
sort order:
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
value expressions: _col0 (type: int), _col1 (type: int), _col2 (type: boolean), _col3 (type: boolean), _col4 (type: boolean)
TableScan
alias: b
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: key (type: int), value (type: int), (key > 40) (type: boolean), (value > 50) (type: boolean), (key = value) (type: boolean)
outputColumnNames: _col0, _col1, _col2, _col3, _col4
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
Reduce Output Operator
sort order:
- Statistics: Num rows: 1 Data size: 220 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
value expressions: _col0 (type: int), _col1 (type: int), _col2 (type: boolean), _col3 (type: boolean), _col4 (type: boolean)
Reduce Operator Tree:
Join Operator
@@ -386,11 +386,11 @@ STAGE PLANS:
0
1
outputColumnNames: _col0, _col1, _col5, _col6
- Statistics: Num rows: 1 Data size: 441 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 17 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: hash(_col0,_col1,_col5,_col6) (type: int)
outputColumnNames: _col0
- Statistics: Num rows: 1 Data size: 441 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 17 Basic stats: COMPLETE Column stats: NONE
Group By Operator
aggregations: sum(_col0)
mode: hash
http://git-wip-us.apache.org/repos/asf/hive/blob/268a6e5a/ql/src/test/results/clientpositive/cbo_rp_outer_join_ppr.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/cbo_rp_outer_join_ppr.q.out b/ql/src/test/results/clientpositive/cbo_rp_outer_join_ppr.q.out
index 8fd669b..684155f 100644
--- a/ql/src/test/results/clientpositive/cbo_rp_outer_join_ppr.q.out
+++ b/ql/src/test/results/clientpositive/cbo_rp_outer_join_ppr.q.out
@@ -37,44 +37,44 @@ STAGE PLANS:
TableScan
alias: a
filterExpr: ((UDFToDouble(key) < 20.0D) and (UDFToDouble(key) > 15.0D)) (type: boolean)
- Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE
GatherStats: false
Filter Operator
isSamplingPred: false
predicate: ((UDFToDouble(key) < 20.0D) and (UDFToDouble(key) > 15.0D)) (type: boolean)
- Statistics: Num rows: 55 Data size: 584 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 55 Data size: 9790 Basic stats: COMPLETE Column stats: COMPLETE
Select Operator
expressions: key (type: string), value (type: string)
outputColumnNames: key, value
- Statistics: Num rows: 55 Data size: 584 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 55 Data size: 9790 Basic stats: COMPLETE Column stats: COMPLETE
Reduce Output Operator
key expressions: key (type: string)
null sort order: a
sort order: +
Map-reduce partition columns: key (type: string)
- Statistics: Num rows: 55 Data size: 584 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 55 Data size: 9790 Basic stats: COMPLETE Column stats: COMPLETE
tag: 0
value expressions: value (type: string)
auto parallelism: false
TableScan
alias: b
filterExpr: ((UDFToDouble(key) > 15.0D) and (UDFToDouble(key) < 20.0D)) (type: boolean)
- Statistics: Num rows: 1000 Data size: 10624 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1000 Data size: 178000 Basic stats: COMPLETE Column stats: COMPLETE
GatherStats: false
Filter Operator
isSamplingPred: false
predicate: ((UDFToDouble(key) < 20.0D) and (UDFToDouble(key) > 15.0D)) (type: boolean)
- Statistics: Num rows: 111 Data size: 1179 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 111 Data size: 19758 Basic stats: COMPLETE Column stats: COMPLETE
Select Operator
expressions: key (type: string), value (type: string)
outputColumnNames: key, value
- Statistics: Num rows: 111 Data size: 1179 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 111 Data size: 30192 Basic stats: COMPLETE Column stats: COMPLETE
Reduce Output Operator
key expressions: key (type: string)
null sort order: a
sort order: +
Map-reduce partition columns: key (type: string)
- Statistics: Num rows: 111 Data size: 1179 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 111 Data size: 30192 Basic stats: COMPLETE Column stats: COMPLETE
tag: 1
value expressions: value (type: string)
auto parallelism: false
@@ -240,17 +240,17 @@ STAGE PLANS:
0 key (type: string)
1 key (type: string)
outputColumnNames: key, value, key0, value0
- Statistics: Num rows: 122 Data size: 1296 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 55 Data size: 19580 Basic stats: COMPLETE Column stats: COMPLETE
Select Operator
expressions: key (type: string), value (type: string), key0 (type: string), value0 (type: string)
outputColumnNames: key, value, key0, value0
- Statistics: Num rows: 122 Data size: 1296 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 55 Data size: 19580 Basic stats: COMPLETE Column stats: COMPLETE
File Output Operator
compressed: false
GlobalTableId: 0
#### A masked pattern was here ####
NumFilesPerFileSink: 1
- Statistics: Num rows: 122 Data size: 1296 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 55 Data size: 19580 Basic stats: COMPLETE Column stats: COMPLETE
#### A masked pattern was here ####
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
@@ -351,44 +351,44 @@ STAGE PLANS:
TableScan
alias: a
filterExpr: ((UDFToDouble(key) < 20.0D) and (UDFToDouble(key) > 15.0D)) (type: boolean)
- Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE
GatherStats: false
Filter Operator
isSamplingPred: false
predicate: ((UDFToDouble(key) < 20.0D) and (UDFToDouble(key) > 15.0D)) (type: boolean)
- Statistics: Num rows: 55 Data size: 584 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 55 Data size: 9790 Basic stats: COMPLETE Column stats: COMPLETE
Select Operator
expressions: key (type: string), value (type: string)
outputColumnNames: key, value
- Statistics: Num rows: 55 Data size: 584 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 55 Data size: 9790 Basic stats: COMPLETE Column stats: COMPLETE
Reduce Output Operator
key expressions: key (type: string)
null sort order: a
sort order: +
Map-reduce partition columns: key (type: string)
- Statistics: Num rows: 55 Data size: 584 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 55 Data size: 9790 Basic stats: COMPLETE Column stats: COMPLETE
tag: 0
value expressions: value (type: string)
auto parallelism: false
TableScan
alias: b
filterExpr: ((UDFToDouble(key) > 15.0D) and (UDFToDouble(key) < 20.0D)) (type: boolean)
- Statistics: Num rows: 1000 Data size: 10624 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1000 Data size: 178000 Basic stats: COMPLETE Column stats: COMPLETE
GatherStats: false
Filter Operator
isSamplingPred: false
predicate: ((UDFToDouble(key) < 20.0D) and (UDFToDouble(key) > 15.0D)) (type: boolean)
- Statistics: Num rows: 111 Data size: 1179 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 111 Data size: 19758 Basic stats: COMPLETE Column stats: COMPLETE
Select Operator
expressions: key (type: string), value (type: string)
outputColumnNames: key, value
- Statistics: Num rows: 111 Data size: 1179 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 111 Data size: 30192 Basic stats: COMPLETE Column stats: COMPLETE
Reduce Output Operator
key expressions: key (type: string)
null sort order: a
sort order: +
Map-reduce partition columns: key (type: string)
- Statistics: Num rows: 111 Data size: 1179 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 111 Data size: 30192 Basic stats: COMPLETE Column stats: COMPLETE
tag: 1
value expressions: value (type: string)
auto parallelism: false
@@ -554,17 +554,17 @@ STAGE PLANS:
0 key (type: string)
1 key (type: string)
outputColumnNames: key, value, key0, value0
- Statistics: Num rows: 122 Data size: 1296 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 55 Data size: 19580 Basic stats: COMPLETE Column stats: COMPLETE
Select Operator
expressions: key (type: string), value (type: string), key0 (type: string), value0 (type: string)
outputColumnNames: key, value, key0, value0
- Statistics: Num rows: 122 Data size: 1296 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 55 Data size: 19580 Basic stats: COMPLETE Column stats: COMPLETE
File Output Operator
compressed: false
GlobalTableId: 0
#### A masked pattern was here ####
NumFilesPerFileSink: 1
- Statistics: Num rows: 122 Data size: 1296 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 55 Data size: 19580 Basic stats: COMPLETE Column stats: COMPLETE
#### A masked pattern was here ####
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
http://git-wip-us.apache.org/repos/asf/hive/blob/268a6e5a/ql/src/test/results/clientpositive/cbo_rp_udaf_percentile_approx_23.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/cbo_rp_udaf_percentile_approx_23.q.out b/ql/src/test/results/clientpositive/cbo_rp_udaf_percentile_approx_23.q.out
index 1a998f6..15c3b37 100644
--- a/ql/src/test/results/clientpositive/cbo_rp_udaf_percentile_approx_23.q.out
+++ b/ql/src/test/results/clientpositive/cbo_rp_udaf_percentile_approx_23.q.out
@@ -514,29 +514,29 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: bucket_n1
- Statistics: Num rows: 1 Data size: 58120 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: CASE WHEN ((key < 100.0D)) THEN (NaND) ELSE (key) END (type: double)
outputColumnNames: $f0
- Statistics: Num rows: 1 Data size: 58120 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
Group By Operator
aggregations: percentile_approx($f0, 0.5)
mode: hash
outputColumnNames: _col0
- Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 168 Basic stats: COMPLETE Column stats: NONE
Reduce Output Operator
sort order:
- Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 168 Basic stats: COMPLETE Column stats: NONE
value expressions: _col0 (type: array<double>)
Reduce Operator Tree:
Group By Operator
aggregations: percentile_approx(VALUE._col0)
mode: mergepartial
outputColumnNames: $f0
- Statistics: Num rows: 1 Data size: 168 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 176 Basic stats: COMPLETE Column stats: NONE
File Output Operator
compressed: false
- Statistics: Num rows: 1 Data size: 168 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 176 Basic stats: COMPLETE Column stats: NONE
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -577,29 +577,29 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: bucket_n1
- Statistics: Num rows: 1 Data size: 58120 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: key (type: double)
outputColumnNames: $f0
- Statistics: Num rows: 1 Data size: 58120 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
Group By Operator
aggregations: percentile_approx($f0, 0.5)
mode: hash
outputColumnNames: _col0
- Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 168 Basic stats: COMPLETE Column stats: NONE
Reduce Output Operator
sort order:
- Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 168 Basic stats: COMPLETE Column stats: NONE
value expressions: _col0 (type: array<double>)
Reduce Operator Tree:
Group By Operator
aggregations: percentile_approx(VALUE._col0)
mode: mergepartial
outputColumnNames: $f0
- Statistics: Num rows: 1 Data size: 168 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 176 Basic stats: COMPLETE Column stats: NONE
File Output Operator
compressed: false
- Statistics: Num rows: 1 Data size: 168 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 176 Basic stats: COMPLETE Column stats: NONE
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
http://git-wip-us.apache.org/repos/asf/hive/blob/268a6e5a/ql/src/test/results/clientpositive/cbo_union_view.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/cbo_union_view.q.out b/ql/src/test/results/clientpositive/cbo_union_view.q.out
index a1c582e..71fb4e6 100644
--- a/ql/src/test/results/clientpositive/cbo_union_view.q.out
+++ b/ql/src/test/results/clientpositive/cbo_union_view.q.out
@@ -79,23 +79,23 @@ STAGE PLANS:
filterExpr: (key = 86) (type: boolean)
properties:
insideView TRUE
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 372 Basic stats: COMPLETE Column stats: PARTIAL
Filter Operator
predicate: (key = 86) (type: boolean)
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 372 Basic stats: COMPLETE Column stats: PARTIAL
Select Operator
expressions: value (type: string), ds (type: string)
outputColumnNames: _col0, _col1
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 368 Basic stats: COMPLETE Column stats: PARTIAL
Union
- Statistics: Num rows: 3 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1104 Basic stats: COMPLETE Column stats: PARTIAL
Select Operator
expressions: 86 (type: int), _col0 (type: string), _col1 (type: string)
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 3 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1116 Basic stats: COMPLETE Column stats: PARTIAL
File Output Operator
compressed: false
- Statistics: Num rows: 3 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1116 Basic stats: COMPLETE Column stats: PARTIAL
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -105,23 +105,23 @@ STAGE PLANS:
filterExpr: (key = 86) (type: boolean)
properties:
insideView TRUE
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 372 Basic stats: COMPLETE Column stats: PARTIAL
Filter Operator
predicate: (key = 86) (type: boolean)
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 372 Basic stats: COMPLETE Column stats: PARTIAL
Select Operator
expressions: value (type: string), ds (type: string)
outputColumnNames: _col0, _col1
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 368 Basic stats: COMPLETE Column stats: PARTIAL
Union
- Statistics: Num rows: 3 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1104 Basic stats: COMPLETE Column stats: PARTIAL
Select Operator
expressions: 86 (type: int), _col0 (type: string), _col1 (type: string)
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 3 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1116 Basic stats: COMPLETE Column stats: PARTIAL
File Output Operator
compressed: false
- Statistics: Num rows: 3 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1116 Basic stats: COMPLETE Column stats: PARTIAL
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -131,23 +131,23 @@ STAGE PLANS:
filterExpr: (key = 86) (type: boolean)
properties:
insideView TRUE
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 372 Basic stats: COMPLETE Column stats: PARTIAL
Filter Operator
predicate: (key = 86) (type: boolean)
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 372 Basic stats: COMPLETE Column stats: PARTIAL
Select Operator
expressions: value (type: string), ds (type: string)
outputColumnNames: _col0, _col1
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 368 Basic stats: COMPLETE Column stats: PARTIAL
Union
- Statistics: Num rows: 3 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1104 Basic stats: COMPLETE Column stats: PARTIAL
Select Operator
expressions: 86 (type: int), _col0 (type: string), _col1 (type: string)
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 3 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1116 Basic stats: COMPLETE Column stats: PARTIAL
File Output Operator
compressed: false
- Statistics: Num rows: 3 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1116 Basic stats: COMPLETE Column stats: PARTIAL
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -186,23 +186,23 @@ STAGE PLANS:
filterExpr: ((key = 86) and (ds = '1')) (type: boolean)
properties:
insideView TRUE
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 372 Basic stats: COMPLETE Column stats: PARTIAL
Filter Operator
predicate: ((ds = '1') and (key = 86)) (type: boolean)
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 372 Basic stats: COMPLETE Column stats: PARTIAL
Select Operator
expressions: value (type: string)
outputColumnNames: _col0
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 184 Basic stats: COMPLETE Column stats: PARTIAL
Union
- Statistics: Num rows: 3 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 552 Basic stats: COMPLETE Column stats: PARTIAL
Select Operator
expressions: 86 (type: int), _col0 (type: string), '1' (type: string)
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 3 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 819 Basic stats: COMPLETE Column stats: PARTIAL
File Output Operator
compressed: false
- Statistics: Num rows: 3 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 819 Basic stats: COMPLETE Column stats: PARTIAL
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -212,23 +212,23 @@ STAGE PLANS:
filterExpr: ((key = 86) and (ds = '1')) (type: boolean)
properties:
insideView TRUE
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 372 Basic stats: COMPLETE Column stats: PARTIAL
Filter Operator
predicate: ((ds = '1') and (key = 86)) (type: boolean)
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 372 Basic stats: COMPLETE Column stats: PARTIAL
Select Operator
expressions: value (type: string)
outputColumnNames: _col0
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 184 Basic stats: COMPLETE Column stats: PARTIAL
Union
- Statistics: Num rows: 3 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 552 Basic stats: COMPLETE Column stats: PARTIAL
Select Operator
expressions: 86 (type: int), _col0 (type: string), '1' (type: string)
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 3 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 819 Basic stats: COMPLETE Column stats: PARTIAL
File Output Operator
compressed: false
- Statistics: Num rows: 3 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 819 Basic stats: COMPLETE Column stats: PARTIAL
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -238,23 +238,23 @@ STAGE PLANS:
filterExpr: ((key = 86) and (ds = '1')) (type: boolean)
properties:
insideView TRUE
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 372 Basic stats: COMPLETE Column stats: PARTIAL
Filter Operator
predicate: ((ds = '1') and (key = 86)) (type: boolean)
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 372 Basic stats: COMPLETE Column stats: PARTIAL
Select Operator
expressions: value (type: string)
outputColumnNames: _col0
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 184 Basic stats: COMPLETE Column stats: PARTIAL
Union
- Statistics: Num rows: 3 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 552 Basic stats: COMPLETE Column stats: PARTIAL
Select Operator
expressions: 86 (type: int), _col0 (type: string), '1' (type: string)
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 3 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 819 Basic stats: COMPLETE Column stats: PARTIAL
File Output Operator
compressed: false
- Statistics: Num rows: 3 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 819 Basic stats: COMPLETE Column stats: PARTIAL
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
http://git-wip-us.apache.org/repos/asf/hive/blob/268a6e5a/ql/src/test/results/clientpositive/column_pruner_multiple_children.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/column_pruner_multiple_children.q.out b/ql/src/test/results/clientpositive/column_pruner_multiple_children.q.out
index 77cf52c..598bf82 100644
--- a/ql/src/test/results/clientpositive/column_pruner_multiple_children.q.out
+++ b/ql/src/test/results/clientpositive/column_pruner_multiple_children.q.out
@@ -40,16 +40,16 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: s_n129
- Statistics: Num rows: 1 Data size: 9 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 176 Basic stats: COMPLETE Column stats: COMPLETE
Select Operator
expressions: key (type: string), substr(value, 5) (type: string)
outputColumnNames: _col0, _col1
- Statistics: Num rows: 1 Data size: 9 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 176 Basic stats: COMPLETE Column stats: COMPLETE
Reduce Output Operator
key expressions: _col0 (type: string)
sort order: +
Map-reduce partition columns: _col0 (type: string)
- Statistics: Num rows: 1 Data size: 9 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 176 Basic stats: COMPLETE Column stats: COMPLETE
value expressions: _col1 (type: string)
Execution mode: vectorized
Reduce Operator Tree:
@@ -58,14 +58,14 @@ STAGE PLANS:
keys: KEY._col0 (type: string)
mode: complete
outputColumnNames: _col0, _col1
- Statistics: Num rows: 1 Data size: 9 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 94 Basic stats: COMPLETE Column stats: COMPLETE
Select Operator
expressions: UDFToInteger(_col0) (type: int), CAST( _col1 AS STRING) (type: string)
outputColumnNames: _col0, _col1
- Statistics: Num rows: 1 Data size: 9 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 188 Basic stats: COMPLETE Column stats: COMPLETE
File Output Operator
compressed: false
- Statistics: Num rows: 1 Data size: 9 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 188 Basic stats: COMPLETE Column stats: COMPLETE
table:
input format: org.apache.hadoop.mapred.TextInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
@@ -74,7 +74,7 @@ STAGE PLANS:
Select Operator
expressions: _col0 (type: int), _col1 (type: string)
outputColumnNames: key, value
- Statistics: Num rows: 1 Data size: 9 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 188 Basic stats: COMPLETE Column stats: COMPLETE
File Output Operator
compressed: false
table:
@@ -106,7 +106,7 @@ STAGE PLANS:
TableScan
Reduce Output Operator
sort order:
- Statistics: Num rows: 1 Data size: 9 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 188 Basic stats: COMPLETE Column stats: COMPLETE
value expressions: key (type: int), value (type: string)
Execution mode: vectorized
Reduce Operator Tree:
@@ -114,10 +114,10 @@ STAGE PLANS:
aggregations: compute_stats(VALUE._col0, 'hll'), compute_stats(VALUE._col2, 'hll')
mode: complete
outputColumnNames: _col0, _col1
- Statistics: Num rows: 1 Data size: 880 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 880 Basic stats: COMPLETE Column stats: COMPLETE
File Output Operator
compressed: false
- Statistics: Num rows: 1 Data size: 880 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 880 Basic stats: COMPLETE Column stats: COMPLETE
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
http://git-wip-us.apache.org/repos/asf/hive/blob/268a6e5a/ql/src/test/results/clientpositive/column_pruning_partitioned_view.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/column_pruning_partitioned_view.q.out b/ql/src/test/results/clientpositive/column_pruning_partitioned_view.q.out
index cfa9cdc..066614f 100644
--- a/ql/src/test/results/clientpositive/column_pruning_partitioned_view.q.out
+++ b/ql/src/test/results/clientpositive/column_pruning_partitioned_view.q.out
@@ -39,10 +39,10 @@ STAGE PLANS:
alias: lv_table
properties:
insideView TRUE
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 368 Basic stats: COMPLETE Column stats: PARTIAL
Select Operator
expressions: c1 (type: string), c2 (type: string)
outputColumnNames: _col0, _col1
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 368 Basic stats: COMPLETE Column stats: PARTIAL
ListSink
http://git-wip-us.apache.org/repos/asf/hive/blob/268a6e5a/ql/src/test/results/clientpositive/columnarserde_create_shortcut.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/columnarserde_create_shortcut.q.out b/ql/src/test/results/clientpositive/columnarserde_create_shortcut.q.out
index 96c9395..6419a5f 100644
--- a/ql/src/test/results/clientpositive/columnarserde_create_shortcut.q.out
+++ b/ql/src/test/results/clientpositive/columnarserde_create_shortcut.q.out
@@ -29,25 +29,25 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: src_thrift
- Statistics: Num rows: 11 Data size: 30700 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 11 Data size: 34628 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: lint (type: array<int>), lstring (type: array<string>), mstringstring (type: map<string,string>), aint (type: int), astring (type: string)
outputColumnNames: _col0, _col1, _col2, _col3, _col4
- Statistics: Num rows: 11 Data size: 30700 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 11 Data size: 34628 Basic stats: COMPLETE Column stats: NONE
Reduce Output Operator
sort order:
Map-reduce partition columns: 1 (type: int)
- Statistics: Num rows: 11 Data size: 30700 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 11 Data size: 34628 Basic stats: COMPLETE Column stats: NONE
value expressions: _col0 (type: array<int>), _col1 (type: array<string>), _col2 (type: map<string,string>), _col3 (type: int), _col4 (type: string)
Execution mode: vectorized
Reduce Operator Tree:
Select Operator
expressions: VALUE._col0 (type: array<int>), VALUE._col1 (type: array<string>), VALUE._col2 (type: map<string,string>), VALUE._col3 (type: int), VALUE._col4 (type: string)
outputColumnNames: _col0, _col1, _col2, _col3, _col4
- Statistics: Num rows: 11 Data size: 30700 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 11 Data size: 34628 Basic stats: COMPLETE Column stats: NONE
File Output Operator
compressed: false
- Statistics: Num rows: 11 Data size: 30700 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 11 Data size: 34628 Basic stats: COMPLETE Column stats: NONE
table:
input format: org.apache.hadoop.hive.ql.io.RCFileInputFormat
output format: org.apache.hadoop.hive.ql.io.RCFileOutputFormat
http://git-wip-us.apache.org/repos/asf/hive/blob/268a6e5a/ql/src/test/results/clientpositive/columnstats_partlvl.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/columnstats_partlvl.q.out b/ql/src/test/results/clientpositive/columnstats_partlvl.q.out
index 18346e4..431f24e 100644
--- a/ql/src/test/results/clientpositive/columnstats_partlvl.q.out
+++ b/ql/src/test/results/clientpositive/columnstats_partlvl.q.out
@@ -57,22 +57,22 @@ STAGE PLANS:
TableScan
alias: employee_part
filterExpr: (employeesalary = 2000.0D) (type: boolean)
- Statistics: Num rows: 3 Data size: 1050 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1062 Basic stats: PARTIAL Column stats: NONE
Select Operator
expressions: employeeid (type: int)
outputColumnNames: employeeid
- Statistics: Num rows: 3 Data size: 1050 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1062 Basic stats: PARTIAL Column stats: NONE
Group By Operator
aggregations: compute_stats(employeeid, 'hll')
keys: 2000.0D (type: double)
mode: hash
outputColumnNames: _col0, _col1
- Statistics: Num rows: 3 Data size: 1050 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1062 Basic stats: PARTIAL Column stats: NONE
Reduce Output Operator
key expressions: 2000.0D (type: double)
sort order: +
Map-reduce partition columns: 2000.0D (type: double)
- Statistics: Num rows: 3 Data size: 1050 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1062 Basic stats: PARTIAL Column stats: NONE
value expressions: _col1 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,bitvector:binary>)
Reduce Operator Tree:
Group By Operator
@@ -80,14 +80,14 @@ STAGE PLANS:
keys: 2000.0D (type: double)
mode: mergepartial
outputColumnNames: _col0, _col1
- Statistics: Num rows: 1 Data size: 350 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 354 Basic stats: PARTIAL Column stats: NONE
Select Operator
expressions: _col1 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), 2000.0D (type: double)
outputColumnNames: _col0, _col1
- Statistics: Num rows: 1 Data size: 350 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 354 Basic stats: PARTIAL Column stats: NONE
File Output Operator
compressed: false
- Statistics: Num rows: 1 Data size: 350 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 354 Basic stats: PARTIAL Column stats: NONE
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -128,25 +128,25 @@ STAGE PLANS:
TableScan
alias: employee_part
filterExpr: (employeesalary = 2000.0D) (type: boolean)
- Statistics: Num rows: 3 Data size: 1050 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1062 Basic stats: PARTIAL Column stats: NONE
Statistics Aggregation Key Prefix: default.employee_part/
GatherStats: true
Select Operator
expressions: employeeid (type: int)
outputColumnNames: employeeid
- Statistics: Num rows: 3 Data size: 1050 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1062 Basic stats: PARTIAL Column stats: NONE
Group By Operator
aggregations: compute_stats(employeeid, 'hll')
keys: 2000.0D (type: double)
mode: hash
outputColumnNames: _col0, _col1
- Statistics: Num rows: 3 Data size: 1050 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1062 Basic stats: PARTIAL Column stats: NONE
Reduce Output Operator
key expressions: 2000.0D (type: double)
null sort order: a
sort order: +
Map-reduce partition columns: 2000.0D (type: double)
- Statistics: Num rows: 3 Data size: 1050 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1062 Basic stats: PARTIAL Column stats: NONE
tag: -1
value expressions: _col1 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,bitvector:binary>)
auto parallelism: false
@@ -211,17 +211,17 @@ STAGE PLANS:
keys: 2000.0D (type: double)
mode: mergepartial
outputColumnNames: _col0, _col1
- Statistics: Num rows: 1 Data size: 350 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 354 Basic stats: PARTIAL Column stats: NONE
Select Operator
expressions: _col1 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), 2000.0D (type: double)
outputColumnNames: _col0, _col1
- Statistics: Num rows: 1 Data size: 350 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 354 Basic stats: PARTIAL Column stats: NONE
File Output Operator
compressed: false
GlobalTableId: 0
#### A masked pattern was here ####
NumFilesPerFileSink: 1
- Statistics: Num rows: 1 Data size: 350 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 354 Basic stats: PARTIAL Column stats: NONE
#### A masked pattern was here ####
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
@@ -328,22 +328,22 @@ STAGE PLANS:
TableScan
alias: employee_part
filterExpr: (employeesalary = 4000.0D) (type: boolean)
- Statistics: Num rows: 3 Data size: 1050 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1062 Basic stats: PARTIAL Column stats: NONE
Select Operator
expressions: employeeid (type: int)
outputColumnNames: employeeid
- Statistics: Num rows: 3 Data size: 1050 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1062 Basic stats: PARTIAL Column stats: NONE
Group By Operator
aggregations: compute_stats(employeeid, 'hll')
keys: 4000.0D (type: double)
mode: hash
outputColumnNames: _col0, _col1
- Statistics: Num rows: 3 Data size: 1050 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1062 Basic stats: PARTIAL Column stats: NONE
Reduce Output Operator
key expressions: 4000.0D (type: double)
sort order: +
Map-reduce partition columns: 4000.0D (type: double)
- Statistics: Num rows: 3 Data size: 1050 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1062 Basic stats: PARTIAL Column stats: NONE
value expressions: _col1 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,bitvector:binary>)
Reduce Operator Tree:
Group By Operator
@@ -351,14 +351,14 @@ STAGE PLANS:
keys: 4000.0D (type: double)
mode: mergepartial
outputColumnNames: _col0, _col1
- Statistics: Num rows: 1 Data size: 350 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 354 Basic stats: PARTIAL Column stats: NONE
Select Operator
expressions: _col1 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), 4000.0D (type: double)
outputColumnNames: _col0, _col1
- Statistics: Num rows: 1 Data size: 350 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 354 Basic stats: PARTIAL Column stats: NONE
File Output Operator
compressed: false
- Statistics: Num rows: 1 Data size: 350 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 354 Basic stats: PARTIAL Column stats: NONE
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -399,25 +399,25 @@ STAGE PLANS:
TableScan
alias: employee_part
filterExpr: (employeesalary = 4000.0D) (type: boolean)
- Statistics: Num rows: 3 Data size: 1050 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1062 Basic stats: PARTIAL Column stats: NONE
Statistics Aggregation Key Prefix: default.employee_part/
GatherStats: true
Select Operator
expressions: employeeid (type: int)
outputColumnNames: employeeid
- Statistics: Num rows: 3 Data size: 1050 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1062 Basic stats: PARTIAL Column stats: NONE
Group By Operator
aggregations: compute_stats(employeeid, 'hll')
keys: 4000.0D (type: double)
mode: hash
outputColumnNames: _col0, _col1
- Statistics: Num rows: 3 Data size: 1050 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1062 Basic stats: PARTIAL Column stats: NONE
Reduce Output Operator
key expressions: 4000.0D (type: double)
null sort order: a
sort order: +
Map-reduce partition columns: 4000.0D (type: double)
- Statistics: Num rows: 3 Data size: 1050 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1062 Basic stats: PARTIAL Column stats: NONE
tag: -1
value expressions: _col1 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,bitvector:binary>)
auto parallelism: false
@@ -482,17 +482,17 @@ STAGE PLANS:
keys: 4000.0D (type: double)
mode: mergepartial
outputColumnNames: _col0, _col1
- Statistics: Num rows: 1 Data size: 350 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 354 Basic stats: PARTIAL Column stats: NONE
Select Operator
expressions: _col1 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), 4000.0D (type: double)
outputColumnNames: _col0, _col1
- Statistics: Num rows: 1 Data size: 350 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 354 Basic stats: PARTIAL Column stats: NONE
File Output Operator
compressed: false
GlobalTableId: 0
#### A masked pattern was here ####
NumFilesPerFileSink: 1
- Statistics: Num rows: 1 Data size: 350 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 354 Basic stats: PARTIAL Column stats: NONE
#### A masked pattern was here ####
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
@@ -561,22 +561,22 @@ STAGE PLANS:
TableScan
alias: employee_part
filterExpr: (employeesalary = 2000.0D) (type: boolean)
- Statistics: Num rows: 13 Data size: 92 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 13 Data size: 52 Basic stats: COMPLETE Column stats: PARTIAL
Select Operator
expressions: employeeid (type: int), employeename (type: string)
outputColumnNames: employeeid, employeename
- Statistics: Num rows: 13 Data size: 92 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 13 Data size: 52 Basic stats: COMPLETE Column stats: PARTIAL
Group By Operator
aggregations: compute_stats(employeeid, 'hll'), compute_stats(employeename, 'hll')
keys: 2000.0D (type: double)
mode: hash
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 13 Data size: 92 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 872 Basic stats: COMPLETE Column stats: PARTIAL
Reduce Output Operator
key expressions: 2000.0D (type: double)
sort order: +
Map-reduce partition columns: 2000.0D (type: double)
- Statistics: Num rows: 13 Data size: 92 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 872 Basic stats: COMPLETE Column stats: PARTIAL
value expressions: _col1 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,bitvector:binary>), _col2 (type: struct<columntype:string,maxlength:bigint,sumlength:bigint,count:bigint,countnulls:bigint,bitvector:binary>)
Reduce Operator Tree:
Group By Operator
@@ -584,14 +584,14 @@ STAGE PLANS:
keys: 2000.0D (type: double)
mode: mergepartial
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 6 Data size: 42 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 888 Basic stats: COMPLETE Column stats: PARTIAL
Select Operator
expressions: _col1 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), _col2 (type: struct<columntype:string,maxlength:bigint,avglength:double,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), 2000.0D (type: double)
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 6 Data size: 42 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 888 Basic stats: COMPLETE Column stats: PARTIAL
File Output Operator
compressed: false
- Statistics: Num rows: 6 Data size: 42 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 888 Basic stats: COMPLETE Column stats: PARTIAL
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -685,22 +685,22 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: employee_part
- Statistics: Num rows: 26 Data size: 184 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 26 Data size: 2596 Basic stats: COMPLETE Column stats: PARTIAL
Select Operator
expressions: employeeid (type: int), employeename (type: string), employeesalary (type: double)
outputColumnNames: employeeid, employeename, employeesalary
- Statistics: Num rows: 26 Data size: 184 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 26 Data size: 2596 Basic stats: COMPLETE Column stats: PARTIAL
Group By Operator
aggregations: compute_stats(employeeid, 'hll'), compute_stats(employeename, 'hll')
keys: employeesalary (type: double)
mode: hash
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 26 Data size: 184 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 2 Data size: 1744 Basic stats: COMPLETE Column stats: PARTIAL
Reduce Output Operator
key expressions: _col0 (type: double)
sort order: +
Map-reduce partition columns: _col0 (type: double)
- Statistics: Num rows: 26 Data size: 184 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 2 Data size: 1744 Basic stats: COMPLETE Column stats: PARTIAL
value expressions: _col1 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,bitvector:binary>), _col2 (type: struct<columntype:string,maxlength:bigint,sumlength:bigint,count:bigint,countnulls:bigint,bitvector:binary>)
Reduce Operator Tree:
Group By Operator
@@ -708,14 +708,14 @@ STAGE PLANS:
keys: KEY._col0 (type: double)
mode: mergepartial
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 13 Data size: 92 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 2 Data size: 1776 Basic stats: COMPLETE Column stats: PARTIAL
Select Operator
expressions: _col1 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), _col2 (type: struct<columntype:string,maxlength:bigint,avglength:double,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), _col0 (type: double)
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 13 Data size: 92 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 2 Data size: 1776 Basic stats: COMPLETE Column stats: PARTIAL
File Output Operator
compressed: false
- Statistics: Num rows: 13 Data size: 92 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 2 Data size: 1776 Basic stats: COMPLETE Column stats: PARTIAL
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -813,29 +813,29 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: employee_part
- Statistics: Num rows: 26 Data size: 184 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 26 Data size: 2388 Basic stats: COMPLETE Column stats: PARTIAL
Select Operator
expressions: employeeid (type: int), employeename (type: string)
outputColumnNames: employeeid, employeename
- Statistics: Num rows: 26 Data size: 184 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 26 Data size: 2388 Basic stats: COMPLETE Column stats: PARTIAL
Group By Operator
aggregations: compute_stats(employeeid, 'hll'), compute_stats(employeename, 'hll')
mode: hash
outputColumnNames: _col0, _col1
- Statistics: Num rows: 1 Data size: 864 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 864 Basic stats: COMPLETE Column stats: PARTIAL
Reduce Output Operator
sort order:
- Statistics: Num rows: 1 Data size: 864 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 864 Basic stats: COMPLETE Column stats: PARTIAL
value expressions: _col0 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,bitvector:binary>), _col1 (type: struct<columntype:string,maxlength:bigint,sumlength:bigint,count:bigint,countnulls:bigint,bitvector:binary>)
Reduce Operator Tree:
Group By Operator
aggregations: compute_stats(VALUE._col0), compute_stats(VALUE._col1)
mode: mergepartial
outputColumnNames: _col0, _col1
- Statistics: Num rows: 1 Data size: 880 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 880 Basic stats: COMPLETE Column stats: PARTIAL
File Output Operator
compressed: false
- Statistics: Num rows: 1 Data size: 880 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 1 Data size: 880 Basic stats: COMPLETE Column stats: PARTIAL
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -885,7 +885,7 @@ num_trues
num_falses
bitVector HL
comment from deserializer
-COLUMN_STATS_ACCURATE {\"COLUMN_STATS\":{\"employeeid\":\"true\",\"employeename\":\"true\"}}
+COLUMN_STATS_ACCURATE {\"COLUMN_STATS\":{\"employeename\":\"true\"}}
PREHOOK: query: create database if not exists dummydb
PREHOOK: type: CREATEDATABASE
PREHOOK: Output: database:dummydb
http://git-wip-us.apache.org/repos/asf/hive/blob/268a6e5a/ql/src/test/results/clientpositive/columnstats_partlvl_dp.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/columnstats_partlvl_dp.q.out b/ql/src/test/results/clientpositive/columnstats_partlvl_dp.q.out
index 3b04987..4cc76be 100644
--- a/ql/src/test/results/clientpositive/columnstats_partlvl_dp.q.out
+++ b/ql/src/test/results/clientpositive/columnstats_partlvl_dp.q.out
@@ -93,22 +93,22 @@ STAGE PLANS:
TableScan
alias: employee_part_n0
filterExpr: (employeesalary = 4000.0D) (type: boolean)
- Statistics: Num rows: 1 Data size: 640 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 1012 Basic stats: PARTIAL Column stats: PARTIAL
Select Operator
expressions: employeeid (type: int), employeename (type: string), country (type: string)
outputColumnNames: employeeid, employeename, country
- Statistics: Num rows: 1 Data size: 640 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 1012 Basic stats: PARTIAL Column stats: PARTIAL
Group By Operator
aggregations: compute_stats(employeename, 'hll'), compute_stats(employeeid, 'hll')
keys: 4000.0D (type: double), country (type: string)
mode: hash
outputColumnNames: _col0, _col1, _col2, _col3
- Statistics: Num rows: 1 Data size: 640 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 1236 Basic stats: PARTIAL Column stats: PARTIAL
Reduce Output Operator
key expressions: 4000.0D (type: double), _col1 (type: string)
sort order: ++
Map-reduce partition columns: 4000.0D (type: double), _col1 (type: string)
- Statistics: Num rows: 1 Data size: 640 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 1236 Basic stats: PARTIAL Column stats: PARTIAL
value expressions: _col2 (type: struct<columntype:string,maxlength:bigint,sumlength:bigint,count:bigint,countnulls:bigint,bitvector:binary>), _col3 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,bitvector:binary>)
Reduce Operator Tree:
Group By Operator
@@ -116,14 +116,14 @@ STAGE PLANS:
keys: 4000.0D (type: double), KEY._col1 (type: string)
mode: mergepartial
outputColumnNames: _col0, _col1, _col2, _col3
- Statistics: Num rows: 1 Data size: 640 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 1252 Basic stats: PARTIAL Column stats: PARTIAL
Select Operator
expressions: _col2 (type: struct<columntype:string,maxlength:bigint,avglength:double,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), _col3 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), 4000.0D (type: double), _col1 (type: string)
outputColumnNames: _col0, _col1, _col2, _col3
- Statistics: Num rows: 1 Data size: 640 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 1252 Basic stats: PARTIAL Column stats: PARTIAL
File Output Operator
compressed: false
- Statistics: Num rows: 1 Data size: 640 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 1252 Basic stats: PARTIAL Column stats: PARTIAL
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -239,22 +239,22 @@ STAGE PLANS:
TableScan
alias: employee_part_n0
filterExpr: (employeesalary = 2000.0D) (type: boolean)
- Statistics: Num rows: 3 Data size: 1690 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 2254 Basic stats: PARTIAL Column stats: PARTIAL
Select Operator
expressions: employeeid (type: int), country (type: string)
outputColumnNames: employeeid, country
- Statistics: Num rows: 3 Data size: 1690 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 2254 Basic stats: PARTIAL Column stats: PARTIAL
Group By Operator
aggregations: compute_stats(employeeid, 'hll')
keys: 2000.0D (type: double), country (type: string)
mode: hash
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 3 Data size: 1690 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1836 Basic stats: PARTIAL Column stats: PARTIAL
Reduce Output Operator
key expressions: 2000.0D (type: double), _col1 (type: string)
sort order: ++
Map-reduce partition columns: 2000.0D (type: double), _col1 (type: string)
- Statistics: Num rows: 3 Data size: 1690 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 3 Data size: 1836 Basic stats: PARTIAL Column stats: PARTIAL
value expressions: _col2 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,bitvector:binary>)
Reduce Operator Tree:
Group By Operator
@@ -262,14 +262,14 @@ STAGE PLANS:
keys: 2000.0D (type: double), KEY._col1 (type: string)
mode: mergepartial
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 1 Data size: 563 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 628 Basic stats: PARTIAL Column stats: PARTIAL
Select Operator
expressions: _col2 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), 2000.0D (type: double), _col1 (type: string)
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 1 Data size: 563 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 628 Basic stats: PARTIAL Column stats: PARTIAL
File Output Operator
compressed: false
- Statistics: Num rows: 1 Data size: 563 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 628 Basic stats: PARTIAL Column stats: PARTIAL
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -383,22 +383,22 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: employee_part_n0
- Statistics: Num rows: 31 Data size: 2536 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 31 Data size: 6072 Basic stats: PARTIAL Column stats: PARTIAL
Select Operator
expressions: employeeid (type: int), employeesalary (type: double), country (type: string)
outputColumnNames: employeeid, employeesalary, country
- Statistics: Num rows: 31 Data size: 2536 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 31 Data size: 6072 Basic stats: PARTIAL Column stats: PARTIAL
Group By Operator
aggregations: compute_stats(employeeid, 'hll')
keys: employeesalary (type: double), country (type: string)
mode: hash
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 31 Data size: 2536 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 31 Data size: 19216 Basic stats: PARTIAL Column stats: PARTIAL
Reduce Output Operator
key expressions: _col0 (type: double), _col1 (type: string)
sort order: ++
Map-reduce partition columns: _col0 (type: double), _col1 (type: string)
- Statistics: Num rows: 31 Data size: 2536 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 31 Data size: 19216 Basic stats: PARTIAL Column stats: PARTIAL
value expressions: _col2 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,bitvector:binary>)
Reduce Operator Tree:
Group By Operator
@@ -406,14 +406,14 @@ STAGE PLANS:
keys: KEY._col0 (type: double), KEY._col1 (type: string)
mode: mergepartial
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 15 Data size: 1227 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 15 Data size: 9536 Basic stats: PARTIAL Column stats: PARTIAL
Select Operator
expressions: _col2 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), _col0 (type: double), _col1 (type: string)
outputColumnNames: _col0, _col1, _col2
- Statistics: Num rows: 15 Data size: 1227 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 15 Data size: 9536 Basic stats: PARTIAL Column stats: PARTIAL
File Output Operator
compressed: false
- Statistics: Num rows: 15 Data size: 1227 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 15 Data size: 9536 Basic stats: PARTIAL Column stats: PARTIAL
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -525,22 +525,22 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: employee_part_n0
- Statistics: Num rows: 54 Data size: 412 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 54 Data size: 15386 Basic stats: COMPLETE Column stats: PARTIAL
Select Operator
expressions: employeeid (type: int), employeename (type: string), employeesalary (type: double), country (type: string)
outputColumnNames: employeeid, employeename, employeesalary, country
- Statistics: Num rows: 54 Data size: 412 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 54 Data size: 15386 Basic stats: COMPLETE Column stats: PARTIAL
Group By Operator
aggregations: compute_stats(employeeid, 'hll'), compute_stats(employeename, 'hll')
keys: employeesalary (type: double), country (type: string)
mode: hash
outputColumnNames: _col0, _col1, _col2, _col3
- Statistics: Num rows: 54 Data size: 412 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 8 Data size: 8448 Basic stats: COMPLETE Column stats: PARTIAL
Reduce Output Operator
key expressions: _col0 (type: double), _col1 (type: string)
sort order: ++
Map-reduce partition columns: _col0 (type: double), _col1 (type: string)
- Statistics: Num rows: 54 Data size: 412 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 8 Data size: 8448 Basic stats: COMPLETE Column stats: PARTIAL
value expressions: _col2 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,bitvector:binary>), _col3 (type: struct<columntype:string,maxlength:bigint,sumlength:bigint,count:bigint,countnulls:bigint,bitvector:binary>)
Reduce Operator Tree:
Group By Operator
@@ -548,14 +548,14 @@ STAGE PLANS:
keys: KEY._col0 (type: double), KEY._col1 (type: string)
mode: mergepartial
outputColumnNames: _col0, _col1, _col2, _col3
- Statistics: Num rows: 27 Data size: 206 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 8 Data size: 8576 Basic stats: COMPLETE Column stats: PARTIAL
Select Operator
expressions: _col2 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), _col3 (type: struct<columntype:string,maxlength:bigint,avglength:double,countnulls:bigint,numdistinctvalues:bigint,ndvbitvector:binary>), _col0 (type: double), _col1 (type: string)
outputColumnNames: _col0, _col1, _col2, _col3
- Statistics: Num rows: 27 Data size: 206 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 8 Data size: 8576 Basic stats: COMPLETE Column stats: PARTIAL
File Output Operator
compressed: false
- Statistics: Num rows: 27 Data size: 206 Basic stats: COMPLETE Column stats: NONE
+ Statistics: Num rows: 8 Data size: 8576 Basic stats: COMPLETE Column stats: PARTIAL
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
http://git-wip-us.apache.org/repos/asf/hive/blob/268a6e5a/ql/src/test/results/clientpositive/columnstats_quoting.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/columnstats_quoting.q.out b/ql/src/test/results/clientpositive/columnstats_quoting.q.out
index 9bf560b..9d2ff32 100644
--- a/ql/src/test/results/clientpositive/columnstats_quoting.q.out
+++ b/ql/src/test/results/clientpositive/columnstats_quoting.q.out
@@ -30,29 +30,29 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: user_web_events
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 192 Basic stats: COMPLETE Column stats: NONE
Select Operator
expressions: user id (type: bigint), user name (type: string)
outputColumnNames: user id, user name
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 192 Basic stats: COMPLETE Column stats: NONE
Group By Operator
aggregations: compute_stats(user id, 'hll'), compute_stats(user name, 'hll')
mode: hash
outputColumnNames: _col0, _col1
- Statistics: Num rows: 1 Data size: 864 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 1056 Basic stats: COMPLETE Column stats: NONE
Reduce Output Operator
sort order:
- Statistics: Num rows: 1 Data size: 864 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 1056 Basic stats: COMPLETE Column stats: NONE
value expressions: _col0 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,bitvector:binary>), _col1 (type: struct<columntype:string,maxlength:bigint,sumlength:bigint,count:bigint,countnulls:bigint,bitvector:binary>)
Reduce Operator Tree:
Group By Operator
aggregations: compute_stats(VALUE._col0), compute_stats(VALUE._col1)
mode: mergepartial
outputColumnNames: _col0, _col1
- Statistics: Num rows: 1 Data size: 880 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 1072 Basic stats: COMPLETE Column stats: NONE
File Output Operator
compressed: false
- Statistics: Num rows: 1 Data size: 880 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 1072 Basic stats: COMPLETE Column stats: NONE
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
@@ -96,29 +96,29 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: user_web_events
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE
Select Operator
expressions: user id (type: bigint)
outputColumnNames: user id
- Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE
Group By Operator
aggregations: compute_stats(user id, 'hll')
mode: hash
outputColumnNames: _col0
- Statistics: Num rows: 1 Data size: 424 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 424 Basic stats: COMPLETE Column stats: COMPLETE
Reduce Output Operator
sort order:
- Statistics: Num rows: 1 Data size: 424 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 424 Basic stats: COMPLETE Column stats: COMPLETE
value expressions: _col0 (type: struct<columntype:string,min:bigint,max:bigint,countnulls:bigint,bitvector:binary>)
Reduce Operator Tree:
Group By Operator
aggregations: compute_stats(VALUE._col0)
mode: mergepartial
outputColumnNames: _col0
- Statistics: Num rows: 1 Data size: 440 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 440 Basic stats: COMPLETE Column stats: COMPLETE
File Output Operator
compressed: false
- Statistics: Num rows: 1 Data size: 440 Basic stats: PARTIAL Column stats: NONE
+ Statistics: Num rows: 1 Data size: 440 Basic stats: COMPLETE Column stats: COMPLETE
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat