You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@hive.apache.org by ha...@apache.org on 2016/05/06 20:56:02 UTC
[10/15] hive git commit: HIVE-13542 : Missing stats for tables in
TPCDS performance regression suite (Hari Subramaniyan via Ashutosh Chauhan)
http://git-wip-us.apache.org/repos/asf/hive/blob/db8a6db9/ql/src/test/results/clientpositive/perf/query50.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/query50.q.out b/ql/src/test/results/clientpositive/perf/query50.q.out
index e6ba451..781d3ec 100644
--- a/ql/src/test/results/clientpositive/perf/query50.q.out
+++ b/ql/src/test/results/clientpositive/perf/query50.q.out
@@ -130,37 +130,37 @@ Stage-0
Stage-1
Reducer 7
File Output Operator [FS_36]
- Limit [LIM_35] (rows=100 width=1119)
+ Limit [LIM_35] (rows=100 width=88)
Number of rows:100
- Select Operator [SEL_34] (rows=44194 width=1119)
+ Select Operator [SEL_34] (rows=421657640 width=88)
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"]
<-Reducer 6 [SIMPLE_EDGE]
SHUFFLE [RS_33]
- Group By Operator [GBY_31] (rows=44194 width=1119)
+ Group By Operator [GBY_31] (rows=421657640 width=88)
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)","sum(VALUE._col3)","sum(VALUE._col4)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4, KEY._col5, KEY._col6, KEY._col7, KEY._col8, KEY._col9
<-Reducer 5 [SIMPLE_EDGE]
SHUFFLE [RS_30]
PartitionCols:_col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9
- Group By Operator [GBY_29] (rows=88388 width=1119)
+ Group By Operator [GBY_29] (rows=843315281 width=88)
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"],aggregations:["sum(_col10)","sum(_col11)","sum(_col12)","sum(_col13)","sum(_col14)"],keys:_col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9
- Select Operator [SEL_27] (rows=88388 width=1119)
+ Select Operator [SEL_27] (rows=843315281 width=88)
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"]
- Merge Join Operator [MERGEJOIN_59] (rows=88388 width=1119)
- Conds:RS_24._col5=RS_25._col0(Inner),Output:["_col0","_col5","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19"]
+ Merge Join Operator [MERGEJOIN_59] (rows=843315281 width=88)
+ Conds:RS_24._col3=RS_25._col0(Inner),Output:["_col0","_col5","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23"]
<-Map 11 [SIMPLE_EDGE]
SHUFFLE [RS_25]
PartitionCols:_col0
- Select Operator [SEL_14] (rows=18262 width=1119)
- Output:["_col0"]
- Filter Operator [FIL_55] (rows=18262 width=1119)
- predicate:((d_year = 2000) and (d_moy = 9) and d_date_sk is not null)
- TableScan [TS_12] (rows=73049 width=1119)
- default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"]
+ Select Operator [SEL_14] (rows=1704 width=1910)
+ Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10"]
+ Filter Operator [FIL_55] (rows=1704 width=1910)
+ predicate:s_store_sk is not null
+ TableScan [TS_12] (rows=1704 width=1910)
+ default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_name","s_company_id","s_street_number","s_street_name","s_street_type","s_suite_number","s_city","s_county","s_state","s_zip"]
<-Reducer 4 [SIMPLE_EDGE]
SHUFFLE [RS_24]
- PartitionCols:_col5
- Merge Join Operator [MERGEJOIN_58] (rows=80353 width=1119)
- Conds:RS_21._col0=RS_22._col0(Inner),Output:["_col0","_col5","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19"]
+ PartitionCols:_col3
+ Merge Join Operator [MERGEJOIN_58] (rows=766650239 width=88)
+ Conds:RS_21._col0=RS_22._col0(Inner),Output:["_col0","_col3","_col5"]
<-Map 10 [SIMPLE_EDGE]
SHUFFLE [RS_22]
PartitionCols:_col0
@@ -173,38 +173,38 @@ Stage-0
<-Reducer 3 [SIMPLE_EDGE]
SHUFFLE [RS_21]
PartitionCols:_col0
- Merge Join Operator [MERGEJOIN_57] (rows=1874 width=1911)
- Conds:RS_18._col3=RS_19._col0(Inner),Output:["_col0","_col5","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19"]
+ Merge Join Operator [MERGEJOIN_57] (rows=696954748 width=88)
+ Conds:RS_18._col5=RS_19._col0(Inner),Output:["_col0","_col3","_col5"]
<-Map 9 [SIMPLE_EDGE]
SHUFFLE [RS_19]
PartitionCols:_col0
- Select Operator [SEL_8] (rows=1704 width=1910)
- Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10"]
- Filter Operator [FIL_53] (rows=1704 width=1910)
- predicate:s_store_sk is not null
- TableScan [TS_6] (rows=1704 width=1910)
- default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_name","s_company_id","s_street_number","s_street_name","s_street_type","s_suite_number","s_city","s_county","s_state","s_zip"]
+ Select Operator [SEL_8] (rows=18262 width=1119)
+ Output:["_col0"]
+ Filter Operator [FIL_53] (rows=18262 width=1119)
+ predicate:((d_year = 2000) and (d_moy = 9) and d_date_sk is not null)
+ TableScan [TS_6] (rows=73049 width=1119)
+ default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"]
<-Reducer 2 [SIMPLE_EDGE]
SHUFFLE [RS_18]
- PartitionCols:_col3
- Merge Join Operator [MERGEJOIN_56] (rows=1 width=0)
+ PartitionCols:_col5
+ Merge Join Operator [MERGEJOIN_56] (rows=633595212 width=88)
Conds:RS_15._col4, _col1, _col2=RS_16._col3, _col1, _col2(Inner),Output:["_col0","_col3","_col5"]
<-Map 1 [SIMPLE_EDGE]
SHUFFLE [RS_15]
PartitionCols:_col4, _col1, _col2
- Select Operator [SEL_2] (rows=1 width=0)
+ Select Operator [SEL_2] (rows=575995635 width=88)
Output:["_col0","_col1","_col2","_col3","_col4"]
- Filter Operator [FIL_51] (rows=1 width=0)
+ Filter Operator [FIL_51] (rows=575995635 width=88)
predicate:(ss_item_sk is not null and ss_customer_sk is not null and ss_ticket_number is not null and ss_store_sk is not null and ss_sold_date_sk is not null)
- TableScan [TS_0] (rows=1 width=0)
- default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_customer_sk","ss_store_sk","ss_ticket_number"]
+ TableScan [TS_0] (rows=575995635 width=88)
+ default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_customer_sk","ss_store_sk","ss_ticket_number"]
<-Map 8 [SIMPLE_EDGE]
SHUFFLE [RS_16]
PartitionCols:_col3, _col1, _col2
- Select Operator [SEL_5] (rows=1 width=0)
+ Select Operator [SEL_5] (rows=57591150 width=77)
Output:["_col0","_col1","_col2","_col3"]
- Filter Operator [FIL_52] (rows=1 width=0)
+ Filter Operator [FIL_52] (rows=57591150 width=77)
predicate:(sr_item_sk is not null and sr_customer_sk is not null and sr_ticket_number is not null and sr_returned_date_sk is not null)
- TableScan [TS_3] (rows=1 width=0)
- default@store_returns,store_returns,Tbl:PARTIAL,Col:NONE,Output:["sr_returned_date_sk","sr_item_sk","sr_customer_sk","sr_ticket_number"]
+ TableScan [TS_3] (rows=57591150 width=77)
+ default@store_returns,store_returns,Tbl:COMPLETE,Col:NONE,Output:["sr_returned_date_sk","sr_item_sk","sr_customer_sk","sr_ticket_number"]
http://git-wip-us.apache.org/repos/asf/hive/blob/db8a6db9/ql/src/test/results/clientpositive/perf/query51.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/query51.q.out b/ql/src/test/results/clientpositive/perf/query51.q.out
index 08546c5..6d40b04 100644
--- a/ql/src/test/results/clientpositive/perf/query51.q.out
+++ b/ql/src/test/results/clientpositive/perf/query51.q.out
@@ -101,42 +101,42 @@ Stage-0
Stage-1
Reducer 6
File Output Operator [FS_53]
- Limit [LIM_52] (rows=100 width=1119)
+ Limit [LIM_52] (rows=100 width=88)
Number of rows:100
- Select Operator [SEL_51] (rows=7365 width=1119)
+ Select Operator [SEL_51] (rows=116159124 width=88)
Output:["_col0","_col1","_col2","_col3","_col4","_col5"]
<-Reducer 5 [SIMPLE_EDGE]
SHUFFLE [RS_50]
- Select Operator [SEL_46] (rows=7365 width=1119)
+ Select Operator [SEL_46] (rows=116159124 width=88)
Output:["_col0","_col1","_col2","_col3","_col4","_col5"]
- Filter Operator [FIL_58] (rows=7365 width=1119)
+ Filter Operator [FIL_58] (rows=116159124 width=88)
predicate:(max_window_0 > max_window_1)
- PTF Operator [PTF_45] (rows=22096 width=1119)
- Function definitions:[{},{"name:":"windowingtablefunction","order by:":"CASE WHEN (_col1 is not null) THEN (_col1) ELSE (_col4) END ASC NULLS FIRST","partition by:":"CASE WHEN (_col0 is not null) THEN (_col0) ELSE (_col3) END"}]
- Select Operator [SEL_44] (rows=22096 width=1119)
+ PTF Operator [PTF_45] (rows=348477374 width=88)
+ Function definitions:[{},{"name:":"windowingtablefunction","order by:":"CASE WHEN (_col4 is not null) THEN (_col4) ELSE (_col1) END ASC NULLS FIRST","partition by:":"CASE WHEN (_col3 is not null) THEN (_col3) ELSE (_col0) END"}]
+ Select Operator [SEL_44] (rows=348477374 width=88)
Output:["_col0","_col1","_col2","_col3","_col4","_col5"]
<-Reducer 4 [SIMPLE_EDGE]
SHUFFLE [RS_43]
- PartitionCols:CASE WHEN (_col0 is not null) THEN (_col0) ELSE (_col3) END
- Merge Join Operator [MERGEJOIN_67] (rows=22096 width=1119)
+ PartitionCols:CASE WHEN (_col3 is not null) THEN (_col3) ELSE (_col0) END
+ Merge Join Operator [MERGEJOIN_67] (rows=348477374 width=88)
Conds:RS_40._col0, _col1=RS_41._col0, _col1(Outer),Output:["_col0","_col1","_col2","_col3","_col4","_col5"]
<-Reducer 10 [SIMPLE_EDGE]
SHUFFLE [RS_41]
PartitionCols:_col0, _col1
- Select Operator [SEL_37] (rows=20088 width=1119)
+ Select Operator [SEL_37] (rows=79201469 width=135)
Output:["_col0","_col1","_col2"]
- PTF Operator [PTF_36] (rows=20088 width=1119)
+ PTF Operator [PTF_36] (rows=79201469 width=135)
Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col1 ASC NULLS FIRST","partition by:":"_col0"}]
- Group By Operator [GBY_32] (rows=20088 width=1119)
+ Group By Operator [GBY_32] (rows=79201469 width=135)
Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1
<-Reducer 9 [SIMPLE_EDGE]
SHUFFLE [RS_31]
PartitionCols:_col0
- Group By Operator [GBY_30] (rows=40176 width=1119)
+ Group By Operator [GBY_30] (rows=158402938 width=135)
Output:["_col0","_col1","_col2"],aggregations:["sum(_col2)"],keys:_col1, _col4
- Select Operator [SEL_29] (rows=40176 width=1119)
+ Select Operator [SEL_29] (rows=158402938 width=135)
Output:["_col1","_col4","_col2"]
- Merge Join Operator [MERGEJOIN_66] (rows=40176 width=1119)
+ Merge Join Operator [MERGEJOIN_66] (rows=158402938 width=135)
Conds:RS_26._col0=RS_27._col0(Inner),Output:["_col1","_col2","_col4"]
<-Map 11 [SIMPLE_EDGE]
SHUFFLE [RS_27]
@@ -150,39 +150,39 @@ Stage-0
<-Map 8 [SIMPLE_EDGE]
SHUFFLE [RS_26]
PartitionCols:_col0
- Select Operator [SEL_22] (rows=1 width=0)
+ Select Operator [SEL_22] (rows=144002668 width=135)
Output:["_col0","_col1","_col2"]
- Filter Operator [FIL_61] (rows=1 width=0)
- predicate:(ss_item_sk is not null and ss_sold_date_sk is not null)
- TableScan [TS_20] (rows=1 width=0)
- default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_sales_price"]
+ Filter Operator [FIL_61] (rows=144002668 width=135)
+ predicate:(ws_item_sk is not null and ws_sold_date_sk is not null)
+ TableScan [TS_20] (rows=144002668 width=135)
+ default@web_sales,web_sales,Tbl:COMPLETE,Col:NONE,Output:["ws_sold_date_sk","ws_item_sk","ws_sales_price"]
<-Reducer 3 [SIMPLE_EDGE]
SHUFFLE [RS_40]
PartitionCols:_col0, _col1
- Select Operator [SEL_17] (rows=20088 width=1119)
+ Select Operator [SEL_17] (rows=316797606 width=88)
Output:["_col0","_col1","_col2"]
- PTF Operator [PTF_16] (rows=20088 width=1119)
+ PTF Operator [PTF_16] (rows=316797606 width=88)
Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col1 ASC NULLS FIRST","partition by:":"_col0"}]
- Group By Operator [GBY_12] (rows=20088 width=1119)
+ Group By Operator [GBY_12] (rows=316797606 width=88)
Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1
<-Reducer 2 [SIMPLE_EDGE]
SHUFFLE [RS_11]
PartitionCols:_col0
- Group By Operator [GBY_10] (rows=40176 width=1119)
+ Group By Operator [GBY_10] (rows=633595212 width=88)
Output:["_col0","_col1","_col2"],aggregations:["sum(_col2)"],keys:_col1, _col4
- Select Operator [SEL_9] (rows=40176 width=1119)
+ Select Operator [SEL_9] (rows=633595212 width=88)
Output:["_col1","_col4","_col2"]
- Merge Join Operator [MERGEJOIN_65] (rows=40176 width=1119)
+ Merge Join Operator [MERGEJOIN_65] (rows=633595212 width=88)
Conds:RS_6._col0=RS_7._col0(Inner),Output:["_col1","_col2","_col4"]
<-Map 1 [SIMPLE_EDGE]
SHUFFLE [RS_6]
PartitionCols:_col0
- Select Operator [SEL_2] (rows=1 width=0)
+ Select Operator [SEL_2] (rows=575995635 width=88)
Output:["_col0","_col1","_col2"]
- Filter Operator [FIL_59] (rows=1 width=0)
- predicate:(ws_item_sk is not null and ws_sold_date_sk is not null)
- TableScan [TS_0] (rows=1 width=0)
- default@web_sales,web_sales,Tbl:PARTIAL,Col:NONE,Output:["ws_sold_date_sk","ws_item_sk","ws_sales_price"]
+ Filter Operator [FIL_59] (rows=575995635 width=88)
+ predicate:(ss_item_sk is not null and ss_sold_date_sk is not null)
+ TableScan [TS_0] (rows=575995635 width=88)
+ default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_sales_price"]
<-Map 7 [SIMPLE_EDGE]
SHUFFLE [RS_7]
PartitionCols:_col0
http://git-wip-us.apache.org/repos/asf/hive/blob/db8a6db9/ql/src/test/results/clientpositive/perf/query52.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/query52.q.out b/ql/src/test/results/clientpositive/perf/query52.q.out
index 7bf7317..21f3a39 100644
--- a/ql/src/test/results/clientpositive/perf/query52.q.out
+++ b/ql/src/test/results/clientpositive/perf/query52.q.out
@@ -16,25 +16,25 @@ Stage-0
Stage-1
Reducer 5
File Output Operator [FS_24]
- Limit [LIM_23] (rows=100 width=1436)
+ Limit [LIM_23] (rows=100 width=88)
Number of rows:100
- Select Operator [SEL_22] (rows=127050 width=1436)
+ Select Operator [SEL_22] (rows=348477374 width=88)
Output:["_col0","_col1","_col2","_col3"]
<-Reducer 4 [SIMPLE_EDGE]
SHUFFLE [RS_21]
- Select Operator [SEL_20] (rows=127050 width=1436)
+ Select Operator [SEL_20] (rows=348477374 width=88)
Output:["_col1","_col2","_col3"]
- Group By Operator [GBY_19] (rows=127050 width=1436)
+ Group By Operator [GBY_19] (rows=348477374 width=88)
Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:1998, KEY._col1, KEY._col2
<-Reducer 3 [SIMPLE_EDGE]
SHUFFLE [RS_18]
PartitionCols:1998, _col1, _col2
- Group By Operator [GBY_17] (rows=254100 width=1436)
+ Group By Operator [GBY_17] (rows=696954748 width=88)
Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(_col3)"],keys:1998, _col1, _col2
- Select Operator [SEL_15] (rows=254100 width=1436)
+ Select Operator [SEL_15] (rows=696954748 width=88)
Output:["_col1","_col2","_col3"]
- Merge Join Operator [MERGEJOIN_34] (rows=254100 width=1436)
- Conds:RS_12._col4=RS_13._col0(Inner),Output:["_col5","_col7","_col8"]
+ Merge Join Operator [MERGEJOIN_34] (rows=696954748 width=88)
+ Conds:RS_12._col1=RS_13._col0(Inner),Output:["_col2","_col7","_col8"]
<-Map 7 [SIMPLE_EDGE]
SHUFFLE [RS_13]
PartitionCols:_col0
@@ -46,25 +46,25 @@ Stage-0
default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_brand_id","i_brand","i_manager_id"]
<-Reducer 2 [SIMPLE_EDGE]
SHUFFLE [RS_12]
- PartitionCols:_col4
- Merge Join Operator [MERGEJOIN_33] (rows=20088 width=1119)
- Conds:RS_9._col0=RS_10._col0(Inner),Output:["_col4","_col5"]
+ PartitionCols:_col1
+ Merge Join Operator [MERGEJOIN_33] (rows=633595212 width=88)
+ Conds:RS_9._col0=RS_10._col0(Inner),Output:["_col1","_col2"]
<-Map 1 [SIMPLE_EDGE]
SHUFFLE [RS_9]
PartitionCols:_col0
- Select Operator [SEL_2] (rows=18262 width=1119)
- Output:["_col0"]
- Filter Operator [FIL_30] (rows=18262 width=1119)
- predicate:((d_moy = 12) and (d_year = 1998) and d_date_sk is not null)
- TableScan [TS_0] (rows=73049 width=1119)
- default@date_dim,dt,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"]
+ Select Operator [SEL_2] (rows=575995635 width=88)
+ Output:["_col0","_col1","_col2"]
+ Filter Operator [FIL_30] (rows=575995635 width=88)
+ predicate:(ss_sold_date_sk is not null and ss_item_sk is not null)
+ TableScan [TS_0] (rows=575995635 width=88)
+ default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_ext_sales_price"]
<-Map 6 [SIMPLE_EDGE]
SHUFFLE [RS_10]
PartitionCols:_col0
- Select Operator [SEL_5] (rows=1 width=0)
- Output:["_col0","_col1","_col2"]
- Filter Operator [FIL_31] (rows=1 width=0)
- predicate:(ss_sold_date_sk is not null and ss_item_sk is not null)
- TableScan [TS_3] (rows=1 width=0)
- default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_ext_sales_price"]
+ Select Operator [SEL_5] (rows=18262 width=1119)
+ Output:["_col0"]
+ Filter Operator [FIL_31] (rows=18262 width=1119)
+ predicate:((d_moy = 12) and (d_year = 1998) and d_date_sk is not null)
+ TableScan [TS_3] (rows=73049 width=1119)
+ default@date_dim,dt,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"]
http://git-wip-us.apache.org/repos/asf/hive/blob/db8a6db9/ql/src/test/results/clientpositive/perf/query54.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/query54.q.out b/ql/src/test/results/clientpositive/perf/query54.q.out
index 3edf749..76657a0 100644
--- a/ql/src/test/results/clientpositive/perf/query54.q.out
+++ b/ql/src/test/results/clientpositive/perf/query54.q.out
@@ -5,169 +5,171 @@ POSTHOOK: type: QUERY
Plan optimized by CBO.
Vertex dependency in root stage
-Map 1 <- Union 2 (CONTAINS)
-Map 14 <- Union 2 (CONTAINS)
-Reducer 10 <- Map 21 (SIMPLE_EDGE), Reducer 9 (SIMPLE_EDGE)
-Reducer 11 <- Reducer 10 (SIMPLE_EDGE)
-Reducer 12 <- Reducer 11 (SIMPLE_EDGE)
-Reducer 13 <- Reducer 12 (SIMPLE_EDGE)
-Reducer 3 <- Map 15 (SIMPLE_EDGE), Union 2 (SIMPLE_EDGE)
-Reducer 4 <- Map 16 (SIMPLE_EDGE), Reducer 3 (SIMPLE_EDGE)
-Reducer 5 <- Map 17 (SIMPLE_EDGE), Reducer 4 (SIMPLE_EDGE)
+Map 12 <- Union 13 (CONTAINS)
+Map 18 <- Union 13 (CONTAINS)
+Reducer 10 <- Reducer 17 (SIMPLE_EDGE), Reducer 9 (SIMPLE_EDGE)
+Reducer 14 <- Map 19 (SIMPLE_EDGE), Union 13 (SIMPLE_EDGE)
+Reducer 15 <- Map 20 (SIMPLE_EDGE), Reducer 14 (SIMPLE_EDGE)
+Reducer 16 <- Map 21 (SIMPLE_EDGE), Reducer 15 (SIMPLE_EDGE)
+Reducer 17 <- Reducer 16 (SIMPLE_EDGE)
+Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 7 (SIMPLE_EDGE)
+Reducer 3 <- Reducer 10 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE)
+Reducer 4 <- Reducer 3 (SIMPLE_EDGE)
+Reducer 5 <- Reducer 4 (SIMPLE_EDGE)
Reducer 6 <- Reducer 5 (SIMPLE_EDGE)
-Reducer 7 <- Map 18 (SIMPLE_EDGE), Reducer 6 (SIMPLE_EDGE)
-Reducer 8 <- Map 19 (SIMPLE_EDGE), Reducer 7 (SIMPLE_EDGE)
-Reducer 9 <- Map 20 (SIMPLE_EDGE), Reducer 8 (SIMPLE_EDGE)
+Reducer 9 <- Map 11 (SIMPLE_EDGE), Map 8 (SIMPLE_EDGE)
Stage-0
Fetch Operator
limit:100
Stage-1
- Reducer 13
- File Output Operator [FS_68]
- Limit [LIM_67] (rows=100 width=860)
+ Reducer 6
+ File Output Operator [FS_69]
+ Limit [LIM_68] (rows=100 width=88)
Number of rows:100
- Select Operator [SEL_66] (rows=16105101 width=860)
+ Select Operator [SEL_67] (rows=174238687 width=88)
Output:["_col0","_col1","_col2"]
- <-Reducer 12 [SIMPLE_EDGE]
- SHUFFLE [RS_65]
- Select Operator [SEL_64] (rows=16105101 width=860)
+ <-Reducer 5 [SIMPLE_EDGE]
+ SHUFFLE [RS_66]
+ Select Operator [SEL_65] (rows=174238687 width=88)
Output:["_col0","_col1","_col2"]
- Group By Operator [GBY_63] (rows=16105101 width=860)
+ Group By Operator [GBY_64] (rows=174238687 width=88)
Output:["_col0","_col1"],aggregations:["count(VALUE._col0)"],keys:KEY._col0
- <-Reducer 11 [SIMPLE_EDGE]
- SHUFFLE [RS_62]
+ <-Reducer 4 [SIMPLE_EDGE]
+ SHUFFLE [RS_63]
PartitionCols:_col0
- Group By Operator [GBY_61] (rows=32210202 width=860)
+ Group By Operator [GBY_62] (rows=348477374 width=88)
Output:["_col0","_col1"],aggregations:["count()"],keys:_col0
- Select Operator [SEL_59] (rows=32210202 width=860)
+ Select Operator [SEL_60] (rows=348477374 width=88)
Output:["_col0"]
- Group By Operator [GBY_58] (rows=32210202 width=860)
+ Group By Operator [GBY_59] (rows=348477374 width=88)
Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0
- <-Reducer 10 [SIMPLE_EDGE]
- SHUFFLE [RS_57]
+ <-Reducer 3 [SIMPLE_EDGE]
+ SHUFFLE [RS_58]
PartitionCols:_col0
- Group By Operator [GBY_56] (rows=64420404 width=860)
- Output:["_col0","_col1"],aggregations:["sum(_col4)"],keys:_col0
- Merge Join Operator [MERGEJOIN_126] (rows=64420404 width=860)
- Conds:RS_52._col2=RS_53._col0(Inner),Output:["_col0","_col4"]
- <-Map 21 [SIMPLE_EDGE]
- SHUFFLE [RS_53]
- PartitionCols:_col0
- Select Operator [SEL_42] (rows=36524 width=1119)
- Output:["_col0"]
- Filter Operator [FIL_119] (rows=36524 width=1119)
- predicate:(d_month_seq BETWEEN 1203 AND 1205 and d_date_sk is not null)
- TableScan [TS_40] (rows=73049 width=1119)
- default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_month_seq"]
- <-Reducer 9 [SIMPLE_EDGE]
- SHUFFLE [RS_52]
- PartitionCols:_col2
- Merge Join Operator [MERGEJOIN_125] (rows=58564003 width=860)
- Conds:RS_49._col6, _col7=RS_50._col0, _col1(Inner),Output:["_col0","_col2","_col4"]
- <-Map 20 [SIMPLE_EDGE]
- SHUFFLE [RS_50]
- PartitionCols:_col0, _col1
- Select Operator [SEL_39] (rows=1704 width=1910)
- Output:["_col0","_col1"]
- Filter Operator [FIL_118] (rows=1704 width=1910)
- predicate:(s_county is not null and s_state is not null)
- TableScan [TS_37] (rows=1704 width=1910)
- default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_county","s_state"]
- <-Reducer 8 [SIMPLE_EDGE]
- SHUFFLE [RS_49]
- PartitionCols:_col6, _col7
- Merge Join Operator [MERGEJOIN_124] (rows=53240002 width=860)
- Conds:RS_46._col1=RS_47._col0(Inner),Output:["_col0","_col2","_col4","_col6","_col7"]
- <-Map 19 [SIMPLE_EDGE]
- SHUFFLE [RS_47]
- PartitionCols:_col0
- Select Operator [SEL_36] (rows=40000000 width=1014)
- Output:["_col0","_col1","_col2"]
- Filter Operator [FIL_117] (rows=40000000 width=1014)
- predicate:(ca_address_sk is not null and ca_county is not null and ca_state is not null)
- TableScan [TS_34] (rows=40000000 width=1014)
- default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_county","ca_state"]
- <-Reducer 7 [SIMPLE_EDGE]
- SHUFFLE [RS_46]
- PartitionCols:_col1
- Merge Join Operator [MERGEJOIN_123] (rows=48400001 width=860)
- Conds:RS_43._col0=RS_44._col1(Inner),Output:["_col0","_col1","_col2","_col4"]
- <-Map 18 [SIMPLE_EDGE]
- SHUFFLE [RS_44]
- PartitionCols:_col1
- Select Operator [SEL_33] (rows=1 width=0)
- Output:["_col0","_col1","_col2"]
- Filter Operator [FIL_116] (rows=1 width=0)
- predicate:(ss_customer_sk is not null and ss_sold_date_sk is not null)
- TableScan [TS_31] (rows=1 width=0)
- default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_customer_sk","ss_ext_sales_price"]
- <-Reducer 6 [SIMPLE_EDGE]
- SHUFFLE [RS_43]
- PartitionCols:_col0
- Group By Operator [GBY_29] (rows=44000000 width=860)
- Output:["_col0","_col1"],keys:KEY._col0, KEY._col1
- <-Reducer 5 [SIMPLE_EDGE]
- SHUFFLE [RS_28]
- PartitionCols:_col0, _col1
- Group By Operator [GBY_27] (rows=88000001 width=860)
- Output:["_col0","_col1"],keys:_col9, _col10
- Merge Join Operator [MERGEJOIN_122] (rows=88000001 width=860)
- Conds:RS_23._col1=RS_24._col0(Inner),Output:["_col9","_col10"]
- <-Map 17 [SIMPLE_EDGE]
- SHUFFLE [RS_24]
- PartitionCols:_col0
- Select Operator [SEL_16] (rows=80000000 width=860)
- Output:["_col0","_col1"]
- Filter Operator [FIL_115] (rows=80000000 width=860)
- predicate:(c_customer_sk is not null and c_current_addr_sk is not null)
- TableScan [TS_14] (rows=80000000 width=860)
- default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_current_addr_sk"]
- <-Reducer 4 [SIMPLE_EDGE]
- SHUFFLE [RS_23]
- PartitionCols:_col1
- Merge Join Operator [MERGEJOIN_121] (rows=139755 width=1436)
- Conds:RS_20._col0=RS_21._col0(Inner),Output:["_col1"]
- <-Map 16 [SIMPLE_EDGE]
- SHUFFLE [RS_21]
+ Group By Operator [GBY_57] (rows=696954748 width=88)
+ Output:["_col0","_col1"],aggregations:["sum(_col2)"],keys:_col10
+ Select Operator [SEL_56] (rows=696954748 width=88)
+ Output:["_col10","_col2"]
+ Merge Join Operator [MERGEJOIN_117] (rows=696954748 width=88)
+ Conds:RS_53._col1=RS_54._col5(Inner),Output:["_col2","_col10"]
+ <-Reducer 10 [SIMPLE_EDGE]
+ SHUFFLE [RS_54]
+ PartitionCols:_col5
+ Merge Join Operator [MERGEJOIN_116] (rows=316240138 width=135)
+ Conds:RS_46._col0=RS_47._col1(Inner),Output:["_col5"]
+ <-Reducer 17 [SIMPLE_EDGE]
+ SHUFFLE [RS_47]
+ PartitionCols:_col1
+ Group By Operator [GBY_41] (rows=287491029 width=135)
+ Output:["_col0","_col1"],keys:KEY._col0, KEY._col1
+ <-Reducer 16 [SIMPLE_EDGE]
+ SHUFFLE [RS_40]
+ PartitionCols:_col0, _col1
+ Group By Operator [GBY_39] (rows=574982058 width=135)
+ Output:["_col0","_col1"],keys:_col9, _col10
+ Merge Join Operator [MERGEJOIN_115] (rows=574982058 width=135)
+ Conds:RS_35._col1=RS_36._col0(Inner),Output:["_col9","_col10"]
+ <-Map 21 [SIMPLE_EDGE]
+ SHUFFLE [RS_36]
+ PartitionCols:_col0
+ Select Operator [SEL_28] (rows=80000000 width=860)
+ Output:["_col0","_col1"]
+ Filter Operator [FIL_110] (rows=80000000 width=860)
+ predicate:(c_customer_sk is not null and c_current_addr_sk is not null)
+ TableScan [TS_26] (rows=80000000 width=860)
+ default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_current_addr_sk"]
+ <-Reducer 15 [SIMPLE_EDGE]
+ SHUFFLE [RS_35]
+ PartitionCols:_col1
+ Merge Join Operator [MERGEJOIN_114] (rows=522710951 width=135)
+ Conds:RS_32._col2=RS_33._col0(Inner),Output:["_col1"]
+ <-Map 20 [SIMPLE_EDGE]
+ SHUFFLE [RS_33]
+ PartitionCols:_col0
+ Select Operator [SEL_25] (rows=115500 width=1436)
+ Output:["_col0"]
+ Filter Operator [FIL_109] (rows=115500 width=1436)
+ predicate:((i_category = 'Jewelry') and (i_class = 'football') and i_item_sk is not null)
+ TableScan [TS_23] (rows=462000 width=1436)
+ default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_class","i_category"]
+ <-Reducer 14 [SIMPLE_EDGE]
+ SHUFFLE [RS_32]
+ PartitionCols:_col2
+ Merge Join Operator [MERGEJOIN_113] (rows=475191764 width=135)
+ Conds:Union 13._col0=RS_30._col0(Inner),Output:["_col1","_col2"]
+ <-Map 19 [SIMPLE_EDGE]
+ SHUFFLE [RS_30]
+ PartitionCols:_col0
+ Select Operator [SEL_22] (rows=18262 width=1119)
+ Output:["_col0"]
+ Filter Operator [FIL_108] (rows=18262 width=1119)
+ predicate:((d_moy = 3) and (d_year = 2000) and d_date_sk is not null)
+ TableScan [TS_20] (rows=73049 width=1119)
+ default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"]
+ <-Union 13 [SIMPLE_EDGE]
+ <-Map 12 [CONTAINS]
+ Reduce Output Operator [RS_29]
PartitionCols:_col0
- Select Operator [SEL_13] (rows=18262 width=1119)
- Output:["_col0"]
- Filter Operator [FIL_114] (rows=18262 width=1119)
- predicate:((d_moy = 3) and (d_year = 2000) and d_date_sk is not null)
- TableScan [TS_11] (rows=73049 width=1119)
- default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"]
- <-Reducer 3 [SIMPLE_EDGE]
- SHUFFLE [RS_20]
+ Select Operator [SEL_14] (rows=287989836 width=135)
+ Output:["_col0","_col1","_col2"]
+ Filter Operator [FIL_106] (rows=287989836 width=135)
+ predicate:(cs_item_sk is not null and cs_sold_date_sk is not null and cs_bill_customer_sk is not null)
+ TableScan [TS_12] (rows=287989836 width=135)
+ Output:["cs_sold_date_sk","cs_bill_customer_sk","cs_item_sk"]
+ <-Map 18 [CONTAINS]
+ Reduce Output Operator [RS_29]
PartitionCols:_col0
- Merge Join Operator [MERGEJOIN_120] (rows=127050 width=1436)
- Conds:Union 2._col2=RS_18._col0(Inner),Output:["_col0","_col1"]
- <-Map 15 [SIMPLE_EDGE]
- SHUFFLE [RS_18]
- PartitionCols:_col0
- Select Operator [SEL_10] (rows=115500 width=1436)
- Output:["_col0"]
- Filter Operator [FIL_113] (rows=115500 width=1436)
- predicate:((i_category = 'Jewelry') and (i_class = 'football') and i_item_sk is not null)
- TableScan [TS_8] (rows=462000 width=1436)
- default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_class","i_category"]
- <-Union 2 [SIMPLE_EDGE]
- <-Map 1 [CONTAINS]
- Reduce Output Operator [RS_17]
- PartitionCols:_col2
- Select Operator [SEL_2] (rows=1 width=0)
- Output:["_col0","_col1","_col2"]
- Filter Operator [FIL_111] (rows=1 width=0)
- predicate:(cs_item_sk is not null and cs_sold_date_sk is not null and cs_bill_customer_sk is not null)
- TableScan [TS_0] (rows=1 width=0)
- Output:["cs_sold_date_sk","cs_bill_customer_sk","cs_item_sk"]
- <-Map 14 [CONTAINS]
- Reduce Output Operator [RS_17]
- PartitionCols:_col2
- Select Operator [SEL_5] (rows=1 width=0)
- Output:["_col0","_col1","_col2"]
- Filter Operator [FIL_112] (rows=1 width=0)
- predicate:(ws_item_sk is not null and ws_sold_date_sk is not null and ws_bill_customer_sk is not null)
- TableScan [TS_3] (rows=1 width=0)
- Output:["ws_sold_date_sk","ws_item_sk","ws_bill_customer_sk"]
+ Select Operator [SEL_17] (rows=144002668 width=135)
+ Output:["_col0","_col1","_col2"]
+ Filter Operator [FIL_107] (rows=144002668 width=135)
+ predicate:(ws_item_sk is not null and ws_sold_date_sk is not null and ws_bill_customer_sk is not null)
+ TableScan [TS_15] (rows=144002668 width=135)
+ Output:["ws_sold_date_sk","ws_item_sk","ws_bill_customer_sk"]
+ <-Reducer 9 [SIMPLE_EDGE]
+ SHUFFLE [RS_46]
+ PartitionCols:_col0
+ Merge Join Operator [MERGEJOIN_112] (rows=44000000 width=1014)
+ Conds:RS_43._col1, _col2=RS_44._col0, _col1(Inner),Output:["_col0"]
+ <-Map 11 [SIMPLE_EDGE]
+ SHUFFLE [RS_44]
+ PartitionCols:_col0, _col1
+ Select Operator [SEL_11] (rows=1704 width=1910)
+ Output:["_col0","_col1"]
+ Filter Operator [FIL_105] (rows=1704 width=1910)
+ predicate:(s_county is not null and s_state is not null)
+ TableScan [TS_9] (rows=1704 width=1910)
+ default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_county","s_state"]
+ <-Map 8 [SIMPLE_EDGE]
+ SHUFFLE [RS_43]
+ PartitionCols:_col1, _col2
+ Select Operator [SEL_8] (rows=40000000 width=1014)
+ Output:["_col0","_col1","_col2"]
+ Filter Operator [FIL_104] (rows=40000000 width=1014)
+ predicate:(ca_address_sk is not null and ca_county is not null and ca_state is not null)
+ TableScan [TS_6] (rows=40000000 width=1014)
+ default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_county","ca_state"]
+ <-Reducer 2 [SIMPLE_EDGE]
+ SHUFFLE [RS_53]
+ PartitionCols:_col1
+ Merge Join Operator [MERGEJOIN_111] (rows=633595212 width=88)
+ Conds:RS_50._col0=RS_51._col0(Inner),Output:["_col1","_col2"]
+ <-Map 1 [SIMPLE_EDGE]
+ SHUFFLE [RS_50]
+ PartitionCols:_col0
+ Select Operator [SEL_2] (rows=575995635 width=88)
+ Output:["_col0","_col1","_col2"]
+ Filter Operator [FIL_102] (rows=575995635 width=88)
+ predicate:(ss_customer_sk is not null and ss_sold_date_sk is not null)
+ TableScan [TS_0] (rows=575995635 width=88)
+ default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_customer_sk","ss_ext_sales_price"]
+ <-Map 7 [SIMPLE_EDGE]
+ SHUFFLE [RS_51]
+ PartitionCols:_col0
+ Select Operator [SEL_5] (rows=36524 width=1119)
+ Output:["_col0"]
+ Filter Operator [FIL_103] (rows=36524 width=1119)
+ predicate:(d_month_seq BETWEEN 1203 AND 1205 and d_date_sk is not null)
+ TableScan [TS_3] (rows=73049 width=1119)
+ default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_month_seq"]
http://git-wip-us.apache.org/repos/asf/hive/blob/db8a6db9/ql/src/test/results/clientpositive/perf/query55.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/query55.q.out b/ql/src/test/results/clientpositive/perf/query55.q.out
index a9044c1..fb3743d 100644
--- a/ql/src/test/results/clientpositive/perf/query55.q.out
+++ b/ql/src/test/results/clientpositive/perf/query55.q.out
@@ -16,23 +16,23 @@ Stage-0
Stage-1
Reducer 5
File Output Operator [FS_24]
- Limit [LIM_23] (rows=100 width=1436)
+ Limit [LIM_23] (rows=100 width=88)
Number of rows:100
- Select Operator [SEL_22] (rows=127050 width=1436)
+ Select Operator [SEL_22] (rows=348477374 width=88)
Output:["_col0","_col1","_col2"]
<-Reducer 4 [SIMPLE_EDGE]
SHUFFLE [RS_21]
- Group By Operator [GBY_18] (rows=127050 width=1436)
+ Group By Operator [GBY_18] (rows=348477374 width=88)
Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1
<-Reducer 3 [SIMPLE_EDGE]
SHUFFLE [RS_17]
PartitionCols:_col0, _col1
- Group By Operator [GBY_16] (rows=254100 width=1436)
- Output:["_col0","_col1","_col2"],aggregations:["sum(_col5)"],keys:_col7, _col8
- Select Operator [SEL_15] (rows=254100 width=1436)
- Output:["_col7","_col8","_col5"]
- Merge Join Operator [MERGEJOIN_34] (rows=254100 width=1436)
- Conds:RS_12._col4=RS_13._col0(Inner),Output:["_col5","_col7","_col8"]
+ Group By Operator [GBY_16] (rows=696954748 width=88)
+ Output:["_col0","_col1","_col2"],aggregations:["sum(_col2)"],keys:_col7, _col8
+ Select Operator [SEL_15] (rows=696954748 width=88)
+ Output:["_col7","_col8","_col2"]
+ Merge Join Operator [MERGEJOIN_34] (rows=696954748 width=88)
+ Conds:RS_12._col1=RS_13._col0(Inner),Output:["_col2","_col7","_col8"]
<-Map 7 [SIMPLE_EDGE]
SHUFFLE [RS_13]
PartitionCols:_col0
@@ -44,25 +44,25 @@ Stage-0
default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_brand_id","i_brand","i_manager_id"]
<-Reducer 2 [SIMPLE_EDGE]
SHUFFLE [RS_12]
- PartitionCols:_col4
- Merge Join Operator [MERGEJOIN_33] (rows=20088 width=1119)
- Conds:RS_9._col0=RS_10._col0(Inner),Output:["_col4","_col5"]
+ PartitionCols:_col1
+ Merge Join Operator [MERGEJOIN_33] (rows=633595212 width=88)
+ Conds:RS_9._col0=RS_10._col0(Inner),Output:["_col1","_col2"]
<-Map 1 [SIMPLE_EDGE]
SHUFFLE [RS_9]
PartitionCols:_col0
- Select Operator [SEL_2] (rows=18262 width=1119)
- Output:["_col0"]
- Filter Operator [FIL_30] (rows=18262 width=1119)
- predicate:((d_moy = 12) and (d_year = 2001) and d_date_sk is not null)
- TableScan [TS_0] (rows=73049 width=1119)
- default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"]
+ Select Operator [SEL_2] (rows=575995635 width=88)
+ Output:["_col0","_col1","_col2"]
+ Filter Operator [FIL_30] (rows=575995635 width=88)
+ predicate:(ss_sold_date_sk is not null and ss_item_sk is not null)
+ TableScan [TS_0] (rows=575995635 width=88)
+ default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_ext_sales_price"]
<-Map 6 [SIMPLE_EDGE]
SHUFFLE [RS_10]
PartitionCols:_col0
- Select Operator [SEL_5] (rows=1 width=0)
- Output:["_col0","_col1","_col2"]
- Filter Operator [FIL_31] (rows=1 width=0)
- predicate:(ss_sold_date_sk is not null and ss_item_sk is not null)
- TableScan [TS_3] (rows=1 width=0)
- default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_ext_sales_price"]
+ Select Operator [SEL_5] (rows=18262 width=1119)
+ Output:["_col0"]
+ Filter Operator [FIL_31] (rows=18262 width=1119)
+ predicate:((d_moy = 12) and (d_year = 2001) and d_date_sk is not null)
+ TableScan [TS_3] (rows=73049 width=1119)
+ default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"]