You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@hive.apache.org by ha...@apache.org on 2018/06/25 16:04:22 UTC
[19/51] [partial] hive git commit: HIVE-12342 : Set default value of
hive.optimize.index.filter to true (Igor Kryvenko via Ashutosh Chauhan)
http://git-wip-us.apache.org/repos/asf/hive/blob/f2c4f319/ql/src/test/results/clientpositive/perf/spark/query95.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/spark/query95.q.out b/ql/src/test/results/clientpositive/perf/spark/query95.q.out
index b0df142..abb95f9 100644
--- a/ql/src/test/results/clientpositive/perf/spark/query95.q.out
+++ b/ql/src/test/results/clientpositive/perf/spark/query95.q.out
@@ -75,6 +75,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: web_site
+ filterExpr: ((web_company_name = 'pri') and web_site_sk is not null) (type: boolean)
Statistics: Num rows: 84 Data size: 155408 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: ((web_company_name = 'pri') and web_site_sk is not null) (type: boolean)
@@ -99,6 +100,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: date_dim
+ filterExpr: (CAST( d_date AS TIMESTAMP) BETWEEN TIMESTAMP'1999-05-01 00:00:00.0' AND TIMESTAMP'1999-06-30 00:00:00.0' and d_date_sk is not null) (type: boolean)
Statistics: Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: (CAST( d_date AS TIMESTAMP) BETWEEN TIMESTAMP'1999-05-01 00:00:00.0' AND TIMESTAMP'1999-06-30 00:00:00.0' and d_date_sk is not null) (type: boolean)
@@ -134,6 +136,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: ws1
+ filterExpr: (ws_order_number is not null and ws_ship_date_sk is not null and ws_ship_addr_sk is not null and ws_web_site_sk is not null) (type: boolean)
Statistics: Num rows: 144002668 Data size: 19580198212 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: (ws_order_number is not null and ws_ship_addr_sk is not null and ws_ship_date_sk is not null and ws_web_site_sk is not null) (type: boolean)
@@ -165,6 +168,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: ws1
+ filterExpr: ws_order_number is not null (type: boolean)
Statistics: Num rows: 144002668 Data size: 19580198212 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: ws_order_number is not null (type: boolean)
@@ -184,6 +188,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: ws2
+ filterExpr: ws_order_number is not null (type: boolean)
Statistics: Num rows: 144002668 Data size: 19580198212 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: ws_order_number is not null (type: boolean)
@@ -203,6 +208,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: ws1
+ filterExpr: ws_order_number is not null (type: boolean)
Statistics: Num rows: 144002668 Data size: 19580198212 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: ws_order_number is not null (type: boolean)
@@ -222,6 +228,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: ws2
+ filterExpr: ws_order_number is not null (type: boolean)
Statistics: Num rows: 144002668 Data size: 19580198212 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: ws_order_number is not null (type: boolean)
@@ -241,6 +248,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: web_returns
+ filterExpr: wr_order_number is not null (type: boolean)
Statistics: Num rows: 14398467 Data size: 1325194184 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: wr_order_number is not null (type: boolean)
@@ -259,6 +267,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: customer_address
+ filterExpr: ((ca_state = 'TX') and ca_address_sk is not null) (type: boolean)
Statistics: Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: ((ca_state = 'TX') and ca_address_sk is not null) (type: boolean)
http://git-wip-us.apache.org/repos/asf/hive/blob/f2c4f319/ql/src/test/results/clientpositive/perf/spark/query96.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/spark/query96.q.out b/ql/src/test/results/clientpositive/perf/spark/query96.q.out
index 68af7a4..ba41c76 100644
--- a/ql/src/test/results/clientpositive/perf/spark/query96.q.out
+++ b/ql/src/test/results/clientpositive/perf/spark/query96.q.out
@@ -42,6 +42,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: time_dim
+ filterExpr: ((t_hour = 8) and (t_minute >= 30) and t_time_sk is not null) (type: boolean)
Statistics: Num rows: 86400 Data size: 40694400 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: ((t_hour = 8) and (t_minute >= 30) and t_time_sk is not null) (type: boolean)
@@ -61,6 +62,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: household_demographics
+ filterExpr: ((hd_dep_count = 5) and hd_demo_sk is not null) (type: boolean)
Statistics: Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: ((hd_dep_count = 5) and hd_demo_sk is not null) (type: boolean)
@@ -80,6 +82,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: store
+ filterExpr: ((s_store_name = 'ese') and s_store_sk is not null) (type: boolean)
Statistics: Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: ((s_store_name = 'ese') and s_store_sk is not null) (type: boolean)
@@ -107,6 +110,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: store_sales
+ filterExpr: (ss_hdemo_sk is not null and ss_sold_time_sk is not null and ss_store_sk is not null) (type: boolean)
Statistics: Num rows: 575995635 Data size: 50814502088 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: (ss_hdemo_sk is not null and ss_sold_time_sk is not null and ss_store_sk is not null) (type: boolean)
http://git-wip-us.apache.org/repos/asf/hive/blob/f2c4f319/ql/src/test/results/clientpositive/perf/spark/query97.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/spark/query97.q.out b/ql/src/test/results/clientpositive/perf/spark/query97.q.out
index 1908e48..c4f4804 100644
--- a/ql/src/test/results/clientpositive/perf/spark/query97.q.out
+++ b/ql/src/test/results/clientpositive/perf/spark/query97.q.out
@@ -61,6 +61,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: date_dim
+ filterExpr: (d_month_seq BETWEEN 1212 AND 1223 and d_date_sk is not null) (type: boolean)
Statistics: Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: (d_date_sk is not null and d_month_seq BETWEEN 1212 AND 1223) (type: boolean)
@@ -85,6 +86,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: date_dim
+ filterExpr: (d_month_seq BETWEEN 1212 AND 1223 and d_date_sk is not null) (type: boolean)
Statistics: Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: (d_date_sk is not null and d_month_seq BETWEEN 1212 AND 1223) (type: boolean)
@@ -114,6 +116,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: store_sales
+ filterExpr: ss_sold_date_sk is not null (type: boolean)
Statistics: Num rows: 575995635 Data size: 50814502088 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: ss_sold_date_sk is not null (type: boolean)
@@ -149,6 +152,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: catalog_sales
+ filterExpr: cs_sold_date_sk is not null (type: boolean)
Statistics: Num rows: 287989836 Data size: 38999608952 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: cs_sold_date_sk is not null (type: boolean)
http://git-wip-us.apache.org/repos/asf/hive/blob/f2c4f319/ql/src/test/results/clientpositive/perf/spark/query98.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/spark/query98.q.out b/ql/src/test/results/clientpositive/perf/spark/query98.q.out
index c69032b..d3f6670 100644
--- a/ql/src/test/results/clientpositive/perf/spark/query98.q.out
+++ b/ql/src/test/results/clientpositive/perf/spark/query98.q.out
@@ -74,6 +74,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: date_dim
+ filterExpr: (CAST( d_date AS TIMESTAMP) BETWEEN TIMESTAMP'2001-01-12 00:00:00.0' AND TIMESTAMP'2001-02-11 00:00:00.0' and d_date_sk is not null) (type: boolean)
Statistics: Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: (CAST( d_date AS TIMESTAMP) BETWEEN TIMESTAMP'2001-01-12 00:00:00.0' AND TIMESTAMP'2001-02-11 00:00:00.0' and d_date_sk is not null) (type: boolean)
@@ -103,6 +104,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: store_sales
+ filterExpr: (ss_item_sk is not null and ss_sold_date_sk is not null) (type: boolean)
Statistics: Num rows: 575995635 Data size: 50814502088 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: (ss_item_sk is not null and ss_sold_date_sk is not null) (type: boolean)
@@ -134,6 +136,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: item
+ filterExpr: ((i_category) IN ('Jewelry', 'Sports', 'Books') and i_item_sk is not null) (type: boolean)
Statistics: Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: ((i_category) IN ('Jewelry', 'Sports', 'Books') and i_item_sk is not null) (type: boolean)
http://git-wip-us.apache.org/repos/asf/hive/blob/f2c4f319/ql/src/test/results/clientpositive/perf/spark/query99.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/spark/query99.q.out b/ql/src/test/results/clientpositive/perf/spark/query99.q.out
index 1e584ae..f541da8 100644
--- a/ql/src/test/results/clientpositive/perf/spark/query99.q.out
+++ b/ql/src/test/results/clientpositive/perf/spark/query99.q.out
@@ -80,6 +80,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: date_dim
+ filterExpr: (d_month_seq BETWEEN 1212 AND 1223 and d_date_sk is not null) (type: boolean)
Statistics: Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: (d_date_sk is not null and d_month_seq BETWEEN 1212 AND 1223) (type: boolean)
@@ -99,6 +100,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: call_center
+ filterExpr: cc_call_center_sk is not null (type: boolean)
Statistics: Num rows: 60 Data size: 122700 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: cc_call_center_sk is not null (type: boolean)
@@ -118,6 +120,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: warehouse
+ filterExpr: w_warehouse_sk is not null (type: boolean)
Statistics: Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: w_warehouse_sk is not null (type: boolean)
@@ -137,6 +140,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: ship_mode
+ filterExpr: sm_ship_mode_sk is not null (type: boolean)
Statistics: Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE
Filter Operator
predicate: sm_ship_mode_sk is not null (type: boolean)
@@ -164,6 +168,7 @@ STAGE PLANS:
Map Operator Tree:
TableScan
alias: catalog_sales
+ filterExpr: (cs_warehouse_sk is not null and cs_ship_mode_sk is not null and cs_call_center_sk is not null and cs_ship_date_sk is not null) (type: boolean)
Statistics: Num rows: 287989836 Data size: 38999608952 Basic stats: COMPLETE Column stats: NONE
Filter Operator
predicate: (cs_call_center_sk is not null and cs_ship_date_sk is not null and cs_ship_mode_sk is not null and cs_warehouse_sk is not null) (type: boolean)
http://git-wip-us.apache.org/repos/asf/hive/blob/f2c4f319/ql/src/test/results/clientpositive/perf/tez/query1.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query1.q.out b/ql/src/test/results/clientpositive/perf/tez/query1.q.out
index ea6e0da..579940c 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query1.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query1.q.out
@@ -63,10 +63,10 @@ Stage-0
limit:100
Stage-1
Reducer 7 vectorized
- File Output Operator [FS_108]
- Limit [LIM_107] (rows=100 width=860)
+ File Output Operator [FS_159]
+ Limit [LIM_158] (rows=100 width=860)
Number of rows:100
- Select Operator [SEL_106] (rows=32266667 width=860)
+ Select Operator [SEL_157] (rows=32266667 width=860)
Output:["_col0"]
<-Reducer 6 [SIMPLE_EDGE]
SHUFFLE [RS_50]
@@ -74,96 +74,96 @@ Stage-0
Output:["_col0"]
Filter Operator [FIL_48] (rows=32266667 width=860)
predicate:(_col2 > _col7)
- Merge Join Operator [MERGEJOIN_81] (rows=96800003 width=860)
- Conds:RS_45._col1=RS_105._col1(Inner),Output:["_col2","_col6","_col7"]
+ Merge Join Operator [MERGEJOIN_132] (rows=96800003 width=860)
+ Conds:RS_45._col1=RS_156._col1(Inner),Output:["_col2","_col6","_col7"]
<-Reducer 5 [SIMPLE_EDGE]
SHUFFLE [RS_45]
PartitionCols:_col1
- Merge Join Operator [MERGEJOIN_79] (rows=88000001 width=860)
- Conds:RS_42._col0=RS_100._col0(Inner),Output:["_col1","_col2","_col6"]
+ Merge Join Operator [MERGEJOIN_130] (rows=88000001 width=860)
+ Conds:RS_42._col0=RS_151._col0(Inner),Output:["_col1","_col2","_col6"]
<-Map 12 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_100]
+ SHUFFLE [RS_151]
PartitionCols:_col0
- Select Operator [SEL_99] (rows=80000000 width=860)
+ Select Operator [SEL_150] (rows=80000000 width=860)
Output:["_col0","_col1"]
- Filter Operator [FIL_98] (rows=80000000 width=860)
+ Filter Operator [FIL_149] (rows=80000000 width=860)
predicate:c_customer_sk is not null
TableScan [TS_17] (rows=80000000 width=860)
default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_customer_id"]
<-Reducer 4 [SIMPLE_EDGE]
SHUFFLE [RS_42]
PartitionCols:_col0
- Merge Join Operator [MERGEJOIN_78] (rows=34842647 width=77)
- Conds:RS_94._col1=RS_97._col0(Inner),Output:["_col0","_col1","_col2"]
+ Merge Join Operator [MERGEJOIN_129] (rows=34842647 width=77)
+ Conds:RS_145._col1=RS_148._col0(Inner),Output:["_col0","_col1","_col2"]
<-Map 11 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_97]
+ SHUFFLE [RS_148]
PartitionCols:_col0
- Select Operator [SEL_96] (rows=852 width=1910)
+ Select Operator [SEL_147] (rows=852 width=1910)
Output:["_col0"]
- Filter Operator [FIL_95] (rows=852 width=1910)
+ Filter Operator [FIL_146] (rows=852 width=1910)
predicate:((s_state = 'NM') and s_store_sk is not null)
TableScan [TS_14] (rows=1704 width=1910)
default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_state"]
<-Reducer 3 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_94]
+ SHUFFLE [RS_145]
PartitionCols:_col1
- Select Operator [SEL_93] (rows=31675133 width=77)
+ Select Operator [SEL_144] (rows=31675133 width=77)
Output:["_col0","_col1","_col2"]
- Group By Operator [GBY_92] (rows=31675133 width=77)
+ Group By Operator [GBY_143] (rows=31675133 width=77)
Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1
<-Reducer 2 [SIMPLE_EDGE]
SHUFFLE [RS_11]
PartitionCols:_col0, _col1
Group By Operator [GBY_10] (rows=63350266 width=77)
Output:["_col0","_col1","_col2"],aggregations:["sum(_col3)"],keys:_col2, _col1
- Merge Join Operator [MERGEJOIN_77] (rows=63350266 width=77)
- Conds:RS_86._col0=RS_90._col0(Inner),Output:["_col1","_col2","_col3"]
+ Merge Join Operator [MERGEJOIN_128] (rows=63350266 width=77)
+ Conds:RS_137._col0=RS_141._col0(Inner),Output:["_col1","_col2","_col3"]
<-Map 1 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_86]
+ SHUFFLE [RS_137]
PartitionCols:_col0
- Select Operator [SEL_84] (rows=57591150 width=77)
+ Select Operator [SEL_135] (rows=57591150 width=77)
Output:["_col0","_col1","_col2","_col3"]
- Filter Operator [FIL_82] (rows=57591150 width=77)
+ Filter Operator [FIL_133] (rows=57591150 width=77)
predicate:(sr_customer_sk is not null and sr_returned_date_sk is not null and sr_store_sk is not null)
TableScan [TS_0] (rows=57591150 width=77)
default@store_returns,store_returns,Tbl:COMPLETE,Col:NONE,Output:["sr_returned_date_sk","sr_customer_sk","sr_store_sk","sr_fee"]
<-Map 10 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_90]
+ SHUFFLE [RS_141]
PartitionCols:_col0
- Select Operator [SEL_89] (rows=36524 width=1119)
+ Select Operator [SEL_140] (rows=36524 width=1119)
Output:["_col0"]
- Filter Operator [FIL_88] (rows=36524 width=1119)
+ Filter Operator [FIL_139] (rows=36524 width=1119)
predicate:((d_year = 2000) and d_date_sk is not null)
TableScan [TS_3] (rows=73049 width=1119)
default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"]
<-Reducer 9 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_105]
+ SHUFFLE [RS_156]
PartitionCols:_col1
- Select Operator [SEL_104] (rows=15837566 width=77)
+ Select Operator [SEL_155] (rows=15837566 width=77)
Output:["_col0","_col1"]
- Group By Operator [GBY_103] (rows=15837566 width=77)
+ Group By Operator [GBY_154] (rows=15837566 width=77)
Output:["_col0","_col1","_col2"],aggregations:["sum(_col2)","count(_col2)"],keys:_col1
- Select Operator [SEL_102] (rows=31675133 width=77)
+ Select Operator [SEL_153] (rows=31675133 width=77)
Output:["_col1","_col2"]
- Group By Operator [GBY_101] (rows=31675133 width=77)
+ Group By Operator [GBY_152] (rows=31675133 width=77)
Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1
<-Reducer 8 [SIMPLE_EDGE]
SHUFFLE [RS_31]
PartitionCols:_col0
Group By Operator [GBY_30] (rows=63350266 width=77)
Output:["_col0","_col1","_col2"],aggregations:["sum(_col3)"],keys:_col2, _col1
- Merge Join Operator [MERGEJOIN_80] (rows=63350266 width=77)
- Conds:RS_87._col0=RS_91._col0(Inner),Output:["_col1","_col2","_col3"]
+ Merge Join Operator [MERGEJOIN_131] (rows=63350266 width=77)
+ Conds:RS_138._col0=RS_142._col0(Inner),Output:["_col1","_col2","_col3"]
<-Map 1 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_87]
+ SHUFFLE [RS_138]
PartitionCols:_col0
- Select Operator [SEL_85] (rows=57591150 width=77)
+ Select Operator [SEL_136] (rows=57591150 width=77)
Output:["_col0","_col1","_col2","_col3"]
- Filter Operator [FIL_83] (rows=57591150 width=77)
+ Filter Operator [FIL_134] (rows=57591150 width=77)
predicate:(sr_returned_date_sk is not null and sr_store_sk is not null)
Please refer to the previous TableScan [TS_0]
<-Map 10 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_91]
+ SHUFFLE [RS_142]
PartitionCols:_col0
- Please refer to the previous Select Operator [SEL_89]
+ Please refer to the previous Select Operator [SEL_140]
http://git-wip-us.apache.org/repos/asf/hive/blob/f2c4f319/ql/src/test/results/clientpositive/perf/tez/query10.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query10.q.out b/ql/src/test/results/clientpositive/perf/tez/query10.q.out
index a88b7e1..1b6adee 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query10.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query10.q.out
@@ -117,32 +117,39 @@ POSTHOOK: type: QUERY
Plan optimized by CBO.
Vertex dependency in root stage
-Reducer 10 <- Map 11 (SIMPLE_EDGE), Map 9 (SIMPLE_EDGE)
-Reducer 12 <- Map 11 (SIMPLE_EDGE), Map 16 (SIMPLE_EDGE)
-Reducer 13 <- Reducer 12 (SIMPLE_EDGE)
-Reducer 14 <- Map 11 (SIMPLE_EDGE), Map 17 (SIMPLE_EDGE)
+Map 10 <- Reducer 13 (BROADCAST_EDGE), Reducer 7 (BROADCAST_EDGE)
+Map 20 <- Reducer 16 (BROADCAST_EDGE)
+Map 21 <- Reducer 19 (BROADCAST_EDGE)
+Reducer 11 <- Map 10 (SIMPLE_EDGE), Map 12 (SIMPLE_EDGE)
+Reducer 13 <- Map 12 (CUSTOM_SIMPLE_EDGE)
+Reducer 14 <- Map 12 (SIMPLE_EDGE), Map 20 (SIMPLE_EDGE)
Reducer 15 <- Reducer 14 (SIMPLE_EDGE)
-Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 7 (SIMPLE_EDGE)
-Reducer 3 <- Map 8 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE)
-Reducer 4 <- Reducer 10 (SIMPLE_EDGE), Reducer 13 (ONE_TO_ONE_EDGE), Reducer 15 (ONE_TO_ONE_EDGE), Reducer 3 (SIMPLE_EDGE)
+Reducer 16 <- Map 12 (CUSTOM_SIMPLE_EDGE)
+Reducer 17 <- Map 12 (SIMPLE_EDGE), Map 21 (SIMPLE_EDGE)
+Reducer 18 <- Reducer 17 (SIMPLE_EDGE)
+Reducer 19 <- Map 12 (CUSTOM_SIMPLE_EDGE)
+Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 8 (SIMPLE_EDGE)
+Reducer 3 <- Map 9 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE)
+Reducer 4 <- Reducer 11 (SIMPLE_EDGE), Reducer 15 (ONE_TO_ONE_EDGE), Reducer 18 (ONE_TO_ONE_EDGE), Reducer 3 (SIMPLE_EDGE)
Reducer 5 <- Reducer 4 (SIMPLE_EDGE)
Reducer 6 <- Reducer 5 (SIMPLE_EDGE)
+Reducer 7 <- Reducer 3 (CUSTOM_SIMPLE_EDGE)
Stage-0
Fetch Operator
limit:100
Stage-1
Reducer 6 vectorized
- File Output Operator [FS_143]
- Limit [LIM_142] (rows=100 width=88)
+ File Output Operator [FS_224]
+ Limit [LIM_223] (rows=100 width=88)
Number of rows:100
- Select Operator [SEL_141] (rows=1045432122 width=88)
+ Select Operator [SEL_222] (rows=1045432122 width=88)
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13"]
<-Reducer 5 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_140]
- Select Operator [SEL_139] (rows=1045432122 width=88)
+ SHUFFLE [RS_221]
+ Select Operator [SEL_220] (rows=1045432122 width=88)
Output:["_col0","_col1","_col2","_col3","_col4","_col6","_col8","_col10","_col12"]
- Group By Operator [GBY_138] (rows=1045432122 width=88)
+ Group By Operator [GBY_219] (rows=1045432122 width=88)
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"],aggregations:["count(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4, KEY._col5, KEY._col6, KEY._col7
<-Reducer 4 [SIMPLE_EDGE]
SHUFFLE [RS_63]
@@ -153,124 +160,168 @@ Stage-0
Output:["_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13"]
Filter Operator [FIL_60] (rows=2090864244 width=88)
predicate:(_col15 is not null or _col17 is not null)
- Merge Join Operator [MERGEJOIN_108] (rows=2090864244 width=88)
- Conds:RS_55._col0=RS_56._col0(Left Semi),RS_55._col0=RS_131._col0(Left Outer),RS_55._col0=RS_137._col0(Left Outer),Output:["_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col15","_col17"]
- <-Reducer 10 [SIMPLE_EDGE]
+ Merge Join Operator [MERGEJOIN_172] (rows=2090864244 width=88)
+ Conds:RS_55._col0=RS_56._col0(Left Semi),RS_55._col0=RS_210._col0(Left Outer),RS_55._col0=RS_218._col0(Left Outer),Output:["_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col15","_col17"]
+ <-Reducer 3 [SIMPLE_EDGE]
+ PARTITION_ONLY_SHUFFLE [RS_55]
+ PartitionCols:_col0
+ Merge Join Operator [MERGEJOIN_168] (rows=96800003 width=860)
+ Conds:RS_50._col1=RS_181._col0(Inner),Output:["_col0","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13"]
+ <-Map 9 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_181]
+ PartitionCols:_col0
+ Select Operator [SEL_180] (rows=1861800 width=385)
+ Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"]
+ Filter Operator [FIL_179] (rows=1861800 width=385)
+ predicate:cd_demo_sk is not null
+ TableScan [TS_6] (rows=1861800 width=385)
+ default@customer_demographics,customer_demographics,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_gender","cd_marital_status","cd_education_status","cd_purchase_estimate","cd_credit_rating","cd_dep_count","cd_dep_employed_count","cd_dep_college_count"]
+ <-Reducer 2 [SIMPLE_EDGE]
+ SHUFFLE [RS_50]
+ PartitionCols:_col1
+ Merge Join Operator [MERGEJOIN_167] (rows=88000001 width=860)
+ Conds:RS_175._col2=RS_178._col0(Inner),Output:["_col0","_col1"]
+ <-Map 1 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_175]
+ PartitionCols:_col2
+ Select Operator [SEL_174] (rows=80000000 width=860)
+ Output:["_col0","_col1","_col2"]
+ Filter Operator [FIL_173] (rows=80000000 width=860)
+ predicate:(c_current_addr_sk is not null and c_current_cdemo_sk is not null and c_customer_sk is not null)
+ TableScan [TS_0] (rows=80000000 width=860)
+ default@customer,c,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_current_cdemo_sk","c_current_addr_sk"]
+ <-Map 8 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_178]
+ PartitionCols:_col0
+ Select Operator [SEL_177] (rows=20000000 width=1014)
+ Output:["_col0"]
+ Filter Operator [FIL_176] (rows=20000000 width=1014)
+ predicate:((ca_county) IN ('Walker County', 'Richland County', 'Gaines County', 'Douglas County', 'Dona Ana County') and ca_address_sk is not null)
+ TableScan [TS_3] (rows=40000000 width=1014)
+ default@customer_address,ca,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_county"]
+ <-Reducer 11 [SIMPLE_EDGE]
SHUFFLE [RS_56]
PartitionCols:_col0
Group By Operator [GBY_54] (rows=633595212 width=88)
Output:["_col0"],keys:_col0
Select Operator [SEL_18] (rows=633595212 width=88)
Output:["_col0"]
- Merge Join Operator [MERGEJOIN_105] (rows=633595212 width=88)
- Conds:RS_120._col0=RS_123._col0(Inner),Output:["_col1"]
- <-Map 11 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_123]
+ Merge Join Operator [MERGEJOIN_169] (rows=633595212 width=88)
+ Conds:RS_202._col0=RS_184._col0(Inner),Output:["_col1"]
+ <-Map 12 [SIMPLE_EDGE] vectorized
+ PARTITION_ONLY_SHUFFLE [RS_184]
PartitionCols:_col0
- Select Operator [SEL_122] (rows=4058 width=1119)
+ Select Operator [SEL_183] (rows=4058 width=1119)
Output:["_col0"]
- Filter Operator [FIL_121] (rows=4058 width=1119)
+ Filter Operator [FIL_182] (rows=4058 width=1119)
predicate:((d_year = 2002) and d_date_sk is not null and d_moy BETWEEN 4 AND 7)
TableScan [TS_12] (rows=73049 width=1119)
default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"]
- <-Map 9 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_120]
+ <-Map 10 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_202]
PartitionCols:_col0
- Select Operator [SEL_119] (rows=575995635 width=88)
+ Select Operator [SEL_201] (rows=575995635 width=88)
Output:["_col0","_col1"]
- Filter Operator [FIL_118] (rows=575995635 width=88)
- predicate:(ss_customer_sk is not null and ss_sold_date_sk is not null)
+ Filter Operator [FIL_200] (rows=575995635 width=88)
+ predicate:((ss_customer_sk BETWEEN DynamicValue(RS_55_c_c_customer_sk_min) AND DynamicValue(RS_55_c_c_customer_sk_max) and in_bloom_filter(ss_customer_sk, DynamicValue(RS_55_c_c_customer_sk_bloom_filter))) and (ss_sold_date_sk BETWEEN DynamicValue(RS_16_date_dim_d_date_sk_min) AND DynamicValue(RS_16_date_dim_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk, DynamicValue(RS_16_date_dim_d_date_sk_bloom_filter))) and ss_customer_sk is not null and ss_sold_date_sk is not null)
TableScan [TS_9] (rows=575995635 width=88)
default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_customer_sk"]
- <-Reducer 13 [ONE_TO_ONE_EDGE] vectorized
- FORWARD [RS_131]
+ <-Reducer 13 [BROADCAST_EDGE] vectorized
+ BROADCAST [RS_197]
+ Group By Operator [GBY_196] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
+ <-Map 12 [CUSTOM_SIMPLE_EDGE] vectorized
+ PARTITION_ONLY_SHUFFLE [RS_193]
+ Group By Operator [GBY_190] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
+ Select Operator [SEL_185] (rows=4058 width=1119)
+ Output:["_col0"]
+ Please refer to the previous Select Operator [SEL_183]
+ <-Reducer 7 [BROADCAST_EDGE] vectorized
+ BROADCAST [RS_199]
+ Group By Operator [GBY_198] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=96800000)"]
+ <-Reducer 3 [CUSTOM_SIMPLE_EDGE]
+ PARTITION_ONLY_SHUFFLE [RS_135]
+ Group By Operator [GBY_134] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=96800000)"]
+ Select Operator [SEL_133] (rows=96800003 width=860)
+ Output:["_col0"]
+ Please refer to the previous Merge Join Operator [MERGEJOIN_168]
+ <-Reducer 15 [ONE_TO_ONE_EDGE] vectorized
+ FORWARD [RS_210]
PartitionCols:_col0
- Select Operator [SEL_130] (rows=79201469 width=135)
+ Select Operator [SEL_209] (rows=79201469 width=135)
Output:["_col0","_col1"]
- Group By Operator [GBY_129] (rows=79201469 width=135)
+ Group By Operator [GBY_208] (rows=79201469 width=135)
Output:["_col0"],keys:KEY._col0
- <-Reducer 12 [SIMPLE_EDGE]
+ <-Reducer 14 [SIMPLE_EDGE]
SHUFFLE [RS_30]
PartitionCols:_col0
Group By Operator [GBY_29] (rows=158402938 width=135)
Output:["_col0"],keys:_col1
- Merge Join Operator [MERGEJOIN_106] (rows=158402938 width=135)
- Conds:RS_128._col0=RS_124._col0(Inner),Output:["_col1"]
- <-Map 11 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_124]
+ Merge Join Operator [MERGEJOIN_170] (rows=158402938 width=135)
+ Conds:RS_207._col0=RS_186._col0(Inner),Output:["_col1"]
+ <-Map 12 [SIMPLE_EDGE] vectorized
+ PARTITION_ONLY_SHUFFLE [RS_186]
PartitionCols:_col0
- Please refer to the previous Select Operator [SEL_122]
- <-Map 16 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_128]
+ Please refer to the previous Select Operator [SEL_183]
+ <-Map 20 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_207]
PartitionCols:_col0
- Select Operator [SEL_127] (rows=144002668 width=135)
+ Select Operator [SEL_206] (rows=144002668 width=135)
Output:["_col0","_col1"]
- Filter Operator [FIL_126] (rows=144002668 width=135)
- predicate:(ws_bill_customer_sk is not null and ws_sold_date_sk is not null)
+ Filter Operator [FIL_205] (rows=144002668 width=135)
+ predicate:((ws_sold_date_sk BETWEEN DynamicValue(RS_26_date_dim_d_date_sk_min) AND DynamicValue(RS_26_date_dim_d_date_sk_max) and in_bloom_filter(ws_sold_date_sk, DynamicValue(RS_26_date_dim_d_date_sk_bloom_filter))) and ws_bill_customer_sk is not null and ws_sold_date_sk is not null)
TableScan [TS_19] (rows=144002668 width=135)
default@web_sales,web_sales,Tbl:COMPLETE,Col:NONE,Output:["ws_sold_date_sk","ws_bill_customer_sk"]
- <-Reducer 15 [ONE_TO_ONE_EDGE] vectorized
- FORWARD [RS_137]
+ <-Reducer 16 [BROADCAST_EDGE] vectorized
+ BROADCAST [RS_204]
+ Group By Operator [GBY_203] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
+ <-Map 12 [CUSTOM_SIMPLE_EDGE] vectorized
+ PARTITION_ONLY_SHUFFLE [RS_194]
+ Group By Operator [GBY_191] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
+ Select Operator [SEL_187] (rows=4058 width=1119)
+ Output:["_col0"]
+ Please refer to the previous Select Operator [SEL_183]
+ <-Reducer 18 [ONE_TO_ONE_EDGE] vectorized
+ FORWARD [RS_218]
PartitionCols:_col0
- Select Operator [SEL_136] (rows=158394413 width=135)
+ Select Operator [SEL_217] (rows=158394413 width=135)
Output:["_col0","_col1"]
- Group By Operator [GBY_135] (rows=158394413 width=135)
+ Group By Operator [GBY_216] (rows=158394413 width=135)
Output:["_col0"],keys:KEY._col0
- <-Reducer 14 [SIMPLE_EDGE]
+ <-Reducer 17 [SIMPLE_EDGE]
SHUFFLE [RS_44]
PartitionCols:_col0
Group By Operator [GBY_43] (rows=316788826 width=135)
Output:["_col0"],keys:_col1
- Merge Join Operator [MERGEJOIN_107] (rows=316788826 width=135)
- Conds:RS_134._col0=RS_125._col0(Inner),Output:["_col1"]
- <-Map 11 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_125]
+ Merge Join Operator [MERGEJOIN_171] (rows=316788826 width=135)
+ Conds:RS_215._col0=RS_188._col0(Inner),Output:["_col1"]
+ <-Map 12 [SIMPLE_EDGE] vectorized
+ PARTITION_ONLY_SHUFFLE [RS_188]
PartitionCols:_col0
- Please refer to the previous Select Operator [SEL_122]
- <-Map 17 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_134]
+ Please refer to the previous Select Operator [SEL_183]
+ <-Map 21 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_215]
PartitionCols:_col0
- Select Operator [SEL_133] (rows=287989836 width=135)
+ Select Operator [SEL_214] (rows=287989836 width=135)
Output:["_col0","_col1"]
- Filter Operator [FIL_132] (rows=287989836 width=135)
- predicate:(cs_ship_customer_sk is not null and cs_sold_date_sk is not null)
+ Filter Operator [FIL_213] (rows=287989836 width=135)
+ predicate:((cs_sold_date_sk BETWEEN DynamicValue(RS_40_date_dim_d_date_sk_min) AND DynamicValue(RS_40_date_dim_d_date_sk_max) and in_bloom_filter(cs_sold_date_sk, DynamicValue(RS_40_date_dim_d_date_sk_bloom_filter))) and cs_ship_customer_sk is not null and cs_sold_date_sk is not null)
TableScan [TS_33] (rows=287989836 width=135)
default@catalog_sales,catalog_sales,Tbl:COMPLETE,Col:NONE,Output:["cs_sold_date_sk","cs_ship_customer_sk"]
- <-Reducer 3 [SIMPLE_EDGE]
- SHUFFLE [RS_55]
- PartitionCols:_col0
- Merge Join Operator [MERGEJOIN_104] (rows=96800003 width=860)
- Conds:RS_50._col1=RS_117._col0(Inner),Output:["_col0","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13"]
- <-Map 8 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_117]
- PartitionCols:_col0
- Select Operator [SEL_116] (rows=1861800 width=385)
- Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"]
- Filter Operator [FIL_115] (rows=1861800 width=385)
- predicate:cd_demo_sk is not null
- TableScan [TS_6] (rows=1861800 width=385)
- default@customer_demographics,customer_demographics,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_gender","cd_marital_status","cd_education_status","cd_purchase_estimate","cd_credit_rating","cd_dep_count","cd_dep_employed_count","cd_dep_college_count"]
- <-Reducer 2 [SIMPLE_EDGE]
- SHUFFLE [RS_50]
- PartitionCols:_col1
- Merge Join Operator [MERGEJOIN_103] (rows=88000001 width=860)
- Conds:RS_111._col2=RS_114._col0(Inner),Output:["_col0","_col1"]
- <-Map 1 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_111]
- PartitionCols:_col2
- Select Operator [SEL_110] (rows=80000000 width=860)
- Output:["_col0","_col1","_col2"]
- Filter Operator [FIL_109] (rows=80000000 width=860)
- predicate:(c_current_addr_sk is not null and c_current_cdemo_sk is not null and c_customer_sk is not null)
- TableScan [TS_0] (rows=80000000 width=860)
- default@customer,c,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_current_cdemo_sk","c_current_addr_sk"]
- <-Map 7 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_114]
- PartitionCols:_col0
- Select Operator [SEL_113] (rows=20000000 width=1014)
- Output:["_col0"]
- Filter Operator [FIL_112] (rows=20000000 width=1014)
- predicate:((ca_county) IN ('Walker County', 'Richland County', 'Gaines County', 'Douglas County', 'Dona Ana County') and ca_address_sk is not null)
- TableScan [TS_3] (rows=40000000 width=1014)
- default@customer_address,ca,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_county"]
+ <-Reducer 19 [BROADCAST_EDGE] vectorized
+ BROADCAST [RS_212]
+ Group By Operator [GBY_211] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
+ <-Map 12 [CUSTOM_SIMPLE_EDGE] vectorized
+ PARTITION_ONLY_SHUFFLE [RS_195]
+ Group By Operator [GBY_192] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
+ Select Operator [SEL_189] (rows=4058 width=1119)
+ Output:["_col0"]
+ Please refer to the previous Select Operator [SEL_183]
http://git-wip-us.apache.org/repos/asf/hive/blob/f2c4f319/ql/src/test/results/clientpositive/perf/tez/query11.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query11.q.out b/ql/src/test/results/clientpositive/perf/tez/query11.q.out
index 2599621..bf454a0 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query11.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query11.q.out
@@ -149,30 +149,40 @@ POSTHOOK: type: QUERY
Plan optimized by CBO.
Vertex dependency in root stage
-Reducer 11 <- Map 10 (SIMPLE_EDGE), Map 17 (SIMPLE_EDGE)
-Reducer 12 <- Map 18 (SIMPLE_EDGE), Reducer 11 (SIMPLE_EDGE)
-Reducer 13 <- Reducer 12 (SIMPLE_EDGE)
-Reducer 14 <- Map 10 (SIMPLE_EDGE), Map 17 (SIMPLE_EDGE)
-Reducer 15 <- Map 18 (SIMPLE_EDGE), Reducer 14 (SIMPLE_EDGE)
-Reducer 16 <- Reducer 15 (SIMPLE_EDGE)
-Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 17 (SIMPLE_EDGE)
-Reducer 3 <- Map 18 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE)
+Map 1 <- Reducer 17 (BROADCAST_EDGE)
+Map 11 <- Reducer 16 (BROADCAST_EDGE), Reducer 24 (BROADCAST_EDGE)
+Map 26 <- Reducer 22 (BROADCAST_EDGE)
+Map 7 <- Reducer 18 (BROADCAST_EDGE), Reducer 25 (BROADCAST_EDGE)
+Reducer 10 <- Reducer 9 (SIMPLE_EDGE)
+Reducer 12 <- Map 11 (SIMPLE_EDGE), Map 15 (SIMPLE_EDGE)
+Reducer 13 <- Map 23 (SIMPLE_EDGE), Reducer 12 (SIMPLE_EDGE)
+Reducer 14 <- Reducer 13 (SIMPLE_EDGE)
+Reducer 16 <- Map 15 (CUSTOM_SIMPLE_EDGE)
+Reducer 17 <- Map 15 (CUSTOM_SIMPLE_EDGE)
+Reducer 18 <- Map 15 (CUSTOM_SIMPLE_EDGE)
+Reducer 19 <- Map 15 (SIMPLE_EDGE), Map 26 (SIMPLE_EDGE)
+Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 15 (SIMPLE_EDGE)
+Reducer 20 <- Map 23 (SIMPLE_EDGE), Reducer 19 (SIMPLE_EDGE)
+Reducer 21 <- Reducer 20 (SIMPLE_EDGE)
+Reducer 22 <- Map 15 (CUSTOM_SIMPLE_EDGE)
+Reducer 24 <- Map 23 (CUSTOM_SIMPLE_EDGE)
+Reducer 25 <- Map 23 (CUSTOM_SIMPLE_EDGE)
+Reducer 3 <- Map 23 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE)
Reducer 4 <- Reducer 3 (SIMPLE_EDGE)
-Reducer 5 <- Reducer 13 (SIMPLE_EDGE), Reducer 16 (SIMPLE_EDGE), Reducer 4 (SIMPLE_EDGE), Reducer 9 (SIMPLE_EDGE)
+Reducer 5 <- Reducer 10 (SIMPLE_EDGE), Reducer 14 (SIMPLE_EDGE), Reducer 21 (SIMPLE_EDGE), Reducer 4 (SIMPLE_EDGE)
Reducer 6 <- Reducer 5 (SIMPLE_EDGE)
-Reducer 7 <- Map 1 (SIMPLE_EDGE), Map 17 (SIMPLE_EDGE)
-Reducer 8 <- Map 18 (SIMPLE_EDGE), Reducer 7 (SIMPLE_EDGE)
-Reducer 9 <- Reducer 8 (SIMPLE_EDGE)
+Reducer 8 <- Map 15 (SIMPLE_EDGE), Map 7 (SIMPLE_EDGE)
+Reducer 9 <- Map 23 (SIMPLE_EDGE), Reducer 8 (SIMPLE_EDGE)
Stage-0
Fetch Operator
limit:100
Stage-1
Reducer 6 vectorized
- File Output Operator [FS_218]
- Limit [LIM_217] (rows=100 width=88)
+ File Output Operator [FS_360]
+ Limit [LIM_359] (rows=100 width=88)
Number of rows:100
- Select Operator [SEL_216] (rows=383325119 width=88)
+ Select Operator [SEL_358] (rows=383325119 width=88)
Output:["_col0"]
<-Reducer 5 [SIMPLE_EDGE]
SHUFFLE [RS_93]
@@ -180,103 +190,209 @@ Stage-0
Output:["_col0"]
Filter Operator [FIL_91] (rows=383325119 width=88)
predicate:((_col1 / _col8) > (_col6 / _col3))
- Merge Join Operator [MERGEJOIN_175] (rows=1149975359 width=88)
- Conds:RS_198._col0=RS_215._col0(Inner),RS_215._col0=RS_210._col0(Inner),RS_215._col0=RS_203._col0(Inner),Output:["_col1","_col3","_col5","_col6","_col8"]
- <-Reducer 13 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_210]
+ Merge Join Operator [MERGEJOIN_283] (rows=1149975359 width=88)
+ Conds:RS_325._col0=RS_337._col0(Inner),RS_337._col0=RS_347._col0(Inner),RS_337._col0=RS_357._col0(Inner),Output:["_col1","_col3","_col5","_col6","_col8"]
+ <-Reducer 10 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_337]
PartitionCols:_col0
- Select Operator [SEL_209] (rows=348477374 width=88)
+ Select Operator [SEL_336] (rows=116159124 width=88)
+ Output:["_col0","_col1"]
+ Filter Operator [FIL_335] (rows=116159124 width=88)
+ predicate:(_col7 > 0)
+ Select Operator [SEL_334] (rows=348477374 width=88)
+ Output:["_col0","_col7"]
+ Group By Operator [GBY_333] (rows=348477374 width=88)
+ Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4, KEY._col5, KEY._col6
+ <-Reducer 9 [SIMPLE_EDGE]
+ SHUFFLE [RS_39]
+ PartitionCols:_col0, _col1, _col2, _col3, _col4, _col5, _col6
+ Group By Operator [GBY_38] (rows=696954748 width=88)
+ Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"],aggregations:["sum(_col7)"],keys:_col0, _col1, _col2, _col3, _col4, _col5, _col6
+ Select Operator [SEL_36] (rows=696954748 width=88)
+ Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"]
+ Merge Join Operator [MERGEJOIN_278] (rows=696954748 width=88)
+ Conds:RS_33._col1=RS_316._col0(Inner),Output:["_col2","_col3","_col7","_col8","_col9","_col10","_col11","_col12","_col13"]
+ <-Map 23 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_316]
+ PartitionCols:_col0
+ Select Operator [SEL_312] (rows=80000000 width=860)
+ Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"]
+ Filter Operator [FIL_311] (rows=80000000 width=860)
+ predicate:(c_customer_id is not null and c_customer_sk is not null)
+ TableScan [TS_49] (rows=80000000 width=860)
+ default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_customer_id","c_first_name","c_last_name","c_preferred_cust_flag","c_birth_country","c_login","c_email_address"]
+ <-Reducer 8 [SIMPLE_EDGE]
+ SHUFFLE [RS_33]
+ PartitionCols:_col1
+ Merge Join Operator [MERGEJOIN_277] (rows=633595212 width=88)
+ Conds:RS_332._col0=RS_294._col0(Inner),Output:["_col1","_col2","_col3"]
+ <-Map 15 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_294]
+ PartitionCols:_col0
+ Select Operator [SEL_288] (rows=36524 width=1119)
+ Output:["_col0"]
+ Filter Operator [FIL_285] (rows=36524 width=1119)
+ predicate:((d_year = 2001) and d_date_sk is not null)
+ TableScan [TS_46] (rows=73049 width=1119)
+ default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"]
+ <-Map 7 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_332]
+ PartitionCols:_col0
+ Select Operator [SEL_331] (rows=575995635 width=88)
+ Output:["_col0","_col1","_col2","_col3"]
+ Filter Operator [FIL_330] (rows=575995635 width=88)
+ predicate:((ss_customer_sk BETWEEN DynamicValue(RS_34_customer_c_customer_sk_min) AND DynamicValue(RS_34_customer_c_customer_sk_max) and in_bloom_filter(ss_customer_sk, DynamicValue(RS_34_customer_c_customer_sk_bloom_filter))) and (ss_sold_date_sk BETWEEN DynamicValue(RS_31_date_dim_d_date_sk_min) AND DynamicValue(RS_31_date_dim_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk, DynamicValue(RS_31_date_dim_d_date_sk_bloom_filter))) and ss_customer_sk is not null and ss_sold_date_sk is not null)
+ TableScan [TS_21] (rows=575995635 width=88)
+ default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_customer_sk","ss_ext_discount_amt","ss_ext_list_price"]
+ <-Reducer 18 [BROADCAST_EDGE] vectorized
+ BROADCAST [RS_327]
+ Group By Operator [GBY_326] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
+ <-Map 15 [CUSTOM_SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_304]
+ Group By Operator [GBY_300] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
+ Select Operator [SEL_295] (rows=36524 width=1119)
+ Output:["_col0"]
+ Please refer to the previous Select Operator [SEL_288]
+ <-Reducer 25 [BROADCAST_EDGE] vectorized
+ BROADCAST [RS_329]
+ Group By Operator [GBY_328] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=80000000)"]
+ <-Map 23 [CUSTOM_SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_322]
+ Group By Operator [GBY_320] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=80000000)"]
+ Select Operator [SEL_317] (rows=80000000 width=860)
+ Output:["_col0"]
+ Please refer to the previous Select Operator [SEL_312]
+ <-Reducer 14 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_347]
+ PartitionCols:_col0
+ Select Operator [SEL_346] (rows=348477374 width=88)
Output:["_col0","_col1","_col2"]
- Group By Operator [GBY_208] (rows=348477374 width=88)
+ Group By Operator [GBY_345] (rows=348477374 width=88)
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4, KEY._col5, KEY._col6
- <-Reducer 12 [SIMPLE_EDGE]
+ <-Reducer 13 [SIMPLE_EDGE]
SHUFFLE [RS_61]
PartitionCols:_col0, _col1, _col2, _col3, _col4, _col5, _col6
Group By Operator [GBY_60] (rows=696954748 width=88)
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"],aggregations:["sum(_col7)"],keys:_col0, _col1, _col2, _col3, _col4, _col5, _col6
Select Operator [SEL_58] (rows=696954748 width=88)
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"]
- Merge Join Operator [MERGEJOIN_172] (rows=696954748 width=88)
- Conds:RS_55._col1=RS_192._col0(Inner),Output:["_col2","_col3","_col7","_col8","_col9","_col10","_col11","_col12","_col13"]
- <-Map 18 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_192]
+ Merge Join Operator [MERGEJOIN_280] (rows=696954748 width=88)
+ Conds:RS_55._col1=RS_313._col0(Inner),Output:["_col2","_col3","_col7","_col8","_col9","_col10","_col11","_col12","_col13"]
+ <-Map 23 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_313]
PartitionCols:_col0
- Select Operator [SEL_191] (rows=80000000 width=860)
- Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"]
- Filter Operator [FIL_190] (rows=80000000 width=860)
- predicate:(c_customer_id is not null and c_customer_sk is not null)
- TableScan [TS_49] (rows=80000000 width=860)
- default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_customer_id","c_first_name","c_last_name","c_preferred_cust_flag","c_birth_country","c_login","c_email_address"]
- <-Reducer 11 [SIMPLE_EDGE]
+ Please refer to the previous Select Operator [SEL_312]
+ <-Reducer 12 [SIMPLE_EDGE]
SHUFFLE [RS_55]
PartitionCols:_col1
- Merge Join Operator [MERGEJOIN_171] (rows=633595212 width=88)
- Conds:RS_206._col0=RS_186._col0(Inner),Output:["_col1","_col2","_col3"]
- <-Map 17 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_186]
+ Merge Join Operator [MERGEJOIN_279] (rows=633595212 width=88)
+ Conds:RS_344._col0=RS_290._col0(Inner),Output:["_col1","_col2","_col3"]
+ <-Map 15 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_290]
PartitionCols:_col0
- Select Operator [SEL_183] (rows=36524 width=1119)
+ Select Operator [SEL_287] (rows=36524 width=1119)
Output:["_col0"]
- Filter Operator [FIL_180] (rows=36524 width=1119)
+ Filter Operator [FIL_284] (rows=36524 width=1119)
predicate:((d_year = 2002) and d_date_sk is not null)
- TableScan [TS_46] (rows=73049 width=1119)
- default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"]
- <-Map 10 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_206]
+ Please refer to the previous TableScan [TS_46]
+ <-Map 11 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_344]
PartitionCols:_col0
- Select Operator [SEL_205] (rows=575995635 width=88)
+ Select Operator [SEL_343] (rows=575995635 width=88)
Output:["_col0","_col1","_col2","_col3"]
- Filter Operator [FIL_204] (rows=575995635 width=88)
- predicate:(ss_customer_sk is not null and ss_sold_date_sk is not null)
+ Filter Operator [FIL_342] (rows=575995635 width=88)
+ predicate:((ss_customer_sk BETWEEN DynamicValue(RS_56_customer_c_customer_sk_min) AND DynamicValue(RS_56_customer_c_customer_sk_max) and in_bloom_filter(ss_customer_sk, DynamicValue(RS_56_customer_c_customer_sk_bloom_filter))) and (ss_sold_date_sk BETWEEN DynamicValue(RS_53_date_dim_d_date_sk_min) AND DynamicValue(RS_53_date_dim_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk, DynamicValue(RS_53_date_dim_d_date_sk_bloom_filter))) and ss_customer_sk is not null and ss_sold_date_sk is not null)
TableScan [TS_43] (rows=575995635 width=88)
default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_customer_sk","ss_ext_discount_amt","ss_ext_list_price"]
- <-Reducer 16 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_215]
+ <-Reducer 16 [BROADCAST_EDGE] vectorized
+ BROADCAST [RS_339]
+ Group By Operator [GBY_338] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
+ <-Map 15 [CUSTOM_SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_302]
+ Group By Operator [GBY_298] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
+ Select Operator [SEL_291] (rows=36524 width=1119)
+ Output:["_col0"]
+ Please refer to the previous Select Operator [SEL_287]
+ <-Reducer 24 [BROADCAST_EDGE] vectorized
+ BROADCAST [RS_341]
+ Group By Operator [GBY_340] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=80000000)"]
+ <-Map 23 [CUSTOM_SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_321]
+ Group By Operator [GBY_319] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=80000000)"]
+ Select Operator [SEL_314] (rows=80000000 width=860)
+ Output:["_col0"]
+ Please refer to the previous Select Operator [SEL_312]
+ <-Reducer 21 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_357]
PartitionCols:_col0
- Select Operator [SEL_214] (rows=116159124 width=88)
+ Select Operator [SEL_356] (rows=29040539 width=135)
Output:["_col0","_col1"]
- Filter Operator [FIL_213] (rows=116159124 width=88)
+ Filter Operator [FIL_355] (rows=29040539 width=135)
predicate:(_col7 > 0)
- Select Operator [SEL_212] (rows=348477374 width=88)
+ Select Operator [SEL_354] (rows=87121617 width=135)
Output:["_col0","_col7"]
- Group By Operator [GBY_211] (rows=348477374 width=88)
+ Group By Operator [GBY_353] (rows=87121617 width=135)
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4, KEY._col5, KEY._col6
- <-Reducer 15 [SIMPLE_EDGE]
- SHUFFLE [RS_39]
+ <-Reducer 20 [SIMPLE_EDGE]
+ SHUFFLE [RS_82]
PartitionCols:_col0, _col1, _col2, _col3, _col4, _col5, _col6
- Group By Operator [GBY_38] (rows=696954748 width=88)
+ Group By Operator [GBY_81] (rows=174243235 width=135)
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"],aggregations:["sum(_col7)"],keys:_col0, _col1, _col2, _col3, _col4, _col5, _col6
- Select Operator [SEL_36] (rows=696954748 width=88)
+ Select Operator [SEL_79] (rows=174243235 width=135)
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"]
- Merge Join Operator [MERGEJOIN_170] (rows=696954748 width=88)
- Conds:RS_33._col1=RS_194._col0(Inner),Output:["_col2","_col3","_col7","_col8","_col9","_col10","_col11","_col12","_col13"]
- <-Map 18 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_194]
+ Merge Join Operator [MERGEJOIN_282] (rows=174243235 width=135)
+ Conds:RS_76._col1=RS_318._col0(Inner),Output:["_col2","_col3","_col7","_col8","_col9","_col10","_col11","_col12","_col13"]
+ <-Map 23 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_318]
PartitionCols:_col0
- Please refer to the previous Select Operator [SEL_191]
- <-Reducer 14 [SIMPLE_EDGE]
- SHUFFLE [RS_33]
+ Please refer to the previous Select Operator [SEL_312]
+ <-Reducer 19 [SIMPLE_EDGE]
+ SHUFFLE [RS_76]
PartitionCols:_col1
- Merge Join Operator [MERGEJOIN_169] (rows=633595212 width=88)
- Conds:RS_207._col0=RS_188._col0(Inner),Output:["_col1","_col2","_col3"]
- <-Map 17 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_188]
+ Merge Join Operator [MERGEJOIN_281] (rows=158402938 width=135)
+ Conds:RS_352._col0=RS_296._col0(Inner),Output:["_col1","_col2","_col3"]
+ <-Map 15 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_296]
PartitionCols:_col0
- Select Operator [SEL_184] (rows=36524 width=1119)
+ Select Operator [SEL_289] (rows=36524 width=1119)
Output:["_col0"]
- Filter Operator [FIL_181] (rows=36524 width=1119)
+ Filter Operator [FIL_286] (rows=36524 width=1119)
predicate:((d_year = 2001) and d_date_sk is not null)
Please refer to the previous TableScan [TS_46]
- <-Map 10 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_207]
+ <-Map 26 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_352]
PartitionCols:_col0
- Please refer to the previous Select Operator [SEL_205]
+ Select Operator [SEL_351] (rows=144002668 width=135)
+ Output:["_col0","_col1","_col2","_col3"]
+ Filter Operator [FIL_350] (rows=144002668 width=135)
+ predicate:((ws_sold_date_sk BETWEEN DynamicValue(RS_74_date_dim_d_date_sk_min) AND DynamicValue(RS_74_date_dim_d_date_sk_max) and in_bloom_filter(ws_sold_date_sk, DynamicValue(RS_74_date_dim_d_date_sk_bloom_filter))) and ws_bill_customer_sk is not null and ws_sold_date_sk is not null)
+ TableScan [TS_64] (rows=144002668 width=135)
+ default@web_sales,web_sales,Tbl:COMPLETE,Col:NONE,Output:["ws_sold_date_sk","ws_bill_customer_sk","ws_ext_discount_amt","ws_ext_list_price"]
+ <-Reducer 22 [BROADCAST_EDGE] vectorized
+ BROADCAST [RS_349]
+ Group By Operator [GBY_348] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
+ <-Map 15 [CUSTOM_SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_305]
+ Group By Operator [GBY_301] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
+ Select Operator [SEL_297] (rows=36524 width=1119)
+ Output:["_col0"]
+ Please refer to the previous Select Operator [SEL_289]
<-Reducer 4 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_198]
+ SHUFFLE [RS_325]
PartitionCols:_col0
- Select Operator [SEL_197] (rows=87121617 width=135)
+ Select Operator [SEL_324] (rows=87121617 width=135)
Output:["_col0","_col1"]
- Group By Operator [GBY_196] (rows=87121617 width=135)
+ Group By Operator [GBY_323] (rows=87121617 width=135)
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4, KEY._col5, KEY._col6
<-Reducer 3 [SIMPLE_EDGE]
SHUFFLE [RS_18]
@@ -285,69 +401,39 @@ Stage-0
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"],aggregations:["sum(_col7)"],keys:_col0, _col1, _col2, _col3, _col4, _col5, _col6
Select Operator [SEL_15] (rows=174243235 width=135)
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"]
- Merge Join Operator [MERGEJOIN_168] (rows=174243235 width=135)
- Conds:RS_12._col1=RS_193._col0(Inner),Output:["_col2","_col3","_col7","_col8","_col9","_col10","_col11","_col12","_col13"]
- <-Map 18 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_193]
+ Merge Join Operator [MERGEJOIN_276] (rows=174243235 width=135)
+ Conds:RS_12._col1=RS_315._col0(Inner),Output:["_col2","_col3","_col7","_col8","_col9","_col10","_col11","_col12","_col13"]
+ <-Map 23 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_315]
PartitionCols:_col0
- Please refer to the previous Select Operator [SEL_191]
+ Please refer to the previous Select Operator [SEL_312]
<-Reducer 2 [SIMPLE_EDGE]
SHUFFLE [RS_12]
PartitionCols:_col1
- Merge Join Operator [MERGEJOIN_167] (rows=158402938 width=135)
- Conds:RS_178._col0=RS_187._col0(Inner),Output:["_col1","_col2","_col3"]
- <-Map 17 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_187]
+ Merge Join Operator [MERGEJOIN_275] (rows=158402938 width=135)
+ Conds:RS_310._col0=RS_292._col0(Inner),Output:["_col1","_col2","_col3"]
+ <-Map 15 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_292]
PartitionCols:_col0
- Please refer to the previous Select Operator [SEL_183]
+ Please refer to the previous Select Operator [SEL_287]
<-Map 1 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_178]
+ SHUFFLE [RS_310]
PartitionCols:_col0
- Select Operator [SEL_177] (rows=144002668 width=135)
+ Select Operator [SEL_309] (rows=144002668 width=135)
Output:["_col0","_col1","_col2","_col3"]
- Filter Operator [FIL_176] (rows=144002668 width=135)
- predicate:(ws_bill_customer_sk is not null and ws_sold_date_sk is not null)
+ Filter Operator [FIL_308] (rows=144002668 width=135)
+ predicate:((ws_sold_date_sk BETWEEN DynamicValue(RS_10_date_dim_d_date_sk_min) AND DynamicValue(RS_10_date_dim_d_date_sk_max) and in_bloom_filter(ws_sold_date_sk, DynamicValue(RS_10_date_dim_d_date_sk_bloom_filter))) and ws_bill_customer_sk is not null and ws_sold_date_sk is not null)
TableScan [TS_0] (rows=144002668 width=135)
default@web_sales,web_sales,Tbl:COMPLETE,Col:NONE,Output:["ws_sold_date_sk","ws_bill_customer_sk","ws_ext_discount_amt","ws_ext_list_price"]
- <-Reducer 9 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_203]
- PartitionCols:_col0
- Select Operator [SEL_202] (rows=29040539 width=135)
- Output:["_col0","_col1"]
- Filter Operator [FIL_201] (rows=29040539 width=135)
- predicate:(_col7 > 0)
- Select Operator [SEL_200] (rows=87121617 width=135)
- Output:["_col0","_col7"]
- Group By Operator [GBY_199] (rows=87121617 width=135)
- Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4, KEY._col5, KEY._col6
- <-Reducer 8 [SIMPLE_EDGE]
- SHUFFLE [RS_82]
- PartitionCols:_col0, _col1, _col2, _col3, _col4, _col5, _col6
- Group By Operator [GBY_81] (rows=174243235 width=135)
- Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"],aggregations:["sum(_col7)"],keys:_col0, _col1, _col2, _col3, _col4, _col5, _col6
- Select Operator [SEL_79] (rows=174243235 width=135)
- Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"]
- Merge Join Operator [MERGEJOIN_174] (rows=174243235 width=135)
- Conds:RS_76._col1=RS_195._col0(Inner),Output:["_col2","_col3","_col7","_col8","_col9","_col10","_col11","_col12","_col13"]
- <-Map 18 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_195]
- PartitionCols:_col0
- Please refer to the previous Select Operator [SEL_191]
- <-Reducer 7 [SIMPLE_EDGE]
- SHUFFLE [RS_76]
- PartitionCols:_col1
- Merge Join Operator [MERGEJOIN_173] (rows=158402938 width=135)
- Conds:RS_179._col0=RS_189._col0(Inner),Output:["_col1","_col2","_col3"]
- <-Map 17 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_189]
- PartitionCols:_col0
- Select Operator [SEL_185] (rows=36524 width=1119)
- Output:["_col0"]
- Filter Operator [FIL_182] (rows=36524 width=1119)
- predicate:((d_year = 2001) and d_date_sk is not null)
- Please refer to the previous TableScan [TS_46]
- <-Map 1 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_179]
- PartitionCols:_col0
- Please refer to the previous Select Operator [SEL_177]
+ <-Reducer 17 [BROADCAST_EDGE] vectorized
+ BROADCAST [RS_307]
+ Group By Operator [GBY_306] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
+ <-Map 15 [CUSTOM_SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_303]
+ Group By Operator [GBY_299] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
+ Select Operator [SEL_293] (rows=36524 width=1119)
+ Output:["_col0"]
+ Please refer to the previous Select Operator [SEL_287]