You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@hive.apache.org by ha...@apache.org on 2018/08/06 05:47:49 UTC
[4/9] hive git commit: HIVE-19097 : related equals and in operators
may cause inaccurate stats estimations (Zoltan Haindrich via Ashutosh
Chauhan)
http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query13.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query13.q.out b/ql/src/test/results/clientpositive/perf/tez/query13.q.out
index 5cd4e27..6274d2a 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query13.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query13.q.out
@@ -101,18 +101,18 @@ POSTHOOK: type: QUERY
Plan optimized by CBO.
Vertex dependency in root stage
-Map 9 <- Reducer 11 (BROADCAST_EDGE), Reducer 13 (BROADCAST_EDGE), Reducer 15 (BROADCAST_EDGE), Reducer 17 (BROADCAST_EDGE), Reducer 8 (BROADCAST_EDGE)
+Map 1 <- Reducer 11 (BROADCAST_EDGE), Reducer 13 (BROADCAST_EDGE), Reducer 15 (BROADCAST_EDGE), Reducer 17 (BROADCAST_EDGE), Reducer 9 (BROADCAST_EDGE)
Reducer 11 <- Map 10 (CUSTOM_SIMPLE_EDGE)
Reducer 13 <- Map 12 (CUSTOM_SIMPLE_EDGE)
Reducer 15 <- Map 14 (CUSTOM_SIMPLE_EDGE)
Reducer 17 <- Map 16 (CUSTOM_SIMPLE_EDGE)
-Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 9 (SIMPLE_EDGE)
+Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 8 (SIMPLE_EDGE)
Reducer 3 <- Map 10 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE)
Reducer 4 <- Map 12 (SIMPLE_EDGE), Reducer 3 (SIMPLE_EDGE)
Reducer 5 <- Map 14 (SIMPLE_EDGE), Reducer 4 (SIMPLE_EDGE)
Reducer 6 <- Map 16 (SIMPLE_EDGE), Reducer 5 (SIMPLE_EDGE)
Reducer 7 <- Reducer 6 (CUSTOM_SIMPLE_EDGE)
-Reducer 8 <- Map 1 (CUSTOM_SIMPLE_EDGE)
+Reducer 9 <- Map 8 (CUSTOM_SIMPLE_EDGE)
Stage-0
Fetch Operator
@@ -127,142 +127,140 @@ Stage-0
<-Reducer 6 [CUSTOM_SIMPLE_EDGE]
PARTITION_ONLY_SHUFFLE [RS_37]
Group By Operator [GBY_36] (rows=1 width=256)
- Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["sum(_col6)","count(_col6)","sum(_col8)","count(_col8)","sum(_col9)","count(_col9)"]
- Select Operator [SEL_35] (rows=715776 width=88)
- Output:["_col6","_col8","_col9"]
- Filter Operator [FIL_34] (rows=715776 width=88)
- predicate:(((_col19 = 'D') and (_col20 = 'Primary') and _col7 BETWEEN 50 AND 100 and (_col14 = 1)) or ((_col19 = 'M') and (_col20 = '4 yr Degree') and _col7 BETWEEN 100 AND 150 and (_col14 = 3)) or ((_col19 = 'U') and (_col20 = 'Advanced Degree') and _col7 BETWEEN 150 AND 200 and (_col14 = 1)))
- Merge Join Operator [MERGEJOIN_121] (rows=17178642 width=88)
- Conds:RS_31._col2=RS_156._col0(Inner),Output:["_col6","_col7","_col8","_col9","_col14","_col19","_col20"]
- <-Map 16 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_156]
- PartitionCols:_col0
- Select Operator [SEL_155] (rows=1861800 width=385)
- Output:["_col0","_col1","_col2"]
- Filter Operator [FIL_154] (rows=1861800 width=385)
- predicate:(((cd_education_status = '4 yr Degree') or (cd_education_status = 'Primary') or (cd_education_status = 'Advanced Degree')) and ((cd_marital_status = 'M') or (cd_marital_status = 'D') or (cd_marital_status = 'U')) and cd_demo_sk is not null)
- TableScan [TS_15] (rows=1861800 width=385)
- default@customer_demographics,customer_demographics,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_marital_status","cd_education_status"]
- <-Reducer 5 [SIMPLE_EDGE]
- SHUFFLE [RS_31]
- PartitionCols:_col2
- Filter Operator [FIL_30] (rows=15616947 width=88)
- predicate:(((_col16) IN ('KY', 'GA', 'NM') and _col10 BETWEEN 100 AND 200) or ((_col16) IN ('MT', 'OR', 'IN') and _col10 BETWEEN 150 AND 300) or ((_col16) IN ('WI', 'MO', 'WV') and _col10 BETWEEN 50 AND 250))
- Merge Join Operator [MERGEJOIN_120] (rows=93701693 width=88)
- Conds:RS_27._col4=RS_148._col0(Inner),Output:["_col2","_col6","_col7","_col8","_col9","_col10","_col14","_col16"]
- <-Map 14 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_148]
- PartitionCols:_col0
- Select Operator [SEL_147] (rows=10000000 width=1014)
- Output:["_col0","_col1"]
- Filter Operator [FIL_146] (rows=10000000 width=1014)
- predicate:((ca_country = 'United States') and (ca_state) IN ('KY', 'GA', 'NM', 'MT', 'OR', 'IN', 'WI', 'MO', 'WV') and ca_address_sk is not null)
- TableScan [TS_12] (rows=40000000 width=1014)
- default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_state","ca_country"]
- <-Reducer 4 [SIMPLE_EDGE]
- SHUFFLE [RS_27]
- PartitionCols:_col4
- Merge Join Operator [MERGEJOIN_119] (rows=85183356 width=88)
- Conds:RS_24._col3=RS_140._col0(Inner),Output:["_col2","_col4","_col6","_col7","_col8","_col9","_col10","_col14"]
- <-Map 12 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_140]
- PartitionCols:_col0
- Select Operator [SEL_139] (rows=7200 width=107)
- Output:["_col0","_col1"]
- Filter Operator [FIL_138] (rows=7200 width=107)
- predicate:(((hd_dep_count = 3) or (hd_dep_count = 1)) and hd_demo_sk is not null)
- TableScan [TS_9] (rows=7200 width=107)
- default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_dep_count"]
- <-Reducer 3 [SIMPLE_EDGE]
- SHUFFLE [RS_24]
- PartitionCols:_col3
- Merge Join Operator [MERGEJOIN_118] (rows=77439413 width=88)
- Conds:RS_21._col1=RS_132._col0(Inner),Output:["_col2","_col3","_col4","_col6","_col7","_col8","_col9","_col10"]
- <-Map 10 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_132]
- PartitionCols:_col0
- Select Operator [SEL_131] (rows=36524 width=1119)
- Output:["_col0"]
- Filter Operator [FIL_130] (rows=36524 width=1119)
- predicate:((d_year = 2001) and d_date_sk is not null)
- TableScan [TS_6] (rows=73049 width=1119)
- default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"]
- <-Reducer 2 [SIMPLE_EDGE]
- SHUFFLE [RS_21]
- PartitionCols:_col1
- Merge Join Operator [MERGEJOIN_117] (rows=70399465 width=88)
- Conds:RS_124._col0=RS_164._col4(Inner),Output:["_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col9","_col10"]
- <-Map 1 [SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_124]
- PartitionCols:_col0
- Select Operator [SEL_123] (rows=1704 width=1910)
- Output:["_col0"]
- Filter Operator [FIL_122] (rows=1704 width=1910)
- predicate:s_store_sk is not null
- TableScan [TS_0] (rows=1704 width=1910)
- default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk"]
- <-Map 9 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_164]
- PartitionCols:_col4
- Select Operator [SEL_163] (rows=63999513 width=88)
- Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"]
- Filter Operator [FIL_162] (rows=63999513 width=88)
- predicate:((ss_addr_sk BETWEEN DynamicValue(RS_28_customer_address_ca_address_sk_min) AND DynamicValue(RS_28_customer_address_ca_address_sk_max) and in_bloom_filter(ss_addr_sk, DynamicValue(RS_28_customer_address_ca_address_sk_bloom_filter))) and (ss_cdemo_sk BETWEEN DynamicValue(RS_32_customer_demographics_cd_demo_sk_min) AND DynamicValue(RS_32_customer_demographics_cd_demo_sk_max) and in_bloom_filter(ss_cdemo_sk, DynamicValue(RS_32_customer_demographics_cd_demo_sk_bloom_filter))) and (ss_hdemo_sk BETWEEN DynamicValue(RS_25_household_demographics_hd_demo_sk_min) AND DynamicValue(RS_25_household_demographics_hd_demo_sk_max) and in_bloom_filter(ss_hdemo_sk, DynamicValue(RS_25_household_demographics_hd_demo_sk_bloom_filter))) and (ss_net_profit BETWEEN 100 AND 200 or ss_net_profit BETWEEN 150 AND 300 or ss_net_profit BETWEEN 50 AND 250) and (ss_sales_price BETWEEN 100 AND 150 or ss_sales_price BETWEEN 50 AND 100 or ss_sales_price BETWEEN 150 AND 200) and (ss_sold_date_sk BETWEEN DynamicValue(RS_22_date_dim_d_date_sk_min) AND DynamicValue(RS_22_date_dim_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk, DynamicValue(RS_22_date_dim_d_date_sk_bloom_filter))) and (ss_store_sk BETWEEN DynamicValue(RS_18_store_s_store_sk_min) AND DynamicValue(RS_18_store_s_store_sk_max) and in_bloom_filter(ss_store_sk, DynamicValue(RS_18_store_s_store_sk_bloom_filter))) and ss_addr_sk is not null and ss_cdemo_sk is not null and ss_hdemo_sk is not null and ss_sold_date_sk is not null and ss_store_sk is not null)
- TableScan [TS_3] (rows=575995635 width=88)
- default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_cdemo_sk","ss_hdemo_sk","ss_addr_sk","ss_store_sk","ss_quantity","ss_sales_price","ss_ext_sales_price","ss_ext_wholesale_cost","ss_net_profit"]
- <-Reducer 11 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_137]
- Group By Operator [GBY_136] (rows=1 width=12)
- Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
- <-Map 10 [CUSTOM_SIMPLE_EDGE] vectorized
- SHUFFLE [RS_135]
- Group By Operator [GBY_134] (rows=1 width=12)
- Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_133] (rows=36524 width=1119)
- Output:["_col0"]
- Please refer to the previous Select Operator [SEL_131]
- <-Reducer 13 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_145]
- Group By Operator [GBY_144] (rows=1 width=12)
- Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
- <-Map 12 [CUSTOM_SIMPLE_EDGE] vectorized
- SHUFFLE [RS_143]
- Group By Operator [GBY_142] (rows=1 width=12)
- Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_141] (rows=7200 width=107)
- Output:["_col0"]
- Please refer to the previous Select Operator [SEL_139]
- <-Reducer 15 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_153]
- Group By Operator [GBY_152] (rows=1 width=12)
- Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=10000000)"]
- <-Map 14 [CUSTOM_SIMPLE_EDGE] vectorized
- SHUFFLE [RS_151]
- Group By Operator [GBY_150] (rows=1 width=12)
- Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=10000000)"]
- Select Operator [SEL_149] (rows=10000000 width=1014)
- Output:["_col0"]
- Please refer to the previous Select Operator [SEL_147]
- <-Reducer 17 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_161]
- Group By Operator [GBY_160] (rows=1 width=12)
- Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1861800)"]
- <-Map 16 [CUSTOM_SIMPLE_EDGE] vectorized
- SHUFFLE [RS_159]
- Group By Operator [GBY_158] (rows=1 width=12)
- Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1861800)"]
- Select Operator [SEL_157] (rows=1861800 width=385)
- Output:["_col0"]
- Please refer to the previous Select Operator [SEL_155]
- <-Reducer 8 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_129]
- Group By Operator [GBY_128] (rows=1 width=12)
- Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
- <-Map 1 [CUSTOM_SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_127]
- Group By Operator [GBY_126] (rows=1 width=12)
- Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_125] (rows=1704 width=1910)
- Output:["_col0"]
- Please refer to the previous Select Operator [SEL_123]
+ Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["sum(_col5)","count(_col5)","sum(_col7)","count(_col7)","sum(_col8)","count(_col8)"]
+ Merge Join Operator [MERGEJOIN_121] (rows=8066665 width=1014)
+ Conds:RS_32._col4=RS_156._col0(Inner),Output:["_col5","_col7","_col8"]
+ <-Map 16 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_156]
+ PartitionCols:_col0
+ Select Operator [SEL_155] (rows=1704 width=1910)
+ Output:["_col0"]
+ Filter Operator [FIL_154] (rows=1704 width=1910)
+ predicate:s_store_sk is not null
+ TableScan [TS_15] (rows=1704 width=1910)
+ default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk"]
+ <-Reducer 5 [SIMPLE_EDGE]
+ SHUFFLE [RS_32]
+ PartitionCols:_col4
+ Filter Operator [FIL_31] (rows=7333332 width=1014)
+ predicate:((((_col18 = 'KY') or (_col18 = 'GA') or (_col18 = 'NM')) and _col9 BETWEEN 100 AND 200) or (((_col18 = 'MT') or (_col18 = 'OR') or (_col18 = 'IN')) and _col9 BETWEEN 150 AND 300) or (((_col18 = 'WI') or (_col18 = 'MO') or (_col18 = 'WV')) and _col9 BETWEEN 50 AND 250))
+ Merge Join Operator [MERGEJOIN_120] (rows=22000000 width=1014)
+ Conds:RS_28._col3=RS_148._col0(Inner),Output:["_col4","_col5","_col7","_col8","_col9","_col18"]
+ <-Map 14 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_148]
+ PartitionCols:_col0
+ Select Operator [SEL_147] (rows=20000000 width=1014)
+ Output:["_col0","_col1"]
+ Filter Operator [FIL_146] (rows=20000000 width=1014)
+ predicate:((ca_country = 'United States') and ca_address_sk is not null)
+ TableScan [TS_12] (rows=40000000 width=1014)
+ default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_state","ca_country"]
+ <-Reducer 4 [SIMPLE_EDGE]
+ SHUFFLE [RS_28]
+ PartitionCols:_col3
+ Filter Operator [FIL_27] (rows=10647918 width=88)
+ predicate:(((_col13 = 'D') and (_col14 = 'Primary') and _col6 BETWEEN 50 AND 100 and (_col16 = 1)) or ((_col13 = 'M') and (_col14 = '4 yr Degree') and _col6 BETWEEN 100 AND 150 and (_col16 = 3)) or ((_col13 = 'U') and (_col14 = 'Advanced Degree') and _col6 BETWEEN 150 AND 200 and (_col16 = 1)))
+ Merge Join Operator [MERGEJOIN_119] (rows=255550079 width=88)
+ Conds:RS_24._col2=RS_140._col0(Inner),Output:["_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col13","_col14","_col16"]
+ <-Map 12 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_140]
+ PartitionCols:_col0
+ Select Operator [SEL_139] (rows=7200 width=107)
+ Output:["_col0","_col1"]
+ Filter Operator [FIL_138] (rows=7200 width=107)
+ predicate:((hd_dep_count) IN (3, 1) and hd_demo_sk is not null)
+ TableScan [TS_9] (rows=7200 width=107)
+ default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_dep_count"]
+ <-Reducer 3 [SIMPLE_EDGE]
+ SHUFFLE [RS_24]
+ PartitionCols:_col2
+ Merge Join Operator [MERGEJOIN_118] (rows=232318249 width=88)
+ Conds:RS_21._col1=RS_132._col0(Inner),Output:["_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col13","_col14"]
+ <-Map 10 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_132]
+ PartitionCols:_col0
+ Select Operator [SEL_131] (rows=1861800 width=385)
+ Output:["_col0","_col1","_col2"]
+ Filter Operator [FIL_130] (rows=1861800 width=385)
+ predicate:((cd_education_status) IN ('4 yr Degree', 'Primary', 'Advanced Degree') and (cd_marital_status) IN ('M', 'D', 'U') and cd_demo_sk is not null)
+ TableScan [TS_6] (rows=1861800 width=385)
+ default@customer_demographics,customer_demographics,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_marital_status","cd_education_status"]
+ <-Reducer 2 [SIMPLE_EDGE]
+ SHUFFLE [RS_21]
+ PartitionCols:_col1
+ Merge Join Operator [MERGEJOIN_117] (rows=211198404 width=88)
+ Conds:RS_164._col0=RS_124._col0(Inner),Output:["_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"]
+ <-Map 8 [SIMPLE_EDGE] vectorized
+ PARTITION_ONLY_SHUFFLE [RS_124]
+ PartitionCols:_col0
+ Select Operator [SEL_123] (rows=36524 width=1119)
+ Output:["_col0"]
+ Filter Operator [FIL_122] (rows=36524 width=1119)
+ predicate:((d_year = 2001) and d_date_sk is not null)
+ TableScan [TS_3] (rows=73049 width=1119)
+ default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"]
+ <-Map 1 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_164]
+ PartitionCols:_col0
+ Select Operator [SEL_163] (rows=191998545 width=88)
+ Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"]
+ Filter Operator [FIL_162] (rows=191998545 width=88)
+ predicate:((ss_addr_sk BETWEEN DynamicValue(RS_29_customer_address_ca_address_sk_min) AND DynamicValue(RS_29_customer_address_ca_address_sk_max) and in_bloom_filter(ss_addr_sk, DynamicValue(RS_29_customer_address_ca_address_sk_bloom_filter))) and (ss_cdemo_sk BETWEEN DynamicValue(RS_22_customer_demographics_cd_demo_sk_min) AND DynamicValue(RS_22_customer_demographics_cd_demo_sk_max) and in_bloom_filter(ss_cdemo_sk, DynamicValue(RS_22_customer_demographics_cd_demo_sk_bloom_filter))) and (ss_hdemo_sk BETWEEN DynamicValue(RS_25_household_demographics_hd_demo_sk_min) AND DynamicValue(RS_25_household_demographics_hd_demo_sk_max) and in_bloom_filter(ss_hdemo_sk, DynamicValue(RS_25_household_demographics_hd_demo_sk_bloom_filter))) and (ss_sales_price BETWEEN 100 AND 150 or ss_sales_price BETWEEN 50 AND 100 or ss_sales_price BETWEEN 150 AND 200) and (ss_sold_date_sk BETWEEN DynamicValue(RS_19_date_dim_d_date_sk_min) AND DynamicValue(RS_19_date_dim_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk, DynamicValue(RS_19_date_dim_d_date_sk_bloom_filter))) and (ss_store_sk BETWEEN DynamicValue(RS_33_store_s_store_sk_min) AND DynamicValue(RS_33_store_s_store_sk_max) and in_bloom_filter(ss_store_sk, DynamicValue(RS_33_store_s_store_sk_bloom_filter))) and ss_addr_sk is not null and ss_cdemo_sk is not null and ss_hdemo_sk is not null and ss_sold_date_sk is not null and ss_store_sk is not null)
+ TableScan [TS_0] (rows=575995635 width=88)
+ default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_cdemo_sk","ss_hdemo_sk","ss_addr_sk","ss_store_sk","ss_quantity","ss_sales_price","ss_ext_sales_price","ss_ext_wholesale_cost","ss_net_profit"]
+ <-Reducer 11 [BROADCAST_EDGE] vectorized
+ BROADCAST [RS_137]
+ Group By Operator [GBY_136] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1861800)"]
+ <-Map 10 [CUSTOM_SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_135]
+ Group By Operator [GBY_134] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1861800)"]
+ Select Operator [SEL_133] (rows=1861800 width=385)
+ Output:["_col0"]
+ Please refer to the previous Select Operator [SEL_131]
+ <-Reducer 13 [BROADCAST_EDGE] vectorized
+ BROADCAST [RS_145]
+ Group By Operator [GBY_144] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
+ <-Map 12 [CUSTOM_SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_143]
+ Group By Operator [GBY_142] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
+ Select Operator [SEL_141] (rows=7200 width=107)
+ Output:["_col0"]
+ Please refer to the previous Select Operator [SEL_139]
+ <-Reducer 15 [BROADCAST_EDGE] vectorized
+ BROADCAST [RS_153]
+ Group By Operator [GBY_152] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=20000000)"]
+ <-Map 14 [CUSTOM_SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_151]
+ Group By Operator [GBY_150] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=20000000)"]
+ Select Operator [SEL_149] (rows=20000000 width=1014)
+ Output:["_col0"]
+ Please refer to the previous Select Operator [SEL_147]
+ <-Reducer 17 [BROADCAST_EDGE] vectorized
+ BROADCAST [RS_161]
+ Group By Operator [GBY_160] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
+ <-Map 16 [CUSTOM_SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_159]
+ Group By Operator [GBY_158] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
+ Select Operator [SEL_157] (rows=1704 width=1910)
+ Output:["_col0"]
+ Please refer to the previous Select Operator [SEL_155]
+ <-Reducer 9 [BROADCAST_EDGE] vectorized
+ BROADCAST [RS_129]
+ Group By Operator [GBY_128] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
+ <-Map 8 [CUSTOM_SIMPLE_EDGE] vectorized
+ PARTITION_ONLY_SHUFFLE [RS_127]
+ Group By Operator [GBY_126] (rows=1 width=12)
+ Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
+ Select Operator [SEL_125] (rows=36524 width=1119)
+ Output:["_col0"]
+ Please refer to the previous Select Operator [SEL_123]
http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query15.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query15.q.out b/ql/src/test/results/clientpositive/perf/tez/query15.q.out
index 3c7ae66..e1eca99 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query15.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query15.q.out
@@ -71,7 +71,7 @@ Stage-0
Select Operator [SEL_23] (rows=348467716 width=135)
Output:["_col4","_col7"]
Filter Operator [FIL_22] (rows=348467716 width=135)
- predicate:((_col3) IN ('CA', 'WA', 'GA') or (_col7 > 500) or (substr(_col4, 1, 5)) IN ('85669', '86197', '88274', '83405', '86475', '85392', '85460', '80348', '81792'))
+ predicate:((_col3 = 'CA') or (_col3 = 'GA') or (_col3 = 'WA') or (_col7 > 500) or (substr(_col4, 1, 5)) IN ('85669', '86197', '88274', '83405', '86475', '85392', '85460', '80348', '81792'))
Merge Join Operator [MERGEJOIN_77] (rows=348467716 width=135)
Conds:RS_19._col0=RS_20._col1(Inner),Output:["_col3","_col4","_col7"]
<-Reducer 2 [SIMPLE_EDGE]
http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query16.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query16.q.out b/ql/src/test/results/clientpositive/perf/tez/query16.q.out
index 5652f3b..cbbd1fa 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query16.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query16.q.out
@@ -150,9 +150,9 @@ Stage-0
<-Map 14 [SIMPLE_EDGE] vectorized
SHUFFLE [RS_149]
PartitionCols:_col0
- Select Operator [SEL_148] (rows=30 width=2045)
+ Select Operator [SEL_148] (rows=60 width=2045)
Output:["_col0"]
- Filter Operator [FIL_147] (rows=30 width=2045)
+ Filter Operator [FIL_147] (rows=60 width=2045)
predicate:((cc_county) IN ('Ziebach County', 'Levy County', 'Huron County', 'Franklin Parish', 'Daviess County') and cc_call_center_sk is not null)
TableScan [TS_9] (rows=60 width=2045)
default@call_center,call_center,Tbl:COMPLETE,Col:NONE,Output:["cc_call_center_sk","cc_county"]
@@ -223,7 +223,7 @@ Stage-0
SHUFFLE [RS_152]
Group By Operator [GBY_151] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_150] (rows=30 width=2045)
+ Select Operator [SEL_150] (rows=60 width=2045)
Output:["_col0"]
Please refer to the previous Select Operator [SEL_148]
http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query17.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query17.q.out b/ql/src/test/results/clientpositive/perf/tez/query17.q.out
index e185775..6b35492 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query17.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query17.q.out
@@ -161,9 +161,9 @@ Stage-0
<-Map 8 [SIMPLE_EDGE] vectorized
PARTITION_ONLY_SHUFFLE [RS_224]
PartitionCols:_col0
- Select Operator [SEL_219] (rows=36525 width=1119)
+ Select Operator [SEL_219] (rows=73049 width=1119)
Output:["_col0"]
- Filter Operator [FIL_216] (rows=36525 width=1119)
+ Filter Operator [FIL_216] (rows=73049 width=1119)
predicate:((d_quarter_name) IN ('2000Q1', '2000Q2', '2000Q3') and d_date_sk is not null)
TableScan [TS_3] (rows=73049 width=1119)
default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_quarter_name"]
@@ -184,9 +184,9 @@ Stage-0
<-Map 8 [SIMPLE_EDGE] vectorized
PARTITION_ONLY_SHUFFLE [RS_222]
PartitionCols:_col0
- Select Operator [SEL_218] (rows=36525 width=1119)
+ Select Operator [SEL_218] (rows=73049 width=1119)
Output:["_col0"]
- Filter Operator [FIL_215] (rows=36525 width=1119)
+ Filter Operator [FIL_215] (rows=73049 width=1119)
predicate:((d_quarter_name) IN ('2000Q1', '2000Q2', '2000Q3') and d_date_sk is not null)
Please refer to the previous TableScan [TS_3]
<-Map 18 [SIMPLE_EDGE] vectorized
@@ -244,7 +244,7 @@ Stage-0
PARTITION_ONLY_SHUFFLE [RS_228]
Group By Operator [GBY_226] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_223] (rows=36525 width=1119)
+ Select Operator [SEL_223] (rows=73049 width=1119)
Output:["_col0"]
Please refer to the previous Select Operator [SEL_218]
<-Reducer 3 [SIMPLE_EDGE]
http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query18.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query18.q.out b/ql/src/test/results/clientpositive/perf/tez/query18.q.out
index 1b9b2fb..da5d3b1 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query18.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query18.q.out
@@ -67,35 +67,34 @@ POSTHOOK: type: QUERY
Plan optimized by CBO.
Vertex dependency in root stage
-Map 10 <- Reducer 15 (BROADCAST_EDGE), Reducer 17 (BROADCAST_EDGE), Reducer 19 (BROADCAST_EDGE), Reducer 7 (BROADCAST_EDGE)
-Reducer 11 <- Map 10 (SIMPLE_EDGE), Map 14 (SIMPLE_EDGE)
-Reducer 12 <- Map 16 (SIMPLE_EDGE), Reducer 11 (SIMPLE_EDGE)
-Reducer 13 <- Map 18 (SIMPLE_EDGE), Reducer 12 (SIMPLE_EDGE)
-Reducer 15 <- Map 14 (CUSTOM_SIMPLE_EDGE)
-Reducer 17 <- Map 16 (CUSTOM_SIMPLE_EDGE)
-Reducer 19 <- Map 18 (CUSTOM_SIMPLE_EDGE)
-Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 8 (SIMPLE_EDGE)
-Reducer 3 <- Map 9 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE)
-Reducer 4 <- Reducer 13 (SIMPLE_EDGE), Reducer 3 (SIMPLE_EDGE)
+Map 9 <- Reducer 14 (BROADCAST_EDGE), Reducer 16 (BROADCAST_EDGE), Reducer 18 (BROADCAST_EDGE)
+Reducer 10 <- Map 13 (SIMPLE_EDGE), Map 9 (SIMPLE_EDGE)
+Reducer 11 <- Map 15 (SIMPLE_EDGE), Reducer 10 (SIMPLE_EDGE)
+Reducer 12 <- Map 17 (SIMPLE_EDGE), Reducer 11 (SIMPLE_EDGE)
+Reducer 14 <- Map 13 (CUSTOM_SIMPLE_EDGE)
+Reducer 16 <- Map 15 (CUSTOM_SIMPLE_EDGE)
+Reducer 18 <- Map 17 (CUSTOM_SIMPLE_EDGE)
+Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 7 (SIMPLE_EDGE)
+Reducer 3 <- Map 8 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE)
+Reducer 4 <- Reducer 12 (SIMPLE_EDGE), Reducer 3 (SIMPLE_EDGE)
Reducer 5 <- Reducer 4 (SIMPLE_EDGE)
Reducer 6 <- Reducer 5 (SIMPLE_EDGE)
-Reducer 7 <- Reducer 3 (CUSTOM_SIMPLE_EDGE)
Stage-0
Fetch Operator
limit:100
Stage-1
Reducer 6 vectorized
- File Output Operator [FS_189]
- Limit [LIM_188] (rows=100 width=135)
+ File Output Operator [FS_187]
+ Limit [LIM_186] (rows=100 width=135)
Number of rows:100
- Select Operator [SEL_187] (rows=1054114882 width=135)
+ Select Operator [SEL_185] (rows=1054114882 width=135)
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10"]
<-Reducer 5 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_186]
- Select Operator [SEL_185] (rows=1054114882 width=135)
+ SHUFFLE [RS_184]
+ Select Operator [SEL_183] (rows=1054114882 width=135)
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10"]
- Group By Operator [GBY_184] (rows=1054114882 width=135)
+ Group By Operator [GBY_182] (rows=1054114882 width=135)
Output:["_col0","_col1","_col2","_col3","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18"],aggregations:["sum(VALUE._col0)","count(VALUE._col1)","sum(VALUE._col2)","count(VALUE._col3)","sum(VALUE._col4)","count(VALUE._col5)","sum(VALUE._col6)","count(VALUE._col7)","sum(VALUE._col8)","count(VALUE._col9)","sum(VALUE._col10)","count(VALUE._col11)","sum(VALUE._col12)","count(VALUE._col13)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4
<-Reducer 4 [SIMPLE_EDGE]
SHUFFLE [RS_43]
@@ -106,51 +105,14 @@ Stage-0
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10"]
Merge Join Operator [MERGEJOIN_145] (rows=421645953 width=135)
Conds:RS_37._col0=RS_38._col3(Inner),Output:["_col4","_col6","_col7","_col8","_col11","_col16","_col17","_col18","_col19","_col20","_col26"]
- <-Reducer 3 [SIMPLE_EDGE]
- PARTITION_ONLY_SHUFFLE [RS_37]
- PartitionCols:_col0
- Merge Join Operator [MERGEJOIN_141] (rows=48400001 width=860)
- Conds:RS_34._col1=RS_154._col0(Inner),Output:["_col0","_col4","_col6","_col7","_col8"]
- <-Map 9 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_154]
- PartitionCols:_col0
- Select Operator [SEL_153] (rows=1861800 width=385)
- Output:["_col0"]
- Filter Operator [FIL_152] (rows=1861800 width=385)
- predicate:cd_demo_sk is not null
- TableScan [TS_6] (rows=1861800 width=385)
- default@customer_demographics,cd2,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk"]
- <-Reducer 2 [SIMPLE_EDGE]
- SHUFFLE [RS_34]
- PartitionCols:_col1
- Merge Join Operator [MERGEJOIN_140] (rows=44000000 width=860)
- Conds:RS_148._col2=RS_151._col0(Inner),Output:["_col0","_col1","_col4","_col6","_col7","_col8"]
- <-Map 1 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_148]
- PartitionCols:_col2
- Select Operator [SEL_147] (rows=40000000 width=860)
- Output:["_col0","_col1","_col2","_col4"]
- Filter Operator [FIL_146] (rows=40000000 width=860)
- predicate:((c_birth_month) IN (9, 5, 12, 4, 1, 10) and c_current_addr_sk is not null and c_current_cdemo_sk is not null and c_customer_sk is not null)
- TableScan [TS_0] (rows=80000000 width=860)
- default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_current_cdemo_sk","c_current_addr_sk","c_birth_month","c_birth_year"]
- <-Map 8 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_151]
- PartitionCols:_col0
- Select Operator [SEL_150] (rows=20000000 width=1014)
- Output:["_col0","_col1","_col2","_col3"]
- Filter Operator [FIL_149] (rows=20000000 width=1014)
- predicate:((ca_state) IN ('ND', 'WI', 'AL', 'NC', 'OK', 'MS', 'TN') and ca_address_sk is not null)
- TableScan [TS_3] (rows=40000000 width=1014)
- default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_county","ca_state","ca_country"]
- <-Reducer 13 [SIMPLE_EDGE]
+ <-Reducer 12 [SIMPLE_EDGE]
SHUFFLE [RS_38]
PartitionCols:_col3
Select Operator [SEL_30] (rows=383314495 width=135)
Output:["_col1","_col3","_col6","_col7","_col8","_col9","_col10","_col16"]
Merge Join Operator [MERGEJOIN_144] (rows=383314495 width=135)
Conds:RS_27._col3=RS_173._col0(Inner),Output:["_col1","_col4","_col5","_col6","_col7","_col8","_col14","_col16"]
- <-Map 18 [SIMPLE_EDGE] vectorized
+ <-Map 17 [SIMPLE_EDGE] vectorized
PARTITION_ONLY_SHUFFLE [RS_173]
PartitionCols:_col0
Select Operator [SEL_172] (rows=462000 width=1436)
@@ -159,12 +121,12 @@ Stage-0
predicate:i_item_sk is not null
TableScan [TS_18] (rows=462000 width=1436)
default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id"]
- <-Reducer 12 [SIMPLE_EDGE]
+ <-Reducer 11 [SIMPLE_EDGE]
SHUFFLE [RS_27]
PartitionCols:_col3
Merge Join Operator [MERGEJOIN_143] (rows=348467716 width=135)
Conds:RS_24._col2=RS_165._col0(Inner),Output:["_col1","_col3","_col4","_col5","_col6","_col7","_col8","_col14"]
- <-Map 16 [SIMPLE_EDGE] vectorized
+ <-Map 15 [SIMPLE_EDGE] vectorized
PARTITION_ONLY_SHUFFLE [RS_165]
PartitionCols:_col0
Select Operator [SEL_164] (rows=465450 width=385)
@@ -173,12 +135,12 @@ Stage-0
predicate:((cd_education_status = 'College') and (cd_gender = 'M') and cd_demo_sk is not null)
TableScan [TS_15] (rows=1861800 width=385)
default@customer_demographics,cd1,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_gender","cd_education_status","cd_dep_count"]
- <-Reducer 11 [SIMPLE_EDGE]
+ <-Reducer 10 [SIMPLE_EDGE]
SHUFFLE [RS_24]
PartitionCols:_col2
Merge Join Operator [MERGEJOIN_142] (rows=316788826 width=135)
- Conds:RS_183._col0=RS_157._col0(Inner),Output:["_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"]
- <-Map 14 [SIMPLE_EDGE] vectorized
+ Conds:RS_181._col0=RS_157._col0(Inner),Output:["_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"]
+ <-Map 13 [SIMPLE_EDGE] vectorized
PARTITION_ONLY_SHUFFLE [RS_157]
PartitionCols:_col0
Select Operator [SEL_156] (rows=36524 width=1119)
@@ -187,57 +149,83 @@ Stage-0
predicate:((d_year = 2001) and d_date_sk is not null)
TableScan [TS_12] (rows=73049 width=1119)
default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"]
- <-Map 10 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_183]
+ <-Map 9 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_181]
PartitionCols:_col0
- Select Operator [SEL_182] (rows=287989836 width=135)
+ Select Operator [SEL_180] (rows=287989836 width=135)
Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"]
- Filter Operator [FIL_181] (rows=287989836 width=135)
- predicate:((cs_bill_cdemo_sk BETWEEN DynamicValue(RS_25_cd1_cd_demo_sk_min) AND DynamicValue(RS_25_cd1_cd_demo_sk_max) and in_bloom_filter(cs_bill_cdemo_sk, DynamicValue(RS_25_cd1_cd_demo_sk_bloom_filter))) and (cs_bill_customer_sk BETWEEN DynamicValue(RS_37_customer_c_customer_sk_min) AND DynamicValue(RS_37_customer_c_customer_sk_max) and in_bloom_filter(cs_bill_customer_sk, DynamicValue(RS_37_customer_c_customer_sk_bloom_filter))) and (cs_item_sk BETWEEN DynamicValue(RS_28_item_i_item_sk_min) AND DynamicValue(RS_28_item_i_item_sk_max) and in_bloom_filter(cs_item_sk, DynamicValue(RS_28_item_i_item_sk_bloom_filter))) and (cs_sold_date_sk BETWEEN DynamicValue(RS_22_date_dim_d_date_sk_min) AND DynamicValue(RS_22_date_dim_d_date_sk_max) and in_bloom_filter(cs_sold_date_sk, DynamicValue(RS_22_date_dim_d_date_sk_bloom_filter))) and cs_bill_cdemo_sk is not null and cs_bill_customer_sk is not null and cs_item_sk is not null and cs_sold_date_sk
is not null)
+ Filter Operator [FIL_179] (rows=287989836 width=135)
+ predicate:((cs_bill_cdemo_sk BETWEEN DynamicValue(RS_25_cd1_cd_demo_sk_min) AND DynamicValue(RS_25_cd1_cd_demo_sk_max) and in_bloom_filter(cs_bill_cdemo_sk, DynamicValue(RS_25_cd1_cd_demo_sk_bloom_filter))) and (cs_item_sk BETWEEN DynamicValue(RS_28_item_i_item_sk_min) AND DynamicValue(RS_28_item_i_item_sk_max) and in_bloom_filter(cs_item_sk, DynamicValue(RS_28_item_i_item_sk_bloom_filter))) and (cs_sold_date_sk BETWEEN DynamicValue(RS_22_date_dim_d_date_sk_min) AND DynamicValue(RS_22_date_dim_d_date_sk_max) and in_bloom_filter(cs_sold_date_sk, DynamicValue(RS_22_date_dim_d_date_sk_bloom_filter))) and cs_bill_cdemo_sk is not null and cs_bill_customer_sk is not null and cs_item_sk is not null and cs_sold_date_sk is not null)
TableScan [TS_9] (rows=287989836 width=135)
default@catalog_sales,catalog_sales,Tbl:COMPLETE,Col:NONE,Output:["cs_sold_date_sk","cs_bill_customer_sk","cs_bill_cdemo_sk","cs_item_sk","cs_quantity","cs_list_price","cs_sales_price","cs_coupon_amt","cs_net_profit"]
- <-Reducer 15 [BROADCAST_EDGE] vectorized
+ <-Reducer 14 [BROADCAST_EDGE] vectorized
BROADCAST [RS_162]
Group By Operator [GBY_161] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
- <-Map 14 [CUSTOM_SIMPLE_EDGE] vectorized
+ <-Map 13 [CUSTOM_SIMPLE_EDGE] vectorized
PARTITION_ONLY_SHUFFLE [RS_160]
Group By Operator [GBY_159] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
Select Operator [SEL_158] (rows=36524 width=1119)
Output:["_col0"]
Please refer to the previous Select Operator [SEL_156]
- <-Reducer 17 [BROADCAST_EDGE] vectorized
+ <-Reducer 16 [BROADCAST_EDGE] vectorized
BROADCAST [RS_170]
Group By Operator [GBY_169] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
- <-Map 16 [CUSTOM_SIMPLE_EDGE] vectorized
+ <-Map 15 [CUSTOM_SIMPLE_EDGE] vectorized
PARTITION_ONLY_SHUFFLE [RS_168]
Group By Operator [GBY_167] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
Select Operator [SEL_166] (rows=465450 width=385)
Output:["_col0"]
Please refer to the previous Select Operator [SEL_164]
- <-Reducer 19 [BROADCAST_EDGE] vectorized
+ <-Reducer 18 [BROADCAST_EDGE] vectorized
BROADCAST [RS_178]
Group By Operator [GBY_177] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
- <-Map 18 [CUSTOM_SIMPLE_EDGE] vectorized
+ <-Map 17 [CUSTOM_SIMPLE_EDGE] vectorized
PARTITION_ONLY_SHUFFLE [RS_176]
Group By Operator [GBY_175] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
Select Operator [SEL_174] (rows=462000 width=1436)
Output:["_col0"]
Please refer to the previous Select Operator [SEL_172]
- <-Reducer 7 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_180]
- Group By Operator [GBY_179] (rows=1 width=12)
- Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=48400000)"]
- <-Reducer 3 [CUSTOM_SIMPLE_EDGE]
- PARTITION_ONLY_SHUFFLE [RS_126]
- Group By Operator [GBY_125] (rows=1 width=12)
- Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=48400000)"]
- Select Operator [SEL_124] (rows=48400001 width=860)
- Output:["_col0"]
- Please refer to the previous Merge Join Operator [MERGEJOIN_141]
+ <-Reducer 3 [SIMPLE_EDGE]
+ SHUFFLE [RS_37]
+ PartitionCols:_col0
+ Merge Join Operator [MERGEJOIN_141] (rows=96800003 width=860)
+ Conds:RS_34._col1=RS_154._col0(Inner),Output:["_col0","_col4","_col6","_col7","_col8"]
+ <-Map 8 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_154]
+ PartitionCols:_col0
+ Select Operator [SEL_153] (rows=1861800 width=385)
+ Output:["_col0"]
+ Filter Operator [FIL_152] (rows=1861800 width=385)
+ predicate:cd_demo_sk is not null
+ TableScan [TS_6] (rows=1861800 width=385)
+ default@customer_demographics,cd2,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk"]
+ <-Reducer 2 [SIMPLE_EDGE]
+ SHUFFLE [RS_34]
+ PartitionCols:_col1
+ Merge Join Operator [MERGEJOIN_140] (rows=88000001 width=860)
+ Conds:RS_148._col2=RS_151._col0(Inner),Output:["_col0","_col1","_col4","_col6","_col7","_col8"]
+ <-Map 1 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_148]
+ PartitionCols:_col2
+ Select Operator [SEL_147] (rows=80000000 width=860)
+ Output:["_col0","_col1","_col2","_col4"]
+ Filter Operator [FIL_146] (rows=80000000 width=860)
+ predicate:((c_birth_month) IN (9, 5, 12, 4, 1, 10) and c_current_addr_sk is not null and c_current_cdemo_sk is not null and c_customer_sk is not null)
+ TableScan [TS_0] (rows=80000000 width=860)
+ default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_current_cdemo_sk","c_current_addr_sk","c_birth_month","c_birth_year"]
+ <-Map 7 [SIMPLE_EDGE] vectorized
+ SHUFFLE [RS_151]
+ PartitionCols:_col0
+ Select Operator [SEL_150] (rows=40000000 width=1014)
+ Output:["_col0","_col1","_col2","_col3"]
+ Filter Operator [FIL_149] (rows=40000000 width=1014)
+ predicate:((ca_state) IN ('ND', 'WI', 'AL', 'NC', 'OK', 'MS', 'TN') and ca_address_sk is not null)
+ TableScan [TS_3] (rows=40000000 width=1014)
+ default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_county","ca_state","ca_country"]
http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query20.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query20.q.out b/ql/src/test/results/clientpositive/perf/tez/query20.q.out
index 7d126a8..cfa58f1 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query20.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query20.q.out
@@ -99,9 +99,9 @@ Stage-0
<-Map 9 [SIMPLE_EDGE] vectorized
SHUFFLE [RS_69]
PartitionCols:_col0
- Select Operator [SEL_68] (rows=231000 width=1436)
+ Select Operator [SEL_68] (rows=462000 width=1436)
Output:["_col0","_col1","_col2","_col3","_col4","_col5"]
- Filter Operator [FIL_67] (rows=231000 width=1436)
+ Filter Operator [FIL_67] (rows=462000 width=1436)
predicate:((i_category) IN ('Jewelry', 'Sports', 'Books') and i_item_sk is not null)
TableScan [TS_6] (rows=462000 width=1436)
default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id","i_item_desc","i_current_price","i_class","i_category"]
@@ -136,7 +136,7 @@ Stage-0
SHUFFLE [RS_72]
Group By Operator [GBY_71] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_70] (rows=231000 width=1436)
+ Select Operator [SEL_70] (rows=462000 width=1436)
Output:["_col0"]
Please refer to the previous Select Operator [SEL_68]
<-Reducer 8 [BROADCAST_EDGE] vectorized
http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query23.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query23.q.out b/ql/src/test/results/clientpositive/perf/tez/query23.q.out
index aab3f93..4d8e319 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query23.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query23.q.out
@@ -206,9 +206,9 @@ Stage-0
<-Map 18 [SIMPLE_EDGE] vectorized
PARTITION_ONLY_SHUFFLE [RS_613]
PartitionCols:_col0
- Select Operator [SEL_612] (rows=36525 width=1119)
+ Select Operator [SEL_612] (rows=73049 width=1119)
Output:["_col0","_col1"]
- Filter Operator [FIL_611] (rows=36525 width=1119)
+ Filter Operator [FIL_611] (rows=73049 width=1119)
predicate:((d_year) IN (1999, 2000, 2001, 2002) and d_date_sk is not null)
TableScan [TS_9] (rows=73049 width=1119)
default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date","d_year"]
@@ -229,7 +229,7 @@ Stage-0
PARTITION_ONLY_SHUFFLE [RS_616]
Group By Operator [GBY_615] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_614] (rows=36525 width=1119)
+ Select Operator [SEL_614] (rows=73049 width=1119)
Output:["_col0"]
Please refer to the previous Select Operator [SEL_612]
<-Reducer 21 [BROADCAST_EDGE] vectorized
@@ -367,9 +367,9 @@ Stage-0
<-Map 30 [SIMPLE_EDGE] vectorized
PARTITION_ONLY_SHUFFLE [RS_652]
PartitionCols:_col0
- Select Operator [SEL_649] (rows=36525 width=1119)
+ Select Operator [SEL_649] (rows=73049 width=1119)
Output:["_col0"]
- Filter Operator [FIL_648] (rows=36525 width=1119)
+ Filter Operator [FIL_648] (rows=73049 width=1119)
predicate:((d_year) IN (1999, 2000, 2001, 2002) and d_date_sk is not null)
TableScan [TS_36] (rows=73049 width=1119)
default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"]
@@ -390,7 +390,7 @@ Stage-0
PARTITION_ONLY_SHUFFLE [RS_657]
Group By Operator [GBY_655] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_653] (rows=36525 width=1119)
+ Select Operator [SEL_653] (rows=73049 width=1119)
Output:["_col0"]
Please refer to the previous Select Operator [SEL_649]
<-Reducer 37 [CUSTOM_SIMPLE_EDGE] vectorized
@@ -481,7 +481,7 @@ Stage-0
PARTITION_ONLY_SHUFFLE [RS_656]
Group By Operator [GBY_654] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_651] (rows=36525 width=1119)
+ Select Operator [SEL_651] (rows=73049 width=1119)
Output:["_col0"]
Please refer to the previous Select Operator [SEL_649]
<-Reducer 29 [CUSTOM_SIMPLE_EDGE] vectorized
http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query27.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query27.q.out b/ql/src/test/results/clientpositive/perf/tez/query27.q.out
index 7ea13c8..20da0af 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query27.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query27.q.out
@@ -101,9 +101,9 @@ Stage-0
<-Map 12 [SIMPLE_EDGE] vectorized
SHUFFLE [RS_119]
PartitionCols:_col0
- Select Operator [SEL_118] (rows=852 width=1910)
+ Select Operator [SEL_118] (rows=1704 width=1910)
Output:["_col0","_col1"]
- Filter Operator [FIL_117] (rows=852 width=1910)
+ Filter Operator [FIL_117] (rows=1704 width=1910)
predicate:((s_state) IN ('SD', 'FL', 'MI', 'LA', 'MO', 'SC') and s_store_sk is not null)
TableScan [TS_9] (rows=1704 width=1910)
default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_state"]
@@ -163,7 +163,7 @@ Stage-0
SHUFFLE [RS_122]
Group By Operator [GBY_121] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_120] (rows=852 width=1910)
+ Select Operator [SEL_120] (rows=1704 width=1910)
Output:["_col0"]
Please refer to the previous Select Operator [SEL_118]
<-Reducer 15 [BROADCAST_EDGE] vectorized
http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query29.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query29.q.out b/ql/src/test/results/clientpositive/perf/tez/query29.q.out
index 9bfcdfa..b051622 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query29.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query29.q.out
@@ -289,9 +289,9 @@ Stage-0
<-Map 6 [SIMPLE_EDGE] vectorized
PARTITION_ONLY_SHUFFLE [RS_208]
PartitionCols:_col0
- Select Operator [SEL_207] (rows=36525 width=1119)
+ Select Operator [SEL_207] (rows=73049 width=1119)
Output:["_col0"]
- Filter Operator [FIL_206] (rows=36525 width=1119)
+ Filter Operator [FIL_206] (rows=73049 width=1119)
predicate:((d_year) IN (1999, 2000, 2001) and d_date_sk is not null)
TableScan [TS_3] (rows=73049 width=1119)
default@date_dim,d3,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"]
@@ -312,7 +312,7 @@ Stage-0
PARTITION_ONLY_SHUFFLE [RS_211]
Group By Operator [GBY_210] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_209] (rows=36525 width=1119)
+ Select Operator [SEL_209] (rows=73049 width=1119)
Output:["_col0"]
Please refer to the previous Select Operator [SEL_207]
http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query34.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query34.q.out b/ql/src/test/results/clientpositive/perf/tez/query34.q.out
index 9b7b482..994e602 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query34.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query34.q.out
@@ -115,9 +115,9 @@ Stage-0
<-Map 14 [SIMPLE_EDGE] vectorized
SHUFFLE [RS_119]
PartitionCols:_col0
- Select Operator [SEL_118] (rows=852 width=1910)
+ Select Operator [SEL_118] (rows=1704 width=1910)
Output:["_col0"]
- Filter Operator [FIL_117] (rows=852 width=1910)
+ Filter Operator [FIL_117] (rows=1704 width=1910)
predicate:((s_county) IN ('Mobile County', 'Maverick County', 'Huron County', 'Kittitas County', 'Fairfield County', 'Jackson County', 'Barrow County', 'Pennington County') and s_store_sk is not null)
TableScan [TS_12] (rows=1704 width=1910)
default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_county"]
@@ -132,7 +132,7 @@ Stage-0
Select Operator [SEL_11] (rows=1200 width=107)
Output:["_col0"]
Filter Operator [FIL_55] (rows=1200 width=107)
- predicate:(((hd_buy_potential = '>10000') or (hd_buy_potential = 'unknown')) and (hd_vehicle_count > 0) and CASE WHEN ((hd_vehicle_count > 0)) THEN (((UDFToDouble(hd_dep_count) / UDFToDouble(hd_vehicle_count)) > 1.2D)) ELSE (null) END and hd_demo_sk is not null)
+ predicate:((hd_buy_potential) IN ('>10000', 'unknown') and (hd_vehicle_count > 0) and CASE WHEN ((hd_vehicle_count > 0)) THEN (((UDFToDouble(hd_dep_count) / UDFToDouble(hd_vehicle_count)) > 1.2D)) ELSE (null) END and hd_demo_sk is not null)
TableScan [TS_9] (rows=7200 width=107)
default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_buy_potential","hd_dep_count","hd_vehicle_count"]
<-Reducer 6 [SIMPLE_EDGE]
@@ -143,9 +143,9 @@ Stage-0
<-Map 10 [SIMPLE_EDGE] vectorized
SHUFFLE [RS_109]
PartitionCols:_col0
- Select Operator [SEL_108] (rows=8116 width=1119)
+ Select Operator [SEL_108] (rows=16232 width=1119)
Output:["_col0"]
- Filter Operator [FIL_107] (rows=8116 width=1119)
+ Filter Operator [FIL_107] (rows=16232 width=1119)
predicate:((d_dom BETWEEN 1 AND 3 or d_dom BETWEEN 25 AND 28) and (d_year) IN (2000, 2001, 2002) and d_date_sk is not null)
TableScan [TS_6] (rows=73049 width=1119)
default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_dom"]
@@ -166,7 +166,7 @@ Stage-0
SHUFFLE [RS_112]
Group By Operator [GBY_111] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_110] (rows=8116 width=1119)
+ Select Operator [SEL_110] (rows=16232 width=1119)
Output:["_col0"]
Please refer to the previous Select Operator [SEL_108]
<-Reducer 13 [BROADCAST_EDGE] vectorized
@@ -188,7 +188,7 @@ Stage-0
SHUFFLE [RS_122]
Group By Operator [GBY_121] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_120] (rows=852 width=1910)
+ Select Operator [SEL_120] (rows=1704 width=1910)
Output:["_col0"]
Please refer to the previous Select Operator [SEL_118]
<-Reducer 4 [BROADCAST_EDGE] vectorized
http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query36.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query36.q.out b/ql/src/test/results/clientpositive/perf/tez/query36.q.out
index c86c9e4..bc9a40e 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query36.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query36.q.out
@@ -121,9 +121,9 @@ Stage-0
<-Map 10 [SIMPLE_EDGE] vectorized
SHUFFLE [RS_93]
PartitionCols:_col0
- Select Operator [SEL_92] (rows=852 width=1910)
+ Select Operator [SEL_92] (rows=1704 width=1910)
Output:["_col0"]
- Filter Operator [FIL_91] (rows=852 width=1910)
+ Filter Operator [FIL_91] (rows=1704 width=1910)
predicate:((s_state) IN ('SD', 'FL', 'MI', 'LA', 'MO', 'SC', 'AL', 'GA') and s_store_sk is not null)
TableScan [TS_6] (rows=1704 width=1910)
default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_state"]
@@ -158,7 +158,7 @@ Stage-0
SHUFFLE [RS_96]
Group By Operator [GBY_95] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_94] (rows=852 width=1910)
+ Select Operator [SEL_94] (rows=1704 width=1910)
Output:["_col0"]
Please refer to the previous Select Operator [SEL_92]
<-Reducer 13 [BROADCAST_EDGE] vectorized
http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query37.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query37.q.out b/ql/src/test/results/clientpositive/perf/tez/query37.q.out
index 2b3ae52..6b5ce3e 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query37.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query37.q.out
@@ -67,9 +67,9 @@ Stage-0
<-Map 5 [SIMPLE_EDGE] vectorized
PARTITION_ONLY_SHUFFLE [RS_76]
PartitionCols:_col0
- Select Operator [SEL_75] (rows=25666 width=1436)
+ Select Operator [SEL_75] (rows=51333 width=1436)
Output:["_col0","_col1","_col2","_col3"]
- Filter Operator [FIL_74] (rows=25666 width=1436)
+ Filter Operator [FIL_74] (rows=51333 width=1436)
predicate:((i_manufact_id) IN (678, 964, 918, 849) and i_current_price BETWEEN 22 AND 52 and i_item_sk is not null)
TableScan [TS_3] (rows=462000 width=1436)
default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id","i_item_desc","i_current_price","i_manufact_id"]
@@ -113,7 +113,7 @@ Stage-0
PARTITION_ONLY_SHUFFLE [RS_79]
Group By Operator [GBY_78] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_77] (rows=25666 width=1436)
+ Select Operator [SEL_77] (rows=51333 width=1436)
Output:["_col0"]
Please refer to the previous Select Operator [SEL_75]
<-Reducer 9 [BROADCAST_EDGE] vectorized
http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query45.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query45.q.out b/ql/src/test/results/clientpositive/perf/tez/query45.q.out
index edb047d..6458811 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query45.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query45.q.out
@@ -91,9 +91,9 @@ Stage-0
SHUFFLE [RS_150]
Group By Operator [GBY_148] (rows=1 width=16)
Output:["_col0","_col1"],aggregations:["count()","count(i_item_id)"]
- Select Operator [SEL_145] (rows=231000 width=1436)
+ Select Operator [SEL_145] (rows=462000 width=1436)
Output:["i_item_id"]
- Filter Operator [FIL_142] (rows=231000 width=1436)
+ Filter Operator [FIL_142] (rows=462000 width=1436)
predicate:(i_item_sk) IN (2, 3, 5, 7, 11, 13, 17, 19, 23, 29)
TableScan [TS_6] (rows=462000 width=1436)
default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id"]
@@ -122,18 +122,18 @@ Stage-0
<-Reducer 12 [ONE_TO_ONE_EDGE] vectorized
FORWARD [RS_153]
PartitionCols:_col0
- Select Operator [SEL_152] (rows=115500 width=1436)
+ Select Operator [SEL_152] (rows=231000 width=1436)
Output:["_col0","_col1"]
- Group By Operator [GBY_151] (rows=115500 width=1436)
+ Group By Operator [GBY_151] (rows=231000 width=1436)
Output:["_col0"],keys:KEY._col0
<-Map 8 [SIMPLE_EDGE] vectorized
SHUFFLE [RS_149]
PartitionCols:_col0
- Group By Operator [GBY_147] (rows=231000 width=1436)
+ Group By Operator [GBY_147] (rows=462000 width=1436)
Output:["_col0"],keys:i_item_id
- Select Operator [SEL_144] (rows=231000 width=1436)
+ Select Operator [SEL_144] (rows=462000 width=1436)
Output:["i_item_id"]
- Filter Operator [FIL_141] (rows=231000 width=1436)
+ Filter Operator [FIL_141] (rows=462000 width=1436)
predicate:(i_item_sk) IN (2, 3, 5, 7, 11, 13, 17, 19, 23, 29)
Please refer to the previous TableScan [TS_6]
<-Reducer 15 [SIMPLE_EDGE]