You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@hive.apache.org by se...@apache.org on 2018/10/26 21:12:16 UTC
[66/75] [abbrv] hive git commit: HIVE-20788: Extended SJ reduction
may backtrack columns incorrectly when creating filters (Jesus Camacho
Rodriguez, reviewed by Deepak Jaiswal)
http://git-wip-us.apache.org/repos/asf/hive/blob/3cbc13e9/ql/src/test/results/clientpositive/perf/tez/constraints/query33.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/constraints/query33.q.out b/ql/src/test/results/clientpositive/perf/tez/constraints/query33.q.out
index c82c415..6d7c620 100644
--- a/ql/src/test/results/clientpositive/perf/tez/constraints/query33.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/constraints/query33.q.out
@@ -194,57 +194,57 @@ Stage-0
limit:100
Stage-1
Reducer 7 vectorized
- File Output Operator [FS_372]
- Limit [LIM_371] (rows=59 width=115)
+ File Output Operator [FS_368]
+ Limit [LIM_367] (rows=59 width=115)
Number of rows:100
- Select Operator [SEL_370] (rows=59 width=115)
+ Select Operator [SEL_366] (rows=59 width=115)
Output:["_col0","_col1"]
<-Reducer 6 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_369]
- Group By Operator [GBY_368] (rows=59 width=115)
+ SHUFFLE [RS_365]
+ Group By Operator [GBY_364] (rows=59 width=115)
Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0
<-Union 5 [SIMPLE_EDGE]
<-Reducer 11 [CONTAINS] vectorized
- Reduce Output Operator [RS_392]
+ Reduce Output Operator [RS_388]
PartitionCols:_col0
- Group By Operator [GBY_391] (rows=59 width=115)
+ Group By Operator [GBY_387] (rows=59 width=115)
Output:["_col0","_col1"],aggregations:["sum(_col1)"],keys:_col0
- Group By Operator [GBY_390] (rows=19 width=115)
+ Group By Operator [GBY_386] (rows=19 width=115)
Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0
<-Reducer 10 [SIMPLE_EDGE]
SHUFFLE [RS_109]
PartitionCols:_col0
Group By Operator [GBY_108] (rows=19 width=115)
Output:["_col0","_col1"],aggregations:["sum(_col7)"],keys:_col1
- Merge Join Operator [MERGEJOIN_308] (rows=11364 width=3)
+ Merge Join Operator [MERGEJOIN_304] (rows=11364 width=3)
Conds:RS_104._col0=RS_105._col2(Inner),Output:["_col1","_col7"]
<-Reducer 2 [SIMPLE_EDGE]
SHUFFLE [RS_104]
PartitionCols:_col0
- Merge Join Operator [MERGEJOIN_297] (rows=461514 width=7)
- Conds:RS_323._col1=RS_329._col0(Inner),Output:["_col0","_col1"]
+ Merge Join Operator [MERGEJOIN_293] (rows=461514 width=7)
+ Conds:RS_319._col1=RS_325._col0(Inner),Output:["_col0","_col1"]
<-Map 1 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_323]
+ SHUFFLE [RS_319]
PartitionCols:_col1
- Select Operator [SEL_322] (rows=460848 width=7)
+ Select Operator [SEL_318] (rows=460848 width=7)
Output:["_col0","_col1"]
- Filter Operator [FIL_321] (rows=460848 width=7)
+ Filter Operator [FIL_317] (rows=460848 width=7)
predicate:i_manufact_id is not null
TableScan [TS_0] (rows=462000 width=7)
default@item,item,Tbl:COMPLETE,Col:COMPLETE,Output:["i_item_sk","i_manufact_id"]
<-Reducer 13 [ONE_TO_ONE_EDGE] vectorized
- FORWARD [RS_329]
+ FORWARD [RS_325]
PartitionCols:_col0
- Group By Operator [GBY_328] (rows=692 width=3)
+ Group By Operator [GBY_324] (rows=692 width=3)
Output:["_col0"],keys:KEY._col0
<-Map 12 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_327]
+ SHUFFLE [RS_323]
PartitionCols:_col0
- Group By Operator [GBY_326] (rows=692 width=3)
+ Group By Operator [GBY_322] (rows=692 width=3)
Output:["_col0"],keys:i_manufact_id
- Select Operator [SEL_325] (rows=46085 width=93)
+ Select Operator [SEL_321] (rows=46085 width=93)
Output:["i_manufact_id"]
- Filter Operator [FIL_324] (rows=46085 width=93)
+ Filter Operator [FIL_320] (rows=46085 width=93)
predicate:((i_category = 'Books') and i_manufact_id is not null)
TableScan [TS_3] (rows=462000 width=93)
default@item,item,Tbl:COMPLETE,Col:COMPLETE,Output:["i_category","i_manufact_id"]
@@ -253,198 +253,198 @@ Stage-0
PartitionCols:_col2
Select Operator [SEL_100] (rows=788222 width=110)
Output:["_col2","_col4"]
- Merge Join Operator [MERGEJOIN_305] (rows=788222 width=110)
- Conds:RS_97._col2=RS_352._col0(Inner),Output:["_col1","_col3"]
+ Merge Join Operator [MERGEJOIN_301] (rows=788222 width=110)
+ Conds:RS_97._col2=RS_348._col0(Inner),Output:["_col1","_col3"]
<-Map 25 [SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_352]
+ PARTITION_ONLY_SHUFFLE [RS_348]
PartitionCols:_col0
- Select Operator [SEL_347] (rows=8000000 width=4)
+ Select Operator [SEL_343] (rows=8000000 width=4)
Output:["_col0"]
- Filter Operator [FIL_346] (rows=8000000 width=112)
+ Filter Operator [FIL_342] (rows=8000000 width=112)
predicate:(ca_gmt_offset = -6)
TableScan [TS_16] (rows=40000000 width=112)
default@customer_address,customer_address,Tbl:COMPLETE,Col:COMPLETE,Output:["ca_address_sk","ca_gmt_offset"]
<-Reducer 22 [SIMPLE_EDGE]
SHUFFLE [RS_97]
PartitionCols:_col2
- Merge Join Operator [MERGEJOIN_304] (rows=3941109 width=118)
- Conds:RS_389._col0=RS_336._col0(Inner),Output:["_col1","_col2","_col3"]
+ Merge Join Operator [MERGEJOIN_300] (rows=3941109 width=118)
+ Conds:RS_385._col0=RS_332._col0(Inner),Output:["_col1","_col2","_col3"]
<-Map 17 [SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_336]
+ PARTITION_ONLY_SHUFFLE [RS_332]
PartitionCols:_col0
- Select Operator [SEL_331] (rows=50 width=4)
+ Select Operator [SEL_327] (rows=50 width=4)
Output:["_col0"]
- Filter Operator [FIL_330] (rows=50 width=12)
+ Filter Operator [FIL_326] (rows=50 width=12)
predicate:((d_moy = 3) and (d_year = 1999))
TableScan [TS_13] (rows=73049 width=12)
default@date_dim,date_dim,Tbl:COMPLETE,Col:COMPLETE,Output:["d_date_sk","d_year","d_moy"]
<-Map 30 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_389]
+ SHUFFLE [RS_385]
PartitionCols:_col0
- Select Operator [SEL_388] (rows=143931246 width=123)
+ Select Operator [SEL_384] (rows=143931246 width=123)
Output:["_col0","_col1","_col2","_col3"]
- Filter Operator [FIL_387] (rows=143931246 width=123)
+ Filter Operator [FIL_383] (rows=143931246 width=123)
predicate:((ws_bill_addr_sk BETWEEN DynamicValue(RS_98_customer_address_ca_address_sk_min) AND DynamicValue(RS_98_customer_address_ca_address_sk_max) and in_bloom_filter(ws_bill_addr_sk, DynamicValue(RS_98_customer_address_ca_address_sk_bloom_filter))) and (ws_sold_date_sk BETWEEN DynamicValue(RS_95_date_dim_d_date_sk_min) AND DynamicValue(RS_95_date_dim_d_date_sk_max) and in_bloom_filter(ws_sold_date_sk, DynamicValue(RS_95_date_dim_d_date_sk_bloom_filter))) and ws_bill_addr_sk is not null and ws_sold_date_sk is not null)
TableScan [TS_85] (rows=144002668 width=123)
default@web_sales,web_sales,Tbl:COMPLETE,Col:COMPLETE,Output:["ws_sold_date_sk","ws_item_sk","ws_bill_addr_sk","ws_ext_sales_price"]
<-Reducer 24 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_384]
- Group By Operator [GBY_383] (rows=1 width=12)
+ BROADCAST [RS_380]
+ Group By Operator [GBY_379] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
<-Map 17 [CUSTOM_SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_343]
- Group By Operator [GBY_340] (rows=1 width=12)
+ PARTITION_ONLY_SHUFFLE [RS_339]
+ Group By Operator [GBY_336] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_337] (rows=50 width=4)
+ Select Operator [SEL_333] (rows=50 width=4)
Output:["_col0"]
- Please refer to the previous Select Operator [SEL_331]
+ Please refer to the previous Select Operator [SEL_327]
<-Reducer 28 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_386]
- Group By Operator [GBY_385] (rows=1 width=12)
+ BROADCAST [RS_382]
+ Group By Operator [GBY_381] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=8000000)"]
<-Map 25 [CUSTOM_SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_359]
- Group By Operator [GBY_356] (rows=1 width=12)
+ PARTITION_ONLY_SHUFFLE [RS_355]
+ Group By Operator [GBY_352] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=8000000)"]
- Select Operator [SEL_353] (rows=8000000 width=4)
+ Select Operator [SEL_349] (rows=8000000 width=4)
Output:["_col0"]
- Please refer to the previous Select Operator [SEL_347]
+ Please refer to the previous Select Operator [SEL_343]
<-Reducer 4 [CONTAINS] vectorized
- Reduce Output Operator [RS_367]
+ Reduce Output Operator [RS_363]
PartitionCols:_col0
- Group By Operator [GBY_366] (rows=59 width=115)
+ Group By Operator [GBY_362] (rows=59 width=115)
Output:["_col0","_col1"],aggregations:["sum(_col1)"],keys:_col0
- Group By Operator [GBY_365] (rows=64 width=115)
+ Group By Operator [GBY_361] (rows=64 width=115)
Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0
<-Reducer 3 [SIMPLE_EDGE]
SHUFFLE [RS_34]
PartitionCols:_col0
Group By Operator [GBY_33] (rows=64 width=115)
Output:["_col0","_col1"],aggregations:["sum(_col7)"],keys:_col1
- Merge Join Operator [MERGEJOIN_306] (rows=41476 width=3)
+ Merge Join Operator [MERGEJOIN_302] (rows=41476 width=3)
Conds:RS_29._col0=RS_30._col2(Inner),Output:["_col1","_col7"]
<-Reducer 2 [SIMPLE_EDGE]
SHUFFLE [RS_29]
PartitionCols:_col0
- Please refer to the previous Merge Join Operator [MERGEJOIN_297]
+ Please refer to the previous Merge Join Operator [MERGEJOIN_293]
<-Reducer 16 [SIMPLE_EDGE]
SHUFFLE [RS_30]
PartitionCols:_col2
Select Operator [SEL_25] (rows=2876890 width=4)
Output:["_col2","_col4"]
- Merge Join Operator [MERGEJOIN_299] (rows=2876890 width=4)
- Conds:RS_22._col2=RS_348._col0(Inner),Output:["_col1","_col3"]
+ Merge Join Operator [MERGEJOIN_295] (rows=2876890 width=4)
+ Conds:RS_22._col2=RS_344._col0(Inner),Output:["_col1","_col3"]
<-Map 25 [SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_348]
+ PARTITION_ONLY_SHUFFLE [RS_344]
PartitionCols:_col0
- Please refer to the previous Select Operator [SEL_347]
+ Please refer to the previous Select Operator [SEL_343]
<-Reducer 15 [SIMPLE_EDGE]
SHUFFLE [RS_22]
PartitionCols:_col2
- Merge Join Operator [MERGEJOIN_298] (rows=14384447 width=4)
- Conds:RS_364._col0=RS_332._col0(Inner),Output:["_col1","_col2","_col3"]
+ Merge Join Operator [MERGEJOIN_294] (rows=14384447 width=4)
+ Conds:RS_360._col0=RS_328._col0(Inner),Output:["_col1","_col2","_col3"]
<-Map 17 [SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_332]
+ PARTITION_ONLY_SHUFFLE [RS_328]
PartitionCols:_col0
- Please refer to the previous Select Operator [SEL_331]
+ Please refer to the previous Select Operator [SEL_327]
<-Map 14 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_364]
+ SHUFFLE [RS_360]
PartitionCols:_col0
- Select Operator [SEL_363] (rows=525327191 width=118)
+ Select Operator [SEL_359] (rows=525327191 width=118)
Output:["_col0","_col1","_col2","_col3"]
- Filter Operator [FIL_362] (rows=525327191 width=118)
+ Filter Operator [FIL_358] (rows=525327191 width=118)
predicate:((ss_addr_sk BETWEEN DynamicValue(RS_23_customer_address_ca_address_sk_min) AND DynamicValue(RS_23_customer_address_ca_address_sk_max) and in_bloom_filter(ss_addr_sk, DynamicValue(RS_23_customer_address_ca_address_sk_bloom_filter))) and (ss_sold_date_sk BETWEEN DynamicValue(RS_20_date_dim_d_date_sk_min) AND DynamicValue(RS_20_date_dim_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk, DynamicValue(RS_20_date_dim_d_date_sk_bloom_filter))) and ss_addr_sk is not null and ss_sold_date_sk is not null)
TableScan [TS_10] (rows=575995635 width=118)
default@store_sales,store_sales,Tbl:COMPLETE,Col:COMPLETE,Output:["ss_sold_date_sk","ss_item_sk","ss_addr_sk","ss_ext_sales_price"]
<-Reducer 18 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_345]
- Group By Operator [GBY_344] (rows=1 width=12)
+ BROADCAST [RS_341]
+ Group By Operator [GBY_340] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
<-Map 17 [CUSTOM_SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_341]
- Group By Operator [GBY_338] (rows=1 width=12)
+ PARTITION_ONLY_SHUFFLE [RS_337]
+ Group By Operator [GBY_334] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_333] (rows=50 width=4)
+ Select Operator [SEL_329] (rows=50 width=4)
Output:["_col0"]
- Please refer to the previous Select Operator [SEL_331]
+ Please refer to the previous Select Operator [SEL_327]
<-Reducer 26 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_361]
- Group By Operator [GBY_360] (rows=1 width=12)
+ BROADCAST [RS_357]
+ Group By Operator [GBY_356] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=8000000)"]
<-Map 25 [CUSTOM_SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_357]
- Group By Operator [GBY_354] (rows=1 width=12)
+ PARTITION_ONLY_SHUFFLE [RS_353]
+ Group By Operator [GBY_350] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=8000000)"]
- Select Operator [SEL_349] (rows=8000000 width=4)
+ Select Operator [SEL_345] (rows=8000000 width=4)
Output:["_col0"]
- Please refer to the previous Select Operator [SEL_347]
+ Please refer to the previous Select Operator [SEL_343]
<-Reducer 9 [CONTAINS] vectorized
- Reduce Output Operator [RS_382]
+ Reduce Output Operator [RS_378]
PartitionCols:_col0
- Group By Operator [GBY_381] (rows=59 width=115)
+ Group By Operator [GBY_377] (rows=59 width=115)
Output:["_col0","_col1"],aggregations:["sum(_col1)"],keys:_col0
- Group By Operator [GBY_380] (rows=35 width=115)
+ Group By Operator [GBY_376] (rows=35 width=115)
Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0
<-Reducer 8 [SIMPLE_EDGE]
SHUFFLE [RS_71]
PartitionCols:_col0
Group By Operator [GBY_70] (rows=35 width=115)
Output:["_col0","_col1"],aggregations:["sum(_col7)"],keys:_col1
- Merge Join Operator [MERGEJOIN_307] (rows=22352 width=3)
+ Merge Join Operator [MERGEJOIN_303] (rows=22352 width=3)
Conds:RS_66._col0=RS_67._col3(Inner),Output:["_col1","_col7"]
<-Reducer 2 [SIMPLE_EDGE]
SHUFFLE [RS_66]
PartitionCols:_col0
- Please refer to the previous Merge Join Operator [MERGEJOIN_297]
+ Please refer to the previous Merge Join Operator [MERGEJOIN_293]
<-Reducer 20 [SIMPLE_EDGE]
SHUFFLE [RS_67]
PartitionCols:_col3
Select Operator [SEL_62] (rows=1550375 width=13)
Output:["_col3","_col4"]
- Merge Join Operator [MERGEJOIN_302] (rows=1550375 width=13)
- Conds:RS_59._col1=RS_350._col0(Inner),Output:["_col2","_col3"]
+ Merge Join Operator [MERGEJOIN_298] (rows=1550375 width=13)
+ Conds:RS_59._col1=RS_346._col0(Inner),Output:["_col2","_col3"]
<-Map 25 [SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_350]
+ PARTITION_ONLY_SHUFFLE [RS_346]
PartitionCols:_col0
- Please refer to the previous Select Operator [SEL_347]
+ Please refer to the previous Select Operator [SEL_343]
<-Reducer 19 [SIMPLE_EDGE]
SHUFFLE [RS_59]
PartitionCols:_col1
- Merge Join Operator [MERGEJOIN_301] (rows=7751872 width=98)
- Conds:RS_379._col0=RS_334._col0(Inner),Output:["_col1","_col2","_col3"]
+ Merge Join Operator [MERGEJOIN_297] (rows=7751872 width=98)
+ Conds:RS_375._col0=RS_330._col0(Inner),Output:["_col1","_col2","_col3"]
<-Map 17 [SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_334]
+ PARTITION_ONLY_SHUFFLE [RS_330]
PartitionCols:_col0
- Please refer to the previous Select Operator [SEL_331]
+ Please refer to the previous Select Operator [SEL_327]
<-Map 29 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_379]
+ SHUFFLE [RS_375]
PartitionCols:_col0
- Select Operator [SEL_378] (rows=285117733 width=123)
+ Select Operator [SEL_374] (rows=285117733 width=123)
Output:["_col0","_col1","_col2","_col3"]
- Filter Operator [FIL_377] (rows=285117733 width=123)
+ Filter Operator [FIL_373] (rows=285117733 width=123)
predicate:((cs_bill_addr_sk BETWEEN DynamicValue(RS_60_customer_address_ca_address_sk_min) AND DynamicValue(RS_60_customer_address_ca_address_sk_max) and in_bloom_filter(cs_bill_addr_sk, DynamicValue(RS_60_customer_address_ca_address_sk_bloom_filter))) and (cs_sold_date_sk BETWEEN DynamicValue(RS_57_date_dim_d_date_sk_min) AND DynamicValue(RS_57_date_dim_d_date_sk_max) and in_bloom_filter(cs_sold_date_sk, DynamicValue(RS_57_date_dim_d_date_sk_bloom_filter))) and cs_bill_addr_sk is not null and cs_sold_date_sk is not null)
TableScan [TS_47] (rows=287989836 width=123)
default@catalog_sales,catalog_sales,Tbl:COMPLETE,Col:COMPLETE,Output:["cs_sold_date_sk","cs_bill_addr_sk","cs_item_sk","cs_ext_sales_price"]
<-Reducer 21 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_374]
- Group By Operator [GBY_373] (rows=1 width=12)
+ BROADCAST [RS_370]
+ Group By Operator [GBY_369] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
<-Map 17 [CUSTOM_SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_342]
- Group By Operator [GBY_339] (rows=1 width=12)
+ PARTITION_ONLY_SHUFFLE [RS_338]
+ Group By Operator [GBY_335] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_335] (rows=50 width=4)
+ Select Operator [SEL_331] (rows=50 width=4)
Output:["_col0"]
- Please refer to the previous Select Operator [SEL_331]
+ Please refer to the previous Select Operator [SEL_327]
<-Reducer 27 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_376]
- Group By Operator [GBY_375] (rows=1 width=12)
+ BROADCAST [RS_372]
+ Group By Operator [GBY_371] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=8000000)"]
<-Map 25 [CUSTOM_SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_358]
- Group By Operator [GBY_355] (rows=1 width=12)
+ PARTITION_ONLY_SHUFFLE [RS_354]
+ Group By Operator [GBY_351] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=8000000)"]
- Select Operator [SEL_351] (rows=8000000 width=4)
+ Select Operator [SEL_347] (rows=8000000 width=4)
Output:["_col0"]
- Please refer to the previous Select Operator [SEL_347]
+ Please refer to the previous Select Operator [SEL_343]
http://git-wip-us.apache.org/repos/asf/hive/blob/3cbc13e9/ql/src/test/results/clientpositive/perf/tez/constraints/query56.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/constraints/query56.q.out b/ql/src/test/results/clientpositive/perf/tez/constraints/query56.q.out
index b57ded3..cac7668 100644
--- a/ql/src/test/results/clientpositive/perf/tez/constraints/query56.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/constraints/query56.q.out
@@ -183,55 +183,55 @@ Stage-0
limit:100
Stage-1
Reducer 7 vectorized
- File Output Operator [FS_370]
- Limit [LIM_369] (rows=100 width=212)
+ File Output Operator [FS_366]
+ Limit [LIM_365] (rows=100 width=212)
Number of rows:100
- Select Operator [SEL_368] (rows=430 width=212)
+ Select Operator [SEL_364] (rows=430 width=212)
Output:["_col0","_col1"]
<-Reducer 6 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_367]
- Group By Operator [GBY_366] (rows=430 width=212)
+ SHUFFLE [RS_363]
+ Group By Operator [GBY_362] (rows=430 width=212)
Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0
<-Union 5 [SIMPLE_EDGE]
<-Reducer 10 [CONTAINS] vectorized
- Reduce Output Operator [RS_382]
+ Reduce Output Operator [RS_378]
PartitionCols:_col0
- Group By Operator [GBY_381] (rows=430 width=212)
+ Group By Operator [GBY_377] (rows=430 width=212)
Output:["_col0","_col1"],aggregations:["sum(_col1)"],keys:_col0
- Group By Operator [GBY_380] (rows=430 width=212)
+ Group By Operator [GBY_376] (rows=430 width=212)
Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0
<-Reducer 9 [SIMPLE_EDGE]
SHUFFLE [RS_69]
PartitionCols:_col0
Group By Operator [GBY_68] (rows=430 width=212)
Output:["_col0","_col1"],aggregations:["sum(_col7)"],keys:_col1
- Merge Join Operator [MERGEJOIN_304] (rows=373066 width=100)
+ Merge Join Operator [MERGEJOIN_300] (rows=373066 width=100)
Conds:RS_64._col0=RS_65._col3(Inner),Output:["_col1","_col7"]
<-Reducer 2 [SIMPLE_EDGE]
SHUFFLE [RS_64]
PartitionCols:_col0
- Merge Join Operator [MERGEJOIN_294] (rows=17170 width=104)
- Conds:RS_319._col1=RS_325._col0(Inner),Output:["_col0","_col1"]
+ Merge Join Operator [MERGEJOIN_290] (rows=17170 width=104)
+ Conds:RS_315._col1=RS_321._col0(Inner),Output:["_col0","_col1"]
<-Map 1 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_319]
+ SHUFFLE [RS_315]
PartitionCols:_col1
- Select Operator [SEL_318] (rows=462000 width=104)
+ Select Operator [SEL_314] (rows=462000 width=104)
Output:["_col0","_col1"]
TableScan [TS_0] (rows=462000 width=104)
default@item,item,Tbl:COMPLETE,Col:COMPLETE,Output:["i_item_sk","i_item_id"]
<-Reducer 16 [ONE_TO_ONE_EDGE] vectorized
- FORWARD [RS_325]
+ FORWARD [RS_321]
PartitionCols:_col0
- Group By Operator [GBY_324] (rows=11550 width=100)
+ Group By Operator [GBY_320] (rows=11550 width=100)
Output:["_col0"],keys:KEY._col0
<-Map 15 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_323]
+ SHUFFLE [RS_319]
PartitionCols:_col0
- Group By Operator [GBY_322] (rows=11550 width=100)
+ Group By Operator [GBY_318] (rows=11550 width=100)
Output:["_col0"],keys:i_item_id
- Select Operator [SEL_321] (rows=23100 width=189)
+ Select Operator [SEL_317] (rows=23100 width=189)
Output:["i_item_id"]
- Filter Operator [FIL_320] (rows=23100 width=189)
+ Filter Operator [FIL_316] (rows=23100 width=189)
predicate:(i_color) IN ('orchid', 'chiffon', 'lace')
TableScan [TS_2] (rows=462000 width=189)
default@item,item,Tbl:COMPLETE,Col:COMPLETE,Output:["i_item_id","i_color"]
@@ -240,231 +240,231 @@ Stage-0
PartitionCols:_col3
Select Operator [SEL_60] (rows=1550375 width=13)
Output:["_col3","_col4"]
- Merge Join Operator [MERGEJOIN_299] (rows=1550375 width=13)
- Conds:RS_57._col1=RS_346._col0(Inner),Output:["_col2","_col3"]
+ Merge Join Operator [MERGEJOIN_295] (rows=1550375 width=13)
+ Conds:RS_57._col1=RS_342._col0(Inner),Output:["_col2","_col3"]
<-Map 28 [SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_346]
+ PARTITION_ONLY_SHUFFLE [RS_342]
PartitionCols:_col0
- Select Operator [SEL_343] (rows=8000000 width=4)
+ Select Operator [SEL_339] (rows=8000000 width=4)
Output:["_col0"]
- Filter Operator [FIL_342] (rows=8000000 width=112)
+ Filter Operator [FIL_338] (rows=8000000 width=112)
predicate:(ca_gmt_offset = -8)
TableScan [TS_15] (rows=40000000 width=112)
default@customer_address,customer_address,Tbl:COMPLETE,Col:COMPLETE,Output:["ca_address_sk","ca_gmt_offset"]
<-Reducer 22 [SIMPLE_EDGE]
SHUFFLE [RS_57]
PartitionCols:_col1
- Merge Join Operator [MERGEJOIN_298] (rows=7751872 width=98)
- Conds:RS_379._col0=RS_330._col0(Inner),Output:["_col1","_col2","_col3"]
+ Merge Join Operator [MERGEJOIN_294] (rows=7751872 width=98)
+ Conds:RS_375._col0=RS_326._col0(Inner),Output:["_col1","_col2","_col3"]
<-Map 20 [SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_330]
+ PARTITION_ONLY_SHUFFLE [RS_326]
PartitionCols:_col0
- Select Operator [SEL_327] (rows=50 width=4)
+ Select Operator [SEL_323] (rows=50 width=4)
Output:["_col0"]
- Filter Operator [FIL_326] (rows=50 width=12)
+ Filter Operator [FIL_322] (rows=50 width=12)
predicate:((d_moy = 1) and (d_year = 2000))
TableScan [TS_12] (rows=73049 width=12)
default@date_dim,date_dim,Tbl:COMPLETE,Col:COMPLETE,Output:["d_date_sk","d_year","d_moy"]
<-Map 32 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_379]
+ SHUFFLE [RS_375]
PartitionCols:_col0
- Select Operator [SEL_378] (rows=285117733 width=123)
+ Select Operator [SEL_374] (rows=285117733 width=123)
Output:["_col0","_col1","_col2","_col3"]
- Filter Operator [FIL_377] (rows=285117733 width=123)
+ Filter Operator [FIL_373] (rows=285117733 width=123)
predicate:((cs_bill_addr_sk BETWEEN DynamicValue(RS_58_customer_address_ca_address_sk_min) AND DynamicValue(RS_58_customer_address_ca_address_sk_max) and in_bloom_filter(cs_bill_addr_sk, DynamicValue(RS_58_customer_address_ca_address_sk_bloom_filter))) and (cs_item_sk BETWEEN DynamicValue(RS_64_item_i_item_sk_min) AND DynamicValue(RS_64_item_i_item_sk_max) and in_bloom_filter(cs_item_sk, DynamicValue(RS_64_item_i_item_sk_bloom_filter))) and (cs_sold_date_sk BETWEEN DynamicValue(RS_55_date_dim_d_date_sk_min) AND DynamicValue(RS_55_date_dim_d_date_sk_max) and in_bloom_filter(cs_sold_date_sk, DynamicValue(RS_55_date_dim_d_date_sk_bloom_filter))) and cs_bill_addr_sk is not null and cs_sold_date_sk is not null)
TableScan [TS_45] (rows=287989836 width=123)
default@catalog_sales,catalog_sales,Tbl:COMPLETE,Col:COMPLETE,Output:["cs_sold_date_sk","cs_bill_addr_sk","cs_item_sk","cs_ext_sales_price"]
<-Reducer 11 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_376]
- Group By Operator [GBY_375] (rows=1 width=12)
+ BROADCAST [RS_372]
+ Group By Operator [GBY_371] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
<-Reducer 2 [CUSTOM_SIMPLE_EDGE]
- SHUFFLE [RS_239]
- Group By Operator [GBY_238] (rows=1 width=12)
+ SHUFFLE [RS_237]
+ Group By Operator [GBY_236] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_237] (rows=17170 width=4)
+ Select Operator [SEL_235] (rows=17170 width=4)
Output:["_col0"]
- Please refer to the previous Merge Join Operator [MERGEJOIN_294]
+ Please refer to the previous Merge Join Operator [MERGEJOIN_290]
<-Reducer 24 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_372]
- Group By Operator [GBY_371] (rows=1 width=12)
+ BROADCAST [RS_368]
+ Group By Operator [GBY_367] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
<-Map 20 [CUSTOM_SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_338]
- Group By Operator [GBY_335] (rows=1 width=12)
+ PARTITION_ONLY_SHUFFLE [RS_334]
+ Group By Operator [GBY_331] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_331] (rows=50 width=4)
+ Select Operator [SEL_327] (rows=50 width=4)
Output:["_col0"]
- Please refer to the previous Select Operator [SEL_327]
+ Please refer to the previous Select Operator [SEL_323]
<-Reducer 30 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_374]
- Group By Operator [GBY_373] (rows=1 width=12)
+ BROADCAST [RS_370]
+ Group By Operator [GBY_369] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=8000000)"]
<-Map 28 [CUSTOM_SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_354]
- Group By Operator [GBY_351] (rows=1 width=12)
+ PARTITION_ONLY_SHUFFLE [RS_350]
+ Group By Operator [GBY_347] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=8000000)"]
- Select Operator [SEL_347] (rows=8000000 width=4)
+ Select Operator [SEL_343] (rows=8000000 width=4)
Output:["_col0"]
- Please refer to the previous Select Operator [SEL_343]
+ Please refer to the previous Select Operator [SEL_339]
<-Reducer 13 [CONTAINS] vectorized
- Reduce Output Operator [RS_394]
+ Reduce Output Operator [RS_390]
PartitionCols:_col0
- Group By Operator [GBY_393] (rows=430 width=212)
+ Group By Operator [GBY_389] (rows=430 width=212)
Output:["_col0","_col1"],aggregations:["sum(_col1)"],keys:_col0
- Group By Operator [GBY_392] (rows=430 width=212)
+ Group By Operator [GBY_388] (rows=430 width=212)
Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0
<-Reducer 12 [SIMPLE_EDGE]
SHUFFLE [RS_106]
PartitionCols:_col0
Group By Operator [GBY_105] (rows=430 width=212)
Output:["_col0","_col1"],aggregations:["sum(_col7)"],keys:_col1
- Merge Join Operator [MERGEJOIN_305] (rows=189670 width=190)
+ Merge Join Operator [MERGEJOIN_301] (rows=189670 width=190)
Conds:RS_101._col0=RS_102._col2(Inner),Output:["_col1","_col7"]
<-Reducer 2 [SIMPLE_EDGE]
SHUFFLE [RS_101]
PartitionCols:_col0
- Please refer to the previous Merge Join Operator [MERGEJOIN_294]
+ Please refer to the previous Merge Join Operator [MERGEJOIN_290]
<-Reducer 26 [SIMPLE_EDGE]
SHUFFLE [RS_102]
PartitionCols:_col2
Select Operator [SEL_97] (rows=788222 width=110)
Output:["_col2","_col4"]
- Merge Join Operator [MERGEJOIN_302] (rows=788222 width=110)
- Conds:RS_94._col2=RS_348._col0(Inner),Output:["_col1","_col3"]
+ Merge Join Operator [MERGEJOIN_298] (rows=788222 width=110)
+ Conds:RS_94._col2=RS_344._col0(Inner),Output:["_col1","_col3"]
<-Map 28 [SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_348]
+ PARTITION_ONLY_SHUFFLE [RS_344]
PartitionCols:_col0
- Please refer to the previous Select Operator [SEL_343]
+ Please refer to the previous Select Operator [SEL_339]
<-Reducer 25 [SIMPLE_EDGE]
SHUFFLE [RS_94]
PartitionCols:_col2
- Merge Join Operator [MERGEJOIN_301] (rows=3941109 width=118)
- Conds:RS_391._col0=RS_332._col0(Inner),Output:["_col1","_col2","_col3"]
+ Merge Join Operator [MERGEJOIN_297] (rows=3941109 width=118)
+ Conds:RS_387._col0=RS_328._col0(Inner),Output:["_col1","_col2","_col3"]
<-Map 20 [SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_332]
+ PARTITION_ONLY_SHUFFLE [RS_328]
PartitionCols:_col0
- Please refer to the previous Select Operator [SEL_327]
+ Please refer to the previous Select Operator [SEL_323]
<-Map 33 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_391]
+ SHUFFLE [RS_387]
PartitionCols:_col0
- Select Operator [SEL_390] (rows=143931246 width=123)
+ Select Operator [SEL_386] (rows=143931246 width=123)
Output:["_col0","_col1","_col2","_col3"]
- Filter Operator [FIL_389] (rows=143931246 width=123)
+ Filter Operator [FIL_385] (rows=143931246 width=123)
predicate:((ws_bill_addr_sk BETWEEN DynamicValue(RS_95_customer_address_ca_address_sk_min) AND DynamicValue(RS_95_customer_address_ca_address_sk_max) and in_bloom_filter(ws_bill_addr_sk, DynamicValue(RS_95_customer_address_ca_address_sk_bloom_filter))) and (ws_item_sk BETWEEN DynamicValue(RS_101_item_i_item_sk_min) AND DynamicValue(RS_101_item_i_item_sk_max) and in_bloom_filter(ws_item_sk, DynamicValue(RS_101_item_i_item_sk_bloom_filter))) and (ws_sold_date_sk BETWEEN DynamicValue(RS_92_date_dim_d_date_sk_min) AND DynamicValue(RS_92_date_dim_d_date_sk_max) and in_bloom_filter(ws_sold_date_sk, DynamicValue(RS_92_date_dim_d_date_sk_bloom_filter))) and ws_bill_addr_sk is not null and ws_sold_date_sk is not null)
TableScan [TS_82] (rows=144002668 width=123)
default@web_sales,web_sales,Tbl:COMPLETE,Col:COMPLETE,Output:["ws_sold_date_sk","ws_item_sk","ws_bill_addr_sk","ws_ext_sales_price"]
<-Reducer 14 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_388]
- Group By Operator [GBY_387] (rows=1 width=12)
+ BROADCAST [RS_384]
+ Group By Operator [GBY_383] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
<-Reducer 2 [CUSTOM_SIMPLE_EDGE]
- SHUFFLE [RS_285]
- Group By Operator [GBY_284] (rows=1 width=12)
+ SHUFFLE [RS_277]
+ Group By Operator [GBY_276] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_283] (rows=17170 width=4)
+ Select Operator [SEL_275] (rows=17170 width=4)
Output:["_col0"]
- Please refer to the previous Merge Join Operator [MERGEJOIN_294]
+ Please refer to the previous Merge Join Operator [MERGEJOIN_290]
<-Reducer 27 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_384]
- Group By Operator [GBY_383] (rows=1 width=12)
+ BROADCAST [RS_380]
+ Group By Operator [GBY_379] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
<-Map 20 [CUSTOM_SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_339]
- Group By Operator [GBY_336] (rows=1 width=12)
+ PARTITION_ONLY_SHUFFLE [RS_335]
+ Group By Operator [GBY_332] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_333] (rows=50 width=4)
+ Select Operator [SEL_329] (rows=50 width=4)
Output:["_col0"]
- Please refer to the previous Select Operator [SEL_327]
+ Please refer to the previous Select Operator [SEL_323]
<-Reducer 31 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_386]
- Group By Operator [GBY_385] (rows=1 width=12)
+ BROADCAST [RS_382]
+ Group By Operator [GBY_381] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=8000000)"]
<-Map 28 [CUSTOM_SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_355]
- Group By Operator [GBY_352] (rows=1 width=12)
+ PARTITION_ONLY_SHUFFLE [RS_351]
+ Group By Operator [GBY_348] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=8000000)"]
- Select Operator [SEL_349] (rows=8000000 width=4)
+ Select Operator [SEL_345] (rows=8000000 width=4)
Output:["_col0"]
- Please refer to the previous Select Operator [SEL_343]
+ Please refer to the previous Select Operator [SEL_339]
<-Reducer 4 [CONTAINS] vectorized
- Reduce Output Operator [RS_365]
+ Reduce Output Operator [RS_361]
PartitionCols:_col0
- Group By Operator [GBY_364] (rows=430 width=212)
+ Group By Operator [GBY_360] (rows=430 width=212)
Output:["_col0","_col1"],aggregations:["sum(_col1)"],keys:_col0
- Group By Operator [GBY_363] (rows=430 width=212)
+ Group By Operator [GBY_359] (rows=430 width=212)
Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0
<-Reducer 3 [SIMPLE_EDGE]
SHUFFLE [RS_33]
PartitionCols:_col0
Group By Operator [GBY_32] (rows=430 width=212)
Output:["_col0","_col1"],aggregations:["sum(_col7)"],keys:_col1
- Merge Join Operator [MERGEJOIN_303] (rows=692265 width=100)
+ Merge Join Operator [MERGEJOIN_299] (rows=692265 width=100)
Conds:RS_28._col0=RS_29._col2(Inner),Output:["_col1","_col7"]
<-Reducer 2 [SIMPLE_EDGE]
SHUFFLE [RS_28]
PartitionCols:_col0
- Please refer to the previous Merge Join Operator [MERGEJOIN_294]
+ Please refer to the previous Merge Join Operator [MERGEJOIN_290]
<-Reducer 19 [SIMPLE_EDGE]
SHUFFLE [RS_29]
PartitionCols:_col2
Select Operator [SEL_24] (rows=2876890 width=4)
Output:["_col2","_col4"]
- Merge Join Operator [MERGEJOIN_296] (rows=2876890 width=4)
- Conds:RS_21._col2=RS_344._col0(Inner),Output:["_col1","_col3"]
+ Merge Join Operator [MERGEJOIN_292] (rows=2876890 width=4)
+ Conds:RS_21._col2=RS_340._col0(Inner),Output:["_col1","_col3"]
<-Map 28 [SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_344]
+ PARTITION_ONLY_SHUFFLE [RS_340]
PartitionCols:_col0
- Please refer to the previous Select Operator [SEL_343]
+ Please refer to the previous Select Operator [SEL_339]
<-Reducer 18 [SIMPLE_EDGE]
SHUFFLE [RS_21]
PartitionCols:_col2
- Merge Join Operator [MERGEJOIN_295] (rows=14384447 width=4)
- Conds:RS_362._col0=RS_328._col0(Inner),Output:["_col1","_col2","_col3"]
+ Merge Join Operator [MERGEJOIN_291] (rows=14384447 width=4)
+ Conds:RS_358._col0=RS_324._col0(Inner),Output:["_col1","_col2","_col3"]
<-Map 20 [SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_328]
+ PARTITION_ONLY_SHUFFLE [RS_324]
PartitionCols:_col0
- Please refer to the previous Select Operator [SEL_327]
+ Please refer to the previous Select Operator [SEL_323]
<-Map 17 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_362]
+ SHUFFLE [RS_358]
PartitionCols:_col0
- Select Operator [SEL_361] (rows=525327191 width=118)
+ Select Operator [SEL_357] (rows=525327191 width=118)
Output:["_col0","_col1","_col2","_col3"]
- Filter Operator [FIL_360] (rows=525327191 width=118)
+ Filter Operator [FIL_356] (rows=525327191 width=118)
predicate:((ss_addr_sk BETWEEN DynamicValue(RS_22_customer_address_ca_address_sk_min) AND DynamicValue(RS_22_customer_address_ca_address_sk_max) and in_bloom_filter(ss_addr_sk, DynamicValue(RS_22_customer_address_ca_address_sk_bloom_filter))) and (ss_item_sk BETWEEN DynamicValue(RS_28_item_i_item_sk_min) AND DynamicValue(RS_28_item_i_item_sk_max) and in_bloom_filter(ss_item_sk, DynamicValue(RS_28_item_i_item_sk_bloom_filter))) and (ss_sold_date_sk BETWEEN DynamicValue(RS_19_date_dim_d_date_sk_min) AND DynamicValue(RS_19_date_dim_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk, DynamicValue(RS_19_date_dim_d_date_sk_bloom_filter))) and ss_addr_sk is not null and ss_sold_date_sk is not null)
TableScan [TS_9] (rows=575995635 width=118)
default@store_sales,store_sales,Tbl:COMPLETE,Col:COMPLETE,Output:["ss_sold_date_sk","ss_item_sk","ss_addr_sk","ss_ext_sales_price"]
<-Reducer 21 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_341]
- Group By Operator [GBY_340] (rows=1 width=12)
+ BROADCAST [RS_337]
+ Group By Operator [GBY_336] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
<-Map 20 [CUSTOM_SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_337]
- Group By Operator [GBY_334] (rows=1 width=12)
+ PARTITION_ONLY_SHUFFLE [RS_333]
+ Group By Operator [GBY_330] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_329] (rows=50 width=4)
+ Select Operator [SEL_325] (rows=50 width=4)
Output:["_col0"]
- Please refer to the previous Select Operator [SEL_327]
+ Please refer to the previous Select Operator [SEL_323]
<-Reducer 29 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_357]
- Group By Operator [GBY_356] (rows=1 width=12)
+ BROADCAST [RS_353]
+ Group By Operator [GBY_352] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=8000000)"]
<-Map 28 [CUSTOM_SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_353]
- Group By Operator [GBY_350] (rows=1 width=12)
+ PARTITION_ONLY_SHUFFLE [RS_349]
+ Group By Operator [GBY_346] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=8000000)"]
- Select Operator [SEL_345] (rows=8000000 width=4)
+ Select Operator [SEL_341] (rows=8000000 width=4)
Output:["_col0"]
- Please refer to the previous Select Operator [SEL_343]
+ Please refer to the previous Select Operator [SEL_339]
<-Reducer 8 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_359]
- Group By Operator [GBY_358] (rows=1 width=12)
+ BROADCAST [RS_355]
+ Group By Operator [GBY_354] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
<-Reducer 2 [CUSTOM_SIMPLE_EDGE]
- SHUFFLE [RS_203]
- Group By Operator [GBY_202] (rows=1 width=12)
+ SHUFFLE [RS_197]
+ Group By Operator [GBY_196] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_201] (rows=17170 width=4)
+ Select Operator [SEL_195] (rows=17170 width=4)
Output:["_col0"]
- Please refer to the previous Merge Join Operator [MERGEJOIN_294]
+ Please refer to the previous Merge Join Operator [MERGEJOIN_290]
http://git-wip-us.apache.org/repos/asf/hive/blob/3cbc13e9/ql/src/test/results/clientpositive/perf/tez/constraints/query6.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/constraints/query6.q.out b/ql/src/test/results/clientpositive/perf/tez/constraints/query6.q.out
index 85c962f..74bec5c 100644
--- a/ql/src/test/results/clientpositive/perf/tez/constraints/query6.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/constraints/query6.q.out
@@ -1,4 +1,4 @@
-Warning: Map Join MAPJOIN[172][bigTable=?] in task 'Reducer 15' is a cross product
+Warning: Map Join MAPJOIN[170][bigTable=?] in task 'Reducer 15' is a cross product
PREHOOK: query: explain
select a.ca_state state, count(*) cnt
from customer_address a
@@ -83,153 +83,153 @@ Stage-0
limit:100
Stage-1
Reducer 10 vectorized
- File Output Operator [FS_234]
- Limit [LIM_233] (rows=1 width=94)
+ File Output Operator [FS_232]
+ Limit [LIM_231] (rows=1 width=94)
Number of rows:100
- Select Operator [SEL_232] (rows=1 width=94)
+ Select Operator [SEL_230] (rows=1 width=94)
Output:["_col0","_col1"]
<-Reducer 9 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_231]
- Filter Operator [FIL_230] (rows=1 width=94)
+ SHUFFLE [RS_229]
+ Filter Operator [FIL_228] (rows=1 width=94)
predicate:(_col1 >= 10L)
- Group By Operator [GBY_229] (rows=1 width=94)
+ Group By Operator [GBY_227] (rows=1 width=94)
Output:["_col0","_col1"],aggregations:["count(VALUE._col0)"],keys:KEY._col0
<-Reducer 8 [SIMPLE_EDGE]
SHUFFLE [RS_68]
PartitionCols:_col0
Group By Operator [GBY_67] (rows=1 width=94)
Output:["_col0","_col1"],aggregations:["count()"],keys:_col9
- Merge Join Operator [MERGEJOIN_175] (rows=316 width=86)
- Conds:RS_63._col4=RS_214._col0(Inner),Output:["_col9"]
+ Merge Join Operator [MERGEJOIN_173] (rows=316 width=86)
+ Conds:RS_63._col4=RS_212._col0(Inner),Output:["_col9"]
<-Map 16 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_214]
+ SHUFFLE [RS_212]
PartitionCols:_col0
- Select Operator [SEL_213] (rows=154000 width=227)
+ Select Operator [SEL_211] (rows=154000 width=227)
Output:["_col0"]
- Filter Operator [FIL_212] (rows=154000 width=227)
+ Filter Operator [FIL_210] (rows=154000 width=227)
predicate:(_col4 > _col1)
- Map Join Operator [MAPJOIN_211] (rows=462000 width=227)
- Conds:RS_208._col0=SEL_210._col2(Inner),HybridGraceHashJoin:true,Output:["_col1","_col3","_col4"]
+ Map Join Operator [MAPJOIN_209] (rows=462000 width=227)
+ Conds:RS_206._col0=SEL_208._col2(Inner),HybridGraceHashJoin:true,Output:["_col1","_col3","_col4"]
<-Reducer 15 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_208]
+ BROADCAST [RS_206]
PartitionCols:_col0
- Map Join Operator [MAPJOIN_207] (rows=10 width=202)
+ Map Join Operator [MAPJOIN_205] (rows=10 width=202)
Conds:(Inner),Output:["_col0","_col1"]
<-Reducer 5 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_204]
- Select Operator [SEL_203] (rows=1 width=8)
- Filter Operator [FIL_202] (rows=1 width=8)
+ BROADCAST [RS_202]
+ Select Operator [SEL_201] (rows=1 width=8)
+ Filter Operator [FIL_200] (rows=1 width=8)
predicate:(sq_count_check(_col0) <= 1)
- Group By Operator [GBY_201] (rows=1 width=8)
+ Group By Operator [GBY_199] (rows=1 width=8)
Output:["_col0"],aggregations:["count(VALUE._col0)"]
<-Reducer 4 [CUSTOM_SIMPLE_EDGE] vectorized
- PARTITION_ONLY_SHUFFLE [RS_200]
- Group By Operator [GBY_199] (rows=1 width=8)
+ PARTITION_ONLY_SHUFFLE [RS_198]
+ Group By Operator [GBY_197] (rows=1 width=8)
Output:["_col0"],aggregations:["count()"]
- Select Operator [SEL_198] (rows=25 width=4)
- Group By Operator [GBY_197] (rows=25 width=4)
+ Select Operator [SEL_196] (rows=25 width=4)
+ Group By Operator [GBY_195] (rows=25 width=4)
Output:["_col0"],keys:KEY._col0
<-Map 2 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_187]
+ SHUFFLE [RS_185]
PartitionCols:_col0
- Group By Operator [GBY_185] (rows=25 width=4)
+ Group By Operator [GBY_183] (rows=25 width=4)
Output:["_col0"],keys:d_month_seq
- Select Operator [SEL_183] (rows=50 width=12)
+ Select Operator [SEL_181] (rows=50 width=12)
Output:["d_month_seq"]
- Filter Operator [FIL_181] (rows=50 width=12)
+ Filter Operator [FIL_179] (rows=50 width=12)
predicate:((d_moy = 2) and (d_year = 2000))
TableScan [TS_3] (rows=73049 width=12)
default@date_dim,date_dim,Tbl:COMPLETE,Col:COMPLETE,Output:["d_month_seq","d_year","d_moy"]
- <-Select Operator [SEL_206] (rows=10 width=202)
+ <-Select Operator [SEL_204] (rows=10 width=202)
Output:["_col0","_col1"]
- Group By Operator [GBY_205] (rows=10 width=210)
+ Group By Operator [GBY_203] (rows=10 width=210)
Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)","count(VALUE._col1)"],keys:KEY._col0
<-Map 14 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_196]
+ SHUFFLE [RS_194]
PartitionCols:_col0
- Group By Operator [GBY_195] (rows=10 width=210)
+ Group By Operator [GBY_193] (rows=10 width=210)
Output:["_col0","_col1","_col2"],aggregations:["sum(i_current_price)","count(i_current_price)"],keys:i_category
- Filter Operator [FIL_194] (rows=462000 width=201)
+ Filter Operator [FIL_192] (rows=462000 width=201)
predicate:i_category is not null
TableScan [TS_22] (rows=462000 width=201)
default@item,j,Tbl:COMPLETE,Col:COMPLETE,Output:["i_current_price","i_category"]
- <-Select Operator [SEL_210] (rows=462000 width=205)
+ <-Select Operator [SEL_208] (rows=462000 width=205)
Output:["_col0","_col1","_col2"]
- Filter Operator [FIL_209] (rows=462000 width=205)
+ Filter Operator [FIL_207] (rows=462000 width=205)
predicate:i_category is not null
TableScan [TS_43] (rows=462000 width=205)
default@item,i,Tbl:COMPLETE,Col:COMPLETE,Output:["i_item_sk","i_current_price","i_category"]
<-Reducer 7 [SIMPLE_EDGE]
SHUFFLE [RS_63]
PartitionCols:_col4
- Merge Join Operator [MERGEJOIN_174] (rows=7192227 width=90)
- Conds:RS_223._col5=RS_61._col0(Inner),Output:["_col4","_col9"]
+ Merge Join Operator [MERGEJOIN_172] (rows=7192227 width=90)
+ Conds:RS_221._col5=RS_61._col0(Inner),Output:["_col4","_col9"]
<-Map 6 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_223]
+ SHUFFLE [RS_221]
PartitionCols:_col5
- Map Join Operator [MAPJOIN_222] (rows=7192227 width=4)
- Conds:RS_193._col0=SEL_221._col0(Inner),HybridGraceHashJoin:true,Output:["_col4","_col5"]
+ Map Join Operator [MAPJOIN_220] (rows=7192227 width=4)
+ Conds:RS_191._col0=SEL_219._col0(Inner),HybridGraceHashJoin:true,Output:["_col4","_col5"]
<-Map 1 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_193]
+ BROADCAST [RS_191]
PartitionCols:_col0
- Map Join Operator [MAPJOIN_192] (rows=660 width=4)
- Conds:SEL_191._col1=RS_189._col0(Inner),HybridGraceHashJoin:true,Output:["_col0"]
+ Map Join Operator [MAPJOIN_190] (rows=660 width=4)
+ Conds:SEL_189._col1=RS_187._col0(Inner),HybridGraceHashJoin:true,Output:["_col0"]
<-Reducer 3 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_189]
+ BROADCAST [RS_187]
PartitionCols:_col0
- Group By Operator [GBY_188] (rows=25 width=4)
+ Group By Operator [GBY_186] (rows=25 width=4)
Output:["_col0"],keys:KEY._col0
<-Map 2 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_186]
+ SHUFFLE [RS_184]
PartitionCols:_col0
- Group By Operator [GBY_184] (rows=25 width=4)
+ Group By Operator [GBY_182] (rows=25 width=4)
Output:["_col0"],keys:d_month_seq
- Select Operator [SEL_182] (rows=50 width=12)
+ Select Operator [SEL_180] (rows=50 width=12)
Output:["d_month_seq"]
- Filter Operator [FIL_180] (rows=50 width=12)
+ Filter Operator [FIL_178] (rows=50 width=12)
predicate:((d_moy = 2) and (d_year = 2000) and d_month_seq is not null)
Please refer to the previous TableScan [TS_3]
- <-Select Operator [SEL_191] (rows=73049 width=8)
+ <-Select Operator [SEL_189] (rows=73049 width=8)
Output:["_col0","_col1"]
- Filter Operator [FIL_190] (rows=73049 width=8)
+ Filter Operator [FIL_188] (rows=73049 width=8)
predicate:d_month_seq is not null
TableScan [TS_0] (rows=73049 width=8)
default@date_dim,d,Tbl:COMPLETE,Col:COMPLETE,Output:["d_date_sk","d_month_seq"]
- <-Select Operator [SEL_221] (rows=525327388 width=11)
+ <-Select Operator [SEL_219] (rows=525327388 width=11)
Output:["_col0","_col1","_col2"]
- Filter Operator [FIL_220] (rows=525327388 width=11)
+ Filter Operator [FIL_218] (rows=525327388 width=11)
predicate:((ss_item_sk BETWEEN DynamicValue(RS_64_i_i_item_sk_min) AND DynamicValue(RS_64_i_i_item_sk_max) and in_bloom_filter(ss_item_sk, DynamicValue(RS_64_i_i_item_sk_bloom_filter))) and ss_customer_sk is not null and ss_sold_date_sk is not null)
TableScan [TS_10] (rows=575995635 width=11)
default@store_sales,s,Tbl:COMPLETE,Col:COMPLETE,Output:["ss_sold_date_sk","ss_item_sk","ss_customer_sk"]
<-Reducer 17 [BROADCAST_EDGE] vectorized
- BROADCAST [RS_219]
- Group By Operator [GBY_218] (rows=1 width=12)
+ BROADCAST [RS_217]
+ Group By Operator [GBY_216] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
<-Map 16 [CUSTOM_SIMPLE_EDGE] vectorized
- SHUFFLE [RS_217]
- Group By Operator [GBY_216] (rows=1 width=12)
+ SHUFFLE [RS_215]
+ Group By Operator [GBY_214] (rows=1 width=12)
Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
- Select Operator [SEL_215] (rows=154000 width=4)
+ Select Operator [SEL_213] (rows=154000 width=4)
Output:["_col0"]
- Please refer to the previous Select Operator [SEL_213]
+ Please refer to the previous Select Operator [SEL_211]
<-Reducer 12 [SIMPLE_EDGE]
SHUFFLE [RS_61]
PartitionCols:_col0
- Merge Join Operator [MERGEJOIN_171] (rows=80000000 width=90)
- Conds:RS_226._col1=RS_228._col0(Inner),Output:["_col0","_col3"]
+ Merge Join Operator [MERGEJOIN_169] (rows=80000000 width=90)
+ Conds:RS_224._col1=RS_226._col0(Inner),Output:["_col0","_col3"]
<-Map 11 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_226]
+ SHUFFLE [RS_224]
PartitionCols:_col1
- Select Operator [SEL_225] (rows=80000000 width=8)
+ Select Operator [SEL_223] (rows=80000000 width=8)
Output:["_col0","_col1"]
- Filter Operator [FIL_224] (rows=80000000 width=8)
+ Filter Operator [FIL_222] (rows=80000000 width=8)
predicate:c_current_addr_sk is not null
TableScan [TS_13] (rows=80000000 width=8)
default@customer,c,Tbl:COMPLETE,Col:COMPLETE,Output:["c_customer_sk","c_current_addr_sk"]
<-Map 13 [SIMPLE_EDGE] vectorized
- SHUFFLE [RS_228]
+ SHUFFLE [RS_226]
PartitionCols:_col0
- Select Operator [SEL_227] (rows=40000000 width=90)
+ Select Operator [SEL_225] (rows=40000000 width=90)
Output:["_col0","_col1"]
TableScan [TS_16] (rows=40000000 width=90)
default@customer_address,a,Tbl:COMPLETE,Col:COMPLETE,Output:["ca_address_sk","ca_state"]