You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@hive.apache.org by ha...@apache.org on 2018/08/06 05:47:48 UTC

[3/9] hive git commit: HIVE-19097 : related equals and in operators may cause inaccurate stats estimations (Zoltan Haindrich via Ashutosh Chauhan)

http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query46.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query46.q.out b/ql/src/test/results/clientpositive/perf/tez/query46.q.out
index 708a852..66f51c3 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query46.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query46.q.out
@@ -165,9 +165,9 @@ Stage-0
                                       <-Map 16 [SIMPLE_EDGE] vectorized
                                         PARTITION_ONLY_SHUFFLE [RS_166]
                                           PartitionCols:_col0
-                                          Select Operator [SEL_165] (rows=852 width=1910)
+                                          Select Operator [SEL_165] (rows=1704 width=1910)
                                             Output:["_col0"]
-                                            Filter Operator [FIL_164] (rows=852 width=1910)
+                                            Filter Operator [FIL_164] (rows=1704 width=1910)
                                               predicate:((s_city) IN ('Cedar Grove', 'Wildwood', 'Union', 'Salem', 'Highland Park') and s_store_sk is not null)
                                               TableScan [TS_12] (rows=1704 width=1910)
                                                 default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_city"]
@@ -179,9 +179,9 @@ Stage-0
                                           <-Map 14 [SIMPLE_EDGE] vectorized
                                             PARTITION_ONLY_SHUFFLE [RS_158]
                                               PartitionCols:_col0
-                                              Select Operator [SEL_157] (rows=18263 width=1119)
+                                              Select Operator [SEL_157] (rows=73049 width=1119)
                                                 Output:["_col0"]
-                                                Filter Operator [FIL_156] (rows=18263 width=1119)
+                                                Filter Operator [FIL_156] (rows=73049 width=1119)
                                                   predicate:((d_dow) IN (6, 0) and (d_year) IN (1998, 1999, 2000) and d_date_sk is not null)
                                                   TableScan [TS_9] (rows=73049 width=1119)
                                                     default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_dow"]
@@ -202,7 +202,7 @@ Stage-0
                                                         PARTITION_ONLY_SHUFFLE [RS_161]
                                                           Group By Operator [GBY_160] (rows=1 width=12)
                                                             Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
-                                                            Select Operator [SEL_159] (rows=18263 width=1119)
+                                                            Select Operator [SEL_159] (rows=73049 width=1119)
                                                               Output:["_col0"]
                                                                Please refer to the previous Select Operator [SEL_157]
                                                   <-Reducer 17 [BROADCAST_EDGE] vectorized
@@ -213,7 +213,7 @@ Stage-0
                                                         PARTITION_ONLY_SHUFFLE [RS_169]
                                                           Group By Operator [GBY_168] (rows=1 width=12)
                                                             Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
-                                                            Select Operator [SEL_167] (rows=852 width=1910)
+                                                            Select Operator [SEL_167] (rows=1704 width=1910)
                                                               Output:["_col0"]
                                                                Please refer to the previous Select Operator [SEL_165]
                                                   <-Reducer 19 [BROADCAST_EDGE] vectorized

http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query48.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query48.q.out b/ql/src/test/results/clientpositive/perf/tez/query48.q.out
index 1cf8d5c..7b0ce1c 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query48.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query48.q.out
@@ -131,16 +131,16 @@ POSTHOOK: type: QUERY
 Plan optimized by CBO.
 
 Vertex dependency in root stage
-Map 8 <- Reducer 10 (BROADCAST_EDGE), Reducer 12 (BROADCAST_EDGE), Reducer 14 (BROADCAST_EDGE), Reducer 7 (BROADCAST_EDGE)
+Map 1 <- Reducer 10 (BROADCAST_EDGE), Reducer 12 (BROADCAST_EDGE), Reducer 14 (BROADCAST_EDGE), Reducer 8 (BROADCAST_EDGE)
 Reducer 10 <- Map 9 (CUSTOM_SIMPLE_EDGE)
 Reducer 12 <- Map 11 (CUSTOM_SIMPLE_EDGE)
 Reducer 14 <- Map 13 (CUSTOM_SIMPLE_EDGE)
-Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 8 (SIMPLE_EDGE)
+Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 7 (SIMPLE_EDGE)
 Reducer 3 <- Map 9 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE)
 Reducer 4 <- Map 11 (SIMPLE_EDGE), Reducer 3 (SIMPLE_EDGE)
 Reducer 5 <- Map 13 (SIMPLE_EDGE), Reducer 4 (SIMPLE_EDGE)
 Reducer 6 <- Reducer 5 (CUSTOM_SIMPLE_EDGE)
-Reducer 7 <- Map 1 (CUSTOM_SIMPLE_EDGE)
+Reducer 8 <- Map 7 (CUSTOM_SIMPLE_EDGE)
 
 Stage-0
   Fetch Operator
@@ -153,115 +153,113 @@ Stage-0
         <-Reducer 5 [CUSTOM_SIMPLE_EDGE]
           PARTITION_ONLY_SHUFFLE [RS_30]
             Group By Operator [GBY_29] (rows=1 width=8)
-              Output:["_col0"],aggregations:["sum(_col5)"]
-              Select Operator [SEL_28] (rows=15616947 width=88)
-                Output:["_col5"]
-                Filter Operator [FIL_27] (rows=15616947 width=88)
-                  predicate:(((_col14) IN ('KY', 'GA', 'NM') and _col7 BETWEEN 0 AND 2000) or ((_col14) IN ('MT', 'OR', 'IN') and _col7 BETWEEN 150 AND 3000) or ((_col14) IN ('WI', 'MO', 'WV') and _col7 BETWEEN 50 AND 25000))
-                  Merge Join Operator [MERGEJOIN_96] (rows=93701693 width=88)
-                    Conds:RS_24._col3=RS_123._col0(Inner),Output:["_col5","_col7","_col14"]
-                  <-Map 13 [SIMPLE_EDGE] vectorized
-                    SHUFFLE [RS_123]
-                      PartitionCols:_col0
-                      Select Operator [SEL_122] (rows=10000000 width=1014)
-                        Output:["_col0","_col1"]
-                        Filter Operator [FIL_121] (rows=10000000 width=1014)
-                          predicate:((ca_country = 'United States') and (ca_state) IN ('KY', 'GA', 'NM', 'MT', 'OR', 'IN', 'WI', 'MO', 'WV') and ca_address_sk is not null)
-                          TableScan [TS_12] (rows=40000000 width=1014)
-                            default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_state","ca_country"]
-                  <-Reducer 4 [SIMPLE_EDGE]
-                    SHUFFLE [RS_24]
-                      PartitionCols:_col3
-                      Merge Join Operator [MERGEJOIN_95] (rows=85183356 width=88)
-                        Conds:RS_21._col2=RS_115._col0(Inner),Output:["_col3","_col5","_col7"]
-                      <-Map 11 [SIMPLE_EDGE] vectorized
-                        SHUFFLE [RS_115]
-                          PartitionCols:_col0
-                          Select Operator [SEL_114] (rows=465450 width=385)
-                            Output:["_col0"]
-                            Filter Operator [FIL_113] (rows=465450 width=385)
-                              predicate:((cd_education_status = '4 yr Degree') and (cd_marital_status = 'M') and cd_demo_sk is not null)
-                              TableScan [TS_9] (rows=1861800 width=385)
-                                default@customer_demographics,customer_demographics,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_marital_status","cd_education_status"]
-                      <-Reducer 3 [SIMPLE_EDGE]
-                        SHUFFLE [RS_21]
-                          PartitionCols:_col2
-                          Merge Join Operator [MERGEJOIN_94] (rows=77439413 width=88)
-                            Conds:RS_18._col1=RS_107._col0(Inner),Output:["_col2","_col3","_col5","_col7"]
-                          <-Map 9 [SIMPLE_EDGE] vectorized
-                            SHUFFLE [RS_107]
-                              PartitionCols:_col0
-                              Select Operator [SEL_106] (rows=36524 width=1119)
-                                Output:["_col0"]
-                                Filter Operator [FIL_105] (rows=36524 width=1119)
-                                  predicate:((d_year = 1998) and d_date_sk is not null)
-                                  TableScan [TS_6] (rows=73049 width=1119)
-                                    default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"]
-                          <-Reducer 2 [SIMPLE_EDGE]
-                            SHUFFLE [RS_18]
-                              PartitionCols:_col1
-                              Merge Join Operator [MERGEJOIN_93] (rows=70399465 width=88)
-                                Conds:RS_99._col0=RS_131._col3(Inner),Output:["_col1","_col2","_col3","_col5","_col7"]
-                              <-Map 1 [SIMPLE_EDGE] vectorized
-                                PARTITION_ONLY_SHUFFLE [RS_99]
-                                  PartitionCols:_col0
-                                  Select Operator [SEL_98] (rows=1704 width=1910)
-                                    Output:["_col0"]
-                                    Filter Operator [FIL_97] (rows=1704 width=1910)
-                                      predicate:s_store_sk is not null
-                                      TableScan [TS_0] (rows=1704 width=1910)
-                                        default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk"]
-                              <-Map 8 [SIMPLE_EDGE] vectorized
-                                SHUFFLE [RS_131]
-                                  PartitionCols:_col3
-                                  Select Operator [SEL_130] (rows=63999513 width=88)
-                                    Output:["_col0","_col1","_col2","_col3","_col4","_col6"]
-                                    Filter Operator [FIL_129] (rows=63999513 width=88)
-                                      predicate:((ss_addr_sk BETWEEN DynamicValue(RS_25_customer_address_ca_address_sk_min) AND DynamicValue(RS_25_customer_address_ca_address_sk_max) and in_bloom_filter(ss_addr_sk, DynamicValue(RS_25_customer_address_ca_address_sk_bloom_filter))) and (ss_cdemo_sk BETWEEN DynamicValue(RS_22_customer_demographics_cd_demo_sk_min) AND DynamicValue(RS_22_customer_demographics_cd_demo_sk_max) and in_bloom_filter(ss_cdemo_sk, DynamicValue(RS_22_customer_demographics_cd_demo_sk_bloom_filter))) and (ss_net_profit BETWEEN 0 AND 2000 or ss_net_profit BETWEEN 150 AND 3000 or ss_net_profit BETWEEN 50 AND 25000) and (ss_sales_price BETWEEN 100 AND 150 or ss_sales_price BETWEEN 50 AND 100 or ss_sales_price BETWEEN 150 AND 200) and (ss_sold_date_sk BETWEEN DynamicValue(RS_19_date_dim_d_date_sk_min) AND DynamicValue(RS_19_date_dim_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk, DynamicValue(RS_19_date_dim_d_date_sk_bloom_filter))) and (ss_store_sk BETWEEN Dynami
 cValue(RS_15_store_s_store_sk_min) AND DynamicValue(RS_15_store_s_store_sk_max) and in_bloom_filter(ss_store_sk, DynamicValue(RS_15_store_s_store_sk_bloom_filter))) and ss_addr_sk is not null and ss_cdemo_sk is not null and ss_sold_date_sk is not null and ss_store_sk is not null)
-                                      TableScan [TS_3] (rows=575995635 width=88)
-                                        default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_cdemo_sk","ss_addr_sk","ss_store_sk","ss_quantity","ss_sales_price","ss_net_profit"]
-                                      <-Reducer 10 [BROADCAST_EDGE] vectorized
-                                        BROADCAST [RS_112]
-                                          Group By Operator [GBY_111] (rows=1 width=12)
-                                            Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
-                                          <-Map 9 [CUSTOM_SIMPLE_EDGE] vectorized
-                                            SHUFFLE [RS_110]
-                                              Group By Operator [GBY_109] (rows=1 width=12)
-                                                Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
-                                                Select Operator [SEL_108] (rows=36524 width=1119)
-                                                  Output:["_col0"]
-                                                   Please refer to the previous Select Operator [SEL_106]
-                                      <-Reducer 12 [BROADCAST_EDGE] vectorized
-                                        BROADCAST [RS_120]
-                                          Group By Operator [GBY_119] (rows=1 width=12)
-                                            Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
-                                          <-Map 11 [CUSTOM_SIMPLE_EDGE] vectorized
-                                            SHUFFLE [RS_118]
-                                              Group By Operator [GBY_117] (rows=1 width=12)
-                                                Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
-                                                Select Operator [SEL_116] (rows=465450 width=385)
-                                                  Output:["_col0"]
-                                                   Please refer to the previous Select Operator [SEL_114]
-                                      <-Reducer 14 [BROADCAST_EDGE] vectorized
-                                        BROADCAST [RS_128]
-                                          Group By Operator [GBY_127] (rows=1 width=12)
-                                            Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=10000000)"]
-                                          <-Map 13 [CUSTOM_SIMPLE_EDGE] vectorized
-                                            SHUFFLE [RS_126]
-                                              Group By Operator [GBY_125] (rows=1 width=12)
-                                                Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=10000000)"]
-                                                Select Operator [SEL_124] (rows=10000000 width=1014)
-                                                  Output:["_col0"]
-                                                   Please refer to the previous Select Operator [SEL_122]
-                                      <-Reducer 7 [BROADCAST_EDGE] vectorized
-                                        BROADCAST [RS_104]
-                                          Group By Operator [GBY_103] (rows=1 width=12)
-                                            Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
-                                          <-Map 1 [CUSTOM_SIMPLE_EDGE] vectorized
-                                            PARTITION_ONLY_SHUFFLE [RS_102]
-                                              Group By Operator [GBY_101] (rows=1 width=12)
-                                                Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
-                                                Select Operator [SEL_100] (rows=1704 width=1910)
-                                                  Output:["_col0"]
-                                                   Please refer to the previous Select Operator [SEL_98]
+              Output:["_col0"],aggregations:["sum(_col4)"]
+              Merge Join Operator [MERGEJOIN_96] (rows=93701696 width=88)
+                Conds:RS_25._col3=RS_123._col0(Inner),Output:["_col4"]
+              <-Map 13 [SIMPLE_EDGE] vectorized
+                SHUFFLE [RS_123]
+                  PartitionCols:_col0
+                  Select Operator [SEL_122] (rows=1704 width=1910)
+                    Output:["_col0"]
+                    Filter Operator [FIL_121] (rows=1704 width=1910)
+                      predicate:s_store_sk is not null
+                      TableScan [TS_12] (rows=1704 width=1910)
+                        default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk"]
+              <-Reducer 4 [SIMPLE_EDGE]
+                SHUFFLE [RS_25]
+                  PartitionCols:_col3
+                  Filter Operator [FIL_24] (rows=85183359 width=88)
+                    predicate:((((_col13 = 'KY') or (_col13 = 'GA') or (_col13 = 'NM')) and _col6 BETWEEN 0 AND 2000) or (((_col13 = 'MT') or (_col13 = 'OR') or (_col13 = 'IN')) and _col6 BETWEEN 150 AND 3000) or (((_col13 = 'WI') or (_col13 = 'MO') or (_col13 = 'WV')) and _col6 BETWEEN 50 AND 25000))
+                    Merge Join Operator [MERGEJOIN_95] (rows=255550079 width=88)
+                      Conds:RS_21._col2=RS_115._col0(Inner),Output:["_col3","_col4","_col6","_col13"]
+                    <-Map 11 [SIMPLE_EDGE] vectorized
+                      SHUFFLE [RS_115]
+                        PartitionCols:_col0
+                        Select Operator [SEL_114] (rows=20000000 width=1014)
+                          Output:["_col0","_col1"]
+                          Filter Operator [FIL_113] (rows=20000000 width=1014)
+                            predicate:((ca_country = 'United States') and ca_address_sk is not null)
+                            TableScan [TS_9] (rows=40000000 width=1014)
+                              default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_state","ca_country"]
+                    <-Reducer 3 [SIMPLE_EDGE]
+                      SHUFFLE [RS_21]
+                        PartitionCols:_col2
+                        Merge Join Operator [MERGEJOIN_94] (rows=232318249 width=88)
+                          Conds:RS_18._col1=RS_107._col0(Inner),Output:["_col2","_col3","_col4","_col6"]
+                        <-Map 9 [SIMPLE_EDGE] vectorized
+                          SHUFFLE [RS_107]
+                            PartitionCols:_col0
+                            Select Operator [SEL_106] (rows=465450 width=385)
+                              Output:["_col0"]
+                              Filter Operator [FIL_105] (rows=465450 width=385)
+                                predicate:((cd_education_status = '4 yr Degree') and (cd_marital_status = 'M') and cd_demo_sk is not null)
+                                TableScan [TS_6] (rows=1861800 width=385)
+                                  default@customer_demographics,customer_demographics,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_marital_status","cd_education_status"]
+                        <-Reducer 2 [SIMPLE_EDGE]
+                          SHUFFLE [RS_18]
+                            PartitionCols:_col1
+                            Merge Join Operator [MERGEJOIN_93] (rows=211198404 width=88)
+                              Conds:RS_131._col0=RS_99._col0(Inner),Output:["_col1","_col2","_col3","_col4","_col6"]
+                            <-Map 7 [SIMPLE_EDGE] vectorized
+                              PARTITION_ONLY_SHUFFLE [RS_99]
+                                PartitionCols:_col0
+                                Select Operator [SEL_98] (rows=36524 width=1119)
+                                  Output:["_col0"]
+                                  Filter Operator [FIL_97] (rows=36524 width=1119)
+                                    predicate:((d_year = 1998) and d_date_sk is not null)
+                                    TableScan [TS_3] (rows=73049 width=1119)
+                                      default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"]
+                            <-Map 1 [SIMPLE_EDGE] vectorized
+                              SHUFFLE [RS_131]
+                                PartitionCols:_col0
+                                Select Operator [SEL_130] (rows=191998545 width=88)
+                                  Output:["_col0","_col1","_col2","_col3","_col4","_col6"]
+                                  Filter Operator [FIL_129] (rows=191998545 width=88)
+                                    predicate:((ss_addr_sk BETWEEN DynamicValue(RS_22_customer_address_ca_address_sk_min) AND DynamicValue(RS_22_customer_address_ca_address_sk_max) and in_bloom_filter(ss_addr_sk, DynamicValue(RS_22_customer_address_ca_address_sk_bloom_filter))) and (ss_cdemo_sk BETWEEN DynamicValue(RS_19_customer_demographics_cd_demo_sk_min) AND DynamicValue(RS_19_customer_demographics_cd_demo_sk_max) and in_bloom_filter(ss_cdemo_sk, DynamicValue(RS_19_customer_demographics_cd_demo_sk_bloom_filter))) and (ss_sales_price BETWEEN 100 AND 150 or ss_sales_price BETWEEN 50 AND 100 or ss_sales_price BETWEEN 150 AND 200) and (ss_sold_date_sk BETWEEN DynamicValue(RS_16_date_dim_d_date_sk_min) AND DynamicValue(RS_16_date_dim_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk, DynamicValue(RS_16_date_dim_d_date_sk_bloom_filter))) and (ss_store_sk BETWEEN DynamicValue(RS_26_store_s_store_sk_min) AND DynamicValue(RS_26_store_s_store_sk_max) and in_bloom_filter(ss_store_sk, Dyna
 micValue(RS_26_store_s_store_sk_bloom_filter))) and ss_addr_sk is not null and ss_cdemo_sk is not null and ss_sold_date_sk is not null and ss_store_sk is not null)
+                                    TableScan [TS_0] (rows=575995635 width=88)
+                                      default@store_sales,store_sales,Tbl:COMPLETE,Col:NONE,Output:["ss_sold_date_sk","ss_cdemo_sk","ss_addr_sk","ss_store_sk","ss_quantity","ss_sales_price","ss_net_profit"]
+                                    <-Reducer 10 [BROADCAST_EDGE] vectorized
+                                      BROADCAST [RS_112]
+                                        Group By Operator [GBY_111] (rows=1 width=12)
+                                          Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
+                                        <-Map 9 [CUSTOM_SIMPLE_EDGE] vectorized
+                                          SHUFFLE [RS_110]
+                                            Group By Operator [GBY_109] (rows=1 width=12)
+                                              Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
+                                              Select Operator [SEL_108] (rows=465450 width=385)
+                                                Output:["_col0"]
+                                                 Please refer to the previous Select Operator [SEL_106]
+                                    <-Reducer 12 [BROADCAST_EDGE] vectorized
+                                      BROADCAST [RS_120]
+                                        Group By Operator [GBY_119] (rows=1 width=12)
+                                          Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=20000000)"]
+                                        <-Map 11 [CUSTOM_SIMPLE_EDGE] vectorized
+                                          SHUFFLE [RS_118]
+                                            Group By Operator [GBY_117] (rows=1 width=12)
+                                              Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=20000000)"]
+                                              Select Operator [SEL_116] (rows=20000000 width=1014)
+                                                Output:["_col0"]
+                                                 Please refer to the previous Select Operator [SEL_114]
+                                    <-Reducer 14 [BROADCAST_EDGE] vectorized
+                                      BROADCAST [RS_128]
+                                        Group By Operator [GBY_127] (rows=1 width=12)
+                                          Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
+                                        <-Map 13 [CUSTOM_SIMPLE_EDGE] vectorized
+                                          SHUFFLE [RS_126]
+                                            Group By Operator [GBY_125] (rows=1 width=12)
+                                              Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
+                                              Select Operator [SEL_124] (rows=1704 width=1910)
+                                                Output:["_col0"]
+                                                 Please refer to the previous Select Operator [SEL_122]
+                                    <-Reducer 8 [BROADCAST_EDGE] vectorized
+                                      BROADCAST [RS_104]
+                                        Group By Operator [GBY_103] (rows=1 width=12)
+                                          Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"]
+                                        <-Map 7 [CUSTOM_SIMPLE_EDGE] vectorized
+                                          PARTITION_ONLY_SHUFFLE [RS_102]
+                                            Group By Operator [GBY_101] (rows=1 width=12)
+                                              Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
+                                              Select Operator [SEL_100] (rows=36524 width=1119)
+                                                Output:["_col0"]
+                                                 Please refer to the previous Select Operator [SEL_98]
 

http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query53.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query53.q.out b/ql/src/test/results/clientpositive/perf/tez/query53.q.out
index 3567534..267e28c 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query53.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query53.q.out
@@ -113,9 +113,9 @@ Stage-0
                                   <-Map 9 [SIMPLE_EDGE] vectorized
                                     SHUFFLE [RS_95]
                                       PartitionCols:_col0
-                                      Select Operator [SEL_94] (rows=36525 width=1119)
+                                      Select Operator [SEL_94] (rows=73049 width=1119)
                                         Output:["_col0","_col2"]
-                                        Filter Operator [FIL_93] (rows=36525 width=1119)
+                                        Filter Operator [FIL_93] (rows=73049 width=1119)
                                           predicate:((d_month_seq) IN (1212, 1213, 1214, 1215, 1216, 1217, 1218, 1219, 1220, 1221, 1222, 1223) and d_date_sk is not null)
                                           TableScan [TS_6] (rows=73049 width=1119)
                                             default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_month_seq","d_qoy"]
@@ -127,10 +127,10 @@ Stage-0
                                       <-Map 7 [SIMPLE_EDGE] vectorized
                                         PARTITION_ONLY_SHUFFLE [RS_87]
                                           PartitionCols:_col0
-                                          Select Operator [SEL_86] (rows=115500 width=1436)
+                                          Select Operator [SEL_86] (rows=462000 width=1436)
                                             Output:["_col0","_col4"]
-                                            Filter Operator [FIL_85] (rows=115500 width=1436)
-                                              predicate:((((i_category) IN ('Books', 'Children', 'Electronics') and (i_class) IN ('personal', 'portable', 'reference', 'self-help') and (i_brand) IN ('scholaramalgamalg #14', 'scholaramalgamalg #7', 'exportiunivamalg #9', 'scholaramalgamalg #9')) or ((i_category) IN ('Women', 'Music', 'Men') and (i_class) IN ('accessories', 'classical', 'fragrances', 'pants') and (i_brand) IN ('amalgimporto #1', 'edu packscholar #1', 'exportiimporto #1', 'importoamalg #1'))) and ((i_brand) IN ('scholaramalgamalg #14', 'scholaramalgamalg #7', 'exportiunivamalg #9', 'scholaramalgamalg #9') or (i_brand) IN ('amalgimporto #1', 'edu packscholar #1', 'exportiimporto #1', 'importoamalg #1')) and ((i_category) IN ('Books', 'Children', 'Electronics') or (i_category) IN ('Women', 'Music', 'Men')) and ((i_class) IN ('personal', 'portable', 'reference', 'self-help') or (i_class) IN ('accessories', 'classical', 'fragrances', 'pants')) and i_item_sk is not null)
+                                            Filter Operator [FIL_85] (rows=462000 width=1436)
+                                              predicate:((((i_category) IN ('Books', 'Children', 'Electronics') and (i_class) IN ('personal', 'portable', 'reference', 'self-help') and (i_brand) IN ('scholaramalgamalg #14', 'scholaramalgamalg #7', 'exportiunivamalg #9', 'scholaramalgamalg #9')) or ((i_category) IN ('Women', 'Music', 'Men') and (i_class) IN ('accessories', 'classical', 'fragrances', 'pants') and (i_brand) IN ('amalgimporto #1', 'edu packscholar #1', 'exportiimporto #1', 'importoamalg #1'))) and i_item_sk is not null)
                                               TableScan [TS_3] (rows=462000 width=1436)
                                                 default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_brand","i_class","i_category","i_manufact_id"]
                                       <-Map 1 [SIMPLE_EDGE] vectorized
@@ -150,7 +150,7 @@ Stage-0
                                                     SHUFFLE [RS_98]
                                                       Group By Operator [GBY_97] (rows=1 width=12)
                                                         Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
-                                                        Select Operator [SEL_96] (rows=36525 width=1119)
+                                                        Select Operator [SEL_96] (rows=73049 width=1119)
                                                           Output:["_col0"]
                                                            Please refer to the previous Select Operator [SEL_94]
                                               <-Reducer 12 [BROADCAST_EDGE] vectorized
@@ -172,7 +172,7 @@ Stage-0
                                                     PARTITION_ONLY_SHUFFLE [RS_90]
                                                       Group By Operator [GBY_89] (rows=1 width=12)
                                                         Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
-                                                        Select Operator [SEL_88] (rows=115500 width=1436)
+                                                        Select Operator [SEL_88] (rows=462000 width=1436)
                                                           Output:["_col0"]
                                                            Please refer to the previous Select Operator [SEL_86]
 

http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query56.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query56.q.out b/ql/src/test/results/clientpositive/perf/tez/query56.q.out
index 0d8ac48..40f39b5 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query56.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query56.q.out
@@ -210,16 +210,16 @@ Stage-0
                                 <-Reducer 16 [ONE_TO_ONE_EDGE] vectorized
                                   FORWARD [RS_325]
                                     PartitionCols:_col0
-                                    Group By Operator [GBY_324] (rows=115500 width=1436)
+                                    Group By Operator [GBY_324] (rows=231000 width=1436)
                                       Output:["_col0"],keys:KEY._col0
                                     <-Map 15 [SIMPLE_EDGE] vectorized
                                       SHUFFLE [RS_323]
                                         PartitionCols:_col0
-                                        Group By Operator [GBY_322] (rows=231000 width=1436)
+                                        Group By Operator [GBY_322] (rows=462000 width=1436)
                                           Output:["_col0"],keys:i_item_id
-                                          Select Operator [SEL_321] (rows=231000 width=1436)
+                                          Select Operator [SEL_321] (rows=462000 width=1436)
                                             Output:["i_item_id"]
-                                            Filter Operator [FIL_320] (rows=231000 width=1436)
+                                            Filter Operator [FIL_320] (rows=462000 width=1436)
                                               predicate:((i_color) IN ('orchid', 'chiffon', 'lace') and i_item_id is not null)
                                               TableScan [TS_3] (rows=462000 width=1436)
                                                 default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_id","i_color"]

http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query63.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query63.q.out b/ql/src/test/results/clientpositive/perf/tez/query63.q.out
index a5b7b5a..c9502f0 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query63.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query63.q.out
@@ -115,9 +115,9 @@ Stage-0
                                   <-Map 9 [SIMPLE_EDGE] vectorized
                                     SHUFFLE [RS_95]
                                       PartitionCols:_col0
-                                      Select Operator [SEL_94] (rows=36525 width=1119)
+                                      Select Operator [SEL_94] (rows=73049 width=1119)
                                         Output:["_col0","_col2"]
-                                        Filter Operator [FIL_93] (rows=36525 width=1119)
+                                        Filter Operator [FIL_93] (rows=73049 width=1119)
                                           predicate:((d_month_seq) IN (1212, 1213, 1214, 1215, 1216, 1217, 1218, 1219, 1220, 1221, 1222, 1223) and d_date_sk is not null)
                                           TableScan [TS_6] (rows=73049 width=1119)
                                             default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_month_seq","d_moy"]
@@ -129,10 +129,10 @@ Stage-0
                                       <-Map 7 [SIMPLE_EDGE] vectorized
                                         PARTITION_ONLY_SHUFFLE [RS_87]
                                           PartitionCols:_col0
-                                          Select Operator [SEL_86] (rows=115500 width=1436)
+                                          Select Operator [SEL_86] (rows=462000 width=1436)
                                             Output:["_col0","_col4"]
-                                            Filter Operator [FIL_85] (rows=115500 width=1436)
-                                              predicate:((((i_category) IN ('Books', 'Children', 'Electronics') and (i_class) IN ('personal', 'portable', 'refernece', 'self-help') and (i_brand) IN ('scholaramalgamalg #14', 'scholaramalgamalg #7', 'exportiunivamalg #9', 'scholaramalgamalg #9')) or ((i_category) IN ('Women', 'Music', 'Men') and (i_class) IN ('accessories', 'classical', 'fragrances', 'pants') and (i_brand) IN ('amalgimporto #1', 'edu packscholar #1', 'exportiimporto #1', 'importoamalg #1'))) and ((i_brand) IN ('scholaramalgamalg #14', 'scholaramalgamalg #7', 'exportiunivamalg #9', 'scholaramalgamalg #9') or (i_brand) IN ('amalgimporto #1', 'edu packscholar #1', 'exportiimporto #1', 'importoamalg #1')) and ((i_category) IN ('Books', 'Children', 'Electronics') or (i_category) IN ('Women', 'Music', 'Men')) and ((i_class) IN ('personal', 'portable', 'refernece', 'self-help') or (i_class) IN ('accessories', 'classical', 'fragrances', 'pants')) and i_item_sk is not null)
+                                            Filter Operator [FIL_85] (rows=462000 width=1436)
+                                              predicate:((((i_category) IN ('Books', 'Children', 'Electronics') and (i_class) IN ('personal', 'portable', 'refernece', 'self-help') and (i_brand) IN ('scholaramalgamalg #14', 'scholaramalgamalg #7', 'exportiunivamalg #9', 'scholaramalgamalg #9')) or ((i_category) IN ('Women', 'Music', 'Men') and (i_class) IN ('accessories', 'classical', 'fragrances', 'pants') and (i_brand) IN ('amalgimporto #1', 'edu packscholar #1', 'exportiimporto #1', 'importoamalg #1'))) and i_item_sk is not null)
                                               TableScan [TS_3] (rows=462000 width=1436)
                                                 default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_brand","i_class","i_category","i_manager_id"]
                                       <-Map 1 [SIMPLE_EDGE] vectorized
@@ -152,7 +152,7 @@ Stage-0
                                                     SHUFFLE [RS_98]
                                                       Group By Operator [GBY_97] (rows=1 width=12)
                                                         Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
-                                                        Select Operator [SEL_96] (rows=36525 width=1119)
+                                                        Select Operator [SEL_96] (rows=73049 width=1119)
                                                           Output:["_col0"]
                                                            Please refer to the previous Select Operator [SEL_94]
                                               <-Reducer 12 [BROADCAST_EDGE] vectorized
@@ -174,7 +174,7 @@ Stage-0
                                                     PARTITION_ONLY_SHUFFLE [RS_90]
                                                       Group By Operator [GBY_89] (rows=1 width=12)
                                                         Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
-                                                        Select Operator [SEL_88] (rows=115500 width=1436)
+                                                        Select Operator [SEL_88] (rows=462000 width=1436)
                                                           Output:["_col0"]
                                                            Please refer to the previous Select Operator [SEL_86]
 

http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query64.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query64.q.out b/ql/src/test/results/clientpositive/perf/tez/query64.q.out
index 6d3edd3..e3eea58 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query64.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query64.q.out
@@ -519,11 +519,11 @@ Stage-0
                                                                                     PARTITION_ONLY_SHUFFLE [RS_1144]
                                                                                       Group By Operator [GBY_1142] (rows=1 width=12)
                                                                                         Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
-                                                                                        Select Operator [SEL_1140] (rows=2851 width=1436)
+                                                                                        Select Operator [SEL_1140] (rows=5703 width=1436)
                                                                                           Output:["_col0"]
-                                                                                          Select Operator [SEL_1136] (rows=2851 width=1436)
+                                                                                          Select Operator [SEL_1136] (rows=5703 width=1436)
                                                                                             Output:["_col0","_col3"]
-                                                                                            Filter Operator [FIL_1135] (rows=2851 width=1436)
+                                                                                            Filter Operator [FIL_1135] (rows=5703 width=1436)
                                                                                               predicate:((i_color) IN ('maroon', 'burnished', 'dim', 'steel', 'navajo', 'chocolate') and i_current_price BETWEEN 35 AND 45 and i_current_price BETWEEN 36 AND 50 and i_item_sk is not null)
                                                                                               TableScan [TS_34] (rows=462000 width=1436)
                                                                                                 default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_current_price","i_color","i_product_name"]
@@ -624,7 +624,7 @@ Stage-0
                                                                                       PARTITION_ONLY_SHUFFLE [RS_1143]
                                                                                         Group By Operator [GBY_1141] (rows=1 width=12)
                                                                                           Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
-                                                                                          Select Operator [SEL_1138] (rows=2851 width=1436)
+                                                                                          Select Operator [SEL_1138] (rows=5703 width=1436)
                                                                                             Output:["_col0"]
                                                                                              Please refer to the previous Select Operator [SEL_1136]
                                                                                 <-Reducer 45 [BROADCAST_EDGE] vectorized

http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query68.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query68.q.out b/ql/src/test/results/clientpositive/perf/tez/query68.q.out
index 24b2502..fd1e04b 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query68.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query68.q.out
@@ -179,9 +179,9 @@ Stage-0
                                       <-Map 16 [SIMPLE_EDGE] vectorized
                                         PARTITION_ONLY_SHUFFLE [RS_166]
                                           PartitionCols:_col0
-                                          Select Operator [SEL_165] (rows=852 width=1910)
+                                          Select Operator [SEL_165] (rows=1704 width=1910)
                                             Output:["_col0"]
-                                            Filter Operator [FIL_164] (rows=852 width=1910)
+                                            Filter Operator [FIL_164] (rows=1704 width=1910)
                                               predicate:((s_city) IN ('Cedar Grove', 'Wildwood') and s_store_sk is not null)
                                               TableScan [TS_12] (rows=1704 width=1910)
                                                 default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_city"]
@@ -193,9 +193,9 @@ Stage-0
                                           <-Map 14 [SIMPLE_EDGE] vectorized
                                             PARTITION_ONLY_SHUFFLE [RS_158]
                                               PartitionCols:_col0
-                                              Select Operator [SEL_157] (rows=4058 width=1119)
+                                              Select Operator [SEL_157] (rows=8116 width=1119)
                                                 Output:["_col0"]
-                                                Filter Operator [FIL_156] (rows=4058 width=1119)
+                                                Filter Operator [FIL_156] (rows=8116 width=1119)
                                                   predicate:((d_year) IN (1998, 1999, 2000) and d_date_sk is not null and d_dom BETWEEN 1 AND 2)
                                                   TableScan [TS_9] (rows=73049 width=1119)
                                                     default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_dom"]
@@ -216,7 +216,7 @@ Stage-0
                                                         PARTITION_ONLY_SHUFFLE [RS_161]
                                                           Group By Operator [GBY_160] (rows=1 width=12)
                                                             Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
-                                                            Select Operator [SEL_159] (rows=4058 width=1119)
+                                                            Select Operator [SEL_159] (rows=8116 width=1119)
                                                               Output:["_col0"]
                                                                Please refer to the previous Select Operator [SEL_157]
                                                   <-Reducer 17 [BROADCAST_EDGE] vectorized
@@ -227,7 +227,7 @@ Stage-0
                                                         PARTITION_ONLY_SHUFFLE [RS_169]
                                                           Group By Operator [GBY_168] (rows=1 width=12)
                                                             Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
-                                                            Select Operator [SEL_167] (rows=852 width=1910)
+                                                            Select Operator [SEL_167] (rows=1704 width=1910)
                                                               Output:["_col0"]
                                                                Please refer to the previous Select Operator [SEL_165]
                                                   <-Reducer 19 [BROADCAST_EDGE] vectorized

http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query69.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query69.q.out b/ql/src/test/results/clientpositive/perf/tez/query69.q.out
index 738508a..4aad667 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query69.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query69.q.out
@@ -224,9 +224,9 @@ Stage-0
                                             <-Map 9 [SIMPLE_EDGE] vectorized
                                               SHUFFLE [RS_187]
                                                 PartitionCols:_col0
-                                                Select Operator [SEL_186] (rows=20000000 width=1014)
+                                                Select Operator [SEL_186] (rows=40000000 width=1014)
                                                   Output:["_col0"]
-                                                  Filter Operator [FIL_185] (rows=20000000 width=1014)
+                                                  Filter Operator [FIL_185] (rows=40000000 width=1014)
                                                     predicate:((ca_state) IN ('CO', 'IL', 'MN') and ca_address_sk is not null)
                                                     TableScan [TS_3] (rows=40000000 width=1014)
                                                       default@customer_address,ca,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_state"]

http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query71.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query71.q.out b/ql/src/test/results/clientpositive/perf/tez/query71.q.out
index 4521aab..ca62fa3 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query71.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query71.q.out
@@ -120,7 +120,7 @@ Stage-0
                         Select Operator [SEL_172] (rows=86400 width=471)
                           Output:["_col0","_col1","_col2"]
                           Filter Operator [FIL_171] (rows=86400 width=471)
-                            predicate:(((t_meal_time = 'breakfast') or (t_meal_time = 'dinner')) and t_time_sk is not null)
+                            predicate:((t_meal_time) IN ('breakfast', 'dinner') and t_time_sk is not null)
                             TableScan [TS_35] (rows=86400 width=471)
                               default@time_dim,time_dim,Tbl:COMPLETE,Col:NONE,Output:["t_time_sk","t_hour","t_minute","t_meal_time"]
                     <-Reducer 4 [SIMPLE_EDGE]

http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query73.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query73.q.out b/ql/src/test/results/clientpositive/perf/tez/query73.q.out
index cfa5213..153b8b4 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query73.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query73.q.out
@@ -109,9 +109,9 @@ Stage-0
                             <-Map 14 [SIMPLE_EDGE] vectorized
                               SHUFFLE [RS_119]
                                 PartitionCols:_col0
-                                Select Operator [SEL_118] (rows=852 width=1910)
+                                Select Operator [SEL_118] (rows=1704 width=1910)
                                   Output:["_col0"]
-                                  Filter Operator [FIL_117] (rows=852 width=1910)
+                                  Filter Operator [FIL_117] (rows=1704 width=1910)
                                     predicate:((s_county) IN ('Mobile County', 'Maverick County', 'Huron County', 'Kittitas County') and s_store_sk is not null)
                                     TableScan [TS_12] (rows=1704 width=1910)
                                       default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_county"]
@@ -126,7 +126,7 @@ Stage-0
                                     Select Operator [SEL_11] (rows=1200 width=107)
                                       Output:["_col0"]
                                       Filter Operator [FIL_55] (rows=1200 width=107)
-                                        predicate:(((hd_buy_potential = '>10000') or (hd_buy_potential = 'unknown')) and (hd_vehicle_count > 0) and CASE WHEN ((hd_vehicle_count > 0)) THEN (((UDFToDouble(hd_dep_count) / UDFToDouble(hd_vehicle_count)) > 1.0D)) ELSE (null) END and hd_demo_sk is not null)
+                                        predicate:((hd_buy_potential) IN ('>10000', 'unknown') and (hd_vehicle_count > 0) and CASE WHEN ((hd_vehicle_count > 0)) THEN (((UDFToDouble(hd_dep_count) / UDFToDouble(hd_vehicle_count)) > 1.0D)) ELSE (null) END and hd_demo_sk is not null)
                                         TableScan [TS_9] (rows=7200 width=107)
                                           default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_buy_potential","hd_dep_count","hd_vehicle_count"]
                                 <-Reducer 6 [SIMPLE_EDGE]
@@ -137,9 +137,9 @@ Stage-0
                                     <-Map 10 [SIMPLE_EDGE] vectorized
                                       SHUFFLE [RS_109]
                                         PartitionCols:_col0
-                                        Select Operator [SEL_108] (rows=4058 width=1119)
+                                        Select Operator [SEL_108] (rows=8116 width=1119)
                                           Output:["_col0"]
-                                          Filter Operator [FIL_107] (rows=4058 width=1119)
+                                          Filter Operator [FIL_107] (rows=8116 width=1119)
                                             predicate:((d_year) IN (2000, 2001, 2002) and d_date_sk is not null and d_dom BETWEEN 1 AND 2)
                                             TableScan [TS_6] (rows=73049 width=1119)
                                               default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_dom"]
@@ -160,7 +160,7 @@ Stage-0
                                                   SHUFFLE [RS_112]
                                                     Group By Operator [GBY_111] (rows=1 width=12)
                                                       Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
-                                                      Select Operator [SEL_110] (rows=4058 width=1119)
+                                                      Select Operator [SEL_110] (rows=8116 width=1119)
                                                         Output:["_col0"]
                                                          Please refer to the previous Select Operator [SEL_108]
                                             <-Reducer 13 [BROADCAST_EDGE] vectorized
@@ -182,7 +182,7 @@ Stage-0
                                                   SHUFFLE [RS_122]
                                                     Group By Operator [GBY_121] (rows=1 width=12)
                                                       Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
-                                                      Select Operator [SEL_120] (rows=852 width=1910)
+                                                      Select Operator [SEL_120] (rows=1704 width=1910)
                                                         Output:["_col0"]
                                                          Please refer to the previous Select Operator [SEL_118]
                                             <-Reducer 4 [BROADCAST_EDGE] vectorized

http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query74.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query74.q.out b/ql/src/test/results/clientpositive/perf/tez/query74.q.out
index 854e6dc..82f6655 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query74.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query74.q.out
@@ -199,9 +199,9 @@ Stage-0
                                       <-Map 19 [SIMPLE_EDGE] vectorized
                                         SHUFFLE [RS_290]
                                           PartitionCols:_col0
-                                          Select Operator [SEL_284] (rows=18262 width=1119)
+                                          Select Operator [SEL_284] (rows=36524 width=1119)
                                             Output:["_col0","_col1"]
-                                            Filter Operator [FIL_281] (rows=18262 width=1119)
+                                            Filter Operator [FIL_281] (rows=36524 width=1119)
                                               predicate:((d_year = 2001) and (d_year) IN (2001, 2002) and d_date_sk is not null)
                                               TableScan [TS_65] (rows=73049 width=1119)
                                                 default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"]
@@ -222,7 +222,7 @@ Stage-0
                                                     SHUFFLE [RS_300]
                                                       Group By Operator [GBY_296] (rows=1 width=12)
                                                         Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
-                                                        Select Operator [SEL_291] (rows=18262 width=1119)
+                                                        Select Operator [SEL_291] (rows=36524 width=1119)
                                                           Output:["_col0"]
                                                            Please refer to the previous Select Operator [SEL_284]
                                               <-Reducer 26 [BROADCAST_EDGE] vectorized
@@ -266,9 +266,9 @@ Stage-0
                                       <-Map 19 [SIMPLE_EDGE] vectorized
                                         SHUFFLE [RS_292]
                                           PartitionCols:_col0
-                                          Select Operator [SEL_285] (rows=18262 width=1119)
+                                          Select Operator [SEL_285] (rows=36524 width=1119)
                                             Output:["_col0","_col1"]
-                                            Filter Operator [FIL_282] (rows=18262 width=1119)
+                                            Filter Operator [FIL_282] (rows=36524 width=1119)
                                               predicate:((d_year = 2001) and (d_year) IN (2001, 2002) and d_date_sk is not null)
                                                Please refer to the previous TableScan [TS_65]
                                       <-Map 11 [SIMPLE_EDGE] vectorized
@@ -288,7 +288,7 @@ Stage-0
                                                     SHUFFLE [RS_301]
                                                       Group By Operator [GBY_297] (rows=1 width=12)
                                                         Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
-                                                        Select Operator [SEL_293] (rows=18262 width=1119)
+                                                        Select Operator [SEL_293] (rows=36524 width=1119)
                                                           Output:["_col0"]
                                                            Please refer to the previous Select Operator [SEL_285]
                   <-Reducer 18 [SIMPLE_EDGE] vectorized
@@ -317,9 +317,9 @@ Stage-0
                                   <-Map 19 [SIMPLE_EDGE] vectorized
                                     SHUFFLE [RS_286]
                                       PartitionCols:_col0
-                                      Select Operator [SEL_283] (rows=18262 width=1119)
+                                      Select Operator [SEL_283] (rows=36524 width=1119)
                                         Output:["_col0","_col1"]
-                                        Filter Operator [FIL_280] (rows=18262 width=1119)
+                                        Filter Operator [FIL_280] (rows=36524 width=1119)
                                           predicate:((d_year = 2002) and (d_year) IN (2001, 2002) and d_date_sk is not null)
                                            Please refer to the previous TableScan [TS_65]
                                   <-Map 15 [SIMPLE_EDGE] vectorized
@@ -339,7 +339,7 @@ Stage-0
                                                 SHUFFLE [RS_298]
                                                   Group By Operator [GBY_294] (rows=1 width=12)
                                                     Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
-                                                    Select Operator [SEL_287] (rows=18262 width=1119)
+                                                    Select Operator [SEL_287] (rows=36524 width=1119)
                                                       Output:["_col0"]
                                                        Please refer to the previous Select Operator [SEL_283]
                                           <-Reducer 25 [BROADCAST_EDGE] vectorized
@@ -397,7 +397,7 @@ Stage-0
                                                 SHUFFLE [RS_299]
                                                   Group By Operator [GBY_295] (rows=1 width=12)
                                                     Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
-                                                    Select Operator [SEL_289] (rows=18262 width=1119)
+                                                    Select Operator [SEL_289] (rows=36524 width=1119)
                                                       Output:["_col0"]
                                                        Please refer to the previous Select Operator [SEL_283]
 

http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query79.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query79.q.out b/ql/src/test/results/clientpositive/perf/tez/query79.q.out
index 105a739..7b9d48f 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query79.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query79.q.out
@@ -127,9 +127,9 @@ Stage-0
                                     <-Map 10 [SIMPLE_EDGE] vectorized
                                       SHUFFLE [RS_109]
                                         PartitionCols:_col0
-                                        Select Operator [SEL_108] (rows=18262 width=1119)
+                                        Select Operator [SEL_108] (rows=36524 width=1119)
                                           Output:["_col0"]
-                                          Filter Operator [FIL_107] (rows=18262 width=1119)
+                                          Filter Operator [FIL_107] (rows=36524 width=1119)
                                             predicate:((d_dow = 1) and (d_year) IN (1998, 1999, 2000) and d_date_sk is not null)
                                             TableScan [TS_6] (rows=73049 width=1119)
                                               default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_dow"]
@@ -150,7 +150,7 @@ Stage-0
                                                   SHUFFLE [RS_112]
                                                     Group By Operator [GBY_111] (rows=1 width=12)
                                                       Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
-                                                      Select Operator [SEL_110] (rows=18262 width=1119)
+                                                      Select Operator [SEL_110] (rows=36524 width=1119)
                                                         Output:["_col0"]
                                                          Please refer to the previous Select Operator [SEL_108]
                                             <-Reducer 13 [BROADCAST_EDGE] vectorized

http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query82.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query82.q.out b/ql/src/test/results/clientpositive/perf/tez/query82.q.out
index bb5a9e9..de5a681 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query82.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query82.q.out
@@ -67,9 +67,9 @@ Stage-0
                       <-Map 5 [SIMPLE_EDGE] vectorized
                         PARTITION_ONLY_SHUFFLE [RS_76]
                           PartitionCols:_col0
-                          Select Operator [SEL_75] (rows=25666 width=1436)
+                          Select Operator [SEL_75] (rows=51333 width=1436)
                             Output:["_col0","_col1","_col2","_col3"]
-                            Filter Operator [FIL_74] (rows=25666 width=1436)
+                            Filter Operator [FIL_74] (rows=51333 width=1436)
                               predicate:((i_manufact_id) IN (437, 129, 727, 663) and i_current_price BETWEEN 30 AND 60 and i_item_sk is not null)
                               TableScan [TS_3] (rows=462000 width=1436)
                                 default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id","i_item_desc","i_current_price","i_manufact_id"]
@@ -113,7 +113,7 @@ Stage-0
                                     PARTITION_ONLY_SHUFFLE [RS_79]
                                       Group By Operator [GBY_78] (rows=1 width=12)
                                         Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"]
-                                        Select Operator [SEL_77] (rows=25666 width=1436)
+                                        Select Operator [SEL_77] (rows=51333 width=1436)
                                           Output:["_col0"]
                                            Please refer to the previous Select Operator [SEL_75]
                               <-Reducer 9 [BROADCAST_EDGE] vectorized

http://git-wip-us.apache.org/repos/asf/hive/blob/20c95c1c/ql/src/test/results/clientpositive/perf/tez/query83.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/perf/tez/query83.q.out b/ql/src/test/results/clientpositive/perf/tez/query83.q.out
index f766e8d..c33b37c 100644
--- a/ql/src/test/results/clientpositive/perf/tez/query83.q.out
+++ b/ql/src/test/results/clientpositive/perf/tez/query83.q.out
@@ -214,11 +214,11 @@ Stage-0
                                         <-Map 19 [SIMPLE_EDGE] vectorized
                                           SHUFFLE [RS_378]
                                             PartitionCols:_col0
-                                            Group By Operator [GBY_377] (rows=36525 width=1119)
+                                            Group By Operator [GBY_377] (rows=73049 width=1119)
                                               Output:["_col0"],keys:_col0
-                                              Select Operator [SEL_376] (rows=36525 width=1119)
+                                              Select Operator [SEL_376] (rows=73049 width=1119)
                                                 Output:["_col0"]
-                                                Filter Operator [FIL_375] (rows=36525 width=1119)
+                                                Filter Operator [FIL_375] (rows=73049 width=1119)
                                                   predicate:((d_date) IN ('1998-01-02', '1998-10-15', '1998-11-10') and d_week_seq is not null)
                                                   TableScan [TS_12] (rows=73049 width=1119)
                                                     default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date","d_week_seq"]