You are viewing a plain text version of this content. The canonical link for it is here.
Posted to issues@drill.apache.org by "Rahul Challapalli (JIRA)" <ji...@apache.org> on 2016/11/11 19:29:58 UTC

[jira] [Updated] (DRILL-5037) NPE in Parquet Decimal Converter with the complex parquet reader

     [ https://issues.apache.org/jira/browse/DRILL-5037?page=com.atlassian.jira.plugin.system.issuetabpanels:all-tabpanel ]

Rahul Challapalli updated DRILL-5037:
-------------------------------------
    Description: 
git.commit.id.abbrev=4b1902c

The query below fails with an NPE in the Parquet decimal converter when the new Parquet reader is enabled (`store.parquet.use_new_reader` = true).

Query :
{code}
alter session set `store.parquet.use_new_reader` = true;
 select
                 count(*)			as count_star,
 		sum(a.d18)		as sum_d18,
 		--round(avg(a.d18))	as round_avg_d18,
 		cast(avg(a.d18) as bigint)	as round_avg_d18,
 		--trunc(avg(a.d18))	as trunc_avg_d18,
 		cast(avg(a.d18) as bigint)	as trunc_avg_d18,
 		--sum(case when a.d18 = 0 then 100 else round(a.d18/12) end) as case_in_sum_d18,
 		cast(sum(case when a.d18 = 0 then 100 else round(a.d18/12) end) as bigint) as case_in_sum_d18,
 		--coalesce(sum(case when a.d18 = 0 then 100 else round(a.d18/12) end), 0) as case_in_sum_d18
 		cast(coalesce(sum(case when a.d18 = 0 then 100 else round(a.d18/12) end), 0) as bigint) as case_in_sum_d18
 
from
 		alltypes_with_nulls a
		left outer join alltypes_with_nulls b on (a.c_integer = b.c_integer)
		left outer join alltypes_with_nulls c on (b.c_integer = c.c_integer)
group by
  		a.c_varchar
 		,b.c_varchar
 		,c.c_varchar
 		,a.c_integer
 		,b.c_integer
 		,c.c_integer
 		,a.d9
 		,b.d9
 		,c.d9
 		,a.d18
 		,b.d18
 		,c.d18
 		,a.d28
 		,b.d28
 		,c.d28
 		,a.d38
 		,b.d38
 		,c.d38
 		,a.c_date
 		,b.c_date
 		,c.c_date
 		,a.c_date
 		,b.c_date
 		,c.c_date
 		,a.c_time

 order by
  		a.c_varchar
 		,b.c_varchar
 		,c.c_varchar
 		,a.c_integer
 		,b.c_integer
 		,c.c_integer
 		,a.d9
 		,b.d9
 		,c.d9
 		,a.d18
 		,b.d18
 		,c.d18
 		,a.d28
 		,b.d28
 		,c.d28
 		,a.d38
 		,b.d38
 		,c.d38
 		,a.c_date
 		,b.c_date
 		,c.c_date
 		,a.c_date
 		,b.c_date
 		,c.c_date
 		,a.c_time
{code}

I attached the data set and error from the log file

  was:
git.commit.id.abbrev=4b1902c

In one of our regression runs, I observed that the query below failed. I have not been able to reproduce the issue since.

Query :
{code}
select

				
		count(*)			as count_star,
 		sum(a.d18)		as sum_d18,
 		--round(avg(a.d18))	as round_avg_d18,
 		cast(avg(a.d18) as bigint)	as round_avg_d18,
 		--trunc(avg(a.d18))	as trunc_avg_d18,
 		cast(avg(a.d18) as bigint)	as trunc_avg_d18,
 		--sum(case when a.d18 = 0 then 100 else round(a.d18/12) end) as case_in_sum_d18,
 		cast(sum(case when a.d18 = 0 then 100 else round(a.d18/12) end) as bigint) as case_in_sum_d18,
 		--coalesce(sum(case when a.d18 = 0 then 100 else round(a.d18/12) end), 0) as case_in_sum_d18
 		cast(coalesce(sum(case when a.d18 = 0 then 100 else round(a.d18/12) end), 0) as bigint) as case_in_sum_d18
 
from
 		alltypes_with_nulls a
		left outer join alltypes_with_nulls b on (a.c_integer = b.c_integer)
		left outer join alltypes_with_nulls c on (b.c_integer = c.c_integer)
group by
  		a.c_varchar
 		,b.c_varchar
 		,c.c_varchar
 		,a.c_integer
 		,b.c_integer
 		,c.c_integer
 		,a.d9
 		,b.d9
 		,c.d9
 		,a.d18
 		,b.d18
 		,c.d18
 		,a.d28
 		,b.d28
 		,c.d28
 		,a.d38
 		,b.d38
 		,c.d38
 		,a.c_date
 		,b.c_date
 		,c.c_date
 		,a.c_date
 		,b.c_date
 		,c.c_date
 		,a.c_time

 order by
  		a.c_varchar
 		,b.c_varchar
 		,c.c_varchar
 		,a.c_integer
 		,b.c_integer
 		,c.c_integer
 		,a.d9
 		,b.d9
 		,c.d9
 		,a.d18
 		,b.d18
 		,c.d18
 		,a.d28
 		,b.d28
 		,c.d28
 		,a.d38
 		,b.d38
 		,c.d38
 		,a.c_date
 		,b.c_date
 		,c.c_date
 		,a.c_date
 		,b.c_date
 		,c.c_date
 		,a.c_time
{code}

I attached the data set and error from the log file

        Summary:  NPE in Parquet Decimal Converter with the complex parquet reader  (was:  NPE in Parquet Decimal Converter)

>  NPE in Parquet Decimal Converter with the complex parquet reader
> -----------------------------------------------------------------
>
>                 Key: DRILL-5037
>                 URL: https://issues.apache.org/jira/browse/DRILL-5037
>             Project: Apache Drill
>          Issue Type: Bug
>          Components: Storage - Parquet
>    Affects Versions: 1.9.0
>            Reporter: Rahul Challapalli
>         Attachments: drill5037.parquet
>
>
> git.commit.id.abbrev=4b1902c
> The query below fails with an NPE in the Parquet decimal converter when the new Parquet reader is enabled (`store.parquet.use_new_reader` = true).
> Query :
> {code}
> alter session set `store.parquet.use_new_reader` = true;
>  select
>                  count(*)			as count_star,
>  		sum(a.d18)		as sum_d18,
>  		--round(avg(a.d18))	as round_avg_d18,
>  		cast(avg(a.d18) as bigint)	as round_avg_d18,
>  		--trunc(avg(a.d18))	as trunc_avg_d18,
>  		cast(avg(a.d18) as bigint)	as trunc_avg_d18,
>  		--sum(case when a.d18 = 0 then 100 else round(a.d18/12) end) as case_in_sum_d18,
>  		cast(sum(case when a.d18 = 0 then 100 else round(a.d18/12) end) as bigint) as case_in_sum_d18,
>  		--coalesce(sum(case when a.d18 = 0 then 100 else round(a.d18/12) end), 0) as case_in_sum_d18
>  		cast(coalesce(sum(case when a.d18 = 0 then 100 else round(a.d18/12) end), 0) as bigint) as case_in_sum_d18
>  
> from
>  		alltypes_with_nulls a
> 		left outer join alltypes_with_nulls b on (a.c_integer = b.c_integer)
> 		left outer join alltypes_with_nulls c on (b.c_integer = c.c_integer)
> group by
>   		a.c_varchar
>  		,b.c_varchar
>  		,c.c_varchar
>  		,a.c_integer
>  		,b.c_integer
>  		,c.c_integer
>  		,a.d9
>  		,b.d9
>  		,c.d9
>  		,a.d18
>  		,b.d18
>  		,c.d18
>  		,a.d28
>  		,b.d28
>  		,c.d28
>  		,a.d38
>  		,b.d38
>  		,c.d38
>  		,a.c_date
>  		,b.c_date
>  		,c.c_date
>  		,a.c_date
>  		,b.c_date
>  		,c.c_date
>  		,a.c_time
>  order by
>   		a.c_varchar
>  		,b.c_varchar
>  		,c.c_varchar
>  		,a.c_integer
>  		,b.c_integer
>  		,c.c_integer
>  		,a.d9
>  		,b.d9
>  		,c.d9
>  		,a.d18
>  		,b.d18
>  		,c.d18
>  		,a.d28
>  		,b.d28
>  		,c.d28
>  		,a.d38
>  		,b.d38
>  		,c.d38
>  		,a.c_date
>  		,b.c_date
>  		,c.c_date
>  		,a.c_date
>  		,b.c_date
>  		,c.c_date
>  		,a.c_time
> {code}
> I attached the data set and error from the log file



--
This message was sent by Atlassian JIRA
(v6.3.4#6332)