You are viewing a plain text version of this content. The canonical link for it is here.
Posted to dev@hive.apache.org by "Shengjun Xin (JIRA)" <ji...@apache.org> on 2013/11/19 09:45:21 UTC
[jira] [Updated] (HIVE-5850) Multiple table join error for avro
[ https://issues.apache.org/jira/browse/HIVE-5850?page=com.atlassian.jira.plugin.system.issuetabpanels:all-tabpanel ]
Shengjun Xin updated HIVE-5850:
-------------------------------
Description:
Steps to reproduce:
{code}
-- Create table Part.
CREATE EXTERNAL TABLE part
ROW FORMAT SERDE 'org.apache.hadoop.hive.serde2.avro.AvroSerDe'
STORED AS
INPUTFORMAT 'org.apache.hadoop.hive.ql.io.avro.AvroContainerInputFormat'
OUTPUTFORMAT 'org.apache.hadoop.hive.ql.io.avro.AvroContainerOutputFormat'
LOCATION 'hdfs://<hostname>/user/hadoop/tpc-h/data/part'
TBLPROPERTIES ('avro.schema.url'='hdfs://<hostname>/user/hadoop/tpc-h/schema/part.avsc');
-- Create table Part Supplier.
CREATE EXTERNAL TABLE partsupp
ROW FORMAT SERDE 'org.apache.hadoop.hive.serde2.avro.AvroSerDe'
STORED AS
INPUTFORMAT 'org.apache.hadoop.hive.ql.io.avro.AvroContainerInputFormat'
OUTPUTFORMAT 'org.apache.hadoop.hive.ql.io.avro.AvroContainerOutputFormat'
LOCATION 'hdfs://<hostname>/user/hadoop/tpc-h/data/partsupp'
TBLPROPERTIES ('avro.schema.url'='hdfs://<hostname>/user/hadoop/tpc-h/schema/partsupp.avsc');
--- Query
select * from partsupp ps join part p on ps.ps_partkey = p.p_partkey where p.p_partkey=1;
{code}
Error message is:
{code}
Error: java.io.IOException: java.io.IOException: org.apache.avro.AvroTypeException: Found {
"type" : "record",
"name" : "partsupp",
"namespace" : "com.gs.sdst.pl.avro.tpch",
"fields" : [ {
"name" : "ps_partkey",
"type" : "long"
}, {
"name" : "ps_suppkey",
"type" : "long"
}, {
"name" : "ps_availqty",
"type" : "long"
}, {
"name" : "ps_supplycost",
"type" : "double"
}, {
"name" : "ps_comment",
"type" : "string"
}, {
"name" : "systimestamp",
"type" : "long"
} ]
}, expecting {
"type" : "record",
"name" : "part",
"namespace" : "com.gs.sdst.pl.avro.tpch",
"fields" : [ {
"name" : "p_partkey",
"type" : "long"
}, {
"name" : "p_name",
"type" : "string"
}, {
"name" : "p_mfgr",
"type" : "string"
}, {
"name" : "p_brand",
"type" : "string"
}, {
"name" : "p_type",
"type" : "string"
}, {
"name" : "p_size",
"type" : "int"
}, {
"name" : "p_container",
"type" : "string"
}, {
"name" : "p_retailprice",
"type" : "double"
}, {
"name" : "p_comment",
"type" : "string"
}, {
"name" : "systimestamp",
"type" : "long"
} ]
}
at org.apache.hadoop.hive.io.HiveIOExceptionHandlerChain.handleRecordReaderNextException(HiveIOExceptionHandlerChain.java:121)
at org.apache.hadoop.hive.io.HiveIOExceptionHandlerUtil.handleRecordReaderNextException(HiveIOExceptionHandlerUtil.java:77)
at org.apache.hadoop.hive.shims.HadoopShimsSecure$CombineFileRecordReader.doNextWithExceptionHandler(HadoopShimsSecure.java:302)
at org.apache.hadoop.hive.shims.HadoopShimsSecure$CombineFileRecordReader.next(HadoopShimsSecure.java:218)
at org.apache.hadoop.mapred.MapTask$TrackedRecordReader.moveToNext(MapTask.java:197)
at org.apache.hadoop.mapred.MapTask$TrackedRecordReader.next(MapTask.java:183)
at org.apache.hadoop.mapred.MapRunner.run(MapRunner.java:52)
at org.apache.hadoop.mapred.MapTask.runOldMapper(MapTask.java:429)
at org.apache.hadoop.mapred.MapTask.run(MapTask.java:341)
at org.apache.hadoop.mapred.YarnChild$2.run(YarnChild.java:158)
at java.security.AccessController.doPrivileged(Native Method)
at javax.security.auth.Subject.doAs(Subject.java:415)
at org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:1478)
at org.apache.hadoop.mapred.YarnChild.main(YarnChild.java:153)
{code}
was:
Reproduce step:
{code}
-- Create table Part.
CREATE EXTERNAL TABLE part
ROW FORMAT SERDE 'org.apache.hadoop.hive.serde2.avro.AvroSerDe'
STORED AS
INPUTFORMAT 'org.apache.hadoop.hive.ql.io.avro.AvroContainerInputFormat'
OUTPUTFORMAT 'org.apache.hadoop.hive.ql.io.avro.AvroContainerOutputFormat'
LOCATION 'hdfs://<hostname>/user/hadoop/tpc-h/data/part'
TBLPROPERTIES ('avro.schema.url'='hdfs://<hostname>/user/hadoop/tpc-h/schema/part.avsc');
-- Create table Part Supplier.
CREATE EXTERNAL TABLE partsupp
ROW FORMAT SERDE 'org.apache.hadoop.hive.serde2.avro.AvroSerDe'
STORED AS
INPUTFORMAT 'org.apache.hadoop.hive.ql.io.avro.AvroContainerInputFormat'
OUTPUTFORMAT 'org.apache.hadoop.hive.ql.io.avro.AvroContainerOutputFormat'
LOCATION 'hdfs://<hostname>/user/hadoop/tpc-h/data/partsupp'
TBLPROPERTIES ('avro.schema.url'='hdfs://<hostname>/user/hadoop/tpc-h/schema/partsupp.avsc');
--- Query
select * from partsupp ps join part p on ps.ps_partkey = p.p_partkey where p.p_partkey=1;
{code}
Error message is:
Error: java.io.IOException: java.io.IOException: org.apache.avro.AvroTypeException: Found {
"type" : "record",
"name" : "partsupp",
"namespace" : "com.gs.sdst.pl.avro.tpch",
"fields" : [ {
"name" : "ps_partkey",
"type" : "long"
}, {
"name" : "ps_suppkey",
"type" : "long"
}, {
"name" : "ps_availqty",
"type" : "long"
}, {
"name" : "ps_supplycost",
"type" : "double"
}, {
"name" : "ps_comment",
"type" : "string"
}, {
"name" : "systimestamp",
"type" : "long"
} ]
}, expecting {
"type" : "record",
"name" : "part",
"namespace" : "com.gs.sdst.pl.avro.tpch",
"fields" : [ {
"name" : "p_partkey",
"type" : "long"
}, {
"name" : "p_name",
"type" : "string"
}, {
"name" : "p_mfgr",
"type" : "string"
}, {
"name" : "p_brand",
"type" : "string"
}, {
"name" : "p_type",
"type" : "string"
}, {
"name" : "p_size",
"type" : "int"
}, {
"name" : "p_container",
"type" : "string"
}, {
"name" : "p_retailprice",
"type" : "double"
}, {
"name" : "p_comment",
"type" : "string"
}, {
"name" : "systimestamp",
"type" : "long"
} ]
}
at org.apache.hadoop.hive.io.HiveIOExceptionHandlerChain.handleRecordReaderNextException(HiveIOExceptionHandlerChain.java:121)
at org.apache.hadoop.hive.io.HiveIOExceptionHandlerUtil.handleRecordReaderNextException(HiveIOExceptionHandlerUtil.java:77)
at org.apache.hadoop.hive.shims.HadoopShimsSecure$CombineFileRecordReader.doNextWithExceptionHandler(HadoopShimsSecure.java:302)
at org.apache.hadoop.hive.shims.HadoopShimsSecure$CombineFileRecordReader.next(HadoopShimsSecure.java:218)
at org.apache.hadoop.mapred.MapTask$TrackedRecordReader.moveToNext(MapTask.java:197)
at org.apache.hadoop.mapred.MapTask$TrackedRecordReader.next(MapTask.java:183)
at org.apache.hadoop.mapred.MapRunner.run(MapRunner.java:52)
at org.apache.hadoop.mapred.MapTask.runOldMapper(MapTask.java:429)
at org.apache.hadoop.mapred.MapTask.run(MapTask.java:341)
at org.apache.hadoop.mapred.YarnChild$2.run(YarnChild.java:158)
at java.security.AccessController.doPrivileged(Native Method)
at javax.security.auth.Subject.doAs(Subject.java:415)
at org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:1478)
at org.apache.hadoop.mapred.YarnChild.main(YarnChild.java:153)
> Multiple table join error for avro
> -----------------------------------
>
> Key: HIVE-5850
> URL: https://issues.apache.org/jira/browse/HIVE-5850
> Project: Hive
> Issue Type: Bug
> Affects Versions: 0.11.0
> Reporter: Shengjun Xin
>
> Steps to reproduce:
> {code}
> -- Create table Part.
> CREATE EXTERNAL TABLE part
> ROW FORMAT SERDE 'org.apache.hadoop.hive.serde2.avro.AvroSerDe'
> STORED AS
> INPUTFORMAT 'org.apache.hadoop.hive.ql.io.avro.AvroContainerInputFormat'
> OUTPUTFORMAT 'org.apache.hadoop.hive.ql.io.avro.AvroContainerOutputFormat'
> LOCATION 'hdfs://<hostname>/user/hadoop/tpc-h/data/part'
> TBLPROPERTIES ('avro.schema.url'='hdfs://<hostname>/user/hadoop/tpc-h/schema/part.avsc');
> -- Create table Part Supplier.
> CREATE EXTERNAL TABLE partsupp
> ROW FORMAT SERDE 'org.apache.hadoop.hive.serde2.avro.AvroSerDe'
> STORED AS
> INPUTFORMAT 'org.apache.hadoop.hive.ql.io.avro.AvroContainerInputFormat'
> OUTPUTFORMAT 'org.apache.hadoop.hive.ql.io.avro.AvroContainerOutputFormat'
> LOCATION 'hdfs://<hostname>/user/hadoop/tpc-h/data/partsupp'
> TBLPROPERTIES ('avro.schema.url'='hdfs://<hostname>/user/hadoop/tpc-h/schema/partsupp.avsc');
> --- Query
> select * from partsupp ps join part p on ps.ps_partkey = p.p_partkey where p.p_partkey=1;
> {code}
> Error message is:
> {code}
> Error: java.io.IOException: java.io.IOException: org.apache.avro.AvroTypeException: Found {
> "type" : "record",
> "name" : "partsupp",
> "namespace" : "com.gs.sdst.pl.avro.tpch",
> "fields" : [ {
> "name" : "ps_partkey",
> "type" : "long"
> }, {
> "name" : "ps_suppkey",
> "type" : "long"
> }, {
> "name" : "ps_availqty",
> "type" : "long"
> }, {
> "name" : "ps_supplycost",
> "type" : "double"
> }, {
> "name" : "ps_comment",
> "type" : "string"
> }, {
> "name" : "systimestamp",
> "type" : "long"
> } ]
> }, expecting {
> "type" : "record",
> "name" : "part",
> "namespace" : "com.gs.sdst.pl.avro.tpch",
> "fields" : [ {
> "name" : "p_partkey",
> "type" : "long"
> }, {
> "name" : "p_name",
> "type" : "string"
> }, {
> "name" : "p_mfgr",
> "type" : "string"
> }, {
> "name" : "p_brand",
> "type" : "string"
> }, {
> "name" : "p_type",
> "type" : "string"
> }, {
> "name" : "p_size",
> "type" : "int"
> }, {
> "name" : "p_container",
> "type" : "string"
> }, {
> "name" : "p_retailprice",
> "type" : "double"
> }, {
> "name" : "p_comment",
> "type" : "string"
> }, {
> "name" : "systimestamp",
> "type" : "long"
> } ]
> }
> at org.apache.hadoop.hive.io.HiveIOExceptionHandlerChain.handleRecordReaderNextException(HiveIOExceptionHandlerChain.java:121)
> at org.apache.hadoop.hive.io.HiveIOExceptionHandlerUtil.handleRecordReaderNextException(HiveIOExceptionHandlerUtil.java:77)
> at org.apache.hadoop.hive.shims.HadoopShimsSecure$CombineFileRecordReader.doNextWithExceptionHandler(HadoopShimsSecure.java:302)
> at org.apache.hadoop.hive.shims.HadoopShimsSecure$CombineFileRecordReader.next(HadoopShimsSecure.java:218)
> at org.apache.hadoop.mapred.MapTask$TrackedRecordReader.moveToNext(MapTask.java:197)
> at org.apache.hadoop.mapred.MapTask$TrackedRecordReader.next(MapTask.java:183)
> at org.apache.hadoop.mapred.MapRunner.run(MapRunner.java:52)
> at org.apache.hadoop.mapred.MapTask.runOldMapper(MapTask.java:429)
> at org.apache.hadoop.mapred.MapTask.run(MapTask.java:341)
> at org.apache.hadoop.mapred.YarnChild$2.run(YarnChild.java:158)
> at java.security.AccessController.doPrivileged(Native Method)
> at javax.security.auth.Subject.doAs(Subject.java:415)
> at org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:1478)
> at org.apache.hadoop.mapred.YarnChild.main(YarnChild.java:153)
> {code}
--
This message was sent by Atlassian JIRA
(v6.1#6144)