You are viewing a plain text version of this content. The canonical link for it is here.
Posted to dev@falcon.apache.org by "Raghav Kumar Gautam (JIRA)" <ji...@apache.org> on 2014/03/24 22:12:43 UTC
[jira] [Created] (FALCON-372) Process that has hcat partitions with / in partition name does not succeed
Raghav Kumar Gautam created FALCON-372:
------------------------------------------
Summary: Process that has hcat partitions with / in partition name does not succeed
Key: FALCON-372
URL: https://issues.apache.org/jira/browse/FALCON-372
Project: Falcon
Issue Type: Bug
Reporter: Raghav Kumar Gautam
Test name: HCatProcessTest#OneHCatInputOneHCatOutput, with separator '/'
Here are the entity definitions:
{code:xml}
<?xml version="1.0" encoding="UTF-8"?>
<cluster xmlns="uri:falcon:cluster:0.1" name="corp-65636c71-a466-4906-aabc-3ce40f7a9850" description="" colo="default">
<interfaces>
<interface type="readonly" endpoint="webhdfs://rkg1-2:50070" version="0.20.2"/>
<interface type="write" endpoint="hdfs://rkg1-2:8020" version="0.20.2"/>
<interface type="execute" endpoint="rkg1-2:8032" version="0.20.2"/>
<interface type="workflow" endpoint="http://rkg1-2:11000/oozie/" version="3.1"/>
<interface type="messaging" endpoint="tcp://rkg1-2:61616?daemon=true" version="5.1.6"/>
<interface type="registry" endpoint="thrift://rkg1-2.cs1cloud.internal:9083" version="0.11.0"/>
</interfaces>
<locations>
<location name="staging" path="/projects/ivory/staging"/>
<location name="temp" path="/tmp"/>
<location name="working" path="/projectsTest/ivory/working"/>
</locations>
<properties>
<property name="field1" value="value1"/>
<property name="field2" value="value2"/>
<property name="dfs.namenode.kerberos.principal" value="nn/rkg1-2@EXAMPLE.COM"/>
<property name="hive.metastore.kerberos.principal" value="hive/rkg1-2@EXAMPLE.COM"/>
</properties>
</cluster>
{code}
{code:xml}
<?xml version="1.0" encoding="UTF-8"?>
<feed xmlns="uri:falcon:feed:0.1" name="raaw-logs16-b36bdd1e-8b81-47f5-bfef-42fec8ecc68a" description="clicks log">
<frequency>hours(1)</frequency>
<timezone>UTC</timezone>
<late-arrival cut-off="hours(6)"/>
<clusters>
<cluster name="corp-65636c71-a466-4906-aabc-3ce40f7a9850" type="source">
<validity start="2010-01-01T20:00Z" end="2010-01-02T04:00Z"/>
<retention limit="months(9000)" action="delete"/>
</cluster>
</clusters>
<table uri="catalog:default:hcatprocesstest_input_table#dt=${YEAR}/${MONTH}/${DAY}/${HOUR}"/>
<ACL owner="testuser" group="group" permission="0x755"/>
<schema location="hcat" provider="hcat"/>
<properties>
<property name="field1" value="value1"/>
<property name="field2" value="value2"/>
</properties>
</feed>
{code}
{code:xml}
<?xml version="1.0" encoding="UTF-8"?>
<feed xmlns="uri:falcon:feed:0.1" name="agregated-logs16-621e03ea-dee5-4a47-b6f5-09523b8fc0ee" description="clicks log">
<frequency>hours(1)</frequency>
<timezone>UTC</timezone>
<late-arrival cut-off="hours(6)"/>
<clusters>
<cluster name="corp-65636c71-a466-4906-aabc-3ce40f7a9850" type="source">
<validity start="2010-01-01T20:00Z" end="2010-01-02T04:00Z"/>
<retention limit="hours(6)" action="delete"/>
</cluster>
</clusters>
<table uri="catalog:default:hcatprocesstest_output_table#dt=${YEAR}/${MONTH}/${DAY}/${HOUR}"/>
<ACL owner="testuser" group="group" permission="0x755"/>
<schema location="hcat" provider="hcat"/>
<properties>
<property name="field1" value="value1"/>
<property name="field2" value="value2"/>
</properties>
</feed>
{code}
{code:xml}
<process xmlns="uri:falcon:process:0.1" name="agregator-coord16-fa1776e0-1b9a-4bb9-815e-3b43c147aee4">
<clusters>
<cluster name="corp-65636c71-a466-4906-aabc-3ce40f7a9850">
<validity start="2010-01-01T20:00Z" end="2010-01-02T04:00Z"/>
</cluster>
</clusters>
<parallel>1</parallel>
<order>FIFO</order>
<frequency>hours(1)</frequency>
<timezone>UTC</timezone>
<inputs>
<input name="inputData" feed="raaw-logs16-b36bdd1e-8b81-47f5-bfef-42fec8ecc68a" start="now(0,0)" end="now(0,0)"/>
</inputs>
<outputs>
<output name="outputData" feed="agregated-logs16-621e03ea-dee5-4a47-b6f5-09523b8fc0ee" instance="now(0,0)"/>
</outputs>
<properties>
<property name="queueName" value="default"/>
</properties>
<workflow engine="hive" path="/tmp/falcon-regression/workflows/hive/script.hql"/>
<retry policy="periodic" delay="minutes(3)" attempts="3"/>
</process>
{code}
Stacktrace from oozie logs:
{noformat}
org.apache.oozie.command.CommandException: E1012: Coord Job Materialization Error: E0906: URI parsing error : hcat://rkg1-2.cs1cloud.internal:9083/default/hcatprocesstest_input_table/dt=2010/01/01/20
at org.apache.oozie.command.coord.CoordMaterializeTransitionXCommand.materialize(CoordMaterializeTransitionXCommand.java:282)
at org.apache.oozie.command.MaterializeTransitionXCommand.execute(MaterializeTransitionXCommand.java:72)
at org.apache.oozie.command.MaterializeTransitionXCommand.execute(MaterializeTransitionXCommand.java:28)
at org.apache.oozie.command.XCommand.call(XCommand.java:280)
at org.apache.oozie.service.CallableQueueService$CallableWrapper.run(CallableQueueService.java:175)
at java.util.concurrent.ThreadPoolExecutor$Worker.runTask(ThreadPoolExecutor.java:886)
at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:908)
at java.lang.Thread.run(Thread.java:662)
Caused by: org.apache.oozie.dependency.URIHandlerException: E0906: URI parsing error : hcat://rkg1-2.cs1cloud.internal:9083/default/hcatprocesstest_input_table/dt=2010/01/01/20
at org.apache.oozie.dependency.HCatURIHandler.validate(HCatURIHandler.java:169)
at org.apache.oozie.command.coord.CoordCommandUtils.createEarlyURIs(CoordCommandUtils.java:365)
at org.apache.oozie.command.coord.CoordCommandUtils.separateResolvedAndUnresolved(CoordCommandUtils.java:303)
at org.apache.oozie.command.coord.CoordCommandUtils.materializeDataEvents(CoordCommandUtils.java:577)
at org.apache.oozie.command.coord.CoordCommandUtils.materializeOneInstance(CoordCommandUtils.java:444)
at org.apache.oozie.command.coord.CoordMaterializeTransitionXCommand.materializeActions(CoordMaterializeTransitionXCommand.java:381)
at org.apache.oozie.command.coord.CoordMaterializeTransitionXCommand.materialize(CoordMaterializeTransitionXCommand.java:263)
... 7 more
Caused by: java.net.URISyntaxException: URI path is not in expected format: hcat://rkg1-2.cs1cloud.internal:9083/default/hcatprocesstest_input_table/dt=2010/01/01/20
at org.apache.oozie.util.HCatURI.parse(HCatURI.java:66)
at org.apache.oozie.util.HCatURI.<init>(HCatURI.java:52)
at org.apache.oozie.util.HCatURI.<init>(HCatURI.java:48)
at org.apache.oozie.dependency.HCatURIHandler.validate(HCatURIHandler.java:166)
... 13 more
{noformat}
--
This message was sent by Atlassian JIRA
(v6.2#6252)