You are viewing a plain text version of this content. The canonical link for it is here.
Posted to issues@flink.apache.org by "Huang Xingbo (Jira)" <ji...@apache.org> on 2022/06/02 12:06:00 UTC

[jira] [Updated] (FLINK-27869) AdaptiveSchedulerITCase.testStopWithSavepointFailOnStop failed with FAIL_ON_CHECKPOINT_COMPLETE

     [ https://issues.apache.org/jira/browse/FLINK-27869?page=com.atlassian.jira.plugin.system.issuetabpanels:all-tabpanel ]

Huang Xingbo updated FLINK-27869:
---------------------------------
    Priority: Critical  (was: Major)

> AdaptiveSchedulerITCase.testStopWithSavepointFailOnStop failed with FAIL_ON_CHECKPOINT_COMPLETE
> -----------------------------------------------------------------------------------------------
>
>                 Key: FLINK-27869
>                 URL: https://issues.apache.org/jira/browse/FLINK-27869
>             Project: Flink
>          Issue Type: Bug
>          Components: Runtime / Checkpointing
>    Affects Versions: 1.16.0
>            Reporter: Huang Xingbo
>            Priority: Critical
>              Labels: test-stability
>
> {code:java}
> 2022-05-31T01:18:28.6667579Z May 31 01:18:28 [ERROR] org.apache.flink.test.scheduling.AdaptiveSchedulerITCase.testStopWithSavepointFailOnStop  Time elapsed: 0.235 s  <<< ERROR!
> 2022-05-31T01:18:28.6668521Z May 31 01:18:28 org.apache.flink.util.FlinkException: Stop with savepoint operation could not be completed.
> 2022-05-31T01:18:28.6669435Z May 31 01:18:28 	at org.apache.flink.runtime.scheduler.adaptive.StopWithSavepoint.onLeave(StopWithSavepoint.java:125)
> 2022-05-31T01:18:28.6670470Z May 31 01:18:28 	at org.apache.flink.runtime.scheduler.adaptive.AdaptiveScheduler.transitionToState(AdaptiveScheduler.java:1171)
> 2022-05-31T01:18:28.6671487Z May 31 01:18:28 	at org.apache.flink.runtime.scheduler.adaptive.AdaptiveScheduler.goToRestarting(AdaptiveScheduler.java:849)
> 2022-05-31T01:18:28.6672481Z May 31 01:18:28 	at org.apache.flink.runtime.scheduler.adaptive.FailureResultUtil.restartOrFail(FailureResultUtil.java:28)
> 2022-05-31T01:18:28.6673459Z May 31 01:18:28 	at org.apache.flink.runtime.scheduler.adaptive.StopWithSavepoint.onFailure(StopWithSavepoint.java:151)
> 2022-05-31T01:18:28.6674502Z May 31 01:18:28 	at org.apache.flink.runtime.scheduler.adaptive.StateWithExecutionGraph.updateTaskExecutionState(StateWithExecutionGraph.java:363)
> 2022-05-31T01:18:28.6675603Z May 31 01:18:28 	at org.apache.flink.runtime.scheduler.adaptive.AdaptiveScheduler.lambda$updateTaskExecutionState$4(AdaptiveScheduler.java:496)
> 2022-05-31T01:18:28.6677238Z May 31 01:18:28 	at org.apache.flink.runtime.scheduler.adaptive.State.tryCall(State.java:137)
> 2022-05-31T01:18:28.6678573Z May 31 01:18:28 	at org.apache.flink.runtime.scheduler.adaptive.AdaptiveScheduler.updateTaskExecutionState(AdaptiveScheduler.java:493)
> 2022-05-31T01:18:28.6679517Z May 31 01:18:28 	at org.apache.flink.runtime.scheduler.SchedulerNG.updateTaskExecutionState(SchedulerNG.java:78)
> 2022-05-31T01:18:28.6680538Z May 31 01:18:28 	at org.apache.flink.runtime.jobmaster.JobMaster.updateTaskExecutionState(JobMaster.java:443)
> 2022-05-31T01:18:28.6681304Z May 31 01:18:28 	at sun.reflect.GeneratedMethodAccessor13.invoke(Unknown Source)
> 2022-05-31T01:18:28.6682058Z May 31 01:18:28 	at sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)
> 2022-05-31T01:18:28.6682800Z May 31 01:18:28 	at java.lang.reflect.Method.invoke(Method.java:498)
> 2022-05-31T01:18:28.6683611Z May 31 01:18:28 	at org.apache.flink.runtime.rpc.akka.AkkaRpcActor.lambda$handleRpcInvocation$1(AkkaRpcActor.java:304)
> 2022-05-31T01:18:28.6684559Z May 31 01:18:28 	at org.apache.flink.runtime.concurrent.akka.ClassLoadingUtils.runWithContextClassLoader(ClassLoadingUtils.java:83)
> 2022-05-31T01:18:28.6685483Z May 31 01:18:28 	at org.apache.flink.runtime.rpc.akka.AkkaRpcActor.handleRpcInvocation(AkkaRpcActor.java:302)
> 2022-05-31T01:18:28.6686343Z May 31 01:18:28 	at org.apache.flink.runtime.rpc.akka.AkkaRpcActor.handleRpcMessage(AkkaRpcActor.java:217)
> 2022-05-31T01:18:28.6687224Z May 31 01:18:28 	at org.apache.flink.runtime.rpc.akka.FencedAkkaRpcActor.handleRpcMessage(FencedAkkaRpcActor.java:78)
> 2022-05-31T01:18:28.6688093Z May 31 01:18:28 	at org.apache.flink.runtime.rpc.akka.AkkaRpcActor.handleMessage(AkkaRpcActor.java:163)
> 2022-05-31T01:18:28.6688877Z May 31 01:18:28 	at akka.japi.pf.UnitCaseStatement.apply(CaseStatements.scala:24)
> 2022-05-31T01:18:28.6689602Z May 31 01:18:28 	at akka.japi.pf.UnitCaseStatement.apply(CaseStatements.scala:20)
> 2022-05-31T01:18:28.6690313Z May 31 01:18:28 	at scala.PartialFunction.applyOrElse(PartialFunction.scala:123)
> 2022-05-31T01:18:28.6691045Z May 31 01:18:28 	at scala.PartialFunction.applyOrElse$(PartialFunction.scala:122)
> 2022-05-31T01:18:28.6691782Z May 31 01:18:28 	at akka.japi.pf.UnitCaseStatement.applyOrElse(CaseStatements.scala:20)
> 2022-05-31T01:18:28.6692535Z May 31 01:18:28 	at scala.PartialFunction$OrElse.applyOrElse(PartialFunction.scala:171)
> 2022-05-31T01:18:28.6693283Z May 31 01:18:28 	at scala.PartialFunction$OrElse.applyOrElse(PartialFunction.scala:172)
> 2022-05-31T01:18:28.6694031Z May 31 01:18:28 	at scala.PartialFunction$OrElse.applyOrElse(PartialFunction.scala:172)
> 2022-05-31T01:18:28.6694733Z May 31 01:18:28 	at akka.actor.Actor.aroundReceive(Actor.scala:537)
> 2022-05-31T01:18:28.6695400Z May 31 01:18:28 	at akka.actor.Actor.aroundReceive$(Actor.scala:535)
> 2022-05-31T01:18:28.6696100Z May 31 01:18:28 	at akka.actor.AbstractActor.aroundReceive(AbstractActor.scala:220)
> 2022-05-31T01:18:28.6696807Z May 31 01:18:28 	at akka.actor.ActorCell.receiveMessage(ActorCell.scala:580)
> 2022-05-31T01:18:28.6697495Z May 31 01:18:28 	at akka.actor.ActorCell.invoke(ActorCell.scala:548)
> 2022-05-31T01:18:28.6698183Z May 31 01:18:28 	at akka.dispatch.Mailbox.processMailbox(Mailbox.scala:270)
> 2022-05-31T01:18:28.6698850Z May 31 01:18:28 	at akka.dispatch.Mailbox.run(Mailbox.scala:231)
> 2022-05-31T01:18:28.6699493Z May 31 01:18:28 	at akka.dispatch.Mailbox.exec(Mailbox.scala:243)
> 2022-05-31T01:18:28.6700184Z May 31 01:18:28 	at java.util.concurrent.ForkJoinTask.doExec(ForkJoinTask.java:289)
> 2022-05-31T01:18:28.6701039Z May 31 01:18:28 	at java.util.concurrent.ForkJoinPool$WorkQueue.runTask(ForkJoinPool.java:1056)
> 2022-05-31T01:18:28.6702033Z May 31 01:18:28 	at java.util.concurrent.ForkJoinPool.runWorker(ForkJoinPool.java:1692)
> 2022-05-31T01:18:28.6718393Z May 31 01:18:28 	at java.util.concurrent.ForkJoinWorkerThread.run(ForkJoinWorkerThread.java:175)
> 2022-05-31T01:18:28.6719334Z May 31 01:18:28 Caused by: java.lang.RuntimeException: FAIL_ON_CHECKPOINT_COMPLETE
> 2022-05-31T01:18:28.6720311Z May 31 01:18:28 	at org.apache.flink.test.scheduling.AdaptiveSchedulerITCase$DummySource.notifyCheckpointComplete(AdaptiveSchedulerITCase.java:363)
> 2022-05-31T01:18:28.6722132Z May 31 01:18:28 	at org.apache.flink.streaming.api.operators.AbstractUdfStreamOperator.notifyCheckpointComplete(AbstractUdfStreamOperator.java:126)
> 2022-05-31T01:18:28.6724882Z May 31 01:18:28 	at org.apache.flink.streaming.runtime.tasks.StreamOperatorWrapper.notifyCheckpointComplete(StreamOperatorWrapper.java:104)
> 2022-05-31T01:18:28.6725781Z May 31 01:18:28 	at org.apache.flink.streaming.runtime.tasks.RegularOperatorChain.notifyCheckpointComplete(RegularOperatorChain.java:145)
> 2022-05-31T01:18:28.6761885Z May 31 01:18:28 	at org.apache.flink.streaming.runtime.tasks.SubtaskCheckpointCoordinatorImpl.notifyCheckpoint(SubtaskCheckpointCoordinatorImpl.java:479)
> 2022-05-31T01:18:28.6764133Z May 31 01:18:28 	at org.apache.flink.streaming.runtime.tasks.SubtaskCheckpointCoordinatorImpl.notifyCheckpointComplete(SubtaskCheckpointCoordinatorImpl.java:413)
> 2022-05-31T01:18:28.6765072Z May 31 01:18:28 	at org.apache.flink.streaming.runtime.tasks.StreamTask.notifyCheckpointComplete(StreamTask.java:1407)
> 2022-05-31T01:18:28.6771019Z May 31 01:18:28 	at org.apache.flink.streaming.runtime.tasks.StreamTask.lambda$notifyCheckpointCompleteAsync$15(StreamTask.java:1348)
> 2022-05-31T01:18:28.6771910Z May 31 01:18:28 	at org.apache.flink.streaming.runtime.tasks.StreamTask.lambda$notifyCheckpointOperation$18(StreamTask.java:1387)
> 2022-05-31T01:18:28.6772850Z May 31 01:18:28 	at org.apache.flink.streaming.runtime.tasks.StreamTaskActionExecutor$SynchronizedStreamTaskActionExecutor.runThrowing(StreamTaskActionExecutor.java:93)
> 2022-05-31T01:18:28.6773693Z May 31 01:18:28 	at org.apache.flink.streaming.runtime.tasks.mailbox.Mail.run(Mail.java:90)
> 2022-05-31T01:18:28.6774423Z May 31 01:18:28 	at org.apache.flink.streaming.runtime.tasks.mailbox.MailboxProcessor.runMail(MailboxProcessor.java:398)
> 2022-05-31T01:18:28.6775292Z May 31 01:18:28 	at org.apache.flink.streaming.runtime.tasks.mailbox.MailboxProcessor.processMailsWhenDefaultActionUnavailable(MailboxProcessor.java:367)
> 2022-05-31T01:18:28.6776191Z May 31 01:18:28 	at org.apache.flink.streaming.runtime.tasks.mailbox.MailboxProcessor.processMail(MailboxProcessor.java:352)
> 2022-05-31T01:18:28.6776992Z May 31 01:18:28 	at org.apache.flink.streaming.runtime.tasks.mailbox.MailboxProcessor.runMailboxLoop(MailboxProcessor.java:229)
> 2022-05-31T01:18:28.6777759Z May 31 01:18:28 	at org.apache.flink.streaming.runtime.tasks.StreamTask.afterInvoke(StreamTask.java:856)
> 2022-05-31T01:18:28.6778461Z May 31 01:18:28 	at org.apache.flink.streaming.runtime.tasks.StreamTask.invoke(StreamTask.java:781)
> 2022-05-31T01:18:28.6779163Z May 31 01:18:28 	at org.apache.flink.runtime.taskmanager.Task.runWithSystemExitMonitoring(Task.java:935)
> 2022-05-31T01:18:28.6779852Z May 31 01:18:28 	at org.apache.flink.runtime.taskmanager.Task.restoreAndInvoke(Task.java:914)
> 2022-05-31T01:18:28.6780484Z May 31 01:18:28 	at org.apache.flink.runtime.taskmanager.Task.doRun(Task.java:728)
> 2022-05-31T01:18:28.6781093Z May 31 01:18:28 	at org.apache.flink.runtime.taskmanager.Task.run(Task.java:550)
> 2022-05-31T01:18:28.6781626Z May 31 01:18:28 	at java.lang.Thread.run(Thread.java:748)
> {code}
> https://dev.azure.com/apache-flink/apache-flink/_build/results?buildId=36190&view=logs&j=39d5b1d5-3b41-54dc-6458-1e2ddd1cdcf3&t=0c010d0c-3dec-5bf1-d408-7b18988b1b2b



--
This message was sent by Atlassian Jira
(v8.20.7#820007)