[ https://issues.apache.org/jira/browse/FLINK-27792?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=17555511#comment-17555511 ]
Chesnay Schepler commented on FLINK-27792: ------------------------------------------ A potential source is {{ChannelStateWriteRequestExecutorImpl#close}}, which interrupts the internal thread. > InterruptedException thrown by ChannelStateWriterImpl > ----------------------------------------------------- > > Key: FLINK-27792 > URL: https://issues.apache.org/jira/browse/FLINK-27792 > Project: Flink > Issue Type: Bug > Components: Table SQL / Planner > Affects Versions: 1.16.0 > Reporter: Huang Xingbo > Assignee: Atri Sharma > Priority: Blocker > Labels: test-stability > > {code:java} > 2022-05-25T15:45:17.7584795Z May 25 15:45:17 [ERROR] > WindowDistinctAggregateITCase.testTumbleWindow_Rollup Time elapsed: 1.522 s > <<< ERROR! > 2022-05-25T15:45:17.7586025Z May 25 15:45:17 > org.apache.flink.runtime.client.JobExecutionException: Job execution failed. > 2022-05-25T15:45:17.7587205Z May 25 15:45:17 at > org.apache.flink.runtime.jobmaster.JobResult.toJobExecutionResult(JobResult.java:144) > 2022-05-25T15:45:17.7588649Z May 25 15:45:17 at > org.apache.flink.runtime.minicluster.MiniClusterJobClient.lambda$getJobExecutionResult$3(MiniClusterJobClient.java:141) > 2022-05-25T15:45:17.7589984Z May 25 15:45:17 at > java.util.concurrent.CompletableFuture.uniApply(CompletableFuture.java:616) > 2022-05-25T15:45:17.7603647Z May 25 15:45:17 at > java.util.concurrent.CompletableFuture$UniApply.tryFire(CompletableFuture.java:591) > 2022-05-25T15:45:17.7605042Z May 25 15:45:17 at > java.util.concurrent.CompletableFuture.postComplete(CompletableFuture.java:488) > 2022-05-25T15:45:17.7605750Z May 25 15:45:17 at > java.util.concurrent.CompletableFuture.complete(CompletableFuture.java:1975) > 2022-05-25T15:45:17.7606751Z May 25 15:45:17 at > org.apache.flink.runtime.rpc.akka.AkkaInvocationHandler.lambda$invokeRpc$1(AkkaInvocationHandler.java:268) > 2022-05-25T15:45:17.7607513Z May 25 15:45:17 at > java.util.concurrent.CompletableFuture.uniWhenComplete(CompletableFuture.java:774) > 
2022-05-25T15:45:17.7608232Z May 25 15:45:17 at > java.util.concurrent.CompletableFuture$UniWhenComplete.tryFire(CompletableFuture.java:750) > 2022-05-25T15:45:17.7608953Z May 25 15:45:17 at > java.util.concurrent.CompletableFuture.postComplete(CompletableFuture.java:488) > 2022-05-25T15:45:17.7614259Z May 25 15:45:17 at > java.util.concurrent.CompletableFuture.complete(CompletableFuture.java:1975) > 2022-05-25T15:45:17.7615777Z May 25 15:45:17 at > org.apache.flink.util.concurrent.FutureUtils.doForward(FutureUtils.java:1277) > 2022-05-25T15:45:17.7617284Z May 25 15:45:17 at > org.apache.flink.runtime.concurrent.akka.ClassLoadingUtils.lambda$null$1(ClassLoadingUtils.java:93) > 2022-05-25T15:45:17.7618847Z May 25 15:45:17 at > org.apache.flink.runtime.concurrent.akka.ClassLoadingUtils.runWithContextClassLoader(ClassLoadingUtils.java:68) > 2022-05-25T15:45:17.7620579Z May 25 15:45:17 at > org.apache.flink.runtime.concurrent.akka.ClassLoadingUtils.lambda$guardCompletionWithContextClassLoader$2(ClassLoadingUtils.java:92) > 2022-05-25T15:45:17.7622674Z May 25 15:45:17 at > java.util.concurrent.CompletableFuture.uniWhenComplete(CompletableFuture.java:774) > 2022-05-25T15:45:17.7624066Z May 25 15:45:17 at > java.util.concurrent.CompletableFuture$UniWhenComplete.tryFire(CompletableFuture.java:750) > 2022-05-25T15:45:17.7625352Z May 25 15:45:17 at > java.util.concurrent.CompletableFuture.postComplete(CompletableFuture.java:488) > 2022-05-25T15:45:17.7626524Z May 25 15:45:17 at > java.util.concurrent.CompletableFuture.complete(CompletableFuture.java:1975) > 2022-05-25T15:45:17.7627743Z May 25 15:45:17 at > org.apache.flink.runtime.concurrent.akka.AkkaFutureUtils$1.onComplete(AkkaFutureUtils.java:47) > 2022-05-25T15:45:17.7628913Z May 25 15:45:17 at > akka.dispatch.OnComplete.internal(Future.scala:300) > 2022-05-25T15:45:17.7629902Z May 25 15:45:17 at > akka.dispatch.OnComplete.internal(Future.scala:297) > 2022-05-25T15:45:17.7630891Z May 25 15:45:17 at > 
akka.dispatch.japi$CallbackBridge.apply(Future.scala:224) > 2022-05-25T15:45:17.7632074Z May 25 15:45:17 at > akka.dispatch.japi$CallbackBridge.apply(Future.scala:221) > 2022-05-25T15:45:17.7654202Z May 25 15:45:17 at > scala.concurrent.impl.CallbackRunnable.run(Promise.scala:60) > 2022-05-25T15:45:17.7655764Z May 25 15:45:17 at > org.apache.flink.runtime.concurrent.akka.AkkaFutureUtils$DirectExecutionContext.execute(AkkaFutureUtils.java:65) > 2022-05-25T15:45:17.7657231Z May 25 15:45:17 at > scala.concurrent.impl.CallbackRunnable.executeWithValue(Promise.scala:68) > 2022-05-25T15:45:17.7658586Z May 25 15:45:17 at > scala.concurrent.impl.Promise$DefaultPromise.$anonfun$tryComplete$1(Promise.scala:284) > 2022-05-25T15:45:17.7660014Z May 25 15:45:17 at > scala.concurrent.impl.Promise$DefaultPromise.$anonfun$tryComplete$1$adapted(Promise.scala:284) > 2022-05-25T15:45:17.7661422Z May 25 15:45:17 at > scala.concurrent.impl.Promise$DefaultPromise.tryComplete(Promise.scala:284) > 2022-05-25T15:45:17.7663302Z May 25 15:45:17 at > akka.pattern.PromiseActorRef.$bang(AskSupport.scala:621) > 2022-05-25T15:45:17.7664594Z May 25 15:45:17 at > akka.pattern.PipeToSupport$PipeableFuture$$anonfun$pipeTo$1.applyOrElse(PipeToSupport.scala:24) > 2022-05-25T15:45:17.7665956Z May 25 15:45:17 at > akka.pattern.PipeToSupport$PipeableFuture$$anonfun$pipeTo$1.applyOrElse(PipeToSupport.scala:23) > 2022-05-25T15:45:17.7667111Z May 25 15:45:17 at > scala.concurrent.Future.$anonfun$andThen$1(Future.scala:532) > 2022-05-25T15:45:17.7668159Z May 25 15:45:17 at > scala.concurrent.impl.Promise.liftedTree1$1(Promise.scala:29) > 2022-05-25T15:45:17.7669229Z May 25 15:45:17 at > scala.concurrent.impl.Promise.$anonfun$transform$1(Promise.scala:29) > 2022-05-25T15:45:17.7670271Z May 25 15:45:17 at > scala.concurrent.impl.CallbackRunnable.run(Promise.scala:60) > 2022-05-25T15:45:17.7671379Z May 25 15:45:17 at > akka.dispatch.BatchingExecutor$AbstractBatch.processBatch(BatchingExecutor.scala:63) > 
2022-05-25T15:45:17.7673048Z May 25 15:45:17 at > akka.dispatch.BatchingExecutor$BlockableBatch.$anonfun$run$1(BatchingExecutor.scala:100) > 2022-05-25T15:45:17.7725189Z May 25 15:45:17 at > scala.runtime.java8.JFunction0$mcV$sp.apply(JFunction0$mcV$sp.java:12) > 2022-05-25T15:45:17.7753834Z May 25 15:45:17 at > scala.concurrent.BlockContext$.withBlockContext(BlockContext.scala:81) > 2022-05-25T15:45:17.7805369Z May 25 15:45:17 at > akka.dispatch.BatchingExecutor$BlockableBatch.run(BatchingExecutor.scala:100) > 2022-05-25T15:45:17.7806838Z May 25 15:45:17 at > akka.dispatch.TaskInvocation.run(AbstractDispatcher.scala:49) > 2022-05-25T15:45:17.7808159Z May 25 15:45:17 at > akka.dispatch.ForkJoinExecutorConfigurator$AkkaForkJoinTask.exec(ForkJoinExecutorConfigurator.scala:48) > 2022-05-25T15:45:17.7809497Z May 25 15:45:17 at > java.util.concurrent.ForkJoinTask.doExec(ForkJoinTask.java:289) > 2022-05-25T15:45:17.7810702Z May 25 15:45:17 at > java.util.concurrent.ForkJoinPool$WorkQueue.runTask(ForkJoinPool.java:1056) > 2022-05-25T15:45:17.7812155Z May 25 15:45:17 at > java.util.concurrent.ForkJoinPool.runWorker(ForkJoinPool.java:1692) > 2022-05-25T15:45:17.7813377Z May 25 15:45:17 at > java.util.concurrent.ForkJoinWorkerThread.run(ForkJoinWorkerThread.java:175) > 2022-05-25T15:45:17.7814839Z May 25 15:45:17 Caused by: > org.apache.flink.runtime.JobException: Recovery is suppressed by > FixedDelayRestartBackoffTimeStrategy(maxNumberRestartAttempts=1, > backoffTimeMS=0) > 2022-05-25T15:45:17.7816569Z May 25 15:45:17 at > org.apache.flink.runtime.executiongraph.failover.flip1.ExecutionFailureHandler.handleFailure(ExecutionFailureHandler.java:138) > 2022-05-25T15:45:17.7818320Z May 25 15:45:17 at > org.apache.flink.runtime.executiongraph.failover.flip1.ExecutionFailureHandler.getFailureHandlingResult(ExecutionFailureHandler.java:82) > 2022-05-25T15:45:17.7819932Z May 25 15:45:17 at > 
org.apache.flink.runtime.scheduler.DefaultScheduler.handleTaskFailure(DefaultScheduler.java:300) > 2022-05-25T15:45:17.7821396Z May 25 15:45:17 at > org.apache.flink.runtime.scheduler.DefaultScheduler.maybeHandleTaskFailure(DefaultScheduler.java:290) > 2022-05-25T15:45:17.7822960Z May 25 15:45:17 at > org.apache.flink.runtime.scheduler.DefaultScheduler.updateTaskExecutionStateInternal(DefaultScheduler.java:281) > 2022-05-25T15:45:17.7824471Z May 25 15:45:17 at > org.apache.flink.runtime.scheduler.SchedulerBase.updateTaskExecutionState(SchedulerBase.java:716) > 2022-05-25T15:45:17.7826204Z May 25 15:45:17 at > org.apache.flink.runtime.scheduler.SchedulerNG.updateTaskExecutionState(SchedulerNG.java:78) > 2022-05-25T15:45:17.7827583Z May 25 15:45:17 at > org.apache.flink.runtime.jobmaster.JobMaster.updateTaskExecutionState(JobMaster.java:443) > 2022-05-25T15:45:17.7828764Z May 25 15:45:17 at > sun.reflect.GeneratedMethodAccessor17.invoke(Unknown Source) > 2022-05-25T15:45:17.7829926Z May 25 15:45:17 at > sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43) > 2022-05-25T15:45:17.7831105Z May 25 15:45:17 at > java.lang.reflect.Method.invoke(Method.java:498) > 2022-05-25T15:45:17.7832521Z May 25 15:45:17 at > org.apache.flink.runtime.rpc.akka.AkkaRpcActor.lambda$handleRpcInvocation$1(AkkaRpcActor.java:304) > 2022-05-25T15:45:17.7834045Z May 25 15:45:17 at > org.apache.flink.runtime.concurrent.akka.ClassLoadingUtils.runWithContextClassLoader(ClassLoadingUtils.java:83) > 2022-05-25T15:45:17.7835535Z May 25 15:45:17 at > org.apache.flink.runtime.rpc.akka.AkkaRpcActor.handleRpcInvocation(AkkaRpcActor.java:302) > 2022-05-25T15:45:17.7836936Z May 25 15:45:17 at > org.apache.flink.runtime.rpc.akka.AkkaRpcActor.handleRpcMessage(AkkaRpcActor.java:217) > 2022-05-25T15:45:17.7838289Z May 25 15:45:17 at > org.apache.flink.runtime.rpc.akka.FencedAkkaRpcActor.handleRpcMessage(FencedAkkaRpcActor.java:78) > 2022-05-25T15:45:17.7839679Z May 25 15:45:17 at 
> org.apache.flink.runtime.rpc.akka.AkkaRpcActor.handleMessage(AkkaRpcActor.java:163) > 2022-05-25T15:45:17.7840897Z May 25 15:45:17 at > akka.japi.pf.UnitCaseStatement.apply(CaseStatements.scala:24) > 2022-05-25T15:45:17.7842452Z May 25 15:45:17 at > akka.japi.pf.UnitCaseStatement.apply(CaseStatements.scala:20) > 2022-05-25T15:45:17.7843596Z May 25 15:45:17 at > scala.PartialFunction.applyOrElse(PartialFunction.scala:123) > 2022-05-25T15:45:17.7844725Z May 25 15:45:17 at > scala.PartialFunction.applyOrElse$(PartialFunction.scala:122) > 2022-05-25T15:45:17.7845896Z May 25 15:45:17 at > akka.japi.pf.UnitCaseStatement.applyOrElse(CaseStatements.scala:20) > 2022-05-25T15:45:17.7847076Z May 25 15:45:17 at > scala.PartialFunction$OrElse.applyOrElse(PartialFunction.scala:171) > 2022-05-25T15:45:17.7848258Z May 25 15:45:17 at > scala.PartialFunction$OrElse.applyOrElse(PartialFunction.scala:172) > 2022-05-25T15:45:17.7849401Z May 25 15:45:17 at > scala.PartialFunction$OrElse.applyOrElse(PartialFunction.scala:172) > 2022-05-25T15:45:17.7850510Z May 25 15:45:17 at > akka.actor.Actor.aroundReceive(Actor.scala:537) > 2022-05-25T15:45:17.7851532Z May 25 15:45:17 at > akka.actor.Actor.aroundReceive$(Actor.scala:535) > 2022-05-25T15:45:17.7852808Z May 25 15:45:17 at > akka.actor.AbstractActor.aroundReceive(AbstractActor.scala:220) > 2022-05-25T15:45:17.7853919Z May 25 15:45:17 at > akka.actor.ActorCell.receiveMessage(ActorCell.scala:580) > 2022-05-25T15:45:17.7855126Z May 25 15:45:17 at > akka.actor.ActorCell.invoke(ActorCell.scala:548) > 2022-05-25T15:45:17.7856172Z May 25 15:45:17 at > akka.dispatch.Mailbox.processMailbox(Mailbox.scala:270) > 2022-05-25T15:45:17.7857219Z May 25 15:45:17 at > akka.dispatch.Mailbox.run(Mailbox.scala:231) > 2022-05-25T15:45:17.7858209Z May 25 15:45:17 at > akka.dispatch.Mailbox.exec(Mailbox.scala:243) > 2022-05-25T15:45:17.7859009Z May 25 15:45:17 ... 
4 more > 2022-05-25T15:45:17.7859790Z May 25 15:45:17 Caused by: java.io.IOException: > java.lang.InterruptedException > 2022-05-25T15:45:17.7861180Z May 25 15:45:17 at > org.apache.flink.runtime.checkpoint.channel.ChannelStateWriteRequestExecutorImpl.close(ChannelStateWriteRequestExecutorImpl.java:175) > 2022-05-25T15:45:17.7862855Z May 25 15:45:17 at > org.apache.flink.runtime.checkpoint.channel.ChannelStateWriterImpl.close(ChannelStateWriterImpl.java:234) > 2022-05-25T15:45:17.7864447Z May 25 15:45:17 at > org.apache.flink.streaming.runtime.tasks.SubtaskCheckpointCoordinatorImpl.cancel(SubtaskCheckpointCoordinatorImpl.java:560) > 2022-05-25T15:45:17.7866077Z May 25 15:45:17 at > org.apache.flink.streaming.runtime.tasks.SubtaskCheckpointCoordinatorImpl.close(SubtaskCheckpointCoordinatorImpl.java:547) > 2022-05-25T15:45:17.7867645Z May 25 15:45:17 at > org.apache.flink.util.IOUtils.closeAll(IOUtils.java:254) > 2022-05-25T15:45:17.7868821Z May 25 15:45:17 at > org.apache.flink.core.fs.AutoCloseableRegistry.doClose(AutoCloseableRegistry.java:72) > 2022-05-25T15:45:17.7870194Z May 25 15:45:17 at > org.apache.flink.util.AbstractAutoCloseableRegistry.close(AbstractAutoCloseableRegistry.java:127) > 2022-05-25T15:45:17.7871500Z May 25 15:45:17 at > org.apache.flink.streaming.runtime.tasks.StreamTask.cleanUp(StreamTask.java:938) > 2022-05-25T15:45:17.7872941Z May 25 15:45:17 at > org.apache.flink.runtime.taskmanager.Task.lambda$restoreAndInvoke$1(Task.java:923) > 2022-05-25T15:45:17.7874230Z May 25 15:45:17 at > org.apache.flink.runtime.taskmanager.Task.runWithSystemExitMonitoring(Task.java:935) > 2022-05-25T15:45:17.7875430Z May 25 15:45:17 at > org.apache.flink.runtime.taskmanager.Task.restoreAndInvoke(Task.java:923) > 2022-05-25T15:45:17.7876630Z May 25 15:45:17 at > org.apache.flink.runtime.taskmanager.Task.doRun(Task.java:728) > 2022-05-25T15:45:17.7877772Z May 25 15:45:17 at > org.apache.flink.runtime.taskmanager.Task.run(Task.java:550) > 
2022-05-25T15:45:17.7878769Z May 25 15:45:17 at > java.lang.Thread.run(Thread.java:748) > 2022-05-25T15:45:17.7879657Z May 25 15:45:17 Caused by: > java.lang.InterruptedException > 2022-05-25T15:45:17.7880692Z May 25 15:45:17 at > java.util.concurrent.CompletableFuture.reportGet(CompletableFuture.java:347) > 2022-05-25T15:45:17.7882088Z May 25 15:45:17 at > java.util.concurrent.CompletableFuture.get(CompletableFuture.java:1908) > 2022-05-25T15:45:17.7883596Z May 25 15:45:17 at > org.apache.flink.runtime.checkpoint.channel.ChannelStateWriteRequest.lambda$buildFutureWriteRequest$4(ChannelStateWriteRequest.java:113) > 2022-05-25T15:45:17.7885476Z May 25 15:45:17 at > org.apache.flink.runtime.checkpoint.channel.CheckpointInProgressRequest.cancel(ChannelStateWriteRequest.java:253) > 2022-05-25T15:45:17.7887201Z May 25 15:45:17 at > org.apache.flink.runtime.checkpoint.channel.ChannelStateWriteRequestExecutorImpl.lambda$null$1(ChannelStateWriteRequestExecutorImpl.java:117) > 2022-05-25T15:45:17.7888654Z May 25 15:45:17 at > org.apache.flink.util.IOUtils.closeAll(IOUtils.java:254) > 2022-05-25T15:45:17.7889760Z May 25 15:45:17 at > org.apache.flink.util.IOUtils.closeAll(IOUtils.java:233) > 2022-05-25T15:45:17.7891233Z May 25 15:45:17 at > org.apache.flink.runtime.checkpoint.channel.ChannelStateWriteRequestExecutorImpl.cleanupRequests(ChannelStateWriteRequestExecutorImpl.java:115) > 2022-05-25T15:45:17.7892866Z May 25 15:45:17 at > org.apache.flink.util.IOUtils.closeAll(IOUtils.java:254) > 2022-05-25T15:45:17.7893951Z May 25 15:45:17 at > org.apache.flink.util.IOUtils.closeAll(IOUtils.java:233) > 2022-05-25T15:45:17.7895045Z May 25 15:45:17 at > org.apache.flink.util.IOUtils.closeAll(IOUtils.java:222) > 2022-05-25T15:45:17.7896427Z May 25 15:45:17 at > org.apache.flink.runtime.checkpoint.channel.ChannelStateWriteRequestExecutorImpl.run(ChannelStateWriteRequestExecutorImpl.java:80) > 2022-05-25T15:45:17.7897602Z May 25 15:45:17 ... 
1 more > {code} > https://dev.azure.com/apache-flink/apache-flink/_build/results?buildId=36066&view=logs&j=0c940707-2659-5648-cbe6-a1ad63045f0a&t=075c2716-8010-5565-fe08-3c4bb45824a4 -- This message was sent by Atlassian Jira (v8.20.7#820007)