[ https://issues.apache.org/jira/browse/IGNITE-25915?page=com.atlassian.jira.plugin.system.issuetabpanels:all-tabpanel ]
Kirill Sizov updated IGNITE-25915: ----------------------------------- Summary: Critical system error in ItIgniteNodeRestartTest on sendWithRetryTimeout (was: Critical system error on sendWithRetryTimeout) > Critical system error in ItIgniteNodeRestartTest on sendWithRetryTimeout > ------------------------------------------------------------------------ > > Key: IGNITE-25915 > URL: https://issues.apache.org/jira/browse/IGNITE-25915 > Project: Ignite > Issue Type: Bug > Affects Versions: 3.1 > Reporter: Kirill Sizov > Priority: Major > Labels: ignite-3 > Attachments: Integration Tests Module Runner 41134.zip, > _Integration_Tests_Module_Runner_41125.log.zip > > > Found in "ItIgniteNodeRestartTest.testRestartDiffConfig" and > "testOneNodeRestartWithGap", which fail with "PeerUnavailableException": > {noformat} > [10:58:19]W: [:ignite-runner:integrationTest] > org.apache.ignite.internal.failure.StackTraceCapturingException: Unknown > error[10:58:19]W: [:ignite-runner:integrationTest] at > org.apache.ignite.internal.failure.FailureManager.process(FailureManager.java:191)[10:58:19]W: > [:ignite-runner:integrationTest] at > org.apache.ignite.internal.failure.FailureManager.process(FailureManager.java:168)[10:58:19]W: > [:ignite-runner:integrationTest] at > org.apache.ignite.internal.metastorage.server.WatchProcessor.notifyFailureHandlerOnFirstFailureInNotificationChain(WatchProcessor.java:441)[10:58:19]W: > [:ignite-runner:integrationTest] at > org.apache.ignite.internal.metastorage.server.WatchProcessor.lambda$enqueue$3(WatchProcessor.java:240)[10:58:19]W: > [:ignite-runner:integrationTest] at > java.base/java.util.concurrent.CompletableFuture.uniWhenComplete(CompletableFuture.java:863)[10:58:19]W: > [:ignite-runner:integrationTest] at > java.base/java.util.concurrent.CompletableFuture$UniWhenComplete.tryFire(CompletableFuture.java:841)[10:58:19]W: > [:ignite-runner:integrationTest] at >
java.base/java.util.concurrent.CompletableFuture.postComplete(CompletableFuture.java:510)[10:58:19]W: > [:ignite-runner:integrationTest] at > java.base/java.util.concurrent.CompletableFuture.completeExceptionally(CompletableFuture.java:2162)[10:58:19]W: > [:ignite-runner:integrationTest] at > org.apache.ignite.internal.raft.RaftGroupServiceImpl.sendWithRetry(RaftGroupServiceImpl.java:686)[10:58:19]W: > [:ignite-runner:integrationTest] at > org.apache.ignite.internal.raft.RaftGroupServiceImpl.sendWithRetry(RaftGroupServiceImpl.java:660)[10:58:19]W: > [:ignite-runner:integrationTest] at > org.apache.ignite.internal.raft.RaftGroupServiceImpl.lambda$scheduleRetry$51(RaftGroupServiceImpl.java:910)[10:58:19]W: > [:ignite-runner:integrationTest] at > java.base/java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:539)[10:58:19]W: > [:ignite-runner:integrationTest] at > java.base/java.util.concurrent.FutureTask.run(FutureTask.java:264)[10:58:19]W: > [:ignite-runner:integrationTest] at > java.base/java.util.concurrent.ScheduledThreadPoolExecutor$ScheduledFutureTask.run(ScheduledThreadPoolExecutor.java:304)[10:58:19]W: > [:ignite-runner:integrationTest] at > java.base/java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1136)[10:58:19]W: > [:ignite-runner:integrationTest] at > java.base/java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:635)[10:58:19]W: > [:ignite-runner:integrationTest] at > java.base/java.lang.Thread.run(Thread.java:833)[10:58:19]W: > [:ignite-runner:integrationTest] Caused by: > java.util.concurrent.CompletionException: > java.util.concurrent.TimeoutException: Send with retry timed out [retryCount > = 340, groupId = metastorage_group, traceId = null, request = > org.apache.ignite.raft.jraft.rpc.WriteActionRequestImpl(org.apache.ignite.internal.metastorage.command.MultiInvokeCommandImpl), > originCommand = null, retryReasons = [[time=1752595098493, msg=Peer > iinrt_tonrwg_0:0 threw 
PeerUnavailableException; attemptWaitDuration=18, > attemptDuration=2, attemptStartTime=2025-07-15T15:58:18,493], > [time=1752595098513, msg=Peer iinrt_tonrwg_0:0 threw > PeerUnavailableException; attemptWaitDuration=18, attemptDuration=2, > attemptStartTime=2025-07-15T15:58:18,513], [time=1752595098533, msg=Peer > iinrt_tonrwg_0:0 threw PeerUnavailableException; attemptWaitDuration=18, > attemptDuration=2, attemptStartTime=2025-07-15T15:58:18,533], > [time=1752595098553, msg=Peer iinrt_tonrwg_0:0 threw > PeerUnavailableException; attemptWaitDuration=18, attemptDuration=2, > attemptStartTime=2025-07-15T15:58:18,553], [time=1752595098573, msg=Peer > iinrt_tonrwg_0:0 threw PeerUnavailableException; attemptWaitDuration=18, > attemptDuration=2, attemptStartTime=2025-07-15T15:58:18,573], > [time=1752595098594, msg=Peer iinrt_tonrwg_0:0 threw > PeerUnavailableException; attemptWaitDuration=18, attemptDuration=3, > attemptStartTime=2025-07-15T15:58:18,594], [time=1752595098614, msg=Peer > iinrt_tonrwg_0:0 threw PeerUnavailableException; attemptWaitDuration=17, > attemptDuration=3, attemptStartTime=2025-07-15T15:58:18,614], > [time=1752595098634, msg=Peer iinrt_tonrwg_0:0 threw > PeerUnavailableException; attemptWaitDuration=17, attemptDuration=3, > attemptStartTime=2025-07-15T15:58:18,634], [time=1752595098654, msg=Peer > iinrt_tonrwg_0:0 threw PeerUnavailableException; attemptWaitDuration=17, > attemptDuration=3, attemptStartTime=2025-07-15T15:58:18,654], > [time=1752595098674, msg=Peer iinrt_tonrwg_0:0 threw > PeerUnavailableException; attemptWaitDuration=17, attemptDuration=3, > attemptStartTime=2025-07-15T15:58:18,674], [time=1752595098694, msg=Peer > iinrt_tonrwg_0:0 threw PeerUnavailableException; attemptWaitDuration=17, > attemptDuration=3, attemptStartTime=2025-07-15T15:58:18,694], > [time=1752595098714, msg=Peer iinrt_tonrwg_0:0 threw > PeerUnavailableException; attemptWaitDuration=17, attemptDuration=3, > attemptStartTime=2025-07-15T15:58:18,714], 
[time=1752595098735, msg=Peer > iinrt_tonrwg_0:0 threw PeerUnavailableException; attemptWaitDuration=17, > attemptDuration=4, attemptStartTime=2025-07-15T15:58:18,735], > [time=1752595098755, msg=Peer iinrt_tonrwg_0:0 threw > PeerUnavailableException; attemptWaitDuration=16, attemptDuration=4, > attemptStartTime=2025-07-15T15:58:18,755], [time=1752595098775, msg=Peer > iinrt_tonrwg_0:0 threw PeerUnavailableException; attemptWaitDuration=16, > attemptDuration=4, attemptStartTime=2025-07-15T15:58:18,775], > [time=1752595098795, msg=Peer iinrt_tonrwg_0:0 threw > PeerUnavailableException; attemptWaitDuration=16, attemptDuration=4, > attemptStartTime=2025-07-15T15:58:18,795], [time=1752595098815, msg=Peer > iinrt_tonrwg_0:0 threw PeerUnavailableException; attemptWaitDuration=16, > attemptDuration=4, attemptStartTime=2025-07-15T15:58:18,815], > [time=1752595098836, msg=Peer iinrt_tonrwg_0:0 threw > PeerUnavailableException; attemptWaitDuration=16, attemptDuration=5, > attemptStartTime=2025-07-15T15:58:18,836], [time=1752595098856, msg=Peer > iinrt_tonrwg_0:0 threw PeerUnavailableException; attemptWaitDuration=15, > attemptDuration=5, attemptStartTime=2025-07-15T15:58:18,856], > [time=1752595098876, msg=Peer iinrt_tonrwg_0:0 threw > PeerUnavailableException; attemptWaitDuration=15, attemptDuration=5, > attemptStartTime=2025-07-15T15:58:18,876], [time=1752595098896, msg=Peer > iinrt_tonrwg_0:0 threw PeerUnavailableException; attemptWaitDuration=15, > attemptDuration=5, attemptStartTime=2025-07-15T15:58:18,896], > [time=1752595098916, msg=Peer iinrt_tonrwg_0:0 threw > PeerUnavailableException; attemptWaitDuration=15, attemptDuration=5, > attemptStartTime=2025-07-15T15:58:18,916], [time=1752595098936, msg=Peer > iinrt_tonrwg_0:0 threw PeerUnavailableException; attemptWaitDuration=15, > attemptDuration=5, attemptStartTime=2025-07-15T15:58:18,936], > [time=1752595098956, msg=Peer iinrt_tonrwg_0:0 threw > PeerUnavailableException; attemptWaitDuration=15, attemptDuration=5, > 
attemptStartTime=2025-07-15T15:58:18,956], [time=1752595098977, msg=Peer > iinrt_tonrwg_0:0 threw PeerUnavailableException; attemptWaitDuration=15, > attemptDuration=6, attemptStartTime=2025-07-15T15:58:18,977]], stopTime = > 1752595098991, currentTime = 1752595098997, startTime = 1752595088991, > duration = 10006].[10:58:19]W: [:ignite-runner:integrationTest] at > java.base/java.util.concurrent.CompletableFuture.encodeThrowable(CompletableFuture.java:332)[10:58:19]W: > [:ignite-runner:integrationTest] at > java.base/java.util.concurrent.CompletableFuture.completeThrowable(CompletableFuture.java:347)[10:58:19]W: > [:ignite-runner:integrationTest] at > java.base/java.util.concurrent.CompletableFuture$UniApply.tryFire(CompletableFuture.java:636)[10:58:19]W: > [:ignite-runner:integrationTest] ... 11 more{noformat} -- This message was sent by Atlassian Jira (v8.20.10#820010)