[ https://issues.apache.org/jira/browse/CASSANDRA-19761?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=17864760#comment-17864760 ]
David Capwell commented on CASSANDRA-19761: ------------------------------------------- Here is one more affected stack trace: {code} node1_MiscStage:1: java.base@11.0.15/jdk.internal.misc.Unsafe.park(Native Method) java.base@11.0.15/java.util.concurrent.locks.LockSupport.parkNanos(LockSupport.java:357) org.apache.cassandra.utils.concurrent.WaitQueue$Standard$AbstractSignal.awaitUntil(WaitQueue.java:303) org.apache.cassandra.utils.concurrent.Awaitable$AsyncAwaitable.awaitUntil(Awaitable.java:314) org.apache.cassandra.utils.concurrent.AsyncFuture.awaitUntil(AsyncFuture.java:171) org.apache.cassandra.utils.concurrent.Awaitable$Defaults.awaitUntilUninterruptibly(Awaitable.java:163) org.apache.cassandra.utils.concurrent.Awaitable$Defaults.awaitUninterruptibly(Awaitable.java:124) org.apache.cassandra.utils.concurrent.AbstractFuture.awaitUninterruptibly(AbstractFuture.java:494) org.apache.cassandra.tcm.PaxosBackedProcessor.fetchLogAndWait(PaxosBackedProcessor.java:139) org.apache.cassandra.tcm.AbstractLocalProcessor.commit(AbstractLocalProcessor.java:109) org.apache.cassandra.distributed.test.log.TestProcessor.commit(TestProcessor.java:61) org.apache.cassandra.tcm.ClusterMetadataService$SwitchableProcessor.commit(ClusterMetadataService.java:841) org.apache.cassandra.tcm.Processor.commit(Processor.java:45) org.apache.cassandra.tcm.ClusterMetadataService.commit(ClusterMetadataService.java:516) {code} > When JVM dtest is shutting down, if a new epoch is being committed the node > is unable to shut down > -------------------------------------------------------------------------------------------------- > > Key: CASSANDRA-19761 > URL: https://issues.apache.org/jira/browse/CASSANDRA-19761 > Project: Cassandra > Issue Type: Bug > Components: Transactional Cluster Metadata > Reporter: David Capwell > Priority: Normal > > The following was seen in the accord branch, but the problem is found in > trunk as well. 
> {code} > node1_isolatedExecutor:8: > java.base@11.0.15/jdk.internal.misc.Unsafe.park(Native Method) > > java.base@11.0.15/java.util.concurrent.locks.LockSupport.parkNanos(LockSupport.java:234) > > org.apache.cassandra.simulator.systems.InterceptorOfSystemMethods$None.parkNanos(InterceptorOfSystemMethods.java:373) > > org.apache.cassandra.simulator.systems.InterceptorOfSystemMethods$Global.parkNanos(InterceptorOfSystemMethods.java:166) > > java.base@11.0.15/java.util.concurrent.locks.AbstractQueuedSynchronizer$ConditionObject.awaitNanos(AbstractQueuedSynchronizer.java:2123) > > java.base@11.0.15/java.util.concurrent.ThreadPoolExecutor.awaitTermination(ThreadPoolExecutor.java:1454) > > org.apache.cassandra.utils.ExecutorUtils.awaitTerminationUntil(ExecutorUtils.java:110) > > org.apache.cassandra.utils.ExecutorUtils.awaitTermination(ExecutorUtils.java:100) > org.apache.cassandra.concurrent.Stage.shutdownAndWait(Stage.java:195) > > org.apache.cassandra.distributed.impl.Instance.lambda$shutdown$44(Instance.java:975) > {code} > {code} > node1_MiscStage:1: > java.base@11.0.15/jdk.internal.misc.Unsafe.park(Native Method) > > java.base@11.0.15/java.util.concurrent.locks.LockSupport.park(LockSupport.java:323) > > org.apache.cassandra.utils.concurrent.WaitQueue$Standard$AbstractSignal.await(WaitQueue.java:290) > > org.apache.cassandra.utils.concurrent.WaitQueue$Standard$AbstractSignal.await(WaitQueue.java:283) > > org.apache.cassandra.utils.concurrent.Awaitable$AsyncAwaitable.await(Awaitable.java:306) > > org.apache.cassandra.utils.concurrent.Awaitable$AsyncAwaitable.await(Awaitable.java:338) > > org.apache.cassandra.utils.concurrent.Awaitable$Defaults.awaitUninterruptibly(Awaitable.java:186) > > org.apache.cassandra.utils.concurrent.Awaitable$AbstractAwaitable.awaitUninterruptibly(Awaitable.java:259) > org.apache.cassandra.tcm.log.LocalLog$Async.runOnce(LocalLog.java:710) > org.apache.cassandra.tcm.log.LocalLog.runOnce(LocalLog.java:404) > > 
org.apache.cassandra.tcm.log.LocalLog.waitForHighestConsecutive(LocalLog.java:346) > > org.apache.cassandra.tcm.PaxosBackedProcessor.fetchLogAndWait(PaxosBackedProcessor.java:163) > > org.apache.cassandra.tcm.AbstractLocalProcessor.commit(AbstractLocalProcessor.java:109) > > org.apache.cassandra.distributed.test.log.TestProcessor.commit(TestProcessor.java:61) > > org.apache.cassandra.tcm.ClusterMetadataService$SwitchableProcessor.commit(ClusterMetadataService.java:841) > org.apache.cassandra.tcm.Processor.commit(Processor.java:45) > > org.apache.cassandra.tcm.ClusterMetadataService.commit(ClusterMetadataService.java:516) > > org.apache.cassandra.service.accord.AccordFastPathCoordinator$Impl.lambda$updateFastPath$2(AccordFastPathCoordinator.java:208) > > org.apache.cassandra.service.accord.AccordFastPathCoordinator$Impl$$Lambda$11211/0x0000000802441840.run(Unknown > Source) > {code} > Accord is trying to commit a new epoch, but TCM uses “awaitUninterruptibly”, > which ignores the thread interrupt issued while the cluster is shutting down. > When this happens, the instance is unable to make progress and loops > endlessly, preventing the test from closing. -- This message was sent by Atlassian Jira (v8.20.10#820010) --------------------------------------------------------------------- To unsubscribe, e-mail: commits-unsubscr...@cassandra.apache.org For additional commands, e-mail: commits-h...@cassandra.apache.org