Mate Czagany created FLINK-38967:
------------------------------------

             Summary: UnalignedCheckpointFailureHandlingITCase fails intermittently
                 Key: FLINK-38967
                 URL: https://issues.apache.org/jira/browse/FLINK-38967
             Project: Flink
          Issue Type: Improvement
          Components: Tests
            Reporter: Mate Czagany


{code:java}
Jan 23 09:35:49 09:35:49.853 [ERROR] Tests run: 1, Failures: 0, Errors: 1, Skipped: 0, Time elapsed: 8.913 s <<< FAILURE! -- in org.apache.flink.test.checkpointing.UnalignedCheckpointFailureHandlingITCase
Jan 23 09:35:49 09:35:49.853 [ERROR] org.apache.flink.test.checkpointing.UnalignedCheckpointFailureHandlingITCase.testCheckpointSuccessAfterFailure -- Time elapsed: 8.869 s <<< ERROR!
Jan 23 09:35:49 java.util.concurrent.ExecutionException: 
org.apache.flink.runtime.checkpoint.CheckpointException: Asynchronous task 
checkpoint failed.
Jan 23 09:35:49         at 
java.base/java.util.concurrent.CompletableFuture.reportGet(CompletableFuture.java:396)
Jan 23 09:35:49         at 
java.base/java.util.concurrent.CompletableFuture.get(CompletableFuture.java:2073)
Jan 23 09:35:49         at 
org.apache.flink.test.checkpointing.UnalignedCheckpointFailureHandlingITCase.testCheckpointSuccessAfterFailure(UnalignedCheckpointFailureHandlingITCase.java:123)
Jan 23 09:35:49         at 
java.base/java.lang.reflect.Method.invoke(Method.java:568)
Jan 23 09:35:49 Caused by: 
org.apache.flink.runtime.checkpoint.CheckpointException: Asynchronous task 
checkpoint failed.
Jan 23 09:35:49         at 
org.apache.flink.runtime.checkpoint.PendingCheckpoint.abort(PendingCheckpoint.java:561)
Jan 23 09:35:49         at 
org.apache.flink.runtime.checkpoint.CheckpointCoordinator.abortPendingCheckpoint(CheckpointCoordinator.java:2274)
Jan 23 09:35:49         at 
org.apache.flink.runtime.checkpoint.CheckpointCoordinator.receiveDeclineMessage(CheckpointCoordinator.java:1175)
Jan 23 09:35:49         at 
org.apache.flink.runtime.scheduler.ExecutionGraphHandler.lambda$declineCheckpoint$3(ExecutionGraphHandler.java:123)
Jan 23 09:35:49         at 
org.apache.flink.runtime.scheduler.ExecutionGraphHandler.lambda$processCheckpointCoordinatorMessage$4(ExecutionGraphHandler.java:139)
Jan 23 09:35:49         at 
org.apache.flink.util.MdcUtils.lambda$wrapRunnable$1(MdcUtils.java:70)
Jan 23 09:35:49         at 
java.base/java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1136)
Jan 23 09:35:49         at 
java.base/java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:635)
Jan 23 09:35:49         at java.base/java.lang.Thread.run(Thread.java:833)
Jan 23 09:35:49 Caused by: 
org.apache.flink.runtime.checkpoint.CheckpointException: 
org.apache.flink.runtime.checkpoint.CheckpointException: Asynchronous task 
checkpoint failed.
Jan 23 09:35:49         at 
org.apache.flink.streaming.runtime.tasks.AsyncCheckpointRunnable.handleExecutionException(AsyncCheckpointRunnable.java:320)
Jan 23 09:35:49         at 
org.apache.flink.streaming.runtime.tasks.AsyncCheckpointRunnable.run(AsyncCheckpointRunnable.java:155)
Jan 23 09:35:49         ... 4 more
Jan 23 09:35:49 Caused by: java.lang.Exception: java.lang.Exception: Could not 
materialize checkpoint 2 for operator Source: num-source (2/2)#0.
Jan 23 09:35:49         at 
org.apache.flink.streaming.runtime.tasks.AsyncCheckpointRunnable.handleExecutionException(AsyncCheckpointRunnable.java:298)
Jan 23 09:35:49         ... 5 more
Jan 23 09:35:49 Caused by: java.util.concurrent.ExecutionException: 
java.util.concurrent.ExecutionException: 
org.apache.flink.test.checkpointing.UnalignedCheckpointFailureHandlingITCase$TestException:
 failure from closeAndGetHandle
Jan 23 09:35:49         at 
java.base/java.util.concurrent.FutureTask.report(FutureTask.java:122)
Jan 23 09:35:49         at 
java.base/java.util.concurrent.FutureTask.get(FutureTask.java:191)
Jan 23 09:35:49         at 
org.apache.flink.util.concurrent.FutureUtils.runIfNotDoneAndGet(FutureUtils.java:511)
Jan 23 09:35:49         at 
org.apache.flink.streaming.api.operators.OperatorSnapshotFinalizer.create(OperatorSnapshotFinalizer.java:60)
Jan 23 09:35:49         at 
org.apache.flink.streaming.runtime.tasks.AsyncCheckpointRunnable.finalizeNonFinishedSnapshots(AsyncCheckpointRunnable.java:192)
Jan 23 09:35:49         at 
org.apache.flink.streaming.runtime.tasks.AsyncCheckpointRunnable.run(AsyncCheckpointRunnable.java:124)
Jan 23 09:35:49         ... 4 more
Jan 23 09:35:49 Caused by: 
org.apache.flink.test.checkpointing.UnalignedCheckpointFailureHandlingITCase$TestException:
 
org.apache.flink.test.checkpointing.UnalignedCheckpointFailureHandlingITCase$TestException:
 failure from closeAndGetHandle
Jan 23 09:35:49         at 
org.apache.flink.test.checkpointing.UnalignedCheckpointFailureHandlingITCase$FailingOnceFsCheckpointOutputStream.closeAndGetHandle(UnalignedCheckpointFailureHandlingITCase.java:337)
Jan 23 09:35:49         at 
org.apache.flink.runtime.state.DefaultOperatorStateBackendSnapshotStrategy.lambda$asyncSnapshot$2(DefaultOperatorStateBackendSnapshotStrategy.java:218)
Jan 23 09:35:49         at 
org.apache.flink.runtime.state.SnapshotStrategyRunner$1.callInternal(SnapshotStrategyRunner.java:91)
Jan 23 09:35:49         at 
org.apache.flink.runtime.state.SnapshotStrategyRunner$1.callInternal(SnapshotStrategyRunner.java:88)
Jan 23 09:35:49         at 
org.apache.flink.runtime.state.AsyncSnapshotCallable.call(AsyncSnapshotCallable.java:78)
Jan 23 09:35:49         at 
java.base/java.util.concurrent.FutureTask.run(FutureTask.java:264)
Jan 23 09:35:49         at 
org.apache.flink.util.concurrent.FutureUtils.runIfNotDoneAndGet(FutureUtils.java:508)
Jan 23 09:35:49         ... 7 more
{code}



--
This message was sent by Atlassian Jira
(v8.20.10#820010)

Reply via email to