davidshtian commented on issue #7591: URL: https://github.com/apache/hudi/issues/7591#issuecomment-1375225426
Or there are lots of similar logs like this: "RemoteTransportException: Connection unexpectedly closed by remote task manager '142.151.160.20/142.151.160.20:6121'. This might indicate that the remote task manager was lost. This may indicate that the taskmanagers are overloaded." ``` "applicationARN": "arn:aws:kinesisanalytics:us-east-1:xxx:application/kda-studio-david", "applicationVersionId": "19", "locationInformation": "org.apache.zeppelin.flink.FlinkSqlInterrpeter.runSqlList(FlinkSqlInterrpeter.java:163)", "logger": "org.apache.zeppelin.flink.FlinkSqlInterrpeter", "message": "Fail to run sql:INSERT INTO t1 SELECT uuid, event_time, ticker,price from stock_table", "messageSchemaVersion": "1", "messageType": "ERROR", "threadName": "ParallelScheduler-Worker-9", "throwableInformation": "java.io.IOException: org.apache.flink.client.program.ProgramInvocationException: Job failed (JobID: 3e6e3e07934084f5fafc542a4a91bc2c) at org.apache.zeppelin.flink.FlinkSqlInterrpeter.callInsertInto(FlinkSqlInterrpeter.java:538) at org.apache.zeppelin.flink.FlinkStreamSqlInterpreter.callInsertInto(FlinkStreamSqlInterpreter.java:97) at org.apache.zeppelin.flink.FlinkSqlInterrpeter.callCommand(FlinkSqlInterrpeter.java:273) at org.apache.zeppelin.flink.FlinkSqlInterrpeter.runSqlList(FlinkSqlInterrpeter.java:160) at org.apache.zeppelin.flink.FlinkSqlInterrpeter.internalInterpret(FlinkSqlInterrpeter.java:112) at org.apache.zeppelin.interpreter.AbstractInterpreter.interpret(AbstractInterpreter.java:47) at org.apache.zeppelin.interpreter.LazyOpenInterpreter.interpret(LazyOpenInterpreter.java:110) at org.apache.zeppelin.interpreter.remote.RemoteInterpreterServer$InterpretJob.jobRun(RemoteInterpreterServer.java:852) at org.apache.zeppelin.interpreter.remote.RemoteInterpreterServer$InterpretJob.jobRun(RemoteInterpreterServer.java:744) at org.apache.zeppelin.scheduler.Job.run(Job.java:172) at org.apache.zeppelin.scheduler.AbstractScheduler.runJob(AbstractScheduler.java:132) at 
org.apache.zeppelin.scheduler.ParallelScheduler.lambda$runJobInScheduler$0(ParallelScheduler.java:46) at java.base/java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1128) at java.base/java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:628) at java.base/java.lang.Thread.run(Thread.java:829) Caused by: org.apache.flink.client.program.ProgramInvocationException: Job failed (JobID: 3e6e3e07934084f5fafc542a4a91bc2c) at org.apache.flink.client.deployment.ClusterClientJobClientAdapter.lambda$getJobExecutionResult$6(ClusterClientJobClientAdapter.java:125) at java.base/java.util.concurrent.CompletableFuture$UniApply.tryFire(CompletableFuture.java:642) at java.base/java.util.concurrent.CompletableFuture.postComplete(CompletableFuture.java:506) at java.base/java.util.concurrent.CompletableFuture.complete(CompletableFuture.java:2073) at org.apache.flink.runtime.concurrent.FutureUtils.lambda$retryOperationWithDelay$9(FutureUtils.java:394) at java.base/java.util.concurrent.CompletableFuture.uniWhenComplete(CompletableFuture.java:859) at java.base/java.util.concurrent.CompletableFuture$UniWhenComplete.tryFire(CompletableFuture.java:837) at java.base/java.util.concurrent.CompletableFuture.postComplete(CompletableFuture.java:506) at java.base/java.util.concurrent.CompletableFuture.complete(CompletableFuture.java:2073) at org.apache.flink.client.program.rest.RestClusterClient.lambda$pollResourceAsync$24(RestClusterClient.java:670) at java.base/java.util.concurrent.CompletableFuture.uniWhenComplete(CompletableFuture.java:859) at java.base/java.util.concurrent.CompletableFuture$UniWhenComplete.tryFire(CompletableFuture.java:837) at java.base/java.util.concurrent.CompletableFuture.postComplete(CompletableFuture.java:506) at java.base/java.util.concurrent.CompletableFuture.complete(CompletableFuture.java:2073) at org.apache.flink.runtime.concurrent.FutureUtils.lambda$retryOperationWithDelay$9(FutureUtils.java:394) at 
java.base/java.util.concurrent.CompletableFuture.uniWhenComplete(CompletableFuture.java:859) at java.base/java.util.concurrent.CompletableFuture$UniWhenComplete.tryFire(CompletableFuture.java:837) at java.base/java.util.concurrent.CompletableFuture.postComplete(CompletableFuture.java:506) at java.base/java.util.concurrent.CompletableFuture.postFire(CompletableFuture.java:610) at java.base/java.util.concurrent.CompletableFuture$UniCompose.tryFire(CompletableFuture.java:1085) at java.base/java.util.concurrent.CompletableFuture$Completion.run(CompletableFuture.java:478) ... 3 more Caused by: org.apache.flink.runtime.client.JobExecutionException: Job execution failed. at org.apache.flink.runtime.jobmaster.JobResult.toJobExecutionResult(JobResult.java:144) at org.apache.flink.client.deployment.ClusterClientJobClientAdapter.lambda$getJobExecutionResult$6(ClusterClientJobClientAdapter.java:123) ... 23 more Caused by: org.apache.flink.runtime.JobException: Recovery is suppressed by NoRestartBackoffTimeStrategy at org.apache.flink.runtime.executiongraph.failover.flip1.ExecutionFailureHandler.handleFailure(ExecutionFailureHandler.java:138) at org.apache.flink.runtime.executiongraph.failover.flip1.ExecutionFailureHandler.getFailureHandlingResult(ExecutionFailureHandler.java:82) at org.apache.flink.runtime.scheduler.DefaultScheduler.handleTaskFailure(DefaultScheduler.java:222) at org.apache.flink.runtime.scheduler.DefaultScheduler.maybeHandleTaskFailure(DefaultScheduler.java:212) at org.apache.flink.runtime.scheduler.DefaultScheduler.updateTaskExecutionStateInternal(DefaultScheduler.java:203) at org.apache.flink.runtime.scheduler.SchedulerBase.updateTaskExecutionState(SchedulerBase.java:718) at org.apache.flink.runtime.scheduler.SchedulerNG.updateTaskExecutionState(SchedulerNG.java:79) at org.apache.flink.runtime.jobmaster.JobMaster.updateTaskExecutionState(JobMaster.java:443) at jdk.internal.reflect.GeneratedMethodAccessor100.invoke(Unknown Source) at 
java.base/jdk.internal.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43) at java.base/java.lang.reflect.Method.invoke(Method.java:566) at org.apache.flink.runtime.rpc.akka.AkkaRpcActor.handleRpcInvocation(AkkaRpcActor.java:305) at org.apache.flink.runtime.rpc.akka.AkkaRpcActor.handleRpcMessage(AkkaRpcActor.java:212) at org.apache.flink.runtime.rpc.akka.FencedAkkaRpcActor.handleRpcMessage(FencedAkkaRpcActor.java:77) at org.apache.flink.runtime.rpc.akka.AkkaRpcActor.handleMessage(AkkaRpcActor.java:158) at akka.japi.pf.UnitCaseStatement.apply(CaseStatements.scala:26) at akka.japi.pf.UnitCaseStatement.apply(CaseStatements.scala:21) at scala.PartialFunction.applyOrElse(PartialFunction.scala:123) at scala.PartialFunction.applyOrElse$(PartialFunction.scala:122) at akka.japi.pf.UnitCaseStatement.applyOrElse(CaseStatements.scala:21) at scala.PartialFunction$OrElse.applyOrElse(PartialFunction.scala:171) at scala.PartialFunction$OrElse.applyOrElse(PartialFunction.scala:172) at scala.PartialFunction$OrElse.applyOrElse(PartialFunction.scala:172) at akka.actor.Actor.aroundReceive(Actor.scala:517) at akka.actor.Actor.aroundReceive$(Actor.scala:515) at akka.actor.AbstractActor.aroundReceive(AbstractActor.scala:225) at akka.actor.ActorCell.receiveMessage(ActorCell.scala:592) at akka.actor.ActorCell.invoke(ActorCell.scala:561) at akka.dispatch.Mailbox.processMailbox(Mailbox.scala:258) at akka.dispatch.Mailbox.run(Mailbox.scala:225) at akka.dispatch.Mailbox.exec(Mailbox.scala:235) at akka.dispatch.forkjoin.ForkJoinTask.doExec(ForkJoinTask.java:260) at akka.dispatch.forkjoin.ForkJoinPool$WorkQueue.runTask(ForkJoinPool.java:1339) at akka.dispatch.forkjoin.ForkJoinPool.runWorker(ForkJoinPool.java:1979) at akka.dispatch.forkjoin.ForkJoinWorkerThread.run(ForkJoinWorkerThread.java:107) Caused by: org.apache.flink.runtime.io.network.netty.exception.RemoteTransportException: Connection unexpectedly closed by remote task manager '142.151.160.20/142.151.160.20:6121'. 
This might indicate that the remote task manager was lost. at org.apache.flink.runtime.io.network.netty.CreditBasedPartitionRequestClientHandler.channelInactive(CreditBasedPartitionRequestClientHandler.java:160) at org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeChannelInactive(AbstractChannelHandlerContext.java:262) at org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeChannelInactive(AbstractChannelHandlerContext.java:248) at org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.fireChannelInactive(AbstractChannelHandlerContext.java:241) at org.apache.flink.shaded.netty4.io.netty.channel.ChannelInboundHandlerAdapter.channelInactive(ChannelInboundHandlerAdapter.java:81) at org.apache.flink.runtime.io.network.netty.NettyMessageClientDecoderDelegate.channelInactive(NettyMessageClientDecoderDelegate.java:94) at org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeChannelInactive(AbstractChannelHandlerContext.java:262) at org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeChannelInactive(AbstractChannelHandlerContext.java:248) at org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.fireChannelInactive(AbstractChannelHandlerContext.java:241) at org.apache.flink.shaded.netty4.io.netty.handler.codec.ByteToMessageDecoder.channelInputClosed(ByteToMessageDecoder.java:389) at org.apache.flink.shaded.netty4.io.netty.handler.codec.ByteToMessageDecoder.channelInactive(ByteToMessageDecoder.java:354) at org.apache.flink.shaded.netty4.io.netty.handler.ssl.SslHandler.channelInactive(SslHandler.java:1106) at org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeChannelInactive(AbstractChannelHandlerContext.java:262) at org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeChannelInactive(AbstractChannelHandlerContext.java:248) at 
org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.fireChannelInactive(AbstractChannelHandlerContext.java:241) at org.apache.flink.shaded.netty4.io.netty.channel.DefaultChannelPipeline$HeadContext.channelInactive(DefaultChannelPipeline.java:1405) at org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeChannelInactive(AbstractChannelHandlerContext.java:262) at org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeChannelInactive(AbstractChannelHandlerContext.java:248) at org.apache.flink.shaded.netty4.io.netty.channel.DefaultChannelPipeline.fireChannelInactive(DefaultChannelPipeline.java:901) at org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannel$AbstractUnsafe$8.run(AbstractChannel.java:818) at org.apache.flink.shaded.netty4.io.netty.util.concurrent.AbstractEventExecutor.safeExecute(AbstractEventExecutor.java:164) at org.apache.flink.shaded.netty4.io.netty.util.concurrent.SingleThreadEventExecutor.runAllTasks(SingleThreadEventExecutor.java:472) at org.apache.flink.shaded.netty4.io.netty.channel.epoll.EpollEventLoop.run(EpollEventLoop.java:384) at org.apache.flink.shaded.netty4.io.netty.util.concurrent.SingleThreadEventExecutor$4.run(SingleThreadEventExecutor.java:989) at org.apache.flink.shaded.netty4.io.netty.util.internal.ThreadExecutorMap$2.run(ThreadExecutorMap.java:74) at java.base/java.lang.Thread.run(Thread.java:829) " } ``` -- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. To unsubscribe, e-mail: commits-unsubscr...@hudi.apache.org For queries about this service, please contact Infrastructure at: us...@infra.apache.org