davidshtian commented on issue #7591:
URL: https://github.com/apache/hudi/issues/7591#issuecomment-1375225426

   Or there are lots of similar log entries like this: "RemoteTransportException: Connection 
unexpectedly closed by remote task manager 
'142.151.160.20/142.151.160.20:6121'. This might indicate that the remote task 
manager was lost.
   This may indicate that the taskmanagers are overloaded."
   ```
   "applicationARN": 
"arn:aws:kinesisanalytics:us-east-1:xxx:application/kda-studio-david",
   "applicationVersionId": "19",
   "locationInformation": 
"org.apache.zeppelin.flink.FlinkSqlInterrpeter.runSqlList(FlinkSqlInterrpeter.java:163)",
   "logger": "org.apache.zeppelin.flink.FlinkSqlInterrpeter",
   "message": "Fail to run sql:INSERT INTO t1 SELECT uuid, event_time, 
ticker,price from stock_table",
   "messageSchemaVersion": "1",
   "messageType": "ERROR",
   "threadName": "ParallelScheduler-Worker-9",
   "throwableInformation": "java.io.IOException: 
org.apache.flink.client.program.ProgramInvocationException: Job failed (JobID: 
3e6e3e07934084f5fafc542a4a91bc2c)
   at 
org.apache.zeppelin.flink.FlinkSqlInterrpeter.callInsertInto(FlinkSqlInterrpeter.java:538
   at 
org.apache.zeppelin.flink.FlinkStreamSqlInterpreter.callInsertInto(FlinkStreamSqlInterpreter.java:97
   at 
org.apache.zeppelin.flink.FlinkSqlInterrpeter.callCommand(FlinkSqlInterrpeter.java:273
   at 
org.apache.zeppelin.flink.FlinkSqlInterrpeter.runSqlList(FlinkSqlInterrpeter.java:160
   at 
org.apache.zeppelin.flink.FlinkSqlInterrpeter.internalInterpret(FlinkSqlInterrpeter.java:112
   at 
org.apache.zeppelin.interpreter.AbstractInterpreter.interpret(AbstractInterpreter.java:47
   at 
org.apache.zeppelin.interpreter.LazyOpenInterpreter.interpret(LazyOpenInterpreter.java:110
   at 
org.apache.zeppelin.interpreter.remote.RemoteInterpreterServer$InterpretJob.jobRun(RemoteInterpreterServer.java:852
   at 
org.apache.zeppelin.interpreter.remote.RemoteInterpreterServer$InterpretJob.jobRun(RemoteInterpreterServer.java:744
   at org.apache.zeppelin.scheduler.Job.run(Job.java:172
   at 
org.apache.zeppelin.scheduler.AbstractScheduler.runJob(AbstractScheduler.java:132
   at 
org.apache.zeppelin.scheduler.ParallelScheduler.lambda$runJobInScheduler$0(ParallelScheduler.java:46
   at 
java.base/java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1128
   at 
java.base/java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:628
   at java.base/java.lang.Thread.run(Thread.java:829
   Caused by: org.apache.flink.client.program.ProgramInvocationException: Job 
failed (JobID: 3e6e3e07934084f5fafc542a4a91bc2c)
   at 
org.apache.flink.client.deployment.ClusterClientJobClientAdapter.lambda$getJobExecutionResult$6(ClusterClientJobClientAdapter.java:125
   at 
java.base/java.util.concurrent.CompletableFuture$UniApply.tryFire(CompletableFuture.java:642
   at 
java.base/java.util.concurrent.CompletableFuture.postComplete(CompletableFuture.java:506
   at 
java.base/java.util.concurrent.CompletableFuture.complete(CompletableFuture.java:2073
   at 
org.apache.flink.runtime.concurrent.FutureUtils.lambda$retryOperationWithDelay$9(FutureUtils.java:394
   at 
java.base/java.util.concurrent.CompletableFuture.uniWhenComplete(CompletableFuture.java:859
   at 
java.base/java.util.concurrent.CompletableFuture$UniWhenComplete.tryFire(CompletableFuture.java:837
   at 
java.base/java.util.concurrent.CompletableFuture.postComplete(CompletableFuture.java:506
   at 
java.base/java.util.concurrent.CompletableFuture.complete(CompletableFuture.java:2073
   at 
org.apache.flink.client.program.rest.RestClusterClient.lambda$pollResourceAsync$24(RestClusterClient.java:670
   at 
java.base/java.util.concurrent.CompletableFuture.uniWhenComplete(CompletableFuture.java:859
   at 
java.base/java.util.concurrent.CompletableFuture$UniWhenComplete.tryFire(CompletableFuture.java:837
   at 
java.base/java.util.concurrent.CompletableFuture.postComplete(CompletableFuture.java:506
   at 
java.base/java.util.concurrent.CompletableFuture.complete(CompletableFuture.java:2073
   at 
org.apache.flink.runtime.concurrent.FutureUtils.lambda$retryOperationWithDelay$9(FutureUtils.java:394
   at 
java.base/java.util.concurrent.CompletableFuture.uniWhenComplete(CompletableFuture.java:859
   at 
java.base/java.util.concurrent.CompletableFuture$UniWhenComplete.tryFire(CompletableFuture.java:837
   at 
java.base/java.util.concurrent.CompletableFuture.postComplete(CompletableFuture.java:506
   at 
java.base/java.util.concurrent.CompletableFuture.postFire(CompletableFuture.java:610
   at 
java.base/java.util.concurrent.CompletableFuture$UniCompose.tryFire(CompletableFuture.java:1085
   at 
java.base/java.util.concurrent.CompletableFuture$Completion.run(CompletableFuture.java:478
   ... 3 more
   Caused by: org.apache.flink.runtime.client.JobExecutionException: Job 
execution failed
   at 
org.apache.flink.runtime.jobmaster.JobResult.toJobExecutionResult(JobResult.java:144
   at 
org.apache.flink.client.deployment.ClusterClientJobClientAdapter.lambda$getJobExecutionResult$6(ClusterClientJobClientAdapter.java:123
   ... 23 more
   Caused by: org.apache.flink.runtime.JobException: Recovery is suppressed by 
NoRestartBackoffTimeStrategy
   at 
org.apache.flink.runtime.executiongraph.failover.flip1.ExecutionFailureHandler.handleFailure(ExecutionFailureHandler.java:138
   at 
org.apache.flink.runtime.executiongraph.failover.flip1.ExecutionFailureHandler.getFailureHandlingResult(ExecutionFailureHandler.java:82
   at 
org.apache.flink.runtime.scheduler.DefaultScheduler.handleTaskFailure(DefaultScheduler.java:222
   at 
org.apache.flink.runtime.scheduler.DefaultScheduler.maybeHandleTaskFailure(DefaultScheduler.java:212
   at 
org.apache.flink.runtime.scheduler.DefaultScheduler.updateTaskExecutionStateInternal(DefaultScheduler.java:203
   at 
org.apache.flink.runtime.scheduler.SchedulerBase.updateTaskExecutionState(SchedulerBase.java:718
   at 
org.apache.flink.runtime.scheduler.SchedulerNG.updateTaskExecutionState(SchedulerNG.java:79
   at 
org.apache.flink.runtime.jobmaster.JobMaster.updateTaskExecutionState(JobMaster.java:443
   at jdk.internal.reflect.GeneratedMethodAccessor100.invoke(Unknown Source
   at 
java.base/jdk.internal.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43
   at java.base/java.lang.reflect.Method.invoke(Method.java:566
   at 
org.apache.flink.runtime.rpc.akka.AkkaRpcActor.handleRpcInvocation(AkkaRpcActor.java:305
   at 
org.apache.flink.runtime.rpc.akka.AkkaRpcActor.handleRpcMessage(AkkaRpcActor.java:212
   at 
org.apache.flink.runtime.rpc.akka.FencedAkkaRpcActor.handleRpcMessage(FencedAkkaRpcActor.java:77
   at 
org.apache.flink.runtime.rpc.akka.AkkaRpcActor.handleMessage(AkkaRpcActor.java:158
   at akka.japi.pf.UnitCaseStatement.apply(CaseStatements.scala:26
   at akka.japi.pf.UnitCaseStatement.apply(CaseStatements.scala:21
   at scala.PartialFunction.applyOrElse(PartialFunction.scala:123
   at scala.PartialFunction.applyOrElse$(PartialFunction.scala:122
   at akka.japi.pf.UnitCaseStatement.applyOrElse(CaseStatements.scala:21
   at scala.PartialFunction$OrElse.applyOrElse(PartialFunction.scala:171
   at scala.PartialFunction$OrElse.applyOrElse(PartialFunction.scala:172
   at scala.PartialFunction$OrElse.applyOrElse(PartialFunction.scala:172
   at akka.actor.Actor.aroundReceive(Actor.scala:517
   at akka.actor.Actor.aroundReceive$(Actor.scala:515
   at akka.actor.AbstractActor.aroundReceive(AbstractActor.scala:225
   at akka.actor.ActorCell.receiveMessage(ActorCell.scala:592
   at akka.actor.ActorCell.invoke(ActorCell.scala:561
   at akka.dispatch.Mailbox.processMailbox(Mailbox.scala:258
   at akka.dispatch.Mailbox.run(Mailbox.scala:225
   at akka.dispatch.Mailbox.exec(Mailbox.scala:235
   at akka.dispatch.forkjoin.ForkJoinTask.doExec(ForkJoinTask.java:260
   at 
akka.dispatch.forkjoin.ForkJoinPool$WorkQueue.runTask(ForkJoinPool.java:1339
   at akka.dispatch.forkjoin.ForkJoinPool.runWorker(ForkJoinPool.java:1979
   at 
akka.dispatch.forkjoin.ForkJoinWorkerThread.run(ForkJoinWorkerThread.java:107
   Caused by: 
org.apache.flink.runtime.io.network.netty.exception.RemoteTransportException: 
Connection unexpectedly closed by remote task manager 
'142.151.160.20/142.151.160.20:6121'. This might indicate that the remote task 
manager was lost.
   at 
org.apache.flink.runtime.io.network.netty.CreditBasedPartitionRequestClientHandler.channelInactive(CreditBasedPartitionRequestClientHandler.java:160
   at 
org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeChannelInactive(AbstractChannelHandlerContext.java:262
   at 
org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeChannelInactive(AbstractChannelHandlerContext.java:248
   at 
org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.fireChannelInactive(AbstractChannelHandlerContext.java:241
   at 
org.apache.flink.shaded.netty4.io.netty.channel.ChannelInboundHandlerAdapter.channelInactive(ChannelInboundHandlerAdapter.java:81
   at 
org.apache.flink.runtime.io.network.netty.NettyMessageClientDecoderDelegate.channelInactive(NettyMessageClientDecoderDelegate.java:94
   at 
org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeChannelInactive(AbstractChannelHandlerContext.java:262
   at 
org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeChannelInactive(AbstractChannelHandlerContext.java:248
   at 
org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.fireChannelInactive(AbstractChannelHandlerContext.java:241
   at 
org.apache.flink.shaded.netty4.io.netty.handler.codec.ByteToMessageDecoder.channelInputClosed(ByteToMessageDecoder.java:389
   at 
org.apache.flink.shaded.netty4.io.netty.handler.codec.ByteToMessageDecoder.channelInactive(ByteToMessageDecoder.java:354
   at 
org.apache.flink.shaded.netty4.io.netty.handler.ssl.SslHandler.channelInactive(SslHandler.java:1106
   at 
org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeChannelInactive(AbstractChannelHandlerContext.java:262
   at 
org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeChannelInactive(AbstractChannelHandlerContext.java:248
   at 
org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.fireChannelInactive(AbstractChannelHandlerContext.java:241
   at 
org.apache.flink.shaded.netty4.io.netty.channel.DefaultChannelPipeline$HeadContext.channelInactive(DefaultChannelPipeline.java:1405
   at 
org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeChannelInactive(AbstractChannelHandlerContext.java:262
   at 
org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeChannelInactive(AbstractChannelHandlerContext.java:248
   at 
org.apache.flink.shaded.netty4.io.netty.channel.DefaultChannelPipeline.fireChannelInactive(DefaultChannelPipeline.java:901
   at 
org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannel$AbstractUnsafe$8.run(AbstractChannel.java:818
   at 
org.apache.flink.shaded.netty4.io.netty.util.concurrent.AbstractEventExecutor.safeExecute(AbstractEventExecutor.java:164
   at 
org.apache.flink.shaded.netty4.io.netty.util.concurrent.SingleThreadEventExecutor.runAllTasks(SingleThreadEventExecutor.java:472
   at 
org.apache.flink.shaded.netty4.io.netty.channel.epoll.EpollEventLoop.run(EpollEventLoop.java:384
   at 
org.apache.flink.shaded.netty4.io.netty.util.concurrent.SingleThreadEventExecutor$4.run(SingleThreadEventExecutor.java:989
   at 
org.apache.flink.shaded.netty4.io.netty.util.internal.ThreadExecutorMap$2.run(ThreadExecutorMap.java:74
   at java.base/java.lang.Thread.run(Thread.java:829)
   "
   }
   ```


-- 
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.

To unsubscribe, e-mail: commits-unsubscr...@hudi.apache.org

For queries about this service, please contact Infrastructure at:
us...@infra.apache.org

Reply via email to