[ https://issues.apache.org/jira/browse/HUDI-3616?page=com.atlassian.jira.plugin.system.issuetabpanels:all-tabpanel ]
Raymond Xu updated HUDI-3616: ----------------------------- Fix Version/s: 0.14.0 (was: 0.13.1) > Investigate mor async compact integ test failure > ------------------------------------------------ > > Key: HUDI-3616 > URL: https://issues.apache.org/jira/browse/HUDI-3616 > Project: Apache Hudi > Issue Type: Bug > Components: tests-ci > Reporter: sivabalan narayanan > Priority: Minor > Fix For: 0.14.0 > > > mor async compact integ test validation is failing. > > {code:java} > 22/03/14 01:31:28 WARN DagNode: Validation using data from input path > /home/hadoop/staging/input//*/* > 266722/03/14 01:31:28 INFO ValidateDatasetNode: Validate data in target hudi > path /home/hadoop/staging/output//*/*/* > 266822/03/14 01:31:31 ERROR DagNode: Data set validation failed. Total count > in hudi 64400, input df count 64400 > 266922/03/14 01:31:31 INFO DagScheduler: Forcing shutdown of executor > service, this might kill running tasks > 267022/03/14 01:31:31 ERROR HoodieTestSuiteJob: Failed to run Test Suite > 2671java.util.concurrent.ExecutionException: java.lang.AssertionError: Hudi > contents does not match contents input data. 
> 2672 at java.util.concurrent.FutureTask.report(FutureTask.java:122) > 2673 at java.util.concurrent.FutureTask.get(FutureTask.java:206) > 2674 at > org.apache.hudi.integ.testsuite.dag.scheduler.DagScheduler.execute(DagScheduler.java:113) > 2675 at > org.apache.hudi.integ.testsuite.dag.scheduler.DagScheduler.schedule(DagScheduler.java:68) > 2676 at > org.apache.hudi.integ.testsuite.HoodieTestSuiteJob.runTestSuite(HoodieTestSuiteJob.java:203) > 2677 at > org.apache.hudi.integ.testsuite.HoodieTestSuiteJob.main(HoodieTestSuiteJob.java:170) > 2678 at sun.reflect.NativeMethodAccessorImpl.invoke0(Native Method) > 2679 at > sun.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:62) > 2680 at > sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43) > 2681 at java.lang.reflect.Method.invoke(Method.java:498) > 2682 at > org.apache.spark.deploy.JavaMainApplication.start(SparkApplication.scala:52) > 2683 at > org.apache.spark.deploy.SparkSubmit.org$apache$spark$deploy$SparkSubmit$$runMain(SparkSubmit.scala:955) > 2684 at > org.apache.spark.deploy.SparkSubmit.doRunMain$1(SparkSubmit.scala:180) > 2685 at org.apache.spark.deploy.SparkSubmit.submit(SparkSubmit.scala:203) > 2686 at org.apache.spark.deploy.SparkSubmit.doSubmit(SparkSubmit.scala:90) > 2687 at > org.apache.spark.deploy.SparkSubmit$$anon$2.doSubmit(SparkSubmit.scala:1043) > 2688 at org.apache.spark.deploy.SparkSubmit$.main(SparkSubmit.scala:1052) > 2689 at org.apache.spark.deploy.SparkSubmit.main(SparkSubmit.scala) > 2690Caused by: java.lang.AssertionError: Hudi contents does not match > contents input data. 
> 2691 at > org.apache.hudi.integ.testsuite.dag.nodes.BaseValidateDatasetNode.execute(BaseValidateDatasetNode.java:119) > 2692 at > org.apache.hudi.integ.testsuite.dag.scheduler.DagScheduler.executeNode(DagScheduler.java:139) > 2693 at > org.apache.hudi.integ.testsuite.dag.scheduler.DagScheduler.lambda$execute$0(DagScheduler.java:105) > 2694 at > java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:511) > 2695 at java.util.concurrent.FutureTask.run(FutureTask.java:266) > 2696 at > java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149) > 2697 at > java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624) > 2698 at java.lang.Thread.run(Thread.java:748) > 2699Exception in thread "main" org.apache.hudi.exception.HoodieException: > Failed to run Test Suite > 2700 at > org.apache.hudi.integ.testsuite.HoodieTestSuiteJob.runTestSuite(HoodieTestSuiteJob.java:208) > 2701 at > org.apache.hudi.integ.testsuite.HoodieTestSuiteJob.main(HoodieTestSuiteJob.java:170) > 2702 at sun.reflect.NativeMethodAccessorImpl.invoke0(Native Method) > 2703 at > sun.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:62) > 2704 at > sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43) > 2705 at java.lang.reflect.Method.invoke(Method.java:498) > 2706 at > org.apache.spark.deploy.JavaMainApplication.start(SparkApplication.scala:52) > 2707 at > org.apache.spark.deploy.SparkSubmit.org$apache$spark$deploy$SparkSubmit$$runMain(SparkSubmit.scala:955) > 2708 at > org.apache.spark.deploy.SparkSubmit.doRunMain$1(SparkSubmit.scala:180) > 2709 at org.apache.spark.deploy.SparkSubmit.submit(SparkSubmit.scala:203) > 2710 at org.apache.spark.deploy.SparkSubmit.doSubmit(SparkSubmit.scala:90) > 2711 at > org.apache.spark.deploy.SparkSubmit$$anon$2.doSubmit(SparkSubmit.scala:1043) > 2712 at org.apache.spark.deploy.SparkSubmit$.main(SparkSubmit.scala:1052) > 2713 at 
org.apache.spark.deploy.SparkSubmit.main(SparkSubmit.scala) > 2714Caused by: java.util.concurrent.ExecutionException: > java.lang.AssertionError: Hudi contents does not match contents input data. > 2715 at java.util.concurrent.FutureTask.report(FutureTask.java:122) > 2716 at java.util.concurrent.FutureTask.get(FutureTask.java:206) > 2717 at > org.apache.hudi.integ.testsuite.dag.scheduler.DagScheduler.execute(DagScheduler.java:113) > 2718 at > org.apache.hudi.integ.testsuite.dag.scheduler.DagScheduler.schedule(DagScheduler.java:68) > 2719 at > org.apache.hudi.integ.testsuite.HoodieTestSuiteJob.runTestSuite(HoodieTestSuiteJob.java:203) > 2720 ... 13 more > 2721Caused by: java.lang.AssertionError: Hudi contents does not match > contents input data. > 2722 at > org.apache.hudi.integ.testsuite.dag.nodes.BaseValidateDatasetNode.execute(BaseValidateDatasetNode.java:119) > 2723 at > org.apache.hudi.integ.testsuite.dag.scheduler.DagScheduler.executeNode(DagScheduler.java:139) > 2724 at > org.apache.hudi.integ.testsuite.dag.scheduler.DagScheduler.lambda$execute$0(DagScheduler.java:105) > 2725 at > java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:511) > 2726 at java.util.concurrent.FutureTask.run(FutureTask.java:266) > 2727 at > java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149) > 2728 at > java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624) > 2729 at java.lang.Thread.run(Thread.java:748) {code} -- This message was sent by Atlassian Jira (v8.20.10#820010)