hudi-bot opened a new issue, #15059:
URL: https://github.com/apache/hudi/issues/15059
Validation is failing in the MOR async compaction integration test.
{code:java}
22/03/14 01:31:28 WARN DagNode: Validation using data from input path
/home/hadoop/staging/input//*/*
2667 22/03/14 01:31:28 INFO ValidateDatasetNode: Validate data in target hudi
path /home/hadoop/staging/output//*/*/*
2668 22/03/14 01:31:31 ERROR DagNode: Data set validation failed. Total count
in hudi 64400, input df count 64400
2669 22/03/14 01:31:31 INFO DagScheduler: Forcing shutdown of executor
service, this might kill running tasks
2670 22/03/14 01:31:31 ERROR HoodieTestSuiteJob: Failed to run Test Suite
2671 java.util.concurrent.ExecutionException: java.lang.AssertionError: Hudi
contents does not match contents input data.
2672 at java.util.concurrent.FutureTask.report(FutureTask.java:122)
2673 at java.util.concurrent.FutureTask.get(FutureTask.java:206)
2674 at
org.apache.hudi.integ.testsuite.dag.scheduler.DagScheduler.execute(DagScheduler.java:113)
2675 at
org.apache.hudi.integ.testsuite.dag.scheduler.DagScheduler.schedule(DagScheduler.java:68)
2676 at
org.apache.hudi.integ.testsuite.HoodieTestSuiteJob.runTestSuite(HoodieTestSuiteJob.java:203)
2677 at
org.apache.hudi.integ.testsuite.HoodieTestSuiteJob.main(HoodieTestSuiteJob.java:170)
2678 at sun.reflect.NativeMethodAccessorImpl.invoke0(Native Method)
2679 at
sun.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:62)
2680 at
sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)
2681 at java.lang.reflect.Method.invoke(Method.java:498)
2682 at
org.apache.spark.deploy.JavaMainApplication.start(SparkApplication.scala:52)
2683 at
org.apache.spark.deploy.SparkSubmit.org$apache$spark$deploy$SparkSubmit$$runMain(SparkSubmit.scala:955)
2684 at
org.apache.spark.deploy.SparkSubmit.doRunMain$1(SparkSubmit.scala:180)
2685 at org.apache.spark.deploy.SparkSubmit.submit(SparkSubmit.scala:203)
2686 at org.apache.spark.deploy.SparkSubmit.doSubmit(SparkSubmit.scala:90)
2687 at
org.apache.spark.deploy.SparkSubmit$$anon$2.doSubmit(SparkSubmit.scala:1043)
2688 at org.apache.spark.deploy.SparkSubmit$.main(SparkSubmit.scala:1052)
2689 at org.apache.spark.deploy.SparkSubmit.main(SparkSubmit.scala)
2690 Caused by: java.lang.AssertionError: Hudi contents does not match
contents input data.
2691 at
org.apache.hudi.integ.testsuite.dag.nodes.BaseValidateDatasetNode.execute(BaseValidateDatasetNode.java:119)
2692 at
org.apache.hudi.integ.testsuite.dag.scheduler.DagScheduler.executeNode(DagScheduler.java:139)
2693 at
org.apache.hudi.integ.testsuite.dag.scheduler.DagScheduler.lambda$execute$0(DagScheduler.java:105)
2694 at
java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:511)
2695 at java.util.concurrent.FutureTask.run(FutureTask.java:266)
2696 at
java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149)
2697 at
java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624)
2698 at java.lang.Thread.run(Thread.java:748)
2699 Exception in thread "main" org.apache.hudi.exception.HoodieException:
Failed to run Test Suite
2700 at
org.apache.hudi.integ.testsuite.HoodieTestSuiteJob.runTestSuite(HoodieTestSuiteJob.java:208)
2701 at
org.apache.hudi.integ.testsuite.HoodieTestSuiteJob.main(HoodieTestSuiteJob.java:170)
2702 at sun.reflect.NativeMethodAccessorImpl.invoke0(Native Method)
2703 at
sun.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:62)
2704 at
sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)
2705 at java.lang.reflect.Method.invoke(Method.java:498)
2706 at
org.apache.spark.deploy.JavaMainApplication.start(SparkApplication.scala:52)
2707 at
org.apache.spark.deploy.SparkSubmit.org$apache$spark$deploy$SparkSubmit$$runMain(SparkSubmit.scala:955)
2708 at
org.apache.spark.deploy.SparkSubmit.doRunMain$1(SparkSubmit.scala:180)
2709 at org.apache.spark.deploy.SparkSubmit.submit(SparkSubmit.scala:203)
2710 at org.apache.spark.deploy.SparkSubmit.doSubmit(SparkSubmit.scala:90)
2711 at
org.apache.spark.deploy.SparkSubmit$$anon$2.doSubmit(SparkSubmit.scala:1043)
2712 at org.apache.spark.deploy.SparkSubmit$.main(SparkSubmit.scala:1052)
2713 at org.apache.spark.deploy.SparkSubmit.main(SparkSubmit.scala)
2714 Caused by: java.util.concurrent.ExecutionException:
java.lang.AssertionError: Hudi contents does not match contents input data.
2715 at java.util.concurrent.FutureTask.report(FutureTask.java:122)
2716 at java.util.concurrent.FutureTask.get(FutureTask.java:206)
2717 at
org.apache.hudi.integ.testsuite.dag.scheduler.DagScheduler.execute(DagScheduler.java:113)
2718 at
org.apache.hudi.integ.testsuite.dag.scheduler.DagScheduler.schedule(DagScheduler.java:68)
2719 at
org.apache.hudi.integ.testsuite.HoodieTestSuiteJob.runTestSuite(HoodieTestSuiteJob.java:203)
2720 ... 13 more
2721 Caused by: java.lang.AssertionError: Hudi contents does not match
contents input data.
2722 at
org.apache.hudi.integ.testsuite.dag.nodes.BaseValidateDatasetNode.execute(BaseValidateDatasetNode.java:119)
2723 at
org.apache.hudi.integ.testsuite.dag.scheduler.DagScheduler.executeNode(DagScheduler.java:139)
2724 at
org.apache.hudi.integ.testsuite.dag.scheduler.DagScheduler.lambda$execute$0(DagScheduler.java:105)
2725 at
java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:511)
2726 at java.util.concurrent.FutureTask.run(FutureTask.java:266)
2727 at
java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149)
2728 at
java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624)
2729 at java.lang.Thread.run(Thread.java:748) {code}
## JIRA info
- Link: https://issues.apache.org/jira/browse/HUDI-3616
- Type: Bug
- Epic: https://issues.apache.org/jira/browse/HUDI-3303
- Fix version(s): 1.1.0
---
## Comments
28/Apr/22 13:05;xushiyan;[~shivnarayan] is this still valid?;;;
---
06/May/22 16:23;shivnarayan;We are not running this test YAML for now. All of
the YAMLs we currently run are passing, so we will lower the priority.;;;
--
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.
To unsubscribe, e-mail: [email protected]
For queries about this service, please contact Infrastructure at:
[email protected]