[ https://issues.apache.org/jira/browse/HIVE-29003?page=com.atlassian.jira.plugin.system.issuetabpanels:all-tabpanel ]
László Bodor updated HIVE-29003: -------------------------------- Description: HIVE-28028 removed some Tez class sources from the Hive repository. However, the corresponding artifacts are still required by certain Hive components (e.g., metastore schema initialization), where the tez-protobuf-history-plugin JAR is not intended to be on the classpath. The user should not be responsible for including this JAR manually—especially since the hive-exec fat JAR is expected to include everything necessary, properly shaded (though not necessarily relocated). The absence of these classes caused an error like the one below: {code} 2025-06-09 12:49:13,217 INFO org.apache.hadoop.hive.ql.Driver: [HiveServer2-Background-Pool: Thread-69]: Executing command(queryId=hive_20250609124913_b5efd16f-35b0-424a-b839-b298358b8395): CREATE DATABASE IF NOT EXISTS SYS 2025-06-09 12:49:13,222 INFO org.apache.hadoop.hive.ql.hooks.HiveProtoLoggingHook: [HiveServer2-Background-Pool: Thread-69]: Event per file enabled: false 2025-06-09 12:49:13,223 INFO org.apache.hadoop.hive.ql.reexec.ReOptimizePlugin: [HiveServer2-Background-Pool: Thread-69]: ReOptimization: retryPossible: false 2025-06-09 12:49:13,223 INFO org.apache.hadoop.hive.ql.reexec.ReExecuteLostAMQueryPlugin: [HiveServer2-Background-Pool: Thread-69]: Exception is not a TezRuntimeException, no need to check further with ReExecuteLostAMQueryPlugin 2025-06-09 12:49:13,223 INFO org.apache.hadoop.hive.ql.reexec.ReExecutionDagSubmitPlugin: [HiveServer2-Background-Pool: Thread-69]: Got exception message: org/apache/tez/dag/history/logging/proto/DatePartitionedLogger retryPossible: false 2025-06-09 12:49:13,224 INFO org.apache.hadoop.hive.ql.reexec.ReExecuteOnWriteConflictPlugin: [HiveServer2-Background-Pool: Thread-69]: Got exception message: org/apache/tez/dag/history/logging/proto/DatePartitionedLogger retryPossible: false 2025-06-09 12:49:13,224 INFO org.apache.hadoop.hive.ql.hooks.HiveProtoLoggingHook: [HiveServer2-Background-Pool: Thread-69]: 
Event per file enabled: false 2025-06-09 12:49:13,225 INFO hive.ql.metadata.Hive: [HiveServer2-Background-Pool: Thread-69]: Dumping metastore api call timing information for : execution phase 2025-06-09 12:49:13,225 INFO hive.ql.metadata.Hive: [HiveServer2-Background-Pool: Thread-69]: Total time spent in each metastore function (ms): {} 2025-06-09 12:49:13,225 INFO org.apache.hadoop.hive.ql.Driver: [HiveServer2-Background-Pool: Thread-69]: Completed executing command(queryId=hive_20250609124913_b5efd16f-35b0-424a-b839-b298358b8395); Time taken: 0.008 seconds 2025-06-09 12:49:13,225 INFO org.apache.hadoop.hive.ql.Driver: [HiveServer2-Background-Pool: Thread-69]: OK 2025-06-09 12:49:13,230 ERROR org.apache.hive.service.cli.operation.Operation: [HiveServer2-Background-Pool: Thread-69]: Error running hive query: org.apache.hive.service.cli.HiveSQLException: Error running query: java.lang.NoClassDefFoundError: org/apache/tez/dag/history/logging/proto/DatePartitionedLogger at org.apache.hive.service.cli.operation.SQLOperation.runQuery(SQLOperation.java:256) ~[hive-service-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] at org.apache.hive.service.cli.operation.SQLOperation.access$700(SQLOperation.java:92) ~[hive-service-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] at org.apache.hive.service.cli.operation.SQLOperation$BackgroundWork$1.run(SQLOperation.java:341) ~[hive-service-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] at java.security.AccessController.doPrivileged(Native Method) ~[?:1.8.0_232] at javax.security.auth.Subject.doAs(Subject.java:422) ~[?:1.8.0_232] at org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:1910) ~[hadoop-common-3.1.1.7.3.1.400-92.jar:?] 
at org.apache.hive.service.cli.operation.SQLOperation$BackgroundWork.run(SQLOperation.java:361) ~[hive-service-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:511) ~[?:1.8.0_232] at java.util.concurrent.FutureTask.run(FutureTask.java:266) ~[?:1.8.0_232] at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:511) ~[?:1.8.0_232] at java.util.concurrent.FutureTask.run(FutureTask.java:266) ~[?:1.8.0_232] at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149) ~[?:1.8.0_232] at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624) ~[?:1.8.0_232] at java.lang.Thread.run(Thread.java:748) ~[?:1.8.0_232] Caused by: java.lang.NoClassDefFoundError: org/apache/tez/dag/history/logging/proto/DatePartitionedLogger at org.apache.hadoop.hive.ql.hooks.HiveProtoLoggingHook$EventLogger.<init>(HiveProtoLoggingHook.java:206) ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] at org.apache.hadoop.hive.ql.hooks.HiveProtoLoggingHook$EventLogger.getInstance(HiveProtoLoggingHook.java:559) ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] at org.apache.hadoop.hive.ql.hooks.HiveProtoLoggingHook.run(HiveProtoLoggingHook.java:571) ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] at org.apache.hadoop.hive.ql.HookRunner.invokeGeneralHook(HookRunner.java:307) ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] at org.apache.hadoop.hive.ql.HookRunner.runFailureHooks(HookRunner.java:294) ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] at org.apache.hadoop.hive.ql.DriverUtils.invokeFailureHooks(DriverUtils.java:158) ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] at org.apache.hadoop.hive.ql.Executor.handleException(Executor.java:514) ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] at org.apache.hadoop.hive.ql.Executor.execute(Executor.java:118) 
~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] at org.apache.hadoop.hive.ql.Driver.runInternal(Driver.java:812) ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] at org.apache.hadoop.hive.ql.Driver.run(Driver.java:547) ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] at org.apache.hadoop.hive.ql.Driver.run(Driver.java:541) ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] at org.apache.hadoop.hive.ql.reexec.ReExecDriver.run(ReExecDriver.java:190) ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] at org.apache.hive.service.cli.operation.SQLOperation.runQuery(SQLOperation.java:236) ~[hive-service-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] ... 13 more {code} was: HIVE-28028 removed some Tez class sources from the Hive repository. However, the corresponding artifacts are still required by certain Hive components (e.g., metastore schema initialization), where the tez-protobuf-history-plugin JAR is not intended to be on the classpath. The user should not be responsible for including this JAR manually—especially since the hive-exec fat JAR is expected to include everything necessary, properly shaded (though not necessarily relocalized). > DatePartitionedLogger from Tez is always needed for hive logging hook > --------------------------------------------------------------------- > > Key: HIVE-29003 > URL: https://issues.apache.org/jira/browse/HIVE-29003 > Project: Hive > Issue Type: Bug > Reporter: László Bodor > Assignee: László Bodor > Priority: Major > > HIVE-28028 removed some Tez class sources from the Hive repository. However, > the corresponding artifacts are still required by certain Hive components > (e.g., metastore schema initialization), where the > tez-protobuf-history-plugin JAR is not intended to be on the classpath. 
> The user should not be responsible for including this JAR manually—especially > since the hive-exec fat JAR is expected to include everything necessary, > properly shaded (though not necessarily relocated). > The absence of these classes caused an error like the one below: > {code} > 2025-06-09 12:49:13,217 INFO org.apache.hadoop.hive.ql.Driver: > [HiveServer2-Background-Pool: Thread-69]: Executing > command(queryId=hive_20250609124913_b5efd16f-35b0-424a-b839-b298358b8395): > CREATE DATABASE IF NOT EXISTS SYS > 2025-06-09 12:49:13,222 INFO > org.apache.hadoop.hive.ql.hooks.HiveProtoLoggingHook: > [HiveServer2-Background-Pool: Thread-69]: Event per file enabled: false > 2025-06-09 12:49:13,223 INFO > org.apache.hadoop.hive.ql.reexec.ReOptimizePlugin: > [HiveServer2-Background-Pool: Thread-69]: ReOptimization: retryPossible: false > 2025-06-09 12:49:13,223 INFO > org.apache.hadoop.hive.ql.reexec.ReExecuteLostAMQueryPlugin: > [HiveServer2-Background-Pool: Thread-69]: Exception is not a > TezRuntimeException, no need to check further with ReExecuteLostAMQueryPlugin > 2025-06-09 12:49:13,223 INFO > org.apache.hadoop.hive.ql.reexec.ReExecutionDagSubmitPlugin: > [HiveServer2-Background-Pool: Thread-69]: Got exception message: > org/apache/tez/dag/history/logging/proto/DatePartitionedLogger retryPossible: > false > 2025-06-09 12:49:13,224 INFO > org.apache.hadoop.hive.ql.reexec.ReExecuteOnWriteConflictPlugin: > [HiveServer2-Background-Pool: Thread-69]: Got exception message: > org/apache/tez/dag/history/logging/proto/DatePartitionedLogger retryPossible: > false > 2025-06-09 12:49:13,224 INFO > org.apache.hadoop.hive.ql.hooks.HiveProtoLoggingHook: > [HiveServer2-Background-Pool: Thread-69]: Event per file enabled: false > 2025-06-09 12:49:13,225 INFO hive.ql.metadata.Hive: > [HiveServer2-Background-Pool: Thread-69]: Dumping metastore api call timing > information for : execution phase > 2025-06-09 12:49:13,225 INFO hive.ql.metadata.Hive: > [HiveServer2-Background-Pool: 
Thread-69]: Total time spent in each metastore > function (ms): {} > 2025-06-09 12:49:13,225 INFO org.apache.hadoop.hive.ql.Driver: > [HiveServer2-Background-Pool: Thread-69]: Completed executing > command(queryId=hive_20250609124913_b5efd16f-35b0-424a-b839-b298358b8395); > Time taken: 0.008 seconds > 2025-06-09 12:49:13,225 INFO org.apache.hadoop.hive.ql.Driver: > [HiveServer2-Background-Pool: Thread-69]: OK > 2025-06-09 12:49:13,230 ERROR > org.apache.hive.service.cli.operation.Operation: > [HiveServer2-Background-Pool: Thread-69]: Error running hive query: > org.apache.hive.service.cli.HiveSQLException: Error running query: > java.lang.NoClassDefFoundError: > org/apache/tez/dag/history/logging/proto/DatePartitionedLogger > at > org.apache.hive.service.cli.operation.SQLOperation.runQuery(SQLOperation.java:256) > ~[hive-service-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] > at > org.apache.hive.service.cli.operation.SQLOperation.access$700(SQLOperation.java:92) > ~[hive-service-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] > at > org.apache.hive.service.cli.operation.SQLOperation$BackgroundWork$1.run(SQLOperation.java:341) > ~[hive-service-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] > at java.security.AccessController.doPrivileged(Native Method) > ~[?:1.8.0_232] > at javax.security.auth.Subject.doAs(Subject.java:422) ~[?:1.8.0_232] > at > org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:1910) > ~[hadoop-common-3.1.1.7.3.1.400-92.jar:?] 
> at > org.apache.hive.service.cli.operation.SQLOperation$BackgroundWork.run(SQLOperation.java:361) > ~[hive-service-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] > at > java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:511) > ~[?:1.8.0_232] > at java.util.concurrent.FutureTask.run(FutureTask.java:266) > ~[?:1.8.0_232] > at > java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:511) > ~[?:1.8.0_232] > at java.util.concurrent.FutureTask.run(FutureTask.java:266) > ~[?:1.8.0_232] > at > java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149) > ~[?:1.8.0_232] > at > java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624) > ~[?:1.8.0_232] > at java.lang.Thread.run(Thread.java:748) ~[?:1.8.0_232] > Caused by: java.lang.NoClassDefFoundError: > org/apache/tez/dag/history/logging/proto/DatePartitionedLogger > at > org.apache.hadoop.hive.ql.hooks.HiveProtoLoggingHook$EventLogger.<init>(HiveProtoLoggingHook.java:206) > ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] > at > org.apache.hadoop.hive.ql.hooks.HiveProtoLoggingHook$EventLogger.getInstance(HiveProtoLoggingHook.java:559) > ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] > at > org.apache.hadoop.hive.ql.hooks.HiveProtoLoggingHook.run(HiveProtoLoggingHook.java:571) > ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] > at > org.apache.hadoop.hive.ql.HookRunner.invokeGeneralHook(HookRunner.java:307) > ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] > at > org.apache.hadoop.hive.ql.HookRunner.runFailureHooks(HookRunner.java:294) > ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] > at > org.apache.hadoop.hive.ql.DriverUtils.invokeFailureHooks(DriverUtils.java:158) > ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] > at > org.apache.hadoop.hive.ql.Executor.handleException(Executor.java:514) > ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] > at 
org.apache.hadoop.hive.ql.Executor.execute(Executor.java:118) > ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] > at org.apache.hadoop.hive.ql.Driver.runInternal(Driver.java:812) > ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] > at org.apache.hadoop.hive.ql.Driver.run(Driver.java:547) > ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] > at org.apache.hadoop.hive.ql.Driver.run(Driver.java:541) > ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] > at > org.apache.hadoop.hive.ql.reexec.ReExecDriver.run(ReExecDriver.java:190) > ~[hive-exec-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] > at > org.apache.hive.service.cli.operation.SQLOperation.runQuery(SQLOperation.java:236) > ~[hive-service-3.1.3000.7.3.1.400-92.jar:3.1.3000.7.3.1.400-92] > ... 13 more > {code} -- This message was sent by Atlassian Jira (v8.20.10#820010)