This is an automated email from the ASF dual-hosted git repository.
morningman pushed a commit to branch branch-4.0
in repository https://gitbox.apache.org/repos/asf/doris.git
The following commit(s) were added to refs/heads/branch-4.0 by this push:
new ac5a8c941cd branch-4.0: [fix](insert) fix INSERT job statistics lost
in show load after FE restart #62331 (#62545)
ac5a8c941cd is described below
commit ac5a8c941cd0e5ae59a41805ef4570a4262088a8
Author: github-actions[bot]
<41898282+github-actions[bot]@users.noreply.github.com>
AuthorDate: Fri May 15 21:11:03 2026 -0700
branch-4.0: [fix](insert) fix INSERT job statistics lost in show load after
FE restart #62331 (#62545)
Cherry-picked from #62331
Co-authored-by: hui lai <[email protected]>
---
.../apache/doris/load/loadv2/InsertLoadJob.java | 19 +++++
.../java/org/apache/doris/load/loadv2/LoadJob.java | 6 +-
.../test_insert_statistic_after_fe_restart.groovy | 92 ++++++++++++++++++++++
3 files changed, 116 insertions(+), 1 deletion(-)
diff --git
a/fe/fe-core/src/main/java/org/apache/doris/load/loadv2/InsertLoadJob.java
b/fe/fe-core/src/main/java/org/apache/doris/load/loadv2/InsertLoadJob.java
index fd456be4cab..6c204da1083 100644
--- a/fe/fe-core/src/main/java/org/apache/doris/load/loadv2/InsertLoadJob.java
+++ b/fe/fe-core/src/main/java/org/apache/doris/load/loadv2/InsertLoadJob.java
@@ -48,6 +48,12 @@ public class InsertLoadJob extends LoadJob {
@SerializedName("tid")
private long tableId;
+ // Snapshot of loadStatistic.toJson() captured when the job finishes.
+ // loadStatistic is not persisted (no @SerializedName), so we save it here
+ // to survive FE restarts.
+ @SerializedName("jdj")
+ private String jobDetailsJson = null;
+
// only for log replay
public InsertLoadJob() {
super(EtlJobType.INSERT);
@@ -91,6 +97,9 @@ public class InsertLoadJob extends LoadJob {
this.loadingStatus.setTrackingUrl(trackingUrl);
this.loadingStatus.setFirstErrorMsg(firstErrorMsg);
this.userInfo = userInfo;
+ // Snapshot the current loadStatistic so it survives FE restarts.
+ // loadStatistic itself is not annotated with @SerializedName and
won't be persisted.
+ this.jobDetailsJson = this.loadStatistic.toJson();
}
public AuthorizationInfo gatherAuthInfo() throws MetaNotFoundException {
@@ -116,4 +125,14 @@ public class InsertLoadJob extends LoadJob {
throw e;
}
}
+
+ @Override
+ protected String getJobDetailsJson() {
+ // Use the persisted snapshot when loadStatistic is empty (e.g. after
FE restart).
+ // Fall back to the live loadStatistic during execution.
+ if (jobDetailsJson != null) {
+ return jobDetailsJson;
+ }
+ return loadStatistic.toJson();
+ }
}
diff --git a/fe/fe-core/src/main/java/org/apache/doris/load/loadv2/LoadJob.java
b/fe/fe-core/src/main/java/org/apache/doris/load/loadv2/LoadJob.java
index 947ed64244d..1ca2eb05562 100644
--- a/fe/fe-core/src/main/java/org/apache/doris/load/loadv2/LoadJob.java
+++ b/fe/fe-core/src/main/java/org/apache/doris/load/loadv2/LoadJob.java
@@ -790,7 +790,7 @@ public abstract class LoadJob extends
AbstractTxnStateChangeCallback
jobInfo.add(TimeUtils.longToTimeString(finishTimestamp));
// tracking url
jobInfo.add(loadingStatus.getTrackingUrl());
- jobInfo.add(loadStatistic.toJson());
+ jobInfo.add(getJobDetailsJson());
// transaction id
jobInfo.add(transactionId);
// error tablets
@@ -820,6 +820,10 @@ public abstract class LoadJob extends
AbstractTxnStateChangeCallback
return "N/A";
}
+ protected String getJobDetailsJson() {
+ return loadStatistic.toJson();
+ }
+
protected long getEtlStartTimestamp() {
return loadStartTimestamp;
}
diff --git
a/regression-test/suites/load_p0/insert/test_insert_statistic_after_fe_restart.groovy
b/regression-test/suites/load_p0/insert/test_insert_statistic_after_fe_restart.groovy
new file mode 100644
index 00000000000..cab13258e88
--- /dev/null
+++
b/regression-test/suites/load_p0/insert/test_insert_statistic_after_fe_restart.groovy
@@ -0,0 +1,92 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements. See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership. The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License. You may obtain a copy of the License at
+//
+// http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied. See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+import org.apache.doris.regression.suite.ClusterOptions
+
+// Verify that INSERT job statistics (ScannedRows, LoadBytes, etc.) shown in
+// SHOW LOAD are preserved after a FE restart. Before the fix, loadStatistic
+// was not serialized to the edit log, so all counters reset to 0 after
restart.
+suite("test_insert_statistic_after_fe_restart", "docker") {
+ def options = new ClusterOptions()
+ options.setFeNum(1)
+ docker(options) {
+ def dbName = "test_insert_statistic_restart_db"
+ def srcTbl = "src_tbl"
+ def dstTbl = "dst_tbl"
+
+ sql """DROP DATABASE IF EXISTS ${dbName}"""
+ sql """CREATE DATABASE ${dbName}"""
+ sql """USE ${dbName}"""
+
+ sql """
+ CREATE TABLE ${srcTbl} (
+ k1 INT NULL,
+ k2 VARCHAR(50) NULL
+ ) ENGINE=OLAP
+ DUPLICATE KEY(k1)
+ DISTRIBUTED BY HASH(k1) BUCKETS 3
+ PROPERTIES ("replication_num" = "1")
+ """
+ sql """
+ CREATE TABLE ${dstTbl} (
+ k1 INT NULL,
+ k2 VARCHAR(50) NULL
+ ) ENGINE=OLAP
+ DUPLICATE KEY(k1)
+ DISTRIBUTED BY HASH(k1) BUCKETS 3
+ PROPERTIES ("replication_num" = "1")
+ """
+
+ // Insert enough rows so ScannedRows and LoadBytes are clearly non-zero
+ sql """INSERT INTO ${srcTbl} SELECT number, concat('value_', number)
+ FROM numbers('number'='1000')"""
+
+ // insert into select — this creates the INSERT load job tracked by
show load
+ sql """INSERT INTO ${dstTbl} SELECT * FROM ${srcTbl}"""
+
+ def result = sql """SHOW LOAD FROM ${dbName}"""
+ assertEquals(1, result.size())
+ def jobDetailsBefore = parseJson(result[0][14])
+ logger.info("JobDetails before restart: ${result[0][14]}")
+
+ assertTrue(jobDetailsBefore.ScannedRows > 0,
+ "ScannedRows should be > 0 before restart, got
${jobDetailsBefore.ScannedRows}")
+ assertTrue(jobDetailsBefore.LoadBytes > 0,
+ "LoadBytes should be > 0 before restart, got
${jobDetailsBefore.LoadBytes}")
+
+ // Restart FE and reconnect
+ cluster.restartFrontends()
+ sleep(30000)
+ context.reconnectFe()
+
+ sql """USE ${dbName}"""
+
+ result = sql """SHOW LOAD FROM ${dbName}"""
+ assertEquals(1, result.size())
+ def jobDetailsAfter = parseJson(result[0][14])
+ logger.info("JobDetails after restart: ${result[0][14]}")
+
+ assertEquals(jobDetailsBefore.ScannedRows, jobDetailsAfter.ScannedRows,
+ "ScannedRows changed after FE restart:
before=${jobDetailsBefore.ScannedRows}, after=${jobDetailsAfter.ScannedRows}")
+ assertEquals(jobDetailsBefore.LoadBytes, jobDetailsAfter.LoadBytes,
+ "LoadBytes changed after FE restart:
before=${jobDetailsBefore.LoadBytes}, after=${jobDetailsAfter.LoadBytes}")
+ assertEquals(jobDetailsBefore.FileNumber, jobDetailsAfter.FileNumber,
+ "FileNumber changed after FE restart")
+ assertEquals(jobDetailsBefore.FileSize, jobDetailsAfter.FileSize,
+ "FileSize changed after FE restart")
+ }
+}
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]