This is an automated email from the ASF dual-hosted git repository.
tuglu pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/druid.git
The following commit(s) were added to refs/heads/master by this push:
new 8127d2cd7ec Fix issue with Integer Joda timestamp coercion in
DeterminePartitionsJob (#18327)
8127d2cd7ec is described below
commit 8127d2cd7ec691b751fa61f0fc5ab65220fd6839
Author: jtuglu1 <[email protected]>
AuthorDate: Fri Jul 25 14:22:57 2025 -0700
Fix issue with Integer Joda timestamp coercion in DeterminePartitionsJob
(#18327)
Timestamp columns whose values fit in 32 bits are coerced to Integer, which
causes the Joda DateTime constructor to break.
---
.../druid/indexer/DeterminePartitionsJob.java | 5 +++-
.../druid/indexer/DeterminePartitionsJobTest.java | 30 ++++++++++++++++------
2 files changed, 26 insertions(+), 9 deletions(-)
diff --git
a/indexing-hadoop/src/main/java/org/apache/druid/indexer/DeterminePartitionsJob.java
b/indexing-hadoop/src/main/java/org/apache/druid/indexer/DeterminePartitionsJob.java
index ca5f49937ab..3523eaf9ef2 100644
---
a/indexing-hadoop/src/main/java/org/apache/druid/indexer/DeterminePartitionsJob.java
+++
b/indexing-hadoop/src/main/java/org/apache/druid/indexer/DeterminePartitionsJob.java
@@ -414,7 +414,10 @@ public class DeterminePartitionsJob implements Jobby
{
final List<Object> timeAndDims =
HadoopDruidIndexerConfig.JSON_MAPPER.readValue(key.getBytes(), List.class);
- final DateTime timestamp = new DateTime(timeAndDims.get(0),
ISOChronology.getInstanceUTC());
+ final Object timestampObj = timeAndDims.get(0);
+ final long longTimestamp = ((Number) timestampObj).longValue();
+ final DateTime timestamp = new DateTime(longTimestamp,
ISOChronology.getInstanceUTC());
+
final Map<String, Iterable<String>> dims = (Map<String,
Iterable<String>>) timeAndDims.get(1);
helper.emitDimValueCounts(context, timestamp, dims);
diff --git
a/indexing-hadoop/src/test/java/org/apache/druid/indexer/DeterminePartitionsJobTest.java
b/indexing-hadoop/src/test/java/org/apache/druid/indexer/DeterminePartitionsJobTest.java
index f57ce6bdd64..7107824e6c4 100644
---
a/indexing-hadoop/src/test/java/org/apache/druid/indexer/DeterminePartitionsJobTest.java
+++
b/indexing-hadoop/src/test/java/org/apache/druid/indexer/DeterminePartitionsJobTest.java
@@ -65,7 +65,7 @@ public class DeterminePartitionsJobTest
@Parameterized.Parameters(name = "assumeGrouped={0}, "
+ "targetRowsPerSegment={1}, "
+ "maxRowsPerSegment={2}, "
- + "interval={3}"
+ + "intervals={3}"
+ "expectedNumOfSegments={4}, "
+ "expectedNumOfShardsForEachSegment={5}, "
+ "expectedStartEndForEachShard={6}, "
@@ -74,12 +74,26 @@ public class DeterminePartitionsJobTest
{
return Arrays.asList(
new Object[][]{
+ {
+ false,
+ 1,
+ NO_MAX_ROWS_PER_SEGMENT,
+ List.of("1970-01-01T00:00:00Z/P1D"),
+ 1,
+ new int[]{1},
+ new String[][][]{
+ {
+ {null, null}
+ }
+ },
+ ImmutableList.of("1970010100,c.example.com,CN,100")
+ },
{
// Test partitioning by targetRowsPerSegment
true,
2,
NO_MAX_ROWS_PER_SEGMENT,
- "2014-10-22T00:00:00Z/P1D",
+ List.of("2014-10-22T00:00:00Z/P1D"),
1,
new int[]{5},
new String[][][]{
@@ -108,7 +122,7 @@ public class DeterminePartitionsJobTest
true,
NO_TARGET_ROWS_PER_SEGMENT,
2,
- "2014-10-22T00:00:00Z/P1D",
+ List.of("2014-10-22T00:00:00Z/P1D"),
1,
new int[]{5},
new String[][][]{
@@ -137,7 +151,7 @@ public class DeterminePartitionsJobTest
false,
NO_TARGET_ROWS_PER_SEGMENT,
2,
- "2014-10-20T00:00:00Z/P1D",
+ List.of("2014-10-20T00:00:00Z/P1D"),
1,
new int[]{5},
new String[][][]{
@@ -176,7 +190,7 @@ public class DeterminePartitionsJobTest
true,
NO_TARGET_ROWS_PER_SEGMENT,
5,
- "2014-10-20T00:00:00Z/P3D",
+ List.of("2014-10-20T00:00:00Z/P3D"),
3,
new int[]{2, 2, 2},
new String[][][]{
@@ -230,7 +244,7 @@ public class DeterminePartitionsJobTest
true,
NO_TARGET_ROWS_PER_SEGMENT,
1000,
- "2014-10-22T00:00:00Z/P1D",
+ List.of("2014-10-22T00:00:00Z/P1D"),
1,
new int[]{1},
new String[][][]{
@@ -259,7 +273,7 @@ public class DeterminePartitionsJobTest
boolean assumeGrouped,
@Nullable Integer targetRowsPerSegment,
Integer maxRowsPerSegment,
- String interval,
+ List<String> intervals,
int expectedNumOfSegments,
int[] expectedNumOfShardsForEachSegment,
String[][][] expectedStartEndForEachShard,
@@ -304,7 +318,7 @@ public class DeterminePartitionsJobTest
new UniformGranularitySpec(
Granularities.DAY,
Granularities.NONE,
- ImmutableList.of(Intervals.of(interval))
+
intervals.stream().map(Intervals::of).collect(ImmutableList.toImmutableList())
)
)
.withObjectMapper(HadoopDruidIndexerConfig.JSON_MAPPER)
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]