Re: [PR] feat: implement endian conversion utilities [iceberg-cpp]

via GitHub Mon, 01 Sep 2025 00:21:36 -0700


wgtmac commented on code in PR #196:
URL: https://github.com/apache/iceberg-cpp/pull/196#discussion_r2306077067



##########
test/endian_test.cc:
##########
@@ -0,0 +1,121 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#include "iceberg/util/endian.h"
+
+#include <array>
+#include <cmath>
+#include <limits>
+
+#include <gtest/gtest.h>
+
+namespace iceberg {
+
+// test round trip preserves value

Review Comment:
   ```suggestion
   ```
   
   The comment is redundant.



##########
src/iceberg/util/endian.h:
##########
@@ -0,0 +1,94 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#pragma once
+
+#include <bit>
+#include <concepts>
+#include <cstdint>
+
+/// \file iceberg/util/endian.h
+/// \brief Endianness conversion utilities
+
+namespace iceberg {
+
+/// \brief Concept for values that can be converted to/from another endian 
format.
+template <typename T>
+concept EndianConvertible = std::is_arithmetic_v<T> && !std::same_as<T, bool>;
+
+/// \brief Byte-swap a value. For floating-point types, only support 32-bit 
and 64-bit
+/// floats.
+template <EndianConvertible T>
+constexpr T ByteSwap(T value) {
+  if constexpr (sizeof(T) <= 1) {
+    return value;
+  } else if constexpr (std::is_integral_v<T>) {
+    return std::byteswap(value);
+  } else if constexpr (std::is_floating_point_v<T>) {
+    if constexpr (sizeof(T) == sizeof(uint32_t)) {

Review Comment:
   Should we add `if constexpr (sizeof(T) == sizeof(uint16_t))` to be 
future-proof?
   
   C++23 adds std::float16_t and std::bfloat16_t (in <stdfloat>).



##########
src/iceberg/util/endian.h:
##########
@@ -0,0 +1,94 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#pragma once
+
+#include <bit>
+#include <concepts>
+#include <cstdint>
+
+/// \file iceberg/util/endian.h
+/// \brief Endianness conversion utilities
+
+namespace iceberg {
+
+/// \brief Concept for values that can be converted to/from another endian 
format.
+template <typename T>
+concept EndianConvertible = std::is_arithmetic_v<T> && !std::same_as<T, bool>;
+
+/// \brief Byte-swap a value. For floating-point types, only support 32-bit 
and 64-bit
+/// floats.
+template <EndianConvertible T>
+constexpr T ByteSwap(T value) {
+  if constexpr (sizeof(T) <= 1) {

Review Comment:
   It seems that the bool type is already supported here.



##########
test/endian_test.cc:
##########
@@ -0,0 +1,121 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#include "iceberg/util/endian.h"
+
+#include <array>
+#include <cmath>
+#include <limits>
+
+#include <gtest/gtest.h>
+
+namespace iceberg {
+
+// test round trip preserves value
+TEST(EndianTest, RoundTripPreservesValue) {
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian<uint16_t>(0x1234)), 0x1234);
+  EXPECT_EQ(FromBigEndian(ToBigEndian<uint32_t>(0xDEADBEEF)), 0xDEADBEEF);
+  
EXPECT_EQ(FromLittleEndian(ToLittleEndian(std::numeric_limits<uint64_t>::max())),
+            std::numeric_limits<uint64_t>::max());
+  EXPECT_EQ(FromBigEndian(ToBigEndian<uint32_t>(0)), 0);
+
+  EXPECT_EQ(FromBigEndian(ToBigEndian<int16_t>(-1)), -1);
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian<int32_t>(-0x12345678)), 
-0x12345678);
+  EXPECT_EQ(FromBigEndian(ToBigEndian(std::numeric_limits<int64_t>::min())),
+            std::numeric_limits<int64_t>::min());
+  
EXPECT_EQ(FromLittleEndian(ToLittleEndian(std::numeric_limits<int16_t>::max())),
+            std::numeric_limits<int16_t>::max());
+
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian(3.14f)), 3.14f);
+  EXPECT_EQ(FromBigEndian(ToBigEndian(2.718281828459045)), 2.718281828459045);
+
+  
EXPECT_EQ(FromLittleEndian(ToLittleEndian(std::numeric_limits<float>::infinity())),
+            std::numeric_limits<float>::infinity());
+  
EXPECT_EQ(FromBigEndian(ToBigEndian(-std::numeric_limits<float>::infinity())),
+            -std::numeric_limits<float>::infinity());
+  EXPECT_TRUE(std::isnan(
+      
FromLittleEndian(ToLittleEndian(std::numeric_limits<float>::quiet_NaN()))));
+  EXPECT_EQ(FromBigEndian(ToBigEndian(0.0f)), 0.0f);
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian(-0.0f)), -0.0f);
+
+  
EXPECT_EQ(FromBigEndian(ToBigEndian(std::numeric_limits<double>::infinity())),
+            std::numeric_limits<double>::infinity());
+  
EXPECT_EQ(FromLittleEndian(ToLittleEndian(-std::numeric_limits<double>::infinity())),
+            -std::numeric_limits<double>::infinity());
+  EXPECT_TRUE(
+      
std::isnan(FromBigEndian(ToBigEndian(std::numeric_limits<double>::quiet_NaN()))));
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian(0.0)), 0.0);
+  EXPECT_EQ(FromBigEndian(ToBigEndian(-0.0)), -0.0);
+}
+
+// test constexpr evaluation
+TEST(EndianTest, ConstexprEvaluation) {
+  static_assert(FromBigEndian(ToBigEndian<uint16_t>(0x1234)) == 0x1234);
+  static_assert(FromLittleEndian(ToLittleEndian<uint32_t>(0x12345678)) == 
0x12345678);
+  static_assert(FromBigEndian(ToBigEndian<int64_t>(-1)) == -1);
+
+  static_assert(ToBigEndian<uint8_t>(0xFF) == 0xFF);
+  static_assert(FromLittleEndian<int8_t>(-1) == -1);
+
+  static_assert(FromLittleEndian(ToLittleEndian(3.14f)) == 3.14f);
+  static_assert(FromBigEndian(ToBigEndian(2.71)) == 2.71);
+}
+
+// test platform dependent behavior
+TEST(EndianTest, PlatformDependentBehavior) {

Review Comment:
   I don't think we need this case.



##########
test/endian_test.cc:
##########
@@ -0,0 +1,121 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#include "iceberg/util/endian.h"
+
+#include <array>
+#include <cmath>
+#include <limits>
+
+#include <gtest/gtest.h>
+
+namespace iceberg {
+
+// test round trip preserves value
+TEST(EndianTest, RoundTripPreservesValue) {
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian<uint16_t>(0x1234)), 0x1234);

Review Comment:
   There are a lot of duplicate lines here. Can we use a simple macro for this?
   
   ```
   #define EXPECT_ROUNDTRIP(value)                              \
     EXPECT_EQ(FromLittleEndian(ToLittleEndian(value)), value); \
     EXPECT_EQ(FromBigEndian(ToBigEndian(value)), value);
   ```



##########
test/endian_test.cc:
##########
@@ -0,0 +1,121 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#include "iceberg/util/endian.h"
+
+#include <array>
+#include <cmath>
+#include <limits>
+
+#include <gtest/gtest.h>
+
+namespace iceberg {
+
+// test round trip preserves value
+TEST(EndianTest, RoundTripPreservesValue) {
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian<uint16_t>(0x1234)), 0x1234);
+  EXPECT_EQ(FromBigEndian(ToBigEndian<uint32_t>(0xDEADBEEF)), 0xDEADBEEF);
+  
EXPECT_EQ(FromLittleEndian(ToLittleEndian(std::numeric_limits<uint64_t>::max())),
+            std::numeric_limits<uint64_t>::max());
+  EXPECT_EQ(FromBigEndian(ToBigEndian<uint32_t>(0)), 0);
+
+  EXPECT_EQ(FromBigEndian(ToBigEndian<int16_t>(-1)), -1);
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian<int32_t>(-0x12345678)), 
-0x12345678);
+  EXPECT_EQ(FromBigEndian(ToBigEndian(std::numeric_limits<int64_t>::min())),
+            std::numeric_limits<int64_t>::min());
+  
EXPECT_EQ(FromLittleEndian(ToLittleEndian(std::numeric_limits<int16_t>::max())),
+            std::numeric_limits<int16_t>::max());
+
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian(3.14f)), 3.14f);
+  EXPECT_EQ(FromBigEndian(ToBigEndian(2.718281828459045)), 2.718281828459045);
+
+  
EXPECT_EQ(FromLittleEndian(ToLittleEndian(std::numeric_limits<float>::infinity())),
+            std::numeric_limits<float>::infinity());
+  
EXPECT_EQ(FromBigEndian(ToBigEndian(-std::numeric_limits<float>::infinity())),
+            -std::numeric_limits<float>::infinity());
+  EXPECT_TRUE(std::isnan(
+      
FromLittleEndian(ToLittleEndian(std::numeric_limits<float>::quiet_NaN()))));
+  EXPECT_EQ(FromBigEndian(ToBigEndian(0.0f)), 0.0f);
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian(-0.0f)), -0.0f);
+
+  
EXPECT_EQ(FromBigEndian(ToBigEndian(std::numeric_limits<double>::infinity())),
+            std::numeric_limits<double>::infinity());
+  
EXPECT_EQ(FromLittleEndian(ToLittleEndian(-std::numeric_limits<double>::infinity())),
+            -std::numeric_limits<double>::infinity());
+  EXPECT_TRUE(
+      
std::isnan(FromBigEndian(ToBigEndian(std::numeric_limits<double>::quiet_NaN()))));
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian(0.0)), 0.0);
+  EXPECT_EQ(FromBigEndian(ToBigEndian(-0.0)), -0.0);
+}
+
+// test constexpr evaluation
+TEST(EndianTest, ConstexprEvaluation) {
+  static_assert(FromBigEndian(ToBigEndian<uint16_t>(0x1234)) == 0x1234);
+  static_assert(FromLittleEndian(ToLittleEndian<uint32_t>(0x12345678)) == 
0x12345678);
+  static_assert(FromBigEndian(ToBigEndian<int64_t>(-1)) == -1);
+
+  static_assert(ToBigEndian<uint8_t>(0xFF) == 0xFF);
+  static_assert(FromLittleEndian<int8_t>(-1) == -1);
+
+  static_assert(FromLittleEndian(ToLittleEndian(3.14f)) == 3.14f);
+  static_assert(FromBigEndian(ToBigEndian(2.71)) == 2.71);
+}
+
+// test platform dependent behavior
+TEST(EndianTest, PlatformDependentBehavior) {
+  uint32_t test_value = 0x12345678;
+
+  if constexpr (std::endian::native == std::endian::little) {
+    EXPECT_EQ(ToLittleEndian(test_value), test_value);
+    EXPECT_EQ(FromLittleEndian(test_value), test_value);
+    EXPECT_NE(ToBigEndian(test_value), test_value);
+  } else if constexpr (std::endian::native == std::endian::big) {
+    EXPECT_EQ(ToBigEndian(test_value), test_value);
+    EXPECT_EQ(FromBigEndian(test_value), test_value);
+    EXPECT_NE(ToLittleEndian(test_value), test_value);
+  }
+
+  EXPECT_EQ(ToLittleEndian<uint8_t>(0xAB), 0xAB);
+  EXPECT_EQ(ToBigEndian<uint8_t>(0xAB), 0xAB);
+}
+
+// test specific byte pattern validation
+TEST(EndianTest, SpecificBytePatternValidation) {
+  uint32_t original_int = 0x12345678;
+  uint32_t little_endian_int = ToLittleEndian(original_int);
+  uint32_t big_endian_int = ToBigEndian(original_int);
+
+  auto little_int_bytes = std::bit_cast<std::array<uint8_t, 
4>>(little_endian_int);
+  auto big_int_bytes = std::bit_cast<std::array<uint8_t, 4>>(big_endian_int);
+
+  EXPECT_EQ(little_int_bytes, (std::array<uint8_t, 4>{0x78, 0x56, 0x34, 
0x12}));
+  EXPECT_EQ(big_int_bytes, (std::array<uint8_t, 4>{0x12, 0x34, 0x56, 0x78}));
+
+  float original_float = 3.14f;
+  float little_endian_float = ToLittleEndian(original_float);
+  float big_endian_float = ToBigEndian(original_float);
+
+  auto little_float_bytes = std::bit_cast<std::array<uint8_t, 
4>>(little_endian_float);
+  auto big_float_bytes = std::bit_cast<std::array<uint8_t, 
4>>(big_endian_float);
+
+  EXPECT_EQ(little_float_bytes, (std::array<uint8_t, 4>{0xC3, 0xF5, 0x48, 
0x40}));
+  EXPECT_EQ(big_float_bytes, (std::array<uint8_t, 4>{0x40, 0x48, 0xF5, 0xC3}));

Review Comment:
   ```suggestion
     EXPECT_EQ(little_float_bytes, std::array<uint8_t, 4>{0xC3, 0xF5, 0x48, 
0x40});
     EXPECT_EQ(big_float_bytes, std::array<uint8_t, 4>{0x40, 0x48, 0xF5, 0xC3});
   ```



##########
src/iceberg/util/endian.h:
##########
@@ -0,0 +1,94 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#pragma once
+
+#include <bit>
+#include <concepts>
+#include <cstdint>
+
+/// \file iceberg/util/endian.h
+/// \brief Endianness conversion utilities
+
+namespace iceberg {
+
+/// \brief Concept for values that can be converted to/from another endian 
format.
+template <typename T>
+concept EndianConvertible = std::is_arithmetic_v<T> && !std::same_as<T, bool>;
+
+/// \brief Byte-swap a value. For floating-point types, only support 32-bit 
and 64-bit
+/// floats.
+template <EndianConvertible T>
+constexpr T ByteSwap(T value) {
+  if constexpr (sizeof(T) <= 1) {
+    return value;
+  } else if constexpr (std::is_integral_v<T>) {
+    return std::byteswap(value);
+  } else if constexpr (std::is_floating_point_v<T>) {
+    if constexpr (sizeof(T) == sizeof(uint32_t)) {
+      return std::bit_cast<T>(std::byteswap(std::bit_cast<uint32_t>(value)));
+    } else if constexpr (sizeof(T) == sizeof(uint64_t)) {
+      return std::bit_cast<T>(std::byteswap(std::bit_cast<uint64_t>(value)));
+    } else {
+      static_assert(false, "Unsupported floating-point size for endian 
conversion.");
+    }
+  }
+}
+
+/// \brief Convert a value to little-endian format.
+template <EndianConvertible T>
+constexpr T ToLittleEndian(T value) {
+  if constexpr (std::endian::native == std::endian::little || sizeof(T) <= 1) {
+    return value;
+  } else {
+    return ByteSwap(value);
+  }

Review Comment:
   ```suggestion
     if constexpr (std::endian::native == std::endian::little) {
       return value;
     } else {
       return ByteSwap(value);
     }
   ```
   
   Doesn't it look better?



##########
test/endian_test.cc:
##########
@@ -0,0 +1,121 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#include "iceberg/util/endian.h"
+
+#include <array>
+#include <cmath>
+#include <limits>
+
+#include <gtest/gtest.h>
+
+namespace iceberg {
+
+// test round trip preserves value
+TEST(EndianTest, RoundTripPreservesValue) {
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian<uint16_t>(0x1234)), 0x1234);
+  EXPECT_EQ(FromBigEndian(ToBigEndian<uint32_t>(0xDEADBEEF)), 0xDEADBEEF);
+  
EXPECT_EQ(FromLittleEndian(ToLittleEndian(std::numeric_limits<uint64_t>::max())),
+            std::numeric_limits<uint64_t>::max());
+  EXPECT_EQ(FromBigEndian(ToBigEndian<uint32_t>(0)), 0);
+
+  EXPECT_EQ(FromBigEndian(ToBigEndian<int16_t>(-1)), -1);
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian<int32_t>(-0x12345678)), 
-0x12345678);
+  EXPECT_EQ(FromBigEndian(ToBigEndian(std::numeric_limits<int64_t>::min())),
+            std::numeric_limits<int64_t>::min());
+  
EXPECT_EQ(FromLittleEndian(ToLittleEndian(std::numeric_limits<int16_t>::max())),
+            std::numeric_limits<int16_t>::max());
+
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian(3.14f)), 3.14f);
+  EXPECT_EQ(FromBigEndian(ToBigEndian(2.718281828459045)), 2.718281828459045);
+
+  
EXPECT_EQ(FromLittleEndian(ToLittleEndian(std::numeric_limits<float>::infinity())),
+            std::numeric_limits<float>::infinity());
+  
EXPECT_EQ(FromBigEndian(ToBigEndian(-std::numeric_limits<float>::infinity())),
+            -std::numeric_limits<float>::infinity());
+  EXPECT_TRUE(std::isnan(
+      
FromLittleEndian(ToLittleEndian(std::numeric_limits<float>::quiet_NaN()))));
+  EXPECT_EQ(FromBigEndian(ToBigEndian(0.0f)), 0.0f);
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian(-0.0f)), -0.0f);
+
+  
EXPECT_EQ(FromBigEndian(ToBigEndian(std::numeric_limits<double>::infinity())),
+            std::numeric_limits<double>::infinity());
+  
EXPECT_EQ(FromLittleEndian(ToLittleEndian(-std::numeric_limits<double>::infinity())),
+            -std::numeric_limits<double>::infinity());
+  EXPECT_TRUE(
+      
std::isnan(FromBigEndian(ToBigEndian(std::numeric_limits<double>::quiet_NaN()))));
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian(0.0)), 0.0);
+  EXPECT_EQ(FromBigEndian(ToBigEndian(-0.0)), -0.0);
+}
+
+// test constexpr evaluation
+TEST(EndianTest, ConstexprEvaluation) {
+  static_assert(FromBigEndian(ToBigEndian<uint16_t>(0x1234)) == 0x1234);
+  static_assert(FromLittleEndian(ToLittleEndian<uint32_t>(0x12345678)) == 
0x12345678);
+  static_assert(FromBigEndian(ToBigEndian<int64_t>(-1)) == -1);
+
+  static_assert(ToBigEndian<uint8_t>(0xFF) == 0xFF);
+  static_assert(FromLittleEndian<int8_t>(-1) == -1);
+
+  static_assert(FromLittleEndian(ToLittleEndian(3.14f)) == 3.14f);
+  static_assert(FromBigEndian(ToBigEndian(2.71)) == 2.71);
+}
+
+// test platform dependent behavior
+TEST(EndianTest, PlatformDependentBehavior) {
+  uint32_t test_value = 0x12345678;
+
+  if constexpr (std::endian::native == std::endian::little) {
+    EXPECT_EQ(ToLittleEndian(test_value), test_value);
+    EXPECT_EQ(FromLittleEndian(test_value), test_value);
+    EXPECT_NE(ToBigEndian(test_value), test_value);
+  } else if constexpr (std::endian::native == std::endian::big) {
+    EXPECT_EQ(ToBigEndian(test_value), test_value);
+    EXPECT_EQ(FromBigEndian(test_value), test_value);
+    EXPECT_NE(ToLittleEndian(test_value), test_value);
+  }
+
+  EXPECT_EQ(ToLittleEndian<uint8_t>(0xAB), 0xAB);
+  EXPECT_EQ(ToBigEndian<uint8_t>(0xAB), 0xAB);
+}
+
+// test specific byte pattern validation
+TEST(EndianTest, SpecificBytePatternValidation) {

Review Comment:
   ```suggestion
   TEST(EndianTest, ByteWiseValidation) {
   ```



##########
test/endian_test.cc:
##########
@@ -0,0 +1,121 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#include "iceberg/util/endian.h"
+
+#include <array>
+#include <cmath>
+#include <limits>
+
+#include <gtest/gtest.h>
+
+namespace iceberg {
+
+// test round trip preserves value
+TEST(EndianTest, RoundTripPreservesValue) {
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian<uint16_t>(0x1234)), 0x1234);
+  EXPECT_EQ(FromBigEndian(ToBigEndian<uint32_t>(0xDEADBEEF)), 0xDEADBEEF);
+  
EXPECT_EQ(FromLittleEndian(ToLittleEndian(std::numeric_limits<uint64_t>::max())),
+            std::numeric_limits<uint64_t>::max());
+  EXPECT_EQ(FromBigEndian(ToBigEndian<uint32_t>(0)), 0);
+
+  EXPECT_EQ(FromBigEndian(ToBigEndian<int16_t>(-1)), -1);
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian<int32_t>(-0x12345678)), 
-0x12345678);
+  EXPECT_EQ(FromBigEndian(ToBigEndian(std::numeric_limits<int64_t>::min())),
+            std::numeric_limits<int64_t>::min());
+  
EXPECT_EQ(FromLittleEndian(ToLittleEndian(std::numeric_limits<int16_t>::max())),
+            std::numeric_limits<int16_t>::max());
+
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian(3.14f)), 3.14f);
+  EXPECT_EQ(FromBigEndian(ToBigEndian(2.718281828459045)), 2.718281828459045);
+
+  
EXPECT_EQ(FromLittleEndian(ToLittleEndian(std::numeric_limits<float>::infinity())),
+            std::numeric_limits<float>::infinity());
+  
EXPECT_EQ(FromBigEndian(ToBigEndian(-std::numeric_limits<float>::infinity())),
+            -std::numeric_limits<float>::infinity());
+  EXPECT_TRUE(std::isnan(
+      
FromLittleEndian(ToLittleEndian(std::numeric_limits<float>::quiet_NaN()))));
+  EXPECT_EQ(FromBigEndian(ToBigEndian(0.0f)), 0.0f);
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian(-0.0f)), -0.0f);
+
+  
EXPECT_EQ(FromBigEndian(ToBigEndian(std::numeric_limits<double>::infinity())),
+            std::numeric_limits<double>::infinity());
+  
EXPECT_EQ(FromLittleEndian(ToLittleEndian(-std::numeric_limits<double>::infinity())),
+            -std::numeric_limits<double>::infinity());
+  EXPECT_TRUE(
+      
std::isnan(FromBigEndian(ToBigEndian(std::numeric_limits<double>::quiet_NaN()))));
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian(0.0)), 0.0);
+  EXPECT_EQ(FromBigEndian(ToBigEndian(-0.0)), -0.0);
+}
+
+// test constexpr evaluation
+TEST(EndianTest, ConstexprEvaluation) {

Review Comment:
   Is there any difference from the case above?



##########
src/iceberg/util/endian.h:
##########
@@ -0,0 +1,124 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#pragma once
+
+#include <bit>
+#include <concepts>
+
+/// \file iceberg/util/endian.h
+/// \brief Endianness conversion utilities
+
+namespace iceberg {
+
+/// \brief Concept for values that can be converted to/from another endian 
format.
+template <typename T>
+concept EndianConvertible = std::is_arithmetic_v<T> && !std::same_as<T, bool>;

Review Comment:
   If we don't support bool here, users may need to special case bool to avoid 
passing it to `ByteSwap`. For simplicity, should we support bool as well?



##########
test/endian_test.cc:
##########
@@ -0,0 +1,121 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#include "iceberg/util/endian.h"
+
+#include <array>
+#include <cmath>
+#include <limits>
+
+#include <gtest/gtest.h>
+
+namespace iceberg {
+
+// test round trip preserves value
+TEST(EndianTest, RoundTripPreservesValue) {
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian<uint16_t>(0x1234)), 0x1234);

Review Comment:
   Or we can use a template function and leverage parameterized tests to improve
readability.



##########
test/endian_test.cc:
##########
@@ -0,0 +1,121 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#include "iceberg/util/endian.h"
+
+#include <array>
+#include <cmath>
+#include <limits>
+
+#include <gtest/gtest.h>
+
+namespace iceberg {
+
+// test round trip preserves value
+TEST(EndianTest, RoundTripPreservesValue) {
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian<uint16_t>(0x1234)), 0x1234);
+  EXPECT_EQ(FromBigEndian(ToBigEndian<uint32_t>(0xDEADBEEF)), 0xDEADBEEF);
+  
EXPECT_EQ(FromLittleEndian(ToLittleEndian(std::numeric_limits<uint64_t>::max())),
+            std::numeric_limits<uint64_t>::max());
+  EXPECT_EQ(FromBigEndian(ToBigEndian<uint32_t>(0)), 0);
+
+  EXPECT_EQ(FromBigEndian(ToBigEndian<int16_t>(-1)), -1);
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian<int32_t>(-0x12345678)), 
-0x12345678);
+  EXPECT_EQ(FromBigEndian(ToBigEndian(std::numeric_limits<int64_t>::min())),
+            std::numeric_limits<int64_t>::min());
+  
EXPECT_EQ(FromLittleEndian(ToLittleEndian(std::numeric_limits<int16_t>::max())),
+            std::numeric_limits<int16_t>::max());
+
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian(3.14f)), 3.14f);
+  EXPECT_EQ(FromBigEndian(ToBigEndian(2.718281828459045)), 2.718281828459045);
+
+  
EXPECT_EQ(FromLittleEndian(ToLittleEndian(std::numeric_limits<float>::infinity())),
+            std::numeric_limits<float>::infinity());
+  
EXPECT_EQ(FromBigEndian(ToBigEndian(-std::numeric_limits<float>::infinity())),
+            -std::numeric_limits<float>::infinity());
+  EXPECT_TRUE(std::isnan(
+      
FromLittleEndian(ToLittleEndian(std::numeric_limits<float>::quiet_NaN()))));
+  EXPECT_EQ(FromBigEndian(ToBigEndian(0.0f)), 0.0f);
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian(-0.0f)), -0.0f);
+
+  
EXPECT_EQ(FromBigEndian(ToBigEndian(std::numeric_limits<double>::infinity())),
+            std::numeric_limits<double>::infinity());
+  
EXPECT_EQ(FromLittleEndian(ToLittleEndian(-std::numeric_limits<double>::infinity())),
+            -std::numeric_limits<double>::infinity());
+  EXPECT_TRUE(
+      
std::isnan(FromBigEndian(ToBigEndian(std::numeric_limits<double>::quiet_NaN()))));
+  EXPECT_EQ(FromLittleEndian(ToLittleEndian(0.0)), 0.0);
+  EXPECT_EQ(FromBigEndian(ToBigEndian(-0.0)), -0.0);
+}
+
+// test constexpr evaluation
+TEST(EndianTest, ConstexprEvaluation) {
+  static_assert(FromBigEndian(ToBigEndian<uint16_t>(0x1234)) == 0x1234);
+  static_assert(FromLittleEndian(ToLittleEndian<uint32_t>(0x12345678)) == 
0x12345678);
+  static_assert(FromBigEndian(ToBigEndian<int64_t>(-1)) == -1);
+
+  static_assert(ToBigEndian<uint8_t>(0xFF) == 0xFF);
+  static_assert(FromLittleEndian<int8_t>(-1) == -1);
+
+  static_assert(FromLittleEndian(ToLittleEndian(3.14f)) == 3.14f);
+  static_assert(FromBigEndian(ToBigEndian(2.71)) == 2.71);
+}
+
+// test platform dependent behavior
+TEST(EndianTest, PlatformDependentBehavior) {
+  uint32_t test_value = 0x12345678;
+
+  if constexpr (std::endian::native == std::endian::little) {
+    EXPECT_EQ(ToLittleEndian(test_value), test_value);
+    EXPECT_EQ(FromLittleEndian(test_value), test_value);
+    EXPECT_NE(ToBigEndian(test_value), test_value);
+  } else if constexpr (std::endian::native == std::endian::big) {
+    EXPECT_EQ(ToBigEndian(test_value), test_value);
+    EXPECT_EQ(FromBigEndian(test_value), test_value);
+    EXPECT_NE(ToLittleEndian(test_value), test_value);
+  }
+
+  EXPECT_EQ(ToLittleEndian<uint8_t>(0xAB), 0xAB);
+  EXPECT_EQ(ToBigEndian<uint8_t>(0xAB), 0xAB);
+}
+
+// test specific byte pattern validation
+TEST(EndianTest, SpecificBytePatternValidation) {
+  uint32_t original_int = 0x12345678;
+  uint32_t little_endian_int = ToLittleEndian(original_int);
+  uint32_t big_endian_int = ToBigEndian(original_int);
+
+  auto little_int_bytes = std::bit_cast<std::array<uint8_t, 
4>>(little_endian_int);
+  auto big_int_bytes = std::bit_cast<std::array<uint8_t, 4>>(big_endian_int);
+
+  EXPECT_EQ(little_int_bytes, (std::array<uint8_t, 4>{0x78, 0x56, 0x34, 
0x12}));
+  EXPECT_EQ(big_int_bytes, (std::array<uint8_t, 4>{0x12, 0x34, 0x56, 0x78}));

Review Comment:
   ```suggestion
     EXPECT_EQ(little_int_bytes, std::array<uint8_t, 4>{0x78, 0x56, 0x34, 
0x12});
     EXPECT_EQ(big_int_bytes, std::array<uint8_t, 4>{0x12, 0x34, 0x56, 0x78});
   ```



-- 
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.

To unsubscribe, e-mail: issues-unsubscr...@iceberg.apache.org

For queries about this service, please contact Infrastructure at:
us...@infra.apache.org


---------------------------------------------------------------------
To unsubscribe, e-mail: issues-unsubscr...@iceberg.apache.org
For additional commands, e-mail: issues-h...@iceberg.apache.org

Re: [PR] feat: implement endian conversion utilities [iceberg-cpp]

Reply via email to