Skip to content

Commit

Permalink
Merge pull request #24113 from mmaslankaprv/avro-decimal
Browse files Browse the repository at this point in the history
datalake/avro: fixed encoding decimal values
  • Loading branch information
mmaslankaprv authored Nov 14, 2024
2 parents c84cb6a + d7f13ab commit 0ea6197
Show file tree
Hide file tree
Showing 2 changed files with 41 additions and 9 deletions.
18 changes: 9 additions & 9 deletions src/v/iceberg/avro_decimal.h
Original file line number Diff line number Diff line change
Expand Up @@ -16,20 +16,20 @@
#include <array>
namespace iceberg {
/**
* Converts a decimal into an array of bytes (big endian)
* Converts a decimal into an array of bytes (big endian), this works the same
* way as the Java's BigInteger.toByteArray() method.
*/

inline bytes encode_avro_decimal(absl::int128 decimal) {
auto high_half = absl::Uint128High64(decimal);
auto low_half = absl::Uint128Low64(decimal);
auto high_half = ss::cpu_to_be(absl::Uint128High64(decimal));
auto low_half = ss::cpu_to_be(absl::Uint128Low64(decimal));

bytes decimal_bytes(bytes::initialized_zero{}, 16);

for (int i = 0; i < 8; i++) {
// NOLINTNEXTLINE(hicpp-signed-bitwise)
decimal_bytes[i] = (low_half >> (i * 8)) & 0xFF;
decimal_bytes[i] = (high_half >> (i * 8)) & 0xFF;
// NOLINTNEXTLINE(hicpp-signed-bitwise)
decimal_bytes[i + 8] = (high_half >> (i * 8)) & 0xFF;
decimal_bytes[i + 8] = (low_half >> (i * 8)) & 0xFF;
}

return decimal_bytes;
Expand All @@ -41,12 +41,12 @@ inline absl::int128 decode_avro_decimal(bytes bytes) {
int64_t high_half = 0;
uint64_t low_half = 0;
for (size_t i = 0; i < 8; i++) {
low_half |= static_cast<uint64_t>(bytes[i]) << i * 8;
// NOLINTNEXTLINE(hicpp-signed-bitwise)
high_half |= static_cast<int64_t>(bytes[8 + i]) << i * 8;
high_half |= static_cast<int64_t>(bytes[i]) << i * 8;
low_half |= static_cast<uint64_t>(bytes[i + 8]) << i * 8;
}

return absl::MakeInt128(high_half, low_half);
return absl::MakeInt128(ss::be_to_cpu(high_half), ss::be_to_cpu(low_half));
}

inline iobuf avro_decimal_to_iobuf(absl::int128 decimal, size_t max_size) {
Expand Down
32 changes: 32 additions & 0 deletions src/v/iceberg/tests/values_avro_test.cc
Original file line number Diff line number Diff line change
Expand Up @@ -113,3 +113,35 @@ TEST(ValuesAvroTest, TestDecimalConversionsLimitedSize) {
ASSERT_EQ(
decimal, iobuf_to_avro_decimal(avro_decimal_to_iobuf(decimal, 8)));
}

TEST(ValuesAvroTest, TestDecimalConversionAgainstJavaBigInteger) {
// value of 65536
ASSERT_EQ(
encode_avro_decimal(absl::MakeInt128(0, 65536)),
bytes({0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0}));
// value of 35209893291843950283695459221
ASSERT_EQ(
encode_avro_decimal(absl::MakeInt128(1908732140, 89247320981)),
bytes({0, 0, 0, 0, 113, 196, 240, 236, 0, 0, 0, 20, 199, 142, 11, 149}));

// value of -18218949492341193300753118315
ASSERT_EQ(
encode_avro_decimal(absl::MakeInt128(-987651231, 89247320981)),
bytes(
{255,
255,
255,
255,
197,
33,
163,
97,
0,
0,
0,
20,
199,
142,
11,
149}));
}

0 comments on commit 0ea6197

Please sign in to comment.