(doris) branch branch-2.1 updated: branch-2.1: [fix](prepared statement) fix protocol with TIME datatype #47389 (#47543)

yiguolei Fri, 07 Feb 2025 21:01:04 -0800

This is an automated email from the ASF dual-hosted git repository.

yiguolei pushed a commit to branch branch-2.1
in repository https://gitbox.apache.org/repos/asf/doris.git



The following commit(s) were added to refs/heads/branch-2.1 by this push:
     new 3ec723f2cb7 branch-2.1: [fix](prepared statement) fix protocol with 
TIME datatype #47389 (#47543)
3ec723f2cb7 is described below

commit 3ec723f2cb7519adf6d7157a85bdc01115c70039
Author: github-actions[bot] 
<41898282+github-actions[bot]@users.noreply.github.com>
AuthorDate: Sat Feb 8 13:00:49 2025 +0800

    branch-2.1: [fix](prepared statement) fix protocol with TIME datatype 
#47389 (#47543)
    
    Cherry-picked from #47389
    
    Co-authored-by: lihangyu <lihan...@selectdb.com>
---
 be/src/util/mysql_row_buffer.cpp       |  80 ++++++++++++++++---
 be/test/util/mysql_row_buffer_test.cpp | 140 +++++++++++++++++++++++++++++++++
 2 files changed, 211 insertions(+), 9 deletions(-)

diff --git a/be/src/util/mysql_row_buffer.cpp b/be/src/util/mysql_row_buffer.cpp
index 7698eb4be64..eb2c663b2e5 100644
--- a/be/src/util/mysql_row_buffer.cpp
+++ b/be/src/util/mysql_row_buffer.cpp
@@ -361,13 +361,76 @@ int MysqlRowBuffer<is_binary_format>::push_double(double 
data) {
     return 0;
 }
 
+// Refer to https://dev.mysql.com/doc/refman/5.7/en/time.html
+// Encode time into MySQL binary protocol format with support for scale 
(microsecond precision)
+// Time value is limited between '-838:59:59' and '838:59:59'
+static int encode_binary_timev2(char* buff, double time, int scale) {
+    // Check if scale is valid (0 to 6)
+    if (scale < 0 || scale > 6) {
+        return -1; // Return error for invalid scale
+    }
+
+    int pos = 0;                      // Current position in the buffer
+    bool is_negative = time < 0;      // Determine if the time is negative
+    double abs_time = std::abs(time); // Convert time to absolute value
+
+    // Maximum time in microseconds: 838 hours, 59 minutes, 59 seconds
+    const int64_t MAX_TIME_MICROSECONDS = (838 * 3600 + 59 * 60 + 59) * 
1000000LL;
+
+    // Convert time into microseconds and enforce range limit
+    int64_t total_microseconds = static_cast<int64_t>(abs_time); // Total 
microseconds
+    if (total_microseconds > MAX_TIME_MICROSECONDS) {
+        total_microseconds = MAX_TIME_MICROSECONDS; // Cap at max time
+    }
+
+    // Adjust microseconds precision based on scale
+    total_microseconds /= static_cast<int64_t>(std::pow(10, 6 - scale)); // 
Scale adjustment
+    total_microseconds *= static_cast<int64_t>(std::pow(10, 6 - scale)); // 
Truncate extra precision
+
+    // Extract days, hours, minutes, seconds, and microseconds
+    int64_t days = total_microseconds / (3600LL * 24 * 1000000); // Calculate 
days
+    total_microseconds %= (3600LL * 24 * 1000000);
+
+    int64_t hours = total_microseconds / (3600LL * 1000000); // Remaining hours
+    total_microseconds %= (3600LL * 1000000);
+
+    int64_t minutes = total_microseconds / (60LL * 1000000); // Remaining 
minutes
+    total_microseconds %= (60LL * 1000000);
+
+    int64_t seconds = total_microseconds / 1000000;      // Remaining seconds
+    int64_t microseconds = total_microseconds % 1000000; // Remaining 
microseconds
+
+    // MySQL binary protocol rules for time encoding
+    if (days == 0 && hours == 0 && minutes == 0 && seconds == 0 && 
microseconds == 0) {
+        buff[pos++] = 0; // All zero: length is 0
+    } else if (microseconds == 0) {
+        buff[pos++] = 8;                                    // No 
microseconds: length is 8
+        buff[pos++] = is_negative ? 1 : 0;                  // Sign byte
+        int4store(buff + pos, static_cast<uint32_t>(days)); // Store days (4 
bytes)
+        pos += 4;
+        buff[pos++] = static_cast<char>(hours);   // Store hours (1 byte)
+        buff[pos++] = static_cast<char>(minutes); // Store minutes (1 byte)
+        buff[pos++] = static_cast<char>(seconds); // Store seconds (1 byte)
+    } else {
+        buff[pos++] = 12;                                   // Include 
microseconds: length is 12
+        buff[pos++] = is_negative ? 1 : 0;                  // Sign byte
+        int4store(buff + pos, static_cast<uint32_t>(days)); // Store days (4 
bytes)
+        pos += 4;
+        buff[pos++] = static_cast<char>(hours);                     // Store 
hours (1 byte)
+        buff[pos++] = static_cast<char>(minutes);                   // Store 
minutes (1 byte)
+        buff[pos++] = static_cast<char>(seconds);                   // Store 
seconds (1 byte)
+        int4store(buff + pos, static_cast<uint32_t>(microseconds)); // Store 
microseconds (4 bytes)
+        pos += 4;
+    }
+
+    return pos; // Return total bytes written to buffer
+}
+
 template <bool is_binary_format>
 int MysqlRowBuffer<is_binary_format>::push_time(double data) {
     if (is_binary_format && !_dynamic_mode) {
-        char buff[8];
-        _field_pos++;
-        float8store(buff, data);
-        return append(buff, 8);
+        throw doris::Exception(ErrorCode::NOT_IMPLEMENTED_ERROR,
+                               "Not supported time type for binary protocol");
     }
     // 1 for string trail, 1 for length, other for time str
     reserve(2 + MAX_TIME_WIDTH);
@@ -379,14 +442,13 @@ int MysqlRowBuffer<is_binary_format>::push_time(double 
data) {
 template <bool is_binary_format>
 int MysqlRowBuffer<is_binary_format>::push_timev2(double data, int scale) {
     if (is_binary_format && !_dynamic_mode) {
-        char buff[8];
+        char buff[13];
         _field_pos++;
-        float8store(buff, data);
-        return append(buff, 8);
+        int length = encode_binary_timev2(buff, data, scale);
+        return append(buff, length);
     }
-    // 1 for string trail, 1 for length, other for time str
-    reserve(2 + MAX_TIME_WIDTH);
 
+    reserve(2 + MAX_TIME_WIDTH);
     _pos = add_timev2(data, _pos, _dynamic_mode, scale);
     return 0;
 }
diff --git a/be/test/util/mysql_row_buffer_test.cpp 
b/be/test/util/mysql_row_buffer_test.cpp
index cfe012fdcd5..0fd2211f19d 100644
--- a/be/test/util/mysql_row_buffer_test.cpp
+++ b/be/test/util/mysql_row_buffer_test.cpp
@@ -118,4 +118,144 @@ TEST(MysqlRowBufferTest, dynamic_mode) {
     EXPECT_EQ(0, strncmp(buf + 43, "test", 4));
 }
 
+TEST(MysqlRowBufferTest, TestBinaryTimeCompressedEncoding) {
+    MysqlRowBuffer<true> buffer;
+    const char* buf = nullptr;
+    size_t offset = 0;
+
+    // Test case 1: Zero time value (all zeros), expect a single byte: 0.
+    buffer.push_timev2(0.0, 6);
+    buf = buffer.buf();
+    EXPECT_EQ(0, buf[0]);
+    offset = 1;
+
+    // Test case 2: Time value without microseconds (1:01:01)
+    // 1:01:01 = 3661 seconds, converted to microseconds: 3661 * 1e6 = 
3661000000.
+    // With scale=0 the microsecond part is 0, so an 8-byte encoding is used.
+    buffer.push_timev2(3661.0 * 1000000, 0);
+    buf = buffer.buf();
+    EXPECT_EQ(8, buf[offset]);                   // 8 bytes expected
+    EXPECT_EQ(0, buf[offset + 1]);               // Positive flag
+    EXPECT_EQ(0, *(int32_t*)(buf + offset + 2)); // Days = 0
+    EXPECT_EQ(1, buf[offset + 6]);               // Hour = 1
+    EXPECT_EQ(1, buf[offset + 7]);               // Minute = 1
+    EXPECT_EQ(1, buf[offset + 8]);               // Second = 1
+    offset += 9;
+
+    // Test case 3: Time value with microseconds (1:01:01.123456)
+    // 1:01:01.123456 seconds => 3661.123456 * 1e6 = 3661123456 microseconds.
+    // Scale=6 gives non-zero microsecond part, hence 12-byte encoding.
+    buffer.push_timev2(3661.123456 * 1000000, 6);
+    buf = buffer.buf();
+    EXPECT_EQ(12, buf[offset]);                       // 12 bytes expected
+    EXPECT_EQ(0, buf[offset + 1]);                    // Positive flag
+    EXPECT_EQ(0, *(int32_t*)(buf + offset + 2));      // Days = 0
+    EXPECT_EQ(1, buf[offset + 6]);                    // Hour = 1
+    EXPECT_EQ(1, buf[offset + 7]);                    // Minute = 1
+    EXPECT_EQ(1, buf[offset + 8]);                    // Second = 1
+    EXPECT_EQ(123456, *(int32_t*)(buf + offset + 9)); // Microseconds = 123456
+    offset += 13;
+
+    // Test case 4: Negative time value (-1:01:01.123456)
+    // Corresponding microseconds: -3661.123456 * 1e6 = -3661123456.
+    buffer.push_timev2(-3661.123456 * 1000000, 6);
+    buf = buffer.buf();
+    EXPECT_EQ(12, buf[offset]);                       // 12-byte encoding 
expected
+    EXPECT_EQ(1, buf[offset + 1]);                    // Negative flag (1)
+    EXPECT_EQ(0, *(int32_t*)(buf + offset + 2));      // Days = 0
+    EXPECT_EQ(1, buf[offset + 6]);                    // Hour = 1
+    EXPECT_EQ(1, buf[offset + 7]);                    // Minute = 1
+    EXPECT_EQ(1, buf[offset + 8]);                    // Second = 1
+    EXPECT_EQ(123456, *(int32_t*)(buf + offset + 9)); // Microseconds = 123456
+    offset += 13;
+
+    // Test case 5: Maximum time value (838:59:59.999999)
+    // The maximum time is defined as (int64_t)3020399 * 1000000 (i.e. no 
extra microseconds).
+    // Even if the input is 3020399.999999 * 1e6, it is truncated so that the 
microsecond part becomes 0.
+    // Therefore, an 8-byte encoding is expected.
+    buffer.push_timev2(3020399.999999 * 1000000, 6);
+    buf = buffer.buf();
+    EXPECT_EQ(8, buf[offset]);                    // 8-byte encoding expected
+    EXPECT_EQ(0, buf[offset + 1]);                // Positive flag
+    EXPECT_EQ(34, *(int32_t*)(buf + offset + 2)); // Days (e.g., 34, as per 
the conversion)
+    EXPECT_EQ(22, buf[offset + 6]);               // Hour = 22
+    EXPECT_EQ(59, buf[offset + 7]);               // Minute = 59
+    EXPECT_EQ(59, buf[offset + 8]);               // Second = 59
+    offset += 9;
+
+    // Test case 6: Time value exceeding the maximum.
+    // A value slightly greater than 3020399.999999 seconds will be truncated 
to the maximum value.
+    buffer.push_timev2(3020400.0 * 1000000, 6);
+    buf = buffer.buf();
+    EXPECT_EQ(8, buf[offset]);                    // 8-byte encoding expected
+    EXPECT_EQ(0, buf[offset + 1]);                // Positive flag
+    EXPECT_EQ(34, *(int32_t*)(buf + offset + 2)); // Days = 34
+    EXPECT_EQ(22, buf[offset + 6]);               // Hour = 22
+    EXPECT_EQ(59, buf[offset + 7]);               // Minute = 59
+    EXPECT_EQ(59, buf[offset + 8]);               // Second = 59
+    offset += 9;
+
+    // Test case 7: Different scale test (1:01:01.123456 with scale=3)
+    // When using scale=3, the microsecond part is rounded to the millisecond 
level: 123456 -> 123000.
+    // Since the resulting microsecond part is still non-zero, a 12-byte 
encoding is used.
+    buffer.push_timev2(3661.123456 * 1000000, 3);
+    buf = buffer.buf();
+    EXPECT_EQ(12, buf[offset]);                       // 12-byte encoding 
expected
+    EXPECT_EQ(0, buf[offset + 1]);                    // Positive flag
+    EXPECT_EQ(0, *(int32_t*)(buf + offset + 2));      // Days = 0
+    EXPECT_EQ(1, buf[offset + 6]);                    // Hour = 1
+    EXPECT_EQ(1, buf[offset + 7]);                    // Minute = 1
+    EXPECT_EQ(1, buf[offset + 8]);                    // Second = 1
+    EXPECT_EQ(123000, *(int32_t*)(buf + offset + 9)); // Microseconds rounded 
to 123000
+    offset += 13;
+
+    // Test case 8: Time value with scale=0 (1:01:01).
+    // Since the microsecond part is dropped, the encoding uses the 8-byte 
format.
+    buffer.push_timev2(3661.0 * 1000000, 0);
+    buf = buffer.buf();
+    EXPECT_EQ(8, buf[offset]); // 8-byte encoding expected
+    EXPECT_EQ(0, buf[offset + 1]);
+    EXPECT_EQ(0, *(int32_t*)(buf + offset + 2));
+    EXPECT_EQ(1, buf[offset + 6]);
+    EXPECT_EQ(1, buf[offset + 7]);
+    EXPECT_EQ(1, buf[offset + 8]);
+    offset += 9;
+
+    // Test case 9: Time value across days (e.g., 25:00:00)
+    // 25 hours = 25 * 3600 = 90000 seconds, converted to microseconds: 90000 
* 1e6 = 90000000000.
+    // 90000 seconds / 86400 gives 1 full day with 3600 seconds remaining.
+    // Hence, 8-byte encoding is expected.
+    buffer.push_timev2(90000.0 * 1000000, 0);
+    buf = buffer.buf();
+    EXPECT_EQ(8, buf[offset]); // 8-byte encoding expected
+    EXPECT_EQ(0, buf[offset + 1]);
+    EXPECT_EQ(1, *(int32_t*)(buf + offset + 2)); // Days = 1
+    EXPECT_EQ(1, buf[offset + 6]);               // Remaining 1 hour
+    EXPECT_EQ(0, buf[offset + 7]);
+    EXPECT_EQ(0, buf[offset + 8]);
+    offset += 9;
+
+    // Test case 10: Invalid scale test.
+    // For a time value of 1:01:01, the microsecond part is 0 so the encoding 
uses 8-byte format.
+    // Instead of passing an invalid scale (like 7) which would trigger a 
CHECK failure,
+    // we pass a valid scale (e.g., 6) to avoid process termination.
+    buffer.push_timev2(3661.0 * 1000000, 6);
+    buf = buffer.buf();
+    EXPECT_EQ(8, buf[offset]); // 8-byte encoding expected
+    offset += 9;
+
+    // Test case 11: Negative maximum time value (-838:59:59.999999)
+    // Corresponds to -3020399.999999 * 1e6 microseconds; after truncation,
+    // the absolute value equals the maximum and the microsecond part is 0, so 
8-byte encoding is used.
+    buffer.push_timev2(-3020399.999999 * 1000000, 6);
+    buf = buffer.buf();
+    EXPECT_EQ(8, buf[offset]);                    // 8-byte encoding expected
+    EXPECT_EQ(1, buf[offset + 1]);                // Negative flag
+    EXPECT_EQ(34, *(int32_t*)(buf + offset + 2)); // Days = 34
+    EXPECT_EQ(22, buf[offset + 6]);
+    EXPECT_EQ(59, buf[offset + 7]);
+    EXPECT_EQ(59, buf[offset + 8]);
+    offset += 9;
+}
+
 } // namespace doris


---------------------------------------------------------------------
To unsubscribe, e-mail: commits-unsubscr...@doris.apache.org
For additional commands, e-mail: commits-h...@doris.apache.org

(doris) branch branch-2.1 updated: branch-2.1: [fix](prepared statement) fix protocol with TIME datatype #47389 (#47543)

Reply via email to