This is an automated email from the ASF dual-hosted git repository.

dataroaring pushed a commit to branch branch-3.0
in repository https://gitbox.apache.org/repos/asf/doris.git


The following commit(s) were added to refs/heads/branch-3.0 by this push:
     new e3073edd6f8 branch-3.0: [Opt](function) Speed up function string and 
add regression #45062 (#45107)
e3073edd6f8 is described below

commit e3073edd6f868afe999480f02f69976ca1d17417
Author: github-actions[bot] 
<41898282+github-actions[bot]@users.noreply.github.com>
AuthorDate: Fri Dec 20 00:42:31 2024 +0800

    branch-3.0: [Opt](function) Speed up function string and add regression 
#45062 (#45107)
    
    Cherry-picked from #45062
    
    Co-authored-by: zclllhhjj <zhaochan...@selectdb.com>
---
 be/src/vec/functions/function_string.cpp              | 19 ++++++++++---------
 .../nereids_function_p0/scalar_function/S.groovy      |  1 +
 2 files changed, 11 insertions(+), 9 deletions(-)

diff --git a/be/src/vec/functions/function_string.cpp 
b/be/src/vec/functions/function_string.cpp
index 1876ed499f4..1f88c0f5bcf 100644
--- a/be/src/vec/functions/function_string.cpp
+++ b/be/src/vec/functions/function_string.cpp
@@ -888,16 +888,17 @@ struct StringSpace {
                          ColumnString::Offsets& res_offsets) {
         res_offsets.resize(data.size());
         size_t input_size = res_offsets.size();
-        std::vector<char, Allocator_<char>> buffer;
+        // sample to get approximate best reserve size
+        if (input_size > 4) {
+            res_data.reserve(((data[0] + data[input_size >> 1] + 
data[input_size >> 2] +
+                               data[input_size - 1]) >>
+                              2) *
+                             input_size);
+        }
         for (size_t i = 0; i < input_size; ++i) {
-            buffer.clear();
-            if (data[i] > 0) {
-                buffer.resize(data[i]);
-                for (size_t j = 0; j < data[i]; ++j) {
-                    buffer[j] = ' ';
-                }
-                StringOP::push_value_string(std::string_view(buffer.data(), 
buffer.size()), i,
-                                            res_data, res_offsets);
+            if (data[i] > 0) [[likely]] {
+                res_data.resize_fill(res_data.size() + data[i], ' ');
+                res_offsets[i] = res_data.size();
             } else {
                 StringOP::push_empty_string(i, res_data, res_offsets);
             }
diff --git 
a/regression-test/suites/nereids_function_p0/scalar_function/S.groovy 
b/regression-test/suites/nereids_function_p0/scalar_function/S.groovy
index 98a8685a888..ea0d80d8adc 100644
--- a/regression-test/suites/nereids_function_p0/scalar_function/S.groovy
+++ b/regression-test/suites/nereids_function_p0/scalar_function/S.groovy
@@ -126,6 +126,7 @@ suite("nereids_scalar_fn_S") {
 
        sql "select space(10) from fn_test order by kint"
        sql "select space(10) from fn_test_not_nullable order by kint"
+       sql """select k from (select length(space(number)) k from 
numbers("number" = "10"))t;""" // before #44919 will crash
        qt_sql_split_part_Varchar_Varchar_Integer "select split_part(kvchrs1, ' 
', 1) from fn_test order by kvchrs1"
        qt_sql_split_part_Varchar_Varchar_Integer_notnull "select 
split_part(kvchrs1, ' ', 1) from fn_test_not_nullable order by kvchrs1"
        qt_sql_split_part_String_String_Integer "select split_part(kstr, ' ', 
1) from fn_test order by kstr"


---------------------------------------------------------------------
To unsubscribe, e-mail: commits-unsubscr...@doris.apache.org
For additional commands, e-mail: commits-h...@doris.apache.org

Reply via email to