This is an automated email from the ASF dual-hosted git repository.

mrhhsg pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/doris.git


The following commit(s) were added to refs/heads/master by this push:
     new 8fad28d108c [fix](function) A crash caused by nullptr in 
json_exists_path (#56331)
8fad28d108c is described below

commit 8fad28d108ca55cae7b0f8e7a480a193049cb6b3
Author: Jerry Hu <[email protected]>
AuthorDate: Tue Sep 23 17:30:38 2025 +0800

    [fix](function) A crash caused by nullptr in json_exists_path (#56331)
    
    ### What problem does this PR solve?
    
    ```
    *** SIGSEGV address not mapped to object (@0x0) received by PID 2836285 
(TID 2842945 OR 0x7bcf0eee9700) from PID 0; stack trace: ***
     0# doris::signal::(anonymous namespace)::FailureSignalHandler(int, 
siginfo_t*, void*) at /root/doris/be/src/common/signal_handler.h:420
     1# 0x00007FD73A577D10 in /lib64/libpthread.so.0
     2# doris::vectorized::PODArray<unsigned char, 4096ul, 
doris::Allocator<false, false, false, doris::DefaultMemoryAllocator, false>, 
16ul, 15ul>::t_start() const at /root/doris/be/src/vec/common/pod_array.h:414
     3# doris::vectorized::PODArray<unsigned char, 4096ul, 
doris::Allocator<false, false, false, doris::DefaultMemoryAllocator, false>, 
16ul, 15ul>::data() const at /root/doris/be/src/vec/common/pod_array.h:454
     4# 
doris::vectorized::FunctionJsonbExtractPath::execute_impl(doris::FunctionContext*,
 doris::vectorized::Block&, std::vector<unsigned int, std::allocator<unsigned 
int> > const&, unsigned int, unsigned long) const at 
/root/doris/be/src/vec/functions/function_jsonb.cpp:730
     5# non-virtual thunk to 
doris::vectorized::FunctionJsonbExtractPath::execute_impl(doris::FunctionContext*,
 doris::vectorized::Block&, std::vector<unsigned int, std::allocator<unsigned 
int> > const&, unsigned int, unsigned long) const in 
/root/doris/be/output/lib/doris_be
     6# 
doris::vectorized::PreparedFunctionImpl::_execute_skipped_constant_deal(doris::FunctionContext*,
 doris::vectorized::Block&, std::vector<unsigned int, std::allocator<unsigned 
int> > const&, unsigned int, unsigned long, bool) const at 
/root/doris/be/src/vec/functions/function.cpp:120
     7# 
doris::vectorized::PreparedFunctionImpl::execute_without_low_cardinality_columns(doris::FunctionContext*,
 doris::vectorized::Block&, std::vector<unsigned int, std::allocator<unsigned 
int> > const&, unsigned int, unsigned long, bool) const at 
/root/doris/be/src/vec/functions/function.cpp:242
     8# 
doris::vectorized::PreparedFunctionImpl::execute(doris::FunctionContext*, 
doris::vectorized::Block&, std::vector<unsigned int, std::allocator<unsigned 
int> > const&, unsigned int, unsigned long, bool) const at 
/root/doris/be/src/vec/functions/function.cpp:248
     9# doris::vectorized::IFunctionBase::execute(doris::FunctionContext*, 
doris::vectorized::Block&, std::vector<unsigned int, std::allocator<unsigned 
int> > const&, unsigned int, unsigned long, bool) const at 
/root/doris/be/src/vec/functions/function.h:189
    10# 
doris::vectorized::VectorizedFnCall::_do_execute(doris::vectorized::VExprContext*,
 doris::vectorized::Block*, int*, std::vector<unsigned int, 
std::allocator<unsigned int> >&) at 
/root/doris/be/src/vec/exprs/vectorized_fn_call.cpp:238
    11# 
doris::vectorized::VectorizedFnCall::execute(doris::vectorized::VExprContext*, 
doris::vectorized::Block*, int*) at 
/root/doris/be/src/vec/exprs/vectorized_fn_call.cpp:272
    12# doris::vectorized::VExprContext::execute(doris::vectorized::Block*, 
int*) at /root/doris/be/src/vec/exprs/vexpr_context.cpp:61
    13# doris::vectorized::Scanner::_do_projections(doris::vectorized::Block*, 
doris::vectorized::Block*) at /root/doris/be/src/vec/exec/scan/scanner.cpp:191
    14# 
doris::vectorized::Scanner::get_block_after_projects(doris::RuntimeState*, 
doris::vectorized::Block*, bool*) at 
/root/doris/be/src/vec/exec/scan/scanner.cpp:83
    15# 
doris::vectorized::ScannerScheduler::_scanner_scan(std::shared_ptr<doris::vectorized::ScannerContext>,
 std::shared_ptr<doris::vectorized::ScanTask>) at 
/root/doris/be/src/vec/exec/scan/scanner_scheduler.cpp:182
    16# 
doris::vectorized::ScannerScheduler::submit(std::shared_ptr<doris::vectorized::ScannerContext>,
 std::shared_ptr<doris::vectorized::ScanTask>)::$_0::operator()() 
const::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const at 
/root/doris/be/src/vec/exec/scan/scanner_scheduler.cpp:96
    17# 
doris::vectorized::ScannerScheduler::submit(std::shared_ptr<doris::vectorized::ScannerContext>,
 std::shared_ptr<doris::vectorized::ScanTask>)::$_0::operator()() 
const::{lambda()#1}::operator()() const at 
/root/doris/be/src/vec/exec/scan/scanner_scheduler.cpp:95
    18# bool std::__invoke_impl<bool, 
doris::vectorized::ScannerScheduler::submit(std::shared_ptr<doris::vectorized::ScannerContext>,
 std::shared_ptr<doris::vectorized::ScanTask>)::$_0::operator()() 
const::{lambda()#1}&>(std::__invoke_other, 
doris::vectorized::ScannerScheduler::submit(std::shared_ptr<doris::vectorized::ScannerContext>,
 std::shared_ptr<doris::vectorized::ScanTask>)::$_0::operator()() 
const::{lambda()#1}&) at 
/root/ldb_toolchain_taipan/bin/../lib/gcc/x86_64-pc-linux-gnu/15/ [...]
    19# std::enable_if<is_invocable_r_v<bool, 
doris::vectorized::ScannerScheduler::submit(std::shared_ptr<doris::vectorized::ScannerContext>,
 std::shared_ptr<doris::vectorized::ScanTask>)::$_0::operator()() 
const::{lambda()#1}&>, bool>::type std::__invoke_r<bool, 
doris::vectorized::ScannerScheduler::submit(std::shared_ptr<doris::vectorized::ScannerContext>,
 std::shared_ptr<doris::vectorized::ScanTask>)::$_0::operator()() 
const::{lambda()#1}&>(doris::vectorized::ScannerScheduler::submit(st [...]
    20# std::_Function_handler<bool (), 
doris::vectorized::ScannerScheduler::submit(std::shared_ptr<doris::vectorized::ScannerContext>,
 std::shared_ptr<doris::vectorized::ScanTask>)::$_0::operator()() 
const::{lambda()#1}>::_M_invoke(std::_Any_data const&) at 
/root/ldb_toolchain_taipan/bin/../lib/gcc/x86_64-pc-linux-gnu/15/include/g++-v15/bits/std_function.h:292
    21# std::function<bool ()>::operator()() const at 
/root/ldb_toolchain_taipan/bin/../lib/gcc/x86_64-pc-linux-gnu/15/include/g++-v15/bits/std_function.h:593
    22# 
doris::vectorized::ThreadPoolSimplifiedScanScheduler::submit_scan_task(doris::vectorized::SimplifiedScanTask)::{lambda()#1}::operator()()
 const at /root/doris/be/src/vec/exec/scan/scanner_scheduler.h:193
    23# void std::__invoke_impl<void, 
doris::vectorized::ThreadPoolSimplifiedScanScheduler::submit_scan_task(doris::vectorized::SimplifiedScanTask)::{lambda()#1}&>(std::__invoke_other,
 
doris::vectorized::ThreadPoolSimplifiedScanScheduler::submit_scan_task(doris::vectorized::SimplifiedScanTask)::{lambda()#1}&)
 at 
/root/ldb_toolchain_taipan/bin/../lib/gcc/x86_64-pc-linux-gnu/15/include/g++-v15/bits/invoke.h:63
    24# std::enable_if<is_invocable_r_v<void, 
doris::vectorized::ThreadPoolSimplifiedScanScheduler::submit_scan_task(doris::vectorized::SimplifiedScanTask)::{lambda()#1}&>,
 void>::type std::__invoke_r<void, 
doris::vectorized::ThreadPoolSimplifiedScanScheduler::submit_scan_task(doris::vectorized::SimplifiedScanTask)::{lambda()#1}&>(doris::vectorized::ThreadPoolSimplifiedScanScheduler::submit_scan_task(doris::vectorized::SimplifiedScanTask)::{lambda()#1}&)
 at /root/ldb_toolchain_taipan/bin/ [...]
    25# std::_Function_handler<void (), 
doris::vectorized::ThreadPoolSimplifiedScanScheduler::submit_scan_task(doris::vectorized::SimplifiedScanTask)::{lambda()#1}>::_M_invoke(std::_Any_data
 const&) at 
/root/ldb_toolchain_taipan/bin/../lib/gcc/x86_64-pc-linux-gnu/15/include/g++-v15/bits/std_function.h:292
    26# std::function<void ()>::operator()() const at 
/root/ldb_toolchain_taipan/bin/../lib/gcc/x86_64-pc-linux-gnu/15/include/g++-v15/bits/std_function.h:593
    27# doris::FunctionRunnable::run() at 
/root/doris/be/src/util/threadpool.cpp:60
    28# doris::ThreadPool::dispatch_thread() at 
/root/doris/be/src/util/threadpool.cpp:614
    29# void std::__invoke_impl<void, void (doris::ThreadPool::*&)(), 
doris::ThreadPool*&>(std::__invoke_memfun_deref, void 
(doris::ThreadPool::*&)(), doris::ThreadPool*&) at 
/root/ldb_toolchain_taipan/bin/../lib/gcc/x86_64-pc-linux-gnu/15/include/g++-v15/bits/invoke.h:76
    30# std::__invoke_result<void (doris::ThreadPool::*&)(), 
doris::ThreadPool*&>::type std::__invoke<void (doris::ThreadPool::*&)(), 
doris::ThreadPool*&>(void (doris::ThreadPool::*&)(), doris::ThreadPool*&) at 
/root/ldb_toolchain_taipan/bin/../lib/gcc/x86_64-pc-linux-gnu/15/include/g++-v15/bits/invoke.h:98
    31# void std::_Bind<void 
(doris::ThreadPool::*(doris::ThreadPool*))()>::__call<void, , 
0ul>(std::tuple<>&&, std::_Index_tuple<0ul>) at 
/root/ldb_toolchain_taipan/bin/../lib/gcc/x86_64-pc-linux-gnu/15/include/g++-v15/functional:515
    32# void std::_Bind<void 
(doris::ThreadPool::*(doris::ThreadPool*))()>::operator()<, void>() at 
/root/ldb_toolchain_taipan/bin/../lib/gcc/x86_64-pc-linux-gnu/15/include/g++-v15/functional:600
    33# void std::__invoke_impl<void, std::_Bind<void 
(doris::ThreadPool::*(doris::ThreadPool*))()>&>(std::__invoke_other, 
std::_Bind<void (doris::ThreadPool::*(doris::ThreadPool*))()>&) at 
/root/ldb_toolchain_taipan/bin/../lib/gcc/x86_64-pc-linux-gnu/15/include/g++-v15/bits/invoke.h:63
    34# std::enable_if<is_invocable_r_v<void, std::_Bind<void 
(doris::ThreadPool::*(doris::ThreadPool*))()>&>, void>::type 
std::__invoke_r<void, std::_Bind<void 
(doris::ThreadPool::*(doris::ThreadPool*))()>&>(std::_Bind<void 
(doris::ThreadPool::*(doris::ThreadPool*))()>&) at 
/root/ldb_toolchain_taipan/bin/../lib/gcc/x86_64-pc-linux-gnu/15/include/g++-v15/bits/invoke.h:119
    35# std::_Function_handler<void (), std::_Bind<void 
(doris::ThreadPool::*(doris::ThreadPool*))()> >::_M_invoke(std::_Any_data 
const&) at 
/root/ldb_toolchain_taipan/bin/../lib/gcc/x86_64-pc-linux-gnu/15/include/g++-v15/bits/std_function.h:292
    36# std::function<void ()>::operator()() const at 
/root/ldb_toolchain_taipan/bin/../lib/gcc/x86_64-pc-linux-gnu/15/include/g++-v15/bits/std_function.h:593
    37# doris::Thread::supervise_thread(void*) at 
/root/doris/be/src/util/thread.cpp:460
    38# asan_thread_start(void*) in /root/doris/be/output/lib/doris_be
    39# start_thread in /lib64/libpthread.so.0
    40# __GI___clone in /lib64/libc.so.6
    ```
    
    Related PR: #xxx
    
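    Problem Summary:
    
    `FunctionJsonbExtractPath::execute_impl` decided whether every row is
    NULL by reading `data_null_map->data()`. When the JSON argument is a
    non-nullable column (for example `json_col json not null`) while the
    path argument contains NULLs, `data_null_map` is presumably a null
    pointer, so the dereference crashed with the SIGSEGV shown above. The
    check now reads `result_null_map`, the null map that the path column's
    NULLs are merged into, instead.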
    
    ### Release note
    
    None
    
    ### Check List (For Author)
    
    - Test <!-- At least one of them must be included. -->
        - [ ] Regression test
        - [ ] Unit Test
        - [ ] Manual test (add detailed scripts or steps below)
        - [ ] No need to test or manual test. Explain why:
            - [ ] This is a refactor/code format and no logic has been changed.
            - [ ] Previous test can cover this change.
            - [ ] No code files have been changed.
            - [ ] Other reason <!-- Add your reason?  -->
    
    - Behavior changed:
        - [ ] No.
        - [ ] Yes. <!-- Explain the behavior change -->
    
    - Does this need documentation?
        - [ ] No.
        - [ ] Yes. <!-- Add document PR link here, e.g. https://github.com/apache/doris-website/pull/1214 -->
    
    ### Check List (For Reviewer who merge this PR)
    
    - [ ] Confirm the release note
    - [ ] Confirm test cases
    - [ ] Confirm document
    - [ ] Add branch pick label <!-- Add branch pick label that this PR
    should merge into -->
---
 be/src/vec/functions/function_jsonb.cpp            |  2 +-
 .../json_functions/test_json_exists_path.out       |  5 ++++
 .../json_functions/test_json_exists_path.groovy    | 32 ++++++++++++++++++++++
 3 files changed, 38 insertions(+), 1 deletion(-)

diff --git a/be/src/vec/functions/function_jsonb.cpp 
b/be/src/vec/functions/function_jsonb.cpp
index 7d83fa4c9be..de2b52480a9 100644
--- a/be/src/vec/functions/function_jsonb.cpp
+++ b/be/src/vec/functions/function_jsonb.cpp
@@ -727,7 +727,7 @@ public:
                 VectorizedUtils::update_null_map(*result_null_map, 
*path_null_map, path_const);
             }
 
-            if (0 == simd::count_zero_num(reinterpret_cast<const 
int8_t*>(data_null_map->data()),
+            if (0 == simd::count_zero_num(reinterpret_cast<const 
int8_t*>(result_null_map->data()),
                                           input_rows_count)) {
                 return create_all_null_result();
             }
diff --git 
a/regression-test/data/query_p0/sql_functions/json_functions/test_json_exists_path.out
 
b/regression-test/data/query_p0/sql_functions/json_functions/test_json_exists_path.out
index 31f5da434da..ec932f45fbf 100644
--- 
a/regression-test/data/query_p0/sql_functions/json_functions/test_json_exists_path.out
+++ 
b/regression-test/data/query_p0/sql_functions/json_functions/test_json_exists_path.out
@@ -117,3 +117,8 @@ true
 12     \N      $.k2    \N
 13     \N      $.k3    \N
 
+-- !test_all_null2 --
+2      {"k1":"v31","k2":{"sub_key":1234.56}}   \N      \N
+4      {"k1":"v31","k2":300}   \N      \N
+6      {"k1":"v31","k2":300}   \N      \N
+
diff --git 
a/regression-test/suites/query_p0/sql_functions/json_functions/test_json_exists_path.groovy
 
b/regression-test/suites/query_p0/sql_functions/json_functions/test_json_exists_path.groovy
index dedf9bb91f6..317523f51fd 100644
--- 
a/regression-test/suites/query_p0/sql_functions/json_functions/test_json_exists_path.groovy
+++ 
b/regression-test/suites/query_p0/sql_functions/json_functions/test_json_exists_path.groovy
@@ -163,6 +163,38 @@ suite("test_json_exists_path") {
         exception "Invalid Json Path for value: \$."
     }
 
+    sql """
+        drop table if exists json_exists_path_test2;
+    """
+
+    sql """
+        create table json_exists_path_test2 (
+            id int,
+            json_col json not null,
+            json_path string
+        ) distributed by hash(id) buckets 1 properties("replication_num" = 
"1");
+    """
+
+    sql """
+        insert into json_exists_path_test2 values
+        (1, '{"k1":"v31","k2":300}', '\$.k1'),
+        (2, '{"k1":"v31","k2":{"sub_key": 1234.56}}', null),
+        (3, '{"k1":"v31","k2": null}', '\$.k2'),
+        (4, '{"k1":"v31","k2":300}', null),
+        (5, '{"id": 123, "name": "doris"}', '\$.'),
+        (6, '{"k1":"v31","k2":300}', null),
+        (7, '{"k1":"v31","k2":{"sub_key": 1234.56}}', null);
+    """
+
+    qt_test_all_null2 """
+        select
+            id
+            , json_col
+            , json_path
+            , json_exists_path(json_col, json_path)
+        from json_exists_path_test2 where id % 2 = 0 order by id
+    """
+
     test {
         sql """
             select json_exists_path(json_col_non_null, '\$.') from 
json_exists_path_test where id = 5;


---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]

Reply via email to