raulcd opened a new issue, #45212:
URL: https://github.com/apache/arrow/issues/45212

   ### Describe the bug, including details regarding any error messages, 
version, and platform.
   
   The 
[test-conda-cpp-valgrind](https://github.com/ursacomputing/crossbow/actions/runs/12680490061/job/35342372038)
 has been failing for a while now with some errors. Here is some part of the 
error log but more context can be found on the failed job:
   ```
    }
   ==13669== Conditional jump or move depends on uninitialised value(s)
   ==13669==    at 0x4C1629E: 
parquet::TypedColumnWriterImpl<parquet::PhysicalType<(parquet::Type::type)4> 
>::GetPageStatistics() (column_writer.cc:1381)
   ==13669==    by 0x4BF3659: parquet::ColumnWriterImpl::BuildDataPageV1(long, 
long, long, std::shared_ptr<arrow::Buffer> const&) (column_writer.cc:992)
   ==13669==    by 0x4C06447: parquet::ColumnWriterImpl::AddDataPage() 
(column_writer.cc:968)
   ==13669==    by 0x4C0677B: 
parquet::ColumnWriterImpl::FlushBufferedDataPages() (column_writer.cc:1118)
   ==13669==    by 0x4C0714D: parquet::ColumnWriterImpl::Close() 
(column_writer.cc:1094)
   ==13669==    by 0x4C07324: 
parquet::TypedColumnWriterImpl<parquet::PhysicalType<(parquet::Type::type)4> 
>::Close() (column_writer.cc:1243)
   ==13669==    by 0x4B8DFCD: parquet::arrow::(anonymous 
namespace)::ArrowColumnWriterV2::Write(parquet::ArrowWriteContext*) 
(writer.cc:160)
   ==13669==    by 0x4B92C9C: 
parquet::arrow::FileWriterImpl::WriteColumnChunk(std::shared_ptr<arrow::ChunkedArray>
 const&, long, long) (writer.cc:355)
   ==13669==    by 0x4B8D8A1: 
parquet::arrow::FileWriterImpl::WriteTable(arrow::Table const&, 
long)::{lambda(long, long)#1}::operator()(long, long) const (writer.cc:384)
   ==13669==    by 0x4B9117C: 
parquet::arrow::FileWriterImpl::WriteTable(arrow::Table const&, long) 
(writer.cc:397)
   ==13669==    by 0x49B79C9: 
arrow::dataset::ParquetFileWriter::Write(std::shared_ptr<arrow::RecordBatch> 
const&) (file_parquet.cc:765)
   ==13669==    by 0x48FE006: arrow::dataset::internal::(anonymous 
namespace)::DatasetWriterFileQueue::WriteNext(std::shared_ptr<arrow::RecordBatch>)::{lambda()#1}::operator()()
 const (dataset_writer.cc:236)
   ==13669==    by 0x48FE08A: 
std::enable_if<((!std::is_void<arrow::Status>::value)&&(!arrow::detail::is_future<arrow::Status>::value))&&((!arrow::Future<arrow::internal::Empty>::is_empty)||std::is_same<arrow::Status,
 arrow::Status>::value), void>::type 
arrow::detail::ContinueFuture::operator()<arrow::dataset::internal::(anonymous 
namespace)::DatasetWriterFileQueue::WriteNext(std::shared_ptr<arrow::RecordBatch>)::{lambda()#1}&,
 , arrow::Status, arrow::Future<arrow::internal::Empty> 
>(arrow::Future<arrow::internal::Empty>, arrow::dataset::internal::(anonymous 
namespace)::DatasetWriterFileQueue::WriteNext(std::shared_ptr<arrow::RecordBatch>)::{lambda()#1}&)
 const (future.h:150)
   ==13669==    by 0x48FE128: void std::__invoke_impl<void, 
arrow::detail::ContinueFuture&, arrow::Future<arrow::internal::Empty>&, 
arrow::dataset::internal::(anonymous 
namespace)::DatasetWriterFileQueue::WriteNext(std::shared_ptr<arrow::RecordBatch>)::{lambda()#1}&>(std::__invoke_other,
 arrow::detail::ContinueFuture&, arrow::Future<arrow::internal::Empty>&, 
arrow::dataset::internal::(anonymous 
namespace)::DatasetWriterFileQueue::WriteNext(std::shared_ptr<arrow::RecordBatch>)::{lambda()#1}&)
 (invoke.h:61)
   ==13669==    by 0x48FE19A: __invoke<arrow::detail::ContinueFuture&, 
arrow::Future<arrow::internal::Empty>&, arrow::dataset::internal::(anonymous 
namespace)::DatasetWriterFileQueue::WriteNext(std::shared_ptr<arrow::RecordBatch>)::<lambda()>&>
 (invoke.h:96)
   ==13669==    by 0x48FE19A: __call<void, 0, 1> (functional:506)
   ==13669==    by 0x48FE19A: operator()<> (functional:591)
   ==13669==    by 0x48FE19A: arrow::internal::FnOnce<void 
()>::FnImpl<std::_Bind<arrow::detail::ContinueFuture 
(arrow::Future<arrow::internal::Empty>, arrow::dataset::internal::(anonymous 
namespace)::DatasetWriterFileQueue::WriteNext(std::shared_ptr<arrow::RecordBatch>)::{lambda()#1})>
 >::invoke() (functional.h:152)
   ==13669==    by 0x67F6021: arrow::internal::FnOnce<void ()>::operator()() && 
(functional.h:140)
   ==13669==    by 0x67F8E48: 
arrow::internal::WorkerLoop(std::shared_ptr<arrow::internal::ThreadPool::State>,
 std::_List_iterator<std::thread>) (thread_pool.cc:478)
   ==13669==    by 0x67F9179: 
arrow::internal::ThreadPool::LaunchWorkersUnlocked(int)::{lambda()#1}::operator()()
 const (thread_pool.cc:643)
   ==13669==    by 0x67F91E4: __invoke_impl<void, 
arrow::internal::ThreadPool::LaunchWorkersUnlocked(int)::<lambda()> > 
(invoke.h:61)
   ==13669==    by 0x67F91E4: 
__invoke<arrow::internal::ThreadPool::LaunchWorkersUnlocked(int)::<lambda()> > 
(invoke.h:96)
   ==13669==    by 0x67F91E4: _M_invoke<0> (std_thread.h:292)
   ==13669==    by 0x67F91E4: operator() (std_thread.h:299)
   ==13669==    by 0x67F91E4: 
std::thread::_State_impl<std::thread::_Invoker<std::tuple<arrow::internal::ThreadPool::LaunchWorkersUnlocked(int)::{lambda()#1}>
 > >::_M_run() (std_thread.h:244)
   ==13669==    by 0x70B5B74: execute_native_thread_routine (thread.cc:104)
   ==13669==    by 0x7288AC2: start_thread (pthread_create.c:442)
   ==13669==    by 0x7319A03: clone (clone.S:100)
   ==13669== 
   {
      <insert_a_suppression_name_here>
      Memcheck:Cond
      
fun:_ZN7parquet21TypedColumnWriterImplINS_12PhysicalTypeILNS_4Type4typeE4EEEE17GetPageStatisticsEv
      
fun:_ZN7parquet16ColumnWriterImpl15BuildDataPageV1ElllRKSt10shared_ptrIN5arrow6BufferEE
      fun:_ZN7parquet16ColumnWriterImpl11AddDataPageEv
      fun:_ZN7parquet16ColumnWriterImpl22FlushBufferedDataPagesEv
      fun:_ZN7parquet16ColumnWriterImpl5CloseEv
      
fun:_ZN7parquet21TypedColumnWriterImplINS_12PhysicalTypeILNS_4Type4typeE4EEEE5CloseEv
      
fun:_ZN7parquet5arrow12_GLOBAL__N_119ArrowColumnWriterV25WriteEPNS_17ArrowWriteContextE
      
fun:_ZN7parquet5arrow14FileWriterImpl16WriteColumnChunkERKSt10shared_ptrIN5arrow12ChunkedArrayEEll
      
fun:_ZZN7parquet5arrow14FileWriterImpl10WriteTableERKN5arrow5TableElENKUlllE_clEll
      fun:_ZN7parquet5arrow14FileWriterImpl10WriteTableERKN5arrow5TableEl
      
fun:_ZN5arrow7dataset17ParquetFileWriter5WriteERKSt10shared_ptrINS_11RecordBatchEE
      
fun:_ZZN5arrow7dataset8internal12_GLOBAL__N_122DatasetWriterFileQueue9WriteNextESt10shared_ptrINS_11RecordBatchEEENKUlvE_clEv
      
fun:_ZNK5arrow6detail14ContinueFutureclIRZNS_7dataset8internal12_GLOBAL__N_122DatasetWriterFileQueue9WriteNextESt10shared_ptrINS_11RecordBatchEEEUlvE_JENS_6StatusENS_6FutureINS_8internal5EmptyEEEEENSt9enable_ifIXaaaantsrSt7is_voidIT1_E5valuentsrNS0_9is_futureISJ_EE5valueoontsrT2_8is_emptysrSt7is_sameISJ_SC_E5valueEvE4typeESN_OT_DpOT0_
      
fun:_ZSt13__invoke_implIvRN5arrow6detail14ContinueFutureEJRNS0_6FutureINS0_8internal5EmptyEEERZNS0_7dataset8internal12_GLOBAL__N_122DatasetWriterFileQueue9WriteNextESt10shared_ptrINS0_11RecordBatchEEEUlvE_EET_St14__invoke_otherOT0_DpOT1_
      fun:__invoke<arrow::detail::ContinueFuture&, 
arrow::Future<arrow::internal::Empty>&, arrow::dataset::internal::(anonymous 
namespace)::DatasetWriterFileQueue::WriteNext(std::shared_ptr<arrow::RecordBatch>)::<lambda()>&>
      fun:__call<void, 0, 1>
      fun:operator()<>
      
fun:_ZN5arrow8internal6FnOnceIFvvEE6FnImplISt5_BindIFNS_6detail14ContinueFutureENS_6FutureINS0_5EmptyEEEZNS_7dataset8internal12_GLOBAL__N_122DatasetWriterFileQueue9WriteNextESt10shared_ptrINS_11RecordBatchEEEUlvE_EEE6invokeEv
      fun:_ZNO5arrow8internal6FnOnceIFvvEEclEv
      
fun:_ZN5arrow8internalL10WorkerLoopESt10shared_ptrINS0_10ThreadPool5StateEESt14_List_iteratorISt6threadE
      fun:_ZZN5arrow8internal10ThreadPool21LaunchWorkersUnlockedEiENKUlvE_clEv
      fun:__invoke_impl<void, 
arrow::internal::ThreadPool::LaunchWorkersUnlocked(int)::<lambda()> >
      
fun:__invoke<arrow::internal::ThreadPool::LaunchWorkersUnlocked(int)::<lambda()>
 >
      fun:_M_invoke<0>
      fun:operator()
      
fun:_ZNSt6thread11_State_implINS_8_InvokerISt5tupleIJZN5arrow8internal10ThreadPool21LaunchWorkersUnlockedEiEUlvE_EEEEE6_M_runEv
      fun:execute_native_thread_routine
      fun:start_thread
      fun:clone
   }
   [       OK ] LargeRowEncryptionTest.ReadEncryptLargeRows (611 ms)
   [----------] 1 test from LargeRowEncryptionTest (611 ms total)
   
   [----------] Global test environment tear-down
   [==========] 3 tests from 2 test suites ran. (9334 ms total)
   [  PASSED  ] 3 tests.
   ==13669== 
   ==13669== HEAP SUMMARY:
   ==13669==     in use at exit: 9,874 bytes in 157 blocks
   ==13669==   total heap usage: 56,117 allocs, 55,960 frees, 16,502,688 bytes 
allocated
   ==13669== 
   ==13669== LEAK SUMMARY:
   ==13669==    definitely lost: 0 bytes in 0 blocks
   ==13669==    indirectly lost: 0 bytes in 0 blocks
   ==13669==      possibly lost: 0 bytes in 0 blocks
   ==13669==    still reachable: 9,874 bytes in 157 blocks
   ==13669==         suppressed: 0 bytes in 0 blocks
   ==13669== Reachable blocks (those to which a pointer was found) are not 
shown.
   ==13669== To see them, rerun with: --leak-check=full --show-leak-kinds=all
   ==13669== 
   ==13669== Use --track-origins=yes to see where uninitialised values come from
   ==13669== For lists of detected and suppressed errors, rerun with: -s
   ==13669== ERROR SUMMARY: 96 errors from 6 contexts (suppressed: 0 from 0)
   ```
   This is happening on the maintenance branch for 19.0.0.
   
   From the crossbow nightly report site it seems it started failing with this 
commits where I can see some potential ones causing the issue:
   
https://github.com/apache/arrow/compare/313d11aa94c2be71142b55e3d8bb166d780c19c7...66be0f8031780b2a23b5d565a29363d47f7f41ff
   
   ### Component(s)
   
   C++, Parquet


-- 
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.

To unsubscribe, e-mail: issues-unsubscr...@arrow.apache.org.apache.org

For queries about this service, please contact Infrastructure at:
us...@infra.apache.org

Reply via email to