raulcd opened a new issue, #45212: URL: https://github.com/apache/arrow/issues/45212
### Describe the bug, including details regarding any error messages, version, and platform. The [test-conda-cpp-valgrind](https://github.com/ursacomputing/crossbow/actions/runs/12680490061/job/35342372038) has been failing for a while now with some errors. Here is some part of the error log but more context can be found on the failed job: ``` } ==13669== Conditional jump or move depends on uninitialised value(s) ==13669== at 0x4C1629E: parquet::TypedColumnWriterImpl<parquet::PhysicalType<(parquet::Type::type)4> >::GetPageStatistics() (column_writer.cc:1381) ==13669== by 0x4BF3659: parquet::ColumnWriterImpl::BuildDataPageV1(long, long, long, std::shared_ptr<arrow::Buffer> const&) (column_writer.cc:992) ==13669== by 0x4C06447: parquet::ColumnWriterImpl::AddDataPage() (column_writer.cc:968) ==13669== by 0x4C0677B: parquet::ColumnWriterImpl::FlushBufferedDataPages() (column_writer.cc:1118) ==13669== by 0x4C0714D: parquet::ColumnWriterImpl::Close() (column_writer.cc:1094) ==13669== by 0x4C07324: parquet::TypedColumnWriterImpl<parquet::PhysicalType<(parquet::Type::type)4> >::Close() (column_writer.cc:1243) ==13669== by 0x4B8DFCD: parquet::arrow::(anonymous namespace)::ArrowColumnWriterV2::Write(parquet::ArrowWriteContext*) (writer.cc:160) ==13669== by 0x4B92C9C: parquet::arrow::FileWriterImpl::WriteColumnChunk(std::shared_ptr<arrow::ChunkedArray> const&, long, long) (writer.cc:355) ==13669== by 0x4B8D8A1: parquet::arrow::FileWriterImpl::WriteTable(arrow::Table const&, long)::{lambda(long, long)#1}::operator()(long, long) const (writer.cc:384) ==13669== by 0x4B9117C: parquet::arrow::FileWriterImpl::WriteTable(arrow::Table const&, long) (writer.cc:397) ==13669== by 0x49B79C9: arrow::dataset::ParquetFileWriter::Write(std::shared_ptr<arrow::RecordBatch> const&) (file_parquet.cc:765) ==13669== by 0x48FE006: arrow::dataset::internal::(anonymous namespace)::DatasetWriterFileQueue::WriteNext(std::shared_ptr<arrow::RecordBatch>)::{lambda()#1}::operator()() const (dataset_writer.cc:236) ==13669== by 0x48FE08A: std::enable_if<((!std::is_void<arrow::Status>::value)&&(!arrow::detail::is_future<arrow::Status>::value))&&((!arrow::Future<arrow::internal::Empty>::is_empty)||std::is_same<arrow::Status, arrow::Status>::value), void>::type arrow::detail::ContinueFuture::operator()<arrow::dataset::internal::(anonymous namespace)::DatasetWriterFileQueue::WriteNext(std::shared_ptr<arrow::RecordBatch>)::{lambda()#1}&, , arrow::Status, arrow::Future<arrow::internal::Empty> >(arrow::Future<arrow::internal::Empty>, arrow::dataset::internal::(anonymous namespace)::DatasetWriterFileQueue::WriteNext(std::shared_ptr<arrow::RecordBatch>)::{lambda()#1}&) const (future.h:150) ==13669== by 0x48FE128: void std::__invoke_impl<void, arrow::detail::ContinueFuture&, arrow::Future<arrow::internal::Empty>&, arrow::dataset::internal::(anonymous namespace)::DatasetWriterFileQueue::WriteNext(std::shared_ptr<arrow::RecordBatch>)::{lambda()#1}&>(std::__invoke_other, arrow::detail::ContinueFuture&, arrow::Future<arrow::internal::Empty>&, arrow::dataset::internal::(anonymous namespace)::DatasetWriterFileQueue::WriteNext(std::shared_ptr<arrow::RecordBatch>)::{lambda()#1}&) (invoke.h:61) ==13669== by 0x48FE19A: __invoke<arrow::detail::ContinueFuture&, arrow::Future<arrow::internal::Empty>&, arrow::dataset::internal::(anonymous namespace)::DatasetWriterFileQueue::WriteNext(std::shared_ptr<arrow::RecordBatch>)::<lambda()>&> (invoke.h:96) ==13669== by 0x48FE19A: __call<void, 0, 1> (functional:506) ==13669== by 0x48FE19A: operator()<> (functional:591) ==13669== by 0x48FE19A: arrow::internal::FnOnce<void ()>::FnImpl<std::_Bind<arrow::detail::ContinueFuture (arrow::Future<arrow::internal::Empty>, arrow::dataset::internal::(anonymous namespace)::DatasetWriterFileQueue::WriteNext(std::shared_ptr<arrow::RecordBatch>)::{lambda()#1})> >::invoke() (functional.h:152) ==13669== by 0x67F6021: arrow::internal::FnOnce<void ()>::operator()() && (functional.h:140) ==13669== by 0x67F8E48: arrow::internal::WorkerLoop(std::shared_ptr<arrow::internal::ThreadPool::State>, std::_List_iterator<std::thread>) (thread_pool.cc:478) ==13669== by 0x67F9179: arrow::internal::ThreadPool::LaunchWorkersUnlocked(int)::{lambda()#1}::operator()() const (thread_pool.cc:643) ==13669== by 0x67F91E4: __invoke_impl<void, arrow::internal::ThreadPool::LaunchWorkersUnlocked(int)::<lambda()> > (invoke.h:61) ==13669== by 0x67F91E4: __invoke<arrow::internal::ThreadPool::LaunchWorkersUnlocked(int)::<lambda()> > (invoke.h:96) ==13669== by 0x67F91E4: _M_invoke<0> (std_thread.h:292) ==13669== by 0x67F91E4: operator() (std_thread.h:299) ==13669== by 0x67F91E4: std::thread::_State_impl<std::thread::_Invoker<std::tuple<arrow::internal::ThreadPool::LaunchWorkersUnlocked(int)::{lambda()#1}> > >::_M_run() (std_thread.h:244) ==13669== by 0x70B5B74: execute_native_thread_routine (thread.cc:104) ==13669== by 0x7288AC2: start_thread (pthread_create.c:442) ==13669== by 0x7319A03: clone (clone.S:100) ==13669== { <insert_a_suppression_name_here> Memcheck:Cond fun:_ZN7parquet21TypedColumnWriterImplINS_12PhysicalTypeILNS_4Type4typeE4EEEE17GetPageStatisticsEv fun:_ZN7parquet16ColumnWriterImpl15BuildDataPageV1ElllRKSt10shared_ptrIN5arrow6BufferEE fun:_ZN7parquet16ColumnWriterImpl11AddDataPageEv fun:_ZN7parquet16ColumnWriterImpl22FlushBufferedDataPagesEv fun:_ZN7parquet16ColumnWriterImpl5CloseEv fun:_ZN7parquet21TypedColumnWriterImplINS_12PhysicalTypeILNS_4Type4typeE4EEEE5CloseEv fun:_ZN7parquet5arrow12_GLOBAL__N_119ArrowColumnWriterV25WriteEPNS_17ArrowWriteContextE fun:_ZN7parquet5arrow14FileWriterImpl16WriteColumnChunkERKSt10shared_ptrIN5arrow12ChunkedArrayEEll fun:_ZZN7parquet5arrow14FileWriterImpl10WriteTableERKN5arrow5TableElENKUlllE_clEll fun:_ZN7parquet5arrow14FileWriterImpl10WriteTableERKN5arrow5TableEl fun:_ZN5arrow7dataset17ParquetFileWriter5WriteERKSt10shared_ptrINS_11RecordBatchEE fun:_ZZN5arrow7dataset8internal12_GLOBAL__N_122DatasetWriterFileQueue9WriteNextESt10shared_ptrINS_11RecordBatchEEENKUlvE_clEv fun:_ZNK5arrow6detail14ContinueFutureclIRZNS_7dataset8internal12_GLOBAL__N_122DatasetWriterFileQueue9WriteNextESt10shared_ptrINS_11RecordBatchEEEUlvE_JENS_6StatusENS_6FutureINS_8internal5EmptyEEEEENSt9enable_ifIXaaaantsrSt7is_voidIT1_E5valuentsrNS0_9is_futureISJ_EE5valueoontsrT2_8is_emptysrSt7is_sameISJ_SC_E5valueEvE4typeESN_OT_DpOT0_ fun:_ZSt13__invoke_implIvRN5arrow6detail14ContinueFutureEJRNS0_6FutureINS0_8internal5EmptyEEERZNS0_7dataset8internal12_GLOBAL__N_122DatasetWriterFileQueue9WriteNextESt10shared_ptrINS0_11RecordBatchEEEUlvE_EET_St14__invoke_otherOT0_DpOT1_ fun:__invoke<arrow::detail::ContinueFuture&, arrow::Future<arrow::internal::Empty>&, arrow::dataset::internal::(anonymous namespace)::DatasetWriterFileQueue::WriteNext(std::shared_ptr<arrow::RecordBatch>)::<lambda()>&> fun:__call<void, 0, 1> fun:operator()<> fun:_ZN5arrow8internal6FnOnceIFvvEE6FnImplISt5_BindIFNS_6detail14ContinueFutureENS_6FutureINS0_5EmptyEEEZNS_7dataset8internal12_GLOBAL__N_122DatasetWriterFileQueue9WriteNextESt10shared_ptrINS_11RecordBatchEEEUlvE_EEE6invokeEv fun:_ZNO5arrow8internal6FnOnceIFvvEEclEv fun:_ZN5arrow8internalL10WorkerLoopESt10shared_ptrINS0_10ThreadPool5StateEESt14_List_iteratorISt6threadE fun:_ZZN5arrow8internal10ThreadPool21LaunchWorkersUnlockedEiENKUlvE_clEv fun:__invoke_impl<void, arrow::internal::ThreadPool::LaunchWorkersUnlocked(int)::<lambda()> > fun:__invoke<arrow::internal::ThreadPool::LaunchWorkersUnlocked(int)::<lambda()> > fun:_M_invoke<0> fun:operator() fun:_ZNSt6thread11_State_implINS_8_InvokerISt5tupleIJZN5arrow8internal10ThreadPool21LaunchWorkersUnlockedEiEUlvE_EEEEE6_M_runEv fun:execute_native_thread_routine fun:start_thread fun:clone } [ OK ] LargeRowEncryptionTest.ReadEncryptLargeRows (611 ms) [----------] 1 test from LargeRowEncryptionTest (611 ms total) [----------] Global test environment tear-down [==========] 3 tests from 2 test suites ran. (9334 ms total) [ PASSED ] 3 tests. ==13669== ==13669== HEAP SUMMARY: ==13669== in use at exit: 9,874 bytes in 157 blocks ==13669== total heap usage: 56,117 allocs, 55,960 frees, 16,502,688 bytes allocated ==13669== ==13669== LEAK SUMMARY: ==13669== definitely lost: 0 bytes in 0 blocks ==13669== indirectly lost: 0 bytes in 0 blocks ==13669== possibly lost: 0 bytes in 0 blocks ==13669== still reachable: 9,874 bytes in 157 blocks ==13669== suppressed: 0 bytes in 0 blocks ==13669== Reachable blocks (those to which a pointer was found) are not shown. ==13669== To see them, rerun with: --leak-check=full --show-leak-kinds=all ==13669== ==13669== Use --track-origins=yes to see where uninitialised values come from ==13669== For lists of detected and suppressed errors, rerun with: -s ==13669== ERROR SUMMARY: 96 errors from 6 contexts (suppressed: 0 from 0) ``` This is happening on the maintenance branch for 19.0.0. From the crossbow nightly report site it seems it started failing with this commits where I can see some potential ones causing the issue: https://github.com/apache/arrow/compare/313d11aa94c2be71142b55e3d8bb166d780c19c7...66be0f8031780b2a23b5d565a29363d47f7f41ff ### Component(s) C++, Parquet -- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. To unsubscribe, e-mail: issues-unsubscr...@arrow.apache.org.apache.org For queries about this service, please contact Infrastructure at: us...@infra.apache.org