[
https://issues.apache.org/jira/browse/KUDU-1528?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=15423896#comment-15423896
]
Todd Lipcon commented on KUDU-1528:
-----------------------------------
Saw something similar in a real cluster: one thread at:
Thread 127 (Thread 0x7f776c92c700 (LWP 63948)):
#0 0x0000003e8b60b7bb in pthread_cond_timedwait@@GLIBC_2.3.2 () from
/lib64/libpthread.so.0
#1 0x000000000189747d in kudu::ConditionVariable::TimedWait(kudu::MonoDelta
const&) const ()
#2 0x0000000001908c5c in kudu::ThreadJoiner::Join() ()
#3 0x00000000009a74ca in kudu::log::Log::AppendThread::Shutdown() ()
#4 0x00000000009ab996 in kudu::log::Log::Close() ()
#5 0x00000000008cb92a in kudu::tablet::TabletPeer::Shutdown() ()
#6 0x00000000007a07ae in
kudu::tserver::TSTabletManager::DeleteTablet(std::basic_string<char,
std::char_traits<char>, std::allocator<char> > const&,
kudu::tablet::TabletDataState, boost::optional<long> const&,
boost::optional<kudu::tserver::TabletServerErrorPB_Code>*) ()
#7 0x0000000000786c89 in
kudu::tserver::TabletServiceAdminImpl::DeleteTablet(kudu::tserver::DeleteTabletRequestPB
const*, kudu::tserver::DeleteTabletResponsePB*, kudu::rpc::RpcContext*) ()
another thread crashed in:
#6 0x00000000007d80ef in google::LogMessageFatal::~LogMessageFatal() ()
#7 0x000000000099140f in
kudu::consensus::PeerMessageQueue::LocalPeerAppendFinished(kudu::consensus::OpId
const&, kudu::Callback<void ()(kudu::Status const&)> const&, kudu::Status
const&) ()
#8 0x00000000009987b9 in kudu::consensus::LogCache::LogCallback(long, bool,
kudu::Callback<void ()(kudu::Status const&)> const&, kudu::Status const&) ()
#9 0x00000000009b048b in kudu::log::Log::AppendThread::RunThread() ()
with:
F0816 18:23:24.599644 64693 consensus_queue.cc:221] Check failed: _s.ok() Bad
status: Service unavailable: The pool has been shut down.
> heap-use-after-free in Peer::ProcessResponse while deleting a tablet
> ---------------------------------------------------------------------
>
> Key: KUDU-1528
> URL: https://issues.apache.org/jira/browse/KUDU-1528
> Project: Kudu
> Issue Type: Bug
> Components: consensus
> Affects Versions: 0.9.1
> Reporter: Adar Dembo
> Priority: Critical
>
> Observed this in a [master-stress-test
> failure|http://104.196.14.100/job/kudu-gerrit/2314/BUILD_TYPE=ASAN]. It
> appears that we deleted a tablet while we were processing the response to
> ConsensusService::UpdateConsensus().
> {noformat}
> ==721==ERROR: AddressSanitizer: heap-use-after-free on address 0x6140001b8fb0
> at pc 0x7f54968ac684 bp 0x7f5487e485b0 sp 0x7f5487e485a8
> READ of size 8 at 0x6140001b8fb0 thread T6 (rpc reactor-728)
> #0 0x7f54968ac683 in scoped_refptr<kudu::Histogram>::operator
> kudu::Histogram* scoped_refptr<kudu::Histogram>::*() const
> /home/jenkins-slave/workspace/kudu-3/src/kudu/gutil/ref_counted.h:269:38
> #1 0x7f5491297e5b in
> kudu::ThreadPool::Submit(std::shared_ptr<kudu::Runnable> const&)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/util/threadpool.cc:241:7
> #2 0x7f54912978cd in kudu::ThreadPool::SubmitFunc(boost::function<void
> ()> const&)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/util/threadpool.cc:182:10
> #3 0x7f54912976ef in kudu::ThreadPool::SubmitClosure(kudu::Callback<void
> ()> const&)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/util/threadpool.cc:178:10
> #4 0x7f5497f3929c in kudu::consensus::Peer::ProcessResponse()
> /home/jenkins-slave/workspace/kudu-3/src/kudu/consensus/consensus_peers.cc:263:14
> #5 0x7f5497f440ad in boost::_bi::bind_t<void, boost::_mfi::mf0<void,
> kudu::consensus::Peer>,
> boost::_bi::list1<boost::_bi::value<kudu::consensus::Peer*> > >::operator()()
> /home/jenkins-slave/workspace/kudu-3/thirdparty/installed/include/boost/bind/bind.hpp:1222:16
> #6 0x7f549688135e in boost::function0<void>::operator()() const
> /home/jenkins-slave/workspace/kudu-3/thirdparty/installed/include/boost/function/function_template.hpp:770:14
> #7 0x7f549687ca1e in kudu::rpc::OutboundCall::CallCallback()
> /home/jenkins-slave/workspace/kudu-3/src/kudu/rpc/outbound_call.cc:189:5
> #8 0x7f549687ce01 in
> kudu::rpc::OutboundCall::SetResponse(gscoped_ptr<kudu::rpc::CallResponse,
> kudu::DefaultDeleter<kudu::rpc::CallResponse> >)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/rpc/outbound_call.cc:221:5
> #9 0x7f549688ea1f in
> kudu::rpc::Connection::HandleCallResponse(gscoped_ptr<kudu::rpc::InboundTransfer,
> kudu::DefaultDeleter<kudu::rpc::InboundTransfer> >)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/rpc/connection.cc:534:3
> #10 0x7f549688ded2 in kudu::rpc::Connection::ReadHandler(ev::io&, int)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/rpc/connection.cc:470:7
> #11 0x7f5496184605 in ev_invoke_pending
> /home/jenkins-slave/workspace/kudu-2/thirdparty/libev-4.20/ev.c:3155
> #12 0x7f54961854f7 in ev_run
> /home/jenkins-slave/workspace/kudu-2/thirdparty/libev-4.20/ev.c:3555
> #13 0x7f54968c6cca in kudu::rpc::ReactorThread::RunThread()
> /home/jenkins-slave/workspace/kudu-3/src/kudu/rpc/reactor.cc:306:3
> #14 0x7f54968d69dd in boost::_bi::bind_t<void, boost::_mfi::mf0<void,
> kudu::rpc::ReactorThread>,
> boost::_bi::list1<boost::_bi::value<kudu::rpc::ReactorThread*> >
> >::operator()()
> /home/jenkins-slave/workspace/kudu-3/thirdparty/installed/include/boost/bind/bind.hpp:1222:16
> #15 0x7f549688135e in boost::function0<void>::operator()() const
> /home/jenkins-slave/workspace/kudu-3/thirdparty/installed/include/boost/function/function_template.hpp:770:14
> #16 0x7f5491285dd6 in kudu::Thread::SuperviseThread(void*)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/util/thread.cc:586:3
> #17 0x7f5493bcb181 in start_thread
> /build/eglibc-3GlaMS/eglibc-2.19/nptl/pthread_create.c:312
> #18 0x7f548e6fe47c in clone
> /build/eglibc-3GlaMS/eglibc-2.19/misc/../sysdeps/unix/sysv/linux/x86_64/clone.S:111
> 0x6140001b8fb0 is located 368 bytes inside of 416-byte region
> [0x6140001b8e40,0x6140001b8fe0)
> freed by thread T31 (rpc worker-753) here:
> #0 0x4f54d0 in operator delete(void*)
> /home/jenkins-slave/workspace/kudu-3/thirdparty/llvm-3.8.0.src/projects/compiler-rt/lib/asan/asan_new_delete.cc:94
> #1 0x7f5497f9e40d in kudu::consensus::RaftConsensus::~RaftConsensus()
> /home/jenkins-slave/workspace/kudu-3/src/kudu/consensus/raft_consensus.cc:244:1
> #2 0x7f5497f9e551 in kudu::consensus::RaftConsensus::~RaftConsensus()
> /home/jenkins-slave/workspace/kudu-3/src/kudu/consensus/raft_consensus.cc:242:33
> #3 0x7f5498adf6e8 in
> scoped_refptr<kudu::consensus::Consensus>::operator=(kudu::consensus::Consensus*)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/gutil/ref_counted.h:284:7
> #4 0x7f5498ad3d41 in kudu::tablet::TabletPeer::Shutdown()
> /home/jenkins-slave/workspace/kudu-3/src/kudu/tablet/tablet_peer.cc:255:5
> #5 0x7f549adedd6d in
> kudu::tserver::TSTabletManager::DeleteTablet(std::string const&,
> kudu::tablet::TabletDataState, boost::optional<long> const&,
> boost::optional<kudu::tserver::TabletServerErrorPB_Code>*)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/tserver/ts_tablet_manager.cc:525:3
> #6 0x7f549adacdbd in
> kudu::tserver::TabletServiceAdminImpl::DeleteTablet(kudu::tserver::DeleteTabletRequestPB
> const*, kudu::tserver::DeleteTabletResponsePB*, kudu::rpc::RpcContext*)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/tserver/tablet_service.cc:664:14
> #7 0x7f549707daae in std::_Function_handler<void
> (google::protobuf::Message const*, google::protobuf::Message*,
> kudu::rpc::RpcContext*),
> kudu::tserver::TabletServerAdminServiceIf::TabletServerAdminServiceIf(scoped_refptr<kudu::MetricEntity>
> const&)::$_1>::_M_invoke(std::_Any_data const&, google::protobuf::Message
> const*, google::protobuf::Message*, kudu::rpc::RpcContext*)
> /usr/lib/gcc/x86_64-linux-gnu/4.8/../../../../include/c++/4.8/functional:2071:2
> #8 0x7f549691f220 in std::function<void (google::protobuf::Message
> const*, google::protobuf::Message*,
> kudu::rpc::RpcContext*)>::operator()(google::protobuf::Message const*,
> google::protobuf::Message*, kudu::rpc::RpcContext*) const
> /usr/lib/gcc/x86_64-linux-gnu/4.8/../../../../include/c++/4.8/functional:2471:14
> #9 0x7f549691e913 in
> kudu::rpc::GeneratedServiceIf::Handle(kudu::rpc::InboundCall*)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/rpc/service_if.cc:94:3
> #10 0x7f5496921599 in kudu::rpc::ServicePool::RunThread()
> /home/jenkins-slave/workspace/kudu-3/src/kudu/rpc/service_pool.cc:206:5
> #11 0x7f549692533d in boost::_bi::bind_t<void, boost::_mfi::mf0<void,
> kudu::rpc::ServicePool>,
> boost::_bi::list1<boost::_bi::value<kudu::rpc::ServicePool*> >
> >::operator()()
> /home/jenkins-slave/workspace/kudu-3/thirdparty/installed/include/boost/bind/bind.hpp:1222:16
> #12 0x7f549688135e in boost::function0<void>::operator()() const
> /home/jenkins-slave/workspace/kudu-3/thirdparty/installed/include/boost/function/function_template.hpp:770:14
> #13 0x7f5491285dd6 in kudu::Thread::SuperviseThread(void*)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/util/thread.cc:586:3
> #14 0x7f5493bcb181 in start_thread
> /build/eglibc-3GlaMS/eglibc-2.19/nptl/pthread_create.c:312
> previously allocated by thread T121 (tablet-bootstra) here:
> #0 0x4f4e90 in operator new(unsigned long)
> /home/jenkins-slave/workspace/kudu-3/thirdparty/llvm-3.8.0.src/projects/compiler-rt/lib/asan/asan_new_delete.cc:62
> #1 0x7f5491295c3e in
> kudu::ThreadPoolBuilder::Build(gscoped_ptr<kudu::ThreadPool,
> kudu::DefaultDeleter<kudu::ThreadPool> >*) const
> /home/jenkins-slave/workspace/kudu-3/src/kudu/util/threadpool.cc:96:15
> #2 0x7f5497f9d2f0 in
> kudu::consensus::RaftConsensus::Create(kudu::consensus::ConsensusOptions
> const&, gscoped_ptr<kudu::consensus::ConsensusMetadata,
> kudu::DefaultDeleter<kudu::consensus::ConsensusMetadata> >,
> kudu::consensus::RaftPeerPB const&, scoped_refptr<kudu::MetricEntity> const&,
> scoped_refptr<kudu::server::Clock> const&,
> kudu::consensus::ReplicaTransactionFactory*,
> std::shared_ptr<kudu::rpc::Messenger> const&, scoped_refptr<kudu::log::Log>
> const&, std::shared_ptr<kudu::MemTracker> const&, kudu::Callback<void
> (std::string const&)> const&)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/consensus/raft_consensus.cc:172:3
> #3 0x7f5498ad244d in
> kudu::tablet::TabletPeer::Init(std::shared_ptr<kudu::tablet::Tablet> const&,
> scoped_refptr<kudu::server::Clock> const&,
> std::shared_ptr<kudu::rpc::Messenger> const&, scoped_refptr<kudu::log::Log>
> const&, scoped_refptr<kudu::MetricEntity> const&)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/tablet/tablet_peer.cc:156:18
> #4 0x7f549ade847e in
> kudu::tserver::TSTabletManager::OpenTablet(scoped_refptr<kudu::tablet::TabletMetadata>
> const&, scoped_refptr<kudu::tserver::TransitionInProgressDeleter> const&)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/tserver/ts_tablet_manager.cc:659:10
> #5 0x7f549adfac7d in boost::_bi::bind_t<void, boost::_mfi::mf2<void,
> kudu::tserver::TSTabletManager, scoped_refptr<kudu::tablet::TabletMetadata>
> const&, scoped_refptr<kudu::tserver::TransitionInProgressDeleter> const&>,
> boost::_bi::list3<boost::_bi::value<kudu::tserver::TSTabletManager*>,
> boost::_bi::value<scoped_refptr<kudu::tablet::TabletMetadata> >,
> boost::_bi::value<scoped_refptr<kudu::tserver::TransitionInProgressDeleter> >
> > >::operator()()
> /home/jenkins-slave/workspace/kudu-3/thirdparty/installed/include/boost/bind/bind.hpp:1222:16
> #6 0x7f549688135e in boost::function0<void>::operator()() const
> /home/jenkins-slave/workspace/kudu-3/thirdparty/installed/include/boost/function/function_template.hpp:770:14
> #7 0x7f5491298bfb in kudu::ThreadPool::DispatchThread(bool)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/util/threadpool.cc:343:7
> #8 0x7f54912a00dd in boost::_bi::bind_t<void, boost::_mfi::mf1<void,
> kudu::ThreadPool, bool>,
> boost::_bi::list2<boost::_bi::value<kudu::ThreadPool*>,
> boost::_bi::value<bool> > >::operator()()
> /home/jenkins-slave/workspace/kudu-3/thirdparty/installed/include/boost/bind/bind.hpp:1222:16
> #9 0x7f549688135e in boost::function0<void>::operator()() const
> /home/jenkins-slave/workspace/kudu-3/thirdparty/installed/include/boost/function/function_template.hpp:770:14
> #10 0x7f5491285dd6 in kudu::Thread::SuperviseThread(void*)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/util/thread.cc:586:3
> #11 0x7f5493bcb181 in start_thread
> /build/eglibc-3GlaMS/eglibc-2.19/nptl/pthread_create.c:312
> Thread T6 (rpc reactor-728) created by T0 here:
> #0 0x4301cd in __interceptor_pthread_create
> /home/jenkins-slave/workspace/kudu-3/thirdparty/llvm-3.8.0.src/projects/compiler-rt/lib/asan/asan_interceptors.cc:238
> #1 0x7f54912852bb in kudu::Thread::StartThread(std::string const&,
> std::string const&, boost::function<void ()> const&, unsigned long,
> scoped_refptr<kudu::Thread>*)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/util/thread.cc:509:15
> #2 0x7f54968ce906 in kudu::Status kudu::Thread::Create<void
> (kudu::rpc::ReactorThread::*)(), kudu::rpc::ReactorThread*>(std::string
> const&, std::string const&, void (kudu::rpc::ReactorThread::* const&)(),
> kudu::rpc::ReactorThread* const&, scoped_refptr<kudu::Thread>*)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/util/thread.h:156:12
> #3 0x7f54968c69e6 in kudu::rpc::ReactorThread::Init()
> /home/jenkins-slave/workspace/kudu-3/src/kudu/rpc/reactor.cc:108:10
> #4 0x7f54968cca15 in kudu::rpc::Reactor::Init()
> /home/jenkins-slave/workspace/kudu-3/src/kudu/rpc/reactor.cc:488:10
> #5 0x7f54968b0691 in kudu::rpc::Messenger::Init()
> /home/jenkins-slave/workspace/kudu-3/src/kudu/rpc/messenger.cc:266:5
> #6 0x7f54968b03e9 in
> kudu::rpc::MessengerBuilder::Build(kudu::rpc::Messenger**)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/rpc/messenger.cc:106:3
> #7 0x7f54968b083f in
> kudu::rpc::MessengerBuilder::Build(std::shared_ptr<kudu::rpc::Messenger>*)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/rpc/messenger.cc:113:3
> #8 0x7f54998b380d in kudu::server::ServerBase::Init()
> /home/jenkins-slave/workspace/kudu-3/src/kudu/server/server_base.cc:178:3
> #9 0x7f549ada533a in kudu::tserver::TabletServer::Init()
> /home/jenkins-slave/workspace/kudu-3/src/kudu/tserver/tablet_server.cc:90:3
> #10 0x4f80cf in kudu::tserver::TabletServerMain(int, char**)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/tserver/tablet_server_main.cc:55:3
> #11 0x4f7d34 in main
> /home/jenkins-slave/workspace/kudu-3/src/kudu/tserver/tablet_server_main.cc:72:10
> #12 0x7f548e625ec4 in __libc_start_main
> /build/eglibc-3GlaMS/eglibc-2.19/csu/libc-start.c:287
> Thread T31 (rpc worker-753) created by T0 here:
> #0 0x4301cd in __interceptor_pthread_create
> /home/jenkins-slave/workspace/kudu-3/thirdparty/llvm-3.8.0.src/projects/compiler-rt/lib/asan/asan_interceptors.cc:238
> #1 0x7f54912852bb in kudu::Thread::StartThread(std::string const&,
> std::string const&, boost::function<void ()> const&, unsigned long,
> scoped_refptr<kudu::Thread>*)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/util/thread.cc:509:15
> #2 0x7f54969236e6 in kudu::Status kudu::Thread::Create<void
> (kudu::rpc::ServicePool::*)(), kudu::rpc::ServicePool*>(std::string const&,
> std::string const&, void (kudu::rpc::ServicePool::* const&)(),
> kudu::rpc::ServicePool* const&, scoped_refptr<kudu::Thread>*)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/util/thread.h:156:12
> #3 0x7f5496920ffc in kudu::rpc::ServicePool::Init(int)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/rpc/service_pool.cc:80:5
> #4 0x7f54998ab7e4 in
> kudu::RpcServer::RegisterService(gscoped_ptr<kudu::rpc::ServiceIf,
> kudu::DefaultDeleter<kudu::rpc::ServiceIf> >)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/server/rpc_server.cc:122:3
> #5 0x7f54998b4bc3 in
> kudu::server::ServerBase::RegisterService(gscoped_ptr<kudu::rpc::ServiceIf,
> kudu::DefaultDeleter<kudu::rpc::ServiceIf> >)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/server/server_base.cc:239:10
> #6 0x7f549ada5984 in kudu::tserver::TabletServer::Start()
> /home/jenkins-slave/workspace/kudu-3/src/kudu/tserver/tablet_server.cc:120:3
> #7 0x4f8133 in kudu::tserver::TabletServerMain(int, char**)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/tserver/tablet_server_main.cc:58:3
> #8 0x4f7d34 in main
> /home/jenkins-slave/workspace/kudu-3/src/kudu/tserver/tablet_server_main.cc:72:10
> #9 0x7f548e625ec4 in __libc_start_main
> /build/eglibc-3GlaMS/eglibc-2.19/csu/libc-start.c:287
> Thread T121 (tablet-bootstra) created by T46 (rpc worker-768) here:
> #0 0x4301cd in __interceptor_pthread_create
> /home/jenkins-slave/workspace/kudu-3/thirdparty/llvm-3.8.0.src/projects/compiler-rt/lib/asan/asan_interceptors.cc:238
> #1 0x7f54912852bb in kudu::Thread::StartThread(std::string const&,
> std::string const&, boost::function<void ()> const&, unsigned long,
> scoped_refptr<kudu::Thread>*)
> /home/jenkins-slave/workspace/kudu-3/src/kudu/util/thread.cc:509:15
> {noformat}
--
This message was sent by Atlassian JIRA
(v6.3.4#6332)