nebula 版本:2.5.1
部署方式:分布式
硬件信息
SSD 400G
CPU 20 核、内存 30G
问题的具体描述
部署了一个 30 台机器的集群,使用过程中发现其中 3 台机器的 storaged 进程崩溃,并在 nebula 目录下生成了 core 文件。执行 gdb bin/nebula-storaged core.389_executor-pri3-2 加载 core 文件后,再执行 bt full,显示的信息如下:
[Thread debugging using libthread_db enabled]
Using host libthread_db library "/lib64/libthread_db.so.1".
Core was generated by `/usr/local/nebula/bin/nebula-storaged --flagfile /usr/local/nebula/etc/nebula-s'.
Program terminated with signal 6, Aborted.
#0 0x00007ff1ffdea1f7 in raise () from /lib64/libc.so.6
Missing separate debuginfos, use: debuginfo-install nebula-graph-2.5.1-1.x86_64
(gdb) bt full
#0 0x00007ff1ffdea1f7 in raise () from /lib64/libc.so.6
No symbol table info available.
#1 0x00007ff1ffdeb8e8 in abort () from /lib64/libc.so.6
No symbol table info available.
#2 0x0000000002081dad in google::LogMessage::Fail() ()
No symbol table info available.
#3 0x0000000002086b8e in google::LogMessage::SendToLog() ()
No symbol table info available.
#4 0x0000000002081a7e in google::LogMessage::Flush() ()
No symbol table info available.
#5 0x00000000020822d9 in google::LogMessageFatal::~LogMessageFatal() ()
No symbol table info available.
#6 0x00000000010d0272 in nebula::RowWriterV2::checkUnsetFields() ()
No symbol table info available.
#7 0x00000000010d082d in nebula::RowWriterV2::finish() ()
No symbol table info available.
#8 0x0000000000ecec42 in nebula::storage::BaseProcessor<nebula::storage::cpp2::ExecResponse>::encodeRowVal(nebula::meta::NebulaSchemaProvider const*, std::vector<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::allocator<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > > const&, std::vector<nebula::Value, std::allocator<nebula::Value> > const&, nebula::WriteResult&) [clone .constprop.0] ()
No symbol table info available.
#9 0x0000000000ecf728 in nebula::storage::AddVerticesProcessor::doProcess(nebula::storage::cpp2::AddVerticesRequest const&) ()
No symbol table info available.
#10 0x0000000000ed4bbb in nebula::storage::AddVerticesProcessor::process(nebula::storage::cpp2::AddVerticesRequest const&) ()
No symbol table info available.
#11 0x0000000000ec0741 in nebula::storage::GraphStorageServiceHandler::future_addVertices(nebula::storage::cpp2::AddVerticesRequest const&) ()
No symbol table info available.
#12 0x00000000013711e3 in nebula::storage::cpp2::GraphStorageServiceSvIf::async_tm_addVertices(std::unique_ptr<apache::thrift::HandlerCallback<nebula::storage::cpp2::ExecResponse>, std::default_delete<apache::thrift::HandlerCallback<nebula::storage::cpp2::ExecResponse> > >, nebula::storage::cpp2::AddVerticesRequest const&) ()
No symbol table info available.
#13 0x0000000001385bfa in void nebula::storage::cpp2::GraphStorageServiceAsyncProcessor::process_addVertices<apache::thrift::CompactProtocolReader, apache::thrift::CompactProtocolWriter>(std::unique_ptr<apache::thrift::ResponseChannelRequest, apache::thrift::RequestsRegistry::Deleter>, apache::thrift::SerializedRequest&&, apache::thrift::Cpp2RequestContext*, folly::EventBase*, apache::thrift::concurrency::ThreadManager*) ()
No symbol table info available.
#14 0x000000000138ba39 in void folly::detail::function::FunctionTraits<void (std::unique_ptr<apache::thrift::ResponseChannelRequest, apache::thrift::RequestsRegistry::Deleter>)>::callBig<std::shared_ptr<apache::thrift::EventTask> apache::thrift::GeneratedAsyncProcessor::makeEventTaskForRequest<nebula::storage::cpp2::GraphStorageServiceAsyncProcessor>(std::unique_ptr<apache::thrift::ResponseChannelRequest, apache::thrift::RequestsRegistry::Deleter>, apache::thrift::SerializedRequest&&, apache::thrift::Cpp2RequestContext*, folly::EventBase*, apache::thrift::concurrency::ThreadManager*, apache::thrift::RpcKind, void (nebula::storage::cpp2::GraphStorageServiceAsyncProcessor::*)(std::unique_ptr<apache::thrift::ResponseChannelRequest, apache::thrift::RequestsRegistry::Deleter>, apache::thrift::SerializedRequest&&, apache::thrift::Cpp2RequestContext*, folly::EventBase*, apache::thrift::concurrency::ThreadManager*), nebula::storage::cpp2::GraphStorageServiceAsyncProcessor*, apache::thrift::Tile*)::{lambda(std::unique_ptr<apache::thrift::ResponseChannelRequest, apache::thrift::RequestsRegistry::Deleter>)#1}>(std::unique_ptr<apache::thrift::ResponseChannelRequest, apache::thrift::RequestsRegistry::Deleter>&&, folly::detail::function::Data&) ()
No symbol table info available.
#15 0x0000000001c330e2 in apache::thrift::EventTask::run() ()
No symbol table info available.
#16 0x0000000001c38627 in virtual thunk to apache::thrift::concurrency::FunctionRunner::run() ()
No symbol table info available.
#17 0x0000000001d6a3f3 in apache::thrift::concurrency::ThreadManager::Impl::Worker::run() ()
No symbol table info available.
#18 0x0000000001d6e04d in apache::thrift::concurrency::PthreadThread::threadMain(void*) ()
No symbol table info available.
#19 0x00007ff200180e25 in start_thread () from /lib64/libpthread.so.0
No symbol table info available.
#20 0x00007ff1ffead35d in clone () from /lib64/libc.so.6
No symbol table info available.