Project

General

Profile

Actions

Bug #56350

open

crash: void OSDMap::check_health(ceph::common::CephContext*, health_check_map_t*) const: assert(num_down_in_osds <= num_in_osds)

Added by Telemetry Bot almost 2 years ago. Updated over 1 year ago.

Status:
New
Priority:
Normal
Assignee:
-
Category:
-
Target version:
-
% Done:

0%

Source:
Telemetry
Tags:
Backport:
Regression:
No
Severity:
3 - minor
Reviewed:
Affected Versions:
ceph-qa-suite:
Component(RADOS):
Pull request ID:
Crash signature (v1):

ebc465267883da2e1b8d48a3c95f936715b299aded56e6a4709eaf33aea43996


Description

http://telemetry.front.sepia.ceph.com:4000/d/jByk5HaMz/crash-spec-x-ray?orgId=1&var-sig_v2=279837e667d5bd5af7117e58d352a99560d2bb4be2cd339361fc05d3ea369d98

Assert condition: num_down_in_osds <= num_in_osds
Assert function: void OSDMap::check_health(ceph::common::CephContext*, health_check_map_t*) const

Sanitized backtrace:

    OSDMap::check_health(ceph::common::CephContext*, health_check_map_t*) const
    OSDMonitor::encode_pending(std::shared_ptr<MonitorDBStore::Transaction>)
    PaxosService::propose_pending()
    MDSMonitor::prepare_beacon(boost::intrusive_ptr<MonOpRequest>)
    MDSMonitor::prepare_update(boost::intrusive_ptr<MonOpRequest>)
    PaxosService::dispatch(boost::intrusive_ptr<MonOpRequest>)
    PaxosService::C_RetryMessage::_finish(int)
    C_MonOp::finish(int)
    Context::complete(int)
    void finish_contexts<std::list<Context*, std::allocator<Context*> > >(ceph::common::CephContext*, std::list<Context*, std::allocator<Context*> >&, int)
    Paxos::finish_round()
    Paxos::handle_last(boost::intrusive_ptr<MonOpRequest>)
    Paxos::dispatch(boost::intrusive_ptr<MonOpRequest>)
    Monitor::dispatch_op(boost::intrusive_ptr<MonOpRequest>)
    Monitor::_ms_dispatch(Message*)
    Dispatcher::ms_dispatch2(boost::intrusive_ptr<Message> const&)
    DispatchQueue::entry()
    DispatchQueue::DispatchThread::entry()

Crash dump sample:
{
    "archived": "2022-06-05 23:20:30.222550",
    "assert_condition": "num_down_in_osds <= num_in_osds",
    "assert_file": "osd/OSDMap.cc",
    "assert_func": "void OSDMap::check_health(ceph::common::CephContext*, health_check_map_t*) const",
    "assert_line": 5896,
    "assert_msg": "osd/OSDMap.cc: In function 'void OSDMap::check_health(ceph::common::CephContext*, health_check_map_t*) const' thread 7f5455624700 time 2022-06-05T18:57:29.596923+0000\nosd/OSDMap.cc: 5896: FAILED ceph_assert(num_down_in_osds <= num_in_osds)",
    "assert_thread_name": "ms_dispatch",
    "backtrace": [
        "/lib64/libpthread.so.0(+0x12ce0) [0x7f545fa80ce0]",
        "gsignal()",
        "abort()",
        "(ceph::__ceph_assert_fail(char const*, char const*, int, char const*)+0x1b0) [0x7f5461aed082]",
        "/usr/lib64/ceph/libceph-common.so.2(+0x283245) [0x7f5461aed245]",
        "(OSDMap::check_health(ceph::common::CephContext*, health_check_map_t*) const+0x405d) [0x7f5461fad29d]",
        "(OSDMonitor::encode_pending(std::shared_ptr<MonitorDBStore::Transaction>)+0x3e2b) [0x55827f8de72b]",
        "(PaxosService::propose_pending()+0x21a) [0x55827f857faa]",
        "(MDSMonitor::prepare_beacon(boost::intrusive_ptr<MonOpRequest>)+0xd48) [0x55827f924ec8]",
        "(MDSMonitor::prepare_update(boost::intrusive_ptr<MonOpRequest>)+0x198) [0x55827f92a808]",
        "(PaxosService::dispatch(boost::intrusive_ptr<MonOpRequest>)+0xa7d) [0x55827f858e6d]",
        "(PaxosService::C_RetryMessage::_finish(int)+0x64) [0x55827f7a7ef4]",
        "(C_MonOp::finish(int)+0x49) [0x55827f72a5c9]",
        "(Context::complete(int)+0xd) [0x55827f72721d]",
        "(void finish_contexts<std::__cxx11::list<Context*, std::allocator<Context*> > >(ceph::common::CephContext*, std::__cxx11::list<Context*, std::allocator<Context*> >&, int)+0xa5) [0x55827f754f95]",
        "(Paxos::finish_round()+0x27b) [0x55827f85079b]",
        "(Paxos::handle_last(boost::intrusive_ptr<MonOpRequest>)+0xc6b) [0x55827f85189b]",
        "(Paxos::dispatch(boost::intrusive_ptr<MonOpRequest>)+0x427) [0x55827f852687]",
        "(Monitor::dispatch_op(boost::intrusive_ptr<MonOpRequest>)+0x176d) [0x55827f7250ed]",
        "(Monitor::_ms_dispatch(Message*)+0x457) [0x55827f725737]",
        "(Dispatcher::ms_dispatch2(boost::intrusive_ptr<Message> const&)+0x5c) [0x55827f755c5c]",
        "(DispatchQueue::entry()+0x14fa) [0x7f5461d733aa]",
        "(DispatchQueue::DispatchThread::entry()+0x11) [0x7f5461e29bd1]",
        "/lib64/libpthread.so.0(+0x81cf) [0x7f545fa761cf]",
        "clone()"
    ],
    "ceph_version": "17.2.0",
    "crash_id": "2022-06-05T18:57:29.604871Z_46521724-b272-4ae1-b74f-37b9b8cdb017",
    "entity_name": "mon.676ff60aa64518d09da9bc045a405d9067b9815e",
    "os_id": "centos",
    "os_name": "CentOS Stream",
    "os_version": "8",
    "os_version_id": "8",
    "process_name": "ceph-mon",
    "stack_sig": "ebc465267883da2e1b8d48a3c95f936715b299aded56e6a4709eaf33aea43996",
    "timestamp": "2022-06-05T18:57:29.604871Z",
    "utsname_machine": "x86_64",
    "utsname_release": "5.16.0-0.bpo.4-amd64",
    "utsname_sysname": "Linux",
    "utsname_version": "#1 SMP PREEMPT Debian 5.16.12-1~bpo11+1 (2022-03-08)"
}

Actions #1

Updated by Telemetry Bot almost 2 years ago

  • Crash signature (v1) updated (diff)
  • Crash signature (v2) updated (diff)
  • Affected Versions v17.2.0 added
Actions

Also available in: Atom PDF