Project

General

Profile

Actions

Bug #54831

open

crash: void OSDMap::check_health(ceph::common::CephContext*, health_check_map_t*) const: assert(num_down_in_osds <= num_in_osds)

Added by Telemetry Bot about 2 years ago. Updated about 2 years ago.

Status:
New
Priority:
Normal
Assignee:
-
Category:
-
Target version:
-
% Done:

0%

Source:
Telemetry
Tags:
Backport:
Regression:
No
Severity:
3 - minor
Reviewed:
Affected Versions:
ceph-qa-suite:
Component(RADOS):
Pull request ID:
Crash signature (v1):

d0fe3d13c395a64264b349382b992d7c2dd48ba5d6de278fb80e9f65a78cb304


Description

http://telemetry.front.sepia.ceph.com:4000/d/jByk5HaMz/crash-spec-x-ray?orgId=1&var-sig_v2=80078d4d0d62906a1043c2354ca62bc7a627a73edaff3dcad2468220e8fa17bd

Assert condition: num_down_in_osds <= num_in_osds
Assert function: void OSDMap::check_health(ceph::common::CephContext*, health_check_map_t*) const

Sanitized backtrace:

    OSDMap::check_health(ceph::common::CephContext*, health_check_map_t*) const
    OSDMonitor::encode_pending(std::shared_ptr<MonitorDBStore::Transaction>)
    PaxosService::propose_pending()
    MgrMonitor::drop_active()
    MgrMonitor::prepare_beacon(boost::intrusive_ptr<MonOpRequest>)
    MgrMonitor::prepare_update(boost::intrusive_ptr<MonOpRequest>)
    PaxosService::dispatch(boost::intrusive_ptr<MonOpRequest>)
    PaxosService::C_RetryMessage::_finish(int)
    C_MonOp::finish(int)
    Context::complete(int)
    void finish_contexts<std::list<Context*, std::allocator<Context*> > >(ceph::common::CephContext*, std::list<Context*, std::allocator<Context*> >&, int)
    Paxos::finish_round()
    Paxos::commit_finish()
    C_Committed::finish(int)
    Context::complete(int)
    MonitorDBStore::C_DoTransaction::finish(int)
    Context::complete(int)
    Finisher::finisher_thread_entry()

Crash dump sample:
{
    "assert_condition": "num_down_in_osds <= num_in_osds",
    "assert_file": "osd/OSDMap.cc",
    "assert_func": "void OSDMap::check_health(ceph::common::CephContext*, health_check_map_t*) const",
    "assert_line": 5704,
    "assert_msg": "osd/OSDMap.cc: In function 'void OSDMap::check_health(ceph::common::CephContext*, health_check_map_t*) const' thread 7f609a67f700 time 2022-02-09T13:15:04.233043+0000\nosd/OSDMap.cc: 5704: FAILED ceph_assert(num_down_in_osds <= num_in_osds)",
    "assert_thread_name": "fn_monstore",
    "backtrace": [
        "/lib64/libpthread.so.0(+0x12c20) [0x7f60a74ffc20]",
        "gsignal()",
        "abort()",
        "(ceph::__ceph_assert_fail(char const*, char const*, int, char const*)+0x1a9) [0x7f60a97c3ba3]",
        "/usr/lib64/ceph/libceph-common.so.2(+0x276d6c) [0x7f60a97c3d6c]",
        "(OSDMap::check_health(ceph::common::CephContext*, health_check_map_t*) const+0x3e5e) [0x7f60a9c0c29e]",
        "(OSDMonitor::encode_pending(std::shared_ptr<MonitorDBStore::Transaction>)+0x3c38) [0x55decd77a218]",
        "(PaxosService::propose_pending()+0x21a) [0x55decd6eb9ea]",
        "(MgrMonitor::drop_active()+0x30c) [0x55decd7e619c]",
        "(MgrMonitor::prepare_beacon(boost::intrusive_ptr<MonOpRequest>)+0x1d4f) [0x55decd7e826f]",
        "(MgrMonitor::prepare_update(boost::intrusive_ptr<MonOpRequest>)+0x5b) [0x55decd7ec79b]",
        "(PaxosService::dispatch(boost::intrusive_ptr<MonOpRequest>)+0xa6d) [0x55decd6ec89d]",
        "(PaxosService::C_RetryMessage::_finish(int)+0x64) [0x55decd63f534]",
        "(C_MonOp::finish(int)+0x49) [0x55decd5dc8b9]",
        "(Context::complete(int)+0xd) [0x55decd5d9dbd]",
        "(void finish_contexts<std::__cxx11::list<Context*, std::allocator<Context*> > >(ceph::common::CephContext*, std::__cxx11::list<Context*, std::allocator<Context*> >&, int)+0xa5) [0x55decd606285]",
        "(Paxos::finish_round()+0x27b) [0x55decd6e41bb]",
        "(Paxos::commit_finish()+0x8c0) [0x55decd6e6bd0]",
        "(C_Committed::finish(int)+0x45) [0x55decd6ea7f5]",
        "(Context::complete(int)+0xd) [0x55decd5d9dbd]",
        "(MonitorDBStore::C_DoTransaction::finish(int)+0x98) [0x55decd6ea518]",
        "(Context::complete(int)+0xd) [0x55decd5d9dbd]",
        "(Finisher::finisher_thread_entry()+0x1a5) [0x7f60a9864155]",
        "/lib64/libpthread.so.0(+0x817f) [0x7f60a74f517f]",
        "clone()" 
    ],
    "ceph_version": "16.2.7",
    "crash_id": "2022-02-09T13:15:04.240309Z_7a9f6c27-2785-4c58-8972-a14eae262b3b",
    "entity_name": "mon.2cc27d319f666a8deac1826e7fa159f65e898539",
    "os_id": "centos",
    "os_name": "CentOS Stream",
    "os_version": "8",
    "os_version_id": "8",
    "process_name": "ceph-mon",
    "stack_sig": "d0fe3d13c395a64264b349382b992d7c2dd48ba5d6de278fb80e9f65a78cb304",
    "timestamp": "2022-02-09T13:15:04.240309Z",
    "utsname_machine": "x86_64",
    "utsname_release": "5.4.0-99-generic",
    "utsname_sysname": "Linux",
    "utsname_version": "#112-Ubuntu SMP Thu Feb 3 13:50:55 UTC 2022" 
}

Actions #1

Updated by Telemetry Bot about 2 years ago

  • Crash signature (v1) updated (diff)
  • Crash signature (v2) updated (diff)
  • Affected Versions v16.2.7 added
Actions

Also available in: Atom PDF