Project

General

Profile

Bug #56289

crash: void PeeringState::check_past_interval_bounds() const: abort

Added by Telemetry Bot 7 months ago. Updated 4 months ago.

Status:
Duplicate
Priority:
Normal
Assignee:
-
Category:
-
Target version:
-
% Done:

0%

Source:
Telemetry
Tags:
Backport:
Regression:
No
Severity:
3 - minor
Reviewed:
Affected Versions:
ceph-qa-suite:
Component(RADOS):
Pull request ID:
Crash signature (v1):

3eef3d242ab35e36048b4e9895b78e792108209c81b1cca1a8e39b3fedce3ed2
945ef76c4a0a5ace0e41631a7ba4d0bc98c5be52bc918587b8030fbef1103533


Description

http://telemetry.front.sepia.ceph.com:4000/d/jByk5HaMz/crash-spec-x-ray?orgId=1&var-sig_v2=657abbfaddca21e4f153180f250c6cfa9ab54d79998695c48528e2ca436305e2

Assert condition: abort
Assert function: void PeeringState::check_past_interval_bounds() const

Sanitized backtrace:

    PeeringState::check_past_interval_bounds() const
    PeeringState::Reset::react(PeeringState::AdvMap const&)
    boost::statechart::simple_state<PeeringState::Reset, PeeringState::PeeringMachine, boost::mpl::list<mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na>, (boost::statechart::history_mode)>::react_impl(boost::statechart::event_base const&, void const*)
    boost::statechart::state_machine<PeeringState::PeeringMachine, PeeringState::Initial, std::allocator<boost::statechart::none>, boost::statechart::null_exception_translator>::send_event(boost::statechart::event_base const&)
    PeeringState::advance_map(std::shared_ptr<OSDMap const>, std::shared_ptr<OSDMap const>, std::vector<int, std::allocator<int> >&, int, std::vector<int, std::allocator<int> >&, int, PeeringCtx&)
    PG::handle_advance_map(std::shared_ptr<OSDMap const>, std::shared_ptr<OSDMap const>, std::vector<int, std::allocator<int> >&, int, std::vector<int, std::allocator<int> >&, int, PeeringCtx&)
    OSD::advance_pg(unsigned int, PG*, ThreadPool::TPHandle&, PeeringCtx&)
    OSD::dequeue_peering_evt(OSDShard*, PG*, std::shared_ptr<PGPeeringEvent>, ThreadPool::TPHandle&)
    ceph::osd::scheduler::PGPeeringItem::run(OSD*, OSDShard*, boost::intrusive_ptr<PG>&, ThreadPool::TPHandle&)
    OSD::ShardedOpWQ::_process(unsigned int, ceph::heartbeat_handle_d*)
    ShardedThreadPool::shardedthreadpool_worker(unsigned int)
    ShardedThreadPool::WorkThreadSharded::entry()

Crash dump sample:
{
    "assert_condition": "abort",
    "assert_file": "osd/PeeringState.cc",
    "assert_func": "void PeeringState::check_past_interval_bounds() const",
    "assert_line": 968,
    "assert_msg": "osd/PeeringState.cc: In function 'void PeeringState::check_past_interval_bounds() const' thread 7f6fe4832700 time 2022-05-06T23:17:17.742464+0000\nosd/PeeringState.cc: 968: ceph_abort_msg(\"past_interval start interval mismatch\")",
    "assert_thread_name": "tp_osd_tp",
    "backtrace": [
        "/lib64/libpthread.so.0(+0x12ce0) [0x7f70078d5ce0]",
        "gsignal()",
        "abort()",
        "(ceph::__ceph_abort(char const*, int, char const*, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const&)+0x1b8) [0x55f42e69bc6c]",
        "(PeeringState::check_past_interval_bounds() const+0x6d5) [0x55f42ea917c5]",
        "(PeeringState::Reset::react(PeeringState::AdvMap const&)+0x3ec) [0x55f42eaaacdc]",
        "(boost::statechart::simple_state<PeeringState::Reset, PeeringState::PeeringMachine, boost::mpl::list<mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na>, (boost::statechart::history_mode)0>::react_impl(boost::statechart::event_base const&, void const*)+0x1f8) [0x55f42eaecef8]",
        "(boost::statechart::state_machine<PeeringState::PeeringMachine, PeeringState::Initial, std::allocator<boost::statechart::none>, boost::statechart::null_exception_translator>::send_event(boost::statechart::event_base const&)+0x53) [0x55f42e949793]",
        "(PeeringState::advance_map(std::shared_ptr<OSDMap const>, std::shared_ptr<OSDMap const>, std::vector<int, std::allocator<int> >&, int, std::vector<int, std::allocator<int> >&, int, PeeringCtx&)+0x1b8) [0x55f42ea8ce68]",
        "(PG::handle_advance_map(std::shared_ptr<OSDMap const>, std::shared_ptr<OSDMap const>, std::vector<int, std::allocator<int> >&, int, std::vector<int, std::allocator<int> >&, int, PeeringCtx&)+0x1e6) [0x55f42e85eda6]",
        "(OSD::advance_pg(unsigned int, PG*, ThreadPool::TPHandle&, PeeringCtx&)+0x322) [0x55f42e7d13f2]",
        "(OSD::dequeue_peering_evt(OSDShard*, PG*, std::shared_ptr<PGPeeringEvent>, ThreadPool::TPHandle&)+0xd4) [0x55f42e7d3314]",
        "(ceph::osd::scheduler::PGPeeringItem::run(OSD*, OSDShard*, boost::intrusive_ptr<PG>&, ThreadPool::TPHandle&)+0x56) [0x55f42ea6a526]",
        "(OSD::ShardedOpWQ::_process(unsigned int, ceph::heartbeat_handle_d*)+0xaf8) [0x55f42e7c50d8]",
        "(ShardedThreadPool::shardedthreadpool_worker(unsigned int)+0x5c4) [0x55f42eeca9c4]",
        "(ShardedThreadPool::WorkThreadSharded::entry()+0x14) [0x55f42eecbd64]",
        "/lib64/libpthread.so.0(+0x81cf) [0x7f70078cb1cf]",
        "clone()" 
    ],
    "ceph_version": "17.2.0",
    "crash_id": "2022-05-06T23:17:17.760315Z_57b03271-eca8-4c18-962b-b78b49044812",
    "entity_name": "osd.99e3561dd9289b126efbec392067ffab500dfc47",
    "os_id": "centos",
    "os_name": "CentOS Stream",
    "os_version": "8",
    "os_version_id": "8",
    "process_name": "ceph-osd",
    "stack_sig": "945ef76c4a0a5ace0e41631a7ba4d0bc98c5be52bc918587b8030fbef1103533",
    "timestamp": "2022-05-06T23:17:17.760315Z",
    "utsname_machine": "x86_64",
    "utsname_release": "5.4.0-109-generic",
    "utsname_sysname": "Linux",
    "utsname_version": "#123-Ubuntu SMP Fri Apr 8 09:10:54 UTC 2022" 
}


Related issues

Duplicates RADOS - Bug #49689: osd/PeeringState.cc: ceph_abort_msg("past_interval start interval mismatch") start (status: Fix Under Review)

History

#1 Updated by Telemetry Bot 7 months ago

  • Crash signature (v1) updated (diff)
  • Crash signature (v2) updated (diff)
  • Affected Versions v17.1.0, v17.2.0 added

#2 Updated by Matan Breizman 4 months ago

  • Status changed from New to Duplicate
  • Crash signature (v1) updated (diff)

#3 Updated by Matan Breizman 4 months ago

  • Duplicates Bug #49689: osd/PeeringState.cc: ceph_abort_msg("past_interval start interval mismatch") start added

Also available in: Atom, PDF