Project

General

Profile

Actions

Bug #56189

open

crash: pthread_cond_wait()

Added by Telemetry Bot almost 2 years ago. Updated 12 months ago.

Status:
New
Priority:
Normal
Assignee:
-
Target version:
-
% Done:

0%

Source:
Telemetry
Tags:
Backport:
Regression:
No
Severity:
3 - minor
Reviewed:
ceph-qa-suite:
Pull request ID:
Crash signature (v1):

555225c50b2dabfb6dfb7c2c8af24a75aec798ade59a1eb9d19d7bb0ed4e4917
b7e0632d25596edc39d27926f525c0f5108938c26b627da2f6673c8094997e09


Description

http://telemetry.front.sepia.ceph.com:4000/d/jByk5HaMz/crash-spec-x-ray?orgId=1&var-sig_v2=a1b56d10ffb10d94d3cc6f59107ebd4be47d2c2a51a228f0ba48b26b60d0e6a5

Sanitized backtrace:

    pthread_cond_wait()
    std::condition_variable::wait(std::unique_lock<std::mutex>&)
    IOContext::aio_wait()
    BlueStore::_do_readv(BlueStore::Collection*, boost::intrusive_ptr<BlueStore::Onode>, interval_set<unsigned long, std::map> const&, ceph::buffer::list&, unsigned int, unsigned long)
    BlueStore::readv(boost::intrusive_ptr<ObjectStore::CollectionImpl>&, ghobject_t const&, interval_set<unsigned long, std::map>&, ceph::buffer::list&, unsigned int)
    ReplicatedBackend::build_push_op(ObjectRecoveryInfo const&, ObjectRecoveryProgress const&, ObjectRecoveryProgress*, PushOp*, object_stat_sum_t*, bool)
    ReplicatedBackend::prep_push(std::shared_ptr<ObjectContext>, hobject_t const&, pg_shard_t, eversion_t, interval_set<unsigned long, std::map>&, std::map<hobject_t, interval_set<unsigned long, std::map>, std::less<hobject_t>, std::allocator<std::pair<hobject_t const, interval_set<unsigned long, std::map> > > >&, PushOp*, bool, ObcLockManager&&)
    ReplicatedBackend::prep_push_to_replica(std::shared_ptr<ObjectContext>, hobject_t const&, pg_shard_t, PushOp*, bool)
    ReplicatedBackend::start_pushes(hobject_t const&, std::shared_ptr<ObjectContext>, ReplicatedBackend::RPGHandle*)
    ReplicatedBackend::recover_object(hobject_t const&, eversion_t, std::shared_ptr<ObjectContext>, std::shared_ptr<ObjectContext>, PGBackend::RecoveryHandle*)
    PrimaryLogPG::prep_backfill_object_push(hobject_t, eversion_t, std::shared_ptr<ObjectContext>, std::vector<pg_shard_t, std::allocator<pg_shard_t> >, PGBackend::RecoveryHandle*)
    PrimaryLogPG::recover_backfill(unsigned long, ThreadPool::TPHandle&, bool*)
    PrimaryLogPG::start_recovery_ops(unsigned long, ThreadPool::TPHandle&, unsigned long*)
    OSD::do_recovery(PG*, unsigned int, unsigned long, ThreadPool::TPHandle&)
    ceph::osd::scheduler::PGRecovery::run(OSD*, OSDShard*, boost::intrusive_ptr<PG>&, ThreadPool::TPHandle&)
    OSD::ShardedOpWQ::_process(unsigned int, ceph::heartbeat_handle_d*)
    ShardedThreadPool::shardedthreadpool_worker(unsigned int)
    ShardedThreadPool::WorkThreadSharded::entry()

Crash dump sample:
{
    "backtrace": [
        "/lib64/libpthread.so.0(+0x12ce0) [0x7f825e5dace0]",
        "pthread_cond_wait()",
        "(std::condition_variable::wait(std::unique_lock<std::mutex>&)+0x10) [0x7f825dc1d8f0]",
        "(IOContext::aio_wait()+0x499) [0x563bf3215f19]",
        "(BlueStore::_do_readv(BlueStore::Collection*, boost::intrusive_ptr<BlueStore::Onode>, interval_set<unsigned long, std::map> const&, ceph::buffer::v15_2_0::list&, unsigned int, unsigned long)+0x8d1) [0x563bf2c65b91]",
        "(BlueStore::readv(boost::intrusive_ptr<ObjectStore::CollectionImpl>&, ghobject_t const&, interval_set<unsigned long, std::map>&, ceph::buffer::v15_2_0::list&, unsigned int)+0x49e) [0x563bf2c66efe]",
        "(ReplicatedBackend::build_push_op(ObjectRecoveryInfo const&, ObjectRecoveryProgress const&, ObjectRecoveryProgress*, PushOp*, object_stat_sum_t*, bool)+0x3c7) [0x563bf2ab0d47]",
        "(ReplicatedBackend::prep_push(std::shared_ptr<ObjectContext>, hobject_t const&, pg_shard_t, eversion_t, interval_set<unsigned long, std::map>&, std::map<hobject_t, interval_set<unsigned long, std::map>, std::less<hobject_t>, std::allocator<std::pair<hobject_t const, interval_set<unsigned long, std::map> > > >&, PushOp*, bool, ObcLockManager&&)+0x582) [0x563bf2ab2e22]",
        "(ReplicatedBackend::prep_push_to_replica(std::shared_ptr<ObjectContext>, hobject_t const&, pg_shard_t, PushOp*, bool)+0x3eb) [0x563bf2ab38bb]",
        "(ReplicatedBackend::start_pushes(hobject_t const&, std::shared_ptr<ObjectContext>, ReplicatedBackend::RPGHandle*)+0x1d7) [0x563bf2ab5037]",
        "(ReplicatedBackend::recover_object(hobject_t const&, eversion_t, std::shared_ptr<ObjectContext>, std::shared_ptr<ObjectContext>, PGBackend::RecoveryHandle*)+0x13e) [0x563bf2ab55be]",
        "(PrimaryLogPG::prep_backfill_object_push(hobject_t, eversion_t, std::shared_ptr<ObjectContext>, std::vector<pg_shard_t, std::allocator<pg_shard_t> >, PGBackend::RecoveryHandle*)+0x30b) [0x563bf281cbbb]",
        "(PrimaryLogPG::recover_backfill(unsigned long, ThreadPool::TPHandle&, bool*)+0x3035) [0x563bf2865c95]",
        "(PrimaryLogPG::start_recovery_ops(unsigned long, ThreadPool::TPHandle&, unsigned long*)+0x10e3) [0x563bf2868e73]",
        "(OSD::do_recovery(PG*, unsigned int, unsigned long, ThreadPool::TPHandle&)+0x2f5) [0x563bf26e2015]",
        "(ceph::osd::scheduler::PGRecovery::run(OSD*, OSDShard*, boost::intrusive_ptr<PG>&, ThreadPool::TPHandle&)+0x1d) [0x563bf29a5e0d]",
        "(OSD::ShardedOpWQ::_process(unsigned int, ceph::heartbeat_handle_d*)+0xaf8) [0x563bf27010d8]",
        "(ShardedThreadPool::shardedthreadpool_worker(unsigned int)+0x5c4) [0x563bf2e069c4]",
        "(ShardedThreadPool::WorkThreadSharded::entry()+0x14) [0x563bf2e07d64]",
        "/lib64/libpthread.so.0(+0x81cf) [0x7f825e5d01cf]",
        "clone()" 
    ],
    "ceph_version": "17.2.0",
    "crash_id": "2022-06-22T13:05:28.665716Z_47c18d2d-bc67-4a4b-8358-8106f6061663",
    "entity_name": "osd.54b8974301b2d12585113c153c571b08c14486b8",
    "os_id": "centos",
    "os_name": "CentOS Stream",
    "os_version": "8",
    "os_version_id": "8",
    "process_name": "ceph-osd",
    "stack_sig": "b7e0632d25596edc39d27926f525c0f5108938c26b627da2f6673c8094997e09",
    "timestamp": "2022-06-22T13:05:28.665716Z",
    "utsname_machine": "x86_64",
    "utsname_release": "5.13.19-6-pve",
    "utsname_sysname": "Linux",
    "utsname_version": "#1 SMP PVE 5.13.19-15 (Tue, 29 Mar 2022 15:59:50 +0200)" 
}

Actions #1

Updated by Telemetry Bot almost 2 years ago

  • Crash signature (v1) updated (diff)
  • Crash signature (v2) updated (diff)
  • Affected Versions v16.2.4, v16.2.5, v16.2.6, v16.2.7, v16.2.9, v17.2.0 added
Actions #2

Updated by Telemetry Bot 12 months ago

  • Affected Versions v16.2.10, v16.2.11, v17.2.3, v17.2.5 added
Actions

Also available in: Atom | PDF