Project

General

Profile

Bug #6117

Updated by Loïc Dachary over 10 years ago

"work in progress":https://github.com/dachary/ceph/tree/wip-6117 

 <pre> 
 2013-08-25 12:26:35.911288 7fda96367700 -1 common/Mutex.cc: In function 'void Mutex::Lock(bool)' thread 7fda96367700 time 2013-08-25 12:26:35.905967 
 common/Mutex.cc: 93: FAILED assert(r == 0) 

  ceph version 0.67-352-g8b1b745 (8b1b74598bae0e13691e6244c647fb89cc9e21a7) 
  1: (Mutex::Lock(bool)+0x1c3) [0x8979f3] 
  2: (SharedPtrRegistry<hobject_t, ObjectContext>::OnRemoval::operator()(ObjectContext*)+0x21) [0x770c31] 
  3: (std::tr1::__shared_count<(__gnu_cxx::_Lock_policy)2>::operator=(std::tr1::__shared_count<(__gnu_cxx::_Lock_policy)2> const&)+0x86) [0x633776] 
  4: (ReplicatedPG::context_registry_on_change()+0x23a) [0x70888a] 
  5: (ReplicatedPG::on_change(ObjectStore::Transaction*)+0xec) [0x7236fc] 
  6: (PG::start_peering_interval(std::tr1::shared_ptr<OSDMap const>, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&, ObjectStore::Transaction*)+0x5e3) [0x69abb3] 
  7: (PG::RecoveryState::Reset::react(PG::AdvMap const&)+0x313) [0x69fe23] 
  8: (boost::statechart::detail::reaction_result boost::statechart::simple_state<PG::RecoveryState::Reset, PG::RecoveryState::RecoveryMachine, boost::mpl::list<mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na>, (boost::statechart::history_mode)0>::local_react_impl_non_empty::local_react_impl<boost::mpl::list5<boost::statechart::custom_reaction<PG::AdvMap>, boost::statechart::custom_reaction<PG::ActMap>, boost::statechart::custom_reaction<PG::NullEvt>, boost::statechart::custom_reaction<PG::FlushedEvt>, boost::statechart::transition<boost::statechart::event_base, PG::RecoveryState::Crashed, boost::statechart::detail::no_context<boost::statechart::event_base>, &(boost::statechart::detail::no_context<boost::statechart::event_base>::no_function(boost::statechart::event_base const&))> >, boost::statechart::simple_state<PG::RecoveryState::Reset, PG::RecoveryState::RecoveryMachine, boost::mpl::list<mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na>, (boost::statechart::history_mode)0> >(boost::statechart::simple_state<PG::RecoveryState::Reset, PG::RecoveryState::RecoveryMachine, boost::mpl::list<mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na>, (boost::statechart::history_mode)0>&, boost::statechart::event_base const&, void const*)+0x100) [0x6ea220] 
  9: (boost::statechart::simple_state<PG::RecoveryState::Reset, PG::RecoveryState::RecoveryMachine, boost::mpl::list<mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na>, (boost::statechart::history_mode)0>::react_impl(boost::statechart::event_base const&, void const*)+0x4e) [0x6ea2fe] 
  10: (boost::statechart::state_machine<PG::RecoveryState::RecoveryMachine, PG::RecoveryState::Initial, std::allocator<void>, boost::statechart::null_exception_translator>::process_queued_events()+0xfb) [0x6cd35b] 
  11: (PG::RecoveryState::handle_event(boost::statechart::event_base const&, PG::RecoveryCtx*)+0x57) [0x6cd5d7] 
  12: (PG::handle_advance_map(std::tr1::shared_ptr<OSDMap const>, std::tr1::shared_ptr<OSDMap const>, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&, PG::RecoveryCtx*)+0x464) [0x6b9004] 
  13: (OSD::advance_pg(unsigned int, PG*, ThreadPool::TPHandle&, PG::RecoveryCtx*, std::set<boost::intrusive_ptr<PG>, std::less<boost::intrusive_ptr<PG> >, std::allocator<boost::intrusive_ptr<PG> > >*)+0x206) [0x6139a6] 
  14: (OSD::process_peering_events(std::list<PG*, std::allocator<PG*> > const&, ThreadPool::TPHandle&)+0x23a) [0x61400a] 
  15: (OSD::PeeringWQ::_process(std::list<PG*, std::allocator<PG*> > const&, ThreadPool::TPHandle&)+0x12) [0x6592d2] 
  16: (ThreadPool::worker(ThreadPool::WorkThread*)+0x4e6) [0x8c5156] 
  17: (ThreadPool::WorkThread::entry()+0x10) [0x8c6f60] 
  18: (()+0x7e9a) [0x7fdaa9c24e9a] 
  19: (clone()+0x6d) [0x7fdaa7db7ccd] 
  NOTE: a copy of the executable, or `objdump -rdS <executable>` is needed to interpret this. 

 </pre> 

 <pre> 
 ubuntu@teuthology:/a/teuthology-2013-08-25_09:25:20-krbd-master-testing-basic-plana/4964$ cat orig.config.yaml  
 kernel: 
   kdb: true 
   sha1: c2f29906882bd30794da6993e755a0dab2b7a665 
 machine_type: plana 
 nuke-on-error: true 
 os_type: ubuntu 
 overrides: 
   admin_socket: 
     branch: master 
   ceph: 
     conf: 
       mon: 
         debug mon: 20 
         debug ms: 1 
         debug paxos: 20 
       osd: 
         osd op thread timeout: 60 
     fs: btrfs 
     log-whitelist: 
     - slow request 
     sha1: 8b1b74598bae0e13691e6244c647fb89cc9e21a7 
   ceph-deploy: 
     branch: 
       dev: master 
     conf: 
       client: 
         log file: /var/log/ceph/ceph-$name.$pid.log 
       mon: 
         debug mon: 1 
         debug ms: 20 
         debug paxos: 20 
   install: 
     ceph: 
       sha1: 8b1b74598bae0e13691e6244c647fb89cc9e21a7 
   s3tests: 
     branch: master 
   workunit: 
     sha1: 8b1b74598bae0e13691e6244c647fb89cc9e21a7 
 roles: 
 - - mon.a 
   - mon.c 
   - osd.0 
   - osd.1 
   - osd.2 
 - - mon.b 
   - mds.a 
   - osd.3 
   - osd.4 
   - osd.5 
 - - client.0 
 tasks: 
 - chef: null 
 - clock.check: null 
 - install: null 
 - ceph: 
     log-whitelist: 
     - wrongly marked me down 
     - objects unfound and apparently lost 
 - thrashosds: null 
 - rbd: 
     all: 
       image_size: 20480 
 - workunit: 
     clients: 
       all: 
       - suites/ffsb.sh 
 teuthology_branch: master 

 </pre>

Back