Hi Sage,
> I dropped the wip branch. I just repushed the patches (on top of
> bobtail) for you.
Thanks for the new build!
I have finished testing it on one OSD - sadly the OSD crashed again, but
now with a new stack trace:
0> 2013-01-19 18:48:44.636938 7fb5597f2700 -1 ./osd/OSDMap.h: In
function 'const epoch_t& OSDMap::get_up_thru(int) const' thread
7fb5597f2700 time 2013-01-19 18:48:44.499494
./osd/OSDMap.h: 367: FAILED assert(exists(osd))
ceph version 0.56.1-25-g25a6b1b (25a6b1b325db2a2b45963f83623c447ec577c5ef)
1: /usr/bin/ceph-osd() [0x60db42]
2: /usr/bin/ceph-osd() [0x6e3b35]
3: (pg_interval_t::check_new_interval(std::vector<int,
std::allocator<int> > const&, std::vector<int, std::allocator<int> >
const&, std::vector<int, std::allocator<int> > const&, std::vector<int,
std::allocator<int> > const&, unsigned int, unsigned int,
std::tr1::shared_ptr<OSDMap const>, std::tr1::shared_ptr<OSDMap const>,
long, pg_t, std::map<unsigned int, pg_interval_t, std::less<unsigned
int>, std::allocator<std::pair<unsigned int const, pg_interval_t> > >*,
std::ostream*)+0x250) [0x935590]
4: (PG::start_peering_interval(std::tr1::shared_ptr<OSDMap const>,
std::vector<int, std::allocator<int> > const&, std::vector<int,
std::allocator<int> > const&)+0x353) [0x7563c3]
5: (PG::RecoveryState::Reset::react(PG::AdvMap const&)+0x21e) [0x75887e]
6: (boost::statechart::detail::reaction_result
boost::statechart::simple_state<PG::RecoveryState::Reset,
PG::RecoveryState::RecoveryMachine, boost::mpl::list<mpl_::na, mpl_::na,
mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na,
mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na,
mpl_::na, mpl_::na, mpl_::na, mpl_::na>,
(boost::statechart::history_mode)0>::local_react_impl_non_empty::local_react_impl<boost::mpl::list5<boost::statechart::custom_reaction<PG::AdvMap>,
boost::statechart::custom_reaction<PG::ActMap>,
boost::statechart::custom_reaction<PG::NullEvt>,
boost::statechart::custom_reaction<PG::FlushedEvt>,
boost::statechart::transition<boost::statechart::event_base,
PG::RecoveryState::Crashed,
boost::statechart::detail::no_context<boost::statechart::event_base>,
&boost::statechart::detail::no_context<boost::statechart::event_base>::no_function>
>, boost::statechart::simple_state<PG::RecoveryState::Reset,
PG::RecoveryState::RecoveryMachine, boost::mpl::list<mpl_::na, mpl_::na,
mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na,
mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na,
mpl_::na, mpl_::na, mpl_::na, mpl_::na>,
(boost::statechart::history_mode)0>
>(boost::statechart::simple_state<PG::RecoveryState::Reset,
PG::RecoveryState::RecoveryMachine, boost::mpl::list<mpl_::na, mpl_::na,
mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na,
mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na,
mpl_::na, mpl_::na, mpl_::na, mpl_::na>,
(boost::statechart::history_mode)0>&, boost::statechart::event_base
const&, void const*)+0x86) [0x78abb6]
7: (boost::statechart::detail::reaction_result
boost::statechart::simple_state<PG::RecoveryState::Reset,
PG::RecoveryState::RecoveryMachine, boost::mpl::list<mpl_::na, mpl_::na,
mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na,
mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na,
mpl_::na, mpl_::na, mpl_::na, mpl_::na>,
(boost::statechart::history_mode)0>::local_react_impl_non_empty::local_react_impl<boost::mpl::list<boost::statechart::custom_reaction<PG::QueryState>,
boost::statechart::custom_reaction<PG::AdvMap>,
boost::statechart::custom_reaction<PG::ActMap>,
boost::statechart::custom_reaction<PG::NullEvt>,
boost::statechart::custom_reaction<PG::FlushedEvt>,
boost::statechart::transition<boost::statechart::event_base,
PG::RecoveryState::Crashed,
boost::statechart::detail::no_context<boost::statechart::event_base>,
&boost::statechart::detail::no_context<boost::statechart::event_base>::no_function>,
mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na,
mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na>,
boost::statechart::simple_state<PG::RecoveryState::Reset,
PG::RecoveryState::RecoveryMachine, boost::mpl::list<mpl_::na, mpl_::na,
mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na,
mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na,
mpl_::na, mpl_::na, mpl_::na, mpl_::na>,
(boost::statechart::history_mode)0>
>(boost::statechart::simple_state<PG::RecoveryState::Reset,
PG::RecoveryState::RecoveryMachine, boost::mpl::list<mpl_::na, mpl_::na,
mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na,
mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na, mpl_::na,
mpl_::na, mpl_::na, mpl_::na, mpl_::na>,
(boost::statechart::history_mode)0>&, boost::statechart::event_base
const&, void const*)+0x53) [0x78ac33]
8:
(boost::statechart::state_machine<PG::RecoveryState::RecoveryMachine,
PG::RecoveryState::Initial, std::allocator<void>,
boost::statechart::null_exception_translator>::send_event(boost::statechart::event_base
const&)+0x5b) [0x76f58b]
9:
(boost::statechart::state_machine<PG::RecoveryState::RecoveryMachine,
PG::RecoveryState::Initial, std::allocator<void>,
boost::statechart::null_exception_translator>::process_event(boost::statechart::event_base
const&)+0x19) [0x76f619]
10: (PG::RecoveryState::handle_event(boost::statechart::event_base
const&, PG::RecoveryCtx*)+0x4d) [0x76f6cd]
11: (PG::handle_advance_map(std::tr1::shared_ptr<OSDMap const>,
std::tr1::shared_ptr<OSDMap const>, std::vector<int, std::allocator<int>
>&, std::vector<int, std::allocator<int> >&, PG::RecoveryCtx*)+0x196)
[0x72bf46]
12: (OSD::advance_pg(unsigned int, PG*, PG::RecoveryCtx*,
std::set<boost::intrusive_ptr<PG>, std::less<boost::intrusive_ptr<PG> >,
std::allocator<boost::intrusive_ptr<PG> > >*)+0x48b) [0x6cf14b]
13: (OSD::process_peering_events(std::list<PG*, std::allocator<PG*> >
const&)+0x2a6) [0x6cf7f6]
14: (OSD::PeeringWQ::_process(std::list<PG*, std::allocator<PG*> >
const&)+0x17) [0x70a3f7]
15: (ThreadPool::worker(ThreadPool::WorkThread*)+0x95c) [0x8ccccc]
16: (ThreadPool::WorkThread::entry()+0x10) [0x8cdc40]
17: /lib64/libpthread.so.0() [0x360de07d14]
18: (clone()+0x6d) [0x360d6f167d]
--
Jens Kristian Søgaard, Mermaid Consulting ApS,
jens@xxxxxxxxxxxxxxxxxxxx,
http://www.mermaidconsulting.com/
--
To unsubscribe from this list: send the line "unsubscribe ceph-devel" in
the body of a message to majordomo@xxxxxxxxxxxxxxx
More majordomo info at http://vger.kernel.org/majordomo-info.html