]>
git.proxmox.com Git - ceph.git/blob - ceph/src/msg/simple/SimpleMessenger.cc
84b6a253ec6e6ee72499e312d4d6737d09841f85
1 // -*- mode:C++; tab-width:8; c-basic-offset:2; indent-tabs-mode:t -*-
2 // vim: ts=8 sw=2 smarttab
4 * Ceph - scalable distributed file system
6 * Copyright (C) 2004-2006 Sage Weil <sage@newdream.net>
8 * This is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU Lesser General Public
10 * License version 2.1, as published by the Free Software
11 * Foundation. See file COPYING.
20 #include "SimpleMessenger.h"
22 #include "common/config.h"
23 #include "common/Timer.h"
24 #include "common/errno.h"
25 #include "common/valgrind.h"
26 #include "auth/Crypto.h"
27 #include "include/Spinlock.h"
29 #define dout_subsys ceph_subsys_ms
31 #define dout_prefix _prefix(_dout, this)
32 static ostream
& _prefix(std::ostream
*_dout
, SimpleMessenger
*msgr
) {
33 return *_dout
<< "-- " << msgr
->get_myaddr() << " ";
41 SimpleMessenger::SimpleMessenger(CephContext
*cct
, entity_name_t name
,
42 string mname
, uint64_t _nonce
)
43 : SimplePolicyMessenger(cct
, name
,mname
, _nonce
),
44 accepter(this, _nonce
),
45 dispatch_queue(cct
, this, mname
),
48 lock("SimpleMessenger::lock"), need_addr(true), did_bind(false),
51 reaper_started(false), reaper_stop(false),
53 local_connection(new PipeConnection(cct
, this))
55 ANNOTATE_BENIGN_RACE_SIZED(&timeout
, sizeof(timeout
),
56 "SimpleMessenger read timeout");
57 ceph_spin_init(&global_seq_lock
);
58 init_local_connection();
62 * Destroy the SimpleMessenger. Pretty simple since all the work is done
65 SimpleMessenger::~SimpleMessenger()
67 assert(!did_bind
); // either we didn't bind or we shut down the Accepter
68 assert(rank_pipe
.empty()); // we don't have any running Pipes.
69 assert(!reaper_started
); // the reaper thread is stopped
70 ceph_spin_destroy(&global_seq_lock
);
73 void SimpleMessenger::ready()
75 ldout(cct
,10) << "ready " << get_myaddr() << dendl
;
76 dispatch_queue
.start();
85 int SimpleMessenger::shutdown()
87 ldout(cct
,10) << "shutdown " << get_myaddr() << dendl
;
90 // break ref cycles on the loopback connection
91 local_connection
->set_priv(NULL
);
101 int SimpleMessenger::_send_message(Message
*m
, const entity_inst_t
& dest
)
104 m
->get_header().src
= get_myname();
107 if (!m
->get_priority()) m
->set_priority(get_default_send_priority());
109 ldout(cct
,1) <<"--> " << dest
.name
<< " "
110 << dest
.addr
<< " -- " << *m
111 << " -- ?+" << m
->get_data().length()
115 if (dest
.addr
== entity_addr_t()) {
116 ldout(cct
,0) << "send_message message " << *m
117 << " with empty dest " << dest
.addr
<< dendl
;
123 Pipe
*pipe
= _lookup_pipe(dest
.addr
);
124 submit_message(m
, (pipe
? pipe
->connection_state
.get() : NULL
),
125 dest
.addr
, dest
.name
.type(), true);
130 int SimpleMessenger::_send_message(Message
*m
, Connection
*con
)
133 m
->get_header().src
= get_myname();
135 if (!m
->get_priority()) m
->set_priority(get_default_send_priority());
137 ldout(cct
,1) << "--> " << con
->get_peer_addr()
139 << " -- ?+" << m
->get_data().length()
140 << " " << m
<< " con " << con
143 submit_message(m
, static_cast<PipeConnection
*>(con
),
144 con
->get_peer_addr(), con
->get_peer_type(), false);
149 * If my_inst.addr doesn't have an IP set, this function
150 * will fill it in from the passed addr. Otherwise it does nothing and returns.
152 void SimpleMessenger::set_addr_unknowns(const entity_addr_t
&addr
)
154 if (my_inst
.addr
.is_blank_ip()) {
155 int port
= my_inst
.addr
.get_port();
156 my_inst
.addr
.u
= addr
.u
;
157 my_inst
.addr
.set_port(port
);
158 init_local_connection();
162 int SimpleMessenger::get_proto_version(int peer_type
, bool connect
)
164 int my_type
= my_inst
.name
.type();
166 // set reply protocol version
167 if (peer_type
== my_type
) {
169 return cluster_protocol
;
174 case CEPH_ENTITY_TYPE_OSD
: return CEPH_OSDC_PROTOCOL
;
175 case CEPH_ENTITY_TYPE_MDS
: return CEPH_MDSC_PROTOCOL
;
176 case CEPH_ENTITY_TYPE_MON
: return CEPH_MONC_PROTOCOL
;
180 case CEPH_ENTITY_TYPE_OSD
: return CEPH_OSDC_PROTOCOL
;
181 case CEPH_ENTITY_TYPE_MDS
: return CEPH_MDSC_PROTOCOL
;
182 case CEPH_ENTITY_TYPE_MON
: return CEPH_MONC_PROTOCOL
;
195 /********************************************
199 #define dout_prefix _prefix(_dout, this)
201 void SimpleMessenger::reaper_entry()
203 ldout(cct
,10) << "reaper_entry start" << dendl
;
205 while (!reaper_stop
) {
206 reaper(); // may drop and retake the lock
209 reaper_cond
.Wait(lock
);
212 ldout(cct
,10) << "reaper_entry done" << dendl
;
216 * note: assumes lock is held
218 void SimpleMessenger::reaper()
220 ldout(cct
,10) << "reaper" << dendl
;
221 assert(lock
.is_locked());
223 while (!pipe_reap_queue
.empty()) {
224 Pipe
*p
= pipe_reap_queue
.front();
225 pipe_reap_queue
.pop_front();
226 ldout(cct
,10) << "reaper reaping pipe " << p
<< " " <<
227 p
->get_peer_addr() << dendl
;
229 p
->discard_out_queue();
230 if (p
->connection_state
) {
231 // mark_down, mark_down_all, or fault() should have done this,
232 // or accept() may have switched the Connection to a different
233 // Pipe... but make sure!
234 bool cleared
= p
->connection_state
->clear_pipe(p
);
237 p
->pipe_lock
.Unlock();
238 p
->unregister_pipe();
239 assert(pipes
.count(p
));
242 // drop msgr lock while joining thread; the delay thread could be
243 // trying to fast dispatch, preventing it from joining without
244 // blocking and deadlocking.
251 ldout(cct
,10) << "reaper reaped pipe " << p
<< " " << p
->get_peer_addr() << dendl
;
253 ldout(cct
,10) << "reaper deleted pipe " << p
<< dendl
;
255 ldout(cct
,10) << "reaper done" << dendl
;
258 void SimpleMessenger::queue_reap(Pipe
*pipe
)
260 ldout(cct
,10) << "queue_reap " << pipe
<< dendl
;
262 pipe_reap_queue
.push_back(pipe
);
263 reaper_cond
.Signal();
267 bool SimpleMessenger::is_connected(Connection
*con
)
271 Pipe
*p
= static_cast<Pipe
*>(static_cast<PipeConnection
*>(con
)->get_pipe());
273 assert(p
->msgr
== this);
274 r
= p
->is_connected();
281 int SimpleMessenger::bind(const entity_addr_t
&bind_addr
)
285 ldout(cct
,10) << "rank.bind already started" << dendl
;
289 ldout(cct
,10) << "rank.bind " << bind_addr
<< dendl
;
293 set
<int> avoid_ports
;
294 int r
= accepter
.bind(bind_addr
, avoid_ports
);
300 int SimpleMessenger::rebind(const set
<int>& avoid_ports
)
302 ldout(cct
,1) << "rebind avoid " << avoid_ports
<< dendl
;
306 return accepter
.rebind(avoid_ports
);
310 int SimpleMessenger::client_bind(const entity_addr_t
&bind_addr
)
312 if (!cct
->_conf
->ms_bind_before_connect
)
314 Mutex::Locker
l(lock
);
316 assert(my_inst
.addr
== bind_addr
);
320 ldout(cct
,10) << "rank.bind already started" << dendl
;
323 ldout(cct
,10) << "rank.bind " << bind_addr
<< dendl
;
325 set_myaddr(bind_addr
);
330 int SimpleMessenger::start()
333 ldout(cct
,1) << "messenger.start" << dendl
;
335 // register at least one entity, first!
336 assert(my_inst
.name
.type() >= 0);
343 my_inst
.addr
.nonce
= nonce
;
344 init_local_connection();
349 reaper_started
= true;
350 reaper_thread
.create("ms_reaper");
354 Pipe
*SimpleMessenger::add_accept_pipe(int sd
)
357 Pipe
*p
= new Pipe(this, Pipe::STATE_ACCEPTING
, NULL
);
361 p
->pipe_lock
.Unlock();
363 accepting_pipes
.insert(p
);
369 * NOTE: assumes messenger.lock held.
371 Pipe
*SimpleMessenger::connect_rank(const entity_addr_t
& addr
,
376 assert(lock
.is_locked());
377 assert(addr
!= my_inst
.addr
);
379 ldout(cct
,10) << "connect_rank to " << addr
<< ", creating pipe and registering" << dendl
;
382 Pipe
*pipe
= new Pipe(this, Pipe::STATE_CONNECTING
,
383 static_cast<PipeConnection
*>(con
));
384 pipe
->pipe_lock
.Lock();
385 pipe
->set_peer_type(type
);
386 pipe
->set_peer_addr(addr
);
387 pipe
->policy
= get_policy(type
);
388 pipe
->start_writer();
391 pipe
->pipe_lock
.Unlock();
392 pipe
->register_pipe();
403 AuthAuthorizer
*SimpleMessenger::get_authorizer(int peer_type
, bool force_new
)
405 return ms_deliver_get_authorizer(peer_type
, force_new
);
408 bool SimpleMessenger::verify_authorizer(Connection
*con
, int peer_type
,
409 int protocol
, bufferlist
& authorizer
, bufferlist
& authorizer_reply
,
410 bool& isvalid
,CryptoKey
& session_key
)
412 return ms_deliver_verify_authorizer(con
, peer_type
, protocol
, authorizer
, authorizer_reply
, isvalid
,session_key
);
415 ConnectionRef
SimpleMessenger::get_connection(const entity_inst_t
& dest
)
417 Mutex::Locker
l(lock
);
418 if (my_inst
.addr
== dest
.addr
) {
420 return local_connection
;
425 Pipe
*pipe
= _lookup_pipe(dest
.addr
);
427 ldout(cct
, 10) << "get_connection " << dest
<< " existing " << pipe
<< dendl
;
429 pipe
= connect_rank(dest
.addr
, dest
.name
.type(), NULL
, NULL
);
430 ldout(cct
, 10) << "get_connection " << dest
<< " new " << pipe
<< dendl
;
432 Mutex::Locker
l(pipe
->pipe_lock
);
433 if (pipe
->connection_state
)
434 return pipe
->connection_state
;
435 // we failed too quickly! retry. FIXME.
439 ConnectionRef
SimpleMessenger::get_loopback_connection()
441 return local_connection
;
444 void SimpleMessenger::submit_message(Message
*m
, PipeConnection
*con
,
445 const entity_addr_t
& dest_addr
, int dest_type
,
448 m
->trace
.event("simple submitting message");
449 if (cct
->_conf
->ms_dump_on_send
) {
451 ldout(cct
, 0) << "submit_message " << *m
<< "\n";
452 m
->get_payload().hexdump(*_dout
);
453 if (m
->get_data().length() > 0) {
454 *_dout
<< " data:\n";
455 m
->get_data().hexdump(*_dout
);
461 // existing connection?
464 bool ok
= static_cast<PipeConnection
*>(con
)->try_get_pipe(&pipe
);
466 ldout(cct
,0) << "submit_message " << *m
<< " remote, " << dest_addr
467 << ", failed lossy con, dropping message " << m
<< dendl
;
472 // we loop in case of a racing reconnect, either from us or them
473 pipe
->pipe_lock
.Lock(); // can't use a Locker because of the Pipe ref
474 if (pipe
->state
!= Pipe::STATE_CLOSED
) {
475 ldout(cct
,20) << "submit_message " << *m
<< " remote, " << dest_addr
<< ", have pipe." << dendl
;
477 pipe
->pipe_lock
.Unlock();
482 ok
= con
->try_get_pipe(¤t_pipe
);
483 pipe
->pipe_lock
.Unlock();
484 if (current_pipe
== pipe
) {
485 ldout(cct
,20) << "submit_message " << *m
<< " remote, " << dest_addr
486 << ", had pipe " << pipe
<< ", but it closed." << dendl
;
499 if (my_inst
.addr
== dest_addr
) {
501 ldout(cct
,20) << "submit_message " << *m
<< " local" << dendl
;
502 m
->set_connection(local_connection
.get());
503 dispatch_queue
.local_delivery(m
, m
->get_priority());
507 // remote, no existing pipe.
508 const Policy
& policy
= get_policy(dest_type
);
510 ldout(cct
,20) << "submit_message " << *m
<< " remote, " << dest_addr
<< ", lossy server for target type "
511 << ceph_entity_type_name(dest_type
) << ", no session, dropping." << dendl
;
514 ldout(cct
,20) << "submit_message " << *m
<< " remote, " << dest_addr
<< ", new pipe." << dendl
;
515 if (!already_locked
) {
516 /** We couldn't handle the Message without reference to global data, so
517 * grab the lock and do it again. If we got here, we know it's a non-lossy
518 * Connection, so we can use our existing pointer without doing another lookup. */
519 Mutex::Locker
l(lock
);
520 submit_message(m
, con
, dest_addr
, dest_type
, true);
522 connect_rank(dest_addr
, dest_type
, static_cast<PipeConnection
*>(con
), m
);
527 int SimpleMessenger::send_keepalive(Connection
*con
)
530 Pipe
*pipe
= static_cast<Pipe
*>(
531 static_cast<PipeConnection
*>(con
)->get_pipe());
533 ldout(cct
,20) << "send_keepalive con " << con
<< ", have pipe." << dendl
;
534 assert(pipe
->msgr
== this);
535 pipe
->pipe_lock
.Lock();
536 pipe
->_send_keepalive();
537 pipe
->pipe_lock
.Unlock();
540 ldout(cct
,0) << "send_keepalive con " << con
<< ", no pipe." << dendl
;
548 void SimpleMessenger::wait()
556 stop_cond
.Wait(lock
);
562 ldout(cct
,20) << "wait: stopping accepter thread" << dendl
;
565 ldout(cct
,20) << "wait: stopped accepter thread" << dendl
;
568 dispatch_queue
.shutdown();
569 if (dispatch_queue
.is_started()) {
570 ldout(cct
,10) << "wait: waiting for dispatch queue" << dendl
;
571 dispatch_queue
.wait();
572 dispatch_queue
.discard_local();
573 ldout(cct
,10) << "wait: dispatch queue is stopped" << dendl
;
576 if (reaper_started
) {
577 ldout(cct
,20) << "wait: stopping reaper thread" << dendl
;
579 reaper_cond
.Signal();
582 reaper_thread
.join();
583 reaper_started
= false;
584 ldout(cct
,20) << "wait: stopped reaper thread" << dendl
;
587 // close+reap all pipes
590 ldout(cct
,10) << "wait: closing pipes" << dendl
;
592 while (!rank_pipe
.empty()) {
593 Pipe
*p
= rank_pipe
.begin()->second
;
594 p
->unregister_pipe();
597 // don't generate an event here; we're shutting down anyway.
598 PipeConnectionRef con
= p
->connection_state
;
601 p
->pipe_lock
.Unlock();
605 ldout(cct
,10) << "wait: waiting for pipes " << pipes
<< " to close" << dendl
;
606 while (!pipes
.empty()) {
607 reaper_cond
.Wait(lock
);
613 ldout(cct
,10) << "wait: done." << dendl
;
614 ldout(cct
,1) << "shutdown complete." << dendl
;
619 void SimpleMessenger::mark_down_all()
621 ldout(cct
,1) << "mark_down_all" << dendl
;
623 for (set
<Pipe
*>::iterator q
= accepting_pipes
.begin(); q
!= accepting_pipes
.end(); ++q
) {
625 ldout(cct
,5) << "mark_down_all accepting_pipe " << p
<< dendl
;
628 PipeConnectionRef con
= p
->connection_state
;
629 if (con
&& con
->clear_pipe(p
))
630 dispatch_queue
.queue_reset(con
.get());
631 p
->pipe_lock
.Unlock();
633 accepting_pipes
.clear();
635 while (!rank_pipe
.empty()) {
636 ceph::unordered_map
<entity_addr_t
,Pipe
*>::iterator it
= rank_pipe
.begin();
637 Pipe
*p
= it
->second
;
638 ldout(cct
,5) << "mark_down_all " << it
->first
<< " " << p
<< dendl
;
640 p
->unregister_pipe();
643 PipeConnectionRef con
= p
->connection_state
;
644 if (con
&& con
->clear_pipe(p
))
645 dispatch_queue
.queue_reset(con
.get());
646 p
->pipe_lock
.Unlock();
651 void SimpleMessenger::mark_down(const entity_addr_t
& addr
)
654 Pipe
*p
= _lookup_pipe(addr
);
656 ldout(cct
,1) << "mark_down " << addr
<< " -- " << p
<< dendl
;
657 p
->unregister_pipe();
660 if (p
->connection_state
) {
661 // generate a reset event for the caller in this case, even
662 // though they asked for it, since this is the addr-based (and
663 // not Connection* based) interface
664 PipeConnectionRef con
= p
->connection_state
;
665 if (con
&& con
->clear_pipe(p
))
666 dispatch_queue
.queue_reset(con
.get());
668 p
->pipe_lock
.Unlock();
670 ldout(cct
,1) << "mark_down " << addr
<< " -- pipe dne" << dendl
;
675 void SimpleMessenger::mark_down(Connection
*con
)
680 Pipe
*p
= static_cast<Pipe
*>(static_cast<PipeConnection
*>(con
)->get_pipe());
682 ldout(cct
,1) << "mark_down " << con
<< " -- " << p
<< dendl
;
683 assert(p
->msgr
== this);
684 p
->unregister_pipe();
687 if (p
->connection_state
) {
688 // do not generate a reset event for the caller in this case,
689 // since they asked for it.
690 p
->connection_state
->clear_pipe(p
);
692 p
->pipe_lock
.Unlock();
695 ldout(cct
,1) << "mark_down " << con
<< " -- pipe dne" << dendl
;
700 void SimpleMessenger::mark_disposable(Connection
*con
)
703 Pipe
*p
= static_cast<Pipe
*>(static_cast<PipeConnection
*>(con
)->get_pipe());
705 ldout(cct
,1) << "mark_disposable " << con
<< " -- " << p
<< dendl
;
706 assert(p
->msgr
== this);
708 p
->policy
.lossy
= true;
709 p
->pipe_lock
.Unlock();
712 ldout(cct
,1) << "mark_disposable " << con
<< " -- pipe dne" << dendl
;
717 void SimpleMessenger::learned_addr(const entity_addr_t
&peer_addr_for_me
)
719 // be careful here: multiple threads may block here, and readers of
720 // my_inst.addr do NOT hold any lock.
722 // this always goes from true -> false under the protection of the
723 // mutex. if it is already false, we need not retake the mutex at
730 entity_addr_t t
= peer_addr_for_me
;
731 t
.set_port(my_inst
.addr
.get_port());
732 t
.set_nonce(my_inst
.addr
.get_nonce());
733 ANNOTATE_BENIGN_RACE_SIZED(&my_inst
.addr
, sizeof(my_inst
.addr
),
734 "SimpleMessenger learned addr");
736 ldout(cct
,1) << "learned my addr " << my_inst
.addr
<< dendl
;
738 init_local_connection();
743 void SimpleMessenger::init_local_connection()
745 local_connection
->peer_addr
= my_inst
.addr
;
746 local_connection
->peer_type
= my_inst
.name
.type();
747 local_connection
->set_features(CEPH_FEATURES_ALL
);
748 ms_deliver_handle_fast_connect(local_connection
.get());