1 // -*- mode:C++; tab-width:8; c-basic-offset:2; indent-tabs-mode:t -*-
2 // vim: ts=8 sw=2 smarttab
12 #include "include/types.h"
14 #include "global/global_context.h"
18 #include "messages/MPGStats.h"
20 #include "messages/MGenericMessage.h"
22 #include "messages/MPGStatsAck.h"
24 #include "messages/MStatfs.h"
25 #include "messages/MStatfsReply.h"
27 #include "messages/MGetPoolStats.h"
28 #include "messages/MGetPoolStatsReply.h"
31 #include "messages/MPoolOp.h"
32 #include "messages/MPoolOpReply.h"
34 #include "messages/PaxosServiceMessage.h"
35 #include "messages/MMonCommand.h"
36 #include "messages/MMonCommandAck.h"
37 #include "messages/MMonPaxos.h"
39 #include "messages/MMonProbe.h"
40 #include "messages/MMonJoin.h"
41 #include "messages/MMonElection.h"
42 #include "messages/MMonSync.h"
43 #include "messages/MMonScrub.h"
45 #include "messages/MLog.h"
46 #include "messages/MLogAck.h"
48 #include "messages/MPing.h"
50 #include "messages/MCommand.h"
51 #include "messages/MCommandReply.h"
52 #include "messages/MBackfillReserve.h"
53 #include "messages/MRecoveryReserve.h"
55 #include "messages/MRoute.h"
56 #include "messages/MForward.h"
58 #include "messages/MOSDBoot.h"
59 #include "messages/MOSDAlive.h"
60 #include "messages/MOSDBeacon.h"
61 #include "messages/MOSDPGTemp.h"
62 #include "messages/MOSDFailure.h"
63 #include "messages/MOSDMarkMeDown.h"
64 #include "messages/MOSDFull.h"
65 #include "messages/MOSDPing.h"
66 #include "messages/MOSDOp.h"
67 #include "messages/MOSDOpReply.h"
68 #include "messages/MOSDSubOp.h"
69 #include "messages/MOSDSubOpReply.h"
70 #include "messages/MOSDRepOp.h"
71 #include "messages/MOSDRepOpReply.h"
72 #include "messages/MOSDMap.h"
73 #include "messages/MMonGetOSDMap.h"
75 #include "messages/MOSDPGCreated.h"
76 #include "messages/MOSDPGNotify.h"
77 #include "messages/MOSDPGQuery.h"
78 #include "messages/MOSDPGLog.h"
79 #include "messages/MOSDPGRemove.h"
80 #include "messages/MOSDPGInfo.h"
81 #include "messages/MOSDPGCreate.h"
82 #include "messages/MOSDPGTrim.h"
83 #include "messages/MOSDScrub.h"
84 #include "messages/MOSDScrubReserve.h"
85 #include "messages/MOSDRepScrub.h"
86 #include "messages/MOSDRepScrubMap.h"
87 #include "messages/MOSDPGScan.h"
88 #include "messages/MOSDPGBackfill.h"
89 #include "messages/MOSDBackoff.h"
90 #include "messages/MOSDPGBackfillRemove.h"
92 #include "messages/MRemoveSnaps.h"
94 #include "messages/MMonMap.h"
95 #include "messages/MMonGetMap.h"
96 #include "messages/MMonGetVersion.h"
97 #include "messages/MMonGetVersionReply.h"
98 #include "messages/MMonHealth.h"
99 #include "messages/MMonHealthChecks.h"
100 #include "messages/MMonMetadata.h"
101 #include "messages/MDataPing.h"
102 #include "messages/MAuth.h"
103 #include "messages/MAuthReply.h"
104 #include "messages/MMonSubscribe.h"
105 #include "messages/MMonSubscribeAck.h"
106 #include "messages/MMonGlobalID.h"
107 #include "messages/MClientSession.h"
108 #include "messages/MClientReconnect.h"
109 #include "messages/MClientRequest.h"
110 #include "messages/MClientRequestForward.h"
111 #include "messages/MClientReply.h"
112 #include "messages/MClientCaps.h"
113 #include "messages/MClientCapRelease.h"
114 #include "messages/MClientLease.h"
115 #include "messages/MClientSnap.h"
116 #include "messages/MClientQuota.h"
118 #include "messages/MMDSSlaveRequest.h"
120 #include "messages/MMDSMap.h"
121 #include "messages/MFSMap.h"
122 #include "messages/MFSMapUser.h"
123 #include "messages/MMDSBeacon.h"
124 #include "messages/MMDSLoadTargets.h"
125 #include "messages/MMDSResolve.h"
126 #include "messages/MMDSResolveAck.h"
127 #include "messages/MMDSCacheRejoin.h"
128 #include "messages/MMDSFindIno.h"
129 #include "messages/MMDSFindInoReply.h"
130 #include "messages/MMDSOpenIno.h"
131 #include "messages/MMDSOpenInoReply.h"
133 #include "messages/MDirUpdate.h"
134 #include "messages/MDiscover.h"
135 #include "messages/MDiscoverReply.h"
137 #include "messages/MMDSFragmentNotify.h"
139 #include "messages/MExportDirDiscover.h"
140 #include "messages/MExportDirDiscoverAck.h"
141 #include "messages/MExportDirCancel.h"
142 #include "messages/MExportDirPrep.h"
143 #include "messages/MExportDirPrepAck.h"
144 #include "messages/MExportDir.h"
145 #include "messages/MExportDirAck.h"
146 #include "messages/MExportDirNotify.h"
147 #include "messages/MExportDirNotifyAck.h"
148 #include "messages/MExportDirFinish.h"
150 #include "messages/MExportCaps.h"
151 #include "messages/MExportCapsAck.h"
152 #include "messages/MGatherCaps.h"
155 #include "messages/MDentryUnlink.h"
156 #include "messages/MDentryLink.h"
158 #include "messages/MHeartbeat.h"
160 #include "messages/MMDSTableRequest.h"
162 //#include "messages/MInodeUpdate.h"
163 #include "messages/MCacheExpire.h"
164 #include "messages/MInodeFileCaps.h"
166 #include "messages/MMgrBeacon.h"
167 #include "messages/MMgrMap.h"
168 #include "messages/MMgrDigest.h"
169 #include "messages/MMgrReport.h"
170 #include "messages/MMgrOpen.h"
171 #include "messages/MMgrConfigure.h"
172 #include "messages/MMonMgrReport.h"
173 #include "messages/MServiceMap.h"
175 #include "messages/MLock.h"
177 #include "messages/MWatchNotify.h"
178 #include "messages/MTimeCheck.h"
180 #include "common/config.h"
182 #include "messages/MOSDPGPush.h"
183 #include "messages/MOSDPGPushReply.h"
184 #include "messages/MOSDPGPull.h"
186 #include "messages/MOSDECSubOpWrite.h"
187 #include "messages/MOSDECSubOpWriteReply.h"
188 #include "messages/MOSDECSubOpRead.h"
189 #include "messages/MOSDECSubOpReadReply.h"
191 #include "messages/MOSDPGUpdateLogMissing.h"
192 #include "messages/MOSDPGUpdateLogMissingReply.h"
194 #define DEBUGLVL 10 // debug level of output
196 #define dout_subsys ceph_subsys_ms
// Prepares this message for transmission.
//   features - feature bits forwarded to encode_payload()
//   crcflags - bit mask tested against MSG_CRC_HEADER and MSG_CRC_DATA
// Visible flow: encode the payload if it is still empty, default
// header.compat_version to header.version when it is 0, record the section
// lengths in the header, and set the footer flags.
// NOTE(review): this listing omits many original lines (the embedded line
// numbers skip), so the bodies of the CRC branches and the guards around the
// dump-to-file section cannot be confirmed from here.
198 void Message::encode(uint64_t features
, int crcflags
)
200 // encode and copy out of *m
201 if (empty_payload()) {
202 assert(middle
.length() == 0);
203 encode_payload(features
);
// Account the freshly encoded payload and middle bytes with the byte
// throttler, if one is attached.
205 if (byte_throttler
) {
206 byte_throttler
->take(payload
.length() + middle
.length());
209 // if the encoder didn't specify past compatibility, we assume it
211 if (header
.compat_version
== 0)
212 header
.compat_version
= header
.version
;
// NOTE(review): the statements guarded by the two MSG_CRC_HEADER checks below
// are not visible in this listing.
214 if (crcflags
& MSG_CRC_HEADER
)
// Record the length of each section in the header.
218 header
.front_len
= get_payload().length();
219 header
.middle_len
= get_middle().length();
220 header
.data_len
= get_data().length();
221 if (crcflags
& MSG_CRC_HEADER
)
224 footer
.flags
= CEPH_MSG_FOOTER_COMPLETE
;
226 if (crcflags
& MSG_CRC_DATA
) {
// From here through the ::open call: the header, an old-format copy of the
// footer and the three sections are serialized into bl, and a file name is
// built under the ENCODE_DUMP directory from the demangled type name.
// Presumably a debug-only dump path; the guarding lines are not visible here.
231 ::encode(get_header(), bl
);
233 // dump the old footer format
234 ceph_msg_footer_old old_footer
;
235 old_footer
.front_crc
= footer
.front_crc
;
236 old_footer
.middle_crc
= footer
.middle_crc
;
237 old_footer
.data_crc
= footer
.data_crc
;
238 old_footer
.flags
= footer
.flags
;
239 ::encode(old_footer
, bl
);
241 ::encode(get_payload(), bl
);
242 ::encode(get_middle(), bl
);
243 ::encode(get_data(), bl
);
245 // this is almost an exponential backoff, except because we count
246 // bits we tend to sample things we encode later, which should be
247 // more representative.
251 for (unsigned t
= i
; t
; bits
++)
256 snprintf(fn
, sizeof(fn
), ENCODE_STRINGIFY(ENCODE_DUMP
) "/%s__%d.%x",
257 abi::__cxa_demangle(typeid(*this).name(), 0, 0, &status
),
259 int fd
= ::open(fn
, O_WRONLY
|O_TRUNC
|O_CREAT
, 0644);
// Flag the footer as carrying no CRC (the condition selecting this path is
// not visible in this listing).
267 footer
.flags
= (unsigned)footer
.flags
| CEPH_MSG_FOOTER_NOCRC
;
// Writes a "summary" string field for this message to the formatter f.
// The value comes from the string stream ss; how ss is declared and filled is
// not visible in this listing.
271 void Message::dump(Formatter
*f
) const
275 f
->dump_string("summary", ss
.str());
// Builds a Message object from already-separated wire sections.
//   cct      - context used for logging (ldout/lderr) and for reading _conf options
//   crcflags - bit mask tested against MSG_CRC_HEADER and MSG_CRC_DATA to
//              select which CRC checks run
//   header   - wire header; supplies the message type, version and compat_version
//   footer   - wire footer; supplies the expected CRCs and the flags
//   front, middle, data - the three section buffers; front and middle are
//              installed as the message's payload and middle
//   conn     - connection attached to the new message via set_connection()
// Visible flow: optional CRC verification, case labels keyed on message type
// constants that allocate the matching message class into m, a compat_version
// check, installation of connection/header/footer/buffers on the message, and
// a buffer::error handler that logs decode failures.
// NOTE(review): this listing omits many original lines (the embedded line
// numbers skip), including the return statements and several case bodies, so
// the exact failure-path behaviour cannot be confirmed from here.
278 Message
*decode_message(CephContext
*cct
, int crcflags
,
279 ceph_msg_header
& header
,
280 ceph_msg_footer
& footer
,
281 bufferlist
& front
, bufferlist
& middle
,
282 bufferlist
& data
, Connection
* conn
)
// When header CRC checking is requested, compare the computed front and middle
// CRCs with the footer; a mismatch is logged at level 0 and the buffer is
// hex-dumped at level 20.
285 if (crcflags
& MSG_CRC_HEADER
) {
286 __u32 front_crc
= front
.crc32c(0);
287 __u32 middle_crc
= middle
.crc32c(0);
289 if (front_crc
!= footer
.front_crc
) {
291 ldout(cct
, 0) << "bad crc in front " << front_crc
<< " != exp " << footer
.front_crc
<< dendl
;
292 ldout(cct
, 20) << " ";
293 front
.hexdump(*_dout
);
298 if (middle_crc
!= footer
.middle_crc
) {
300 ldout(cct
, 0) << "bad crc in middle " << middle_crc
<< " != exp " << footer
.middle_crc
<< dendl
;
301 ldout(cct
, 20) << " ";
302 middle
.hexdump(*_dout
);
// When data CRC checking is requested, verify the data CRC unless the footer
// carries CEPH_MSG_FOOTER_NOCRC.
308 if (crcflags
& MSG_CRC_DATA
) {
309 if ((footer
.flags
& CEPH_MSG_FOOTER_NOCRC
) == 0) {
310 __u32 data_crc
= data
.crc32c(0);
311 if (data_crc
!= footer
.data_crc
) {
313 ldout(cct
, 0) << "bad crc in data " << data_crc
<< " != exp " << footer
.data_crc
<< dendl
;
314 ldout(cct
, 20) << " ";
315 data
.hexdump(*_dout
);
// The message type is read from the header; each visible case below allocates
// the matching message class into m.
325 int type
= header
.type
;
328 // -- with payload --
337 case CEPH_MSG_STATFS
:
340 case CEPH_MSG_STATFS_REPLY
:
341 m
= new MStatfsReply
;
343 case MSG_GETPOOLSTATS
:
344 m
= new MGetPoolStats
;
346 case MSG_GETPOOLSTATSREPLY
:
347 m
= new MGetPoolStatsReply
;
349 case CEPH_MSG_POOLOP
:
352 case CEPH_MSG_POOLOP_REPLY
:
353 m
= new MPoolOpReply
;
355 case MSG_MON_COMMAND
:
358 case MSG_MON_COMMAND_ACK
:
359 m
= new MMonCommandAck
;
371 case MSG_MON_ELECTION
:
372 m
= new MMonElection
;
394 case MSG_COMMAND_REPLY
:
395 m
= new MCommandReply
;
397 case MSG_OSD_BACKFILL_RESERVE
:
398 m
= new MBackfillReserve
;
400 case MSG_OSD_RECOVERY_RESERVE
:
401 m
= new MRecoveryReserve
;
411 case CEPH_MSG_MON_MAP
:
414 case CEPH_MSG_MON_GET_MAP
:
417 case CEPH_MSG_MON_GET_OSDMAP
:
418 m
= new MMonGetOSDMap
;
420 case CEPH_MSG_MON_GET_VERSION
:
421 m
= new MMonGetVersion();
423 case CEPH_MSG_MON_GET_VERSION_REPLY
:
424 m
= new MMonGetVersionReply();
426 case CEPH_MSG_MON_METADATA
:
427 m
= new MMonMetadata();
437 m
= new MOSDBeacon();
442 case MSG_OSD_FAILURE
:
443 m
= new MOSDFailure();
445 case MSG_OSD_MARK_ME_DOWN
:
446 m
= new MOSDMarkMeDown();
454 case CEPH_MSG_OSD_OP
:
457 case CEPH_MSG_OSD_OPREPLY
:
458 m
= new MOSDOpReply();
463 case MSG_OSD_SUBOPREPLY
:
464 m
= new MOSDSubOpReply();
469 case MSG_OSD_REPOPREPLY
:
470 m
= new MOSDRepOpReply();
472 case MSG_OSD_PG_CREATED
:
473 m
= new MOSDPGCreated();
475 case MSG_OSD_PG_UPDATE_LOG_MISSING
:
476 m
= new MOSDPGUpdateLogMissing();
478 case MSG_OSD_PG_UPDATE_LOG_MISSING_REPLY
:
479 m
= new MOSDPGUpdateLogMissingReply();
481 case CEPH_MSG_OSD_BACKOFF
:
485 case CEPH_MSG_OSD_MAP
:
489 case CEPH_MSG_WATCH_NOTIFY
:
490 m
= new MWatchNotify
;
493 case MSG_OSD_PG_NOTIFY
:
494 m
= new MOSDPGNotify
;
496 case MSG_OSD_PG_QUERY
:
502 case MSG_OSD_PG_REMOVE
:
503 m
= new MOSDPGRemove
;
505 case MSG_OSD_PG_INFO
:
508 case MSG_OSD_PG_CREATE
:
509 m
= new MOSDPGCreate
;
511 case MSG_OSD_PG_TRIM
:
518 case MSG_OSD_SCRUB_RESERVE
:
519 m
= new MOSDScrubReserve
;
521 case MSG_REMOVE_SNAPS
:
522 m
= new MRemoveSnaps
;
524 case MSG_OSD_REP_SCRUB
:
525 m
= new MOSDRepScrub
;
527 case MSG_OSD_REP_SCRUBMAP
:
528 m
= new MOSDRepScrubMap
;
530 case MSG_OSD_PG_SCAN
:
533 case MSG_OSD_PG_BACKFILL
:
534 m
= new MOSDPGBackfill
;
536 case MSG_OSD_PG_BACKFILL_REMOVE
:
537 m
= new MOSDPGBackfillRemove
;
539 case MSG_OSD_PG_PUSH
:
542 case MSG_OSD_PG_PULL
:
545 case MSG_OSD_PG_PUSH_REPLY
:
546 m
= new MOSDPGPushReply
;
548 case MSG_OSD_EC_WRITE
:
549 m
= new MOSDECSubOpWrite
;
551 case MSG_OSD_EC_WRITE_REPLY
:
552 m
= new MOSDECSubOpWriteReply
;
554 case MSG_OSD_EC_READ
:
555 m
= new MOSDECSubOpRead
;
557 case MSG_OSD_EC_READ_REPLY
:
558 m
= new MOSDECSubOpReadReply
;
564 case CEPH_MSG_AUTH_REPLY
:
568 case MSG_MON_GLOBAL_ID
:
569 m
= new MMonGlobalID
;
573 case CEPH_MSG_MON_SUBSCRIBE
:
574 m
= new MMonSubscribe
;
576 case CEPH_MSG_MON_SUBSCRIBE_ACK
:
577 m
= new MMonSubscribeAck
;
579 case CEPH_MSG_CLIENT_SESSION
:
580 m
= new MClientSession
;
582 case CEPH_MSG_CLIENT_RECONNECT
:
583 m
= new MClientReconnect
;
585 case CEPH_MSG_CLIENT_REQUEST
:
586 m
= new MClientRequest
;
588 case CEPH_MSG_CLIENT_REQUEST_FORWARD
:
589 m
= new MClientRequestForward
;
591 case CEPH_MSG_CLIENT_REPLY
:
592 m
= new MClientReply
;
594 case CEPH_MSG_CLIENT_CAPS
:
597 case CEPH_MSG_CLIENT_CAPRELEASE
:
598 m
= new MClientCapRelease
;
600 case CEPH_MSG_CLIENT_LEASE
:
601 m
= new MClientLease
;
603 case CEPH_MSG_CLIENT_SNAP
:
606 case CEPH_MSG_CLIENT_QUOTA
:
607 m
= new MClientQuota
;
611 case MSG_MDS_SLAVE_REQUEST
:
612 m
= new MMDSSlaveRequest
;
615 case CEPH_MSG_MDS_MAP
:
618 case CEPH_MSG_FS_MAP
:
621 case CEPH_MSG_FS_MAP_USER
:
627 case MSG_MDS_OFFLOAD_TARGETS
:
628 m
= new MMDSLoadTargets
;
630 case MSG_MDS_RESOLVE
:
633 case MSG_MDS_RESOLVEACK
:
634 m
= new MMDSResolveAck
;
636 case MSG_MDS_CACHEREJOIN
:
637 m
= new MMDSCacheRejoin
;
640 case MSG_MDS_DIRUPDATE
:
641 m
= new MDirUpdate();
644 case MSG_MDS_DISCOVER
:
647 case MSG_MDS_DISCOVERREPLY
:
648 m
= new MDiscoverReply();
651 case MSG_MDS_FINDINO
:
654 case MSG_MDS_FINDINOREPLY
:
655 m
= new MMDSFindInoReply
;
658 case MSG_MDS_OPENINO
:
661 case MSG_MDS_OPENINOREPLY
:
662 m
= new MMDSOpenInoReply
;
665 case MSG_MDS_FRAGMENTNOTIFY
:
666 m
= new MMDSFragmentNotify
;
669 case MSG_MDS_EXPORTDIRDISCOVER
:
670 m
= new MExportDirDiscover();
672 case MSG_MDS_EXPORTDIRDISCOVERACK
:
673 m
= new MExportDirDiscoverAck();
675 case MSG_MDS_EXPORTDIRCANCEL
:
676 m
= new MExportDirCancel();
679 case MSG_MDS_EXPORTDIR
:
682 case MSG_MDS_EXPORTDIRACK
:
683 m
= new MExportDirAck
;
685 case MSG_MDS_EXPORTDIRFINISH
:
686 m
= new MExportDirFinish
;
689 case MSG_MDS_EXPORTDIRNOTIFY
:
690 m
= new MExportDirNotify();
693 case MSG_MDS_EXPORTDIRNOTIFYACK
:
694 m
= new MExportDirNotifyAck();
697 case MSG_MDS_EXPORTDIRPREP
:
698 m
= new MExportDirPrep();
701 case MSG_MDS_EXPORTDIRPREPACK
:
702 m
= new MExportDirPrepAck();
705 case MSG_MDS_EXPORTCAPS
:
708 case MSG_MDS_EXPORTCAPSACK
:
709 m
= new MExportCapsAck
;
711 case MSG_MDS_GATHERCAPS
:
716 case MSG_MDS_DENTRYUNLINK
:
717 m
= new MDentryUnlink
;
719 case MSG_MDS_DENTRYLINK
:
723 case MSG_MDS_HEARTBEAT
:
724 m
= new MHeartbeat();
727 case MSG_MDS_CACHEEXPIRE
:
728 m
= new MCacheExpire();
731 case MSG_MDS_TABLE_REQUEST
:
732 m
= new MMDSTableRequest
;
735 /* case MSG_MDS_INODEUPDATE:
736 m = new MInodeUpdate();
740 case MSG_MDS_INODEFILECAPS
:
741 m
= new MInodeFileCaps();
749 m
= new MMgrBeacon();
752 case MSG_MON_MGR_REPORT
:
753 m
= new MMonMgrReport();
756 case MSG_SERVICE_MAP
:
757 m
= new MServiceMap();
765 m
= new MMgrDigest();
773 m
= new MMgrReport();
776 case MSG_MGR_CONFIGURE
:
777 m
= new MMgrConfigure();
781 m
= new MTimeCheck();
785 m
= new MMonHealth();
788 case MSG_MON_HEALTH_CHECKS
:
789 m
= new MMonHealthChecks();
792 #if defined(HAVE_XIO)
797 // -- simple messages without payload --
799 case CEPH_MSG_SHUTDOWN
:
800 m
= new MGenericMessage(type
);
// Reports a type this decoder does not recognise, then consults
// ms_die_on_bad_msg (the action taken on it is not visible in this listing).
805 ldout(cct
, 0) << "can't decode unknown message type " << type
<< " MSG_AUTH=" << CEPH_MSG_AUTH
<< dendl
;
806 if (cct
->_conf
->ms_die_on_bad_msg
)
814 // m->header.version, if non-zero, should be populated with the
815 // newest version of the encoding the code supports. If set, check
816 // it against compat_version.
817 if (m
->get_header().version
&&
818 m
->get_header().version
< header
.compat_version
) {
820 ldout(cct
, 0) << "will not decode message of type " << type
821 << " version " << header
.version
822 << " because compat_version " << header
.compat_version
823 << " > supported version " << m
->get_header().version
<< dendl
;
824 if (cct
->_conf
->ms_die_on_bad_msg
)
// Attach the connection and the wire header/footer, then hand the front and
// middle buffers to the message.
831 m
->set_connection(conn
);
832 m
->set_header(header
);
833 m
->set_footer(footer
);
834 m
->set_payload(front
);
835 m
->set_middle(middle
);
// A buffer::error caught here is logged, and the payload is hex-dumped at the
// configured ms_dump_corrupt_message_level.
841 catch (const buffer::error
&e
) {
843 lderr(cct
) << "failed to decode message of type " << type
844 << " v" << header
.version
845 << ": " << e
.what() << dendl
;
846 ldout(cct
, cct
->_conf
->ms_dump_corrupt_message_level
) << "dump: \n";
847 m
->get_payload().hexdump(*_dout
);
849 if (cct
->_conf
->ms_die_on_bad_msg
)
// Trace-encoding helper for this message.
//   bl       - destination buffer (the encode statement itself is not visible
//              in this listing)
//   features - feature bits; no use of it is visible here
// Visible statements: fetch the info pointer from the message's trace and
// define a zero-initialized blkin_trace_info named empty. Presumably one of
// the two is written to bl depending on whether p is set — TODO confirm
// against the full source.
860 void Message::encode_trace(bufferlist
&bl
, uint64_t features
) const
862 auto p
= trace
.get_info();
863 static const blkin_trace_info empty
= { 0, 0, 0 };
// Sets up this message's trace on the receive side.
//   p      - iterator over the encoded input (the statement that decodes into
//            info is not visible in this listing)
//   create - when true, a trace is started even if the first branch is not taken
// Visible flow: one branch (its condition is not shown) initializes the trace
// from info and records "decoded trace"; otherwise, when create is set or this
// messenger is an OSD with osd_blkin_trace_all enabled, a new trace is
// initialized and "created trace" is recorded. The tid and the source entity
// type/num are attached as key/values (their enclosing scope is not visible).
// Note: connection is dereferenced without a visible null check.
870 void Message::decode_trace(bufferlist::iterator
&p
, bool create
)
872 blkin_trace_info info
= {};
879 const auto msgr
= connection
->get_messenger();
880 const auto endpoint
= msgr
->get_trace_endpoint();
882 trace
.init(get_type_name(), endpoint
, &info
, true);
883 trace
.event("decoded trace");
884 } else if (create
|| (msgr
->get_myname().is_osd() &&
885 msgr
->cct
->_conf
->osd_blkin_trace_all
)) {
886 // create a trace even if we didn't get one on the wire
887 trace
.init(get_type_name(), endpoint
);
888 trace
.event("created trace");
890 trace
.keyval("tid", get_tid());
891 trace
.keyval("entity type", get_source().type_str());
892 trace
.keyval("entity num", get_source().num());
897 // This routine is not used for ordinary messages, but only when encapsulating a message
898 // for forwarding and routing. It's also used in a backward compatibility test, which only
899 // effectively tests backward compatibility for those functions. To avoid backward compatibility
900 // problems, we currently always encode and decode using the old footer format that doesn't
901 // allow for message authentication. Eventually we should fix that. PLR
// Serializes a whole message into a single buffer.
//   msg      - message to serialize; msg->encode() is called on it first
//   features - feature bits forwarded to msg->encode()
//   payload  - output buffer; receives, in order: header, old-format footer,
//              payload, middle, data
// The message is encoded with MSG_CRC_ALL, and the footer's CRCs and flags are
// copied into a ceph_msg_footer_old before being written.
// NOTE(review): the locals front, middle and data are declared but not
// referenced by any statement visible in this listing.
903 void encode_message(Message
*msg
, uint64_t features
, bufferlist
& payload
)
905 bufferlist front
, middle
, data
;
906 ceph_msg_footer_old old_footer
;
907 ceph_msg_footer footer
;
908 msg
->encode(features
, MSG_CRC_ALL
);
909 ::encode(msg
->get_header(), payload
);
911 // Here's where we switch to the old footer format. PLR
913 footer
= msg
->get_footer();
914 old_footer
.front_crc
= footer
.front_crc
;
915 old_footer
.middle_crc
= footer
.middle_crc
;
916 old_footer
.data_crc
= footer
.data_crc
;
917 old_footer
.flags
= footer
.flags
;
918 ::encode(old_footer
, payload
);
// The three sections follow the footer in the output buffer.
920 ::encode(msg
->get_payload(), payload
);
921 ::encode(msg
->get_middle(), payload
);
922 ::encode(msg
->get_data(), payload
);
925 // See above for somewhat bogus use of the old message footer. We switch to the current footer
926 // after decoding the old one so the other form of decode_message() doesn't have to change.
927 // We've slipped in a 0 signature at this point, so any signature checking after this will
// Overload of decode_message that takes a bufferlist iterator.
//   cct      - context forwarded to the eight-argument decode_message
//   crcflags - CRC selection mask, forwarded unchanged
//   p        - iterator over the encoded input (the decode statements that
//              consume it are not visible in this listing)
// Visible flow: the CRC fields of an old-format footer fo are copied into f,
// and the call is delegated to the eight-argument decode_message with a null
// connection. The declarations of h and f, and the statements that fill h, fo,
// fr, mi and da, are not visible here.
930 Message
*decode_message(CephContext
*cct
, int crcflags
, bufferlist::iterator
& p
)
933 ceph_msg_footer_old fo
;
935 bufferlist fr
, mi
, da
;
938 f
.front_crc
= fo
.front_crc
;
939 f
.middle_crc
= fo
.middle_crc
;
940 f
.data_crc
= fo
.data_crc
;
946 return decode_message(cct
, crcflags
, h
, f
, fr
, mi
, da
, nullptr);