1 // -*- mode:C++; tab-width:8; c-basic-offset:2; indent-tabs-mode:t -*-
2 // vim: ts=8 sw=2 smarttab
4 * Ceph - scalable distributed file system
6 * Copyright (C) 2013 Inktank
8 * This is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU Lesser General Public
10 * License version 2.1, as published by the Free Software
11 * Foundation. See file COPYING.
15 #include <boost/program_options/variables_map.hpp>
16 #include <boost/program_options/parsers.hpp>
17 #include <boost/scoped_ptr.hpp>
18 #include <boost/optional.hpp>
22 #include "common/Formatter.h"
23 #include "common/errno.h"
24 #include "common/ceph_argparse.h"
26 #include "global/global_init.h"
28 #include "os/ObjectStore.h"
29 #include "os/filestore/FileJournal.h"
30 #include "os/filestore/FileStore.h"
32 #include "os/FuseStore.h"
35 #include "osd/PGLog.h"
39 #include "json_spirit/json_spirit_value.h"
40 #include "json_spirit/json_spirit_reader.h"
42 #include "rebuild_mondb.h"
43 #include "ceph_objectstore_tool.h"
44 #include "include/compat.h"
45 #include "include/util.h"
// Short alias for the boost::program_options namespace.
47 namespace po
= boost::program_options
;
51 CompatSet
get_test_compat_set() {
52 CompatSet::FeatureSet ceph_osd_feature_compat
;
53 CompatSet::FeatureSet ceph_osd_feature_ro_compat
;
54 CompatSet::FeatureSet ceph_osd_feature_incompat
;
55 ceph_osd_feature_incompat
.insert(CEPH_OSD_FEATURE_INCOMPAT_BASE
);
56 ceph_osd_feature_incompat
.insert(CEPH_OSD_FEATURE_INCOMPAT_PGINFO
);
57 ceph_osd_feature_incompat
.insert(CEPH_OSD_FEATURE_INCOMPAT_OLOC
);
58 ceph_osd_feature_incompat
.insert(CEPH_OSD_FEATURE_INCOMPAT_LEC
);
59 ceph_osd_feature_incompat
.insert(CEPH_OSD_FEATURE_INCOMPAT_CATEGORIES
);
60 ceph_osd_feature_incompat
.insert(CEPH_OSD_FEATURE_INCOMPAT_HOBJECTPOOL
);
61 ceph_osd_feature_incompat
.insert(CEPH_OSD_FEATURE_INCOMPAT_BIGINFO
);
62 ceph_osd_feature_incompat
.insert(CEPH_OSD_FEATURE_INCOMPAT_LEVELDBINFO
);
63 ceph_osd_feature_incompat
.insert(CEPH_OSD_FEATURE_INCOMPAT_LEVELDBLOG
);
65 ceph_osd_feature_incompat
.insert(CEPH_OSD_FEATURE_INCOMPAT_SNAPMAPPER
);
66 ceph_osd_feature_incompat
.insert(CEPH_OSD_FEATURE_INCOMPAT_SHARDS
);
68 return CompatSet(ceph_osd_feature_compat
, ceph_osd_feature_ro_compat
,
69 ceph_osd_feature_incompat
);
// Chunk size in bytes (1 MiB): passed as the length to bufferlist::read_fd()
// in get_fd_data() and used as the initial read length in export_file().
73 const ssize_t max_read
= 1024 * 1024;
// Initial value of the global file_fd. Presumably a sentinel meaning
// "no file descriptor opened yet" -- TODO confirm against the code that
// assigns file_fd.
74 const int fd_none
= INT_MIN
;
78 struct action_on_object_t
{
79 virtual ~action_on_object_t() {}
80 virtual int call(ObjectStore
*store
, coll_t coll
, ghobject_t
&ghobj
, object_info_t
&oi
) = 0;
83 int _action_on_all_objects_in_pg(ObjectStore
*store
, coll_t coll
, action_on_object_t
&action
, bool debug
)
85 unsigned LIST_AT_A_TIME
= 100;
87 while (!next
.is_max()) {
88 vector
<ghobject_t
> list
;
89 int r
= store
->collection_list(
92 ghobject_t::get_max(),
97 cerr
<< "Error listing collection: " << coll
<< ", "
98 << cpp_strerror(r
) << std::endl
;
101 for (vector
<ghobject_t
>::iterator obj
= list
.begin();
104 if (obj
->is_pgmeta())
107 if (coll
!= coll_t::meta()) {
109 r
= store
->getattr(coll
, *obj
, OI_ATTR
, attr
);
111 cerr
<< "Error getting attr on : " << make_pair(coll
, *obj
) << ", "
112 << cpp_strerror(r
) << std::endl
;
115 bufferlist::iterator bp
= attr
.begin();
120 cerr
<< "Error getting attr on : " << make_pair(coll
, *obj
) << ", "
121 << cpp_strerror(r
) << std::endl
;
125 r
= action
.call(store
, coll
, *obj
, oi
);
133 int action_on_all_objects_in_pg(ObjectStore
*store
, string pgidstr
, action_on_object_t
&action
, bool debug
)
136 // Scan collections in case this is an ec pool but no shard specified
137 unsigned scanned
= 0;
139 vector
<coll_t
> colls_to_check
;
140 vector
<coll_t
> candidates
;
141 r
= store
->list_collections(candidates
);
143 cerr
<< "Error listing collections: " << cpp_strerror(r
) << std::endl
;
146 pgid
.parse(pgidstr
.c_str());
147 for (vector
<coll_t
>::iterator i
= candidates
.begin();
148 i
!= candidates
.end();
151 if (!i
->is_pg(&cand_pgid
))
154 // Take an exact match; a pgid given without a shard matches any shard of that pg
155 if (cand_pgid
== pgid
||
156 (pgid
.is_no_shard() && pgid
.pgid
== cand_pgid
.pgid
)) {
157 colls_to_check
.push_back(*i
);
162 cerr
<< colls_to_check
.size() << " pgs to scan" << std::endl
;
163 for (vector
<coll_t
>::iterator i
= colls_to_check
.begin();
164 i
!= colls_to_check
.end();
167 cerr
<< "Scanning " << *i
<< ", " << scanned
<< "/"
168 << colls_to_check
.size() << " completed" << std::endl
;
169 r
= _action_on_all_objects_in_pg(store
, *i
, action
, debug
);
176 int action_on_all_objects_in_exact_pg(ObjectStore
*store
, coll_t coll
, action_on_object_t
&action
, bool debug
)
178 int r
= _action_on_all_objects_in_pg(store
, coll
, action
, debug
);
182 int _action_on_all_objects(ObjectStore
*store
, action_on_object_t
&action
, bool debug
)
184 unsigned scanned
= 0;
186 vector
<coll_t
> colls_to_check
;
187 vector
<coll_t
> candidates
;
188 r
= store
->list_collections(candidates
);
190 cerr
<< "Error listing collections: " << cpp_strerror(r
) << std::endl
;
193 for (vector
<coll_t
>::iterator i
= candidates
.begin();
194 i
!= candidates
.end();
197 colls_to_check
.push_back(*i
);
202 cerr
<< colls_to_check
.size() << " pgs to scan" << std::endl
;
203 for (vector
<coll_t
>::iterator i
= colls_to_check
.begin();
204 i
!= colls_to_check
.end();
207 cerr
<< "Scanning " << *i
<< ", " << scanned
<< "/"
208 << colls_to_check
.size() << " completed" << std::endl
;
209 r
= _action_on_all_objects_in_pg(store
, *i
, action
, debug
);
216 int action_on_all_objects(ObjectStore
*store
, action_on_object_t
&action
, bool debug
)
218 int r
= _action_on_all_objects(store
, action
, debug
);
222 struct pgid_object_list
{
223 list
<pair
<coll_t
, ghobject_t
> > _objects
;
225 void insert(coll_t coll
, ghobject_t
&ghobj
) {
226 _objects
.push_back(make_pair(coll
, ghobj
));
229 void dump(Formatter
*f
, bool human_readable
) const {
231 f
->open_array_section("pgid_objects");
232 for (list
<pair
<coll_t
, ghobject_t
> >::const_iterator i
= _objects
.begin();
235 f
->open_array_section("pgid_object");
237 bool is_pg
= i
->first
.is_pg(&pgid
);
239 f
->dump_string("pgid", stringify(pgid
));
240 if (!is_pg
|| !human_readable
)
241 f
->dump_string("coll", i
->first
.to_str());
242 f
->open_object_section("ghobject");
246 if (human_readable
) {
251 if (!human_readable
) {
259 struct lookup_ghobject
: public action_on_object_t
{
260 pgid_object_list _objects
;
262 const boost::optional
<std::string
> _namespace
;
265 lookup_ghobject(const string
& name
, const boost::optional
<std::string
>& nspace
, bool need_snapset
= false) : _name(name
),
266 _namespace(nspace
), _need_snapset(need_snapset
) { }
268 int call(ObjectStore
*store
, coll_t coll
, ghobject_t
&ghobj
, object_info_t
&oi
) override
{
269 if (_need_snapset
&& !ghobj
.hobj
.has_snapset())
271 if ((_name
.length() == 0 || ghobj
.hobj
.oid
.name
== _name
) &&
272 (!_namespace
|| ghobj
.hobj
.nspace
== _namespace
))
273 _objects
.insert(coll
, ghobj
);
278 return _objects
._objects
.size();
281 pair
<coll_t
, ghobject_t
> pop() {
282 pair
<coll_t
, ghobject_t
> front
= _objects
._objects
.front();
283 _objects
._objects
.pop_front();
287 void dump(Formatter
*f
, bool human_readable
) const {
288 _objects
.dump(f
, human_readable
);
// Object id produced by OSD::make_infos_oid().
292 ghobject_t infos_oid
= OSD::make_infos_oid();
// Default-constructed here. NOTE(review): where this gets assigned is not
// visible in this part of the file -- confirm before relying on its value.
294 ghobject_t biginfo_oid
;
// File descriptor handed to write_section()/write_simple() by the export
// code; starts out as fd_none.
296 int file_fd
= fd_none
;
300 static int get_fd_data(int fd
, bufferlist
&bl
)
304 ssize_t bytes
= bl
.read_fd(fd
, max_read
);
306 cerr
<< "read_fd error " << cpp_strerror(bytes
) << std::endl
;
316 assert(bl
.length() == total
);
320 int get_log(ObjectStore
*fs
, __u8 struct_ver
,
321 coll_t coll
, spg_t pgid
, const pg_info_t
&info
,
322 PGLog::IndexedLog
&log
, pg_missing_t
&missing
)
326 assert(struct_ver
> 0);
327 PGLog::read_log_and_missing(fs
, coll
,
328 struct_ver
>= 8 ? coll
: coll_t::meta(),
329 struct_ver
>= 8 ? pgid
.make_pgmeta_oid() : log_oid
,
333 g_ceph_context
->_conf
->osd_ignore_stale_divergent_priors
);
334 if (debug
&& oss
.str().size())
335 cerr
<< oss
.str() << std::endl
;
337 catch (const buffer::error
&e
) {
338 cerr
<< "read_log_and_missing threw exception error " << e
.what() << std::endl
;
344 void dump_log(Formatter
*formatter
, ostream
&out
, pg_log_t
&log
,
345 pg_missing_t
&missing
)
347 formatter
->open_object_section("op_log");
348 formatter
->open_object_section("pg_log_t");
350 formatter
->close_section();
351 formatter
->flush(out
);
352 formatter
->open_object_section("pg_missing_t");
353 missing
.dump(formatter
);
354 formatter
->close_section();
355 formatter
->close_section();
356 formatter
->flush(out
);
359 //Based on part of OSD::load_pgs()
360 int finish_remove_pgs(ObjectStore
*store
)
363 int r
= store
->list_collections(ls
);
365 cerr
<< "finish_remove_pgs: failed to list pgs: " << cpp_strerror(r
)
370 for (vector
<coll_t
>::iterator it
= ls
.begin();
375 if (it
->is_temp(&pgid
) ||
376 (it
->is_pg(&pgid
) && PG::_has_removal_flag(store
, pgid
))) {
377 cout
<< "finish_remove_pgs " << *it
<< " removing " << pgid
<< std::endl
;
378 OSD::recursive_remove_collection(g_ceph_context
, store
, pgid
, *it
);
382 //cout << "finish_remove_pgs ignoring unrecognized " << *it << std::endl;
// Save the diagnostic state and silence -Wdeprecated-declarations for the
// code that follows (mark_pg_for_removal). -Wpragmas is ignored first,
// presumably so compilers that do not recognise the option stay quiet about
// the pragma itself -- TODO confirm.
387 #pragma GCC diagnostic ignored "-Wpragmas"
388 #pragma GCC diagnostic push
389 #pragma GCC diagnostic ignored "-Wdeprecated-declarations"
391 int mark_pg_for_removal(ObjectStore
*fs
, spg_t pgid
, ObjectStore::Transaction
*t
)
393 pg_info_t
info(pgid
);
395 ghobject_t
pgmeta_oid(info
.pgid
.make_pgmeta_oid());
398 epoch_t map_epoch
= 0;
399 int r
= PG::peek_map_epoch(fs
, pgid
, &map_epoch
, &bl
);
401 cerr
<< __func__
<< " warning: peek_map_epoch reported error" << std::endl
;
402 PastIntervals past_intervals
;
404 r
= PG::read_info(fs
, pgid
, coll
, bl
, info
, past_intervals
, struct_v
);
406 cerr
<< __func__
<< " error on read_info " << cpp_strerror(r
) << std::endl
;
409 assert(struct_v
>= 8);
411 cout
<< "setting '_remove' omap key" << std::endl
;
412 map
<string
,bufferlist
> values
;
413 ::encode((char)1, values
["_remove"]);
414 t
->omap_setkeys(coll
, pgmeta_oid
, values
);
// Restore the diagnostic state saved by the earlier "diagnostic push" and
// turn -Wpragmas back into a warning.
418 #pragma GCC diagnostic pop
419 #pragma GCC diagnostic warning "-Wpragmas"
421 int initiate_new_remove_pg(ObjectStore
*store
, spg_t r_pgid
,
422 ObjectStore::Sequencer
&osr
)
425 finish_remove_pgs(store
);
426 if (!store
->collection_exists(coll_t(r_pgid
)))
429 cout
<< " marking collection for removal" << std::endl
;
432 ObjectStore::Transaction rmt
;
433 int r
= mark_pg_for_removal(store
, r_pgid
, &rmt
);
437 store
->apply_transaction(&osr
, std::move(rmt
));
438 finish_remove_pgs(store
);
442 int write_info(ObjectStore::Transaction
&t
, epoch_t epoch
, pg_info_t
&info
,
443 PastIntervals
&past_intervals
)
446 coll_t
coll(info
.pgid
);
447 ghobject_t
pgmeta_oid(info
.pgid
.make_pgmeta_oid());
448 map
<string
,bufferlist
> km
;
449 pg_info_t last_written_info
;
450 int ret
= PG::_prepare_write_info(
457 if (ret
) cerr
<< "Failed to write info" << std::endl
;
458 t
.omap_setkeys(coll
, pgmeta_oid
, km
);
// Map from eversion_t to hobject_t. This is the type of the "divergent"
// argument of write_pg() and of the in/out/reject arguments of
// filter_divergent_priors().
462 typedef map
<eversion_t
, hobject_t
> divergent_priors_t
;
464 int write_pg(ObjectStore::Transaction
&t
, epoch_t epoch
, pg_info_t
&info
,
465 pg_log_t
&log
, PastIntervals
&past_intervals
,
466 divergent_priors_t
&divergent
,
467 pg_missing_t
&missing
)
469 int ret
= write_info(t
, epoch
, info
, past_intervals
);
472 coll_t
coll(info
.pgid
);
473 map
<string
,bufferlist
> km
;
475 if (!divergent
.empty()) {
476 assert(missing
.get_items().empty());
477 PGLog::write_log_and_missing_wo_missing(
478 t
, &km
, log
, coll
, info
.pgid
.make_pgmeta_oid(), divergent
, true);
480 pg_missing_tracker_t
tmissing(missing
);
481 bool rebuilt_missing_set_with_deletes
= missing
.may_include_deletes
;
482 PGLog::write_log_and_missing(
483 t
, &km
, log
, coll
, info
.pgid
.make_pgmeta_oid(), tmissing
, true,
484 &rebuilt_missing_set_with_deletes
);
486 t
.omap_setkeys(coll
, info
.pgid
.make_pgmeta_oid(), km
);
// Upper bound on the number of omap key/value pairs that get_omap_batch()
// copies out of the iterator per call.
490 const int OMAP_BATCH_SIZE
= 25;
491 void get_omap_batch(ObjectMap::ObjectMapIterator
&iter
, map
<string
, bufferlist
> &oset
)
494 for (int count
= OMAP_BATCH_SIZE
; count
&& iter
->valid(); --count
, iter
->next()) {
495 oset
.insert(pair
<string
, bufferlist
>(iter
->key(), iter
->value()));
499 int ObjectStoreTool::export_file(ObjectStore
*store
, coll_t cid
, ghobject_t
&obj
)
505 int ret
= store
->stat(cid
, obj
, &st
);
509 cerr
<< "Read " << obj
<< std::endl
;
513 cerr
<< "size=" << total
<< std::endl
;
515 object_begin
objb(obj
);
520 ret
= store
->getattr(cid
, obj
, OI_ATTR
, bp
);
522 cerr
<< "getattr failure object_info " << ret
<< std::endl
;
528 cerr
<< "object_info: " << objb
.oi
<< std::endl
;
531 // NOTE: we include whiteouts, lost, etc.
533 ret
= write_section(TYPE_OBJECT_BEGIN
, objb
, file_fd
);
538 bufferlist rawdatabl
;
541 mysize_t len
= max_read
;
545 ret
= store
->read(cid
, obj
, offset
, len
, rawdatabl
);
551 data_section
dblock(offset
, len
, rawdatabl
);
553 cerr
<< "data section offset=" << offset
<< " len=" << len
<< std::endl
;
558 ret
= write_section(TYPE_DATA
, dblock
, file_fd
);
562 //Handle attrs for this object
563 map
<string
,bufferptr
> aset
;
564 ret
= store
->getattrs(cid
, obj
, aset
);
566 attr_section
as(aset
);
567 ret
= write_section(TYPE_ATTRS
, as
, file_fd
);
572 cerr
<< "attrs size " << aset
.size() << std::endl
;
575 //Handle omap information
577 ret
= store
->omap_get_header(cid
, obj
, &hdrbuf
, true);
579 cerr
<< "omap_get_header: " << cpp_strerror(ret
) << std::endl
;
583 omap_hdr_section
ohs(hdrbuf
);
584 ret
= write_section(TYPE_OMAP_HDR
, ohs
, file_fd
);
588 ObjectMap::ObjectMapIterator iter
= store
->get_omap_iterator(cid
, obj
);
591 cerr
<< "omap_get_iterator: " << cpp_strerror(ret
) << std::endl
;
594 iter
->seek_to_first();
596 map
<string
, bufferlist
> out
;
597 while(iter
->valid()) {
598 get_omap_batch(iter
, out
);
600 if (out
.empty()) break;
602 mapcount
+= out
.size();
603 omap_section
oms(out
);
604 ret
= write_section(TYPE_OMAP
, oms
, file_fd
);
609 cerr
<< "omap map size " << mapcount
<< std::endl
;
611 ret
= write_simple(TYPE_OBJECT_END
, file_fd
);
618 int ObjectStoreTool::export_files(ObjectStore
*store
, coll_t coll
)
622 while (!next
.is_max()) {
623 vector
<ghobject_t
> objects
;
624 int r
= store
->collection_list(coll
, next
, ghobject_t::get_max(), 300,
628 for (vector
<ghobject_t
>::iterator i
= objects
.begin();
631 assert(!i
->hobj
.is_meta());
632 if (i
->is_pgmeta() || i
->hobj
.is_temp()) {
635 r
= export_file(store
, coll
, *i
);
643 int set_inc_osdmap(ObjectStore
*store
, epoch_t e
, bufferlist
& bl
, bool force
,
644 ObjectStore::Sequencer
&osr
) {
645 OSDMap::Incremental inc
;
646 bufferlist::iterator it
= bl
.begin();
650 } else if (e
!= inc
.epoch
) {
651 cerr
<< "incremental.epoch mismatch: "
652 << inc
.epoch
<< " != " << e
<< std::endl
;
654 cerr
<< "But will continue anyway." << std::endl
;
659 const ghobject_t inc_oid
= OSD::get_inc_osdmap_pobject_name(e
);
660 if (!store
->exists(coll_t::meta(), inc_oid
)) {
661 cerr
<< "inc-osdmap (" << inc_oid
<< ") does not exist." << std::endl
;
665 cout
<< "Creating a new epoch." << std::endl
;
669 ObjectStore::Transaction t
;
670 t
.write(coll_t::meta(), inc_oid
, 0, bl
.length(), bl
);
671 t
.truncate(coll_t::meta(), inc_oid
, bl
.length());
672 int ret
= store
->apply_transaction(&osr
, std::move(t
));
674 cerr
<< "Failed to set inc-osdmap (" << inc_oid
<< "): " << ret
<< std::endl
;
676 cout
<< "Wrote inc-osdmap." << inc
.epoch
<< std::endl
;
681 int get_inc_osdmap(ObjectStore
*store
, epoch_t e
, bufferlist
& bl
)
683 if (store
->read(coll_t::meta(),
684 OSD::get_inc_osdmap_pobject_name(e
),
691 int set_osdmap(ObjectStore
*store
, epoch_t e
, bufferlist
& bl
, bool force
,
692 ObjectStore::Sequencer
&osr
) {
696 e
= osdmap
.get_epoch();
697 } else if (e
!= osdmap
.get_epoch()) {
698 cerr
<< "osdmap.epoch mismatch: "
699 << e
<< " != " << osdmap
.get_epoch() << std::endl
;
701 cerr
<< "But will continue anyway." << std::endl
;
706 const ghobject_t full_oid
= OSD::get_osdmap_pobject_name(e
);
707 if (!store
->exists(coll_t::meta(), full_oid
)) {
708 cerr
<< "osdmap (" << full_oid
<< ") does not exist." << std::endl
;
712 cout
<< "Creating a new epoch." << std::endl
;
716 ObjectStore::Transaction t
;
717 t
.write(coll_t::meta(), full_oid
, 0, bl
.length(), bl
);
718 t
.truncate(coll_t::meta(), full_oid
, bl
.length());
719 int ret
= store
->apply_transaction(&osr
, std::move(t
));
721 cerr
<< "Failed to set osdmap (" << full_oid
<< "): " << ret
<< std::endl
;
723 cout
<< "Wrote osdmap." << osdmap
.get_epoch() << std::endl
;
728 int get_osdmap(ObjectStore
*store
, epoch_t e
, OSDMap
&osdmap
, bufferlist
& bl
)
730 bool found
= store
->read(
731 coll_t::meta(), OSD::get_osdmap_pobject_name(e
), 0, 0, bl
) >= 0;
733 cerr
<< "Can't find OSDMap for pg epoch " << e
<< std::endl
;
738 cerr
<< osdmap
<< std::endl
;
742 int add_osdmap(ObjectStore
*store
, metadata_section
&ms
)
744 return get_osdmap(store
, ms
.map_epoch
, ms
.osdmap
, ms
.osdmap_bl
);
747 int ObjectStoreTool::do_export(ObjectStore
*fs
, coll_t coll
, spg_t pgid
,
748 pg_info_t
&info
, epoch_t map_epoch
, __u8 struct_ver
,
749 const OSDSuperblock
& superblock
,
750 PastIntervals
&past_intervals
)
752 PGLog::IndexedLog log
;
753 pg_missing_t missing
;
755 cerr
<< "Exporting " << pgid
<< std::endl
;
757 int ret
= get_log(fs
, struct_ver
, coll
, pgid
, info
, log
, missing
);
762 Formatter
*formatter
= Formatter::create("json-pretty");
764 dump_log(formatter
, cerr
, log
, missing
);
769 pg_begin
pgb(pgid
, superblock
);
770 // Special case: for a replicated pg (no shard), don't require the importing OSD to have the shards feature
771 if (pgid
.is_no_shard()) {
772 pgb
.superblock
.compat_features
.incompat
.remove(CEPH_OSD_FEATURE_INCOMPAT_SHARDS
);
774 ret
= write_section(TYPE_PG_BEGIN
, pgb
, file_fd
);
778 // The metadata_section is now before files, so import can detect
779 // errors and abort without wasting time.
787 ret
= add_osdmap(fs
, ms
);
790 ret
= write_section(TYPE_PG_METADATA
, ms
, file_fd
);
794 ret
= export_files(fs
, coll
);
796 cerr
<< "export_files error " << ret
<< std::endl
;
800 ret
= write_simple(TYPE_PG_END
, file_fd
);
807 int dump_data(Formatter
*formatter
, bufferlist
&bl
)
809 bufferlist::iterator ebliter
= bl
.begin();
813 formatter
->open_object_section("data_block");
814 formatter
->dump_unsigned("offset", ds
.offset
);
815 formatter
->dump_unsigned("len", ds
.len
);
816 // XXX: Add option to dump data like od -cx ?
817 formatter
->close_section();
818 formatter
->flush(cout
);
822 int get_data(ObjectStore
*store
, coll_t coll
, ghobject_t hoid
,
823 ObjectStore::Transaction
*t
, bufferlist
&bl
)
825 bufferlist::iterator ebliter
= bl
.begin();
830 cerr
<< "\tdata: offset " << ds
.offset
<< " len " << ds
.len
<< std::endl
;
831 t
->write(coll
, hoid
, ds
.offset
, ds
.len
, ds
.databl
);
836 Formatter
*formatter
, ghobject_t hoid
,
839 bufferlist::iterator ebliter
= bl
.begin();
843 // This could have been handled in the caller if we didn't need to
844 // support exports that didn't include object_info_t in object_begin.
845 if (hoid
.generation
== ghobject_t::NO_GEN
&&
846 hoid
.hobj
.is_head()) {
847 map
<string
,bufferlist
>::iterator mi
= as
.data
.find(SS_ATTR
);
848 if (mi
!= as
.data
.end()) {
850 auto p
= mi
->second
.begin();
852 formatter
->open_object_section("snapset");
853 snapset
.dump(formatter
);
854 formatter
->close_section();
856 formatter
->open_object_section("snapset");
857 formatter
->dump_string("error", "missing SS_ATTR");
858 formatter
->close_section();
862 formatter
->open_object_section("attrs");
863 formatter
->open_array_section("user");
864 for (auto kv
: as
.data
) {
865 // Skip system attributes
866 if (('_' != kv
.first
.at(0)) || kv
.first
.size() == 1)
868 formatter
->open_object_section("user_attr");
869 formatter
->dump_string("name", kv
.first
.substr(1));
871 formatter
->dump_string("value", cleanbin(kv
.second
, b64
));
872 formatter
->dump_bool("Base64", b64
);
873 formatter
->close_section();
875 formatter
->close_section();
876 formatter
->open_array_section("system");
877 for (auto kv
: as
.data
) {
878 // Skip user attributes
879 if (('_' == kv
.first
.at(0)) && kv
.first
.size() != 1)
881 formatter
->open_object_section("sys_attr");
882 formatter
->dump_string("name", kv
.first
);
883 formatter
->close_section();
885 formatter
->close_section();
886 formatter
->close_section();
887 formatter
->flush(cout
);
893 ObjectStore
*store
, coll_t coll
, ghobject_t hoid
,
894 ObjectStore::Transaction
*t
, bufferlist
&bl
,
895 OSDriver
&driver
, SnapMapper
&snap_mapper
)
897 bufferlist::iterator ebliter
= bl
.begin();
902 cerr
<< "\tattrs: len " << as
.data
.size() << std::endl
;
903 t
->setattrs(coll
, hoid
, as
.data
);
905 // This could have been handled in the caller if we didn't need to
906 // support exports that didn't include object_info_t in object_begin.
907 if (hoid
.generation
== ghobject_t::NO_GEN
) {
908 if (hoid
.hobj
.snap
< CEPH_MAXSNAP
) {
909 map
<string
,bufferlist
>::iterator mi
= as
.data
.find(OI_ATTR
);
910 if (mi
!= as
.data
.end()) {
911 object_info_t
oi(mi
->second
);
914 cerr
<< "object_info " << oi
<< std::endl
;
916 OSDriver::OSTransaction
_t(driver
.get_transaction(t
));
917 set
<snapid_t
> oi_snaps(oi
.legacy_snaps
.begin(), oi
.legacy_snaps
.end());
918 if (!oi_snaps
.empty()) {
920 cerr
<< "\tsetting legacy snaps " << oi_snaps
<< std::endl
;
921 snap_mapper
.add_oid(hoid
.hobj
, oi_snaps
, &_t
);
925 if (hoid
.hobj
.is_head()) {
926 map
<string
,bufferlist
>::iterator mi
= as
.data
.find(SS_ATTR
);
927 if (mi
!= as
.data
.end()) {
929 auto p
= mi
->second
.begin();
931 cout
<< "snapset " << snapset
<< std::endl
;
932 if (!snapset
.is_legacy()) {
933 for (auto& p
: snapset
.clone_snaps
) {
934 ghobject_t clone
= hoid
;
935 clone
.hobj
.snap
= p
.first
;
936 set
<snapid_t
> snaps(p
.second
.begin(), p
.second
.end());
937 if (!store
->exists(coll
, clone
)) {
938 // no clone, skip. this is probably a cache pool. this works
939 // because we use a separate transaction per object and clones
940 // come before head in the archive.
942 cerr
<< "\tskipping missing " << clone
<< " (snaps "
943 << snaps
<< ")" << std::endl
;
947 cerr
<< "\tsetting " << clone
.hobj
<< " snaps " << snaps
949 OSDriver::OSTransaction
_t(driver
.get_transaction(t
));
950 assert(!snaps
.empty());
951 snap_mapper
.add_oid(clone
.hobj
, snaps
, &_t
);
955 cerr
<< "missing SS_ATTR on " << hoid
<< std::endl
;
964 int dump_omap_hdr(Formatter
*formatter
, bufferlist
&bl
)
966 bufferlist::iterator ebliter
= bl
.begin();
970 formatter
->open_object_section("omap_header");
971 formatter
->dump_string("value", string(oh
.hdr
.c_str(), oh
.hdr
.length()));
972 formatter
->close_section();
973 formatter
->flush(cout
);
977 int get_omap_hdr(ObjectStore
*store
, coll_t coll
, ghobject_t hoid
,
978 ObjectStore::Transaction
*t
, bufferlist
&bl
)
980 bufferlist::iterator ebliter
= bl
.begin();
985 cerr
<< "\tomap header: " << string(oh
.hdr
.c_str(), oh
.hdr
.length())
987 t
->omap_setheader(coll
, hoid
, oh
.hdr
);
991 int dump_omap(Formatter
*formatter
, bufferlist
&bl
)
993 bufferlist::iterator ebliter
= bl
.begin();
997 formatter
->open_object_section("omaps");
998 formatter
->dump_unsigned("count", os
.omap
.size());
999 formatter
->open_array_section("data");
1000 for (auto o
: os
.omap
) {
1001 formatter
->open_object_section("omap");
1002 formatter
->dump_string("name", o
.first
);
1004 formatter
->dump_string("value", cleanbin(o
.second
, b64
));
1005 formatter
->dump_bool("Base64", b64
);
1006 formatter
->close_section();
1008 formatter
->close_section();
1009 formatter
->close_section();
1010 formatter
->flush(cout
);
1014 int get_omap(ObjectStore
*store
, coll_t coll
, ghobject_t hoid
,
1015 ObjectStore::Transaction
*t
, bufferlist
&bl
)
1017 bufferlist::iterator ebliter
= bl
.begin();
1022 cerr
<< "\tomap: size " << os
.omap
.size() << std::endl
;
1023 t
->omap_setkeys(coll
, hoid
, os
.omap
);
1027 int ObjectStoreTool::dump_object(Formatter
*formatter
,
1030 bufferlist::iterator ebliter
= bl
.begin();
1034 if (ob
.hoid
.hobj
.is_temp()) {
1035 cerr
<< "ERROR: Export contains temporary object '" << ob
.hoid
<< "'" << std::endl
;
1039 formatter
->open_object_section("object");
1040 formatter
->open_object_section("oid");
1041 ob
.hoid
.dump(formatter
);
1042 formatter
->close_section();
1043 formatter
->open_object_section("object_info");
1044 ob
.oi
.dump(formatter
);
1045 formatter
->close_section();
1051 int ret
= read_section(&type
, &ebl
);
1055 //cout << "\tdo_object: Section type " << hex << type << dec << std::endl;
1056 //cout << "\t\tsection size " << ebl.length() << std::endl;
1057 if (type
>= END_OF_TYPES
) {
1058 cout
<< "Skipping unknown object section type" << std::endl
;
1064 ret
= dump_data(formatter
, ebl
);
1065 if (ret
) return ret
;
1069 ret
= dump_attrs(formatter
, ob
.hoid
, ebl
);
1070 if (ret
) return ret
;
1074 ret
= dump_omap_hdr(formatter
, ebl
);
1075 if (ret
) return ret
;
1079 ret
= dump_omap(formatter
, ebl
);
1080 if (ret
) return ret
;
1082 case TYPE_OBJECT_END
:
1086 cerr
<< "Unknown section type " << type
<< std::endl
;
1090 formatter
->close_section();
1094 int ObjectStoreTool::get_object(ObjectStore
*store
, coll_t coll
,
1095 bufferlist
&bl
, OSDMap
&curmap
,
1096 bool *skipped_objects
,
1097 ObjectStore::Sequencer
&osr
)
1099 ObjectStore::Transaction tran
;
1100 ObjectStore::Transaction
*t
= &tran
;
1101 bufferlist::iterator ebliter
= bl
.begin();
1107 OSD::make_snapmapper_oid());
1109 coll
.is_pg_prefix(&pg
);
1110 SnapMapper
mapper(g_ceph_context
, &driver
, 0, 0, 0, pg
.shard
);
1112 if (ob
.hoid
.hobj
.is_temp()) {
1113 cerr
<< "ERROR: Export contains temporary object '" << ob
.hoid
<< "'" << std::endl
;
1116 assert(g_ceph_context
);
1117 if (ob
.hoid
.hobj
.nspace
!= g_ceph_context
->_conf
->osd_hit_set_namespace
) {
1118 object_t oid
= ob
.hoid
.hobj
.oid
;
1119 object_locator_t
loc(ob
.hoid
.hobj
);
1120 pg_t raw_pgid
= curmap
.object_locator_to_pg(oid
, loc
);
1121 pg_t pgid
= curmap
.raw_pg_to_pg(raw_pgid
);
1124 if (coll
.is_pg(&coll_pgid
) == false) {
1125 cerr
<< "INTERNAL ERROR: Bad collection during import" << std::endl
;
1128 if (coll_pgid
.shard
!= ob
.hoid
.shard_id
) {
1129 cerr
<< "INTERNAL ERROR: Importing shard " << coll_pgid
.shard
1130 << " but object shard is " << ob
.hoid
.shard_id
<< std::endl
;
1134 if (coll_pgid
.pgid
!= pgid
) {
1135 cerr
<< "Skipping object '" << ob
.hoid
<< "' which belongs in pg " << pgid
<< std::endl
;
1136 *skipped_objects
= true;
1143 t
->touch(coll
, ob
.hoid
);
1145 cout
<< "Write " << ob
.hoid
<< std::endl
;
1151 int ret
= read_section(&type
, &ebl
);
1155 //cout << "\tdo_object: Section type " << hex << type << dec << std::endl;
1156 //cout << "\t\tsection size " << ebl.length() << std::endl;
1157 if (type
>= END_OF_TYPES
) {
1158 cout
<< "Skipping unknown object section type" << std::endl
;
1164 ret
= get_data(store
, coll
, ob
.hoid
, t
, ebl
);
1165 if (ret
) return ret
;
1169 ret
= get_attrs(store
, coll
, ob
.hoid
, t
, ebl
, driver
, mapper
);
1170 if (ret
) return ret
;
1174 ret
= get_omap_hdr(store
, coll
, ob
.hoid
, t
, ebl
);
1175 if (ret
) return ret
;
1179 ret
= get_omap(store
, coll
, ob
.hoid
, t
, ebl
);
1180 if (ret
) return ret
;
1182 case TYPE_OBJECT_END
:
1186 cerr
<< "Unknown section type " << type
<< std::endl
;
1191 store
->apply_transaction(&osr
, std::move(*t
));
1195 int dump_pg_metadata(Formatter
*formatter
, bufferlist
&bl
, metadata_section
&ms
)
1197 bufferlist::iterator ebliter
= bl
.begin();
1200 formatter
->open_object_section("metadata_section");
1202 formatter
->dump_unsigned("pg_disk_version", (int)ms
.struct_ver
);
1203 formatter
->dump_unsigned("map_epoch", ms
.map_epoch
);
1205 formatter
->open_object_section("OSDMap");
1206 ms
.osdmap
.dump(formatter
);
1207 formatter
->close_section();
1208 formatter
->flush(cout
);
1211 formatter
->open_object_section("info");
1212 ms
.info
.dump(formatter
);
1213 formatter
->close_section();
1214 formatter
->flush(cout
);
1216 formatter
->open_object_section("log");
1217 ms
.log
.dump(formatter
);
1218 formatter
->close_section();
1219 formatter
->flush(cout
);
1221 formatter
->open_object_section("pg_missing_t");
1222 ms
.missing
.dump(formatter
);
1223 formatter
->close_section();
1225 // XXX: ms.past_intervals?
1227 formatter
->close_section();
1228 formatter
->flush(cout
);
1230 if (ms
.osdmap
.get_epoch() != 0 && ms
.map_epoch
!= ms
.osdmap
.get_epoch()) {
1231 cerr
<< "FATAL: Invalid OSDMap epoch in export data" << std::endl
;
1238 int get_pg_metadata(ObjectStore
*store
, bufferlist
&bl
, metadata_section
&ms
,
1239 const OSDSuperblock
& sb
, OSDMap
& curmap
, spg_t pgid
)
1241 bufferlist::iterator ebliter
= bl
.begin();
1243 spg_t old_pgid
= ms
.info
.pgid
;
1244 ms
.info
.pgid
= pgid
;
1247 Formatter
*formatter
= new JSONFormatter(true);
1248 cout
<< "export pgid " << old_pgid
<< std::endl
;
1249 cout
<< "struct_v " << (int)ms
.struct_ver
<< std::endl
;
1250 cout
<< "map epoch " << ms
.map_epoch
<< std::endl
;
1252 formatter
->open_object_section("importing OSDMap");
1253 ms
.osdmap
.dump(formatter
);
1254 formatter
->close_section();
1255 formatter
->flush(cout
);
1258 cout
<< "osd current epoch " << sb
.current_epoch
<< std::endl
;
1259 formatter
->open_object_section("current OSDMap");
1260 curmap
.dump(formatter
);
1261 formatter
->close_section();
1262 formatter
->flush(cout
);
1265 formatter
->open_object_section("info");
1266 ms
.info
.dump(formatter
);
1267 formatter
->close_section();
1268 formatter
->flush(cout
);
1271 formatter
->open_object_section("log");
1272 ms
.log
.dump(formatter
);
1273 formatter
->close_section();
1274 formatter
->flush(cout
);
1277 formatter
->flush(cout
);
1281 if (ms
.osdmap
.get_epoch() != 0 && ms
.map_epoch
!= ms
.osdmap
.get_epoch()) {
1282 cerr
<< "FATAL: Invalid OSDMap epoch in export data" << std::endl
;
1286 if (ms
.map_epoch
> sb
.current_epoch
) {
1287 cerr
<< "ERROR: Export PG's map_epoch " << ms
.map_epoch
<< " > OSD's epoch " << sb
.current_epoch
<< std::endl
;
1288 cerr
<< "The OSD you are using is older than the exported PG" << std::endl
;
1289 cerr
<< "Either use another OSD or join selected OSD to cluster to update it first" << std::endl
;
1293 // Pool verified to exist for call to get_pg_num().
1294 unsigned new_pg_num
= curmap
.get_pg_num(pgid
.pgid
.pool());
1296 if (pgid
.pgid
.ps() >= new_pg_num
) {
1297 cerr
<< "Illegal pgid, the seed is larger than current pg_num" << std::endl
;
1301 // Old exports didn't include OSDMap, see if we have a copy locally
1302 if (ms
.osdmap
.get_epoch() == 0) {
1304 bufferlist findmap_bl
;
1305 int ret
= get_osdmap(store
, ms
.map_epoch
, findmap
, findmap_bl
);
1307 ms
.osdmap
.deepish_copy_from(findmap
);
1309 cerr
<< "WARNING: No OSDMap in old export,"
1310 " some objects may be ignored due to a split" << std::endl
;
1314 // Make sure old_pg_num is 0 in the unusual case that OSDMap not in export
1315 // nor can we find a local copy.
1316 unsigned old_pg_num
= 0;
1317 if (ms
.osdmap
.get_epoch() != 0)
1318 old_pg_num
= ms
.osdmap
.get_pg_num(pgid
.pgid
.pool());
1321 cerr
<< "old_pg_num " << old_pg_num
<< std::endl
;
1322 cerr
<< "new_pg_num " << new_pg_num
<< std::endl
;
1323 cerr
<< ms
.osdmap
<< std::endl
;
1324 cerr
<< curmap
<< std::endl
;
1327 // If we have managed to have a good OSDMap we can do these checks
1329 if (old_pgid
.pgid
.ps() >= old_pg_num
) {
1330 cerr
<< "FATAL: pgid invalid for original map epoch" << std::endl
;
1333 if (pgid
.pgid
.ps() >= old_pg_num
) {
1334 cout
<< "NOTICE: Post split pgid specified" << std::endl
;
1337 if (parent
.is_split(old_pg_num
, new_pg_num
, NULL
)) {
1338 cerr
<< "WARNING: Split occurred, some objects may be ignored" << std::endl
;
1344 cerr
<< "Import pgid " << ms
.info
.pgid
<< std::endl
;
1345 cerr
<< "Previous past_intervals " << ms
.past_intervals
<< std::endl
;
1346 cerr
<< "history.same_interval_since " << ms
.info
.history
.same_interval_since
<< std::endl
;
1349 // Let osd recompute past_intervals and same_interval_since
1350 ms
.past_intervals
.clear();
1351 ms
.info
.history
.same_interval_since
= 0;
1354 cerr
<< "Changing pg epoch " << ms
.map_epoch
<< " to " << sb
.current_epoch
<< std::endl
;
1356 ms
.map_epoch
= sb
.current_epoch
;
// Walks every divergent prior in `in`.  Entries are first tested with
// is_temp(); entries whose namespace differs from hit_set_namespace are
// mapped to a pg through curmap (object_locator_to_pg + raw_pg_to_pg) and
// compared with import_pgid.pgid.
// NOTE(review): the statements that fill `out` and `reject` are not visible
// in this excerpt -- confirm which branch feeds which container.
1361 // out: pg_log_t that only has entries that apply to import_pgid using curmap
1362 // reject: Entries rejected from "in" are in the reject.log. Other fields not set.
1363 void filter_divergent_priors(spg_t import_pgid
, const OSDMap
&curmap
,
1364 const string
&hit_set_namespace
, const divergent_priors_t
&in
,
1365 divergent_priors_t
&out
, divergent_priors_t
&reject
)
1370 for (divergent_priors_t::const_iterator i
= in
.begin();
1371 i
!= in
.end(); ++i
) {
1373 // Reject divergent priors for temporary objects
1374 if (i
->second
.is_temp()) {
1379 if (i
->second
.nspace
!= hit_set_namespace
) {
1380 object_t oid
= i
->second
.oid
;
1381 object_locator_t
loc(i
->second
);
1382 pg_t raw_pgid
= curmap
.object_locator_to_pg(oid
, loc
);
1383 pg_t pgid
= curmap
.raw_pg_to_pg(raw_pgid
);
1385 if (import_pgid
.pgid
== pgid
) {
// Dumps the contents of an export stream through `formatter`.
// Visible steps: read_super() followed by magic and version validation, a
// first section that must be TYPE_PG_BEGIN (pool exports are refused), then
// pgid / cluster_fsid / features emitted as strings.  Later sections are
// handed to dump_object() (inside an "objects" array opened on the first
// object) or dump_pg_metadata().  A missing metadata section is reported.
// The first non-zero result of dump_object()/dump_pg_metadata() is returned.
// The formatter is flushed to cout at the end.
1396 int ObjectStoreTool::dump_import(Formatter
*formatter
)
1400 PGLog::IndexedLog log
;
1401 //bool skipped_objects = false;
1403 int ret
= read_super();
1407 if (sh
.magic
!= super_header::super_magic
) {
1408 cerr
<< "Invalid magic number" << std::endl
;
1412 if (sh
.version
> super_header::super_ver
) {
1413 cerr
<< "Can't handle export format version=" << sh
.version
<< std::endl
;
1417 formatter
->open_object_section("Export");
1419 //First section must be TYPE_PG_BEGIN
1421 ret
= read_section(&type
, &ebl
);
1424 if (type
== TYPE_POOL_BEGIN
) {
1425 cerr
<< "Dump of pool exports not supported" << std::endl
;
1427 } else if (type
!= TYPE_PG_BEGIN
) {
1428 cerr
<< "Invalid first section type " << std::to_string(type
) << std::endl
;
1432 bufferlist::iterator ebliter
= ebl
.begin();
1434 pgb
.decode(ebliter
);
1435 spg_t pgid
= pgb
.pgid
;
1437 formatter
->dump_string("pgid", stringify(pgid
));
1438 formatter
->dump_string("cluster_fsid", stringify(pgb
.superblock
.cluster_fsid
));
1439 formatter
->dump_string("features", stringify(pgb
.superblock
.compat_features
));
1442 bool found_metadata
= false;
1443 metadata_section ms
;
1444 bool objects_started
= false;
1446 ret
= read_section(&type
, &ebl
);
1451 cerr
<< "dump_import: Section type " << std::to_string(type
) << std::endl
;
1453 if (type
>= END_OF_TYPES
) {
1454 cerr
<< "Skipping unknown section type" << std::endl
;
1458 case TYPE_OBJECT_BEGIN
:
1459 if (!objects_started
) {
1460 formatter
->open_array_section("objects");
1461 objects_started
= true;
1463 ret
= dump_object(formatter
, ebl
);
1464 if (ret
) return ret
;
1466 case TYPE_PG_METADATA
:
1467 if (objects_started
)
1468 cerr
<< "WARNING: metadata_section out of order" << std::endl
;
1469 ret
= dump_pg_metadata(formatter
, ebl
, ms
);
1470 if (ret
) return ret
;
1471 found_metadata
= true;
1474 if (objects_started
) {
1475 formatter
->close_section();
1480 cerr
<< "Unknown section type " << std::to_string(type
) << std::endl
;
1485 if (!found_metadata
) {
1486 cerr
<< "Missing metadata section" << std::endl
;
1490 formatter
->close_section();
1491 formatter
->flush(cout
);
// Imports a PG export stream into `store`.
//   sb      - superblock of the target OSD; its cluster_fsid, compat_features
//             and current_epoch are checked against / used with the export.
//   force   - NOTE(review): presumably lets the import continue despite
//             incompatible features (see the --force comment below); the
//             line that tests it is not visible here -- confirm.
//   pgidstr - optional pgid override.  It must name the same pool as the
//             export and may not contradict the exported shard; a missing
//             shard is filled in from the export.
//   osr     - sequencer handed to every apply_transaction() call.
// While the import runs the pgmeta object carries a "_remove" omap key; the
// key is removed again once everything has been written.
// Positive return values (10, 11) are meant to be used as exit statuses.
1496 int ObjectStoreTool::do_import(ObjectStore
*store
, OSDSuperblock
& sb
,
1497 bool force
, std::string pgidstr
,
1498 ObjectStore::Sequencer
&osr
)
1502 PGLog::IndexedLog log
;
1503 bool skipped_objects
= false;
1506 finish_remove_pgs(store
);
1508 int ret
= read_super();
1512 if (sh
.magic
!= super_header::super_magic
) {
1513 cerr
<< "Invalid magic number" << std::endl
;
1517 if (sh
.version
> super_header::super_ver
) {
1518 cerr
<< "Can't handle export format version=" << sh
.version
<< std::endl
;
1522 //First section must be TYPE_PG_BEGIN
1524 ret
= read_section(&type
, &ebl
);
1527 if (type
== TYPE_POOL_BEGIN
) {
1528 cerr
<< "Pool exports cannot be imported into a PG" << std::endl
;
1530 } else if (type
!= TYPE_PG_BEGIN
) {
1531 cerr
<< "Invalid first section type " << std::to_string(type
) << std::endl
;
1535 bufferlist::iterator ebliter
= ebl
.begin();
1537 pgb
.decode(ebliter
);
1538 spg_t pgid
= pgb
.pgid
;
1539 spg_t orig_pgid
= pgid
;
1541 if (pgidstr
.length()) {
1544 bool ok
= user_pgid
.parse(pgidstr
.c_str());
1545 // This succeeded in main() already
1547 if (pgid
!= user_pgid
) {
1548 if (pgid
.pool() != user_pgid
.pool()) {
1549 cerr
<< "Can't specify a different pgid pool, must be " << pgid
.pool() << std::endl
;
1552 if (pgid
.is_no_shard() && !user_pgid
.is_no_shard()) {
1553 cerr
<< "Can't specify a sharded pgid with a non-sharded export" << std::endl
;
1556 // Get shard from export information if not specified
1557 if (!pgid
.is_no_shard() && user_pgid
.is_no_shard()) {
1558 user_pgid
.shard
= pgid
.shard
;
1560 if (pgid
.shard
!= user_pgid
.shard
) {
1561 cerr
<< "Can't specify a different shard, must be " << pgid
.shard
<< std::endl
;
1568 if (!pgb
.superblock
.cluster_fsid
.is_zero()
1569 && pgb
.superblock
.cluster_fsid
!= sb
.cluster_fsid
) {
1570 cerr
<< "Export came from different cluster with fsid "
1571 << pgb
.superblock
.cluster_fsid
<< std::endl
;
1576 cerr
<< "Exported features: " << pgb
.superblock
.compat_features
<< std::endl
;
1579 // Special case: Old export has SHARDS incompat feature on replicated pg, remove it
1580 if (pgid
.is_no_shard())
1581 pgb
.superblock
.compat_features
.incompat
.remove(CEPH_OSD_FEATURE_INCOMPAT_SHARDS
);
1583 if (sb
.compat_features
.compare(pgb
.superblock
.compat_features
) == -1) {
1584 CompatSet unsupported
= sb
.compat_features
.unsupported(pgb
.superblock
.compat_features
);
1586 cerr
<< "Export has incompatible features set " << unsupported
<< std::endl
;
1588 // Let them import if they specify the --force option
1590 return 11; // Positive return means exit status
1593 // Don't import if pool no longer exists
1596 ret
= get_osdmap(store
, sb
.current_epoch
, curmap
, bl
);
1598 cerr
<< "Can't find local OSDMap" << std::endl
;
1601 if (!curmap
.have_pg_pool(pgid
.pgid
.m_pool
)) {
1602 cerr
<< "Pool " << pgid
.pgid
.m_pool
<< " no longer exists" << std::endl
;
1603 // Special exit code for this error, used by test code
1604 return 10; // Positive return means exit status
1607 ghobject_t pgmeta_oid
= pgid
.make_pgmeta_oid();
1608 log_oid
= OSD::make_pg_log_oid(pgid
);
1609 biginfo_oid
= OSD::make_pg_biginfo_oid(pgid
);
1611 //Check for PG already present.
1613 if (store
->collection_exists(coll
)) {
1614 cerr
<< "pgid " << pgid
<< " already exists" << std::endl
;
1619 ObjectStore::Transaction t
;
1620 PG::_create(t
, pgid
,
1621 pgid
.get_split_bits(curmap
.get_pg_pool(pgid
.pool())->get_pg_num()));
1622 PG::_init(t
, pgid
, NULL
);
1624 // mark this coll for removal until we're done
1625 map
<string
,bufferlist
> values
;
1626 ::encode((char)1, values
["_remove"]);
1627 t
.omap_setkeys(coll
, pgid
.make_pgmeta_oid(), values
);
1629 store
->apply_transaction(&osr
, std::move(t
));
1632 cout
<< "Importing pgid " << pgid
;
1633 if (orig_pgid
!= pgid
) {
1634 cout
<< " exported as " << orig_pgid
;
1639 bool found_metadata
= false;
1640 metadata_section ms
;
1642 ret
= read_section(&type
, &ebl
);
1647 cout
<< __func__
<< ": Section type " << std::to_string(type
) << std::endl
;
1649 if (type
>= END_OF_TYPES
) {
1650 cout
<< "Skipping unknown section type" << std::endl
;
1654 case TYPE_OBJECT_BEGIN
:
1655 ret
= get_object(store
, coll
, ebl
, curmap
, &skipped_objects
, osr
);
1656 if (ret
) return ret
;
1658 case TYPE_PG_METADATA
:
1659 ret
= get_pg_metadata(store
, ebl
, ms
, sb
, curmap
, pgid
);
1660 if (ret
) return ret
;
1661 found_metadata
= true;
1667 cerr
<< "Unknown section type " << std::to_string(type
) << std::endl
;
1672 if (!found_metadata
) {
1673 cerr
<< "Missing metadata section" << std::endl
;
1677 ObjectStore::Transaction t
;
1679 pg_log_t newlog
, reject
;
1680 pg_log_t::filter_log(pgid
, curmap
, g_ceph_context
->_conf
->osd_hit_set_namespace
,
1681 ms
.log
, newlog
, reject
);
1683 for (list
<pg_log_entry_t
>::iterator i
= newlog
.log
.begin();
1684 i
!= newlog
.log
.end(); ++i
)
1685 cerr
<< "Keeping log entry " << *i
<< std::endl
;
1686 for (list
<pg_log_entry_t
>::iterator i
= reject
.log
.begin();
1687 i
!= reject
.log
.end(); ++i
)
1688 cerr
<< "Skipping log entry " << *i
<< std::endl
;
1691 divergent_priors_t newdp
, rejectdp
;
1692 filter_divergent_priors(pgid
, curmap
, g_ceph_context
->_conf
->osd_hit_set_namespace
,
1693 ms
.divergent_priors
, newdp
, rejectdp
);
1694 ms
.divergent_priors
= newdp
;
1696 for (divergent_priors_t::iterator i
= newdp
.begin();
1697 i
!= newdp
.end(); ++i
)
1698 cerr
<< "Keeping divergent_prior " << *i
<< std::endl
;
1699 for (divergent_priors_t::iterator i
= rejectdp
.begin();
1700 i
!= rejectdp
.end(); ++i
)
1701 cerr
<< "Skipping divergent_prior " << *i
<< std::endl
;
1704 ms
.missing
.filter_objects([&](const hobject_t
&obj
) {
1705 if (obj
.nspace
== g_ceph_context
->_conf
->osd_hit_set_namespace
)
1707 assert(!obj
.is_temp());
1708 object_t oid
= obj
.oid
;
1709 object_locator_t
loc(obj
);
1710 pg_t raw_pgid
= curmap
.object_locator_to_pg(oid
, loc
);
1711 pg_t _pgid
= curmap
.raw_pg_to_pg(raw_pgid
);
1713 return pgid
.pgid
!= _pgid
;
1718 pg_missing_t missing
;
1719 Formatter
*formatter
= Formatter::create("json-pretty");
1720 dump_log(formatter
, cerr
, newlog
, ms
.missing
);
1724 // Just like a split invalidate stats since the object count is changed
1725 if (skipped_objects
)
1726 ms
.info
.stats
.stats_invalid
= true;
1734 ms
.divergent_priors
,
1736 if (ret
) return ret
;
1739 // done, clear removal flag
1741 cerr
<< "done, clearing removal flag" << std::endl
;
1745 remove
.insert("_remove");
1746 t
.omap_rmkeys(coll
, pgid
.make_pgmeta_oid(), remove
);
1747 store
->apply_transaction(&osr
, std::move(t
));
// Collects objects through a lookup_ghobject built from `object`, `nspace`
// and `head`, then dumps the result with `formatter` and flushes it to cout.
// A non-empty pgidstr selects action_on_all_objects_in_pg();
// action_on_all_objects() is the other visible call (NOTE(review): presumably
// the else branch -- the connecting line is not visible here).
1753 int do_list(ObjectStore
*store
, string pgidstr
, string object
, boost::optional
<std::string
> nspace
,
1754 Formatter
*formatter
, bool debug
, bool human_readable
, bool head
)
1757 lookup_ghobject
lookup(object
, nspace
, head
);
1758 if (pgidstr
.length() > 0) {
1759 r
= action_on_all_objects_in_pg(store
, pgidstr
, lookup
, debug
);
1761 r
= action_on_all_objects(store
, lookup
, debug
);
1765 lookup
.dump(formatter
, human_readable
);
1766 formatter
->flush(cout
);
// Looks up `object` in the meta collection (coll_t::meta()) only, with no
// namespace specified, then dumps the matches through `formatter` and
// flushes them to cout.
1770 int do_meta(ObjectStore
*store
, string object
, Formatter
*formatter
, bool debug
, bool human_readable
)
1773 boost::optional
<std::string
> nspace
; // Not specified
1774 lookup_ghobject
lookup(object
, nspace
);
1775 r
= action_on_all_objects_in_exact_pg(store
, coll_t::meta(), lookup
, debug
);
1778 lookup
.dump(formatter
, human_readable
);
1779 formatter
->flush(cout
);
// Drops the snap-mapper entry for ghobj.hobj via mapper.remove_oid() and
// queues removal of the object itself in `t`.  A remove_oid() failure is
// reported unless it is -ENOENT.
// NOTE(review): the `mapper` parameter is declared on a line that is not
// visible in this excerpt.
1783 int remove_object(coll_t coll
, ghobject_t
&ghobj
,
1785 MapCacher::Transaction
<std::string
, bufferlist
> *_t
,
1786 ObjectStore::Transaction
*t
)
1788 int r
= mapper
.remove_oid(ghobj
.hobj
, _t
);
1789 if (r
< 0 && r
!= -ENOENT
) {
1790 cerr
<< "remove_oid returned " << cpp_strerror(r
) << std::endl
;
1794 t
->remove(coll
, ghobj
);
// Forward declaration; the definition appears later in this file.  This
// declaration carries no default for `silent`, so callers located before the
// definition pass it explicitly.
1798 int get_snapset(ObjectStore
*store
, coll_t coll
, ghobject_t
&ghobj
, SnapSet
&ss
, bool silent
);
// Removes `ghobj` from `coll` and keeps the snap mapper consistent.
// The object is stat()ed first.  For objects with a snapset the SnapSet is
// loaded; when snapshots exist and `all` is not set, either a warning or the
// "use removeall" error is printed (NOTE(review): presumably selected by
// `force` -- the deciding line is not visible here).
// The loop over ss.snaps removes each snapshot object through
// remove_object() (NOTE(review): presumably only when `all` is set --
// confirm).  All work is queued in one transaction applied through `osr`.
1800 int do_remove_object(ObjectStore
*store
, coll_t coll
,
1801 ghobject_t
&ghobj
, bool all
, bool force
,
1802 ObjectStore::Sequencer
&osr
)
1805 coll
.is_pg_prefix(&pg
);
1809 OSD::make_snapmapper_oid());
1810 SnapMapper
mapper(g_ceph_context
, &driver
, 0, 0, 0, pg
.shard
);
1813 int r
= store
->stat(coll
, ghobj
, &st
);
1815 cerr
<< "remove: " << cpp_strerror(r
) << std::endl
;
1820 if (ghobj
.hobj
.has_snapset()) {
1821 r
= get_snapset(store
, coll
, ghobj
, ss
, false);
1823 cerr
<< "Can't get snapset error " << cpp_strerror(r
) << std::endl
;
1826 if (!ss
.snaps
.empty() && !all
) {
1828 cout
<< "WARNING: only removing "
1829 << (ghobj
.hobj
.is_head() ? "head" : "snapdir")
1830 << " with snapshots present" << std::endl
;
1833 cerr
<< "Snapshots are present, use removeall to delete everything" << std::endl
;
1839 ObjectStore::Transaction t
;
1840 OSDriver::OSTransaction
_t(driver
.get_transaction(&t
));
1842 cout
<< "remove " << ghobj
<< std::endl
;
1845 r
= remove_object(coll
, ghobj
, mapper
, &_t
, &t
);
1850 ghobject_t snapobj
= ghobj
;
1851 for (vector
<snapid_t
>::iterator i
= ss
.snaps
.begin() ;
1852 i
!= ss
.snaps
.end() ; ++i
) {
1853 snapobj
.hobj
.snap
= *i
;
1854 cout
<< "remove " << snapobj
<< std::endl
;
1856 r
= remove_object(coll
, snapobj
, mapper
, &_t
, &t
);
1863 store
->apply_transaction(&osr
, std::move(t
));
// Fetches all xattrs of `ghobj` with getattrs() and prints each attribute
// name on its own line to cout.  Names may be passed through cleanbin()
// first (NOTE(review): the guarding condition is not visible here).
// A getattrs() failure is reported on cerr.
1868 int do_list_attrs(ObjectStore
*store
, coll_t coll
, ghobject_t
&ghobj
)
1870 map
<string
,bufferptr
> aset
;
1871 int r
= store
->getattrs(coll
, ghobj
, aset
);
1873 cerr
<< "getattrs: " << cpp_strerror(r
) << std::endl
;
1877 for (map
<string
,bufferptr
>::iterator i
= aset
.begin();i
!= aset
.end(); ++i
) {
1878 string
key(i
->first
);
1880 key
= cleanbin(key
);
1881 cout
<< key
<< std::endl
;
// Prints every omap key of `ghobj` to cout, one per line.  Keys are pulled
// from the store's omap iterator in batches (get_omap_batch) while the
// iterator stays valid.  An ENOENT message is printed on cerr
// (NOTE(review): presumably when no iterator is returned -- the test is not
// visible here).
1886 int do_list_omap(ObjectStore
*store
, coll_t coll
, ghobject_t
&ghobj
)
1888 ObjectMap::ObjectMapIterator iter
= store
->get_omap_iterator(coll
, ghobj
);
1890 cerr
<< "omap_get_iterator: " << cpp_strerror(ENOENT
) << std::endl
;
1893 iter
->seek_to_first();
1894 map
<string
, bufferlist
> oset
;
1895 while(iter
->valid()) {
1896 get_omap_batch(iter
, oset
);
1898 for (map
<string
,bufferlist
>::iterator i
= oset
.begin();i
!= oset
.end(); ++i
) {
1899 string
key(i
->first
);
1901 key
= cleanbin(key
);
1902 cout
<< key
<< std::endl
;
// Copies the data of `ghobj` to file descriptor `fd`.  The object is
// stat()ed first, then data is read from the store starting at `offset`
// with a length that starts out as max_read, and each chunk is write()n to
// fd.
// NOTE(review): the loop bounds and the handling of the write() result are
// not visible in this excerpt.
1908 int do_get_bytes(ObjectStore
*store
, coll_t coll
, ghobject_t
&ghobj
, int fd
)
1913 int ret
= store
->stat(coll
, ghobj
, &st
);
1915 cerr
<< "get-bytes: " << cpp_strerror(ret
) << std::endl
;
1921 cerr
<< "size=" << total
<< std::endl
;
1923 uint64_t offset
= 0;
1924 bufferlist rawdatabl
;
1927 mysize_t len
= max_read
;
1931 ret
= store
->read(coll
, ghobj
, offset
, len
, rawdatabl
);
1938 cerr
<< "data section offset=" << offset
<< " len=" << len
<< std::endl
;
1943 ret
= write(fd
, rawdatabl
.c_str(), ret
);
// Replaces the data of `ghobj` with bytes read from `fd`.  The object is
// touched and truncated to 0, then up to max_read bytes at a time are read
// with read_fd() and queued as writes at `offset`.  Everything is collected
// in a single transaction that is applied through `osr` at the end (see the
// XXX note below about very large inputs).
1953 int do_set_bytes(ObjectStore
*store
, coll_t coll
,
1954 ghobject_t
&ghobj
, int fd
,
1955 ObjectStore::Sequencer
&osr
)
1957 ObjectStore::Transaction tran
;
1958 ObjectStore::Transaction
*t
= &tran
;
1961 cerr
<< "Write " << ghobj
<< std::endl
;
1964 t
->touch(coll
, ghobj
);
1965 t
->truncate(coll
, ghobj
, 0);
1968 uint64_t offset
= 0;
1969 bufferlist rawdatabl
;
1972 ssize_t bytes
= rawdatabl
.read_fd(fd
, max_read
);
1974 cerr
<< "read_fd error " << cpp_strerror(bytes
) << std::endl
;
1982 cerr
<< "\tdata: offset " << offset
<< " bytes " << bytes
<< std::endl
;
1984 t
->write(coll
, ghobj
, offset
, bytes
, rawdatabl
);
1987 // XXX: Should we apply_transaction() every once in a while for very large files
1991 store
->apply_transaction(&osr
, std::move(*t
));
// Reads xattr `key` of `ghobj` with getattr() and copies the raw bytes into
// a string; cleanbin() and a trailing newline may be applied to it.
// A getattr() failure is reported on cerr.
// NOTE(review): the conditions around cleanbin()/newline and the statement
// that emits the value are not visible in this excerpt.
1995 int do_get_attr(ObjectStore
*store
, coll_t coll
, ghobject_t
&ghobj
, string key
)
1999 int r
= store
->getattr(coll
, ghobj
, key
.c_str(), bp
);
2001 cerr
<< "getattr: " << cpp_strerror(r
) << std::endl
;
2005 string
value(bp
.c_str(), bp
.length());
2007 value
= cleanbin(value
);
2008 value
.push_back('\n');
// Sets xattr `key` on `ghobj` to the bytes obtained from `fd` via
// get_fd_data().  The transaction touches the object before setattr() and
// is applied through `osr`.
2015 int do_set_attr(ObjectStore
*store
, coll_t coll
,
2016 ghobject_t
&ghobj
, string key
, int fd
,
2017 ObjectStore::Sequencer
&osr
)
2019 ObjectStore::Transaction tran
;
2020 ObjectStore::Transaction
*t
= &tran
;
2024 cerr
<< "Setattr " << ghobj
<< std::endl
;
2026 int ret
= get_fd_data(fd
, bl
);
2033 t
->touch(coll
, ghobj
);
2035 t
->setattr(coll
, ghobj
, key
, bl
);
2037 store
->apply_transaction(&osr
, std::move(*t
));
// Removes xattr `key` from `ghobj`: queues rmattr() in a transaction and
// applies it through `osr`.
2041 int do_rm_attr(ObjectStore
*store
, coll_t coll
,
2042 ghobject_t
&ghobj
, string key
,
2043 ObjectStore::Sequencer
&osr
)
2045 ObjectStore::Transaction tran
;
2046 ObjectStore::Transaction
*t
= &tran
;
2049 cerr
<< "Rmattr " << ghobj
<< std::endl
;
2054 t
->rmattr(coll
, ghobj
, key
);
2056 store
->apply_transaction(&osr
, std::move(*t
));
// Fetches omap values for `keys` with omap_get_values() (NOTE(review):
// `keys` presumably holds just `key` -- its setup is not visible here).
// "Key not found" is reported on cerr; otherwise exactly one result is
// asserted and its bytes are copied into a string, to which cleanbin() and
// a trailing newline may be applied.
2060 int do_get_omap(ObjectStore
*store
, coll_t coll
, ghobject_t
&ghobj
, string key
)
2063 map
<string
, bufferlist
> out
;
2067 int r
= store
->omap_get_values(coll
, ghobj
, keys
, &out
);
2069 cerr
<< "omap_get_values: " << cpp_strerror(r
) << std::endl
;
2074 cerr
<< "Key not found" << std::endl
;
2078 assert(out
.size() == 1);
2080 bufferlist bl
= out
.begin()->second
;
2081 string
value(bl
.c_str(), bl
.length());
2083 value
= cleanbin(value
);
2084 value
.push_back('\n');
// Sets omap entry `key` on `ghobj` to the bytes obtained from `fd` via
// get_fd_data().  The single key/value pair is placed in `attrset`; the
// transaction touches the object, calls omap_setkeys() and is applied
// through `osr`.
2091 int do_set_omap(ObjectStore
*store
, coll_t coll
,
2092 ghobject_t
&ghobj
, string key
, int fd
,
2093 ObjectStore::Sequencer
&osr
)
2095 ObjectStore::Transaction tran
;
2096 ObjectStore::Transaction
*t
= &tran
;
2097 map
<string
, bufferlist
> attrset
;
2101 cerr
<< "Set_omap " << ghobj
<< std::endl
;
2103 int ret
= get_fd_data(fd
, valbl
);
2107 attrset
.insert(pair
<string
, bufferlist
>(key
, valbl
));
2112 t
->touch(coll
, ghobj
);
2114 t
->omap_setkeys(coll
, ghobj
, attrset
);
2116 store
->apply_transaction(&osr
, std::move(*t
));
// Removes omap entries from `ghobj`: queues omap_rmkeys() for `keys` and
// applies the transaction through `osr`.
// NOTE(review): `keys` presumably contains just `key`; its setup is not
// visible in this excerpt.
2120 int do_rm_omap(ObjectStore
*store
, coll_t coll
,
2121 ghobject_t
&ghobj
, string key
,
2122 ObjectStore::Sequencer
&osr
)
2124 ObjectStore::Transaction tran
;
2125 ObjectStore::Transaction
*t
= &tran
;
2131 cerr
<< "Rm_omap " << ghobj
<< std::endl
;
2136 t
->omap_rmkeys(coll
, ghobj
, keys
);
2138 store
->apply_transaction(&osr
, std::move(*t
));
// Reads the omap header of `ghobj` with omap_get_header() and copies its
// bytes into a string; cleanbin() and a trailing newline may be applied.
// A failure is reported on cerr.
// NOTE(review): the statement that emits the header is not visible here.
2142 int do_get_omaphdr(ObjectStore
*store
, coll_t coll
, ghobject_t
&ghobj
)
2146 int r
= store
->omap_get_header(coll
, ghobj
, &hdrbl
, true);
2148 cerr
<< "omap_get_header: " << cpp_strerror(r
) << std::endl
;
2152 string
header(hdrbl
.c_str(), hdrbl
.length());
2154 header
= cleanbin(header
);
2155 header
.push_back('\n');
// Sets the omap header of `ghobj` to the bytes obtained from `fd` via
// get_fd_data().  The transaction touches the object, calls
// omap_setheader() and is applied through `osr`.
2162 int do_set_omaphdr(ObjectStore
*store
, coll_t coll
,
2163 ghobject_t
&ghobj
, int fd
,
2164 ObjectStore::Sequencer
&osr
)
2166 ObjectStore::Transaction tran
;
2167 ObjectStore::Transaction
*t
= &tran
;
2171 cerr
<< "Omap_setheader " << ghobj
<< std::endl
;
2173 int ret
= get_fd_data(fd
, hdrbl
);
2180 t
->touch(coll
, ghobj
);
2182 t
->omap_setheader(coll
, ghobj
, hdrbl
);
2184 store
->apply_transaction(&osr
, std::move(*t
));
// Per-object action (action_on_object_t) that clears FLAG_LOST in the
// object's object_info_t and writes the re-encoded info back to OI_ATTR in
// its own transaction, applied through the sequencer given at construction.
// NOTE(review): the test that limits this to objects currently marked lost
// is not visible in this excerpt.
2188 struct do_fix_lost
: public action_on_object_t
{
2189 ObjectStore::Sequencer
*osr
;
2191 explicit do_fix_lost(ObjectStore::Sequencer
*_osr
) : osr(_osr
) {}
2193 int call(ObjectStore
*store
, coll_t coll
,
2194 ghobject_t
&ghobj
, object_info_t
&oi
) override
{
2196 cout
<< coll
<< "/" << ghobj
<< " is lost";
2202 oi
.clear_flag(object_info_t::FLAG_LOST
);
2204 ::encode(oi
, bl
, -1); /* fixme: using full features */
2205 ObjectStore::Transaction t
;
2206 t
.setattr(coll
, ghobj
, OI_ATTR
, bl
);
2207 int r
= store
->apply_transaction(osr
, std::move(t
));
2209 cerr
<< "Error getting fixing attr on : " << make_pair(coll
, ghobj
)
2211 << cpp_strerror(r
) << std::endl
;
// Loads the SS_ATTR xattr of `ghobj` and decodes it into `ss`.  Errors from
// getattr() and from decoding are reported on cerr.
// `silent` defaults to false (NOTE(review): presumably it suppresses the
// getattr error message -- the test is not visible here).
2219 int get_snapset(ObjectStore
*store
, coll_t coll
, ghobject_t
&ghobj
, SnapSet
&ss
, bool silent
= false)
2222 int r
= store
->getattr(coll
, ghobj
, SS_ATTR
, attr
);
2225 cerr
<< "Error getting snapset on : " << make_pair(coll
, ghobj
) << ", "
2226 << cpp_strerror(r
) << std::endl
;
2229 bufferlist::iterator bp
= attr
.begin();
2234 cerr
<< "Error decoding snapset on : " << make_pair(coll
, ghobj
) << ", "
2235 << cpp_strerror(r
) << std::endl
;
// Dumps one object as an "obj" section: its id (ghobj.dump), an "info"
// section read from OI_ATTR, a "stat" section with size/blksize/blocks/nlink
// from stat(), and -- for objects with has_snapset() -- a "SnapSet" section.
// The getattr, stat and snapset results are kept in separate variables
// (gr, sr, snr), and the formatter is flushed to cout at the end.
// NOTE(review): how those results are folded into the return value is not
// visible in this excerpt.
2241 int print_obj_info(ObjectStore
*store
, coll_t coll
, ghobject_t
&ghobj
, Formatter
* formatter
)
2244 formatter
->open_object_section("obj");
2245 formatter
->open_object_section("id");
2246 ghobj
.dump(formatter
);
2247 formatter
->close_section();
2250 int gr
= store
->getattr(coll
, ghobj
, OI_ATTR
, attr
);
2253 cerr
<< "Error getting attr on : " << make_pair(coll
, ghobj
) << ", "
2254 << cpp_strerror(r
) << std::endl
;
2257 bufferlist::iterator bp
= attr
.begin();
2260 formatter
->open_object_section("info");
2262 formatter
->close_section();
2265 cerr
<< "Error decoding attr on : " << make_pair(coll
, ghobj
) << ", "
2266 << cpp_strerror(r
) << std::endl
;
2270 int sr
= store
->stat(coll
, ghobj
, &st
, true);
2273 cerr
<< "Error stat on : " << make_pair(coll
, ghobj
) << ", "
2274 << cpp_strerror(r
) << std::endl
;
2276 formatter
->open_object_section("stat");
2277 formatter
->dump_int("size", st
.st_size
);
2278 formatter
->dump_int("blksize", st
.st_blksize
);
2279 formatter
->dump_int("blocks", st
.st_blocks
);
2280 formatter
->dump_int("nlink", st
.st_nlink
);
2281 formatter
->close_section();
2284 if (ghobj
.hobj
.has_snapset()) {
2286 int snr
= get_snapset(store
, coll
, ghobj
, ss
);
2290 formatter
->open_object_section("SnapSet");
2292 formatter
->close_section();
2295 formatter
->close_section();
2296 formatter
->flush(cout
);
// Changes the recorded size of `ghobj` to `setsize`.  Snapdir objects are
// refused.  The object info (OI_ATTR) and stat() size are read; for snap
// objects the SnapSet is fetched from the head object, with the snapdir
// object as the second lookup, and the clone_size entry for the snap is
// located.  Nothing is written when every recorded size already equals
// setsize.
// The object is truncated only when `corrupt` is false and the stat size
// differs; in that case the data digest is cleared too.  The re-encoded
// object info is written to OI_ATTR, the SnapSet may be written to SS_ATTR
// on `head`, and the transaction is applied through `osr`.
// NOTE(review): several guarding conditions (is_snap checks, dry-run
// handling) are not visible in this excerpt.
2301 int set_size(ObjectStore
*store
, coll_t coll
, ghobject_t
&ghobj
, uint64_t setsize
, Formatter
* formatter
,
2302 ObjectStore::Sequencer
&osr
, bool corrupt
)
2304 if (ghobj
.hobj
.is_snapdir()) {
2305 cerr
<< "Can't set the size of a snapdir" << std::endl
;
2309 int r
= store
->getattr(coll
, ghobj
, OI_ATTR
, attr
);
2311 cerr
<< "Error getting attr on : " << make_pair(coll
, ghobj
) << ", "
2312 << cpp_strerror(r
) << std::endl
;
2316 bufferlist::iterator bp
= attr
.begin();
2321 cerr
<< "Error getting attr on : " << make_pair(coll
, ghobj
) << ", "
2322 << cpp_strerror(r
) << std::endl
;
2326 r
= store
->stat(coll
, ghobj
, &st
, true);
2328 cerr
<< "Error stat on : " << make_pair(coll
, ghobj
) << ", "
2329 << cpp_strerror(r
) << std::endl
;
2331 ghobject_t
head(ghobj
);
2333 bool found_head
= true;
2334 map
<snapid_t
, uint64_t>::iterator csi
;
2335 bool is_snap
= ghobj
.hobj
.is_snap();
2337 head
.hobj
= head
.hobj
.get_head();
2338 r
= get_snapset(store
, coll
, head
, ss
, true);
2339 if (r
< 0 && r
!= -ENOENT
) {
2340 // Requested get_snapset() silent, so if not -ENOENT show error
2341 cerr
<< "Error getting snapset on : " << make_pair(coll
, head
) << ", "
2342 << cpp_strerror(r
) << std::endl
;
2346 head
.hobj
= head
.hobj
.get_snapdir();
2347 r
= get_snapset(store
, coll
, head
, ss
);
2354 csi
= ss
.clone_size
.find(ghobj
.hobj
.snap
);
2355 if (csi
== ss
.clone_size
.end()) {
2356 cerr
<< "SnapSet is missing clone_size for snap " << ghobj
.hobj
.snap
<< std::endl
;
2360 if ((uint64_t)st
.st_size
== setsize
&& oi
.size
== setsize
2361 && (!is_snap
|| csi
->second
== setsize
)) {
2362 cout
<< "Size of object is already " << setsize
<< std::endl
;
2365 cout
<< "Setting size to " << setsize
<< ", stat size " << st
.st_size
2366 << ", obj info size " << oi
.size
;
2368 cout
<< ", " << (found_head
? "head" : "snapdir")
2369 << " clone_size " << csi
->second
;
2370 csi
->second
= setsize
;
2376 ObjectStore::Transaction t
;
2377 // Only modify object info if we want to corrupt it
2378 if (!corrupt
&& (uint64_t)st
.st_size
!= setsize
) {
2379 t
.truncate(coll
, ghobj
, setsize
);
2380 // Changing objectstore size will invalidate data_digest, so clear it.
2381 oi
.clear_data_digest();
2383 ::encode(oi
, attr
, -1); /* fixme: using full features */
2384 t
.setattr(coll
, ghobj
, OI_ATTR
, attr
);
2386 bufferlist snapattr
;
2388 ::encode(ss
, snapattr
);
2389 t
.setattr(coll
, head
, SS_ATTR
, snapattr
);
2391 r
= store
->apply_transaction(&osr
, std::move(t
));
2393 cerr
<< "Error writing object info: " << make_pair(coll
, ghobj
) << ", "
2394 << cpp_strerror(r
) << std::endl
;
// Clears or deliberately corrupts parts of the SnapSet stored on `ghobj`,
// selected by `arg`:
//   "corrupt" / "head"  - set head_exists to the wrong value;
//   any other value     - head_exists is corrected if it is inconsistent;
//   "corrupt" / "seq"   - touch SnapSet.seq (statement not visible here);
//   "corrupt" / "snaps" - clear SnapSet.snaps (statement not visible here);
//   "" / "clones", "" / "clone_overlap", "" / "clone_size" - clear the
//                         respective clone data;
//   "size"              - walk every clone_size entry (see comment below).
// The result is written back to SS_ATTR in a transaction applied through
// `osr`.
2401 int clear_snapset(ObjectStore
*store
, coll_t coll
, ghobject_t
&ghobj
,
2402 string arg
, ObjectStore::Sequencer
&osr
)
2405 int ret
= get_snapset(store
, coll
, ghobj
, ss
);
2409 // Use "head" to set head_exists incorrectly
2410 if (arg
== "corrupt" || arg
== "head")
2411 ss
.head_exists
= !ghobj
.hobj
.is_head();
2412 else if (ss
.head_exists
!= ghobj
.hobj
.is_head()) {
2413 cerr
<< "Correcting head_exists, set to "
2414 << (ghobj
.hobj
.is_head() ? "true" : "false") << std::endl
;
2415 ss
.head_exists
= ghobj
.hobj
.is_head();
2417 // Use "corrupt" to clear entire SnapSet
2418 // Use "seq" to just corrupt SnapSet.seq
2419 if (arg
== "corrupt" || arg
== "seq")
2421 // Use "snaps" to just clear SnapSet.snaps
2422 if (arg
== "corrupt" || arg
== "snaps")
2424 // By default just clear clone, clone_overlap and clone_size
2425 if (arg
== "corrupt")
2427 if (arg
== "" || arg
== "clones")
2429 if (arg
== "" || arg
== "clone_overlap")
2430 ss
.clone_overlap
.clear();
2431 if (arg
== "" || arg
== "clone_size")
2432 ss
.clone_size
.clear();
2433 // Break all clone sizes by adding 1
2434 if (arg
== "size") {
2435 for (map
<snapid_t
, uint64_t>::iterator i
= ss
.clone_size
.begin();
2436 i
!= ss
.clone_size
.end(); ++i
)
2443 ObjectStore::Transaction t
;
2444 t
.setattr(coll
, ghobj
, SS_ATTR
, bl
);
2445 int r
= store
->apply_transaction(&osr
, std::move(t
));
2447 cerr
<< "Error setting snapset on : " << make_pair(coll
, ghobj
) << ", "
2448 << cpp_strerror(r
) << std::endl
;
// find() overload for a vector of snap ids: linear search with std::find.
// Returns v.end() when clid is absent.
2455 vector
<snapid_t
>::iterator
find(vector
<snapid_t
> &v
, snapid_t clid
)
2457 return std::find(v
.begin(), v
.end(), clid
);
// find() overload for a map from snap id to interval_set<uint64_t>:
// forwards to map::find(), so m.end() is returned when clid is absent.
2460 map
<snapid_t
, interval_set
<uint64_t> >::iterator
2461 find(map
<snapid_t
, interval_set
<uint64_t> > &m
, snapid_t clid
)
2463 return m
.find(clid
);
// find() overload for a map from snap id to uint64_t: forwards to
// map::find(), so m.end() is returned when clid is absent.
// NOTE(review): the line declaring the `clid` parameter is not visible in
// this excerpt.
2466 map
<snapid_t
, uint64_t>::iterator
find(map
<snapid_t
, uint64_t> &m
,
2469 return m
.find(clid
);
// Locates `cloneid` in container `mv` with the matching find() overload.
// When the clone is absent a "doesn't exist in <name>" message is printed on
// cerr, optionally followed by " (ignored)".
// NOTE(review): T is a template parameter whose declaration is not visible
// here.  The erase on the found branch and the role of `force` (presumably
// it selects the "(ignored)" path) are not visible either -- confirm.
2473 int remove_from(T
&mv
, string name
, snapid_t cloneid
, bool force
)
2475 typename
T::iterator i
= find(mv
, cloneid
);
2476 if (i
!= mv
.end()) {
2479 cerr
<< "Clone " << cloneid
<< " doesn't exist in " << name
;
2481 cerr
<< " (ignored)" << std::endl
;
// Removes the metadata of clone `cloneid` from the SnapSet stored on
// `ghobj`.  The SnapSet is loaded and snapset.clones is scanned for the
// clone.  If the clone is not the first entry, the overlap of the preceding
// clone is intersected with the overlap of the removed clone.  The clone is
// then dropped from clones, clone_overlap and clone_size via remove_from(),
// any non-zero result being returned immediately.  The updated SnapSet is
// written back to SS_ATTR through `osr`.
// NOTE(review): `force` is only seen being forwarded to remove_from() here.
2490 int remove_clone(ObjectStore
*store
, coll_t coll
, ghobject_t
&ghobj
, snapid_t cloneid
, bool force
,
2491 ObjectStore::Sequencer
&osr
)
2493 // XXX: Don't allow this if in a cache tier or former cache tier
2494 // bool allow_incomplete_clones() const {
2495 // return cache_mode != CACHEMODE_NONE || has_flag(FLAG_INCOMPLETE_CLONES);
2498 int ret
= get_snapset(store
, coll
, ghobj
, snapset
);
2502 // Derived from trim_object()
2504 vector
<snapid_t
>::iterator p
;
2505 for (p
= snapset
.clones
.begin(); p
!= snapset
.clones
.end(); ++p
)
2508 if (p
== snapset
.clones
.end()) {
2509 cerr
<< "Clone " << cloneid
<< " not present";
2512 if (p
!= snapset
.clones
.begin()) {
2513 // not the oldest... merge overlap into next older clone
2514 vector
<snapid_t
>::iterator n
= p
- 1;
2515 hobject_t prev_coid
= ghobj
.hobj
;
2516 prev_coid
.snap
= *n
;
2517 //bool adjust_prev_bytes = is_present_clone(prev_coid);
2519 //if (adjust_prev_bytes)
2520 // ctx->delta_stats.num_bytes -= snapset.get_clone_bytes(*n);
2522 snapset
.clone_overlap
[*n
].intersection_of(
2523 snapset
.clone_overlap
[*p
]);
2525 //if (adjust_prev_bytes)
2526 // ctx->delta_stats.num_bytes += snapset.get_clone_bytes(*n);
2529 ret
= remove_from(snapset
.clones
, "clones", cloneid
, force
);
2530 if (ret
) return ret
;
2531 ret
= remove_from(snapset
.clone_overlap
, "clone_overlap", cloneid
, force
);
2532 if (ret
) return ret
;
2533 ret
= remove_from(snapset
.clone_size
, "clone_size", cloneid
, force
);
2534 if (ret
) return ret
;
2540 ::encode(snapset
, bl
);
2541 ObjectStore::Transaction t
;
2542 t
.setattr(coll
, ghobj
, SS_ATTR
, bl
);
2543 int r
= store
->apply_transaction(&osr
, std::move(t
));
2545 cerr
<< "Error setting snapset on : " << make_pair(coll
, ghobj
) << ", "
2546 << cpp_strerror(r
) << std::endl
;
2549 cout
<< "Removal of clone " << cloneid
<< " complete" << std::endl
;
2550 cout
<< "Use pg repair after OSD restarted to correct stat information" << std::endl
;
// Copies the whole contents of object store `src` into `dst`.
// Visible steps: both stores must report the same fsid and `dst` must hold
// no collections.  Every source collection is then created on `dst` with
// the source's collection_bits().  Objects are listed in batches of up to
// 1000, and for each one the xattrs, data, omap header and omap keys are
// queued in a transaction applied on `dst`, with running
// object/byte/key counters printed to cout.  Finally the keyring file is
// copied, the "magic", "whoami", "ceph_fsid" and "fsid" meta values are
// duplicated, and "ready" is written.
// NOTE(review): the results of getattrs(), read(), omap_get(), read_meta()
// and write_meta() are not captured on the visible lines -- confirm whether
// failures are handled elsewhere.
2554 int dup(string srcpath
, ObjectStore
*src
, string dstpath
, ObjectStore
*dst
)
2556 cout
<< "dup from " << src
->get_type() << ": " << srcpath
<< "\n"
2557 << " to " << dst
->get_type() << ": " << dstpath
2559 ObjectStore::Sequencer
osr("dup");
2561 vector
<coll_t
> collections
;
2566 cerr
<< "failed to mount src: " << cpp_strerror(r
) << std::endl
;
2571 cerr
<< "failed to mount dst: " << cpp_strerror(r
) << std::endl
;
2575 if (src
->get_fsid() != dst
->get_fsid()) {
2576 cerr
<< "src fsid " << src
->get_fsid() << " != dest " << dst
->get_fsid()
2580 cout
<< "fsid " << src
->get_fsid() << std::endl
;
2582 // make sure dst is empty
2583 r
= dst
->list_collections(collections
);
2585 cerr
<< "error listing collections on dst: " << cpp_strerror(r
) << std::endl
;
2588 if (!collections
.empty()) {
2589 cerr
<< "destination store is not empty" << std::endl
;
2593 r
= src
->list_collections(collections
);
2595 cerr
<< "error listing collections on src: " << cpp_strerror(r
) << std::endl
;
2599 num
= collections
.size();
2600 cout
<< num
<< " collections" << std::endl
;
2602 for (auto cid
: collections
) {
2603 cout
<< i
++ << "/" << num
<< " " << cid
<< std::endl
;
2605 ObjectStore::Transaction t
;
2606 int bits
= src
->collection_bits(cid
);
2608 if (src
->get_type() == "filestore" && cid
.is_meta()) {
2611 cerr
<< "cannot get bit count for collection " << cid
<< ": "
2612 << cpp_strerror(bits
) << std::endl
;
2616 t
.create_collection(cid
, bits
);
2617 dst
->apply_transaction(&osr
, std::move(t
));
2622 uint64_t bytes
= 0, keys
= 0;
2624 vector
<ghobject_t
> ls
;
2625 r
= src
->collection_list(cid
, pos
, ghobject_t::get_max(), 1000, &ls
, &pos
);
2627 cerr
<< "collection_list on " << cid
<< " from " << pos
<< " got: "
2628 << cpp_strerror(r
) << std::endl
;
2635 for (auto& oid
: ls
) {
2636 //cout << " " << cid << " " << oid << std::endl;
2638 cout
<< " " << std::setw(16) << n
<< " objects, "
2639 << std::setw(16) << bytes
<< " bytes, "
2640 << std::setw(16) << keys
<< " keys"
2641 << std::setw(1) << "\r" << std::flush
;
2645 ObjectStore::Transaction t
;
2648 map
<string
,bufferptr
> attrs
;
2649 src
->getattrs(cid
, oid
, attrs
);
2650 if (!attrs
.empty()) {
2651 t
.setattrs(cid
, oid
, attrs
);
2655 src
->read(cid
, oid
, 0, 0, bl
);
2657 t
.write(cid
, oid
, 0, bl
.length(), bl
);
2658 bytes
+= bl
.length();
2662 map
<string
,bufferlist
> omap
;
2663 src
->omap_get(cid
, oid
, &header
, &omap
);
2664 if (header
.length()) {
2665 t
.omap_setheader(cid
, oid
, header
);
2668 if (!omap
.empty()) {
2669 keys
+= omap
.size();
2670 t
.omap_setkeys(cid
, oid
, omap
);
2673 dst
->apply_transaction(&osr
, std::move(t
));
2676 cout
<< " " << std::setw(16) << n
<< " objects, "
2677 << std::setw(16) << bytes
<< " bytes, "
2678 << std::setw(16) << keys
<< " keys"
2679 << std::setw(1) << std::endl
;
2683 cout
<< "keyring" << std::endl
;
2686 string s
= srcpath
+ "/keyring";
2688 r
= bl
.read_file(s
.c_str(), &err
);
2690 cerr
<< "failed to copy " << s
<< ": " << err
<< std::endl
;
2692 string d
= dstpath
+ "/keyring";
2693 bl
.write_file(d
.c_str(), 0600);
2698 cout
<< "duping osd metadata" << std::endl
;
2700 for (auto k
: {"magic", "whoami", "ceph_fsid", "fsid"}) {
2702 src
->read_meta(k
, &val
);
2703 dst
->write_meta(k
, val
);
2707 dst
->write_meta("ready", "ready");
2709 cout
<< "done." << std::endl
;
// Prints the option summary `desc` followed by the positional-syntax help
// text (per-object sub-commands and the meaning of <object> and [file]) to
// cerr.
2718 void usage(po::options_description
&desc
)
2721 cerr
<< desc
<< std::endl
;
2723 cerr
<< "Positional syntax:" << std::endl
;
2725 cerr
<< "ceph-objectstore-tool ... <object> (get|set)-bytes [file]" << std::endl
;
2726 cerr
<< "ceph-objectstore-tool ... <object> set-(attr|omap) <key> [file]" << std::endl
;
2727 cerr
<< "ceph-objectstore-tool ... <object> (get|rm)-(attr|omap) <key>" << std::endl
;
2728 cerr
<< "ceph-objectstore-tool ... <object> get-omaphdr" << std::endl
;
2729 cerr
<< "ceph-objectstore-tool ... <object> set-omaphdr [file]" << std::endl
;
2730 cerr
<< "ceph-objectstore-tool ... <object> list-attrs" << std::endl
;
2731 cerr
<< "ceph-objectstore-tool ... <object> list-omap" << std::endl
;
2732 cerr
<< "ceph-objectstore-tool ... <object> remove|removeall" << std::endl
;
2733 cerr
<< "ceph-objectstore-tool ... <object> dump" << std::endl
;
2734 cerr
<< "ceph-objectstore-tool ... <object> set-size" << std::endl
;
2735 cerr
<< "ceph-objectstore-tool ... <object> remove-clone-metadata <cloneid>" << std::endl
;
2737 cerr
<< "<object> can be a JSON object description as displayed" << std::endl
;
2738 cerr
<< "by --op list." << std::endl
;
2739 cerr
<< "<object> can be an object name which will be looked up in all" << std::endl
;
2740 cerr
<< "the OSD's PGs." << std::endl
;
2741 cerr
<< "<object> can be the empty string ('') which with a provided pgid " << std::endl
;
2742 cerr
<< "specifies the pgmeta object" << std::endl
;
2744 cerr
<< "The optional [file] argument will read stdin or write stdout" << std::endl
;
2745 cerr
<< "if not specified or if '-' specified." << std::endl
;
/**
 * Report whether @p check ends with the suffix @p ending.
 *
 * An empty @p ending matches every string (including an empty one); an
 * @p ending longer than @p check never matches.
 *
 * @param check   string to inspect
 * @param ending  suffix to look for
 * @return true if the last ending.size() characters of check equal ending
 */
bool ends_with(const std::string& check, const std::string& ending)
{
  // A suffix can never be longer than the string it terminates; this guard
  // also keeps the offset computed below from underflowing.
  if (ending.size() > check.size())
    return false;

  // Compare only the tail.  rfind() performs a substring search and keeps
  // scanning toward the front of the string when the tail does not match,
  // which is wasted work for a pure suffix test.
  return check.compare(check.size() - ending.size(), ending.size(), ending) == 0;
}
2753 // Based on FileStore::dump_journal(), set-up enough to only dump
// Dump a FileStore journal through the supplied Formatter.
//
//   f              formatter; dereferenced and passed to
//                  FileJournal::_fdump()
//   journalpath    path of the journal; tested for being empty before
//                  anything else is done
//   m_journal_dio  forwarded as the last FileJournal constructor argument
//
// The value produced by _fdump() is stored in r.
// NOTE(review): the declaration of r, the statement guarded by the
// empty-path test and the return/cleanup statements are not visible in
// this extract -- confirm them against the full file.
2754 int mydump_journal(Formatter
*f
, string journalpath
, bool m_journal_dio
)
// An empty journal path is checked for up front.
2758 if (!journalpath
.length())
// The journal object is heap-allocated with a default-constructed uuid_d
// and two NULL arguments.
// NOTE(review): no matching delete is visible in this extract.
2761 FileJournal
*journal
= new FileJournal(g_ceph_context
, uuid_d(), NULL
, NULL
,
2762 journalpath
.c_str(), m_journal_dio
);
// Dump the journal contents into the formatter; the second argument is
// passed as false.
2763 r
= journal
->_fdump(*f
, false);
// Apply FileStore layout settings to a selection of PG collections.
//
//   os          object store; only acted on when it is a FileStore
//               (checked with dynamic_cast)
//   superblock  its current_epoch selects the OSDMap fetched via
//               get_osdmap()
//   pool_name   when non-empty, resolved to a pool id through the OSDMap
//   pgid        collections whose pgid equals this one are selected
//   dry_run     NOTE(review): not referenced in the lines visible here;
//               presumably chooses between the "Would apply ..." message
//               and the real call -- confirm against the full file
//
// Returns 0 for a non-FileStore backend.
// NOTE(review): the other return statements, most error guards and the
// declarations of r, curmap, bl and coll_pgid are not visible in this
// extract.
2768 int apply_layout_settings(ObjectStore
*os
, const OSDSuperblock
&superblock
,
2769 const string
&pool_name
, const spg_t
&pgid
, bool dry_run
)
// Layout settings are FileStore-specific, so downcast the generic store.
2773 FileStore
*fs
= dynamic_cast<FileStore
*>(os
);
2775 cerr
<< "Nothing to do for non-filestore backend" << std::endl
;
2776 return 0; // making this return success makes testing easier
// Load the OSDMap for the superblock's current epoch; it is used below to
// translate the pool name into a pool id.
2781 r
= get_osdmap(os
, superblock
.current_epoch
, curmap
, bl
);
2783 cerr
<< "Can't find local OSDMap: " << cpp_strerror(r
) << std::endl
;
// poolid stays -1 when no pool name was supplied.
2787 int64_t poolid
= -1;
2788 if (pool_name
.length()) {
2789 poolid
= curmap
.lookup_pg_pool_name(pool_name
);
// The lookup result is handed to cpp_strerror() in the failure message.
2791 cerr
<< "Couldn't find pool " << pool_name
<< ": " << cpp_strerror(poolid
)
// collections receives everything the store lists; filtered_colls keeps
// only the collections selected below.
2797 vector
<coll_t
> collections
, filtered_colls
;
2798 r
= os
->list_collections(collections
);
2800 cerr
<< "Error listing collections: " << cpp_strerror(r
) << std::endl
;
// Keep a collection when it is a PG collection and either belongs to the
// requested pool (only considered when poolid >= 0) or matches pgid.
2804 for (auto const &coll
: collections
) {
2806 if (coll
.is_pg(&coll_pgid
) &&
2807 ((poolid
>= 0 && coll_pgid
.pool() == (uint64_t)poolid
) ||
2808 coll_pgid
== pgid
)) {
2809 filtered_colls
.push_back(coll
);
// done/total feed the progress messages written to stderr.
2813 size_t done
= 0, total
= filtered_colls
.size();
2814 for (auto const &coll
: filtered_colls
) {
2816 cerr
<< "Would apply layout settings to " << coll
<< std::endl
;
// The progress text ends with "\r" and no newline, so successive progress
// messages overwrite each other on a terminal.
2818 cerr
<< "Finished " << done
<< "/" << total
<< " collections" << "\r";
2819 r
= fs
->apply_layout_settings(coll
);
2821 cerr
<< "Error applying layout settings to " << coll
<< std::endl
;
// Final progress message, this time terminated with std::endl.
2828 cerr
<< "Finished " << total
<< "/" << total
<< " collections" << "\r" << std::endl
;
2832 int main(int argc
, char **argv
)
2834 string dpath
, jpath
, pgidstr
, op
, file
, mountpoint
, mon_store_path
, object
;
2835 string target_data_path
, fsid
;
2836 string objcmd
, arg1
, arg2
, type
, format
, argnspace
, pool
;
2837 boost::optional
<std::string
> nspace
;
2841 bool human_readable
;
2843 Formatter
*formatter
;
2846 po::options_description
desc("Allowed options");
2848 ("help", "produce help message")
2849 ("type", po::value
<string
>(&type
),
2850 "Arg is one of [bluestore, filestore (default), memstore]")
2851 ("data-path", po::value
<string
>(&dpath
),
2852 "path to object store, mandatory")
2853 ("journal-path", po::value
<string
>(&jpath
),
2854 "path to journal, use if tool can't find it")
2855 ("pgid", po::value
<string
>(&pgidstr
),
2856 "PG id, mandatory for info, log, remove, export, export-remove, rm-past-intervals, mark-complete, and mandatory for apply-layout-settings if --pool is not specified")
2857 ("pool", po::value
<string
>(&pool
),
2858 "Pool name, mandatory for apply-layout-settings if --pgid is not specified")
2859 ("op", po::value
<string
>(&op
),
2860 "Arg is one of [info, log, remove, mkfs, fsck, repair, fuse, dup, export, export-remove, import, list, fix-lost, list-pgs, rm-past-intervals, dump-journal, dump-super, meta-list, "
2861 "get-osdmap, set-osdmap, get-inc-osdmap, set-inc-osdmap, mark-complete, apply-layout-settings, update-mon-db, dump-import]")
2862 ("epoch", po::value
<unsigned>(&epoch
),
2863 "epoch# for get-osdmap and get-inc-osdmap, the current epoch in use if not specified")
2864 ("file", po::value
<string
>(&file
),
2865 "path of file to export, export-remove, import, get-osdmap, set-osdmap, get-inc-osdmap or set-inc-osdmap")
2866 ("mon-store-path", po::value
<string
>(&mon_store_path
),
2867 "path of monstore to update-mon-db")
2868 ("fsid", po::value
<string
>(&fsid
),
2869 "fsid for new store created by mkfs")
2870 ("target-data-path", po::value
<string
>(&target_data_path
),
2871 "path of target object store (for --op dup)")
2872 ("mountpoint", po::value
<string
>(&mountpoint
),
2874 ("format", po::value
<string
>(&format
)->default_value("json-pretty"),
2875 "Output format which may be json, json-pretty, xml, xml-pretty")
2876 ("debug", "Enable diagnostic output to stderr")
2877 ("force", "Ignore some types of errors and proceed with operation - USE WITH CAUTION: CORRUPTION POSSIBLE NOW OR IN THE FUTURE")
2878 ("skip-journal-replay", "Disable journal replay")
2879 ("skip-mount-omap", "Disable mounting of omap")
2880 ("head", "Find head/snapdir when searching for objects by name")
2881 ("dry-run", "Don't modify the objectstore")
2882 ("namespace", po::value
<string
>(&argnspace
), "Specify namespace when searching for objects")
2885 po::options_description
positional("Positional options");
2886 positional
.add_options()
2887 ("object", po::value
<string
>(&object
), "'' for pgmeta_oid, object name or ghobject in json")
2888 ("objcmd", po::value
<string
>(&objcmd
), "command [(get|set)-bytes, (get|set|rm)-(attr|omap), (get|set)-omaphdr, list-attrs, list-omap, remove]")
2889 ("arg1", po::value
<string
>(&arg1
), "arg1 based on cmd")
2890 ("arg2", po::value
<string
>(&arg2
), "arg2 based on cmd")
2893 po::options_description all
;
2894 all
.add(desc
).add(positional
);
2896 po::positional_options_description pd
;
2897 pd
.add("object", 1).add("objcmd", 1).add("arg1", 1).add("arg2", 1);
2899 vector
<string
> ceph_option_strings
;
2900 po::variables_map vm
;
2902 po::parsed_options parsed
=
2903 po::command_line_parser(argc
, argv
).options(all
).allow_unregistered().positional(pd
).run();
2904 po::store( parsed
, vm
);
2906 ceph_option_strings
= po::collect_unrecognized(parsed
.options
,
2907 po::include_positional
);
2908 } catch(po::error
&e
) {
2909 std::cerr
<< e
.what() << std::endl
;
2913 if (vm
.count("help")) {
2918 debug
= (vm
.count("debug") > 0);
2920 force
= (vm
.count("force") > 0);
2922 if (vm
.count("namespace"))
2925 dry_run
= (vm
.count("dry-run") > 0);
2927 osflagbits_t flags
= 0;
2928 if (dry_run
|| vm
.count("skip-journal-replay"))
2929 flags
|= SKIP_JOURNAL_REPLAY
;
2930 if (vm
.count("skip-mount-omap"))
2931 flags
|= SKIP_MOUNT_OMAP
;
2932 if (op
== "update-mon-db")
2933 flags
|= SKIP_JOURNAL_REPLAY
;
2935 head
= (vm
.count("head") > 0);
2937 vector
<const char *> ceph_options
;
2938 env_to_vec(ceph_options
);
2939 ceph_options
.reserve(ceph_options
.size() + ceph_option_strings
.size());
2940 for (vector
<string
>::iterator i
= ceph_option_strings
.begin();
2941 i
!= ceph_option_strings
.end();
2943 ceph_options
.push_back(i
->c_str());
2947 snprintf(fn
, sizeof(fn
), "%s/type", dpath
.c_str());
2948 int fd
= ::open(fn
, O_RDONLY
);
2953 string dp_type
= string(bl
.c_str(), bl
.length() - 1); // drop \n
2954 if (vm
.count("type") && dp_type
!= "" && type
!= dp_type
)
2955 cerr
<< "WARNING: Ignoring type \"" << type
<< "\" - found data-path type \""
2956 << dp_type
<< "\"" << std::endl
;
2958 //cout << "object store type is " << type << std::endl;
2962 if (!vm
.count("type") && type
== "") {
2965 if (!vm
.count("data-path") &&
2966 op
!= "dump-import" &&
2967 !(op
== "dump-journal" && type
== "filestore")) {
2968 cerr
<< "Must provide --data-path" << std::endl
;
2972 if (type
== "filestore" && !vm
.count("journal-path")) {
2973 jpath
= dpath
+ "/journal";
2975 if (!vm
.count("op") && !vm
.count("object")) {
2976 cerr
<< "Must provide --op or object command..." << std::endl
;
2981 vm
.count("op") && vm
.count("object")) {
2982 cerr
<< "Can't specify both --op and object command syntax" << std::endl
;
2986 if (op
== "apply-layout-settings" && !(vm
.count("pool") ^ vm
.count("pgid"))) {
2987 cerr
<< "apply-layout-settings requires either --pool or --pgid"
2992 if (op
!= "list" && vm
.count("object") && !vm
.count("objcmd")) {
2993 cerr
<< "Invalid syntax, missing command" << std::endl
;
2997 if (op
== "fuse" && mountpoint
.length() == 0) {
2998 cerr
<< "Missing fuse mountpoint" << std::endl
;
3002 outistty
= isatty(STDOUT_FILENO
);
3005 if ((op
== "export" || op
== "export-remove" || op
== "get-osdmap" || op
== "get-inc-osdmap") && !dry_run
) {
3006 if (!vm
.count("file") || file
== "-") {
3008 cerr
<< "stdout is a tty and no --file filename specified" << std::endl
;
3011 file_fd
= STDOUT_FILENO
;
3013 file_fd
= open(file
.c_str(), O_WRONLY
|O_CREAT
|O_TRUNC
, 0666);
3015 } else if (op
== "import" || op
== "dump-import" || op
== "set-osdmap" || op
== "set-inc-osdmap") {
3016 if (!vm
.count("file") || file
== "-") {
3017 if (isatty(STDIN_FILENO
)) {
3018 cerr
<< "stdin is a tty and no --file filename specified" << std::endl
;
3021 file_fd
= STDIN_FILENO
;
3023 file_fd
= open(file
.c_str(), O_RDONLY
);
3027 ObjectStoreTool tool
= ObjectStoreTool(file_fd
, dry_run
);
3029 if (vm
.count("file") && file_fd
== fd_none
&& !dry_run
) {
3030 cerr
<< "--file option only applies to import, dump-import, export, export-remove, "
3031 << "get-osdmap, set-osdmap, get-inc-osdmap or set-inc-osdmap" << std::endl
;
3035 if (file_fd
!= fd_none
&& file_fd
< 0) {
3036 string err
= string("file: ") + file
;
3037 perror(err
.c_str());
3041 auto cct
= global_init(
3042 NULL
, ceph_options
, CEPH_ENTITY_TYPE_OSD
,
3043 CODE_ENVIRONMENT_UTILITY_NODOUT
, 0);
3044 //CINIT_FLAG_NO_DEFAULT_CONFIG_FILE);
3045 common_init_finish(g_ceph_context
);
3046 g_conf
= g_ceph_context
->_conf
;
3048 g_conf
->set_val_or_die("log_to_stderr", "true");
3049 g_conf
->set_val_or_die("err_to_stderr", "true");
3051 g_conf
->apply_changes(NULL
);
3053 // Special list handling. Treating pretty_format as human readable,
3054 // with one object per line and not an enclosing array.
3055 human_readable
= ends_with(format
, "-pretty");
3056 if ((op
== "list" || op
== "meta-list") && human_readable
) {
3057 // Remove -pretty from end of format which we know is there
3058 format
= format
.substr(0, format
.size() - strlen("-pretty"));
3061 formatter
= Formatter::create(format
);
3062 if (formatter
== NULL
) {
3063 cerr
<< "unrecognized format: " << format
<< std::endl
;
3067 // Special handling for filestore journal, so we can dump it without mounting
3068 if (op
== "dump-journal" && type
== "filestore") {
3069 int ret
= mydump_journal(formatter
, jpath
, g_conf
->journal_dio
);
3071 cerr
<< "journal-path: " << jpath
<< ": "
3072 << cpp_strerror(ret
) << std::endl
;
3075 formatter
->flush(cout
);
3079 if (op
== "dump-import") {
3080 int ret
= tool
.dump_import(formatter
);
3082 cerr
<< "dump-import: "
3083 << cpp_strerror(ret
) << std::endl
;
3089 //Verify that data-path really exists
3091 if (::stat(dpath
.c_str(), &st
) == -1) {
3092 string err
= string("data-path: ") + dpath
;
3093 perror(err
.c_str());
3097 if (pgidstr
.length() && !pgid
.parse(pgidstr
.c_str())) {
3098 cerr
<< "Invalid pgid '" << pgidstr
<< "' specified" << std::endl
;
3102 //Verify that the journal-path really exists
3103 if (type
== "filestore") {
3104 if (::stat(jpath
.c_str(), &st
) == -1) {
3105 string err
= string("journal-path: ") + jpath
;
3106 perror(err
.c_str());
3109 if (S_ISDIR(st
.st_mode
)) {
3110 cerr
<< "journal-path: " << jpath
<< ": "
3111 << cpp_strerror(EISDIR
) << std::endl
;
3116 ObjectStore
*fs
= ObjectStore::create(g_ceph_context
, type
, dpath
, jpath
, flags
);
3118 cerr
<< "Unable to create store of type " << type
<< std::endl
;
3122 if (op
== "fsck" || op
== "fsck-deep") {
3123 int r
= fs
->fsck(op
== "fsck-deep");
3125 cerr
<< "fsck failed: " << cpp_strerror(r
) << std::endl
;
3129 cerr
<< "fsck found " << r
<< " errors" << std::endl
;
3132 cout
<< "fsck found no errors" << std::endl
;
3135 if (op
== "repair" || op
== "repair-deep") {
3136 int r
= fs
->repair(op
== "repair-deep");
3138 cerr
<< "repair failed: " << cpp_strerror(r
) << std::endl
;
3142 cerr
<< "repair found " << r
<< " errors" << std::endl
;
3145 cout
<< "repair found no errors" << std::endl
;
3149 if (fsid
.length()) {
3151 bool r
= f
.parse(fsid
.c_str());
3153 cerr
<< "failed to parse uuid '" << fsid
<< "'" << std::endl
;
3160 cerr
<< "mkfs failed: " << cpp_strerror(r
) << std::endl
;
3168 snprintf(fn
, sizeof(fn
), "%s/type", target_data_path
.c_str());
3169 int fd
= ::open(fn
, O_RDONLY
);
3171 cerr
<< "Unable to open " << target_data_path
<< "/type" << std::endl
;
3177 target_type
= string(bl
.c_str(), bl
.length() - 1); // drop \n
3180 ObjectStore
*targetfs
= ObjectStore::create(
3181 g_ceph_context
, target_type
,
3182 target_data_path
, "", 0);
3183 if (targetfs
== NULL
) {
3184 cerr
<< "Unable to open store of type " << target_type
<< std::endl
;
3187 int r
= dup(dpath
, fs
, target_data_path
, targetfs
);
3189 cerr
<< "dup failed: " << cpp_strerror(r
) << std::endl
;
3195 ObjectStore::Sequencer
*osr
= new ObjectStore::Sequencer(__func__
);
3196 int ret
= fs
->mount();
3198 if (ret
== -EBUSY
) {
3199 cerr
<< "OSD has the store locked" << std::endl
;
3201 cerr
<< "Mount failed with '" << cpp_strerror(ret
) << "'" << std::endl
;
3208 FuseStore
fuse(fs
, mountpoint
);
3209 cout
<< "mounting fuse at " << mountpoint
<< " ..." << std::endl
;
3210 int r
= fuse
.main();
3212 cerr
<< "failed to mount fuse: " << cpp_strerror(r
) << std::endl
;
3216 cerr
<< "fuse support not enabled" << std::endl
;
3222 vector
<coll_t
>::iterator it
;
3223 CompatSet supported
;
3225 #ifdef INTERNAL_TEST
3226 supported
= get_test_compat_set();
3228 supported
= OSD::get_osd_compat_set();
3232 OSDSuperblock superblock
;
3233 bufferlist::iterator p
;
3234 ret
= fs
->read(coll_t::meta(), OSD_SUPERBLOCK_GOBJECT
, 0, 0, bl
);
3236 cerr
<< "Failure to read OSD superblock: " << cpp_strerror(ret
) << std::endl
;
3241 ::decode(superblock
, p
);
3244 cerr
<< "Cluster fsid=" << superblock
.cluster_fsid
<< std::endl
;
3248 cerr
<< "Supported features: " << supported
<< std::endl
;
3249 cerr
<< "On-disk features: " << superblock
.compat_features
<< std::endl
;
3251 if (supported
.compare(superblock
.compat_features
) == -1) {
3252 CompatSet unsupported
= supported
.unsupported(superblock
.compat_features
);
3253 cerr
<< "On-disk OSD incompatible features set "
3254 << unsupported
<< std::endl
;
3259 if (op
== "apply-layout-settings") {
3260 ret
= apply_layout_settings(fs
, superblock
, pool
, pgid
, dry_run
);
3264 if (op
!= "list" && vm
.count("object")) {
3265 // Special case: Create pgmeta_oid if empty string specified
3266 // This can't conflict with any actual object names.
3268 ghobj
= pgid
.make_pgmeta_oid();
3270 json_spirit::Value v
;
3272 if (!json_spirit::read(object
, v
) ||
3273 (v
.type() != json_spirit::array_type
&& v
.type() != json_spirit::obj_type
)) {
3274 // Special: Need head/snapdir so set even if user didn't specify
3275 if (vm
.count("objcmd") && (objcmd
== "remove-clone-metadata"))
3277 lookup_ghobject
lookup(object
, nspace
, head
);
3278 if (action_on_all_objects(fs
, lookup
, debug
)) {
3279 throw std::runtime_error("Internal error");
3281 if (lookup
.size() != 1) {
3283 if (lookup
.size() == 0)
3284 ss
<< "No object id '" << object
<< "' found or invalid JSON specified";
3286 ss
<< "Found " << lookup
.size() << " objects with id '" << object
3287 << "', please use a JSON spec from --op list instead";
3288 throw std::runtime_error(ss
.str());
3290 pair
<coll_t
, ghobject_t
> found
= lookup
.pop();
3291 pgidstr
= found
.first
.to_str();
3292 pgid
.parse(pgidstr
.c_str());
3293 ghobj
= found
.second
;
3297 if (pgidstr
.length() == 0 && v
.type() != json_spirit::array_type
) {
3298 ss
<< "Without --pgid the object '" << object
3299 << "' must be a JSON array";
3300 throw std::runtime_error(ss
.str());
3302 if (v
.type() == json_spirit::array_type
) {
3303 json_spirit::Array array
= v
.get_array();
3304 if (array
.size() != 2) {
3305 ss
<< "Object '" << object
3306 << "' must be a JSON array with 2 elements";
3307 throw std::runtime_error(ss
.str());
3309 vector
<json_spirit::Value
>::iterator i
= array
.begin();
3310 assert(i
!= array
.end());
3311 if (i
->type() != json_spirit::str_type
) {
3312 ss
<< "Object '" << object
3313 << "' must be a JSON array with the first element a string";
3314 throw std::runtime_error(ss
.str());
3316 string object_pgidstr
= i
->get_str();
3317 if (object_pgidstr
!= "meta") {
3319 object_pgid
.parse(object_pgidstr
.c_str());
3320 if (pgidstr
.length() > 0) {
3321 if (object_pgid
!= pgid
) {
3322 ss
<< "object '" << object
3323 << "' has a pgid different from the --pgid="
3324 << pgidstr
<< " option";
3325 throw std::runtime_error(ss
.str());
3328 pgidstr
= object_pgidstr
;
3332 pgidstr
= object_pgidstr
;
3339 } catch (std::runtime_error
& e
) {
3340 ss
<< "Decode object JSON error: " << e
.what();
3341 throw std::runtime_error(ss
.str());
3343 if (pgidstr
!= "meta" && (uint64_t)pgid
.pgid
.m_pool
!= (uint64_t)ghobj
.hobj
.pool
) {
3344 cerr
<< "Object pool and pgid pool don't match" << std::endl
;
3349 } catch (std::runtime_error
& e
) {
3350 cerr
<< e
.what() << std::endl
;
3357 // The ops which require --pgid option are checked here and
3358 // mentioned in the usage for --pgid.
3359 if ((op
== "info" || op
== "log" || op
== "remove" || op
== "export"
3360 || op
== "export-remove" || op
== "rm-past-intervals" || op
== "mark-complete") &&
3361 pgidstr
.length() == 0) {
3362 cerr
<< "Must provide pgid" << std::endl
;
3368 if (op
== "import") {
3371 ret
= tool
.do_import(fs
, superblock
, force
, pgidstr
, *osr
);
3373 catch (const buffer::error
&e
) {
3374 cerr
<< "do_import threw exception error " << e
.what() << std::endl
;
3377 if (ret
== -EFAULT
) {
3378 cerr
<< "Corrupt input for import" << std::endl
;
3381 cout
<< "Import successful" << std::endl
;
3383 } else if (op
== "dump-journal-mount") {
3384 // Undocumented feature to dump journal with mounted fs
3385 // This doesn't support the format option, but it uses the
3386 // ObjectStore::dump_journal() and mounts to get replay to run.
3387 ret
= fs
->dump_journal(cout
);
3389 if (ret
== -EOPNOTSUPP
) {
3390 cerr
<< "Object store type \"" << type
<< "\" doesn't support journal dump" << std::endl
;
3392 cerr
<< "Journal dump failed with error " << cpp_strerror(ret
) << std::endl
;
3396 } else if (op
== "get-osdmap") {
3400 epoch
= superblock
.current_epoch
;
3402 ret
= get_osdmap(fs
, epoch
, osdmap
, bl
);
3404 cerr
<< "Failed to get osdmap#" << epoch
<< ": "
3405 << cpp_strerror(ret
) << std::endl
;
3408 ret
= bl
.write_fd(file_fd
);
3410 cerr
<< "Failed to write to " << file
<< ": " << cpp_strerror(ret
) << std::endl
;
3412 cout
<< "osdmap#" << epoch
<< " exported." << std::endl
;
3415 } else if (op
== "set-osdmap") {
3417 ret
= get_fd_data(file_fd
, bl
);
3419 cerr
<< "Failed to read osdmap " << cpp_strerror(ret
) << std::endl
;
3421 ret
= set_osdmap(fs
, epoch
, bl
, force
, *osr
);
3424 } else if (op
== "get-inc-osdmap") {
3427 epoch
= superblock
.current_epoch
;
3429 ret
= get_inc_osdmap(fs
, epoch
, bl
);
3431 cerr
<< "Failed to get incremental osdmap# " << epoch
<< ": "
3432 << cpp_strerror(ret
) << std::endl
;
3435 ret
= bl
.write_fd(file_fd
);
3437 cerr
<< "Failed to write to " << file
<< ": " << cpp_strerror(ret
) << std::endl
;
3439 cout
<< "inc-osdmap#" << epoch
<< " exported." << std::endl
;
3442 } else if (op
== "set-inc-osdmap") {
3444 ret
= get_fd_data(file_fd
, bl
);
3446 cerr
<< "Failed to read incremental osdmap " << cpp_strerror(ret
) << std::endl
;
3449 ret
= set_inc_osdmap(fs
, epoch
, bl
, force
, *osr
);
3452 } else if (op
== "update-mon-db") {
3453 if (!vm
.count("mon-store-path")) {
3454 cerr
<< "Please specify the path to monitor db to update" << std::endl
;
3457 ret
= update_mon_db(*fs
, superblock
, dpath
+ "/keyring", mon_store_path
);
3462 log_oid
= OSD::make_pg_log_oid(pgid
);
3463 biginfo_oid
= OSD::make_pg_biginfo_oid(pgid
);
3465 if (op
== "remove") {
3466 if (!force
&& !dry_run
) {
3467 cerr
<< "Please use export-remove or you must use --force option" << std::endl
;
3471 ret
= initiate_new_remove_pg(fs
, pgid
, *osr
);
3473 cerr
<< "PG '" << pgid
<< "' not found" << std::endl
;
3476 cout
<< "Remove successful" << std::endl
;
3480 if (op
== "fix-lost") {
3481 boost::scoped_ptr
<action_on_object_t
> action
;
3482 action
.reset(new do_fix_lost(osr
));
3483 if (pgidstr
.length())
3484 ret
= action_on_all_objects_in_exact_pg(fs
, coll_t(pgid
), *action
, debug
);
3486 ret
= action_on_all_objects(fs
, *action
, debug
);
3491 ret
= do_list(fs
, pgidstr
, object
, nspace
, formatter
, debug
,
3492 human_readable
, head
);
3494 cerr
<< "do_list failed: " << cpp_strerror(ret
) << std::endl
;
3499 if (op
== "dump-super") {
3500 formatter
->open_object_section("superblock");
3501 superblock
.dump(formatter
);
3502 formatter
->close_section();
3503 formatter
->flush(cout
);
3508 if (op
== "meta-list") {
3509 ret
= do_meta(fs
, object
, formatter
, debug
, human_readable
);
3511 cerr
<< "do_meta failed: " << cpp_strerror(ret
) << std::endl
;
3516 ret
= fs
->list_collections(ls
);
3518 cerr
<< "failed to list pgs: " << cpp_strerror(ret
) << std::endl
;
3522 if (debug
&& op
== "list-pgs")
3523 cout
<< "Performing list-pgs operation" << std::endl
;
3526 for (it
= ls
.begin(); it
!= ls
.end(); ++it
) {
3529 if (pgidstr
== "meta") {
3530 if (it
->to_str() == "meta")
3536 if (!it
->is_pg(&tmppgid
)) {
3540 if (it
->is_temp(&tmppgid
)) {
3544 if (op
!= "list-pgs" && tmppgid
!= pgid
) {
3548 if (op
!= "list-pgs") {
3553 cout
<< tmppgid
<< std::endl
;
3556 if (op
== "list-pgs") {
3561 // If not an object command nor any of the ops handled below, then output this usage
3562 // before complaining about a bad pgid
3563 if (!vm
.count("objcmd") && op
!= "export" && op
!= "export-remove" && op
!= "info" && op
!= "log" && op
!= "rm-past-intervals" && op
!= "mark-complete") {
3564 cerr
<< "Must provide --op (info, log, remove, mkfs, fsck, repair, export, export-remove, import, list, fix-lost, list-pgs, rm-past-intervals, dump-journal, dump-super, meta-list, "
3565 "get-osdmap, set-osdmap, get-inc-osdmap, set-inc-osdmap, mark-complete, dump-import)"
3572 // The following code for export, info, log require omap or !skip-mount-omap
3573 if (it
!= ls
.end()) {
3577 if (vm
.count("objcmd")) {
3579 if (objcmd
== "remove" || objcmd
== "removeall") {
3580 bool all
= (objcmd
== "removeall");
3581 ret
= do_remove_object(fs
, coll
, ghobj
, all
, force
, *osr
);
3583 } else if (objcmd
== "list-attrs") {
3584 ret
= do_list_attrs(fs
, coll
, ghobj
);
3586 } else if (objcmd
== "list-omap") {
3587 ret
= do_list_omap(fs
, coll
, ghobj
);
3589 } else if (objcmd
== "get-bytes" || objcmd
== "set-bytes") {
3590 if (objcmd
== "get-bytes") {
3592 if (vm
.count("arg1") == 0 || arg1
== "-") {
3595 fd
= open(arg1
.c_str(), O_WRONLY
|O_TRUNC
|O_CREAT
|O_EXCL
|O_LARGEFILE
, 0666);
3597 cerr
<< "open " << arg1
<< " " << cpp_strerror(errno
) << std::endl
;
3602 ret
= do_get_bytes(fs
, coll
, ghobj
, fd
);
3603 if (fd
!= STDOUT_FILENO
)
3607 if (vm
.count("arg1") == 0 || arg1
== "-") {
3608 // Since read_fd() doesn't handle ^D from a tty stdin, don't allow it.
3609 if (isatty(STDIN_FILENO
)) {
3610 cerr
<< "stdin is a tty and no file specified" << std::endl
;
3616 fd
= open(arg1
.c_str(), O_RDONLY
|O_LARGEFILE
, 0666);
3618 cerr
<< "open " << arg1
<< " " << cpp_strerror(errno
) << std::endl
;
3623 ret
= do_set_bytes(fs
, coll
, ghobj
, fd
, *osr
);
3624 if (fd
!= STDIN_FILENO
)
3628 } else if (objcmd
== "get-attr") {
3629 if (vm
.count("arg1") == 0) {
3634 ret
= do_get_attr(fs
, coll
, ghobj
, arg1
);
3636 } else if (objcmd
== "set-attr") {
3637 if (vm
.count("arg1") == 0) {
3643 if (vm
.count("arg2") == 0 || arg2
== "-") {
3644 // Since read_fd() doesn't handle ^D from a tty stdin, don't allow it.
3645 if (isatty(STDIN_FILENO
)) {
3646 cerr
<< "stdin is a tty and no file specified" << std::endl
;
3652 fd
= open(arg2
.c_str(), O_RDONLY
|O_LARGEFILE
, 0666);
3654 cerr
<< "open " << arg2
<< " " << cpp_strerror(errno
) << std::endl
;
3659 ret
= do_set_attr(fs
, coll
, ghobj
, arg1
, fd
, *osr
);
3660 if (fd
!= STDIN_FILENO
)
3663 } else if (objcmd
== "rm-attr") {
3664 if (vm
.count("arg1") == 0) {
3669 ret
= do_rm_attr(fs
, coll
, ghobj
, arg1
, *osr
);
3671 } else if (objcmd
== "get-omap") {
3672 if (vm
.count("arg1") == 0) {
3677 ret
= do_get_omap(fs
, coll
, ghobj
, arg1
);
3679 } else if (objcmd
== "set-omap") {
3680 if (vm
.count("arg1") == 0) {
3686 if (vm
.count("arg2") == 0 || arg2
== "-") {
3687 // Since read_fd() doesn't handle ^D from a tty stdin, don't allow it.
3688 if (isatty(STDIN_FILENO
)) {
3689 cerr
<< "stdin is a tty and no file specified" << std::endl
;
3695 fd
= open(arg2
.c_str(), O_RDONLY
|O_LARGEFILE
, 0666);
3697 cerr
<< "open " << arg2
<< " " << cpp_strerror(errno
) << std::endl
;
3702 ret
= do_set_omap(fs
, coll
, ghobj
, arg1
, fd
, *osr
);
3703 if (fd
!= STDIN_FILENO
)
3706 } else if (objcmd
== "rm-omap") {
3707 if (vm
.count("arg1") == 0) {
3712 ret
= do_rm_omap(fs
, coll
, ghobj
, arg1
, *osr
);
3714 } else if (objcmd
== "get-omaphdr") {
3715 if (vm
.count("arg1")) {
3720 ret
= do_get_omaphdr(fs
, coll
, ghobj
);
3722 } else if (objcmd
== "set-omaphdr") {
3724 if (vm
.count("arg2")) {
3730 if (vm
.count("arg1") == 0 || arg1
== "-") {
3731 // Since read_fd() doesn't handle ^D from a tty stdin, don't allow it.
3732 if (isatty(STDIN_FILENO
)) {
3733 cerr
<< "stdin is a tty and no file specified" << std::endl
;
3739 fd
= open(arg1
.c_str(), O_RDONLY
|O_LARGEFILE
, 0666);
3741 cerr
<< "open " << arg1
<< " " << cpp_strerror(errno
) << std::endl
;
3746 ret
= do_set_omaphdr(fs
, coll
, ghobj
, fd
, *osr
);
3747 if (fd
!= STDIN_FILENO
)
3750 } else if (objcmd
== "dump") {
3751 // There should not be any other arguments
3752 if (vm
.count("arg1") || vm
.count("arg2")) {
3757 ret
= print_obj_info(fs
, coll
, ghobj
, formatter
);
3759 } else if (objcmd
== "set-size" || objcmd
== "corrupt-size") {
3760 // Undocumented testing feature
3761 bool corrupt
= (objcmd
== "corrupt-size");
3763 if (vm
.count("arg1") == 0 || vm
.count("arg2")) {
3768 if (arg1
.length() == 0 || !isdigit(arg1
.c_str()[0])) {
3769 cerr
<< "Invalid size '" << arg1
<< "' specified" << std::endl
;
3773 uint64_t size
= atoll(arg1
.c_str());
3774 ret
= set_size(fs
, coll
, ghobj
, size
, formatter
, *osr
, corrupt
);
3776 } else if (objcmd
== "clear-snapset") {
3777 // UNDOCUMENTED: For testing zap SnapSet
3778 // IGNORE extra args since not in usage anyway
3779 if (!ghobj
.hobj
.has_snapset()) {
3780 cerr
<< "'" << objcmd
<< "' requires a head or snapdir object" << std::endl
;
3784 ret
= clear_snapset(fs
, coll
, ghobj
, arg1
, *osr
);
3786 } else if (objcmd
== "remove-clone-metadata") {
3788 if (vm
.count("arg1") == 0 || vm
.count("arg2")) {
3793 if (!ghobj
.hobj
.has_snapset()) {
3794 cerr
<< "'" << objcmd
<< "' requires a head or snapdir object" << std::endl
;
3798 if (arg1
.length() == 0 || !isdigit(arg1
.c_str()[0])) {
3799 cerr
<< "Invalid cloneid '" << arg1
<< "' specified" << std::endl
;
3803 snapid_t cloneid
= atoi(arg1
.c_str());
3804 ret
= remove_clone(fs
, coll
, ghobj
, cloneid
, force
, *osr
);
3807 cerr
<< "Unknown object command '" << objcmd
<< "'" << std::endl
;
3815 ret
= PG::peek_map_epoch(fs
, pgid
, &map_epoch
, &bl
);
3817 cerr
<< "peek_map_epoch reports error" << std::endl
;
3819 cerr
<< "map_epoch " << map_epoch
<< std::endl
;
3821 pg_info_t
info(pgid
);
3822 PastIntervals past_intervals
;
3824 ret
= PG::read_info(fs
, pgid
, coll
, bl
, info
, past_intervals
,
3827 cerr
<< "read_info error " << cpp_strerror(ret
) << std::endl
;
3830 if (struct_ver
< PG::compat_struct_v
) {
3831 cerr
<< "PG is too old to upgrade, use older Ceph version" << std::endl
;
3836 cerr
<< "struct_v " << (int)struct_ver
<< std::endl
;
3838 if (op
== "export" || op
== "export-remove") {
3839 ret
= tool
.do_export(fs
, coll
, pgid
, info
, map_epoch
, struct_ver
, superblock
, past_intervals
);
3841 cerr
<< "Export successful" << std::endl
;
3842 if (op
== "export-remove") {
3843 ret
= initiate_new_remove_pg(fs
, pgid
, *osr
);
3844 // Export succeeded, so pgid is there
3846 cerr
<< "Remove successful" << std::endl
;
3849 } else if (op
== "info") {
3850 formatter
->open_object_section("info");
3851 info
.dump(formatter
);
3852 formatter
->close_section();
3853 formatter
->flush(cout
);
3855 } else if (op
== "log") {
3856 PGLog::IndexedLog log
;
3857 pg_missing_t missing
;
3858 ret
= get_log(fs
, struct_ver
, coll
, pgid
, info
, log
, missing
);
3862 dump_log(formatter
, cout
, log
, missing
);
3863 } else if (op
== "rm-past-intervals") {
3864 ObjectStore::Transaction tran
;
3865 ObjectStore::Transaction
*t
= &tran
;
3867 if (struct_ver
< PG::compat_struct_v
) {
3868 cerr
<< "Can't remove past-intervals, version mismatch " << (int)struct_ver
3869 << " (pg) < compat " << (int)PG::compat_struct_v
<< " (tool)"
3875 cout
<< "Remove past-intervals " << past_intervals
<< std::endl
;
3877 past_intervals
.clear();
3882 ret
= write_info(*t
, map_epoch
, info
, past_intervals
);
3885 fs
->apply_transaction(osr
, std::move(*t
));
3886 cout
<< "Removal succeeded" << std::endl
;
3888 } else if (op
== "mark-complete") {
3889 ObjectStore::Transaction tran
;
3890 ObjectStore::Transaction
*t
= &tran
;
3892 if (struct_ver
< PG::compat_struct_v
) {
3893 cerr
<< "Can't mark-complete, version mismatch " << (int)struct_ver
3894 << " (pg) < compat " << (int)PG::compat_struct_v
<< " (tool)"
3900 cout
<< "Marking complete " << std::endl
;
3902 info
.last_update
= eversion_t(superblock
.current_epoch
, info
.last_update
.version
+ 1);
3903 info
.last_backfill
= hobject_t::get_max();
3904 info
.last_epoch_started
= superblock
.current_epoch
;
3905 info
.history
.last_epoch_started
= superblock
.current_epoch
;
3906 info
.history
.last_epoch_clean
= superblock
.current_epoch
;
3907 past_intervals
.clear();
3910 ret
= write_info(*t
, map_epoch
, info
, past_intervals
);
3913 fs
->apply_transaction(osr
, std::move(*t
));
3915 cout
<< "Marking complete succeeded" << std::endl
;
3917 assert(!"Should have already checked for valid --op");
3920 cerr
<< "PG '" << pgid
<< "' not found" << std::endl
;
3925 int r
= fs
->umount();
3928 cerr
<< "umount failed: " << cpp_strerror(r
) << std::endl
;
3929 // If no previous error, then use umount() error
3935 // Export output can go to stdout, so put this message on stderr
3937 cerr
<< "dry-run: Nothing changed" << std::endl
;
3939 cout
<< "dry-run: Nothing changed" << std::endl
;