]> git.proxmox.com Git - ceph.git/blob - ceph/src/tools/ceph_objectstore_tool.cc
9fcbbdf3e145c0c92ff44525fe4e83f1f166bbfe
[ceph.git] / ceph / src / tools / ceph_objectstore_tool.cc
1 // -*- mode:C++; tab-width:8; c-basic-offset:2; indent-tabs-mode:t -*-
2 // vim: ts=8 sw=2 smarttab
3 /*
4 * Ceph - scalable distributed file system
5 *
6 * Copyright (C) 2013 Inktank
7 *
8 * This is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU Lesser General Public
10 * License version 2.1, as published by the Free Software
11 * Foundation. See file COPYING.
12 *
13 */
14
15 #include <boost/program_options/variables_map.hpp>
16 #include <boost/program_options/parsers.hpp>
17 #include <boost/scoped_ptr.hpp>
18 #include <boost/optional.hpp>
19
20 #include <stdlib.h>
21
22 #include "common/Formatter.h"
23 #include "common/errno.h"
24 #include "common/ceph_argparse.h"
25
26 #include "global/global_init.h"
27
28 #include "os/ObjectStore.h"
29 #include "os/filestore/FileJournal.h"
30 #include "os/filestore/FileStore.h"
31 #ifdef HAVE_LIBFUSE
32 #include "os/FuseStore.h"
33 #endif
34
35 #include "osd/PGLog.h"
36 #include "osd/OSD.h"
37 #include "osd/PG.h"
38
39 #include "json_spirit/json_spirit_value.h"
40 #include "json_spirit/json_spirit_reader.h"
41
42 #include "rebuild_mondb.h"
43 #include "ceph_objectstore_tool.h"
44 #include "include/compat.h"
45 #include "include/util.h"
46
47 namespace po = boost::program_options;
48 using namespace std;
49
50 #ifdef INTERNAL_TEST
51 CompatSet get_test_compat_set() {
52 CompatSet::FeatureSet ceph_osd_feature_compat;
53 CompatSet::FeatureSet ceph_osd_feature_ro_compat;
54 CompatSet::FeatureSet ceph_osd_feature_incompat;
55 ceph_osd_feature_incompat.insert(CEPH_OSD_FEATURE_INCOMPAT_BASE);
56 ceph_osd_feature_incompat.insert(CEPH_OSD_FEATURE_INCOMPAT_PGINFO);
57 ceph_osd_feature_incompat.insert(CEPH_OSD_FEATURE_INCOMPAT_OLOC);
58 ceph_osd_feature_incompat.insert(CEPH_OSD_FEATURE_INCOMPAT_LEC);
59 ceph_osd_feature_incompat.insert(CEPH_OSD_FEATURE_INCOMPAT_CATEGORIES);
60 ceph_osd_feature_incompat.insert(CEPH_OSD_FEATURE_INCOMPAT_HOBJECTPOOL);
61 ceph_osd_feature_incompat.insert(CEPH_OSD_FEATURE_INCOMPAT_BIGINFO);
62 ceph_osd_feature_incompat.insert(CEPH_OSD_FEATURE_INCOMPAT_LEVELDBINFO);
63 ceph_osd_feature_incompat.insert(CEPH_OSD_FEATURE_INCOMPAT_LEVELDBLOG);
64 #ifdef INTERNAL_TEST2
65 ceph_osd_feature_incompat.insert(CEPH_OSD_FEATURE_INCOMPAT_SNAPMAPPER);
66 ceph_osd_feature_incompat.insert(CEPH_OSD_FEATURE_INCOMPAT_SHARDS);
67 #endif
68 return CompatSet(ceph_osd_feature_compat, ceph_osd_feature_ro_compat,
69 ceph_osd_feature_incompat);
70 }
71 #endif
72
// Upper bound, in bytes (1 MiB), on a single read request issued by the
// helpers in this file.
const ssize_t max_read = 1024 * 1024;
// Sentinel for "no descriptor"; file_fd starts out with this value.
const int fd_none = INT_MIN;
// NOTE(review): presumably records whether stdout is a tty; it is not
// assigned or read in the part of the file reviewed here.
bool outistty;
// When set, the mutating helpers below return before applying their
// transactions to the store.
bool dry_run = false;
77
// Callback interface used by the action_on_all_objects* helpers in this file
// to visit objects one at a time.
struct action_on_object_t {
  virtual ~action_on_object_t() {}
  // Called once per visited object.  A negative return value makes
  // _action_on_all_objects_in_pg() stop and hand that value to its caller.
  virtual int call(ObjectStore *store, coll_t coll, ghobject_t &ghobj, object_info_t &oi) = 0;
};
82
83 int _action_on_all_objects_in_pg(ObjectStore *store, coll_t coll, action_on_object_t &action, bool debug)
84 {
85 unsigned LIST_AT_A_TIME = 100;
86 ghobject_t next;
87 while (!next.is_max()) {
88 vector<ghobject_t> list;
89 int r = store->collection_list(
90 coll,
91 next,
92 ghobject_t::get_max(),
93 LIST_AT_A_TIME,
94 &list,
95 &next);
96 if (r < 0) {
97 cerr << "Error listing collection: " << coll << ", "
98 << cpp_strerror(r) << std::endl;
99 return r;
100 }
101 for (vector<ghobject_t>::iterator obj = list.begin();
102 obj != list.end();
103 ++obj) {
104 if (obj->is_pgmeta())
105 continue;
106 object_info_t oi;
107 if (coll != coll_t::meta()) {
108 bufferlist attr;
109 r = store->getattr(coll, *obj, OI_ATTR, attr);
110 if (r < 0) {
111 cerr << "Error getting attr on : " << make_pair(coll, *obj) << ", "
112 << cpp_strerror(r) << std::endl;
113 continue;
114 }
115 bufferlist::iterator bp = attr.begin();
116 try {
117 ::decode(oi, bp);
118 } catch (...) {
119 r = -EINVAL;
120 cerr << "Error getting attr on : " << make_pair(coll, *obj) << ", "
121 << cpp_strerror(r) << std::endl;
122 continue;
123 }
124 }
125 r = action.call(store, coll, *obj, oi);
126 if (r < 0)
127 return r;
128 }
129 }
130 return 0;
131 }
132
133 int action_on_all_objects_in_pg(ObjectStore *store, string pgidstr, action_on_object_t &action, bool debug)
134 {
135 spg_t pgid;
136 // Scan collections in case this is an ec pool but no shard specified
137 unsigned scanned = 0;
138 int r = 0;
139 vector<coll_t> colls_to_check;
140 vector<coll_t> candidates;
141 r = store->list_collections(candidates);
142 if (r < 0) {
143 cerr << "Error listing collections: " << cpp_strerror(r) << std::endl;
144 return r;
145 }
146 pgid.parse(pgidstr.c_str());
147 for (vector<coll_t>::iterator i = candidates.begin();
148 i != candidates.end();
149 ++i) {
150 spg_t cand_pgid;
151 if (!i->is_pg(&cand_pgid))
152 continue;
153
154 // If an exact match or treat no shard as any shard
155 if (cand_pgid == pgid ||
156 (pgid.is_no_shard() && pgid.pgid == cand_pgid.pgid)) {
157 colls_to_check.push_back(*i);
158 }
159 }
160
161 if (debug)
162 cerr << colls_to_check.size() << " pgs to scan" << std::endl;
163 for (vector<coll_t>::iterator i = colls_to_check.begin();
164 i != colls_to_check.end();
165 ++i, ++scanned) {
166 if (debug)
167 cerr << "Scanning " << *i << ", " << scanned << "/"
168 << colls_to_check.size() << " completed" << std::endl;
169 r = _action_on_all_objects_in_pg(store, *i, action, debug);
170 if (r < 0)
171 break;
172 }
173 return r;
174 }
175
176 int action_on_all_objects_in_exact_pg(ObjectStore *store, coll_t coll, action_on_object_t &action, bool debug)
177 {
178 int r = _action_on_all_objects_in_pg(store, coll, action, debug);
179 return r;
180 }
181
182 int _action_on_all_objects(ObjectStore *store, action_on_object_t &action, bool debug)
183 {
184 unsigned scanned = 0;
185 int r = 0;
186 vector<coll_t> colls_to_check;
187 vector<coll_t> candidates;
188 r = store->list_collections(candidates);
189 if (r < 0) {
190 cerr << "Error listing collections: " << cpp_strerror(r) << std::endl;
191 return r;
192 }
193 for (vector<coll_t>::iterator i = candidates.begin();
194 i != candidates.end();
195 ++i) {
196 if (i->is_pg()) {
197 colls_to_check.push_back(*i);
198 }
199 }
200
201 if (debug)
202 cerr << colls_to_check.size() << " pgs to scan" << std::endl;
203 for (vector<coll_t>::iterator i = colls_to_check.begin();
204 i != colls_to_check.end();
205 ++i, ++scanned) {
206 if (debug)
207 cerr << "Scanning " << *i << ", " << scanned << "/"
208 << colls_to_check.size() << " completed" << std::endl;
209 r = _action_on_all_objects_in_pg(store, *i, action, debug);
210 if (r < 0)
211 return r;
212 }
213 return 0;
214 }
215
216 int action_on_all_objects(ObjectStore *store, action_on_object_t &action, bool debug)
217 {
218 int r = _action_on_all_objects(store, action, debug);
219 return r;
220 }
221
222 struct pgid_object_list {
223 list<pair<coll_t, ghobject_t> > _objects;
224
225 void insert(coll_t coll, ghobject_t &ghobj) {
226 _objects.push_back(make_pair(coll, ghobj));
227 }
228
229 void dump(Formatter *f, bool human_readable) const {
230 if (!human_readable)
231 f->open_array_section("pgid_objects");
232 for (list<pair<coll_t, ghobject_t> >::const_iterator i = _objects.begin();
233 i != _objects.end();
234 ++i) {
235 f->open_array_section("pgid_object");
236 spg_t pgid;
237 bool is_pg = i->first.is_pg(&pgid);
238 if (is_pg)
239 f->dump_string("pgid", stringify(pgid));
240 if (!is_pg || !human_readable)
241 f->dump_string("coll", i->first.to_str());
242 f->open_object_section("ghobject");
243 i->second.dump(f);
244 f->close_section();
245 f->close_section();
246 if (human_readable) {
247 f->flush(cout);
248 cout << std::endl;
249 }
250 }
251 if (!human_readable) {
252 f->close_section();
253 f->flush(cout);
254 cout << std::endl;
255 }
256 }
257 };
258
259 struct lookup_ghobject : public action_on_object_t {
260 pgid_object_list _objects;
261 const string _name;
262 const boost::optional<std::string> _namespace;
263 bool _need_snapset;
264
265 lookup_ghobject(const string& name, const boost::optional<std::string>& nspace, bool need_snapset = false) : _name(name),
266 _namespace(nspace), _need_snapset(need_snapset) { }
267
268 int call(ObjectStore *store, coll_t coll, ghobject_t &ghobj, object_info_t &oi) override {
269 if (_need_snapset && !ghobj.hobj.has_snapset())
270 return 0;
271 if ((_name.length() == 0 || ghobj.hobj.oid.name == _name) &&
272 (!_namespace || ghobj.hobj.nspace == _namespace))
273 _objects.insert(coll, ghobj);
274 return 0;
275 }
276
277 int size() const {
278 return _objects._objects.size();
279 }
280
281 pair<coll_t, ghobject_t> pop() {
282 pair<coll_t, ghobject_t> front = _objects._objects.front();
283 _objects._objects.pop_front();
284 return front;
285 }
286
287 void dump(Formatter *f, bool human_readable) const {
288 _objects.dump(f, human_readable);
289 }
290 };
291
// Well-known object ids.  log_oid is the object get_log() reads from (in the
// meta collection) when struct_ver is below 8.
// NOTE(review): log_oid and biginfo_oid are default-constructed here; they
// are presumably assigned elsewhere in the file — confirm.
ghobject_t infos_oid = OSD::make_infos_oid();
ghobject_t log_oid;
ghobject_t biginfo_oid;

// Descriptor the export helpers write their sections to; fd_none until set.
int file_fd = fd_none;
// Enables the extra diagnostics written to stderr by the helpers below.
bool debug = false;
// NOTE(review): sh and testalign are not referenced in the part of the file
// reviewed here.
super_header sh;
uint64_t testalign;
300
301 static int get_fd_data(int fd, bufferlist &bl)
302 {
303 uint64_t total = 0;
304 do {
305 ssize_t bytes = bl.read_fd(fd, max_read);
306 if (bytes < 0) {
307 cerr << "read_fd error " << cpp_strerror(bytes) << std::endl;
308 return bytes;
309 }
310
311 if (bytes == 0)
312 break;
313
314 total += bytes;
315 } while(true);
316
317 assert(bl.length() == total);
318 return 0;
319 }
320
321 int get_log(ObjectStore *fs, __u8 struct_ver,
322 coll_t coll, spg_t pgid, const pg_info_t &info,
323 PGLog::IndexedLog &log, pg_missing_t &missing)
324 {
325 try {
326 ostringstream oss;
327 assert(struct_ver > 0);
328 PGLog::read_log_and_missing(fs, coll,
329 struct_ver >= 8 ? coll : coll_t::meta(),
330 struct_ver >= 8 ? pgid.make_pgmeta_oid() : log_oid,
331 info, log, missing, oss,
332 g_ceph_context->_conf->osd_ignore_stale_divergent_priors);
333 if (debug && oss.str().size())
334 cerr << oss.str() << std::endl;
335 }
336 catch (const buffer::error &e) {
337 cerr << "read_log_and_missing threw exception error " << e.what() << std::endl;
338 return -EFAULT;
339 }
340 return 0;
341 }
342
// Write `log` and `missing` to `out` through `formatter` as one "op_log"
// object containing a "pg_log_t" section, a "pg_missing_t" section and an
// empty "map" section.  The formatter is flushed after each of the first two
// sections and once more after "op_log" is closed.
void dump_log(Formatter *formatter, ostream &out, pg_log_t &log,
	      pg_missing_t &missing)
{
  formatter->open_object_section("op_log");
  formatter->open_object_section("pg_log_t");
  log.dump(formatter);
  formatter->close_section();
  formatter->flush(out);
  formatter->open_object_section("pg_missing_t");
  missing.dump(formatter);
  formatter->close_section();
  formatter->flush(out);
  // The "map" section is opened and closed immediately, so it is emitted
  // empty.
  formatter->open_object_section("map");
  formatter->close_section();
  formatter->close_section();
  formatter->flush(out);
}
360
361 //Based on part of OSD::load_pgs()
362 int finish_remove_pgs(ObjectStore *store)
363 {
364 vector<coll_t> ls;
365 int r = store->list_collections(ls);
366 if (r < 0) {
367 cerr << "finish_remove_pgs: failed to list pgs: " << cpp_strerror(r)
368 << std::endl;
369 return r;
370 }
371
372 for (vector<coll_t>::iterator it = ls.begin();
373 it != ls.end();
374 ++it) {
375 spg_t pgid;
376
377 if (it->is_temp(&pgid) ||
378 (it->is_pg(&pgid) && PG::_has_removal_flag(store, pgid))) {
379 cout << "finish_remove_pgs " << *it << " removing " << pgid << std::endl;
380 OSD::recursive_remove_collection(g_ceph_context, store, pgid, *it);
381 continue;
382 }
383
384 //cout << "finish_remove_pgs ignoring unrecognized " << *it << std::endl;
385 }
386 return 0;
387 }
388
389 #pragma GCC diagnostic ignored "-Wpragmas"
390 #pragma GCC diagnostic push
391 #pragma GCC diagnostic ignored "-Wdeprecated-declarations"
392
393 int mark_pg_for_removal(ObjectStore *fs, spg_t pgid, ObjectStore::Transaction *t)
394 {
395 pg_info_t info(pgid);
396 coll_t coll(pgid);
397 ghobject_t pgmeta_oid(info.pgid.make_pgmeta_oid());
398
399 bufferlist bl;
400 epoch_t map_epoch = 0;
401 int r = PG::peek_map_epoch(fs, pgid, &map_epoch, &bl);
402 if (r < 0)
403 cerr << __func__ << " warning: peek_map_epoch reported error" << std::endl;
404 PastIntervals past_intervals;
405 __u8 struct_v;
406 r = PG::read_info(fs, pgid, coll, bl, info, past_intervals, struct_v);
407 if (r < 0) {
408 cerr << __func__ << " error on read_info " << cpp_strerror(r) << std::endl;
409 return r;
410 }
411 assert(struct_v >= 8);
412 // new omap key
413 cout << "setting '_remove' omap key" << std::endl;
414 map<string,bufferlist> values;
415 ::encode((char)1, values["_remove"]);
416 t->omap_setkeys(coll, pgmeta_oid, values);
417 return 0;
418 }
419
420 #pragma GCC diagnostic pop
421 #pragma GCC diagnostic warning "-Wpragmas"
422
423 int initiate_new_remove_pg(ObjectStore *store, spg_t r_pgid,
424 ObjectStore::Sequencer &osr)
425 {
426 if (!dry_run)
427 finish_remove_pgs(store);
428 if (!store->collection_exists(coll_t(r_pgid)))
429 return -ENOENT;
430
431 cout << " marking collection for removal" << std::endl;
432 if (dry_run)
433 return 0;
434 ObjectStore::Transaction rmt;
435 int r = mark_pg_for_removal(store, r_pgid, &rmt);
436 if (r < 0) {
437 return r;
438 }
439 store->apply_transaction(&osr, std::move(rmt));
440 finish_remove_pgs(store);
441 return r;
442 }
443
444 int write_info(ObjectStore::Transaction &t, epoch_t epoch, pg_info_t &info,
445 PastIntervals &past_intervals)
446 {
447 //Empty for this
448 coll_t coll(info.pgid);
449 ghobject_t pgmeta_oid(info.pgid.make_pgmeta_oid());
450 map<string,bufferlist> km;
451 pg_info_t last_written_info;
452 int ret = PG::_prepare_write_info(
453 g_ceph_context,
454 &km, epoch,
455 info,
456 last_written_info,
457 past_intervals,
458 true, true, false);
459 if (ret) cerr << "Failed to write info" << std::endl;
460 t.omap_setkeys(coll, pgmeta_oid, km);
461 return ret;
462 }
463
464 typedef map<eversion_t, hobject_t> divergent_priors_t;
465
466 int write_pg(ObjectStore::Transaction &t, epoch_t epoch, pg_info_t &info,
467 pg_log_t &log, PastIntervals &past_intervals,
468 divergent_priors_t &divergent,
469 pg_missing_t &missing)
470 {
471 int ret = write_info(t, epoch, info, past_intervals);
472 if (ret)
473 return ret;
474 coll_t coll(info.pgid);
475 map<string,bufferlist> km;
476
477 if (!divergent.empty()) {
478 assert(missing.get_items().empty());
479 PGLog::write_log_and_missing_wo_missing(
480 t, &km, log, coll, info.pgid.make_pgmeta_oid(), divergent, true);
481 } else {
482 pg_missing_tracker_t tmissing(missing);
483 PGLog::write_log_and_missing(
484 t, &km, log, coll, info.pgid.make_pgmeta_oid(), tmissing, true);
485 }
486 t.omap_setkeys(coll, info.pgid.make_pgmeta_oid(), km);
487 return 0;
488 }
489
490 const int OMAP_BATCH_SIZE = 25;
491 void get_omap_batch(ObjectMap::ObjectMapIterator &iter, map<string, bufferlist> &oset)
492 {
493 oset.clear();
494 for (int count = OMAP_BATCH_SIZE; count && iter->valid(); --count, iter->next()) {
495 oset.insert(pair<string, bufferlist>(iter->key(), iter->value()));
496 }
497 }
498
499 int ObjectStoreTool::export_file(ObjectStore *store, coll_t cid, ghobject_t &obj)
500 {
501 struct stat st;
502 mysize_t total;
503 footer ft;
504
505 int ret = store->stat(cid, obj, &st);
506 if (ret < 0)
507 return ret;
508
509 cerr << "Read " << obj << std::endl;
510
511 total = st.st_size;
512 if (debug)
513 cerr << "size=" << total << std::endl;
514
515 object_begin objb(obj);
516
517 {
518 bufferptr bp;
519 bufferlist bl;
520 ret = store->getattr(cid, obj, OI_ATTR, bp);
521 if (ret < 0) {
522 cerr << "getattr failure object_info " << ret << std::endl;
523 return ret;
524 }
525 bl.push_back(bp);
526 decode(objb.oi, bl);
527 if (debug)
528 cerr << "object_info: " << objb.oi << std::endl;
529 }
530
531 // NOTE: we include whiteouts, lost, etc.
532
533 ret = write_section(TYPE_OBJECT_BEGIN, objb, file_fd);
534 if (ret < 0)
535 return ret;
536
537 uint64_t offset = 0;
538 bufferlist rawdatabl;
539 while(total > 0) {
540 rawdatabl.clear();
541 mysize_t len = max_read;
542 if (len > total)
543 len = total;
544
545 ret = store->read(cid, obj, offset, len, rawdatabl);
546 if (ret < 0)
547 return ret;
548 if (ret == 0)
549 return -EINVAL;
550
551 data_section dblock(offset, len, rawdatabl);
552 if (debug)
553 cerr << "data section offset=" << offset << " len=" << len << std::endl;
554
555 total -= ret;
556 offset += ret;
557
558 ret = write_section(TYPE_DATA, dblock, file_fd);
559 if (ret) return ret;
560 }
561
562 //Handle attrs for this object
563 map<string,bufferptr> aset;
564 ret = store->getattrs(cid, obj, aset);
565 if (ret) return ret;
566 attr_section as(aset);
567 ret = write_section(TYPE_ATTRS, as, file_fd);
568 if (ret)
569 return ret;
570
571 if (debug) {
572 cerr << "attrs size " << aset.size() << std::endl;
573 }
574
575 //Handle omap information
576 bufferlist hdrbuf;
577 ret = store->omap_get_header(cid, obj, &hdrbuf, true);
578 if (ret < 0) {
579 cerr << "omap_get_header: " << cpp_strerror(ret) << std::endl;
580 return ret;
581 }
582
583 omap_hdr_section ohs(hdrbuf);
584 ret = write_section(TYPE_OMAP_HDR, ohs, file_fd);
585 if (ret)
586 return ret;
587
588 ObjectMap::ObjectMapIterator iter = store->get_omap_iterator(cid, obj);
589 if (!iter) {
590 ret = -ENOENT;
591 cerr << "omap_get_iterator: " << cpp_strerror(ret) << std::endl;
592 return ret;
593 }
594 iter->seek_to_first();
595 int mapcount = 0;
596 map<string, bufferlist> out;
597 while(iter->valid()) {
598 get_omap_batch(iter, out);
599
600 if (out.empty()) break;
601
602 mapcount += out.size();
603 omap_section oms(out);
604 ret = write_section(TYPE_OMAP, oms, file_fd);
605 if (ret)
606 return ret;
607 }
608 if (debug)
609 cerr << "omap map size " << mapcount << std::endl;
610
611 ret = write_simple(TYPE_OBJECT_END, file_fd);
612 if (ret)
613 return ret;
614
615 return 0;
616 }
617
618 int ObjectStoreTool::export_files(ObjectStore *store, coll_t coll)
619 {
620 ghobject_t next;
621
622 while (!next.is_max()) {
623 vector<ghobject_t> objects;
624 int r = store->collection_list(coll, next, ghobject_t::get_max(), 300,
625 &objects, &next);
626 if (r < 0)
627 return r;
628 for (vector<ghobject_t>::iterator i = objects.begin();
629 i != objects.end();
630 ++i) {
631 assert(!i->hobj.is_meta());
632 if (i->is_pgmeta() || i->hobj.is_temp()) {
633 continue;
634 }
635 r = export_file(store, coll, *i);
636 if (r < 0)
637 return r;
638 }
639 }
640 return 0;
641 }
642
643 int set_inc_osdmap(ObjectStore *store, epoch_t e, bufferlist& bl, bool force,
644 ObjectStore::Sequencer &osr) {
645 OSDMap::Incremental inc;
646 bufferlist::iterator it = bl.begin();
647 inc.decode(it);
648 if (e == 0) {
649 e = inc.epoch;
650 } else if (e != inc.epoch) {
651 cerr << "incremental.epoch mismatch: "
652 << inc.epoch << " != " << e << std::endl;
653 if (force) {
654 cerr << "But will continue anyway." << std::endl;
655 } else {
656 return -EINVAL;
657 }
658 }
659 const ghobject_t inc_oid = OSD::get_inc_osdmap_pobject_name(e);
660 if (!store->exists(coll_t::meta(), inc_oid)) {
661 cerr << "inc-osdmap (" << inc_oid << ") does not exist." << std::endl;
662 if (!force) {
663 return -ENOENT;
664 }
665 cout << "Creating a new epoch." << std::endl;
666 }
667 if (dry_run)
668 return 0;
669 ObjectStore::Transaction t;
670 t.write(coll_t::meta(), inc_oid, 0, bl.length(), bl);
671 t.truncate(coll_t::meta(), inc_oid, bl.length());
672 int ret = store->apply_transaction(&osr, std::move(t));
673 if (ret) {
674 cerr << "Failed to set inc-osdmap (" << inc_oid << "): " << ret << std::endl;
675 } else {
676 cout << "Wrote inc-osdmap." << inc.epoch << std::endl;
677 }
678 return ret;
679 }
680
681 int get_inc_osdmap(ObjectStore *store, epoch_t e, bufferlist& bl)
682 {
683 if (store->read(coll_t::meta(),
684 OSD::get_inc_osdmap_pobject_name(e),
685 0, 0, bl) < 0) {
686 return -ENOENT;
687 }
688 return 0;
689 }
690
691 int set_osdmap(ObjectStore *store, epoch_t e, bufferlist& bl, bool force,
692 ObjectStore::Sequencer &osr) {
693 OSDMap osdmap;
694 osdmap.decode(bl);
695 if (e == 0) {
696 e = osdmap.get_epoch();
697 } else if (e != osdmap.get_epoch()) {
698 cerr << "osdmap.epoch mismatch: "
699 << e << " != " << osdmap.get_epoch() << std::endl;
700 if (force) {
701 cerr << "But will continue anyway." << std::endl;
702 } else {
703 return -EINVAL;
704 }
705 }
706 const ghobject_t full_oid = OSD::get_osdmap_pobject_name(e);
707 if (!store->exists(coll_t::meta(), full_oid)) {
708 cerr << "osdmap (" << full_oid << ") does not exist." << std::endl;
709 if (!force) {
710 return -ENOENT;
711 }
712 cout << "Creating a new epoch." << std::endl;
713 }
714 if (dry_run)
715 return 0;
716 ObjectStore::Transaction t;
717 t.write(coll_t::meta(), full_oid, 0, bl.length(), bl);
718 t.truncate(coll_t::meta(), full_oid, bl.length());
719 int ret = store->apply_transaction(&osr, std::move(t));
720 if (ret) {
721 cerr << "Failed to set osdmap (" << full_oid << "): " << ret << std::endl;
722 } else {
723 cout << "Wrote osdmap." << osdmap.get_epoch() << std::endl;
724 }
725 return ret;
726 }
727
728 int get_osdmap(ObjectStore *store, epoch_t e, OSDMap &osdmap, bufferlist& bl)
729 {
730 bool found = store->read(
731 coll_t::meta(), OSD::get_osdmap_pobject_name(e), 0, 0, bl) >= 0;
732 if (!found) {
733 cerr << "Can't find OSDMap for pg epoch " << e << std::endl;
734 return -ENOENT;
735 }
736 osdmap.decode(bl);
737 if (debug)
738 cerr << osdmap << std::endl;
739 return 0;
740 }
741
// Fill ms.osdmap and ms.osdmap_bl with the stored osdmap for ms.map_epoch.
// Returns whatever get_osdmap() returns (0, or -ENOENT when the map cannot
// be read).
int add_osdmap(ObjectStore *store, metadata_section &ms)
{
  return get_osdmap(store, ms.map_epoch, ms.osdmap, ms.osdmap_bl);
}
746
747 int ObjectStoreTool::do_export(ObjectStore *fs, coll_t coll, spg_t pgid,
748 pg_info_t &info, epoch_t map_epoch, __u8 struct_ver,
749 const OSDSuperblock& superblock,
750 PastIntervals &past_intervals)
751 {
752 PGLog::IndexedLog log;
753 pg_missing_t missing;
754
755 cerr << "Exporting " << pgid << std::endl;
756
757 int ret = get_log(fs, struct_ver, coll, pgid, info, log, missing);
758 if (ret > 0)
759 return ret;
760
761 if (debug) {
762 Formatter *formatter = Formatter::create("json-pretty");
763 assert(formatter);
764 dump_log(formatter, cerr, log, missing);
765 delete formatter;
766 }
767 write_super();
768
769 pg_begin pgb(pgid, superblock);
770 // Special case: If replicated pg don't require the importing OSD to have shard feature
771 if (pgid.is_no_shard()) {
772 pgb.superblock.compat_features.incompat.remove(CEPH_OSD_FEATURE_INCOMPAT_SHARDS);
773 }
774 ret = write_section(TYPE_PG_BEGIN, pgb, file_fd);
775 if (ret)
776 return ret;
777
778 // The metadata_section is now before files, so import can detect
779 // errors and abort without wasting time.
780 metadata_section ms(
781 struct_ver,
782 map_epoch,
783 info,
784 log,
785 past_intervals,
786 missing);
787 ret = add_osdmap(fs, ms);
788 if (ret)
789 return ret;
790 ret = write_section(TYPE_PG_METADATA, ms, file_fd);
791 if (ret)
792 return ret;
793
794 ret = export_files(fs, coll);
795 if (ret) {
796 cerr << "export_files error " << ret << std::endl;
797 return ret;
798 }
799
800 ret = write_simple(TYPE_PG_END, file_fd);
801 if (ret)
802 return ret;
803
804 return 0;
805 }
806
807 int get_data(ObjectStore *store, coll_t coll, ghobject_t hoid,
808 ObjectStore::Transaction *t, bufferlist &bl)
809 {
810 bufferlist::iterator ebliter = bl.begin();
811 data_section ds;
812 ds.decode(ebliter);
813
814 if (debug)
815 cerr << "\tdata: offset " << ds.offset << " len " << ds.len << std::endl;
816 t->write(coll, hoid, ds.offset, ds.len, ds.databl);
817 return 0;
818 }
819
// Decode an attrs section from `bl`, add the xattrs of `hoid` to transaction
// `t`, and register snapshot information with `snap_mapper`.
//
// Snap handling is done only for objects with generation NO_GEN:
//  - snap < CEPH_MAXSNAP: if OI_ATTR is present, the legacy_snaps of its
//    object_info_t (when non-empty) are added for this object;
//  - otherwise, when `hoid` equals `last_head`: SS_ATTR is decoded and, for a
//    non-legacy SnapSet, every clone in clone_snaps that exists in the store
//    gets its snaps added.
// `last_clones` is not used here.  Always returns 0.
int get_attrs(
  ObjectStore *store, coll_t coll, ghobject_t hoid,
  ObjectStore::Transaction *t, bufferlist &bl,
  OSDriver &driver, SnapMapper &snap_mapper,
  const ghobject_t& last_head,
  const set<ghobject_t>& last_clones)
{
  bufferlist::iterator ebliter = bl.begin();
  attr_section as;
  as.decode(ebliter);

  if (debug)
    cerr << "\tattrs: len " << as.data.size() << std::endl;
  t->setattrs(coll, hoid, as.data);

  // This could have been handled in the caller if we didn't need to
  // support exports that didn't include object_info_t in object_begin.
  if (hoid.generation == ghobject_t::NO_GEN) {
    if (hoid.hobj.snap < CEPH_MAXSNAP) {
      // Objects with a snap id below CEPH_MAXSNAP: use the snaps recorded in
      // the object_info_t.
      map<string,bufferlist>::iterator mi = as.data.find(OI_ATTR);
      if (mi != as.data.end()) {
        object_info_t oi(mi->second);

        if (debug)
          cerr << "object_info " << oi << std::endl;

        OSDriver::OSTransaction _t(driver.get_transaction(t));
        set<snapid_t> oi_snaps(oi.legacy_snaps.begin(), oi.legacy_snaps.end());
        if (!oi_snaps.empty()) {
          if (debug)
            cerr << "\tsetting legacy snaps " << oi_snaps << std::endl;
          snap_mapper.add_oid(hoid.hobj, oi_snaps, &_t);
        }
      }
    } else {
      // Only the object recorded as last_head is processed here; its SnapSet
      // describes the clones.
      if (hoid == last_head) {
        map<string,bufferlist>::iterator mi = as.data.find(SS_ATTR);
        if (mi != as.data.end()) {
          SnapSet snapset;
          auto p = mi->second.begin();
          snapset.decode(p);
          // Printed unconditionally, not only in debug mode.
          cout << "snapset " << snapset << std::endl;
          if (!snapset.is_legacy()) {
            // Note: this loop variable shadows the iterator `p` above.
            for (auto& p : snapset.clone_snaps) {
              ghobject_t clone = hoid;
              clone.hobj.snap = p.first;
              set<snapid_t> snaps(p.second.begin(), p.second.end());
              if (!store->exists(coll, clone)) {
                // no clone, skip. this is probably a cache pool. this works
                // because we use a separate transaction per object and clones
                // come before head in the archive.
                if (debug)
                  cerr << "\tskipping missing " << clone << " (snaps "
                       << snaps << ")" << std::endl;
                continue;
              }
              if (debug)
                cerr << "\tsetting " << clone.hobj << " snaps " << snaps
                     << std::endl;
              OSDriver::OSTransaction _t(driver.get_transaction(t));
              assert(!snaps.empty());
              snap_mapper.add_oid(clone.hobj, snaps, &_t);
            }
          }
        } else {
          cerr << "missing SS_ATTR on " << hoid << std::endl;
        }
      }
    }
  }

  return 0;
}
893
894 int get_omap_hdr(ObjectStore *store, coll_t coll, ghobject_t hoid,
895 ObjectStore::Transaction *t, bufferlist &bl)
896 {
897 bufferlist::iterator ebliter = bl.begin();
898 omap_hdr_section oh;
899 oh.decode(ebliter);
900
901 if (debug)
902 cerr << "\tomap header: " << string(oh.hdr.c_str(), oh.hdr.length())
903 << std::endl;
904 t->omap_setheader(coll, hoid, oh.hdr);
905 return 0;
906 }
907
908 int get_omap(ObjectStore *store, coll_t coll, ghobject_t hoid,
909 ObjectStore::Transaction *t, bufferlist &bl)
910 {
911 bufferlist::iterator ebliter = bl.begin();
912 omap_section os;
913 os.decode(ebliter);
914
915 if (debug)
916 cerr << "\tomap: size " << os.omap.size() << std::endl;
917 t->omap_setkeys(coll, hoid, os.omap);
918 return 0;
919 }
920
921 int ObjectStoreTool::get_object(ObjectStore *store, coll_t coll,
922 bufferlist &bl, OSDMap &curmap,
923 bool *skipped_objects,
924 ObjectStore::Sequencer &osr,
925 ghobject_t *last_head,
926 set<ghobject_t> *last_clones)
927 {
928 ObjectStore::Transaction tran;
929 ObjectStore::Transaction *t = &tran;
930 bufferlist::iterator ebliter = bl.begin();
931 object_begin ob;
932 ob.decode(ebliter);
933 OSDriver driver(
934 store,
935 coll_t(),
936 OSD::make_snapmapper_oid());
937 spg_t pg;
938 coll.is_pg_prefix(&pg);
939 SnapMapper mapper(g_ceph_context, &driver, 0, 0, 0, pg.shard);
940
941 if (ob.hoid.hobj.is_temp()) {
942 cerr << "ERROR: Export contains temporary object '" << ob.hoid << "'" << std::endl;
943 return -EFAULT;
944 }
945 assert(g_ceph_context);
946 if (ob.hoid.hobj.nspace != g_ceph_context->_conf->osd_hit_set_namespace) {
947 object_t oid = ob.hoid.hobj.oid;
948 object_locator_t loc(ob.hoid.hobj);
949 pg_t raw_pgid = curmap.object_locator_to_pg(oid, loc);
950 pg_t pgid = curmap.raw_pg_to_pg(raw_pgid);
951
952 spg_t coll_pgid;
953 if (coll.is_pg(&coll_pgid) == false) {
954 cerr << "INTERNAL ERROR: Bad collection during import" << std::endl;
955 return -EFAULT;
956 }
957 if (coll_pgid.shard != ob.hoid.shard_id) {
958 cerr << "INTERNAL ERROR: Importing shard " << coll_pgid.shard
959 << " but object shard is " << ob.hoid.shard_id << std::endl;
960 return -EFAULT;
961 }
962
963 if (coll_pgid.pgid != pgid) {
964 cerr << "Skipping object '" << ob.hoid << "' which belongs in pg " << pgid << std::endl;
965 *skipped_objects = true;
966 skip_object(bl);
967 return 0;
968 }
969 }
970
971 if (!dry_run)
972 t->touch(coll, ob.hoid);
973
974 cout << "Write " << ob.hoid << std::endl;
975
976 // manage snap collection
977 if (ob.hoid.hobj.is_snap()) {
978 ghobject_t head = ob.hoid;
979 head.hobj = head.hobj.get_head();
980 if (head == *last_head) {
981 last_clones->insert(ob.hoid);
982 } else {
983 *last_head = head;
984 last_clones->clear();
985 }
986 last_clones->insert(ob.hoid);
987 }
988
989 bufferlist ebl;
990 bool done = false;
991 while(!done) {
992 sectiontype_t type;
993 int ret = read_section(&type, &ebl);
994 if (ret)
995 return ret;
996
997 //cout << "\tdo_object: Section type " << hex << type << dec << std::endl;
998 //cout << "\t\tsection size " << ebl.length() << std::endl;
999 if (type >= END_OF_TYPES) {
1000 cout << "Skipping unknown object section type" << std::endl;
1001 continue;
1002 }
1003 switch(type) {
1004 case TYPE_DATA:
1005 if (dry_run) break;
1006 ret = get_data(store, coll, ob.hoid, t, ebl);
1007 if (ret) return ret;
1008 break;
1009 case TYPE_ATTRS:
1010 if (dry_run) break;
1011 ret = get_attrs(store, coll, ob.hoid, t, ebl, driver, mapper,
1012 *last_head, *last_clones);
1013 if (ret) return ret;
1014 break;
1015 case TYPE_OMAP_HDR:
1016 if (dry_run) break;
1017 ret = get_omap_hdr(store, coll, ob.hoid, t, ebl);
1018 if (ret) return ret;
1019 break;
1020 case TYPE_OMAP:
1021 if (dry_run) break;
1022 ret = get_omap(store, coll, ob.hoid, t, ebl);
1023 if (ret) return ret;
1024 break;
1025 case TYPE_OBJECT_END:
1026 done = true;
1027 break;
1028 default:
1029 cerr << "Unknown section type " << type << std::endl;
1030 return -EFAULT;
1031 }
1032 }
1033 if (!dry_run)
1034 store->apply_transaction(&osr, std::move(*t));
1035 return 0;
1036 }
1037
1038 int get_pg_metadata(ObjectStore *store, bufferlist &bl, metadata_section &ms,
1039 const OSDSuperblock& sb, OSDMap& curmap, spg_t pgid)
1040 {
1041 bufferlist::iterator ebliter = bl.begin();
1042 ms.decode(ebliter);
1043 spg_t old_pgid = ms.info.pgid;
1044 ms.info.pgid = pgid;
1045
1046 #if DIAGNOSTIC
1047 Formatter *formatter = new JSONFormatter(true);
1048 cout << "export pgid " << old_pgid << std::endl;
1049 cout << "struct_v " << (int)ms.struct_ver << std::endl;
1050 cout << "map epoch " << ms.map_epoch << std::endl;
1051
1052 formatter->open_object_section("importing OSDMap");
1053 ms.osdmap.dump(formatter);
1054 formatter->close_section();
1055 formatter->flush(cout);
1056 cout << std::endl;
1057
1058 cout << "osd current epoch " << sb.current_epoch << std::endl;
1059 formatter->open_object_section("current OSDMap");
1060 curmap.dump(formatter);
1061 formatter->close_section();
1062 formatter->flush(cout);
1063 cout << std::endl;
1064
1065 formatter->open_object_section("info");
1066 ms.info.dump(formatter);
1067 formatter->close_section();
1068 formatter->flush(cout);
1069 cout << std::endl;
1070
1071 formatter->open_object_section("log");
1072 ms.log.dump(formatter);
1073 formatter->close_section();
1074 formatter->flush(cout);
1075 cout << std::endl;
1076
1077 formatter->flush(cout);
1078 cout << std::endl;
1079 #endif
1080
1081 if (ms.osdmap.get_epoch() != 0 && ms.map_epoch != ms.osdmap.get_epoch()) {
1082 cerr << "FATAL: Invalid OSDMap epoch in export data" << std::endl;
1083 return -EFAULT;
1084 }
1085
1086 if (ms.map_epoch > sb.current_epoch) {
1087 cerr << "ERROR: Export PG's map_epoch " << ms.map_epoch << " > OSD's epoch " << sb.current_epoch << std::endl;
1088 cerr << "The OSD you are using is older than the exported PG" << std::endl;
1089 cerr << "Either use another OSD or join selected OSD to cluster to update it first" << std::endl;
1090 return -EINVAL;
1091 }
1092
1093 // Pool verified to exist for call to get_pg_num().
1094 unsigned new_pg_num = curmap.get_pg_num(pgid.pgid.pool());
1095
1096 if (pgid.pgid.ps() >= new_pg_num) {
1097 cerr << "Illegal pgid, the seed is larger than current pg_num" << std::endl;
1098 return -EINVAL;
1099 }
1100
1101 // Old exports didn't include OSDMap, see if we have a copy locally
1102 if (ms.osdmap.get_epoch() == 0) {
1103 OSDMap findmap;
1104 bufferlist findmap_bl;
1105 int ret = get_osdmap(store, ms.map_epoch, findmap, findmap_bl);
1106 if (ret == 0) {
1107 ms.osdmap.deepish_copy_from(findmap);
1108 } else {
1109 cerr << "WARNING: No OSDMap in old export,"
1110 " some objects may be ignored due to a split" << std::endl;
1111 }
1112 }
1113
1114 // Make sure old_pg_num is 0 in the unusual case that OSDMap not in export
1115 // nor can we find a local copy.
1116 unsigned old_pg_num = 0;
1117 if (ms.osdmap.get_epoch() != 0)
1118 old_pg_num = ms.osdmap.get_pg_num(pgid.pgid.pool());
1119
1120 if (debug) {
1121 cerr << "old_pg_num " << old_pg_num << std::endl;
1122 cerr << "new_pg_num " << new_pg_num << std::endl;
1123 cerr << ms.osdmap << std::endl;
1124 cerr << curmap << std::endl;
1125 }
1126
1127 // If we have managed to have a good OSDMap we can do these checks
1128 if (old_pg_num) {
1129 if (old_pgid.pgid.ps() >= old_pg_num) {
1130 cerr << "FATAL: pgid invalid for original map epoch" << std::endl;
1131 return -EFAULT;
1132 }
1133 if (pgid.pgid.ps() >= old_pg_num) {
1134 cout << "NOTICE: Post split pgid specified" << std::endl;
1135 } else {
1136 spg_t parent(pgid);
1137 if (parent.is_split(old_pg_num, new_pg_num, NULL)) {
1138 cerr << "WARNING: Split occurred, some objects may be ignored" << std::endl;
1139 }
1140 }
1141 }
1142
1143 if (debug) {
1144 cerr << "Import pgid " << ms.info.pgid << std::endl;
1145 cerr << "Clearing past_intervals " << ms.past_intervals << std::endl;
1146 cerr << "Zero same_interval_since " << ms.info.history.same_interval_since << std::endl;
1147 }
1148
1149 // Let osd recompute past_intervals and same_interval_since
1150 ms.past_intervals.clear();
1151 ms.info.history.same_interval_since = 0;
1152
1153 if (debug)
1154 cerr << "Changing pg epoch " << ms.map_epoch << " to " << sb.current_epoch << std::endl;
1155
1156 ms.map_epoch = sb.current_epoch;
1157
1158 return 0;
1159 }
1160
1161 // out: pg_log_t that only has entries that apply to import_pgid using curmap
1162 // reject: Entries rejected from "in" are in the reject.log. Other fields not set.
1163 void filter_divergent_priors(spg_t import_pgid, const OSDMap &curmap,
1164 const string &hit_set_namespace, const divergent_priors_t &in,
1165 divergent_priors_t &out, divergent_priors_t &reject)
1166 {
1167 out.clear();
1168 reject.clear();
1169
1170 for (divergent_priors_t::const_iterator i = in.begin();
1171 i != in.end(); ++i) {
1172
1173 // Reject divergent priors for temporary objects
1174 if (i->second.is_temp()) {
1175 reject.insert(*i);
1176 continue;
1177 }
1178
1179 if (i->second.nspace != hit_set_namespace) {
1180 object_t oid = i->second.oid;
1181 object_locator_t loc(i->second);
1182 pg_t raw_pgid = curmap.object_locator_to_pg(oid, loc);
1183 pg_t pgid = curmap.raw_pg_to_pg(raw_pgid);
1184
1185 if (import_pgid.pgid == pgid) {
1186 out.insert(*i);
1187 } else {
1188 reject.insert(*i);
1189 }
1190 } else {
1191 out.insert(*i);
1192 }
1193 }
1194 }
1195
1196 int ObjectStoreTool::do_import(ObjectStore *store, OSDSuperblock& sb,
1197 bool force, std::string pgidstr,
1198 ObjectStore::Sequencer &osr)
1199 {
1200 bufferlist ebl;
1201 pg_info_t info;
1202 PGLog::IndexedLog log;
1203 bool skipped_objects = false;
1204
1205 if (!dry_run)
1206 finish_remove_pgs(store);
1207
1208 int ret = read_super();
1209 if (ret)
1210 return ret;
1211
1212 if (sh.magic != super_header::super_magic) {
1213 cerr << "Invalid magic number" << std::endl;
1214 return -EFAULT;
1215 }
1216
1217 if (sh.version > super_header::super_ver) {
1218 cerr << "Can't handle export format version=" << sh.version << std::endl;
1219 return -EINVAL;
1220 }
1221
1222 //First section must be TYPE_PG_BEGIN
1223 sectiontype_t type;
1224 ret = read_section(&type, &ebl);
1225 if (ret)
1226 return ret;
1227 if (type == TYPE_POOL_BEGIN) {
1228 cerr << "Pool exports cannot be imported into a PG" << std::endl;
1229 return -EINVAL;
1230 } else if (type != TYPE_PG_BEGIN) {
1231 cerr << "Invalid first section type " << type << std::endl;
1232 return -EFAULT;
1233 }
1234
1235 bufferlist::iterator ebliter = ebl.begin();
1236 pg_begin pgb;
1237 pgb.decode(ebliter);
1238 spg_t pgid = pgb.pgid;
1239 spg_t orig_pgid = pgid;
1240
1241 if (pgidstr.length()) {
1242 spg_t user_pgid;
1243
1244 bool ok = user_pgid.parse(pgidstr.c_str());
1245 // This succeeded in main() already
1246 assert(ok);
1247 if (pgid != user_pgid) {
1248 if (pgid.pool() != user_pgid.pool()) {
1249 cerr << "Can't specify a different pgid pool, must be " << pgid.pool() << std::endl;
1250 return -EINVAL;
1251 }
1252 if (pgid.is_no_shard() && !user_pgid.is_no_shard()) {
1253 cerr << "Can't specify a sharded pgid with a non-sharded export" << std::endl;
1254 return -EINVAL;
1255 }
1256 // Get shard from export information if not specified
1257 if (!pgid.is_no_shard() && user_pgid.is_no_shard()) {
1258 user_pgid.shard = pgid.shard;
1259 }
1260 if (pgid.shard != user_pgid.shard) {
1261 cerr << "Can't specify a different shard, must be " << pgid.shard << std::endl;
1262 return -EINVAL;
1263 }
1264 pgid = user_pgid;
1265 }
1266 }
1267
1268 if (!pgb.superblock.cluster_fsid.is_zero()
1269 && pgb.superblock.cluster_fsid != sb.cluster_fsid) {
1270 cerr << "Export came from different cluster with fsid "
1271 << pgb.superblock.cluster_fsid << std::endl;
1272 return -EINVAL;
1273 }
1274
1275 if (debug) {
1276 cerr << "Exported features: " << pgb.superblock.compat_features << std::endl;
1277 }
1278
1279 // Special case: Old export has SHARDS incompat feature on replicated pg, remove it
1280 if (pgid.is_no_shard())
1281 pgb.superblock.compat_features.incompat.remove(CEPH_OSD_FEATURE_INCOMPAT_SHARDS);
1282
1283 if (sb.compat_features.compare(pgb.superblock.compat_features) == -1) {
1284 CompatSet unsupported = sb.compat_features.unsupported(pgb.superblock.compat_features);
1285
1286 cerr << "Export has incompatible features set " << unsupported << std::endl;
1287
1288 // Let them import if they specify the --force option
1289 if (!force)
1290 return 11; // Positive return means exit status
1291 }
1292
1293 // Don't import if pool no longer exists
1294 OSDMap curmap;
1295 bufferlist bl;
1296 ret = get_osdmap(store, sb.current_epoch, curmap, bl);
1297 if (ret) {
1298 cerr << "Can't find local OSDMap" << std::endl;
1299 return ret;
1300 }
1301 if (!curmap.have_pg_pool(pgid.pgid.m_pool)) {
1302 cerr << "Pool " << pgid.pgid.m_pool << " no longer exists" << std::endl;
1303 // Special exit code for this error, used by test code
1304 return 10; // Positive return means exit status
1305 }
1306
1307 ghobject_t pgmeta_oid = pgid.make_pgmeta_oid();
1308 log_oid = OSD::make_pg_log_oid(pgid);
1309 biginfo_oid = OSD::make_pg_biginfo_oid(pgid);
1310
1311 //Check for PG already present.
1312 coll_t coll(pgid);
1313 if (store->collection_exists(coll)) {
1314 cerr << "pgid " << pgid << " already exists" << std::endl;
1315 return -EEXIST;
1316 }
1317
1318 if (!dry_run) {
1319 ObjectStore::Transaction t;
1320 PG::_create(t, pgid,
1321 pgid.get_split_bits(curmap.get_pg_pool(pgid.pool())->get_pg_num()));
1322 PG::_init(t, pgid, NULL);
1323
1324 // mark this coll for removal until we're done
1325 map<string,bufferlist> values;
1326 ::encode((char)1, values["_remove"]);
1327 t.omap_setkeys(coll, pgid.make_pgmeta_oid(), values);
1328
1329 store->apply_transaction(&osr, std::move(t));
1330 }
1331
1332 cout << "Importing pgid " << pgid;
1333 if (orig_pgid != pgid) {
1334 cout << " exported as " << orig_pgid;
1335 }
1336 cout << std::endl;
1337
1338 bool done = false;
1339 bool found_metadata = false;
1340 metadata_section ms;
1341 ghobject_t last_head;
1342 set<ghobject_t> last_clones;
1343 while(!done) {
1344 ret = read_section(&type, &ebl);
1345 if (ret)
1346 return ret;
1347
1348 //cout << "do_import: Section type " << hex << type << dec << std::endl;
1349 if (type >= END_OF_TYPES) {
1350 cout << "Skipping unknown section type" << std::endl;
1351 continue;
1352 }
1353 switch(type) {
1354 case TYPE_OBJECT_BEGIN:
1355 ret = get_object(store, coll, ebl, curmap, &skipped_objects, osr,
1356 &last_head, &last_clones);
1357 if (ret) return ret;
1358 break;
1359 case TYPE_PG_METADATA:
1360 ret = get_pg_metadata(store, ebl, ms, sb, curmap, pgid);
1361 if (ret) return ret;
1362 found_metadata = true;
1363 break;
1364 case TYPE_PG_END:
1365 done = true;
1366 break;
1367 default:
1368 cerr << "Unknown section type " << type << std::endl;
1369 return -EFAULT;
1370 }
1371 }
1372
1373 if (!found_metadata) {
1374 cerr << "Missing metadata section" << std::endl;
1375 return -EFAULT;
1376 }
1377
1378 ObjectStore::Transaction t;
1379 if (!dry_run) {
1380 pg_log_t newlog, reject;
1381 pg_log_t::filter_log(pgid, curmap, g_ceph_context->_conf->osd_hit_set_namespace,
1382 ms.log, newlog, reject);
1383 if (debug) {
1384 for (list<pg_log_entry_t>::iterator i = newlog.log.begin();
1385 i != newlog.log.end(); ++i)
1386 cerr << "Keeping log entry " << *i << std::endl;
1387 for (list<pg_log_entry_t>::iterator i = reject.log.begin();
1388 i != reject.log.end(); ++i)
1389 cerr << "Skipping log entry " << *i << std::endl;
1390 }
1391
1392 divergent_priors_t newdp, rejectdp;
1393 filter_divergent_priors(pgid, curmap, g_ceph_context->_conf->osd_hit_set_namespace,
1394 ms.divergent_priors, newdp, rejectdp);
1395 ms.divergent_priors = newdp;
1396 if (debug) {
1397 for (divergent_priors_t::iterator i = newdp.begin();
1398 i != newdp.end(); ++i)
1399 cerr << "Keeping divergent_prior " << *i << std::endl;
1400 for (divergent_priors_t::iterator i = rejectdp.begin();
1401 i != rejectdp.end(); ++i)
1402 cerr << "Skipping divergent_prior " << *i << std::endl;
1403 }
1404
1405 ms.missing.filter_objects([&](const hobject_t &obj) {
1406 if (obj.nspace == g_ceph_context->_conf->osd_hit_set_namespace)
1407 return false;
1408 assert(!obj.is_temp());
1409 object_t oid = obj.oid;
1410 object_locator_t loc(obj);
1411 pg_t raw_pgid = curmap.object_locator_to_pg(oid, loc);
1412 pg_t _pgid = curmap.raw_pg_to_pg(raw_pgid);
1413
1414 return pgid.pgid != _pgid;
1415 });
1416
1417
1418 if (debug) {
1419 pg_missing_t missing;
1420 Formatter *formatter = Formatter::create("json-pretty");
1421 dump_log(formatter, cerr, newlog, ms.missing);
1422 delete formatter;
1423 }
1424
1425 // Just like a split invalidate stats since the object count is changed
1426 if (skipped_objects)
1427 ms.info.stats.stats_invalid = true;
1428
1429 ret = write_pg(
1430 t,
1431 ms.map_epoch,
1432 ms.info,
1433 newlog,
1434 ms.past_intervals,
1435 ms.divergent_priors,
1436 ms.missing);
1437 if (ret) return ret;
1438 }
1439
1440 // done, clear removal flag
1441 if (debug)
1442 cerr << "done, clearing removal flag" << std::endl;
1443
1444 if (!dry_run) {
1445 set<string> remove;
1446 remove.insert("_remove");
1447 t.omap_rmkeys(coll, pgid.make_pgmeta_oid(), remove);
1448 store->apply_transaction(&osr, std::move(t));
1449 }
1450
1451 return 0;
1452 }
1453
1454 int do_list(ObjectStore *store, string pgidstr, string object, boost::optional<std::string> nspace,
1455 Formatter *formatter, bool debug, bool human_readable, bool head)
1456 {
1457 int r;
1458 lookup_ghobject lookup(object, nspace, head);
1459 if (pgidstr.length() > 0) {
1460 r = action_on_all_objects_in_pg(store, pgidstr, lookup, debug);
1461 } else {
1462 r = action_on_all_objects(store, lookup, debug);
1463 }
1464 if (r)
1465 return r;
1466 lookup.dump(formatter, human_readable);
1467 formatter->flush(cout);
1468 return 0;
1469 }
1470
1471 int do_meta(ObjectStore *store, string object, Formatter *formatter, bool debug, bool human_readable)
1472 {
1473 int r;
1474 boost::optional<std::string> nspace; // Not specified
1475 lookup_ghobject lookup(object, nspace);
1476 r = action_on_all_objects_in_exact_pg(store, coll_t::meta(), lookup, debug);
1477 if (r)
1478 return r;
1479 lookup.dump(formatter, human_readable);
1480 formatter->flush(cout);
1481 return 0;
1482 }
1483
1484 int remove_object(coll_t coll, ghobject_t &ghobj,
1485 SnapMapper &mapper,
1486 MapCacher::Transaction<std::string, bufferlist> *_t,
1487 ObjectStore::Transaction *t)
1488 {
1489 int r = mapper.remove_oid(ghobj.hobj, _t);
1490 if (r < 0 && r != -ENOENT) {
1491 cerr << "remove_oid returned " << cpp_strerror(r) << std::endl;
1492 return r;
1493 }
1494
1495 t->remove(coll, ghobj);
1496 return 0;
1497 }
1498
1499 int get_snapset(ObjectStore *store, coll_t coll, ghobject_t &ghobj, SnapSet &ss, bool silent);
1500
1501 int do_remove_object(ObjectStore *store, coll_t coll,
1502 ghobject_t &ghobj, bool all, bool force,
1503 ObjectStore::Sequencer &osr)
1504 {
1505 spg_t pg;
1506 coll.is_pg_prefix(&pg);
1507 OSDriver driver(
1508 store,
1509 coll_t(),
1510 OSD::make_snapmapper_oid());
1511 SnapMapper mapper(g_ceph_context, &driver, 0, 0, 0, pg.shard);
1512 struct stat st;
1513
1514 int r = store->stat(coll, ghobj, &st);
1515 if (r < 0) {
1516 cerr << "remove: " << cpp_strerror(r) << std::endl;
1517 return r;
1518 }
1519
1520 SnapSet ss;
1521 if (ghobj.hobj.has_snapset()) {
1522 r = get_snapset(store, coll, ghobj, ss, false);
1523 if (r < 0) {
1524 cerr << "Can't get snapset error " << cpp_strerror(r) << std::endl;
1525 return r;
1526 }
1527 if (!ss.snaps.empty() && !all) {
1528 if (force) {
1529 cout << "WARNING: only removing "
1530 << (ghobj.hobj.is_head() ? "head" : "snapdir")
1531 << " with snapshots present" << std::endl;
1532 ss.snaps.clear();
1533 } else {
1534 cerr << "Snapshots are present, use removeall to delete everything" << std::endl;
1535 return -EINVAL;
1536 }
1537 }
1538 }
1539
1540 ObjectStore::Transaction t;
1541 OSDriver::OSTransaction _t(driver.get_transaction(&t));
1542
1543 cout << "remove " << ghobj << std::endl;
1544
1545 if (!dry_run) {
1546 r = remove_object(coll, ghobj, mapper, &_t, &t);
1547 if (r < 0)
1548 return r;
1549 }
1550
1551 ghobject_t snapobj = ghobj;
1552 for (vector<snapid_t>::iterator i = ss.snaps.begin() ;
1553 i != ss.snaps.end() ; ++i) {
1554 snapobj.hobj.snap = *i;
1555 cout << "remove " << snapobj << std::endl;
1556 if (!dry_run) {
1557 r = remove_object(coll, snapobj, mapper, &_t, &t);
1558 if (r < 0)
1559 return r;
1560 }
1561 }
1562
1563 if (!dry_run)
1564 store->apply_transaction(&osr, std::move(t));
1565
1566 return 0;
1567 }
1568
1569 int do_list_attrs(ObjectStore *store, coll_t coll, ghobject_t &ghobj)
1570 {
1571 map<string,bufferptr> aset;
1572 int r = store->getattrs(coll, ghobj, aset);
1573 if (r < 0) {
1574 cerr << "getattrs: " << cpp_strerror(r) << std::endl;
1575 return r;
1576 }
1577
1578 for (map<string,bufferptr>::iterator i = aset.begin();i != aset.end(); ++i) {
1579 string key(i->first);
1580 if (outistty)
1581 key = cleanbin(key);
1582 cout << key << std::endl;
1583 }
1584 return 0;
1585 }
1586
1587 int do_list_omap(ObjectStore *store, coll_t coll, ghobject_t &ghobj)
1588 {
1589 ObjectMap::ObjectMapIterator iter = store->get_omap_iterator(coll, ghobj);
1590 if (!iter) {
1591 cerr << "omap_get_iterator: " << cpp_strerror(ENOENT) << std::endl;
1592 return -ENOENT;
1593 }
1594 iter->seek_to_first();
1595 map<string, bufferlist> oset;
1596 while(iter->valid()) {
1597 get_omap_batch(iter, oset);
1598
1599 for (map<string,bufferlist>::iterator i = oset.begin();i != oset.end(); ++i) {
1600 string key(i->first);
1601 if (outistty)
1602 key = cleanbin(key);
1603 cout << key << std::endl;
1604 }
1605 }
1606 return 0;
1607 }
1608
1609 int do_get_bytes(ObjectStore *store, coll_t coll, ghobject_t &ghobj, int fd)
1610 {
1611 struct stat st;
1612 mysize_t total;
1613
1614 int ret = store->stat(coll, ghobj, &st);
1615 if (ret < 0) {
1616 cerr << "get-bytes: " << cpp_strerror(ret) << std::endl;
1617 return ret;
1618 }
1619
1620 total = st.st_size;
1621 if (debug)
1622 cerr << "size=" << total << std::endl;
1623
1624 uint64_t offset = 0;
1625 bufferlist rawdatabl;
1626 while(total > 0) {
1627 rawdatabl.clear();
1628 mysize_t len = max_read;
1629 if (len > total)
1630 len = total;
1631
1632 ret = store->read(coll, ghobj, offset, len, rawdatabl);
1633 if (ret < 0)
1634 return ret;
1635 if (ret == 0)
1636 return -EINVAL;
1637
1638 if (debug)
1639 cerr << "data section offset=" << offset << " len=" << len << std::endl;
1640
1641 total -= ret;
1642 offset += ret;
1643
1644 ret = write(fd, rawdatabl.c_str(), ret);
1645 if (ret == -1) {
1646 perror("write");
1647 return -errno;
1648 }
1649 }
1650
1651 return 0;
1652 }
1653
1654 int do_set_bytes(ObjectStore *store, coll_t coll,
1655 ghobject_t &ghobj, int fd,
1656 ObjectStore::Sequencer &osr)
1657 {
1658 ObjectStore::Transaction tran;
1659 ObjectStore::Transaction *t = &tran;
1660
1661 if (debug)
1662 cerr << "Write " << ghobj << std::endl;
1663
1664 if (!dry_run) {
1665 t->touch(coll, ghobj);
1666 t->truncate(coll, ghobj, 0);
1667 }
1668
1669 uint64_t offset = 0;
1670 bufferlist rawdatabl;
1671 do {
1672 rawdatabl.clear();
1673 ssize_t bytes = rawdatabl.read_fd(fd, max_read);
1674 if (bytes < 0) {
1675 cerr << "read_fd error " << cpp_strerror(bytes) << std::endl;
1676 return bytes;
1677 }
1678
1679 if (bytes == 0)
1680 break;
1681
1682 if (debug)
1683 cerr << "\tdata: offset " << offset << " bytes " << bytes << std::endl;
1684 if (!dry_run)
1685 t->write(coll, ghobj, offset, bytes, rawdatabl);
1686
1687 offset += bytes;
1688 // XXX: Should we apply_transaction() every once in a while for very large files
1689 } while(true);
1690
1691 if (!dry_run)
1692 store->apply_transaction(&osr, std::move(*t));
1693 return 0;
1694 }
1695
1696 int do_get_attr(ObjectStore *store, coll_t coll, ghobject_t &ghobj, string key)
1697 {
1698 bufferptr bp;
1699
1700 int r = store->getattr(coll, ghobj, key.c_str(), bp);
1701 if (r < 0) {
1702 cerr << "getattr: " << cpp_strerror(r) << std::endl;
1703 return r;
1704 }
1705
1706 string value(bp.c_str(), bp.length());
1707 if (outistty) {
1708 value = cleanbin(value);
1709 value.push_back('\n');
1710 }
1711 cout << value;
1712
1713 return 0;
1714 }
1715
1716 int do_set_attr(ObjectStore *store, coll_t coll,
1717 ghobject_t &ghobj, string key, int fd,
1718 ObjectStore::Sequencer &osr)
1719 {
1720 ObjectStore::Transaction tran;
1721 ObjectStore::Transaction *t = &tran;
1722 bufferlist bl;
1723
1724 if (debug)
1725 cerr << "Setattr " << ghobj << std::endl;
1726
1727 int ret = get_fd_data(fd, bl);
1728 if (ret < 0)
1729 return ret;
1730
1731 if (dry_run)
1732 return 0;
1733
1734 t->touch(coll, ghobj);
1735
1736 t->setattr(coll, ghobj, key, bl);
1737
1738 store->apply_transaction(&osr, std::move(*t));
1739 return 0;
1740 }
1741
1742 int do_rm_attr(ObjectStore *store, coll_t coll,
1743 ghobject_t &ghobj, string key,
1744 ObjectStore::Sequencer &osr)
1745 {
1746 ObjectStore::Transaction tran;
1747 ObjectStore::Transaction *t = &tran;
1748
1749 if (debug)
1750 cerr << "Rmattr " << ghobj << std::endl;
1751
1752 if (dry_run)
1753 return 0;
1754
1755 t->rmattr(coll, ghobj, key);
1756
1757 store->apply_transaction(&osr, std::move(*t));
1758 return 0;
1759 }
1760
1761 int do_get_omap(ObjectStore *store, coll_t coll, ghobject_t &ghobj, string key)
1762 {
1763 set<string> keys;
1764 map<string, bufferlist> out;
1765
1766 keys.insert(key);
1767
1768 int r = store->omap_get_values(coll, ghobj, keys, &out);
1769 if (r < 0) {
1770 cerr << "omap_get_values: " << cpp_strerror(r) << std::endl;
1771 return r;
1772 }
1773
1774 if (out.empty()) {
1775 cerr << "Key not found" << std::endl;
1776 return -ENOENT;
1777 }
1778
1779 assert(out.size() == 1);
1780
1781 bufferlist bl = out.begin()->second;
1782 string value(bl.c_str(), bl.length());
1783 if (outistty) {
1784 value = cleanbin(value);
1785 value.push_back('\n');
1786 }
1787 cout << value;
1788
1789 return 0;
1790 }
1791
1792 int do_set_omap(ObjectStore *store, coll_t coll,
1793 ghobject_t &ghobj, string key, int fd,
1794 ObjectStore::Sequencer &osr)
1795 {
1796 ObjectStore::Transaction tran;
1797 ObjectStore::Transaction *t = &tran;
1798 map<string, bufferlist> attrset;
1799 bufferlist valbl;
1800
1801 if (debug)
1802 cerr << "Set_omap " << ghobj << std::endl;
1803
1804 int ret = get_fd_data(fd, valbl);
1805 if (ret < 0)
1806 return ret;
1807
1808 attrset.insert(pair<string, bufferlist>(key, valbl));
1809
1810 if (dry_run)
1811 return 0;
1812
1813 t->touch(coll, ghobj);
1814
1815 t->omap_setkeys(coll, ghobj, attrset);
1816
1817 store->apply_transaction(&osr, std::move(*t));
1818 return 0;
1819 }
1820
1821 int do_rm_omap(ObjectStore *store, coll_t coll,
1822 ghobject_t &ghobj, string key,
1823 ObjectStore::Sequencer &osr)
1824 {
1825 ObjectStore::Transaction tran;
1826 ObjectStore::Transaction *t = &tran;
1827 set<string> keys;
1828
1829 keys.insert(key);
1830
1831 if (debug)
1832 cerr << "Rm_omap " << ghobj << std::endl;
1833
1834 if (dry_run)
1835 return 0;
1836
1837 t->omap_rmkeys(coll, ghobj, keys);
1838
1839 store->apply_transaction(&osr, std::move(*t));
1840 return 0;
1841 }
1842
1843 int do_get_omaphdr(ObjectStore *store, coll_t coll, ghobject_t &ghobj)
1844 {
1845 bufferlist hdrbl;
1846
1847 int r = store->omap_get_header(coll, ghobj, &hdrbl, true);
1848 if (r < 0) {
1849 cerr << "omap_get_header: " << cpp_strerror(r) << std::endl;
1850 return r;
1851 }
1852
1853 string header(hdrbl.c_str(), hdrbl.length());
1854 if (outistty) {
1855 header = cleanbin(header);
1856 header.push_back('\n');
1857 }
1858 cout << header;
1859
1860 return 0;
1861 }
1862
1863 int do_set_omaphdr(ObjectStore *store, coll_t coll,
1864 ghobject_t &ghobj, int fd,
1865 ObjectStore::Sequencer &osr)
1866 {
1867 ObjectStore::Transaction tran;
1868 ObjectStore::Transaction *t = &tran;
1869 bufferlist hdrbl;
1870
1871 if (debug)
1872 cerr << "Omap_setheader " << ghobj << std::endl;
1873
1874 int ret = get_fd_data(fd, hdrbl);
1875 if (ret)
1876 return ret;
1877
1878 if (dry_run)
1879 return 0;
1880
1881 t->touch(coll, ghobj);
1882
1883 t->omap_setheader(coll, ghobj, hdrbl);
1884
1885 store->apply_transaction(&osr, std::move(*t));
1886 return 0;
1887 }
1888
1889 struct do_fix_lost : public action_on_object_t {
1890 ObjectStore::Sequencer *osr;
1891
1892 explicit do_fix_lost(ObjectStore::Sequencer *_osr) : osr(_osr) {}
1893
1894 int call(ObjectStore *store, coll_t coll,
1895 ghobject_t &ghobj, object_info_t &oi) override {
1896 if (oi.is_lost()) {
1897 cout << coll << "/" << ghobj << " is lost";
1898 if (!dry_run)
1899 cout << ", fixing";
1900 cout << std::endl;
1901 if (dry_run)
1902 return 0;
1903 oi.clear_flag(object_info_t::FLAG_LOST);
1904 bufferlist bl;
1905 ::encode(oi, bl, -1); /* fixme: using full features */
1906 ObjectStore::Transaction t;
1907 t.setattr(coll, ghobj, OI_ATTR, bl);
1908 int r = store->apply_transaction(osr, std::move(t));
1909 if (r < 0) {
1910 cerr << "Error getting fixing attr on : " << make_pair(coll, ghobj)
1911 << ", "
1912 << cpp_strerror(r) << std::endl;
1913 return r;
1914 }
1915 }
1916 return 0;
1917 }
1918 };
1919
1920 int get_snapset(ObjectStore *store, coll_t coll, ghobject_t &ghobj, SnapSet &ss, bool silent = false)
1921 {
1922 bufferlist attr;
1923 int r = store->getattr(coll, ghobj, SS_ATTR, attr);
1924 if (r < 0) {
1925 if (!silent)
1926 cerr << "Error getting snapset on : " << make_pair(coll, ghobj) << ", "
1927 << cpp_strerror(r) << std::endl;
1928 return r;
1929 }
1930 bufferlist::iterator bp = attr.begin();
1931 try {
1932 ::decode(ss, bp);
1933 } catch (...) {
1934 r = -EINVAL;
1935 cerr << "Error decoding snapset on : " << make_pair(coll, ghobj) << ", "
1936 << cpp_strerror(r) << std::endl;
1937 return r;
1938 }
1939 return 0;
1940 }
1941
1942 int print_obj_info(ObjectStore *store, coll_t coll, ghobject_t &ghobj, Formatter* formatter)
1943 {
1944 int r = 0;
1945 formatter->open_object_section("obj");
1946 formatter->open_object_section("id");
1947 ghobj.dump(formatter);
1948 formatter->close_section();
1949
1950 bufferlist attr;
1951 int gr = store->getattr(coll, ghobj, OI_ATTR, attr);
1952 if (gr < 0) {
1953 r = gr;
1954 cerr << "Error getting attr on : " << make_pair(coll, ghobj) << ", "
1955 << cpp_strerror(r) << std::endl;
1956 } else {
1957 object_info_t oi;
1958 bufferlist::iterator bp = attr.begin();
1959 try {
1960 ::decode(oi, bp);
1961 formatter->open_object_section("info");
1962 oi.dump(formatter);
1963 formatter->close_section();
1964 } catch (...) {
1965 r = -EINVAL;
1966 cerr << "Error decoding attr on : " << make_pair(coll, ghobj) << ", "
1967 << cpp_strerror(r) << std::endl;
1968 }
1969 }
1970 struct stat st;
1971 int sr = store->stat(coll, ghobj, &st, true);
1972 if (sr < 0) {
1973 r = sr;
1974 cerr << "Error stat on : " << make_pair(coll, ghobj) << ", "
1975 << cpp_strerror(r) << std::endl;
1976 } else {
1977 formatter->open_object_section("stat");
1978 formatter->dump_int("size", st.st_size);
1979 formatter->dump_int("blksize", st.st_blksize);
1980 formatter->dump_int("blocks", st.st_blocks);
1981 formatter->dump_int("nlink", st.st_nlink);
1982 formatter->close_section();
1983 }
1984
1985 if (ghobj.hobj.has_snapset()) {
1986 SnapSet ss;
1987 int snr = get_snapset(store, coll, ghobj, ss);
1988 if (snr < 0) {
1989 r = snr;
1990 } else {
1991 formatter->open_object_section("SnapSet");
1992 ss.dump(formatter);
1993 formatter->close_section();
1994 }
1995 }
1996 formatter->close_section();
1997 formatter->flush(cout);
1998 cout << std::endl;
1999 return r;
2000 }
2001
2002 int set_size(ObjectStore *store, coll_t coll, ghobject_t &ghobj, uint64_t setsize, Formatter* formatter,
2003 ObjectStore::Sequencer &osr)
2004 {
2005 if (ghobj.hobj.is_snapdir()) {
2006 cerr << "Can't set the size of a snapdir" << std::endl;
2007 return -EINVAL;
2008 }
2009 bufferlist attr;
2010 int r = store->getattr(coll, ghobj, OI_ATTR, attr);
2011 if (r < 0) {
2012 cerr << "Error getting attr on : " << make_pair(coll, ghobj) << ", "
2013 << cpp_strerror(r) << std::endl;
2014 return r;
2015 }
2016 object_info_t oi;
2017 bufferlist::iterator bp = attr.begin();
2018 try {
2019 ::decode(oi, bp);
2020 } catch (...) {
2021 r = -EINVAL;
2022 cerr << "Error getting attr on : " << make_pair(coll, ghobj) << ", "
2023 << cpp_strerror(r) << std::endl;
2024 return r;
2025 }
2026 struct stat st;
2027 r = store->stat(coll, ghobj, &st, true);
2028 if (r < 0) {
2029 cerr << "Error stat on : " << make_pair(coll, ghobj) << ", "
2030 << cpp_strerror(r) << std::endl;
2031 }
2032 ghobject_t head(ghobj);
2033 SnapSet ss;
2034 bool found_head = true;
2035 map<snapid_t, uint64_t>::iterator csi;
2036 bool is_snap = ghobj.hobj.is_snap();
2037 if (is_snap) {
2038 head.hobj = head.hobj.get_head();
2039 r = get_snapset(store, coll, head, ss, true);
2040 if (r < 0 && r != -ENOENT) {
2041 // Requested get_snapset() silent, so if not -ENOENT show error
2042 cerr << "Error getting snapset on : " << make_pair(coll, head) << ", "
2043 << cpp_strerror(r) << std::endl;
2044 return r;
2045 }
2046 if (r == -ENOENT) {
2047 head.hobj = head.hobj.get_snapdir();
2048 r = get_snapset(store, coll, head, ss);
2049 if (r < 0)
2050 return r;
2051 found_head = false;
2052 } else {
2053 found_head = true;
2054 }
2055 csi = ss.clone_size.find(ghobj.hobj.snap);
2056 if (csi == ss.clone_size.end()) {
2057 cerr << "SnapSet is missing clone_size for snap " << ghobj.hobj.snap << std::endl;
2058 return -EINVAL;
2059 }
2060 }
2061 if ((uint64_t)st.st_size == setsize && oi.size == setsize
2062 && (!is_snap || csi->second == setsize)) {
2063 cout << "Size of object is already " << setsize << std::endl;
2064 return 0;
2065 }
2066 cout << "Setting size to " << setsize << ", stat size " << st.st_size
2067 << ", obj info size " << oi.size;
2068 if (is_snap) {
2069 cout << ", " << (found_head ? "head" : "snapdir")
2070 << " clone_size " << csi->second;
2071 csi->second = setsize;
2072 }
2073 cout << std::endl;
2074 if (!dry_run) {
2075 attr.clear();
2076 oi.size = setsize;
2077 ::encode(oi, attr, -1); /* fixme: using full features */
2078 ObjectStore::Transaction t;
2079 t.setattr(coll, ghobj, OI_ATTR, attr);
2080 t.truncate(coll, ghobj, setsize);
2081 if (is_snap) {
2082 bufferlist snapattr;
2083 snapattr.clear();
2084 ::encode(ss, snapattr);
2085 t.setattr(coll, head, SS_ATTR, snapattr);
2086 }
2087 r = store->apply_transaction(&osr, std::move(t));
2088 if (r < 0) {
2089 cerr << "Error writing object info: " << make_pair(coll, ghobj) << ", "
2090 << cpp_strerror(r) << std::endl;
2091 return r;
2092 }
2093 }
2094 return 0;
2095 }
2096
2097 int clear_snapset(ObjectStore *store, coll_t coll, ghobject_t &ghobj,
2098 string arg, ObjectStore::Sequencer &osr)
2099 {
2100 SnapSet ss;
2101 int ret = get_snapset(store, coll, ghobj, ss);
2102 if (ret < 0)
2103 return ret;
2104
2105 // Use "head" to set head_exists incorrectly
2106 if (arg == "corrupt" || arg == "head")
2107 ss.head_exists = !ghobj.hobj.is_head();
2108 else if (ss.head_exists != ghobj.hobj.is_head()) {
2109 cerr << "Correcting head_exists, set to "
2110 << (ghobj.hobj.is_head() ? "true" : "false") << std::endl;
2111 ss.head_exists = ghobj.hobj.is_head();
2112 }
2113 // Use "corrupt" to clear entire SnapSet
2114 // Use "seq" to just corrupt SnapSet.seq
2115 if (arg == "corrupt" || arg == "seq")
2116 ss.seq = 0;
2117 // Use "snaps" to just clear SnapSet.snaps
2118 if (arg == "corrupt" || arg == "snaps")
2119 ss.snaps.clear();
2120 // By default just clear clone, clone_overlap and clone_size
2121 if (arg == "corrupt")
2122 arg = "";
2123 if (arg == "" || arg == "clones")
2124 ss.clones.clear();
2125 if (arg == "" || arg == "clone_overlap")
2126 ss.clone_overlap.clear();
2127 if (arg == "" || arg == "clone_size")
2128 ss.clone_size.clear();
2129 // Break all clone sizes by adding 1
2130 if (arg == "size") {
2131 for (map<snapid_t, uint64_t>::iterator i = ss.clone_size.begin();
2132 i != ss.clone_size.end(); ++i)
2133 ++(i->second);
2134 }
2135
2136 if (!dry_run) {
2137 bufferlist bl;
2138 ::encode(ss, bl);
2139 ObjectStore::Transaction t;
2140 t.setattr(coll, ghobj, SS_ATTR, bl);
2141 int r = store->apply_transaction(&osr, std::move(t));
2142 if (r < 0) {
2143 cerr << "Error setting snapset on : " << make_pair(coll, ghobj) << ", "
2144 << cpp_strerror(r) << std::endl;
2145 return r;
2146 }
2147 }
2148 return 0;
2149 }
2150
2151 vector<snapid_t>::iterator find(vector<snapid_t> &v, snapid_t clid)
2152 {
2153 return std::find(v.begin(), v.end(), clid);
2154 }
2155
2156 map<snapid_t, interval_set<uint64_t> >::iterator
2157 find(map<snapid_t, interval_set<uint64_t> > &m, snapid_t clid)
2158 {
2159 return m.find(clid);
2160 }
2161
2162 map<snapid_t, uint64_t>::iterator find(map<snapid_t, uint64_t> &m,
2163 snapid_t clid)
2164 {
2165 return m.find(clid);
2166 }
2167
2168 template<class T>
2169 int remove_from(T &mv, string name, snapid_t cloneid, bool force)
2170 {
2171 typename T::iterator i = find(mv, cloneid);
2172 if (i != mv.end()) {
2173 mv.erase(i);
2174 } else {
2175 cerr << "Clone " << cloneid << " doesn't exist in " << name;
2176 if (force) {
2177 cerr << " (ignored)" << std::endl;
2178 return 0;
2179 }
2180 cerr << std::endl;
2181 return -EINVAL;
2182 }
2183 return 0;
2184 }
2185
2186 int remove_clone(ObjectStore *store, coll_t coll, ghobject_t &ghobj, snapid_t cloneid, bool force,
2187 ObjectStore::Sequencer &osr)
2188 {
2189 // XXX: Don't allow this if in a cache tier or former cache tier
2190 // bool allow_incomplete_clones() const {
2191 // return cache_mode != CACHEMODE_NONE || has_flag(FLAG_INCOMPLETE_CLONES);
2192
2193 SnapSet snapset;
2194 int ret = get_snapset(store, coll, ghobj, snapset);
2195 if (ret < 0)
2196 return ret;
2197
2198 // Derived from trim_object()
2199 // ...from snapset
2200 vector<snapid_t>::iterator p;
2201 for (p = snapset.clones.begin(); p != snapset.clones.end(); ++p)
2202 if (*p == cloneid)
2203 break;
2204 if (p == snapset.clones.end()) {
2205 cerr << "Clone " << cloneid << " not present";
2206 return -ENOENT;
2207 }
2208 if (p != snapset.clones.begin()) {
2209 // not the oldest... merge overlap into next older clone
2210 vector<snapid_t>::iterator n = p - 1;
2211 hobject_t prev_coid = ghobj.hobj;
2212 prev_coid.snap = *n;
2213 //bool adjust_prev_bytes = is_present_clone(prev_coid);
2214
2215 //if (adjust_prev_bytes)
2216 // ctx->delta_stats.num_bytes -= snapset.get_clone_bytes(*n);
2217
2218 snapset.clone_overlap[*n].intersection_of(
2219 snapset.clone_overlap[*p]);
2220
2221 //if (adjust_prev_bytes)
2222 // ctx->delta_stats.num_bytes += snapset.get_clone_bytes(*n);
2223 }
2224
2225 ret = remove_from(snapset.clones, "clones", cloneid, force);
2226 if (ret) return ret;
2227 ret = remove_from(snapset.clone_overlap, "clone_overlap", cloneid, force);
2228 if (ret) return ret;
2229 ret = remove_from(snapset.clone_size, "clone_size", cloneid, force);
2230 if (ret) return ret;
2231
2232 if (dry_run)
2233 return 0;
2234
2235 bufferlist bl;
2236 ::encode(snapset, bl);
2237 ObjectStore::Transaction t;
2238 t.setattr(coll, ghobj, SS_ATTR, bl);
2239 int r = store->apply_transaction(&osr, std::move(t));
2240 if (r < 0) {
2241 cerr << "Error setting snapset on : " << make_pair(coll, ghobj) << ", "
2242 << cpp_strerror(r) << std::endl;
2243 return r;
2244 }
2245 cout << "Removal of clone " << cloneid << " complete" << std::endl;
2246 cout << "Use pg repair after OSD restarted to correct stat information" << std::endl;
2247 return 0;
2248 }
2249
2250 int dup(string srcpath, ObjectStore *src, string dstpath, ObjectStore *dst)
2251 {
2252 cout << "dup from " << src->get_type() << ": " << srcpath << "\n"
2253 << " to " << dst->get_type() << ": " << dstpath
2254 << std::endl;
2255 ObjectStore::Sequencer osr("dup");
2256 int num, i;
2257 vector<coll_t> collections;
2258 int r;
2259
2260 r = src->mount();
2261 if (r < 0) {
2262 cerr << "failed to mount src: " << cpp_strerror(r) << std::endl;
2263 return r;
2264 }
2265 r = dst->mount();
2266 if (r < 0) {
2267 cerr << "failed to mount dst: " << cpp_strerror(r) << std::endl;
2268 goto out_src;
2269 }
2270
2271 if (src->get_fsid() != dst->get_fsid()) {
2272 cerr << "src fsid " << src->get_fsid() << " != dest " << dst->get_fsid()
2273 << std::endl;
2274 goto out;
2275 }
2276 cout << "fsid " << src->get_fsid() << std::endl;
2277
2278 // make sure dst is empty
2279 r = dst->list_collections(collections);
2280 if (r < 0) {
2281 cerr << "error listing collections on dst: " << cpp_strerror(r) << std::endl;
2282 goto out;
2283 }
2284 if (!collections.empty()) {
2285 cerr << "destination store is not empty" << std::endl;
2286 goto out;
2287 }
2288
2289 r = src->list_collections(collections);
2290 if (r < 0) {
2291 cerr << "error listing collections on src: " << cpp_strerror(r) << std::endl;
2292 goto out;
2293 }
2294
2295 num = collections.size();
2296 cout << num << " collections" << std::endl;
2297 i = 1;
2298 for (auto cid : collections) {
2299 cout << i++ << "/" << num << " " << cid << std::endl;
2300 {
2301 ObjectStore::Transaction t;
2302 int bits = src->collection_bits(cid);
2303 if (bits < 0) {
2304 cerr << "cannot get bit count for collection " << cid << ": "
2305 << cpp_strerror(bits) << std::endl;
2306 goto out;
2307 }
2308 t.create_collection(cid, bits);
2309 dst->apply_transaction(&osr, std::move(t));
2310 }
2311
2312 ghobject_t pos;
2313 uint64_t n = 0;
2314 uint64_t bytes = 0, keys = 0;
2315 while (true) {
2316 vector<ghobject_t> ls;
2317 r = src->collection_list(cid, pos, ghobject_t::get_max(), 1000, &ls, &pos);
2318 if (r < 0) {
2319 cerr << "collection_list on " << cid << " from " << pos << " got: "
2320 << cpp_strerror(r) << std::endl;
2321 goto out;
2322 }
2323 if (ls.empty()) {
2324 break;
2325 }
2326
2327 for (auto& oid : ls) {
2328 //cout << " " << cid << " " << oid << std::endl;
2329 if (n % 100 == 0) {
2330 cout << " " << std::setw(16) << n << " objects, "
2331 << std::setw(16) << bytes << " bytes, "
2332 << std::setw(16) << keys << " keys"
2333 << std::setw(1) << "\r" << std::flush;
2334 }
2335 n++;
2336
2337 ObjectStore::Transaction t;
2338 t.touch(cid, oid);
2339
2340 map<string,bufferptr> attrs;
2341 src->getattrs(cid, oid, attrs);
2342 if (!attrs.empty()) {
2343 t.setattrs(cid, oid, attrs);
2344 }
2345
2346 bufferlist bl;
2347 src->read(cid, oid, 0, 0, bl);
2348 if (bl.length()) {
2349 t.write(cid, oid, 0, bl.length(), bl);
2350 bytes += bl.length();
2351 }
2352
2353 bufferlist header;
2354 map<string,bufferlist> omap;
2355 src->omap_get(cid, oid, &header, &omap);
2356 if (header.length()) {
2357 t.omap_setheader(cid, oid, header);
2358 ++keys;
2359 }
2360 if (!omap.empty()) {
2361 keys += omap.size();
2362 t.omap_setkeys(cid, oid, omap);
2363 }
2364
2365 dst->apply_transaction(&osr, std::move(t));
2366 }
2367 }
2368 cout << " " << std::setw(16) << n << " objects, "
2369 << std::setw(16) << bytes << " bytes, "
2370 << std::setw(16) << keys << " keys"
2371 << std::setw(1) << std::endl;
2372 }
2373
2374 // keyring
2375 cout << "keyring" << std::endl;
2376 {
2377 bufferlist bl;
2378 string s = srcpath + "/keyring";
2379 string err;
2380 r = bl.read_file(s.c_str(), &err);
2381 if (r < 0) {
2382 cerr << "failed to copy " << s << ": " << err << std::endl;
2383 } else {
2384 string d = dstpath + "/keyring";
2385 bl.write_file(d.c_str(), 0600);
2386 }
2387 }
2388
2389 // osd metadata
2390 cout << "duping osd metadata" << std::endl;
2391 {
2392 for (auto k : {"magic", "whoami", "ceph_fsid", "fsid"}) {
2393 string val;
2394 src->read_meta(k, &val);
2395 dst->write_meta(k, val);
2396 }
2397 }
2398
2399 dst->write_meta("ready", "ready");
2400
2401 cout << "done." << std::endl;
2402 r = 0;
2403 out:
2404 dst->umount();
2405 out_src:
2406 src->umount();
2407 return r;
2408 }
2409
2410 void usage(po::options_description &desc)
2411 {
2412 cerr << std::endl;
2413 cerr << desc << std::endl;
2414 cerr << std::endl;
2415 cerr << "Positional syntax:" << std::endl;
2416 cerr << std::endl;
2417 cerr << "ceph-objectstore-tool ... <object> (get|set)-bytes [file]" << std::endl;
2418 cerr << "ceph-objectstore-tool ... <object> set-(attr|omap) <key> [file]" << std::endl;
2419 cerr << "ceph-objectstore-tool ... <object> (get|rm)-(attr|omap) <key>" << std::endl;
2420 cerr << "ceph-objectstore-tool ... <object> get-omaphdr" << std::endl;
2421 cerr << "ceph-objectstore-tool ... <object> set-omaphdr [file]" << std::endl;
2422 cerr << "ceph-objectstore-tool ... <object> list-attrs" << std::endl;
2423 cerr << "ceph-objectstore-tool ... <object> list-omap" << std::endl;
2424 cerr << "ceph-objectstore-tool ... <object> remove|removeall" << std::endl;
2425 cerr << "ceph-objectstore-tool ... <object> dump" << std::endl;
2426 cerr << "ceph-objectstore-tool ... <object> set-size" << std::endl;
2427 cerr << "ceph-objectstore-tool ... <object> remove-clone-metadata <cloneid>" << std::endl;
2428 cerr << std::endl;
2429 cerr << "<object> can be a JSON object description as displayed" << std::endl;
2430 cerr << "by --op list." << std::endl;
2431 cerr << "<object> can be an object name which will be looked up in all" << std::endl;
2432 cerr << "the OSD's PGs." << std::endl;
2433 cerr << "<object> can be the empty string ('') which with a provided pgid " << std::endl;
2434 cerr << "specifies the pgmeta object" << std::endl;
2435 cerr << std::endl;
2436 cerr << "The optional [file] argument will read stdin or write stdout" << std::endl;
2437 cerr << "if not specified or if '-' specified." << std::endl;
2438 }
2439
// Return true when `check` ends with `ending`.  An empty `ending` matches
// every string, including the empty one.
bool ends_with(const std::string& check, const std::string& ending)
{
  if (check.size() < ending.size())
    return false;
  // Compare only the trailing ending.size() characters instead of searching
  // the whole string for the last occurrence of `ending`.
  return check.compare(check.size() - ending.size(), ending.size(), ending) == 0;
}
2444
2445 // Based on FileStore::dump_journal(), set-up enough to only dump
2446 int mydump_journal(Formatter *f, string journalpath, bool m_journal_dio)
2447 {
2448 int r;
2449
2450 if (!journalpath.length())
2451 return -EINVAL;
2452
2453 FileJournal *journal = new FileJournal(g_ceph_context, uuid_d(), NULL, NULL,
2454 journalpath.c_str(), m_journal_dio);
2455 r = journal->_fdump(*f, false);
2456 delete journal;
2457 return r;
2458 }
2459
2460 int apply_layout_settings(ObjectStore *os, const OSDSuperblock &superblock,
2461 const string &pool_name, const spg_t &pgid, bool dry_run)
2462 {
2463 int r = 0;
2464
2465 FileStore *fs = dynamic_cast<FileStore*>(os);
2466 if (!fs) {
2467 cerr << "Nothing to do for non-filestore backend" << std::endl;
2468 return 0; // making this return success makes testing easier
2469 }
2470
2471 OSDMap curmap;
2472 bufferlist bl;
2473 r = get_osdmap(os, superblock.current_epoch, curmap, bl);
2474 if (r) {
2475 cerr << "Can't find local OSDMap: " << cpp_strerror(r) << std::endl;
2476 return r;
2477 }
2478
2479 int64_t poolid = -1;
2480 if (pool_name.length()) {
2481 poolid = curmap.lookup_pg_pool_name(pool_name);
2482 if (poolid < 0) {
2483 cerr << "Couldn't find pool " << pool_name << ": " << cpp_strerror(poolid)
2484 << std::endl;
2485 return poolid;
2486 }
2487 }
2488
2489 vector<coll_t> collections, filtered_colls;
2490 r = os->list_collections(collections);
2491 if (r < 0) {
2492 cerr << "Error listing collections: " << cpp_strerror(r) << std::endl;
2493 return r;
2494 }
2495
2496 for (auto const &coll : collections) {
2497 spg_t coll_pgid;
2498 if (coll.is_pg(&coll_pgid) &&
2499 ((poolid >= 0 && coll_pgid.pool() == (uint64_t)poolid) ||
2500 coll_pgid == pgid)) {
2501 filtered_colls.push_back(coll);
2502 }
2503 }
2504
2505 size_t done = 0, total = filtered_colls.size();
2506 for (auto const &coll : filtered_colls) {
2507 if (dry_run) {
2508 cerr << "Would apply layout settings to " << coll << std::endl;
2509 } else {
2510 cerr << "Finished " << done << "/" << total << " collections" << "\r";
2511 r = fs->apply_layout_settings(coll);
2512 if (r < 0) {
2513 cerr << "Error applying layout settings to " << coll << std::endl;
2514 return r;
2515 }
2516 }
2517 ++done;
2518 }
2519
2520 cerr << "Finished " << total << "/" << total << " collections" << "\r" << std::endl;
2521 return r;
2522 }
2523
2524 int main(int argc, char **argv)
2525 {
2526 string dpath, jpath, pgidstr, op, file, mountpoint, mon_store_path, object;
2527 string target_data_path, fsid;
2528 string objcmd, arg1, arg2, type, format, argnspace, pool;
2529 boost::optional<std::string> nspace;
2530 spg_t pgid;
2531 unsigned epoch = 0;
2532 ghobject_t ghobj;
2533 bool human_readable;
2534 bool force;
2535 Formatter *formatter;
2536 bool head;
2537
2538 po::options_description desc("Allowed options");
2539 desc.add_options()
2540 ("help", "produce help message")
2541 ("type", po::value<string>(&type),
2542 "Arg is one of [bluestore, filestore (default), memstore]")
2543 ("data-path", po::value<string>(&dpath),
2544 "path to object store, mandatory")
2545 ("journal-path", po::value<string>(&jpath),
2546 "path to journal, use if tool can't find it")
2547 ("pgid", po::value<string>(&pgidstr),
2548 "PG id, mandatory for info, log, remove, export, rm-past-intervals, mark-complete, and mandatory for apply-layout-settings if --pool is not specified")
2549 ("pool", po::value<string>(&pool),
2550 "Pool name, mandatory for apply-layout-settings if --pgid is not specified")
2551 ("op", po::value<string>(&op),
2552 "Arg is one of [info, log, remove, mkfs, fsck, fuse, dup, export, import, list, fix-lost, list-pgs, rm-past-intervals, dump-journal, dump-super, meta-list, "
2553 "get-osdmap, set-osdmap, get-inc-osdmap, set-inc-osdmap, mark-complete, apply-layout-settings, update-mon-db]")
2554 ("epoch", po::value<unsigned>(&epoch),
2555 "epoch# for get-osdmap and get-inc-osdmap, the current epoch in use if not specified")
2556 ("file", po::value<string>(&file),
2557 "path of file to export, import, get-osdmap, set-osdmap, get-inc-osdmap or set-inc-osdmap")
2558 ("mon-store-path", po::value<string>(&mon_store_path),
2559 "path of monstore to update-mon-db")
2560 ("fsid", po::value<string>(&fsid),
2561 "fsid for new store created by mkfs")
2562 ("target-data-path", po::value<string>(&target_data_path),
2563 "path of target object store (for --op dup)")
2564 ("mountpoint", po::value<string>(&mountpoint),
2565 "fuse mountpoint")
2566 ("format", po::value<string>(&format)->default_value("json-pretty"),
2567 "Output format which may be json, json-pretty, xml, xml-pretty")
2568 ("debug", "Enable diagnostic output to stderr")
2569 ("force", "Ignore some types of errors and proceed with operation - USE WITH CAUTION: CORRUPTION POSSIBLE NOW OR IN THE FUTURE")
2570 ("skip-journal-replay", "Disable journal replay")
2571 ("skip-mount-omap", "Disable mounting of omap")
2572 ("head", "Find head/snapdir when searching for objects by name")
2573 ("dry-run", "Don't modify the objectstore")
2574 ("namespace", po::value<string>(&argnspace), "Specify namespace when searching for objects")
2575 ;
2576
2577 po::options_description positional("Positional options");
2578 positional.add_options()
2579 ("object", po::value<string>(&object), "'' for pgmeta_oid, object name or ghobject in json")
2580 ("objcmd", po::value<string>(&objcmd), "command [(get|set)-bytes, (get|set|rm)-(attr|omap), (get|set)-omaphdr, list-attrs, list-omap, remove]")
2581 ("arg1", po::value<string>(&arg1), "arg1 based on cmd")
2582 ("arg2", po::value<string>(&arg2), "arg2 based on cmd")
2583 ("test-align", po::value<uint64_t>(&testalign)->default_value(0), "hidden align option for testing")
2584 ;
2585
2586 po::options_description all("All options");
2587 all.add(desc).add(positional);
2588
2589 po::positional_options_description pd;
2590 pd.add("object", 1).add("objcmd", 1).add("arg1", 1).add("arg2", 1);
2591
2592 vector<string> ceph_option_strings;
2593 po::variables_map vm;
2594 try {
2595 po::parsed_options parsed =
2596 po::command_line_parser(argc, argv).options(all).allow_unregistered().positional(pd).run();
2597 po::store( parsed, vm);
2598 po::notify(vm);
2599 ceph_option_strings = po::collect_unrecognized(parsed.options,
2600 po::include_positional);
2601 } catch(po::error &e) {
2602 std::cerr << e.what() << std::endl;
2603 return 1;
2604 }
2605
2606 if (vm.count("help")) {
2607 usage(all);
2608 return 1;
2609 }
2610
2611 if (!vm.count("debug")) {
2612 debug = false;
2613 } else {
2614 debug = true;
2615 }
2616
2617 if (!vm.count("force")) {
2618 force = false;
2619 } else {
2620 force = true;
2621 }
2622
2623 if (vm.count("namespace"))
2624 nspace = argnspace;
2625
2626 if (vm.count("dry-run"))
2627 dry_run = true;
2628 osflagbits_t flags = 0;
2629 if (dry_run || vm.count("skip-journal-replay"))
2630 flags |= SKIP_JOURNAL_REPLAY;
2631 if (vm.count("skip-mount-omap"))
2632 flags |= SKIP_MOUNT_OMAP;
2633 if (op == "update-mon-db")
2634 flags |= SKIP_JOURNAL_REPLAY;
2635 head = (vm.count("head") > 0);
2636
2637 vector<const char *> ceph_options;
2638 env_to_vec(ceph_options);
2639 ceph_options.reserve(ceph_options.size() + ceph_option_strings.size());
2640 for (vector<string>::iterator i = ceph_option_strings.begin();
2641 i != ceph_option_strings.end();
2642 ++i) {
2643 ceph_options.push_back(i->c_str());
2644 }
2645
2646 char fn[PATH_MAX];
2647 snprintf(fn, sizeof(fn), "%s/type", dpath.c_str());
2648 int fd = ::open(fn, O_RDONLY);
2649 if (fd >= 0) {
2650 bufferlist bl;
2651 bl.read_fd(fd, 64);
2652 if (bl.length()) {
2653 string dp_type = string(bl.c_str(), bl.length() - 1); // drop \n
2654 if (vm.count("type") && dp_type != "" && type != dp_type)
2655 cerr << "WARNING: Ignoring type \"" << type << "\" - found data-path type \""
2656 << dp_type << "\"" << std::endl;
2657 type = dp_type;
2658 //cout << "object store type is " << type << std::endl;
2659 }
2660 ::close(fd);
2661 }
2662 if (!vm.count("type") && type == "") {
2663 type = "filestore";
2664 }
2665 if (!vm.count("data-path") &&
2666 !(op == "dump-journal" && type == "filestore")) {
2667 cerr << "Must provide --data-path" << std::endl;
2668 usage(desc);
2669 return 1;
2670 }
2671 if (type == "filestore" && !vm.count("journal-path")) {
2672 jpath = dpath + "/journal";
2673 }
2674 if (!vm.count("op") && !vm.count("object")) {
2675 cerr << "Must provide --op or object command..." << std::endl;
2676 usage(desc);
2677 return 1;
2678 }
2679 if (op != "list" &&
2680 vm.count("op") && vm.count("object")) {
2681 cerr << "Can't specify both --op and object command syntax" << std::endl;
2682 usage(desc);
2683 return 1;
2684 }
2685 if (op == "apply-layout-settings" && !(vm.count("pool") ^ vm.count("pgid"))) {
2686 cerr << "apply-layout-settings requires either --pool or --pgid"
2687 << std::endl;
2688 usage(desc);
2689 return 1;
2690 }
2691 if (op != "list" && vm.count("object") && !vm.count("objcmd")) {
2692 cerr << "Invalid syntax, missing command" << std::endl;
2693 usage(desc);
2694 return 1;
2695 }
2696 if (op == "fuse" && mountpoint.length() == 0) {
2697 cerr << "Missing fuse mountpoint" << std::endl;
2698 usage(desc);
2699 return 1;
2700 }
2701 outistty = isatty(STDOUT_FILENO);
2702
2703 file_fd = fd_none;
2704 if ((op == "export" || op == "get-osdmap" || op == "get-inc-osdmap") && !dry_run) {
2705 if (!vm.count("file") || file == "-") {
2706 if (outistty) {
2707 cerr << "stdout is a tty and no --file filename specified" << std::endl;
2708 return 1;
2709 }
2710 file_fd = STDOUT_FILENO;
2711 } else {
2712 file_fd = open(file.c_str(), O_WRONLY|O_CREAT|O_TRUNC, 0666);
2713 }
2714 } else if (op == "import" || op == "set-osdmap" || op == "set-inc-osdmap") {
2715 if (!vm.count("file") || file == "-") {
2716 if (isatty(STDIN_FILENO)) {
2717 cerr << "stdin is a tty and no --file filename specified" << std::endl;
2718 return 1;
2719 }
2720 file_fd = STDIN_FILENO;
2721 } else {
2722 file_fd = open(file.c_str(), O_RDONLY);
2723 }
2724 }
2725
2726 ObjectStoreTool tool = ObjectStoreTool(file_fd, dry_run);
2727
2728 if (vm.count("file") && file_fd == fd_none && !dry_run) {
2729 cerr << "--file option only applies to import, export, "
2730 << "get-osdmap, set-osdmap, get-inc-osdmap or set-inc-osdmap" << std::endl;
2731 return 1;
2732 }
2733
2734 if (file_fd != fd_none && file_fd < 0) {
2735 string err = string("file: ") + file;
2736 perror(err.c_str());
2737 return 1;
2738 }
2739
2740 auto cct = global_init(
2741 NULL, ceph_options, CEPH_ENTITY_TYPE_OSD,
2742 CODE_ENVIRONMENT_UTILITY_NODOUT, 0);
2743 //CINIT_FLAG_NO_DEFAULT_CONFIG_FILE);
2744 common_init_finish(g_ceph_context);
2745 g_conf = g_ceph_context->_conf;
2746 if (debug) {
2747 g_conf->set_val_or_die("log_to_stderr", "true");
2748 g_conf->set_val_or_die("err_to_stderr", "true");
2749 }
2750 g_conf->apply_changes(NULL);
2751
2752 // Special list handling. Treating pretty_format as human readable,
2753 // with one object per line and not an enclosing array.
2754 human_readable = ends_with(format, "-pretty");
2755 if ((op == "list" || op == "meta-list") && human_readable) {
2756 // Remove -pretty from end of format which we know is there
2757 format = format.substr(0, format.size() - strlen("-pretty"));
2758 }
2759
2760 formatter = Formatter::create(format);
2761 if (formatter == NULL) {
2762 cerr << "unrecognized format: " << format << std::endl;
2763 return 1;
2764 }
2765
2766 // Special handling for filestore journal, so we can dump it without mounting
2767 if (op == "dump-journal" && type == "filestore") {
2768 int ret = mydump_journal(formatter, jpath, g_conf->journal_dio);
2769 if (ret < 0) {
2770 cerr << "journal-path: " << jpath << ": "
2771 << cpp_strerror(ret) << std::endl;
2772 return 1;
2773 }
2774 formatter->flush(cout);
2775 return 0;
2776 }
2777
2778 //Verify that data-path really exists
2779 struct stat st;
2780 if (::stat(dpath.c_str(), &st) == -1) {
2781 string err = string("data-path: ") + dpath;
2782 perror(err.c_str());
2783 return 1;
2784 }
2785
2786 if (pgidstr.length() && !pgid.parse(pgidstr.c_str())) {
2787 cerr << "Invalid pgid '" << pgidstr << "' specified" << std::endl;
2788 return 1;
2789 }
2790
2791 ObjectStore *fs = ObjectStore::create(g_ceph_context, type, dpath, jpath, flags);
2792 if (fs == NULL) {
2793 cerr << "Unable to create store of type " << type << std::endl;
2794 return 1;
2795 }
2796
2797 if (op == "fsck" || op == "fsck-deep") {
2798 int r = fs->fsck(op == "fsck-deep");
2799 if (r < 0) {
2800 cerr << "fsck failed: " << cpp_strerror(r) << std::endl;
2801 return 1;
2802 }
2803 if (r > 0) {
2804 cerr << "fsck found " << r << " errors" << std::endl;
2805 return 1;
2806 }
2807 cout << "fsck found no errors" << std::endl;
2808 return 0;
2809 }
2810 if (op == "mkfs") {
2811 if (fsid.length()) {
2812 uuid_d f;
2813 bool r = f.parse(fsid.c_str());
2814 if (!r) {
2815 cerr << "failed to parse uuid '" << fsid << "'" << std::endl;
2816 return 1;
2817 }
2818 fs->set_fsid(f);
2819 }
2820 int r = fs->mkfs();
2821 if (r < 0) {
2822 cerr << "fsck failed: " << cpp_strerror(r) << std::endl;
2823 return 1;
2824 }
2825 return 0;
2826 }
2827 if (op == "dup") {
2828 string target_type;
2829 char fn[PATH_MAX];
2830 snprintf(fn, sizeof(fn), "%s/type", target_data_path.c_str());
2831 int fd = ::open(fn, O_RDONLY);
2832 if (fd < 0) {
2833 cerr << "Unable to open " << target_data_path << "/type" << std::endl;
2834 exit(1);
2835 }
2836 bufferlist bl;
2837 bl.read_fd(fd, 64);
2838 if (bl.length()) {
2839 target_type = string(bl.c_str(), bl.length() - 1); // drop \n
2840 }
2841 ::close(fd);
2842 ObjectStore *targetfs = ObjectStore::create(
2843 g_ceph_context, target_type,
2844 target_data_path, "", 0);
2845 if (targetfs == NULL) {
2846 cerr << "Unable to open store of type " << target_type << std::endl;
2847 return 1;
2848 }
2849 int r = dup(dpath, fs, target_data_path, targetfs);
2850 if (r < 0) {
2851 cerr << "dup failed: " << cpp_strerror(r) << std::endl;
2852 return 1;
2853 }
2854 return 0;
2855 }
2856
2857 ObjectStore::Sequencer *osr = new ObjectStore::Sequencer(__func__);
2858 int ret = fs->mount();
2859 if (ret < 0) {
2860 if (ret == -EBUSY) {
2861 cerr << "OSD has the store locked" << std::endl;
2862 } else {
2863 cerr << "Mount failed with '" << cpp_strerror(ret) << "'" << std::endl;
2864 }
2865 return 1;
2866 }
2867
2868 if (op == "fuse") {
2869 #ifdef HAVE_LIBFUSE
2870 FuseStore fuse(fs, mountpoint);
2871 cout << "mounting fuse at " << mountpoint << " ..." << std::endl;
2872 int r = fuse.main();
2873 if (r < 0) {
2874 cerr << "failed to mount fuse: " << cpp_strerror(r) << std::endl;
2875 return 1;
2876 }
2877 #else
2878 cerr << "fuse support not enabled" << std::endl;
2879 #endif
2880 return 0;
2881 }
2882
2883 vector<coll_t> ls;
2884 vector<coll_t>::iterator it;
2885 CompatSet supported;
2886
2887 #ifdef INTERNAL_TEST
2888 supported = get_test_compat_set();
2889 #else
2890 supported = OSD::get_osd_compat_set();
2891 #endif
2892
2893 bufferlist bl;
2894 OSDSuperblock superblock;
2895 bufferlist::iterator p;
2896 ret = fs->read(coll_t::meta(), OSD_SUPERBLOCK_GOBJECT, 0, 0, bl);
2897 if (ret < 0) {
2898 cerr << "Failure to read OSD superblock: " << cpp_strerror(ret) << std::endl;
2899 goto out;
2900 }
2901
2902 p = bl.begin();
2903 ::decode(superblock, p);
2904
2905 if (debug) {
2906 cerr << "Cluster fsid=" << superblock.cluster_fsid << std::endl;
2907 }
2908
2909 if (debug) {
2910 cerr << "Supported features: " << supported << std::endl;
2911 cerr << "On-disk features: " << superblock.compat_features << std::endl;
2912 }
2913 if (supported.compare(superblock.compat_features) == -1) {
2914 CompatSet unsupported = supported.unsupported(superblock.compat_features);
2915 cerr << "On-disk OSD incompatible features set "
2916 << unsupported << std::endl;
2917 ret = -EINVAL;
2918 goto out;
2919 }
2920
2921 if (op == "apply-layout-settings") {
2922 ret = apply_layout_settings(fs, superblock, pool, pgid, dry_run);
2923 goto out;
2924 }
2925
2926 if (op != "list" && vm.count("object")) {
2927 // Special case: Create pgmeta_oid if empty string specified
2928 // This can't conflict with any actual object names.
2929 if (object == "") {
2930 ghobj = pgid.make_pgmeta_oid();
2931 } else {
2932 json_spirit::Value v;
2933 try {
2934 if (!json_spirit::read(object, v) ||
2935 (v.type() != json_spirit::array_type && v.type() != json_spirit::obj_type)) {
2936 // Special: Need head/snapdir so set even if user didn't specify
2937 if (vm.count("objcmd") && (objcmd == "remove-clone-metadata"))
2938 head = true;
2939 lookup_ghobject lookup(object, nspace, head);
2940 if (action_on_all_objects(fs, lookup, debug)) {
2941 throw std::runtime_error("Internal error");
2942 } else {
2943 if (lookup.size() != 1) {
2944 stringstream ss;
2945 if (lookup.size() == 0)
2946 ss << "No object id '" << object << "' found or invalid JSON specified";
2947 else
2948 ss << "Found " << lookup.size() << " objects with id '" << object
2949 << "', please use a JSON spec from --op list instead";
2950 throw std::runtime_error(ss.str());
2951 }
2952 pair<coll_t, ghobject_t> found = lookup.pop();
2953 pgidstr = found.first.to_str();
2954 pgid.parse(pgidstr.c_str());
2955 ghobj = found.second;
2956 }
2957 } else {
2958 stringstream ss;
2959 if (pgidstr.length() == 0 && v.type() != json_spirit::array_type) {
2960 ss << "Without --pgid the object '" << object
2961 << "' must be a JSON array";
2962 throw std::runtime_error(ss.str());
2963 }
2964 if (v.type() == json_spirit::array_type) {
2965 json_spirit::Array array = v.get_array();
2966 if (array.size() != 2) {
2967 ss << "Object '" << object
2968 << "' must be a JSON array with 2 elements";
2969 throw std::runtime_error(ss.str());
2970 }
2971 vector<json_spirit::Value>::iterator i = array.begin();
2972 assert(i != array.end());
2973 if (i->type() != json_spirit::str_type) {
2974 ss << "Object '" << object
2975 << "' must be a JSON array with the first element a string";
2976 throw std::runtime_error(ss.str());
2977 }
2978 string object_pgidstr = i->get_str();
2979 if (object_pgidstr != "meta") {
2980 spg_t object_pgid;
2981 object_pgid.parse(object_pgidstr.c_str());
2982 if (pgidstr.length() > 0) {
2983 if (object_pgid != pgid) {
2984 ss << "object '" << object
2985 << "' has a pgid different from the --pgid="
2986 << pgidstr << " option";
2987 throw std::runtime_error(ss.str());
2988 }
2989 } else {
2990 pgidstr = object_pgidstr;
2991 pgid = object_pgid;
2992 }
2993 } else {
2994 pgidstr = object_pgidstr;
2995 }
2996 ++i;
2997 v = *i;
2998 }
2999 try {
3000 ghobj.decode(v);
3001 } catch (std::runtime_error& e) {
3002 ss << "Decode object JSON error: " << e.what();
3003 throw std::runtime_error(ss.str());
3004 }
3005 if (pgidstr != "meta" && (uint64_t)pgid.pgid.m_pool != (uint64_t)ghobj.hobj.pool) {
3006 cerr << "Object pool and pgid pool don't match" << std::endl;
3007 ret = 1;
3008 goto out;
3009 }
3010 }
3011 } catch (std::runtime_error& e) {
3012 cerr << e.what() << std::endl;
3013 ret = 1;
3014 goto out;
3015 }
3016 }
3017 }
3018
3019 // The ops which require --pgid option are checked here and
3020 // mentioned in the usage for --pgid.
3021 if ((op == "info" || op == "log" || op == "remove" || op == "export"
3022 || op == "rm-past-intervals" || op == "mark-complete") &&
3023 pgidstr.length() == 0) {
3024 cerr << "Must provide pgid" << std::endl;
3025 usage(desc);
3026 ret = 1;
3027 goto out;
3028 }
3029
3030 if (op == "import") {
3031
3032 try {
3033 ret = tool.do_import(fs, superblock, force, pgidstr, *osr);
3034 }
3035 catch (const buffer::error &e) {
3036 cerr << "do_import threw exception error " << e.what() << std::endl;
3037 ret = -EFAULT;
3038 }
3039 if (ret == -EFAULT) {
3040 cerr << "Corrupt input for import" << std::endl;
3041 }
3042 if (ret == 0)
3043 cout << "Import successful" << std::endl;
3044 goto out;
3045 } else if (op == "dump-journal-mount") {
3046 // Undocumented feature to dump journal with mounted fs
3047 // This doesn't support the format option, but it uses the
3048 // ObjectStore::dump_journal() and mounts to get replay to run.
3049 ret = fs->dump_journal(cout);
3050 if (ret) {
3051 if (ret == -EOPNOTSUPP) {
3052 cerr << "Object store type \"" << type << "\" doesn't support journal dump" << std::endl;
3053 } else {
3054 cerr << "Journal dump failed with error " << cpp_strerror(ret) << std::endl;
3055 }
3056 }
3057 goto out;
3058 } else if (op == "get-osdmap") {
3059 bufferlist bl;
3060 OSDMap osdmap;
3061 if (epoch == 0) {
3062 epoch = superblock.current_epoch;
3063 }
3064 ret = get_osdmap(fs, epoch, osdmap, bl);
3065 if (ret) {
3066 cerr << "Failed to get osdmap#" << epoch << ": "
3067 << cpp_strerror(ret) << std::endl;
3068 goto out;
3069 }
3070 ret = bl.write_fd(file_fd);
3071 if (ret) {
3072 cerr << "Failed to write to " << file << ": " << cpp_strerror(ret) << std::endl;
3073 } else {
3074 cout << "osdmap#" << epoch << " exported." << std::endl;
3075 }
3076 goto out;
3077 } else if (op == "set-osdmap") {
3078 bufferlist bl;
3079 ret = get_fd_data(file_fd, bl);
3080 if (ret < 0) {
3081 cerr << "Failed to read osdmap " << cpp_strerror(ret) << std::endl;
3082 } else {
3083 ret = set_osdmap(fs, epoch, bl, force, *osr);
3084 }
3085 goto out;
3086 } else if (op == "get-inc-osdmap") {
3087 bufferlist bl;
3088 if (epoch == 0) {
3089 epoch = superblock.current_epoch;
3090 }
3091 ret = get_inc_osdmap(fs, epoch, bl);
3092 if (ret < 0) {
3093 cerr << "Failed to get incremental osdmap# " << epoch << ": "
3094 << cpp_strerror(ret) << std::endl;
3095 goto out;
3096 }
3097 ret = bl.write_fd(file_fd);
3098 if (ret) {
3099 cerr << "Failed to write to " << file << ": " << cpp_strerror(ret) << std::endl;
3100 } else {
3101 cout << "inc-osdmap#" << epoch << " exported." << std::endl;
3102 }
3103 goto out;
3104 } else if (op == "set-inc-osdmap") {
3105 bufferlist bl;
3106 ret = get_fd_data(file_fd, bl);
3107 if (ret < 0) {
3108 cerr << "Failed to read incremental osdmap " << cpp_strerror(ret) << std::endl;
3109 goto out;
3110 } else {
3111 ret = set_inc_osdmap(fs, epoch, bl, force, *osr);
3112 }
3113 goto out;
3114 } else if (op == "update-mon-db") {
3115 if (!vm.count("mon-store-path")) {
3116 cerr << "Please specify the path to monitor db to update" << std::endl;
3117 ret = -EINVAL;
3118 } else {
3119 ret = update_mon_db(*fs, superblock, dpath + "/keyring", mon_store_path);
3120 }
3121 goto out;
3122 }
3123
3124 log_oid = OSD::make_pg_log_oid(pgid);
3125 biginfo_oid = OSD::make_pg_biginfo_oid(pgid);
3126
3127 if (op == "remove") {
3128 ret = initiate_new_remove_pg(fs, pgid, *osr);
3129 if (ret < 0) {
3130 cerr << "PG '" << pgid << "' not found" << std::endl;
3131 goto out;
3132 }
3133 cout << "Remove successful" << std::endl;
3134 goto out;
3135 }
3136
3137 if (op == "fix-lost") {
3138 boost::scoped_ptr<action_on_object_t> action;
3139 action.reset(new do_fix_lost(osr));
3140 if (pgidstr.length())
3141 ret = action_on_all_objects_in_exact_pg(fs, coll_t(pgid), *action, debug);
3142 else
3143 ret = action_on_all_objects(fs, *action, debug);
3144 goto out;
3145 }
3146
3147 if (op == "list") {
3148 ret = do_list(fs, pgidstr, object, nspace, formatter, debug,
3149 human_readable, head);
3150 if (ret < 0) {
3151 cerr << "do_list failed: " << cpp_strerror(ret) << std::endl;
3152 }
3153 goto out;
3154 }
3155
3156 if (op == "dump-super") {
3157 formatter->open_object_section("superblock");
3158 superblock.dump(formatter);
3159 formatter->close_section();
3160 formatter->flush(cout);
3161 cout << std::endl;
3162 goto out;
3163 }
3164
3165 if (op == "meta-list") {
3166 ret = do_meta(fs, object, formatter, debug, human_readable);
3167 if (ret < 0) {
3168 cerr << "do_meta failed: " << cpp_strerror(ret) << std::endl;
3169 }
3170 goto out;
3171 }
3172
3173 ret = fs->list_collections(ls);
3174 if (ret < 0) {
3175 cerr << "failed to list pgs: " << cpp_strerror(ret) << std::endl;
3176 goto out;
3177 }
3178
3179 if (debug && op == "list-pgs")
3180 cout << "Performing list-pgs operation" << std::endl;
3181
3182 // Find pg
3183 for (it = ls.begin(); it != ls.end(); ++it) {
3184 spg_t tmppgid;
3185
3186 if (pgidstr == "meta") {
3187 if (it->to_str() == "meta")
3188 break;
3189 else
3190 continue;
3191 }
3192
3193 if (!it->is_pg(&tmppgid)) {
3194 continue;
3195 }
3196
3197 if (it->is_temp(&tmppgid)) {
3198 continue;
3199 }
3200
3201 if (op != "list-pgs" && tmppgid != pgid) {
3202 continue;
3203 }
3204
3205 if (op != "list-pgs") {
3206 //Found!
3207 break;
3208 }
3209
3210 cout << tmppgid << std::endl;
3211 }
3212
3213 if (op == "list-pgs") {
3214 ret = 0;
3215 goto out;
3216 }
3217
3218 // If not an object command nor any of the ops handled below, then output this usage
3219 // before complaining about a bad pgid
3220 if (!vm.count("objcmd") && op != "export" && op != "info" && op != "log" && op != "rm-past-intervals" && op != "mark-complete") {
3221 cerr << "Must provide --op (info, log, remove, mkfs, fsck, export, import, list, fix-lost, list-pgs, rm-past-intervals, dump-journal, dump-super, meta-list, "
3222 "get-osdmap, set-osdmap, get-inc-osdmap, set-inc-osdmap, mark-complete)"
3223 << std::endl;
3224 usage(desc);
3225 ret = 1;
3226 goto out;
3227 }
3228 epoch_t map_epoch;
3229 // The following code for export, info, log require omap or !skip-mount-omap
3230 if (it != ls.end()) {
3231
3232 coll_t coll = *it;
3233
3234 if (vm.count("objcmd")) {
3235 ret = 0;
3236 if (objcmd == "remove" || objcmd == "removeall") {
3237 bool all = (objcmd == "removeall");
3238 ret = do_remove_object(fs, coll, ghobj, all, force, *osr);
3239 goto out;
3240 } else if (objcmd == "list-attrs") {
3241 ret = do_list_attrs(fs, coll, ghobj);
3242 goto out;
3243 } else if (objcmd == "list-omap") {
3244 ret = do_list_omap(fs, coll, ghobj);
3245 goto out;
3246 } else if (objcmd == "get-bytes" || objcmd == "set-bytes") {
3247 if (objcmd == "get-bytes") {
3248 int fd;
3249 if (vm.count("arg1") == 0 || arg1 == "-") {
3250 fd = STDOUT_FILENO;
3251 } else {
3252 fd = open(arg1.c_str(), O_WRONLY|O_TRUNC|O_CREAT|O_EXCL|O_LARGEFILE, 0666);
3253 if (fd == -1) {
3254 cerr << "open " << arg1 << " " << cpp_strerror(errno) << std::endl;
3255 ret = 1;
3256 goto out;
3257 }
3258 }
3259 ret = do_get_bytes(fs, coll, ghobj, fd);
3260 if (fd != STDOUT_FILENO)
3261 close(fd);
3262 } else {
3263 int fd;
3264 if (vm.count("arg1") == 0 || arg1 == "-") {
3265 // Since read_fd() doesn't handle ^D from a tty stdin, don't allow it.
3266 if (isatty(STDIN_FILENO)) {
3267 cerr << "stdin is a tty and no file specified" << std::endl;
3268 ret = 1;
3269 goto out;
3270 }
3271 fd = STDIN_FILENO;
3272 } else {
3273 fd = open(arg1.c_str(), O_RDONLY|O_LARGEFILE, 0666);
3274 if (fd == -1) {
3275 cerr << "open " << arg1 << " " << cpp_strerror(errno) << std::endl;
3276 ret = 1;
3277 goto out;
3278 }
3279 }
3280 ret = do_set_bytes(fs, coll, ghobj, fd, *osr);
3281 if (fd != STDIN_FILENO)
3282 close(fd);
3283 }
3284 goto out;
3285 } else if (objcmd == "get-attr") {
3286 if (vm.count("arg1") == 0) {
3287 usage(desc);
3288 ret = 1;
3289 goto out;
3290 }
3291 ret = do_get_attr(fs, coll, ghobj, arg1);
3292 goto out;
3293 } else if (objcmd == "set-attr") {
3294 if (vm.count("arg1") == 0) {
3295 usage(desc);
3296 ret = 1;
3297 }
3298
3299 int fd;
3300 if (vm.count("arg2") == 0 || arg2 == "-") {
3301 // Since read_fd() doesn't handle ^D from a tty stdin, don't allow it.
3302 if (isatty(STDIN_FILENO)) {
3303 cerr << "stdin is a tty and no file specified" << std::endl;
3304 ret = 1;
3305 goto out;
3306 }
3307 fd = STDIN_FILENO;
3308 } else {
3309 fd = open(arg2.c_str(), O_RDONLY|O_LARGEFILE, 0666);
3310 if (fd == -1) {
3311 cerr << "open " << arg2 << " " << cpp_strerror(errno) << std::endl;
3312 ret = 1;
3313 goto out;
3314 }
3315 }
3316 ret = do_set_attr(fs, coll, ghobj, arg1, fd, *osr);
3317 if (fd != STDIN_FILENO)
3318 close(fd);
3319 goto out;
3320 } else if (objcmd == "rm-attr") {
3321 if (vm.count("arg1") == 0) {
3322 usage(desc);
3323 ret = 1;
3324 goto out;
3325 }
3326 ret = do_rm_attr(fs, coll, ghobj, arg1, *osr);
3327 goto out;
3328 } else if (objcmd == "get-omap") {
3329 if (vm.count("arg1") == 0) {
3330 usage(desc);
3331 ret = 1;
3332 goto out;
3333 }
3334 ret = do_get_omap(fs, coll, ghobj, arg1);
3335 goto out;
3336 } else if (objcmd == "set-omap") {
3337 if (vm.count("arg1") == 0) {
3338 usage(desc);
3339 ret = 1;
3340 goto out;
3341 }
3342 int fd;
3343 if (vm.count("arg2") == 0 || arg2 == "-") {
3344 // Since read_fd() doesn't handle ^D from a tty stdin, don't allow it.
3345 if (isatty(STDIN_FILENO)) {
3346 cerr << "stdin is a tty and no file specified" << std::endl;
3347 ret = 1;
3348 goto out;
3349 }
3350 fd = STDIN_FILENO;
3351 } else {
3352 fd = open(arg2.c_str(), O_RDONLY|O_LARGEFILE, 0666);
3353 if (fd == -1) {
3354 cerr << "open " << arg2 << " " << cpp_strerror(errno) << std::endl;
3355 ret = 1;
3356 goto out;
3357 }
3358 }
3359 ret = do_set_omap(fs, coll, ghobj, arg1, fd, *osr);
3360 if (fd != STDIN_FILENO)
3361 close(fd);
3362 goto out;
3363 } else if (objcmd == "rm-omap") {
3364 if (vm.count("arg1") == 0) {
3365 usage(desc);
3366 ret = 1;
3367 goto out;
3368 }
3369 ret = do_rm_omap(fs, coll, ghobj, arg1, *osr);
3370 goto out;
3371 } else if (objcmd == "get-omaphdr") {
3372 if (vm.count("arg1")) {
3373 usage(desc);
3374 ret = 1;
3375 goto out;
3376 }
3377 ret = do_get_omaphdr(fs, coll, ghobj);
3378 goto out;
3379 } else if (objcmd == "set-omaphdr") {
3380 // Extra arg
3381 if (vm.count("arg2")) {
3382 usage(desc);
3383 ret = 1;
3384 goto out;
3385 }
3386 int fd;
3387 if (vm.count("arg1") == 0 || arg1 == "-") {
3388 // Since read_fd() doesn't handle ^D from a tty stdin, don't allow it.
3389 if (isatty(STDIN_FILENO)) {
3390 cerr << "stdin is a tty and no file specified" << std::endl;
3391 ret = 1;
3392 goto out;
3393 }
3394 fd = STDIN_FILENO;
3395 } else {
3396 fd = open(arg1.c_str(), O_RDONLY|O_LARGEFILE, 0666);
3397 if (fd == -1) {
3398 cerr << "open " << arg1 << " " << cpp_strerror(errno) << std::endl;
3399 ret = 1;
3400 goto out;
3401 }
3402 }
3403 ret = do_set_omaphdr(fs, coll, ghobj, fd, *osr);
3404 if (fd != STDIN_FILENO)
3405 close(fd);
3406 goto out;
3407 } else if (objcmd == "dump") {
3408 // There should not be any other arguments
3409 if (vm.count("arg1") || vm.count("arg2")) {
3410 usage(desc);
3411 ret = 1;
3412 goto out;
3413 }
3414 ret = print_obj_info(fs, coll, ghobj, formatter);
3415 goto out;
3416 } else if (objcmd == "set-size") {
3417 // Extra arg
3418 if (vm.count("arg1") == 0 || vm.count("arg2")) {
3419 usage(desc);
3420 ret = 1;
3421 goto out;
3422 }
3423 if (arg1.length() == 0 || !isdigit(arg1.c_str()[0])) {
3424 cerr << "Invalid size '" << arg1 << "' specified" << std::endl;
3425 ret = 1;
3426 goto out;
3427 }
3428 uint64_t size = atoll(arg1.c_str());
3429 ret = set_size(fs, coll, ghobj, size, formatter, *osr);
3430 goto out;
3431 } else if (objcmd == "clear-snapset") {
3432 // UNDOCUMENTED: For testing zap SnapSet
3433 // IGNORE extra args since not in usage anyway
3434 if (!ghobj.hobj.has_snapset()) {
3435 cerr << "'" << objcmd << "' requires a head or snapdir object" << std::endl;
3436 ret = 1;
3437 goto out;
3438 }
3439 ret = clear_snapset(fs, coll, ghobj, arg1, *osr);
3440 goto out;
3441 } else if (objcmd == "remove-clone-metadata") {
3442 // Extra arg
3443 if (vm.count("arg1") == 0 || vm.count("arg2")) {
3444 usage(desc);
3445 ret = 1;
3446 goto out;
3447 }
3448 if (!ghobj.hobj.has_snapset()) {
3449 cerr << "'" << objcmd << "' requires a head or snapdir object" << std::endl;
3450 ret = 1;
3451 goto out;
3452 }
3453 if (arg1.length() == 0 || !isdigit(arg1.c_str()[0])) {
3454 cerr << "Invalid cloneid '" << arg1 << "' specified" << std::endl;
3455 ret = 1;
3456 goto out;
3457 }
3458 snapid_t cloneid = atoi(arg1.c_str());
3459 ret = remove_clone(fs, coll, ghobj, cloneid, force, *osr);
3460 goto out;
3461 }
3462 cerr << "Unknown object command '" << objcmd << "'" << std::endl;
3463 usage(desc);
3464 ret = 1;
3465 goto out;
3466 }
3467
3468 bufferlist bl;
3469 map_epoch = 0;
3470 ret = PG::peek_map_epoch(fs, pgid, &map_epoch, &bl);
3471 if (ret < 0)
3472 cerr << "peek_map_epoch reports error" << std::endl;
3473 if (debug)
3474 cerr << "map_epoch " << map_epoch << std::endl;
3475
3476 pg_info_t info(pgid);
3477 PastIntervals past_intervals;
3478 __u8 struct_ver;
3479 ret = PG::read_info(fs, pgid, coll, bl, info, past_intervals,
3480 struct_ver);
3481 if (ret < 0) {
3482 cerr << "read_info error " << cpp_strerror(ret) << std::endl;
3483 goto out;
3484 }
3485 if (struct_ver < PG::compat_struct_v) {
3486 cerr << "PG is too old to upgrade, use older Ceph version" << std::endl;
3487 ret = -EFAULT;
3488 goto out;
3489 }
3490 if (debug)
3491 cerr << "struct_v " << (int)struct_ver << std::endl;
3492
3493 if (op == "export") {
3494 ret = tool.do_export(fs, coll, pgid, info, map_epoch, struct_ver, superblock, past_intervals);
3495 if (ret == 0)
3496 cerr << "Export successful" << std::endl;
3497 } else if (op == "info") {
3498 formatter->open_object_section("info");
3499 info.dump(formatter);
3500 formatter->close_section();
3501 formatter->flush(cout);
3502 cout << std::endl;
3503 } else if (op == "log") {
3504 PGLog::IndexedLog log;
3505 pg_missing_t missing;
3506 ret = get_log(fs, struct_ver, coll, pgid, info, log, missing);
3507 if (ret < 0)
3508 goto out;
3509
3510 dump_log(formatter, cout, log, missing);
3511 } else if (op == "rm-past-intervals") {
3512 ObjectStore::Transaction tran;
3513 ObjectStore::Transaction *t = &tran;
3514
3515 if (struct_ver < PG::compat_struct_v) {
3516 cerr << "Can't remove past-intervals, version mismatch " << (int)struct_ver
3517 << " (pg) < compat " << (int)PG::compat_struct_v << " (tool)"
3518 << std::endl;
3519 ret = -EFAULT;
3520 goto out;
3521 }
3522
3523 cout << "Remove past-intervals " << past_intervals << std::endl;
3524
3525 past_intervals.clear();
3526 if (dry_run) {
3527 ret = 0;
3528 goto out;
3529 }
3530 ret = write_info(*t, map_epoch, info, past_intervals);
3531
3532 if (ret == 0) {
3533 fs->apply_transaction(osr, std::move(*t));
3534 cout << "Removal succeeded" << std::endl;
3535 }
3536 } else if (op == "mark-complete") {
3537 ObjectStore::Transaction tran;
3538 ObjectStore::Transaction *t = &tran;
3539
3540 if (struct_ver < PG::compat_struct_v) {
3541 cerr << "Can't mark-complete, version mismatch " << (int)struct_ver
3542 << " (pg) < compat " << (int)PG::compat_struct_v << " (tool)"
3543 << std::endl;
3544 ret = 1;
3545 goto out;
3546 }
3547
3548 cout << "Marking complete " << std::endl;
3549
3550 info.last_update = eversion_t(superblock.current_epoch, info.last_update.version + 1);
3551 info.last_backfill = hobject_t::get_max();
3552 info.last_epoch_started = superblock.current_epoch;
3553 info.history.last_epoch_started = superblock.current_epoch;
3554 info.history.last_epoch_clean = superblock.current_epoch;
3555 past_intervals.clear();
3556
3557 if (!dry_run) {
3558 ret = write_info(*t, map_epoch, info, past_intervals);
3559 if (ret != 0)
3560 goto out;
3561 fs->apply_transaction(osr, std::move(*t));
3562 }
3563 cout << "Marking complete succeeded" << std::endl;
3564 } else {
3565 assert(!"Should have already checked for valid --op");
3566 }
3567 } else {
3568 cerr << "PG '" << pgid << "' not found" << std::endl;
3569 ret = -ENOENT;
3570 }
3571
3572 out:
3573 int r = fs->umount();
3574 delete osr;
3575 if (r < 0) {
3576 cerr << "umount failed: " << cpp_strerror(r) << std::endl;
3577 // If no previous error, then use umount() error
3578 if (ret == 0)
3579 ret = r;
3580 }
3581
3582 if (dry_run) {
3583 // Export output can go to stdout, so put this message on stderr
3584 if (op == "export")
3585 cerr << "dry-run: Nothing changed" << std::endl;
3586 else
3587 cout << "dry-run: Nothing changed" << std::endl;
3588 }
3589
3590 if (ret < 0)
3591 ret = 1;
3592 return ret;
3593 }