#include "SnapMapper.h"
+#include <fmt/printf.h>
+#include <fmt/ranges.h>
+
+#include "global/global_context.h"
+#include "osd/osd_types_fmt.h"
+#include "SnapMapReaderI.h"
+
#define dout_context cct
#define dout_subsys ceph_subsys_osd
#undef dout_prefix
using std::string;
using std::vector;
-using ceph::bufferlist;
using ceph::decode;
using ceph::encode;
using ceph::timespan_str;
+using result_t = Scrub::SnapMapReaderI::result_t;
+using code_t = Scrub::SnapMapReaderI::result_t::code_t;
+
const string SnapMapper::LEGACY_MAPPING_PREFIX = "MAP_";
const string SnapMapper::MAPPING_PREFIX = "SNA_";
*/
+#ifdef WITH_SEASTAR
+#include "crimson/common/log.h"
+#include "crimson/osd/pg_interval_interrupt_condition.h"
+ template <typename ValuesT = void>
+ using interruptible_future =
+ ::crimson::interruptible::interruptible_future<
+ ::crimson::osd::IOInterruptCondition, ValuesT>;
+ using interruptor =
+ ::crimson::interruptible::interruptor<
+ ::crimson::osd::IOInterruptCondition>;
+
+#define CRIMSON_DEBUG(FMT_MSG, ...) crimson::get_logger(ceph_subsys_).debug(FMT_MSG, ##__VA_ARGS__)
int OSDriver::get_keys(
const std::set<std::string> &keys,
- std::map<std::string, bufferlist> *out)
+ std::map<std::string, ceph::buffer::list> *out)
+{
+ CRIMSON_DEBUG("OSDriver::{}:{}", __func__, __LINE__);
+ using crimson::os::FuturizedStore;
+ return interruptor::green_get(os->omap_get_values(
+ ch, hoid, keys
+ ).safe_then([out] (FuturizedStore::Shard::omap_values_t&& vals) {
+ // just the difference in comparator (`std::less<>` in omap_values_t`)
+ reinterpret_cast<FuturizedStore::Shard::omap_values_t&>(*out) = std::move(vals);
+ return 0;
+ }, FuturizedStore::Shard::read_errorator::all_same_way([] (auto& e) {
+ assert(e.value() > 0);
+ return -e.value();
+ }))); // this requires seastar::thread
+ CRIMSON_DEBUG("OSDriver::{}:{}", __func__, __LINE__);
+}
+
+int OSDriver::get_next(
+ const std::string &key,
+ std::pair<std::string, ceph::buffer::list> *next)
+{
+ CRIMSON_DEBUG("OSDriver::{}:{}", __func__, __LINE__);
+ using crimson::os::FuturizedStore;
+ return interruptor::green_get(os->omap_get_values(
+ ch, hoid, key
+ ).safe_then_unpack([&key, next] (bool, FuturizedStore::Shard::omap_values_t&& vals) {
+ CRIMSON_DEBUG("OSDriver::{}:{}", "get_next", __LINE__);
+ if (auto nit = std::begin(vals); nit == std::end(vals)) {
+ CRIMSON_DEBUG("OSDriver::{}:{}", "get_next", __LINE__);
+ return -ENOENT;
+ } else {
+ CRIMSON_DEBUG("OSDriver::{}:{}", "get_next", __LINE__);
+ assert(nit->first > key);
+ *next = *nit;
+ return 0;
+ }
+ }, FuturizedStore::Shard::read_errorator::all_same_way([] {
+ CRIMSON_DEBUG("OSDriver::{}:{}", "get_next", __LINE__);
+ return -EINVAL;
+ }))); // this requires seastar::thread
+ CRIMSON_DEBUG("OSDriver::{}:{}", __func__, __LINE__);
+}
+
+int OSDriver::get_next_or_current(
+ const std::string &key,
+ std::pair<std::string, ceph::buffer::list> *next_or_current)
+{
+ CRIMSON_DEBUG("OSDriver::{}:{}", __func__, __LINE__);
+ using crimson::os::FuturizedStore;
+ // let's try to get current first
+ return interruptor::green_get(os->omap_get_values(
+ ch, hoid, FuturizedStore::Shard::omap_keys_t{key}
+ ).safe_then([&key, next_or_current] (FuturizedStore::Shard::omap_values_t&& vals) {
+ assert(vals.size() == 1);
+ *next_or_current = std::make_pair(key, std::move(vals[0]));
+ return 0;
+ }, FuturizedStore::Shard::read_errorator::all_same_way(
+ [next_or_current, &key, this] {
+ // no current, try next
+ return get_next(key, next_or_current);
+ }))); // this requires seastar::thread
+ CRIMSON_DEBUG("OSDriver::{}:{}", __func__, __LINE__);
+}
+#else
+int OSDriver::get_keys(
+ const std::set<std::string> &keys,
+ std::map<std::string, ceph::buffer::list> *out)
{
return os->omap_get_values(ch, hoid, keys, out);
}
int OSDriver::get_next(
const std::string &key,
- pair<std::string, bufferlist> *next)
+ std::pair<std::string, ceph::buffer::list> *next)
{
ObjectMap::ObjectMapIterator iter =
os->get_omap_iterator(ch, hoid);
}
}
+int OSDriver::get_next_or_current(
+ const std::string &key,
+ std::pair<std::string, ceph::buffer::list> *next_or_current)
+{
+ ObjectMap::ObjectMapIterator iter =
+ os->get_omap_iterator(ch, hoid);
+ if (!iter) {
+ ceph_abort();
+ return -EINVAL;
+ }
+ iter->lower_bound(key);
+ if (iter->valid()) {
+ if (next_or_current)
+ *next_or_current = make_pair(iter->key(), iter->value());
+ return 0;
+ } else {
+ return -ENOENT;
+ }
+}
+#endif // WITH_SEASTAR
+
string SnapMapper::get_prefix(int64_t pool, snapid_t snap)
{
- char buf[100];
- int len = snprintf(
- buf, sizeof(buf),
- "%lld_%.*X_",
- (long long)pool,
- (int)(sizeof(snap)*2), static_cast<unsigned>(snap));
- return MAPPING_PREFIX + string(buf, len);
+ static_assert(sizeof(pool) == 8, "assumed by the formatting code");
+ return fmt::sprintf("%s%lld_%.16X_",
+ MAPPING_PREFIX,
+ pool,
+ snap);
}
string SnapMapper::to_raw_key(
- const pair<snapid_t, hobject_t> &in)
+ const pair<snapid_t, hobject_t> &in) const
{
return get_prefix(in.second.pool, in.first) + shard_prefix + in.second.to_str();
}
-pair<string, bufferlist> SnapMapper::to_raw(
- const pair<snapid_t, hobject_t> &in)
+std::string SnapMapper::to_raw_key(snapid_t snap, const hobject_t &clone) const
{
- bufferlist bl;
+ return get_prefix(clone.pool, snap) + shard_prefix + clone.to_str();
+}
+
+pair<string, ceph::buffer::list> SnapMapper::to_raw(
+ const pair<snapid_t, hobject_t> &in) const
+{
+ ceph::buffer::list bl;
encode(Mapping(in), bl);
- return make_pair(
- to_raw_key(in),
- bl);
+ return make_pair(to_raw_key(in), bl);
}
pair<snapid_t, hobject_t> SnapMapper::from_raw(
- const pair<std::string, bufferlist> &image)
+ const pair<std::string, ceph::buffer::list> &image)
{
using ceph::decode;
Mapping map;
- bufferlist bl(image.second);
+ ceph::buffer::list bl(image.second);
auto bp = bl.cbegin();
decode(map, bp);
return make_pair(map.snap, map.hoid);
}
+std::pair<snapid_t, hobject_t> SnapMapper::from_raw(
+ const ceph::buffer::list &image)
+{
+ using ceph::decode;
+ Mapping map;
+ auto bp = image.cbegin();
+ decode(map, bp);
+ return make_pair(map.snap, map.hoid);
+}
+
bool SnapMapper::is_mapping(const string &to_test)
{
return to_test.substr(0, MAPPING_PREFIX.size()) == MAPPING_PREFIX;
}
-string SnapMapper::to_object_key(const hobject_t &hoid)
+string SnapMapper::to_object_key(const hobject_t &hoid) const
{
return OBJECT_PREFIX + shard_prefix + hoid.to_str();
}
-void SnapMapper::object_snaps::encode(bufferlist &bl) const
+void SnapMapper::object_snaps::encode(ceph::buffer::list &bl) const
{
ENCODE_START(1, 1, bl);
encode(oid, bl);
ENCODE_FINISH(bl);
}
-void SnapMapper::object_snaps::decode(bufferlist::const_iterator &bl)
+void SnapMapper::object_snaps::decode(ceph::buffer::list::const_iterator &bl)
{
DECODE_START(1, bl);
decode(oid, bl);
return false;
}
-int SnapMapper::get_snaps(
- const hobject_t &oid,
- object_snaps *out)
+int SnapMapper::get_snaps(const hobject_t &oid, object_snaps *out) const
+{
+ auto snaps = get_snaps_common(oid);
+ if (snaps) {
+ *out = *snaps;
+ return 0;
+ }
+ switch (auto e = snaps.error(); e.code) {
+ case code_t::backend_error:
+ return e.backend_error;
+ case code_t::not_found:
+ return -ENOENT;
+ case code_t::inconsistent:
+ // As this is a legacy interface, we cannot surprise the user with
+ // a new error code here.
+ return -ENOENT;
+ default:
+ // Can't happen. Just to keep the compiler happy.
+ ceph_abort("get_snaps_common() returned invalid error code");
+ }
+}
+
+tl::expected<std::set<snapid_t>, Scrub::SnapMapReaderI::result_t>
+SnapMapper::get_snaps(const hobject_t &oid) const
+{
+ auto snaps = get_snaps_common(oid);
+ if (snaps) {
+ return snaps->snaps;
+ }
+ return tl::unexpected(snaps.error());
+}
+
+tl::expected<SnapMapper::object_snaps, Scrub::SnapMapReaderI::result_t>
+SnapMapper::get_snaps_common(const hobject_t &oid) const
{
ceph_assert(check(oid));
- set<string> keys;
- map<string, bufferlist> got;
- keys.insert(to_object_key(oid));
+ set<string> keys{to_object_key(oid)};
+ dout(20) << fmt::format("{}: key string: {} oid:{}", __func__, keys, oid)
+ << dendl;
+
+ map<string, ceph::buffer::list> got;
int r = backend.get_keys(keys, &got);
if (r < 0) {
- dout(20) << __func__ << " " << oid << " got err " << r << dendl;
- return r;
+ dout(10) << __func__ << " " << oid << " got err " << r << dendl;
+ return tl::unexpected(result_t{code_t::backend_error, r});
}
if (got.empty()) {
- dout(20) << __func__ << " " << oid << " got.empty()" << dendl;
- return -ENOENT;
+ dout(10) << __func__ << " " << oid << " got.empty()" << dendl;
+ return tl::unexpected(result_t{code_t::not_found, -ENOENT});
}
- if (out) {
- auto bp = got.begin()->second.cbegin();
- decode(*out, bp);
- dout(20) << __func__ << " " << oid << " " << out->snaps << dendl;
- if (out->snaps.empty()) {
- dout(1) << __func__ << " " << oid << " empty snapset" << dendl;
- ceph_assert(!cct->_conf->osd_debug_verify_snaps);
+
+ object_snaps out;
+ auto bp = got.begin()->second.cbegin();
+ try {
+ decode(out, bp);
+ } catch (...) {
+ dout(1) << __func__ << ": " << oid << " decode failed" << dendl;
+ return tl::unexpected(result_t{code_t::backend_error, -EIO});
+ }
+
+ dout(20) << __func__ << " " << oid << " " << out.snaps << dendl;
+ if (out.snaps.empty()) {
+ dout(1) << __func__ << " " << oid << " empty snapset" << dendl;
+ ceph_assert(!cct->_conf->osd_debug_verify_snaps);
+ }
+ return out;
+}
+
+std::set<std::string> SnapMapper::to_raw_keys(
+ const hobject_t &clone,
+ const std::set<snapid_t> &snaps) const
+{
+ std::set<std::string> keys;
+ for (auto snap : snaps) {
+ keys.insert(to_raw_key(snap, clone));
+ }
+ dout(20) << fmt::format(
+ "{}: clone:{} snaps:{} -> keys: {}", __func__, clone, snaps,
+ keys)
+ << dendl;
+ return keys;
+}
+
+tl::expected<std::set<snapid_t>, result_t>
+SnapMapper::get_snaps_check_consistency(const hobject_t &hoid) const
+{
+ // derive the set of snaps from the 'OBJ_' entry
+ auto obj_snaps = get_snaps(hoid);
+ if (!obj_snaps) {
+ return obj_snaps;
+ }
+
+ // make sure we have the expected set of SNA_ entries:
+ // we have the clone oid and the set of snaps relevant to this clone.
+ // Let's construct all expected SNA_ key, then fetch them.
+
+ auto mapping_keys = to_raw_keys(hoid, *obj_snaps);
+ map<string, ceph::buffer::list> kvmap;
+ auto r = backend.get_keys(mapping_keys, &kvmap);
+ if (r < 0) {
+ dout(10) << fmt::format(
+ "{}: backend error ({}) for cobject {}", __func__, r, hoid)
+ << dendl;
+ // that's a backend error, but for the SNA_ entries. Let's treat it as an
+ // internal consistency error (although a backend error would have made
+ // sense too).
+ return tl::unexpected(result_t{code_t::inconsistent, r});
+ }
+
+ std::set<snapid_t> snaps_from_mapping;
+ for (auto &[k, v] : kvmap) {
+ dout(20) << __func__ << " " << hoid << " " << k << dendl;
+ // extract the object ID from the value fetched for an SNA mapping key
+ auto [sn, obj] = SnapMapper::from_raw(v);
+ if (obj != hoid) {
+ dout(1) << fmt::format(
+ "{}: unexpected object ID {} for key{} (expected {})",
+ __func__, obj, k, hoid)
+ << dendl;
+ return tl::unexpected(result_t{code_t::inconsistent});
}
- } else {
- dout(20) << __func__ << " " << oid << " (out == NULL)" << dendl;
+ snaps_from_mapping.insert(sn);
}
- return 0;
+
+ if (snaps_from_mapping != *obj_snaps) {
+ dout(10) << fmt::format(
+ "{}: hoid:{} -> mapper internal inconsistency ({} vs {})",
+ __func__, hoid, *obj_snaps, snaps_from_mapping)
+ << dendl;
+ return tl::unexpected(result_t{code_t::inconsistent});
+ }
+ dout(10) << fmt::format(
+ "{}: snaps for {}: {}", __func__, hoid, snaps_from_mapping)
+ << dendl;
+ return obj_snaps;
}
void SnapMapper::clear_snaps(
const hobject_t &oid,
- MapCacher::Transaction<std::string, bufferlist> *t)
+ MapCacher::Transaction<std::string, ceph::buffer::list> *t)
{
dout(20) << __func__ << " " << oid << dendl;
ceph_assert(check(oid));
void SnapMapper::set_snaps(
const hobject_t &oid,
const object_snaps &in,
- MapCacher::Transaction<std::string, bufferlist> *t)
+ MapCacher::Transaction<std::string, ceph::buffer::list> *t)
{
ceph_assert(check(oid));
- map<string, bufferlist> to_set;
- bufferlist bl;
+ map<string, ceph::buffer::list> to_set;
+ ceph::buffer::list bl;
encode(in, bl);
to_set[to_object_key(oid)] = bl;
dout(20) << __func__ << " " << oid << " " << in.snaps << dendl;
const hobject_t &oid,
const set<snapid_t> &new_snaps,
const set<snapid_t> *old_snaps_check,
- MapCacher::Transaction<std::string, bufferlist> *t)
+ MapCacher::Transaction<std::string, ceph::buffer::list> *t)
{
dout(20) << __func__ << " " << oid << " " << new_snaps
<< " was " << (old_snaps_check ? *old_snaps_check : set<snapid_t>())
void SnapMapper::add_oid(
const hobject_t &oid,
const set<snapid_t>& snaps,
- MapCacher::Transaction<std::string, bufferlist> *t)
+ MapCacher::Transaction<std::string, ceph::buffer::list> *t)
{
dout(20) << __func__ << " " << oid << " " << snaps << dendl;
ceph_assert(!snaps.empty());
object_snaps _snaps(oid, snaps);
set_snaps(oid, _snaps, t);
- map<string, bufferlist> to_add;
+ map<string, ceph::buffer::list> to_add;
for (set<snapid_t>::iterator i = snaps.begin();
i != snaps.end();
++i) {
// trim the snaptrim queue
ceph_assert(max > 0);
int r = 0;
+
+ /// \todo cache the prefixes-set in update_bits()
for (set<string>::iterator i = prefixes.begin();
i != prefixes.end() && out->size() < max && r == 0;
++i) {
string prefix(get_prefix(pool, snap) + *i);
string pos = prefix;
while (out->size() < max) {
- pair<string, bufferlist> next;
+ pair<string, ceph::buffer::list> next;
r = backend.get_next(pos, &next);
dout(20) << __func__ << " get_next(" << pos << ") returns " << r
<< " " << next << dendl;
int SnapMapper::remove_oid(
const hobject_t &oid,
- MapCacher::Transaction<std::string, bufferlist> *t)
+ MapCacher::Transaction<std::string, ceph::buffer::list> *t)
{
dout(20) << __func__ << " " << oid << dendl;
ceph_assert(check(oid));
int SnapMapper::_remove_oid(
const hobject_t &oid,
- MapCacher::Transaction<std::string, bufferlist> *t)
+ MapCacher::Transaction<std::string, ceph::buffer::list> *t)
{
dout(20) << __func__ << " " << oid << dendl;
object_snaps out;
int SnapMapper::get_snaps(
const hobject_t &oid,
- std::set<snapid_t> *snaps)
+ std::set<snapid_t> *snaps) const
{
ceph_assert(check(oid));
object_snaps out;
string SnapMapper::make_purged_snap_key(int64_t pool, snapid_t last)
{
- char k[80];
- snprintf(k, sizeof(k), "%s_%llu_%016llx", PURGED_SNAP_PREFIX,
- (unsigned long long)pool, (unsigned long long)last);
- return k;
+ return fmt::sprintf("%s_%lld_%016llx",
+ PURGED_SNAP_PREFIX,
+ pool,
+ last);
}
void SnapMapper::make_purged_snap_key_value(
- int64_t pool, snapid_t begin, snapid_t end, map<string,bufferlist> *m)
+ int64_t pool, snapid_t begin, snapid_t end, map<string,ceph::buffer::list> *m)
{
string k = make_purged_snap_key(pool, end - 1);
auto& v = (*m)[k];
int SnapMapper::_lookup_purged_snap(
CephContext *cct,
- ObjectStore *store,
- ObjectStore::CollectionHandle& ch,
- const ghobject_t& hoid,
+ OSDriver& backend,
int64_t pool, snapid_t snap,
snapid_t *begin, snapid_t *end)
{
string k = make_purged_snap_key(pool, snap);
- auto it = store->get_omap_iterator(ch, hoid);
- it->lower_bound(k);
- if (!it->valid()) {
+ std::pair<std::string, ceph::buffer::list> kv;
+ if (auto ret = backend.get_next_or_current(k, &kv); ret == -ENOENT) {
dout(20) << __func__ << " pool " << pool << " snap " << snap
<< " key '" << k << "' lower_bound not found" << dendl;
return -ENOENT;
}
- if (it->key().find(PURGED_SNAP_PREFIX) != 0) {
+ if (kv.first.find(PURGED_SNAP_PREFIX) != 0) {
dout(20) << __func__ << " pool " << pool << " snap " << snap
<< " key '" << k << "' lower_bound got mismatched prefix '"
- << it->key() << "'" << dendl;
+ << kv.first << "'" << dendl;
return -ENOENT;
}
- bufferlist v = it->value();
+ ceph::buffer::list v = kv.second;
auto p = v.cbegin();
int64_t gotpool;
decode(gotpool, p);
void SnapMapper::record_purged_snaps(
CephContext *cct,
- ObjectStore *store,
- ObjectStore::CollectionHandle& ch,
- ghobject_t hoid,
- ObjectStore::Transaction *t,
+ OSDriver& backend,
+ OSDriver::OSTransaction&& txn,
map<epoch_t,mempool::osdmap::map<int64_t,snap_interval_set_t>> purged_snaps)
{
dout(10) << __func__ << " purged_snaps " << purged_snaps << dendl;
- map<string,bufferlist> m;
+ map<string,ceph::buffer::list> m;
set<string> rm;
for (auto& [epoch, bypool] : purged_snaps) {
// index by (pool, snap)
snapid_t end = i.get_end();
snapid_t before_begin, before_end;
snapid_t after_begin, after_end;
- int b = _lookup_purged_snap(cct, store, ch, hoid,
+ int b = _lookup_purged_snap(cct, backend,
pool, begin - 1, &before_begin, &before_end);
- int a = _lookup_purged_snap(cct, store, ch, hoid,
+ int a = _lookup_purged_snap(cct, backend,
pool, end, &after_begin, &after_end);
if (!b && !a) {
dout(10) << __func__
}
}
}
- t->omap_rmkeys(ch->cid, hoid, rm);
- t->omap_setkeys(ch->cid, hoid, m);
+ txn.remove_keys(rm);
+ txn.set_keys(m);
dout(10) << __func__ << " rm " << rm.size() << " keys, set " << m.size()
<< " keys" << dendl;
}
+#ifndef WITH_SEASTAR
bool SnapMapper::Scrubber::_parse_p()
{
if (!psit->valid()) {
pool = -1;
return false;
}
- bufferlist v = psit->value();
+ ceph::buffer::list v = psit->value();
auto p = v.cbegin();
ceph::decode(pool, p);
ceph::decode(begin, p);
psit = ObjectMap::ObjectMapIterator();
mapit = ObjectMap::ObjectMapIterator();
}
+#endif // !WITH_SEASTAR
// -------------------------------------
string SnapMapper::get_legacy_prefix(snapid_t snap)
{
- char buf[100];
- int len = snprintf(
- buf, sizeof(buf),
- "%.*X_",
- (int)(sizeof(snap)*2), static_cast<unsigned>(snap));
- return LEGACY_MAPPING_PREFIX + string(buf, len);
+ return fmt::sprintf("%s%.16X_",
+ LEGACY_MAPPING_PREFIX,
+ snap);
}
string SnapMapper::to_legacy_raw_key(
LEGACY_MAPPING_PREFIX;
}
+#ifndef WITH_SEASTAR
/* Octopus modified the SnapMapper key format from
*
* <LEGACY_MAPPING_PREFIX><snapid>_<shardid>_<hobject_t::to_str()>
*/
std::string SnapMapper::convert_legacy_key(
const std::string& old_key,
- const bufferlist& value)
+ const ceph::buffer::list& value)
{
auto old = from_raw(make_pair(old_key, value));
std::string object_suffix = old_key.substr(
auto start = ceph::mono_clock::now();
iter->upper_bound(SnapMapper::LEGACY_MAPPING_PREFIX);
- map<string,bufferlist> to_set;
+ map<string,ceph::buffer::list> to_set;
while (iter->valid()) {
bool valid = SnapMapper::is_legacy_mapping(iter->key());
if (valid) {
}
return 0;
}
+#endif // !WITH_SEASTAR