// -*- mode:C++; tab-width:8; c-basic-offset:2; indent-tabs-mode:t -*- // vim: ts=8 sw=2 smarttab ft=cpp /* * Ceph - scalable distributed file system * * Copyright (C) 2020 Red Hat, Inc. * * This is free software; you can redistribute it and/or * modify it under the terms of the GNU Lesser General Public * License version 2.1, as published by the Free Software * Foundation. See file COPYING. * */ #include #include "common/errno.h" #include "rgw_sync_checkpoint.h" #include "rgw_sal_rados.h" #include "rgw_bucket_sync.h" #include "rgw_data_sync.h" #include "rgw_http_errors.h" #include "cls/rgw/cls_rgw_client.h" #include "services/svc_sys_obj.h" #include "services/svc_zone.h" #include "rgw_zone.h" #define dout_subsys ceph_subsys_rgw namespace { std::string incremental_marker(const rgw_bucket_shard_sync_info& info) { if (info.state != rgw_bucket_shard_sync_info::StateIncrementalSync) { return ""; } return BucketIndexShardsManager::get_shard_marker(info.inc_marker.position); } bool operator<(const std::vector& lhs, const BucketIndexShardsManager& rhs) { for (size_t i = 0; i < lhs.size(); ++i) { const auto& l = incremental_marker(lhs[i]); const auto& r = rhs.get(i, ""); if (l < r) { return true; } } return false; } bool empty(const BucketIndexShardsManager& markers, int size) { for (int i = 0; i < size; ++i) { const auto& m = markers.get(i, ""); if (!m.empty()) { return false; } } return true; } std::ostream& operator<<(std::ostream& out, const std::vector& rhs) { const char* separator = ""; // first entry has no comma out << '['; for (auto& i : rhs) { out << std::exchange(separator, ", ") << incremental_marker(i); } return out << ']'; } std::ostream& operator<<(std::ostream& out, const BucketIndexShardsManager& rhs) { out << '['; const char* separator = ""; // first entry has no comma for (auto& [i, marker] : rhs.get()) { out << std::exchange(separator, ", ") << marker; } return out << ']'; } int bucket_source_sync_checkpoint(const DoutPrefixProvider* dpp, rgw::sal::RGWRadosStore *store, const RGWBucketInfo& bucket_info, const RGWBucketInfo& source_bucket_info, const rgw_sync_bucket_pipe& pipe, const BucketIndexShardsManager& remote_markers, ceph::timespan retry_delay, ceph::coarse_mono_time timeout_at) { const auto num_shards = source_bucket_info.layout.current_index.layout.normal.num_shards; if (empty(remote_markers, num_shards)) { ldpp_dout(dpp, 1) << "bucket sync caught up with empty source" << dendl; return 0; } std::vector status; status.resize(std::max(1, num_shards)); int r = rgw_bucket_sync_status(dpp, store, pipe, bucket_info, &source_bucket_info, &status); if (r < 0) { return r; } while (status < remote_markers) { auto delay_until = ceph::coarse_mono_clock::now() + retry_delay; if (delay_until > timeout_at) { ldpp_dout(dpp, 0) << "bucket checkpoint timed out waiting for incremental sync to catch up" << dendl; return -ETIMEDOUT; } ldpp_dout(dpp, 1) << "waiting for incremental sync to catch up:\n" << " local status: " << status << '\n' << " remote markers: " << remote_markers << dendl; std::this_thread::sleep_until(delay_until); r = rgw_bucket_sync_status(dpp, store, pipe, bucket_info, &source_bucket_info, &status); if (r < 0) { return r; } } ldpp_dout(dpp, 1) << "bucket sync caught up with source:\n" << " local status: " << status << '\n' << " remote markers: " << remote_markers << dendl; return 0; } int source_bilog_markers(const DoutPrefixProvider *dpp, RGWSI_Zone* zone_svc, const rgw_sync_bucket_pipe& pipe, BucketIndexShardsManager& remote_markers, optional_yield y) { ceph_assert(pipe.source.zone); auto& zone_conn_map = zone_svc->get_zone_conn_map(); auto conn = zone_conn_map.find(pipe.source.zone->id); if (conn == zone_conn_map.end()) { return -EINVAL; } return rgw_read_remote_bilog_info(dpp, conn->second, *pipe.source.bucket, remote_markers, y); } } // anonymous namespace int rgw_bucket_sync_checkpoint(const DoutPrefixProvider* dpp, rgw::sal::RGWRadosStore *store, const RGWBucketSyncPolicyHandler& policy, const RGWBucketInfo& info, std::optional opt_source_zone, std::optional opt_source_bucket, ceph::timespan retry_delay, ceph::coarse_mono_time timeout_at) { struct sync_source_entry { rgw_sync_bucket_pipe pipe; BucketIndexShardsManager remote_markers; RGWBucketInfo source_bucket_info; }; std::list sources; // fetch remote markers and bucket info in parallel boost::asio::io_context ioctx; for (const auto& [source_zone_id, pipe] : policy.get_all_sources()) { // filter by source zone/bucket if (opt_source_zone && *opt_source_zone != *pipe.source.zone) { continue; } if (opt_source_bucket && !opt_source_bucket->match(*pipe.source.bucket)) { continue; } auto& entry = sources.emplace_back(); entry.pipe = pipe; // fetch remote markers spawn::spawn(ioctx, [&] (yield_context yield) { auto y = optional_yield{ioctx, yield}; int r = source_bilog_markers(dpp, store->svc()->zone, entry.pipe, entry.remote_markers, y); if (r < 0) { ldpp_dout(dpp, 0) << "failed to fetch remote bilog markers: " << cpp_strerror(r) << dendl; throw std::system_error(-r, std::system_category()); } }); // fetch source bucket info spawn::spawn(ioctx, [&] (yield_context yield) { auto y = optional_yield{ioctx, yield}; auto obj_ctx = store->svc()->sysobj->init_obj_ctx(); int r = store->getRados()->get_bucket_instance_info( obj_ctx, *entry.pipe.source.bucket, entry.source_bucket_info, nullptr, nullptr, y, dpp); if (r < 0) { ldpp_dout(dpp, 0) << "failed to read source bucket info: " << cpp_strerror(r) << dendl; throw std::system_error(-r, std::system_category()); } }); } try { ioctx.run(); } catch (const std::system_error& e) { return -e.code().value(); } // checkpoint each source sequentially for (const auto& [pipe, remote_markers, source_bucket_info] : sources) { int r = bucket_source_sync_checkpoint(dpp, store, info, source_bucket_info, pipe, remote_markers, retry_delay, timeout_at); if (r < 0) { ldpp_dout(dpp, 0) << "bucket sync checkpoint failed: " << cpp_strerror(r) << dendl; return r; } } ldpp_dout(dpp, 0) << "bucket checkpoint complete" << dendl; return 0; }