// -*- mode:C++; tab-width:8; c-basic-offset:2; indent-tabs-mode:t -*- // vim: ts=8 sw=2 smarttab ft=cpp #ifndef CEPH_RGW_DATA_SYNC_H #define CEPH_RGW_DATA_SYNC_H #include "include/encoding.h" #include "common/RWLock.h" #include "common/ceph_json.h" #include "rgw_coroutine.h" #include "rgw_http_client.h" #include "rgw_sal.h" #include "rgw_datalog.h" #include "rgw_sync_module.h" #include "rgw_sync_trace.h" #include "rgw_sync_policy.h" #include "rgw_bucket_sync.h" // represents an obligation to sync an entry up a given time struct rgw_data_sync_obligation { std::string key; std::string marker; ceph::real_time timestamp; bool retry = false; }; inline std::ostream& operator<<(std::ostream& out, const rgw_data_sync_obligation& o) { out << "key=" << o.key; if (!o.marker.empty()) { out << " marker=" << o.marker; } if (o.timestamp != ceph::real_time{}) { out << " timestamp=" << o.timestamp; } if (o.retry) { out << " retry"; } return out; } class JSONObj; struct rgw_sync_bucket_pipe; struct rgw_bucket_sync_pair_info { RGWBucketSyncFlowManager::pipe_handler handler; /* responsible for sync filters */ rgw_bucket_shard source_bs; rgw_bucket_shard dest_bs; }; inline ostream& operator<<(ostream& out, const rgw_bucket_sync_pair_info& p) { if (p.source_bs.bucket == p.dest_bs.bucket) { return out << p.source_bs; } out << p.source_bs; out << "->" << p.dest_bs.bucket; return out; } struct rgw_bucket_sync_pipe { rgw_bucket_sync_pair_info info; RGWBucketInfo source_bucket_info; map source_bucket_attrs; RGWBucketInfo dest_bucket_info; map dest_bucket_attrs; RGWBucketSyncFlowManager::pipe_rules_ref& get_rules() { return info.handler.rules; } }; inline ostream& operator<<(ostream& out, const rgw_bucket_sync_pipe& p) { return out << p.info; } struct rgw_datalog_info { uint32_t num_shards; rgw_datalog_info() : num_shards(0) {} void decode_json(JSONObj *obj); }; struct rgw_data_sync_info { enum SyncState { StateInit = 0, StateBuildingFullSyncMaps = 1, StateSync = 2, }; uint16_t state; uint32_t num_shards; uint64_t instance_id{0}; void encode(bufferlist& bl) const { ENCODE_START(2, 1, bl); encode(state, bl); encode(num_shards, bl); encode(instance_id, bl); ENCODE_FINISH(bl); } void decode(bufferlist::const_iterator& bl) { DECODE_START(2, bl); decode(state, bl); decode(num_shards, bl); if (struct_v >= 2) { decode(instance_id, bl); } DECODE_FINISH(bl); } void dump(Formatter *f) const { string s; switch ((SyncState)state) { case StateInit: s = "init"; break; case StateBuildingFullSyncMaps: s = "building-full-sync-maps"; break; case StateSync: s = "sync"; break; default: s = "unknown"; break; } encode_json("status", s, f); encode_json("num_shards", num_shards, f); encode_json("instance_id", instance_id, f); } void decode_json(JSONObj *obj) { std::string s; JSONDecoder::decode_json("status", s, obj); if (s == "building-full-sync-maps") { state = StateBuildingFullSyncMaps; } else if (s == "sync") { state = StateSync; } else { state = StateInit; } JSONDecoder::decode_json("num_shards", num_shards, obj); JSONDecoder::decode_json("instance_id", instance_id, obj); } static void generate_test_instances(std::list& o); rgw_data_sync_info() : state((int)StateInit), num_shards(0) {} }; WRITE_CLASS_ENCODER(rgw_data_sync_info) struct rgw_data_sync_marker { enum SyncState { FullSync = 0, IncrementalSync = 1, }; uint16_t state; string marker; string next_step_marker; uint64_t total_entries; uint64_t pos; real_time timestamp; rgw_data_sync_marker() : state(FullSync), total_entries(0), pos(0) {} void encode(bufferlist& bl) const { ENCODE_START(1, 1, bl); encode(state, bl); encode(marker, bl); encode(next_step_marker, bl); encode(total_entries, bl); encode(pos, bl); encode(timestamp, bl); ENCODE_FINISH(bl); } void decode(bufferlist::const_iterator& bl) { DECODE_START(1, bl); decode(state, bl); decode(marker, bl); decode(next_step_marker, bl); decode(total_entries, bl); decode(pos, bl); decode(timestamp, bl); DECODE_FINISH(bl); } void dump(Formatter *f) const { const char *s{nullptr}; switch ((SyncState)state) { case FullSync: s = "full-sync"; break; case IncrementalSync: s = "incremental-sync"; break; default: s = "unknown"; break; } encode_json("status", s, f); encode_json("marker", marker, f); encode_json("next_step_marker", next_step_marker, f); encode_json("total_entries", total_entries, f); encode_json("pos", pos, f); encode_json("timestamp", utime_t(timestamp), f); } void decode_json(JSONObj *obj) { std::string s; JSONDecoder::decode_json("status", s, obj); if (s == "full-sync") { state = FullSync; } else if (s == "incremental-sync") { state = IncrementalSync; } JSONDecoder::decode_json("marker", marker, obj); JSONDecoder::decode_json("next_step_marker", next_step_marker, obj); JSONDecoder::decode_json("total_entries", total_entries, obj); JSONDecoder::decode_json("pos", pos, obj); utime_t t; JSONDecoder::decode_json("timestamp", t, obj); timestamp = t.to_real_time(); } static void generate_test_instances(std::list& o); }; WRITE_CLASS_ENCODER(rgw_data_sync_marker) struct rgw_data_sync_status { rgw_data_sync_info sync_info; map sync_markers; rgw_data_sync_status() {} void encode(bufferlist& bl) const { ENCODE_START(1, 1, bl); encode(sync_info, bl); /* sync markers are encoded separately */ ENCODE_FINISH(bl); } void decode(bufferlist::const_iterator& bl) { DECODE_START(1, bl); decode(sync_info, bl); /* sync markers are decoded separately */ DECODE_FINISH(bl); } void dump(Formatter *f) const { encode_json("info", sync_info, f); encode_json("markers", sync_markers, f); } void decode_json(JSONObj *obj) { JSONDecoder::decode_json("info", sync_info, obj); JSONDecoder::decode_json("markers", sync_markers, obj); } static void generate_test_instances(std::list& o); }; WRITE_CLASS_ENCODER(rgw_data_sync_status) struct rgw_datalog_entry { string key; ceph::real_time timestamp; void decode_json(JSONObj *obj); }; struct rgw_datalog_shard_data { string marker; bool truncated; vector entries; void decode_json(JSONObj *obj); }; class RGWAsyncRadosProcessor; class RGWDataSyncControlCR; struct rgw_bucket_entry_owner { string id; string display_name; rgw_bucket_entry_owner() {} rgw_bucket_entry_owner(const string& _id, const string& _display_name) : id(_id), display_name(_display_name) {} void decode_json(JSONObj *obj); }; class RGWSyncErrorLogger; class RGWRESTConn; class RGWServices; struct RGWDataSyncEnv { const DoutPrefixProvider *dpp{nullptr}; CephContext *cct{nullptr}; rgw::sal::RGWRadosStore *store{nullptr}; RGWServices *svc{nullptr}; RGWAsyncRadosProcessor *async_rados{nullptr}; RGWHTTPManager *http_manager{nullptr}; RGWSyncErrorLogger *error_logger{nullptr}; RGWSyncTraceManager *sync_tracer{nullptr}; RGWSyncModuleInstanceRef sync_module{nullptr}; PerfCounters* counters{nullptr}; RGWDataSyncEnv() {} void init(const DoutPrefixProvider *_dpp, CephContext *_cct, rgw::sal::RGWRadosStore *_store, RGWServices *_svc, RGWAsyncRadosProcessor *_async_rados, RGWHTTPManager *_http_manager, RGWSyncErrorLogger *_error_logger, RGWSyncTraceManager *_sync_tracer, RGWSyncModuleInstanceRef& _sync_module, PerfCounters* _counters) { dpp = _dpp; cct = _cct; store = _store; svc = _svc; async_rados = _async_rados; http_manager = _http_manager; error_logger = _error_logger; sync_tracer = _sync_tracer; sync_module = _sync_module; counters = _counters; } string shard_obj_name(int shard_id); string status_oid(); }; struct RGWDataSyncCtx { CephContext *cct{nullptr}; RGWDataSyncEnv *env{nullptr}; RGWRESTConn *conn{nullptr}; rgw_zone_id source_zone; void init(RGWDataSyncEnv *_env, RGWRESTConn *_conn, const rgw_zone_id& _source_zone) { cct = _env->cct; env = _env; conn = _conn; source_zone = _source_zone; } }; class RGWRados; class RGWRemoteDataLog : public RGWCoroutinesManager { const DoutPrefixProvider *dpp; rgw::sal::RGWRadosStore *store; CephContext *cct; RGWCoroutinesManagerRegistry *cr_registry; RGWAsyncRadosProcessor *async_rados; RGWHTTPManager http_manager; RGWDataSyncEnv sync_env; RGWDataSyncCtx sc; ceph::shared_mutex lock = ceph::make_shared_mutex("RGWRemoteDataLog::lock"); RGWDataSyncControlCR *data_sync_cr; RGWSyncTraceNodeRef tn; bool initialized; public: RGWRemoteDataLog(const DoutPrefixProvider *dpp, rgw::sal::RGWRadosStore *_store, RGWAsyncRadosProcessor *async_rados); int init(const rgw_zone_id& _source_zone, RGWRESTConn *_conn, RGWSyncErrorLogger *_error_logger, RGWSyncTraceManager *_sync_tracer, RGWSyncModuleInstanceRef& module, PerfCounters* _counters); void finish(); int read_log_info(const DoutPrefixProvider *dpp, rgw_datalog_info *log_info); int read_source_log_shards_info(const DoutPrefixProvider *dpp, map *shards_info); int read_source_log_shards_next(const DoutPrefixProvider *dpp, map shard_markers, map *result); int read_sync_status(const DoutPrefixProvider *dpp, rgw_data_sync_status *sync_status); int read_recovering_shards(const DoutPrefixProvider *dpp, const int num_shards, set& recovering_shards); int read_shard_status(const DoutPrefixProvider *dpp, int shard_id, set& lagging_buckets,set& recovering_buckets, rgw_data_sync_marker* sync_marker, const int max_entries); int init_sync_status(const DoutPrefixProvider *dpp, int num_shards); int run_sync(const DoutPrefixProvider *dpp, int num_shards); void wakeup(int shard_id, set& keys); }; class RGWDataSyncStatusManager : public DoutPrefixProvider { rgw::sal::RGWRadosStore *store; rgw_zone_id source_zone; RGWRESTConn *conn; RGWSyncErrorLogger *error_logger; RGWSyncModuleInstanceRef sync_module; PerfCounters* counters; RGWRemoteDataLog source_log; string source_status_oid; string source_shard_status_oid_prefix; map shard_objs; int num_shards; public: RGWDataSyncStatusManager(rgw::sal::RGWRadosStore *_store, RGWAsyncRadosProcessor *async_rados, const rgw_zone_id& _source_zone, PerfCounters* counters) : store(_store), source_zone(_source_zone), conn(NULL), error_logger(NULL), sync_module(nullptr), counters(counters), source_log(this, store, async_rados), num_shards(0) {} RGWDataSyncStatusManager(rgw::sal::RGWRadosStore *_store, RGWAsyncRadosProcessor *async_rados, const rgw_zone_id& _source_zone, PerfCounters* counters, const RGWSyncModuleInstanceRef& _sync_module) : store(_store), source_zone(_source_zone), conn(NULL), error_logger(NULL), sync_module(_sync_module), counters(counters), source_log(this, store, async_rados), num_shards(0) {} ~RGWDataSyncStatusManager() { finalize(); } int init(const DoutPrefixProvider *dpp); void finalize(); static string shard_obj_name(const rgw_zone_id& source_zone, int shard_id); static string sync_status_oid(const rgw_zone_id& source_zone); int read_sync_status(const DoutPrefixProvider *dpp, rgw_data_sync_status *sync_status) { return source_log.read_sync_status(dpp, sync_status); } int read_recovering_shards(const DoutPrefixProvider *dpp, const int num_shards, set& recovering_shards) { return source_log.read_recovering_shards(dpp, num_shards, recovering_shards); } int read_shard_status(const DoutPrefixProvider *dpp, int shard_id, set& lagging_buckets, set& recovering_buckets, rgw_data_sync_marker *sync_marker, const int max_entries) { return source_log.read_shard_status(dpp, shard_id, lagging_buckets, recovering_buckets,sync_marker, max_entries); } int init_sync_status(const DoutPrefixProvider *dpp) { return source_log.init_sync_status(dpp, num_shards); } int read_log_info(const DoutPrefixProvider *dpp, rgw_datalog_info *log_info) { return source_log.read_log_info(dpp, log_info); } int read_source_log_shards_info(const DoutPrefixProvider *dpp, map *shards_info) { return source_log.read_source_log_shards_info(dpp, shards_info); } int read_source_log_shards_next(const DoutPrefixProvider *dpp, map shard_markers, map *result) { return source_log.read_source_log_shards_next(dpp, shard_markers, result); } int run(const DoutPrefixProvider *dpp) { return source_log.run_sync(dpp, num_shards); } void wakeup(int shard_id, set& keys) { return source_log.wakeup(shard_id, keys); } void stop() { source_log.finish(); } // implements DoutPrefixProvider CephContext *get_cct() const override; unsigned get_subsys() const override; std::ostream& gen_prefix(std::ostream& out) const override; }; class RGWBucketPipeSyncStatusManager; class RGWBucketSyncCR; struct rgw_bucket_shard_full_sync_marker { rgw_obj_key position; uint64_t count; rgw_bucket_shard_full_sync_marker() : count(0) {} void encode_attr(map& attrs); void encode(bufferlist& bl) const { ENCODE_START(1, 1, bl); encode(position, bl); encode(count, bl); ENCODE_FINISH(bl); } void decode(bufferlist::const_iterator& bl) { DECODE_START(1, bl); decode(position, bl); decode(count, bl); DECODE_FINISH(bl); } void dump(Formatter *f) const; void decode_json(JSONObj *obj); }; WRITE_CLASS_ENCODER(rgw_bucket_shard_full_sync_marker) struct rgw_bucket_shard_inc_sync_marker { string position; ceph::real_time timestamp; void encode_attr(map& attrs); void encode(bufferlist& bl) const { ENCODE_START(2, 1, bl); encode(position, bl); encode(timestamp, bl); ENCODE_FINISH(bl); } void decode(bufferlist::const_iterator& bl) { DECODE_START(2, bl); decode(position, bl); if (struct_v >= 2) { decode(timestamp, bl); } DECODE_FINISH(bl); } void dump(Formatter *f) const; void decode_json(JSONObj *obj); }; WRITE_CLASS_ENCODER(rgw_bucket_shard_inc_sync_marker) struct rgw_bucket_shard_sync_info { enum SyncState { StateInit = 0, StateFullSync = 1, StateIncrementalSync = 2, StateStopped = 3, }; uint16_t state; rgw_bucket_shard_full_sync_marker full_marker; rgw_bucket_shard_inc_sync_marker inc_marker; void decode_from_attrs(CephContext *cct, map& attrs); void encode_all_attrs(map& attrs); void encode_state_attr(map& attrs); void encode(bufferlist& bl) const { ENCODE_START(1, 1, bl); encode(state, bl); encode(full_marker, bl); encode(inc_marker, bl); ENCODE_FINISH(bl); } void decode(bufferlist::const_iterator& bl) { DECODE_START(1, bl); decode(state, bl); decode(full_marker, bl); decode(inc_marker, bl); DECODE_FINISH(bl); } void dump(Formatter *f) const; void decode_json(JSONObj *obj); rgw_bucket_shard_sync_info() : state((int)StateInit) {} }; WRITE_CLASS_ENCODER(rgw_bucket_shard_sync_info) struct rgw_bucket_index_marker_info { string bucket_ver; string master_ver; string max_marker; bool syncstopped{false}; void decode_json(JSONObj *obj) { JSONDecoder::decode_json("bucket_ver", bucket_ver, obj); JSONDecoder::decode_json("master_ver", master_ver, obj); JSONDecoder::decode_json("max_marker", max_marker, obj); JSONDecoder::decode_json("syncstopped", syncstopped, obj); } }; class RGWRemoteBucketManager { const DoutPrefixProvider *dpp; RGWDataSyncEnv *sync_env; RGWRESTConn *conn{nullptr}; rgw_zone_id source_zone; vector sync_pairs; RGWDataSyncCtx sc; rgw_bucket_shard_sync_info init_status; RGWBucketSyncCR *sync_cr{nullptr}; public: RGWRemoteBucketManager(const DoutPrefixProvider *_dpp, RGWDataSyncEnv *_sync_env, const rgw_zone_id& _source_zone, RGWRESTConn *_conn, const RGWBucketInfo& source_bucket_info, const rgw_bucket& dest_bucket); void init(const rgw_zone_id& _source_zone, RGWRESTConn *_conn, const rgw_bucket& source_bucket, int shard_id, const rgw_bucket& dest_bucket); RGWCoroutine *read_sync_status_cr(int num, rgw_bucket_shard_sync_info *sync_status); RGWCoroutine *init_sync_status_cr(int num, RGWObjVersionTracker& objv_tracker); RGWCoroutine *run_sync_cr(int num); int num_pipes() { return sync_pairs.size(); } void wakeup(); }; class BucketIndexShardsManager; int rgw_read_remote_bilog_info(const DoutPrefixProvider *dpp, RGWRESTConn* conn, const rgw_bucket& bucket, BucketIndexShardsManager& markers, optional_yield y); class RGWBucketPipeSyncStatusManager : public DoutPrefixProvider { rgw::sal::RGWRadosStore *store; RGWDataSyncEnv sync_env; RGWCoroutinesManager cr_mgr; RGWHTTPManager http_manager; std::optional source_zone; std::optional source_bucket; RGWRESTConn *conn; RGWSyncErrorLogger *error_logger; RGWSyncModuleInstanceRef sync_module; rgw_bucket dest_bucket; vector source_mgrs; string source_status_oid; string source_shard_status_oid_prefix; map sync_status; rgw_raw_obj status_obj; int num_shards; public: RGWBucketPipeSyncStatusManager(rgw::sal::RGWRadosStore *_store, std::optional _source_zone, std::optional _source_bucket, const rgw_bucket& dest_bucket); ~RGWBucketPipeSyncStatusManager(); int init(const DoutPrefixProvider *dpp); map& get_sync_status() { return sync_status; } int init_sync_status(const DoutPrefixProvider *dpp); static string status_oid(const rgw_zone_id& source_zone, const rgw_bucket_sync_pair_info& bs); static string obj_status_oid(const rgw_bucket_sync_pipe& sync_pipe, const rgw_zone_id& source_zone, const rgw::sal::RGWObject* obj); /* specific source obj sync status, can be used by sync modules */ // implements DoutPrefixProvider CephContext *get_cct() const override; unsigned get_subsys() const override; std::ostream& gen_prefix(std::ostream& out) const override; int read_sync_status(const DoutPrefixProvider *dpp); int run(const DoutPrefixProvider *dpp); }; /// read the sync status of all bucket shards from the given source zone int rgw_bucket_sync_status(const DoutPrefixProvider *dpp, rgw::sal::RGWRadosStore *store, const rgw_sync_bucket_pipe& pipe, const RGWBucketInfo& dest_bucket_info, const RGWBucketInfo *psource_bucket_info, std::vector *status); class RGWDefaultSyncModule : public RGWSyncModule { public: RGWDefaultSyncModule() {} bool supports_writes() override { return true; } bool supports_data_export() override { return true; } int create_instance(CephContext *cct, const JSONFormattable& config, RGWSyncModuleInstanceRef *instance) override; }; class RGWArchiveSyncModule : public RGWDefaultSyncModule { public: RGWArchiveSyncModule() {} bool supports_writes() override { return true; } bool supports_data_export() override { return false; } int create_instance(CephContext *cct, const JSONFormattable& config, RGWSyncModuleInstanceRef *instance) override; }; #endif