// -*- mode:C++; tab-width:8; c-basic-offset:2; indent-tabs-mode:t -*- // vim: ts=8 sw=2 smarttab /* * Ceph - scalable distributed file system * * Copyright (C) 2016 John Spray * * This is free software; you can redistribute it and/or * modify it under the terms of the GNU Lesser General Public * License version 2.1, as published by the Free Software * Foundation. See file COPYING. */ #ifndef DAEMON_SERVER_H_ #define DAEMON_SERVER_H_ #include "PyModuleRegistry.h" #include #include #include #include "common/ceph_mutex.h" #include "common/LogClient.h" #include "common/Timer.h" #include #include #include "ServiceMap.h" #include "MgrSession.h" #include "DaemonState.h" #include "MetricCollector.h" #include "OSDPerfMetricCollector.h" #include "MDSPerfMetricCollector.h" class MMgrReport; class MMgrOpen; class MMgrUpdate; class MMgrClose; class MMonMgrReport; class MCommand; class MMgrCommand; struct MonCommand; class CommandContext; struct OSDPerfMetricQuery; struct MDSPerfMetricQuery; struct offline_pg_report { set osds; set ok, not_ok, unknown; set ok_become_degraded, ok_become_more_degraded; // ok set bad_no_pool, bad_already_inactive, bad_become_inactive; // not ok bool ok_to_stop() const { return not_ok.empty() && unknown.empty(); } void dump(Formatter *f) const { f->dump_bool("ok_to_stop", ok_to_stop()); f->open_array_section("osds"); for (auto o : osds) { f->dump_int("osd", o); } f->close_section(); f->dump_unsigned("num_ok_pgs", ok.size()); f->dump_unsigned("num_not_ok_pgs", not_ok.size()); // ambiguous if (!unknown.empty()) { f->open_array_section("unknown_pgs"); for (auto pg : unknown) { f->dump_stream("pg") << pg; } f->close_section(); } // bad news if (!bad_no_pool.empty()) { f->open_array_section("bad_no_pool_pgs"); for (auto pg : bad_no_pool) { f->dump_stream("pg") << pg; } f->close_section(); } if (!bad_already_inactive.empty()) { f->open_array_section("bad_already_inactive"); for (auto pg : bad_already_inactive) { f->dump_stream("pg") << pg; } f->close_section(); } if (!bad_become_inactive.empty()) { f->open_array_section("bad_become_inactive"); for (auto pg : bad_become_inactive) { f->dump_stream("pg") << pg; } f->close_section(); } // informative if (!ok_become_degraded.empty()) { f->open_array_section("ok_become_degraded"); for (auto pg : ok_become_degraded) { f->dump_stream("pg") << pg; } f->close_section(); } if (!ok_become_more_degraded.empty()) { f->open_array_section("ok_become_more_degraded"); for (auto pg : ok_become_more_degraded) { f->dump_stream("pg") << pg; } f->close_section(); } } }; /** * Server used in ceph-mgr to communicate with Ceph daemons like * MDSs and OSDs. */ class DaemonServer : public Dispatcher, public md_config_obs_t { protected: boost::scoped_ptr client_byte_throttler; boost::scoped_ptr client_msg_throttler; boost::scoped_ptr osd_byte_throttler; boost::scoped_ptr osd_msg_throttler; boost::scoped_ptr mds_byte_throttler; boost::scoped_ptr mds_msg_throttler; boost::scoped_ptr mon_byte_throttler; boost::scoped_ptr mon_msg_throttler; Messenger *msgr; MonClient *monc; Finisher &finisher; DaemonStateIndex &daemon_state; ClusterState &cluster_state; PyModuleRegistry &py_modules; LogChannelRef clog, audit_clog; // Connections for daemons, and clients with service names set // (i.e. those MgrClients that are allowed to send MMgrReports) std::set daemon_connections; /// connections for osds ceph::unordered_map> osd_cons; ServiceMap pending_service_map; // uncommitted epoch_t pending_service_map_dirty = 0; ceph::mutex lock = ceph::make_mutex("DaemonServer"); static void _generate_command_map(cmdmap_t& cmdmap, std::map ¶m_str_map); static const MonCommand *_get_mgrcommand(const std::string &cmd_prefix, const std::vector &commands); bool _allowed_command( MgrSession *s, const std::string &service, const std::string &module, const std::string &prefix, const cmdmap_t& cmdmap, const std::map& param_str_map, const MonCommand *this_cmd); private: friend class ReplyOnFinish; bool _reply(MCommand* m, int ret, const std::string& s, const bufferlist& payload); void _prune_pending_service_map(); void _check_offlines_pgs( const std::set& osds, const OSDMap& osdmap, const PGMap& pgmap, offline_pg_report *report); void _maximize_ok_to_stop_set( const set& orig_osds, unsigned max, const OSDMap& osdmap, const PGMap& pgmap, offline_pg_report *report); utime_t started_at; std::atomic pgmap_ready; std::set reported_osds; void maybe_ready(int32_t osd_id); SafeTimer timer; bool shutting_down; Context *tick_event; void tick(); void schedule_tick_locked(double delay_sec); class OSDPerfMetricCollectorListener : public MetricListener { public: OSDPerfMetricCollectorListener(DaemonServer *server) : server(server) { } void handle_query_updated() override { server->handle_osd_perf_metric_query_updated(); } private: DaemonServer *server; }; OSDPerfMetricCollectorListener osd_perf_metric_collector_listener; OSDPerfMetricCollector osd_perf_metric_collector; void handle_osd_perf_metric_query_updated(); class MDSPerfMetricCollectorListener : public MetricListener { public: MDSPerfMetricCollectorListener(DaemonServer *server) : server(server) { } void handle_query_updated() override { server->handle_mds_perf_metric_query_updated(); } private: DaemonServer *server; }; MDSPerfMetricCollectorListener mds_perf_metric_collector_listener; MDSPerfMetricCollector mds_perf_metric_collector; void handle_mds_perf_metric_query_updated(); void handle_metric_payload(const OSDMetricPayload &payload) { osd_perf_metric_collector.process_reports(payload); } void handle_metric_payload(const MDSMetricPayload &payload) { mds_perf_metric_collector.process_reports(payload); } void handle_metric_payload(const UnknownMetricPayload &payload) { ceph_abort(); } struct HandlePayloadVisitor : public boost::static_visitor { DaemonServer *server; HandlePayloadVisitor(DaemonServer *server) : server(server) { } template inline void operator()(const MetricPayload &payload) const { server->handle_metric_payload(payload); } }; void update_task_status(DaemonKey key, const std::map& task_status); public: int init(uint64_t gid, entity_addrvec_t client_addrs); void shutdown(); entity_addrvec_t get_myaddrs() const; DaemonServer(MonClient *monc_, Finisher &finisher_, DaemonStateIndex &daemon_state_, ClusterState &cluster_state_, PyModuleRegistry &py_modules_, LogChannelRef cl, LogChannelRef auditcl); ~DaemonServer() override; bool ms_dispatch2(const ceph::ref_t& m) override; int ms_handle_fast_authentication(Connection *con) override; void ms_handle_accept(Connection *con) override; bool ms_handle_reset(Connection *con) override; void ms_handle_remote_reset(Connection *con) override {} bool ms_handle_refused(Connection *con) override; void fetch_missing_metadata(const DaemonKey& key, const entity_addr_t& addr); bool handle_open(const ceph::ref_t& m); bool handle_update(const ceph::ref_t& m); bool handle_close(const ceph::ref_t& m); bool handle_report(const ceph::ref_t& m); bool handle_command(const ceph::ref_t& m); bool handle_command(const ceph::ref_t& m); bool _handle_command(std::shared_ptr& cmdctx); void send_report(); void got_service_map(); void got_mgr_map(); void adjust_pgs(); void _send_configure(ConnectionRef c); MetricQueryID add_osd_perf_query( const OSDPerfMetricQuery &query, const std::optional &limit); int remove_osd_perf_query(MetricQueryID query_id); int get_osd_perf_counters(OSDPerfCollector *collector); MetricQueryID add_mds_perf_query(const MDSPerfMetricQuery &query, const std::optional &limit); int remove_mds_perf_query(MetricQueryID query_id); void reregister_mds_perf_queries(); int get_mds_perf_counters(MDSPerfCollector *collector); virtual const char** get_tracked_conf_keys() const override; virtual void handle_conf_change(const ConfigProxy& conf, const std::set &changed) override; void schedule_tick(double delay_sec); void log_access_denied(std::shared_ptr& cmdctx, MgrSession* session, std::stringstream& ss); void dump_pg_ready(ceph::Formatter *f); }; #endif