// -*- mode:C++; tab-width:8; c-basic-offset:2; indent-tabs-mode:t -*- // vim: ts=8 sw=2 smarttab #include "MgrStatMonitor.h" #include "mon/OSDMonitor.h" #include "mon/PGMap.h" #include "mon/PGMonitor.h" #include "messages/MGetPoolStats.h" #include "messages/MGetPoolStatsReply.h" #include "messages/MMonMgrReport.h" #include "messages/MStatfs.h" #include "messages/MStatfsReply.h" #include "messages/MServiceMap.h" class MgrPGStatService : public MonPGStatService { PGMapDigest& digest; public: MgrPGStatService(PGMapDigest& d) : digest(d) {} const pool_stat_t* get_pool_stat(int64_t poolid) const override { auto i = digest.pg_pool_sum.find(poolid); if (i != digest.pg_pool_sum.end()) { return &i->second; } return nullptr; } ceph_statfs get_statfs(OSDMap& osdmap, boost::optional data_pool) const override { return digest.get_statfs(osdmap, data_pool); } void print_summary(Formatter *f, ostream *out) const override { digest.print_summary(f, out); } void dump_info(Formatter *f) const override { digest.dump(f); } void dump_fs_stats(stringstream *ss, Formatter *f, bool verbose) const override { digest.dump_fs_stats(ss, f, verbose); } void dump_pool_stats(const OSDMap& osdm, stringstream *ss, Formatter *f, bool verbose) const override { digest.dump_pool_stats_full(osdm, ss, f, verbose); } }; #define dout_subsys ceph_subsys_mon #undef dout_prefix #define dout_prefix _prefix(_dout, mon) static ostream& _prefix(std::ostream *_dout, Monitor *mon) { return *_dout << "mon." << mon->name << "@" << mon->rank << "(" << mon->get_state_name() << ").mgrstat "; } MgrStatMonitor::MgrStatMonitor(Monitor *mn, Paxos *p, const string& service_name) : PaxosService(mn, p, service_name), pgservice(new MgrPGStatService(digest)) { } MgrStatMonitor::~MgrStatMonitor() = default; MonPGStatService *MgrStatMonitor::get_pg_stat_service() { return pgservice.get(); } void MgrStatMonitor::create_initial() { dout(10) << __func__ << dendl; version = 0; service_map.epoch = 1; ::encode(service_map, pending_service_map_bl, CEPH_FEATURES_ALL); } void MgrStatMonitor::update_from_paxos(bool *need_bootstrap) { version = get_last_committed(); dout(10) << " " << version << dendl; load_health(); bufferlist bl; get_version(version, bl); if (version) { assert(bl.length()); try { auto p = bl.begin(); ::decode(digest, p); ::decode(service_map, p); dout(10) << __func__ << " v" << version << " service_map e" << service_map.epoch << dendl; } catch (buffer::error& e) { derr << "failed to decode mgrstat state; luminous dev version?" << dendl; } } check_subs(); update_logger(); } void MgrStatMonitor::update_logger() { dout(20) << __func__ << dendl; if (mon->osdmon()->osdmap.require_osd_release < CEPH_RELEASE_LUMINOUS) { dout(20) << "yielding cluster perfcounter updates to pgmon" << dendl; return; } mon->cluster_logger->set(l_cluster_osd_bytes, digest.osd_sum.kb * 1024ull); mon->cluster_logger->set(l_cluster_osd_bytes_used, digest.osd_sum.kb_used * 1024ull); mon->cluster_logger->set(l_cluster_osd_bytes_avail, digest.osd_sum.kb_avail * 1024ull); mon->cluster_logger->set(l_cluster_num_pool, digest.pg_pool_sum.size()); uint64_t num_pg = 0; for (auto i : digest.num_pg_by_pool) { num_pg += i.second; } mon->cluster_logger->set(l_cluster_num_pg, num_pg); unsigned active = 0, active_clean = 0, peering = 0; for (auto p = digest.num_pg_by_state.begin(); p != digest.num_pg_by_state.end(); ++p) { if (p->first & PG_STATE_ACTIVE) { active += p->second; if (p->first & PG_STATE_CLEAN) active_clean += p->second; } if (p->first & PG_STATE_PEERING) peering += p->second; } mon->cluster_logger->set(l_cluster_num_pg_active_clean, active_clean); mon->cluster_logger->set(l_cluster_num_pg_active, active); mon->cluster_logger->set(l_cluster_num_pg_peering, peering); mon->cluster_logger->set(l_cluster_num_object, digest.pg_sum.stats.sum.num_objects); mon->cluster_logger->set(l_cluster_num_object_degraded, digest.pg_sum.stats.sum.num_objects_degraded); mon->cluster_logger->set(l_cluster_num_object_misplaced, digest.pg_sum.stats.sum.num_objects_misplaced); mon->cluster_logger->set(l_cluster_num_object_unfound, digest.pg_sum.stats.sum.num_objects_unfound); mon->cluster_logger->set(l_cluster_num_bytes, digest.pg_sum.stats.sum.num_bytes); } void MgrStatMonitor::create_pending() { dout(10) << " " << version << dendl; pending_digest = digest; pending_health_checks = get_health_checks(); pending_service_map_bl.clear(); ::encode(service_map, pending_service_map_bl, mon->get_quorum_con_features()); } void MgrStatMonitor::encode_pending(MonitorDBStore::TransactionRef t) { ++version; if (version < mon->pgmon()->get_last_committed()) { // fast-forward to pgmon version to ensure clients don't see a // jump back in time for MGetPoolStats and MStatFs. version = mon->pgmon()->get_last_committed() + 1; } dout(10) << " " << version << dendl; bufferlist bl; ::encode(pending_digest, bl, mon->get_quorum_con_features()); assert(pending_service_map_bl.length()); bl.append(pending_service_map_bl); put_version(t, version, bl); put_last_committed(t, version); encode_health(pending_health_checks, t); } version_t MgrStatMonitor::get_trim_to() { // we don't actually need *any* old states, but keep a few. if (version > 5) { return version - 5; } return 0; } void MgrStatMonitor::on_active() { update_logger(); } void MgrStatMonitor::get_health(list >& summary, list > *detail, CephContext *cct) const { } void MgrStatMonitor::tick() { } void MgrStatMonitor::print_summary(Formatter *f, std::ostream *ss) const { pgservice->print_summary(f, ss); } bool MgrStatMonitor::preprocess_query(MonOpRequestRef op) { auto m = static_cast(op->get_req()); switch (m->get_type()) { case CEPH_MSG_STATFS: return preprocess_statfs(op); case MSG_MON_MGR_REPORT: return preprocess_report(op); case MSG_GETPOOLSTATS: return preprocess_getpoolstats(op); default: mon->no_reply(op); derr << "Unhandled message type " << m->get_type() << dendl; return true; } } bool MgrStatMonitor::prepare_update(MonOpRequestRef op) { auto m = static_cast(op->get_req()); switch (m->get_type()) { case MSG_MON_MGR_REPORT: return prepare_report(op); default: mon->no_reply(op); derr << "Unhandled message type " << m->get_type() << dendl; return true; } } bool MgrStatMonitor::preprocess_report(MonOpRequestRef op) { return false; } bool MgrStatMonitor::prepare_report(MonOpRequestRef op) { auto m = static_cast(op->get_req()); bufferlist bl = m->get_data(); auto p = bl.begin(); ::decode(pending_digest, p); pending_health_checks.swap(m->health_checks); if (m->service_map_bl.length()) { pending_service_map_bl.swap(m->service_map_bl); } dout(10) << __func__ << " " << pending_digest << ", " << pending_health_checks.checks.size() << " health checks" << dendl; return true; } bool MgrStatMonitor::preprocess_getpoolstats(MonOpRequestRef op) { op->mark_pgmon_event(__func__); auto m = static_cast(op->get_req()); auto session = m->get_session(); if (!session) return true; if (!session->is_capable("pg", MON_CAP_R)) { dout(0) << "MGetPoolStats received from entity with insufficient caps " << session->caps << dendl; return true; } if (m->fsid != mon->monmap->fsid) { dout(0) << __func__ << " on fsid " << m->fsid << " != " << mon->monmap->fsid << dendl; return true; } epoch_t ver = 0; if (mon->pgservice == get_pg_stat_service()) { ver = get_last_committed(); } else { ver = mon->pgmon()->get_last_committed(); } auto reply = new MGetPoolStatsReply(m->fsid, m->get_tid(), ver); for (const auto& pool_name : m->pools) { const auto pool_id = mon->osdmon()->osdmap.lookup_pg_pool_name(pool_name); if (pool_id == -ENOENT) continue; auto pool_stat = mon->pgservice->get_pool_stat(pool_id); if (!pool_stat) continue; reply->pool_stats[pool_name] = *pool_stat; } mon->send_reply(op, reply); return true; } bool MgrStatMonitor::preprocess_statfs(MonOpRequestRef op) { op->mark_pgmon_event(__func__); auto statfs = static_cast(op->get_req()); auto session = statfs->get_session(); if (!session) return true; if (!session->is_capable("pg", MON_CAP_R)) { dout(0) << "MStatfs received from entity with insufficient privileges " << session->caps << dendl; return true; } if (statfs->fsid != mon->monmap->fsid) { dout(0) << __func__ << " on fsid " << statfs->fsid << " != " << mon->monmap->fsid << dendl; return true; } dout(10) << __func__ << " " << *statfs << " from " << statfs->get_orig_source() << dendl; epoch_t ver = 0; if (mon->pgservice == get_pg_stat_service()) { ver = get_last_committed(); } else { ver = mon->pgmon()->get_last_committed(); } auto reply = new MStatfsReply(statfs->fsid, statfs->get_tid(), ver); reply->h.st = mon->pgservice->get_statfs(mon->osdmon()->osdmap, statfs->data_pool); mon->send_reply(op, reply); return true; } void MgrStatMonitor::check_sub(Subscription *sub) { const auto epoch = mon->monmap->get_epoch(); dout(10) << __func__ << " next " << sub->next << " have " << epoch << dendl; if (sub->next <= service_map.epoch) { auto m = new MServiceMap(service_map); sub->session->con->send_message(m); if (sub->onetime) { mon->with_session_map([this, sub](MonSessionMap& session_map) { session_map.remove_sub(sub); }); } else { sub->next = epoch + 1; } } } void MgrStatMonitor::check_subs() { dout(10) << __func__ << dendl; if (!service_map.epoch) { return; } auto subs = mon->session_map.subs.find("servicemap"); if (subs == mon->session_map.subs.end()) { return; } auto p = subs->second->begin(); while (!p.end()) { auto sub = *p; ++p; check_sub(sub); } }