summaryrefslogtreecommitdiffstats
path: root/lib/checker/checkercomponent.cpp
diff options
context:
space:
mode:
Diffstat (limited to 'lib/checker/checkercomponent.cpp')
-rw-r--r--lib/checker/checkercomponent.cpp358
1 files changed, 358 insertions, 0 deletions
diff --git a/lib/checker/checkercomponent.cpp b/lib/checker/checkercomponent.cpp
new file mode 100644
index 0000000..d92101f
--- /dev/null
+++ b/lib/checker/checkercomponent.cpp
@@ -0,0 +1,358 @@
+/* Icinga 2 | (c) 2012 Icinga GmbH | GPLv2+ */
+
+#include "checker/checkercomponent.hpp"
+#include "checker/checkercomponent-ti.cpp"
+#include "icinga/icingaapplication.hpp"
+#include "icinga/cib.hpp"
+#include "remote/apilistener.hpp"
+#include "base/configuration.hpp"
+#include "base/configtype.hpp"
+#include "base/objectlock.hpp"
+#include "base/utility.hpp"
+#include "base/perfdatavalue.hpp"
+#include "base/logger.hpp"
+#include "base/exception.hpp"
+#include "base/convert.hpp"
+#include "base/statsfunction.hpp"
+#include <chrono>
+
+using namespace icinga;
+
+REGISTER_TYPE(CheckerComponent);
+
+REGISTER_STATSFUNCTION(CheckerComponent, &CheckerComponent::StatsFunc);
+
+void CheckerComponent::StatsFunc(const Dictionary::Ptr& status, const Array::Ptr& perfdata)
+{
+ DictionaryData nodes;
+
+ for (const CheckerComponent::Ptr& checker : ConfigType::GetObjectsByType<CheckerComponent>()) {
+ unsigned long idle = checker->GetIdleCheckables();
+ unsigned long pending = checker->GetPendingCheckables();
+
+ nodes.emplace_back(checker->GetName(), new Dictionary({
+ { "idle", idle },
+ { "pending", pending }
+ }));
+
+ String perfdata_prefix = "checkercomponent_" + checker->GetName() + "_";
+ perfdata->Add(new PerfdataValue(perfdata_prefix + "idle", Convert::ToDouble(idle)));
+ perfdata->Add(new PerfdataValue(perfdata_prefix + "pending", Convert::ToDouble(pending)));
+ }
+
+ status->Set("checkercomponent", new Dictionary(std::move(nodes)));
+}
+
+void CheckerComponent::OnConfigLoaded()
+{
+ ConfigObject::OnActiveChanged.connect([this](const ConfigObject::Ptr& object, const Value&) {
+ ObjectHandler(object);
+ });
+ ConfigObject::OnPausedChanged.connect([this](const ConfigObject::Ptr& object, const Value&) {
+ ObjectHandler(object);
+ });
+
+ Checkable::OnNextCheckChanged.connect([this](const Checkable::Ptr& checkable, const Value&) {
+ NextCheckChangedHandler(checkable);
+ });
+}
+
+void CheckerComponent::Start(bool runtimeCreated)
+{
+ ObjectImpl<CheckerComponent>::Start(runtimeCreated);
+
+ Log(LogInformation, "CheckerComponent")
+ << "'" << GetName() << "' started.";
+
+
+ m_Thread = std::thread([this]() { CheckThreadProc(); });
+
+ m_ResultTimer = Timer::Create();
+ m_ResultTimer->SetInterval(5);
+ m_ResultTimer->OnTimerExpired.connect([this](const Timer * const&) { ResultTimerHandler(); });
+ m_ResultTimer->Start();
+}
+
+void CheckerComponent::Stop(bool runtimeRemoved)
+{
+ {
+ std::unique_lock<std::mutex> lock(m_Mutex);
+ m_Stopped = true;
+ m_CV.notify_all();
+ }
+
+ m_ResultTimer->Stop(true);
+ m_Thread.join();
+
+ Log(LogInformation, "CheckerComponent")
+ << "'" << GetName() << "' stopped.";
+
+ ObjectImpl<CheckerComponent>::Stop(runtimeRemoved);
+}
+
+void CheckerComponent::CheckThreadProc()
+{
+ Utility::SetThreadName("Check Scheduler");
+ IcingaApplication::Ptr icingaApp = IcingaApplication::GetInstance();
+
+ std::unique_lock<std::mutex> lock(m_Mutex);
+
+ for (;;) {
+ typedef boost::multi_index::nth_index<CheckableSet, 1>::type CheckTimeView;
+ CheckTimeView& idx = boost::get<1>(m_IdleCheckables);
+
+ while (idx.begin() == idx.end() && !m_Stopped)
+ m_CV.wait(lock);
+
+ if (m_Stopped)
+ break;
+
+ auto it = idx.begin();
+ CheckableScheduleInfo csi = *it;
+
+ double wait = csi.NextCheck - Utility::GetTime();
+
+//#ifdef I2_DEBUG
+// Log(LogDebug, "CheckerComponent")
+// << "Pending checks " << Checkable::GetPendingChecks()
+// << " vs. max concurrent checks " << icingaApp->GetMaxConcurrentChecks() << ".";
+//#endif /* I2_DEBUG */
+
+ if (Checkable::GetPendingChecks() >= icingaApp->GetMaxConcurrentChecks())
+ wait = 0.5;
+
+ if (wait > 0) {
+ /* Wait for the next check. */
+ m_CV.wait_for(lock, std::chrono::duration<double>(wait));
+
+ continue;
+ }
+
+ Checkable::Ptr checkable = csi.Object;
+
+ m_IdleCheckables.erase(checkable);
+
+ bool forced = checkable->GetForceNextCheck();
+ bool check = true;
+ bool notifyNextCheck = false;
+
+ if (!forced) {
+ if (!checkable->IsReachable(DependencyCheckExecution)) {
+ Log(LogNotice, "CheckerComponent")
+ << "Skipping check for object '" << checkable->GetName() << "': Dependency failed.";
+
+ check = false;
+ notifyNextCheck = true;
+ }
+
+ Host::Ptr host;
+ Service::Ptr service;
+ tie(host, service) = GetHostService(checkable);
+
+ if (host && !service && (!checkable->GetEnableActiveChecks() || !icingaApp->GetEnableHostChecks())) {
+ Log(LogNotice, "CheckerComponent")
+ << "Skipping check for host '" << host->GetName() << "': active host checks are disabled";
+ check = false;
+ }
+ if (host && service && (!checkable->GetEnableActiveChecks() || !icingaApp->GetEnableServiceChecks())) {
+ Log(LogNotice, "CheckerComponent")
+ << "Skipping check for service '" << service->GetName() << "': active service checks are disabled";
+ check = false;
+ }
+
+ TimePeriod::Ptr tp = checkable->GetCheckPeriod();
+
+ if (tp && !tp->IsInside(Utility::GetTime())) {
+ Log(LogNotice, "CheckerComponent")
+ << "Skipping check for object '" << checkable->GetName()
+ << "': not in check period '" << tp->GetName() << "'";
+
+ check = false;
+ notifyNextCheck = true;
+ }
+ }
+
+ /* reschedule the checkable if checks are disabled */
+ if (!check) {
+ m_IdleCheckables.insert(GetCheckableScheduleInfo(checkable));
+ lock.unlock();
+
+ Log(LogDebug, "CheckerComponent")
+ << "Checks for checkable '" << checkable->GetName() << "' are disabled. Rescheduling check.";
+
+ checkable->UpdateNextCheck();
+
+ if (notifyNextCheck) {
+ // Trigger update event for Icinga DB
+ Checkable::OnNextCheckUpdated(checkable);
+ }
+
+ lock.lock();
+
+ continue;
+ }
+
+
+ csi = GetCheckableScheduleInfo(checkable);
+
+ Log(LogDebug, "CheckerComponent")
+ << "Scheduling info for checkable '" << checkable->GetName() << "' ("
+ << Utility::FormatDateTime("%Y-%m-%d %H:%M:%S %z", checkable->GetNextCheck()) << "): Object '"
+ << csi.Object->GetName() << "', Next Check: "
+ << Utility::FormatDateTime("%Y-%m-%d %H:%M:%S %z", csi.NextCheck) << "(" << csi.NextCheck << ").";
+
+ m_PendingCheckables.insert(csi);
+
+ lock.unlock();
+
+ if (forced) {
+ ObjectLock olock(checkable);
+ checkable->SetForceNextCheck(false);
+ }
+
+ Log(LogDebug, "CheckerComponent")
+ << "Executing check for '" << checkable->GetName() << "'";
+
+ Checkable::IncreasePendingChecks();
+
+ /*
+ * Explicitly use CheckerComponent::Ptr to keep the reference counted while the
+ * callback is active and making it crash safe
+ */
+ CheckerComponent::Ptr checkComponent(this);
+
+ Utility::QueueAsyncCallback([this, checkComponent, checkable]() { ExecuteCheckHelper(checkable); });
+
+ lock.lock();
+ }
+}
+
+void CheckerComponent::ExecuteCheckHelper(const Checkable::Ptr& checkable)
+{
+ try {
+ checkable->ExecuteCheck();
+ } catch (const std::exception& ex) {
+ CheckResult::Ptr cr = new CheckResult();
+ cr->SetState(ServiceUnknown);
+
+ String output = "Exception occurred while checking '" + checkable->GetName() + "': " + DiagnosticInformation(ex);
+ cr->SetOutput(output);
+
+ double now = Utility::GetTime();
+ cr->SetScheduleStart(now);
+ cr->SetScheduleEnd(now);
+ cr->SetExecutionStart(now);
+ cr->SetExecutionEnd(now);
+
+ checkable->ProcessCheckResult(cr);
+
+ Log(LogCritical, "checker", output);
+ }
+
+ Checkable::DecreasePendingChecks();
+
+ {
+ std::unique_lock<std::mutex> lock(m_Mutex);
+
+ /* remove the object from the list of pending objects; if it's not in the
+ * list this was a manual (i.e. forced) check and we must not re-add the
+ * object to the list because it's already there. */
+ auto it = m_PendingCheckables.find(checkable);
+
+ if (it != m_PendingCheckables.end()) {
+ m_PendingCheckables.erase(it);
+
+ if (checkable->IsActive())
+ m_IdleCheckables.insert(GetCheckableScheduleInfo(checkable));
+
+ m_CV.notify_all();
+ }
+ }
+
+ Log(LogDebug, "CheckerComponent")
+ << "Check finished for object '" << checkable->GetName() << "'";
+}
+
+void CheckerComponent::ResultTimerHandler()
+{
+ std::ostringstream msgbuf;
+
+ {
+ std::unique_lock<std::mutex> lock(m_Mutex);
+
+ msgbuf << "Pending checkables: " << m_PendingCheckables.size() << "; Idle checkables: " << m_IdleCheckables.size() << "; Checks/s: "
+ << (CIB::GetActiveHostChecksStatistics(60) + CIB::GetActiveServiceChecksStatistics(60)) / 60.0;
+ }
+
+ Log(LogNotice, "CheckerComponent", msgbuf.str());
+}
+
+void CheckerComponent::ObjectHandler(const ConfigObject::Ptr& object)
+{
+ Checkable::Ptr checkable = dynamic_pointer_cast<Checkable>(object);
+
+ if (!checkable)
+ return;
+
+ Zone::Ptr zone = Zone::GetByName(checkable->GetZoneName());
+ bool same_zone = (!zone || Zone::GetLocalZone() == zone);
+
+ {
+ std::unique_lock<std::mutex> lock(m_Mutex);
+
+ if (object->IsActive() && !object->IsPaused() && same_zone) {
+ if (m_PendingCheckables.find(checkable) != m_PendingCheckables.end())
+ return;
+
+ m_IdleCheckables.insert(GetCheckableScheduleInfo(checkable));
+ } else {
+ m_IdleCheckables.erase(checkable);
+ m_PendingCheckables.erase(checkable);
+ }
+
+ m_CV.notify_all();
+ }
+}
+
+CheckableScheduleInfo CheckerComponent::GetCheckableScheduleInfo(const Checkable::Ptr& checkable)
+{
+ CheckableScheduleInfo csi;
+ csi.Object = checkable;
+ csi.NextCheck = checkable->GetNextCheck();
+ return csi;
+}
+
+void CheckerComponent::NextCheckChangedHandler(const Checkable::Ptr& checkable)
+{
+ std::unique_lock<std::mutex> lock(m_Mutex);
+
+ /* remove and re-insert the object from the set in order to force an index update */
+ typedef boost::multi_index::nth_index<CheckableSet, 0>::type CheckableView;
+ CheckableView& idx = boost::get<0>(m_IdleCheckables);
+
+ auto it = idx.find(checkable);
+
+ if (it == idx.end())
+ return;
+
+ idx.erase(checkable);
+
+ CheckableScheduleInfo csi = GetCheckableScheduleInfo(checkable);
+ idx.insert(csi);
+
+ m_CV.notify_all();
+}
+
+unsigned long CheckerComponent::GetIdleCheckables()
+{
+ std::unique_lock<std::mutex> lock(m_Mutex);
+
+ return m_IdleCheckables.size();
+}
+
+unsigned long CheckerComponent::GetPendingCheckables()
+{
+ std::unique_lock<std::mutex> lock(m_Mutex);
+
+ return m_PendingCheckables.size();
+}