mirror of https://github.com/Icinga/icinga2.git
359 lines
9.7 KiB
C++
359 lines
9.7 KiB
C++
/* Icinga 2 | (c) 2012 Icinga GmbH | GPLv2+ */
|
|
|
|
#include "checker/checkercomponent.hpp"
|
|
#include "checker/checkercomponent-ti.cpp"
|
|
#include "icinga/icingaapplication.hpp"
|
|
#include "icinga/cib.hpp"
|
|
#include "remote/apilistener.hpp"
|
|
#include "base/configuration.hpp"
|
|
#include "base/configtype.hpp"
|
|
#include "base/objectlock.hpp"
|
|
#include "base/utility.hpp"
|
|
#include "base/perfdatavalue.hpp"
|
|
#include "base/logger.hpp"
|
|
#include "base/exception.hpp"
|
|
#include "base/convert.hpp"
|
|
#include "base/statsfunction.hpp"
|
|
#include <chrono>
|
|
|
|
using namespace icinga;
|
|
|
|
REGISTER_TYPE(CheckerComponent);
|
|
|
|
REGISTER_STATSFUNCTION(CheckerComponent, &CheckerComponent::StatsFunc);
|
|
|
|
void CheckerComponent::StatsFunc(const Dictionary::Ptr& status, const Array::Ptr& perfdata)
|
|
{
|
|
DictionaryData nodes;
|
|
|
|
for (const CheckerComponent::Ptr& checker : ConfigType::GetObjectsByType<CheckerComponent>()) {
|
|
unsigned long idle = checker->GetIdleCheckables();
|
|
unsigned long pending = checker->GetPendingCheckables();
|
|
|
|
nodes.emplace_back(checker->GetName(), new Dictionary({
|
|
{ "idle", idle },
|
|
{ "pending", pending }
|
|
}));
|
|
|
|
String perfdata_prefix = "checkercomponent_" + checker->GetName() + "_";
|
|
perfdata->Add(new PerfdataValue(perfdata_prefix + "idle", Convert::ToDouble(idle)));
|
|
perfdata->Add(new PerfdataValue(perfdata_prefix + "pending", Convert::ToDouble(pending)));
|
|
}
|
|
|
|
status->Set("checkercomponent", new Dictionary(std::move(nodes)));
|
|
}
|
|
|
|
void CheckerComponent::OnConfigLoaded()
|
|
{
|
|
ConfigObject::OnActiveChanged.connect([this](const ConfigObject::Ptr& object, const Value&) {
|
|
ObjectHandler(object);
|
|
});
|
|
ConfigObject::OnPausedChanged.connect([this](const ConfigObject::Ptr& object, const Value&) {
|
|
ObjectHandler(object);
|
|
});
|
|
|
|
Checkable::OnNextCheckChanged.connect([this](const Checkable::Ptr& checkable, const Value&) {
|
|
NextCheckChangedHandler(checkable);
|
|
});
|
|
}
|
|
|
|
void CheckerComponent::Start(bool runtimeCreated)
|
|
{
|
|
ObjectImpl<CheckerComponent>::Start(runtimeCreated);
|
|
|
|
Log(LogInformation, "CheckerComponent")
|
|
<< "'" << GetName() << "' started.";
|
|
|
|
|
|
m_Thread = std::thread([this]() { CheckThreadProc(); });
|
|
|
|
m_ResultTimer = Timer::Create();
|
|
m_ResultTimer->SetInterval(5);
|
|
m_ResultTimer->OnTimerExpired.connect([this](const Timer * const&) { ResultTimerHandler(); });
|
|
m_ResultTimer->Start();
|
|
}
|
|
|
|
void CheckerComponent::Stop(bool runtimeRemoved)
|
|
{
|
|
{
|
|
std::unique_lock<std::mutex> lock(m_Mutex);
|
|
m_Stopped = true;
|
|
m_CV.notify_all();
|
|
}
|
|
|
|
m_ResultTimer->Stop(true);
|
|
m_Thread.join();
|
|
|
|
Log(LogInformation, "CheckerComponent")
|
|
<< "'" << GetName() << "' stopped.";
|
|
|
|
ObjectImpl<CheckerComponent>::Stop(runtimeRemoved);
|
|
}
|
|
|
|
void CheckerComponent::CheckThreadProc()
|
|
{
|
|
Utility::SetThreadName("Check Scheduler");
|
|
IcingaApplication::Ptr icingaApp = IcingaApplication::GetInstance();
|
|
|
|
std::unique_lock<std::mutex> lock(m_Mutex);
|
|
|
|
for (;;) {
|
|
typedef boost::multi_index::nth_index<CheckableSet, 1>::type CheckTimeView;
|
|
CheckTimeView& idx = boost::get<1>(m_IdleCheckables);
|
|
|
|
while (idx.begin() == idx.end() && !m_Stopped)
|
|
m_CV.wait(lock);
|
|
|
|
if (m_Stopped)
|
|
break;
|
|
|
|
auto it = idx.begin();
|
|
CheckableScheduleInfo csi = *it;
|
|
|
|
double wait = csi.NextCheck - Utility::GetTime();
|
|
|
|
//#ifdef I2_DEBUG
|
|
// Log(LogDebug, "CheckerComponent")
|
|
// << "Pending checks " << Checkable::GetPendingChecks()
|
|
// << " vs. max concurrent checks " << icingaApp->GetMaxConcurrentChecks() << ".";
|
|
//#endif /* I2_DEBUG */
|
|
|
|
if (Checkable::GetPendingChecks() >= icingaApp->GetMaxConcurrentChecks())
|
|
wait = 0.5;
|
|
|
|
if (wait > 0) {
|
|
/* Wait for the next check. */
|
|
m_CV.wait_for(lock, std::chrono::duration<double>(wait));
|
|
|
|
continue;
|
|
}
|
|
|
|
Checkable::Ptr checkable = csi.Object;
|
|
|
|
m_IdleCheckables.erase(checkable);
|
|
|
|
bool forced = checkable->GetForceNextCheck();
|
|
bool check = true;
|
|
bool notifyNextCheck = false;
|
|
|
|
if (!forced) {
|
|
if (!checkable->IsReachable(DependencyCheckExecution)) {
|
|
Log(LogNotice, "CheckerComponent")
|
|
<< "Skipping check for object '" << checkable->GetName() << "': Dependency failed.";
|
|
|
|
check = false;
|
|
notifyNextCheck = true;
|
|
}
|
|
|
|
Host::Ptr host;
|
|
Service::Ptr service;
|
|
tie(host, service) = GetHostService(checkable);
|
|
|
|
if (host && !service && (!checkable->GetEnableActiveChecks() || !icingaApp->GetEnableHostChecks())) {
|
|
Log(LogNotice, "CheckerComponent")
|
|
<< "Skipping check for host '" << host->GetName() << "': active host checks are disabled";
|
|
check = false;
|
|
}
|
|
if (host && service && (!checkable->GetEnableActiveChecks() || !icingaApp->GetEnableServiceChecks())) {
|
|
Log(LogNotice, "CheckerComponent")
|
|
<< "Skipping check for service '" << service->GetName() << "': active service checks are disabled";
|
|
check = false;
|
|
}
|
|
|
|
TimePeriod::Ptr tp = checkable->GetCheckPeriod();
|
|
|
|
if (tp && !tp->IsInside(Utility::GetTime())) {
|
|
Log(LogNotice, "CheckerComponent")
|
|
<< "Skipping check for object '" << checkable->GetName()
|
|
<< "': not in check period '" << tp->GetName() << "'";
|
|
|
|
check = false;
|
|
notifyNextCheck = true;
|
|
}
|
|
}
|
|
|
|
/* reschedule the checkable if checks are disabled */
|
|
if (!check) {
|
|
m_IdleCheckables.insert(GetCheckableScheduleInfo(checkable));
|
|
lock.unlock();
|
|
|
|
Log(LogDebug, "CheckerComponent")
|
|
<< "Checks for checkable '" << checkable->GetName() << "' are disabled. Rescheduling check.";
|
|
|
|
checkable->UpdateNextCheck();
|
|
|
|
if (notifyNextCheck) {
|
|
// Trigger update event for Icinga DB
|
|
Checkable::OnNextCheckUpdated(checkable);
|
|
}
|
|
|
|
lock.lock();
|
|
|
|
continue;
|
|
}
|
|
|
|
|
|
csi = GetCheckableScheduleInfo(checkable);
|
|
|
|
Log(LogDebug, "CheckerComponent")
|
|
<< "Scheduling info for checkable '" << checkable->GetName() << "' ("
|
|
<< Utility::FormatDateTime("%Y-%m-%d %H:%M:%S %z", checkable->GetNextCheck()) << "): Object '"
|
|
<< csi.Object->GetName() << "', Next Check: "
|
|
<< Utility::FormatDateTime("%Y-%m-%d %H:%M:%S %z", csi.NextCheck) << "(" << csi.NextCheck << ").";
|
|
|
|
m_PendingCheckables.insert(csi);
|
|
|
|
lock.unlock();
|
|
|
|
if (forced) {
|
|
ObjectLock olock(checkable);
|
|
checkable->SetForceNextCheck(false);
|
|
}
|
|
|
|
Log(LogDebug, "CheckerComponent")
|
|
<< "Executing check for '" << checkable->GetName() << "'";
|
|
|
|
Checkable::IncreasePendingChecks();
|
|
|
|
/*
|
|
* Explicitly use CheckerComponent::Ptr to keep the reference counted while the
|
|
* callback is active and making it crash safe
|
|
*/
|
|
CheckerComponent::Ptr checkComponent(this);
|
|
|
|
Utility::QueueAsyncCallback([this, checkComponent, checkable]() { ExecuteCheckHelper(checkable); });
|
|
|
|
lock.lock();
|
|
}
|
|
}
|
|
|
|
void CheckerComponent::ExecuteCheckHelper(const Checkable::Ptr& checkable)
|
|
{
|
|
try {
|
|
checkable->ExecuteCheck();
|
|
} catch (const std::exception& ex) {
|
|
CheckResult::Ptr cr = new CheckResult();
|
|
cr->SetState(ServiceUnknown);
|
|
|
|
String output = "Exception occurred while checking '" + checkable->GetName() + "': " + DiagnosticInformation(ex);
|
|
cr->SetOutput(output);
|
|
|
|
double now = Utility::GetTime();
|
|
cr->SetScheduleStart(now);
|
|
cr->SetScheduleEnd(now);
|
|
cr->SetExecutionStart(now);
|
|
cr->SetExecutionEnd(now);
|
|
|
|
checkable->ProcessCheckResult(cr);
|
|
|
|
Log(LogCritical, "checker", output);
|
|
}
|
|
|
|
Checkable::DecreasePendingChecks();
|
|
|
|
{
|
|
std::unique_lock<std::mutex> lock(m_Mutex);
|
|
|
|
/* remove the object from the list of pending objects; if it's not in the
|
|
* list this was a manual (i.e. forced) check and we must not re-add the
|
|
* object to the list because it's already there. */
|
|
auto it = m_PendingCheckables.find(checkable);
|
|
|
|
if (it != m_PendingCheckables.end()) {
|
|
m_PendingCheckables.erase(it);
|
|
|
|
if (checkable->IsActive())
|
|
m_IdleCheckables.insert(GetCheckableScheduleInfo(checkable));
|
|
|
|
m_CV.notify_all();
|
|
}
|
|
}
|
|
|
|
Log(LogDebug, "CheckerComponent")
|
|
<< "Check finished for object '" << checkable->GetName() << "'";
|
|
}
|
|
|
|
void CheckerComponent::ResultTimerHandler()
|
|
{
|
|
std::ostringstream msgbuf;
|
|
|
|
{
|
|
std::unique_lock<std::mutex> lock(m_Mutex);
|
|
|
|
msgbuf << "Pending checkables: " << m_PendingCheckables.size() << "; Idle checkables: " << m_IdleCheckables.size() << "; Checks/s: "
|
|
<< (CIB::GetActiveHostChecksStatistics(60) + CIB::GetActiveServiceChecksStatistics(60)) / 60.0;
|
|
}
|
|
|
|
Log(LogNotice, "CheckerComponent", msgbuf.str());
|
|
}
|
|
|
|
void CheckerComponent::ObjectHandler(const ConfigObject::Ptr& object)
|
|
{
|
|
Checkable::Ptr checkable = dynamic_pointer_cast<Checkable>(object);
|
|
|
|
if (!checkable)
|
|
return;
|
|
|
|
Zone::Ptr zone = Zone::GetByName(checkable->GetZoneName());
|
|
bool same_zone = (!zone || Zone::GetLocalZone() == zone);
|
|
|
|
{
|
|
std::unique_lock<std::mutex> lock(m_Mutex);
|
|
|
|
if (object->IsActive() && !object->IsPaused() && same_zone) {
|
|
if (m_PendingCheckables.find(checkable) != m_PendingCheckables.end())
|
|
return;
|
|
|
|
m_IdleCheckables.insert(GetCheckableScheduleInfo(checkable));
|
|
} else {
|
|
m_IdleCheckables.erase(checkable);
|
|
m_PendingCheckables.erase(checkable);
|
|
}
|
|
|
|
m_CV.notify_all();
|
|
}
|
|
}
|
|
|
|
CheckableScheduleInfo CheckerComponent::GetCheckableScheduleInfo(const Checkable::Ptr& checkable)
|
|
{
|
|
CheckableScheduleInfo csi;
|
|
csi.Object = checkable;
|
|
csi.NextCheck = checkable->GetNextCheck();
|
|
return csi;
|
|
}
|
|
|
|
void CheckerComponent::NextCheckChangedHandler(const Checkable::Ptr& checkable)
|
|
{
|
|
std::unique_lock<std::mutex> lock(m_Mutex);
|
|
|
|
/* remove and re-insert the object from the set in order to force an index update */
|
|
typedef boost::multi_index::nth_index<CheckableSet, 0>::type CheckableView;
|
|
CheckableView& idx = boost::get<0>(m_IdleCheckables);
|
|
|
|
auto it = idx.find(checkable);
|
|
|
|
if (it == idx.end())
|
|
return;
|
|
|
|
idx.erase(checkable);
|
|
|
|
CheckableScheduleInfo csi = GetCheckableScheduleInfo(checkable);
|
|
idx.insert(csi);
|
|
|
|
m_CV.notify_all();
|
|
}
|
|
|
|
unsigned long CheckerComponent::GetIdleCheckables()
|
|
{
|
|
std::unique_lock<std::mutex> lock(m_Mutex);
|
|
|
|
return m_IdleCheckables.size();
|
|
}
|
|
|
|
unsigned long CheckerComponent::GetPendingCheckables()
|
|
{
|
|
std::unique_lock<std::mutex> lock(m_Mutex);
|
|
|
|
return m_PendingCheckables.size();
|
|
}
|