icinga2/components/checker/checkercomponent.cpp

308 lines
9.4 KiB
C++
Raw Normal View History

2012-06-14 11:23:25 +02:00
/******************************************************************************
* Icinga 2 *
* Copyright (C) 2012-2014 Icinga Development Team (http://www.icinga.org) *
2012-06-14 11:23:25 +02:00
* *
* This program is free software; you can redistribute it and/or *
* modify it under the terms of the GNU General Public License *
* as published by the Free Software Foundation; either version 2 *
* of the License, or (at your option) any later version. *
* *
* This program is distributed in the hope that it will be useful, *
* but WITHOUT ANY WARRANTY; without even the implied warranty of *
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the *
* GNU General Public License for more details. *
* *
* You should have received a copy of the GNU General Public License *
* along with this program; if not, write to the Free Software Foundation *
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA. *
******************************************************************************/
2014-05-25 16:23:35 +02:00
#include "checker/checkercomponent.hpp"
#include "icinga/icingaapplication.hpp"
#include "icinga/cib.hpp"
#include "icinga/perfdatavalue.hpp"
2014-05-25 16:23:35 +02:00
#include "remote/apilistener.hpp"
#include "base/dynamictype.hpp"
#include "base/objectlock.hpp"
#include "base/utility.hpp"
#include "base/logger_fwd.hpp"
#include "base/exception.hpp"
#include "base/convert.hpp"
#include "base/statsfunction.hpp"
#include <boost/foreach.hpp>
2012-06-14 11:23:25 +02:00
/* Make the names from the icinga namespace available unqualified in this file. */
using namespace icinga;
/* NOTE(review): presumably registers CheckerComponent with the runtime type
 * system - confirm against the REGISTER_TYPE macro definition. */
REGISTER_TYPE(CheckerComponent);
/* NOTE(review): presumably publishes CheckerComponent::StatsFunc under the name
 * "CheckerComponentStats" - confirm against the REGISTER_STATSFUNCTION macro. */
REGISTER_STATSFUNCTION(CheckerComponentStats, &CheckerComponent::StatsFunc);
/**
 * Collects scheduling statistics for every CheckerComponent object.
 *
 * For each checker a dictionary with its "idle" and "pending" checkable
 * counts is stored (keyed by the checker's name) in a dictionary that is
 * placed under the "checkercomponent" key of @p status. The same two counts
 * are appended to @p perfdata as PerfdataValue objects whose labels are
 * prefixed with "checkercomponent_<name>_".
 *
 * @param status Dictionary that receives the "checkercomponent" entry.
 * @param perfdata Array that receives the perfdata values.
 * @returns Always 0.
 */
Value CheckerComponent::StatsFunc(const Dictionary::Ptr& status, const Array::Ptr& perfdata)
{
	Dictionary::Ptr perChecker = make_shared<Dictionary>();

	BOOST_FOREACH(const CheckerComponent::Ptr& checker, DynamicType::GetObjectsByType<CheckerComponent>()) {
		/* Each getter takes the checker's mutex on its own. */
		unsigned long idleCount = checker->GetIdleCheckables();
		unsigned long pendingCount = checker->GetPendingCheckables();

		Dictionary::Ptr counters = make_shared<Dictionary>();
		counters->Set("idle", idleCount);
		counters->Set("pending", pendingCount);

		perChecker->Set(checker->GetName(), counters);

		String labelPrefix = "checkercomponent_" + checker->GetName() + "_";

		perfdata->Add(make_shared<PerfdataValue>(labelPrefix + "idle", Convert::ToDouble(idleCount)));
		perfdata->Add(make_shared<PerfdataValue>(labelPrefix + "pending", Convert::ToDouble(pendingCount)));
	}

	status->Set("checkercomponent", perChecker);

	return 0;
}
void CheckerComponent::OnConfigLoaded(void)
2012-06-14 11:23:25 +02:00
{
DynamicObject::OnStarted.connect(bind(&CheckerComponent::ObjectHandler, this, _1));
DynamicObject::OnStopped.connect(bind(&CheckerComponent::ObjectHandler, this, _1));
DynamicObject::OnPaused.connect(bind(&CheckerComponent::ObjectHandler, this, _1));
DynamicObject::OnResumed.connect(bind(&CheckerComponent::ObjectHandler, this, _1));
2012-08-14 10:53:04 +02:00
2014-04-03 15:36:13 +02:00
Checkable::OnNextCheckChanged.connect(bind(&CheckerComponent::NextCheckChangedHandler, this, _1));
}
void CheckerComponent::Start(void)
{
DynamicObject::Start();
2013-02-19 23:02:08 +01:00
m_Stopped = false;
2013-03-15 18:21:29 +01:00
m_Thread = boost::thread(boost::bind(&CheckerComponent::CheckThreadProc, this));
2012-06-14 11:23:25 +02:00
m_ResultTimer = make_shared<Timer>();
2012-06-17 23:10:03 +02:00
m_ResultTimer->SetInterval(5);
2012-06-17 20:35:56 +02:00
m_ResultTimer->OnTimerExpired.connect(boost::bind(&CheckerComponent::ResultTimerHandler, this));
m_ResultTimer->Start();
2012-06-14 11:23:25 +02:00
}
void CheckerComponent::Stop(void)
{
Log(LogInformation, "CheckerComponent", "Checker stopped.");
2013-02-19 23:02:08 +01:00
{
boost::mutex::scoped_lock lock(m_Mutex);
m_Stopped = true;
m_CV.notify_all();
}
m_ResultTimer->Stop();
2013-02-19 23:02:08 +01:00
m_Thread.join();
2014-04-16 15:01:31 +02:00
DynamicObject::Stop();
2012-06-14 11:23:25 +02:00
}
2013-02-18 14:40:24 +01:00
void CheckerComponent::CheckThreadProc(void)
2012-06-14 11:23:25 +02:00
{
Utility::SetThreadName("Check Scheduler");
2013-02-24 01:10:34 +01:00
boost::mutex::scoped_lock lock(m_Mutex);
2013-02-17 19:14:34 +01:00
2013-02-24 01:10:34 +01:00
for (;;) {
2014-04-03 15:36:13 +02:00
typedef boost::multi_index::nth_index<CheckableSet, 1>::type CheckTimeView;
CheckTimeView& idx = boost::get<1>(m_IdleCheckables);
2013-02-17 19:14:34 +01:00
2013-02-21 16:12:50 +01:00
while (idx.begin() == idx.end() && !m_Stopped)
m_CV.wait(lock);
2013-02-21 16:12:50 +01:00
if (m_Stopped)
break;
2013-02-19 23:02:08 +01:00
2013-02-21 16:12:50 +01:00
CheckTimeView::iterator it = idx.begin();
2014-04-05 19:02:45 +02:00
Checkable::Ptr checkable = *it;
2013-02-17 19:14:34 +01:00
2014-04-05 19:02:45 +02:00
double wait = checkable->GetNextCheck() - Utility::GetTime();
2013-02-18 14:40:24 +01:00
if (wait > 0) {
/* Wait for the next check. */
2013-10-18 13:46:22 +02:00
m_CV.timed_wait(lock, boost::posix_time::milliseconds(wait * 1000));
2013-02-18 14:40:24 +01:00
continue;
}
2014-04-05 19:02:45 +02:00
m_IdleCheckables.erase(checkable);
2014-04-05 19:02:45 +02:00
bool forced = checkable->GetForceNextCheck();
2013-03-13 16:04:53 +01:00
bool check = true;
2013-09-12 10:03:48 +02:00
if (!forced) {
2014-04-05 19:02:45 +02:00
if (!checkable->IsReachable(DependencyCheckExecution)) {
Log(LogNotice, "CheckerComponent", "Skipping check for object '" + checkable->GetName() + "': Dependency failed.");
check = false;
}
Host::Ptr host;
Service::Ptr service;
tie(host, service) = GetHostService(checkable);
if (host && !service && (!checkable->GetEnableActiveChecks() || !IcingaApplication::GetInstance()->GetEnableHostChecks())) {
Log(LogNotice, "CheckerComponent", "Skipping check for host '" + host->GetName() + "': active host checks are disabled");
check = false;
}
if (host && service && (!checkable->GetEnableActiveChecks() || !IcingaApplication::GetInstance()->GetEnableServiceChecks())) {
Log(LogNotice, "CheckerComponent", "Skipping check for service '" + service->GetName() + "': active service checks are disabled");
2013-03-13 16:04:53 +01:00
check = false;
}
2014-04-05 19:02:45 +02:00
TimePeriod::Ptr tp = checkable->GetCheckPeriod();
2013-03-13 16:04:53 +01:00
if (tp && !tp->IsInside(Utility::GetTime())) {
Log(LogNotice, "CheckerComponent", "Skipping check for object '" + checkable->GetName() + "': not in check_period");
2013-03-13 16:04:53 +01:00
check = false;
}
}
2014-04-05 19:02:45 +02:00
/* reschedule the checkable if checks are disabled */
2013-03-13 16:04:53 +01:00
if (!check) {
2014-04-05 19:02:45 +02:00
m_IdleCheckables.insert(checkable);
lock.unlock();
2014-04-05 19:02:45 +02:00
checkable->UpdateNextCheck();
lock.lock();
2013-03-02 09:07:47 +01:00
continue;
}
2014-04-05 19:02:45 +02:00
m_PendingCheckables.insert(checkable);
lock.unlock();
if (forced) {
2014-04-05 19:02:45 +02:00
ObjectLock olock(checkable);
checkable->SetForceNextCheck(false);
2013-03-04 15:52:42 +01:00
}
Log(LogDebug, "CheckerComponent", "Executing check for '" + checkable->GetName() + "'");
2012-06-17 20:35:56 +02:00
2013-03-25 18:36:15 +01:00
CheckerComponent::Ptr self = GetSelf();
Utility::QueueAsyncCallback(boost::bind(&CheckerComponent::ExecuteCheckHelper, self, checkable));
lock.lock();
}
2012-06-14 11:23:25 +02:00
}
2014-04-05 19:02:45 +02:00
/**
 * Runs the check for a single checkable and returns it to the idle set.
 *
 * If ExecuteCheck() throws a std::exception, a check result with state
 * ServiceUnknown is generated whose output contains the diagnostic
 * information of the exception, and the problem is logged as critical.
 * Afterwards the checkable is removed from m_PendingCheckables and, if it is
 * still active, re-inserted into m_IdleCheckables.
 *
 * @param checkable The object whose check is executed.
 */
void CheckerComponent::ExecuteCheckHelper(const Checkable::Ptr& checkable)
{
	try {
		checkable->ExecuteCheck();
	} catch (const std::exception& ex) {
		CheckResult::Ptr cr = make_shared<CheckResult>();
		cr->SetState(ServiceUnknown);

		String output = "Exception occured while checking '" + checkable->GetName() + "': " + DiagnosticInformation(ex);
		cr->SetOutput(output);

		/* No check actually ran, so all timestamps collapse to "now". */
		double now = Utility::GetTime();
		cr->SetScheduleStart(now);
		cr->SetScheduleEnd(now);
		cr->SetExecutionStart(now);
		cr->SetExecutionEnd(now);

		checkable->ProcessCheckResult(cr);

		/* Use the same log facility as every other message of this component. */
		Log(LogCritical, "CheckerComponent", output);
	}

	{
		boost::mutex::scoped_lock lock(m_Mutex);

		/* remove the object from the list of pending objects; if it's not in the
		 * list this was a manual (i.e. forced) check and we must not re-add the
		 * object to the list because it's already there. */
		CheckerComponent::CheckableSet::iterator it;
		it = m_PendingCheckables.find(checkable);

		if (it != m_PendingCheckables.end()) {
			m_PendingCheckables.erase(it);

			/* Objects that were deactivated in the meantime are dropped. */
			if (checkable->IsActive())
				m_IdleCheckables.insert(checkable);

			/* Wake the scheduler thread so it re-evaluates the idle set. */
			m_CV.notify_all();
		}
	}

	Log(LogDebug, "CheckerComponent", "Check finished for object '" + checkable->GetName() + "'");
}
2012-06-20 15:23:31 +02:00
void CheckerComponent::ResultTimerHandler(void)
{
2013-03-16 21:18:53 +01:00
std::ostringstream msgbuf;
2013-02-17 19:14:34 +01:00
{
boost::mutex::scoped_lock lock(m_Mutex);
msgbuf << "Pending checkables: " << m_PendingCheckables.size() << "; Idle checkables: " << m_IdleCheckables.size() << "; Checks/s: "
<< (CIB::GetActiveHostChecksStatistics(5) + CIB::GetActiveServiceChecksStatistics(5)) / 5.0;
2013-02-17 19:14:34 +01:00
}
Log(LogNotice, "CheckerComponent", msgbuf.str());
2012-06-17 20:35:56 +02:00
}
/**
 * Reacts to a lifecycle change (started, stopped, paused, resumed) of an
 * object.
 *
 * Objects that are not checkables are ignored. A checkable that is active,
 * not paused and either has no resolvable zone or belongs to the local zone
 * is put into the idle set unless its check is currently pending; any other
 * checkable is removed from both the idle and the pending set.
 *
 * @param object The object whose state changed.
 */
void CheckerComponent::ObjectHandler(const DynamicObject::Ptr& object)
{
	bool isCheckable = Type::GetByName("Checkable")->IsAssignableFrom(object->GetReflectionType());

	if (!isCheckable)
		return;

	Checkable::Ptr checkable = static_pointer_cast<Checkable>(object);

	/* A checkable without a resolvable zone counts as local. */
	Zone::Ptr zone = Zone::GetByName(checkable->GetZone());
	bool same_zone = true;

	if (zone)
		same_zone = (Zone::GetLocalZone() == zone);

	boost::mutex::scoped_lock guard(m_Mutex);

	bool schedulable = object->IsActive() && !object->IsPaused() && same_zone;

	if (!schedulable) {
		m_IdleCheckables.erase(checkable);
		m_PendingCheckables.erase(checkable);
	} else {
		/* A check that is currently executing is left alone; ExecuteCheckHelper
		 * re-inserts the checkable once the check has finished. */
		if (m_PendingCheckables.find(checkable) != m_PendingCheckables.end())
			return;

		m_IdleCheckables.insert(checkable);
	}

	/* Let the scheduler thread re-evaluate the idle set. */
	m_CV.notify_all();
}
2014-04-05 19:02:45 +02:00
/**
 * Reacts to a changed next check time of a checkable.
 *
 * If the checkable is currently in the idle set it is removed and inserted
 * again so that the set's indices are rebuilt for it, and the scheduler
 * thread is woken up. Checkables that are not in the idle set are ignored.
 *
 * @param checkable The object whose next check time changed.
 */
void CheckerComponent::NextCheckChangedHandler(const Checkable::Ptr& checkable)
{
	boost::mutex::scoped_lock guard(m_Mutex);

	typedef boost::multi_index::nth_index<CheckableSet, 0>::type CheckableView;
	CheckableView& byObject = boost::get<0>(m_IdleCheckables);

	/* Nothing to do for objects that are not scheduled by us right now. */
	if (byObject.find(checkable) == byObject.end())
		return;

	/* remove and re-insert the object from the set in order to force an index update */
	byObject.erase(checkable);
	byObject.insert(checkable);

	m_CV.notify_all();
}
2014-04-03 15:36:13 +02:00
unsigned long CheckerComponent::GetIdleCheckables(void)
{
boost::mutex::scoped_lock lock(m_Mutex);
2014-04-03 15:36:13 +02:00
return m_IdleCheckables.size();
}
2014-04-03 15:36:13 +02:00
unsigned long CheckerComponent::GetPendingCheckables(void)
{
boost::mutex::scoped_lock lock(m_Mutex);
2014-04-03 15:36:13 +02:00
return m_PendingCheckables.size();
}