/****************************************************************************** * Icinga 2 * * Copyright (C) 2012 Icinga Development Team (http://www.icinga.org/) * * * * This program is free software; you can redistribute it and/or * * modify it under the terms of the GNU General Public License * * as published by the Free Software Foundation; either version 2 * * of the License, or (at your option) any later version. * * * * This program is distributed in the hope that it will be useful, * * but WITHOUT ANY WARRANTY; without even the implied warranty of * * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * * GNU General Public License for more details. * * * * You should have received a copy of the GNU General Public License * * along with this program; if not, write to the Free Software Foundation * * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA. * ******************************************************************************/ #include "i2-checker.h" using namespace icinga; string CheckerComponent::GetName(void) const { return "checker"; } void CheckerComponent::Start(void) { m_CheckerEndpoint = boost::make_shared(); m_CheckerEndpoint->RegisterTopicHandler("checker::AssignService", boost::bind(&CheckerComponent::AssignServiceRequestHandler, this, _2, _3)); m_CheckerEndpoint->RegisterTopicHandler("checker::ClearServices", boost::bind(&CheckerComponent::ClearServicesRequestHandler, this, _2, _3)); m_CheckerEndpoint->RegisterPublication("checker::CheckResult"); GetEndpointManager()->RegisterEndpoint(m_CheckerEndpoint); m_CheckTimer = boost::make_shared(); m_CheckTimer->SetInterval(5); m_CheckTimer->OnTimerExpired.connect(boost::bind(&CheckerComponent::CheckTimerHandler, this)); m_CheckTimer->Start(); CheckTask::RegisterType("nagios", NagiosCheckTask::CreateTask, NagiosCheckTask::FlushQueue, NagiosCheckTask::GetFinishedTasks); m_ResultTimer = boost::make_shared(); m_ResultTimer->SetInterval(5); m_ResultTimer->OnTimerExpired.connect(boost::bind(&CheckerComponent::ResultTimerHandler, this)); m_ResultTimer->Start(); } void CheckerComponent::Stop(void) { EndpointManager::Ptr mgr = GetEndpointManager(); if (mgr) mgr->UnregisterEndpoint(m_CheckerEndpoint); } void CheckerComponent::CheckTimerHandler(void) { time_t now; time(&now); Application::Log(LogDebug, "checker", "CheckTimerHandler entered."); long tasks = 0; while (!m_Services.empty()) { Service service = m_Services.top(); if (service.GetNextCheck() > now) break; m_Services.pop(); Application::Log(LogDebug, "checker", "Executing service check for '" + service.GetName() + "'"); m_PendingServices.insert(service.GetConfigObject()); CheckTask::Ptr task = CheckTask::CreateTask(service); task->Enqueue(); tasks++; } Application::Log(LogDebug, "checker", "CheckTimerHandler: past loop."); CheckTask::FlushQueue(); stringstream msgbuf; msgbuf << "CheckTimerHandler: created " << tasks << " tasks"; Application::Log(LogInformation, "checker", msgbuf.str()); } void CheckerComponent::ResultTimerHandler(void) { Application::Log(LogDebug, "checker", "ResultTimerHandler entered."); time_t now; time(&now); long min_latency = -1, max_latency = 0, avg_latency = 0, results = 0, failed = 0; vector finishedTasks = CheckTask::GetFinishedTasks(); for (vector::iterator it = finishedTasks.begin(); it != finishedTasks.end(); it++) { CheckTask::Ptr task = *it; Service service = task->GetService(); /* if the service isn't in the set of pending services * it was removed and we need to ignore this check result. */ if (m_PendingServices.find(service.GetConfigObject()) == m_PendingServices.end()) continue; CheckResult result = task->GetResult(); Application::Log(LogDebug, "checker", "Got result for service '" + service.GetName() + "'"); long latency = result.EndTime - result.StartTime; avg_latency += latency; if (min_latency == -1 || latency < min_latency) min_latency = latency; if (latency > max_latency) max_latency = latency; results++; if (result.State != StateOK) failed++; service.SetNextCheck(now + service.GetCheckInterval()); m_PendingServices.erase(service.GetConfigObject()); m_Services.push(service); } if (min_latency > 5) { stringstream latwarn; latwarn << "We can't keep up with the checks: minimum latency is " << min_latency << " seconds"; Application::Log(LogWarning, "checker", latwarn.str()); } { stringstream msgbuf; msgbuf << "ResultTimerHandler: " << results << " results (" << failed << " failed); latency: avg=" << avg_latency / (results ? results : 1) << ", min=" << min_latency << ", max: " << max_latency; Application::Log(LogInformation, "checker", msgbuf.str()); } { stringstream msgbuf; msgbuf << "Pending services: " << m_PendingServices.size() << "; Idle services: " << m_Services.size(); Application::Log(LogInformation, "checker", msgbuf.str()); } } void CheckerComponent::AssignServiceRequestHandler(const Endpoint::Ptr& sender, const RequestMessage& request) { MessagePart params; if (!request.GetParams(¶ms)) return; MessagePart serviceMsg; if (!params.GetProperty("service", &serviceMsg)) return; ConfigObject::Ptr object = boost::make_shared(serviceMsg.GetDictionary()); Service service(object); m_Services.push(service); Application::Log(LogDebug, "checker", "Accepted delegation for service '" + service.GetName() + "'"); string id; if (request.GetID(&id)) { ResponseMessage rm; rm.SetID(id); MessagePart result; rm.SetResult(result); GetEndpointManager()->SendUnicastMessage(m_CheckerEndpoint, sender, rm); } } void CheckerComponent::ClearServicesRequestHandler(const Endpoint::Ptr& sender, const RequestMessage& request) { Application::Log(LogInformation, "checker", "Clearing service delegations."); /* clear the services lists */ m_Services = ServiceQueue(); m_PendingServices.clear(); /* TODO: clear checks we've already sent to the thread pool */ } EXPORT_COMPONENT(checker, CheckerComponent);