2019-02-25 14:48:22 +01:00
|
|
|
/* Icinga 2 | (c) 2012 Icinga GmbH | GPLv2+ */
|
2017-09-07 15:11:57 +02:00
|
|
|
|
2017-11-09 14:05:10 +01:00
|
|
|
#include "perfdata/elasticsearchwriter.hpp"
|
2018-01-18 13:50:38 +01:00
|
|
|
#include "perfdata/elasticsearchwriter-ti.cpp"
|
2017-09-07 15:11:57 +02:00
|
|
|
#include "remote/url.hpp"
|
|
|
|
#include "icinga/compatutility.hpp"
|
|
|
|
#include "icinga/service.hpp"
|
|
|
|
#include "icinga/checkcommand.hpp"
|
2019-04-23 13:15:38 +02:00
|
|
|
#include "base/application.hpp"
|
2019-03-15 13:15:24 +01:00
|
|
|
#include "base/defer.hpp"
|
2019-04-23 13:15:38 +02:00
|
|
|
#include "base/io-engine.hpp"
|
2017-09-07 15:11:57 +02:00
|
|
|
#include "base/tcpsocket.hpp"
|
|
|
|
#include "base/stream.hpp"
|
2017-09-11 17:00:33 +02:00
|
|
|
#include "base/base64.hpp"
|
2017-09-07 15:11:57 +02:00
|
|
|
#include "base/json.hpp"
|
|
|
|
#include "base/utility.hpp"
|
|
|
|
#include "base/networkstream.hpp"
|
|
|
|
#include "base/perfdatavalue.hpp"
|
|
|
|
#include "base/exception.hpp"
|
|
|
|
#include "base/statsfunction.hpp"
|
|
|
|
#include <boost/algorithm/string.hpp>
|
2019-04-23 13:15:38 +02:00
|
|
|
#include <boost/asio/ssl/context.hpp>
|
|
|
|
#include <boost/beast/core/flat_buffer.hpp>
|
|
|
|
#include <boost/beast/http/field.hpp>
|
|
|
|
#include <boost/beast/http/message.hpp>
|
|
|
|
#include <boost/beast/http/parser.hpp>
|
|
|
|
#include <boost/beast/http/read.hpp>
|
|
|
|
#include <boost/beast/http/status.hpp>
|
|
|
|
#include <boost/beast/http/string_body.hpp>
|
|
|
|
#include <boost/beast/http/verb.hpp>
|
|
|
|
#include <boost/beast/http/write.hpp>
|
2017-11-21 11:52:55 +01:00
|
|
|
#include <boost/scoped_array.hpp>
|
2019-04-23 13:15:38 +02:00
|
|
|
#include <memory>
|
|
|
|
#include <string>
|
2018-01-04 08:54:18 +01:00
|
|
|
#include <utility>
|
2017-09-07 15:11:57 +02:00
|
|
|
|
|
|
|
using namespace icinga;
|
|
|
|
|
2017-11-09 14:05:10 +01:00
|
|
|
/* Register the ElasticsearchWriter class via the project's REGISTER_TYPE macro
 * (presumably with the runtime type registry -- confirm against the macro definition). */
REGISTER_TYPE(ElasticsearchWriter);
|
2017-09-07 15:11:57 +02:00
|
|
|
|
2017-11-09 14:05:10 +01:00
|
|
|
/* Expose ElasticsearchWriter::StatsFunc under the name "ElasticsearchWriter"
 * (presumably to the stats/status framework -- confirm against the macro definition). */
REGISTER_STATSFUNCTION(ElasticsearchWriter, &ElasticsearchWriter::StatsFunc);
|
2017-09-07 15:11:57 +02:00
|
|
|
|
2018-01-04 04:25:35 +01:00
|
|
|
void ElasticsearchWriter::OnConfigLoaded()
|
2017-09-07 15:11:57 +02:00
|
|
|
{
|
2017-11-09 14:05:10 +01:00
|
|
|
ObjectImpl<ElasticsearchWriter>::OnConfigLoaded();
|
2017-09-07 15:11:57 +02:00
|
|
|
|
2017-11-09 14:05:10 +01:00
|
|
|
m_WorkQueue.SetName("ElasticsearchWriter, " + GetName());
|
2018-10-24 13:20:03 +02:00
|
|
|
|
|
|
|
if (!GetEnableHa()) {
|
|
|
|
Log(LogDebug, "ElasticsearchWriter")
|
|
|
|
<< "HA functionality disabled. Won't pause connection: " << GetName();
|
|
|
|
|
|
|
|
SetHAMode(HARunEverywhere);
|
|
|
|
} else {
|
|
|
|
SetHAMode(HARunOnce);
|
|
|
|
}
|
2017-09-07 15:11:57 +02:00
|
|
|
}
|
|
|
|
|
2017-11-09 14:05:10 +01:00
|
|
|
/**
 * Collects work queue statistics for every ElasticsearchWriter object.
 *
 * @param status   Receives an "elasticsearchwriter" dictionary holding one
 *                 entry per writer (queue length and item rate).
 * @param perfdata Receives two PerfdataValue objects per writer.
 */
void ElasticsearchWriter::StatsFunc(const Dictionary::Ptr& status, const Array::Ptr& perfdata)
{
	DictionaryData perWriterStats;

	for (const ElasticsearchWriter::Ptr& writer : ConfigType::GetObjectsByType<ElasticsearchWriter>()) {
		size_t pendingItems = writer->m_WorkQueue.GetLength();
		/* Task count over a 60 second window, expressed per second. */
		double itemRate = writer->m_WorkQueue.GetTaskCount(60) / 60.0;

		perWriterStats.emplace_back(writer->GetName(), new Dictionary({
			{ "work_queue_items", pendingItems },
			{ "work_queue_item_rate", itemRate }
		}));

		String metricPrefix = "elasticsearchwriter_" + writer->GetName();

		perfdata->Add(new PerfdataValue(metricPrefix + "_work_queue_items", pendingItems));
		perfdata->Add(new PerfdataValue(metricPrefix + "_work_queue_item_rate", itemRate));
	}

	status->Set("elasticsearchwriter", new Dictionary(std::move(perWriterStats)));
}
|
|
|
|
|
2018-10-24 13:20:03 +02:00
|
|
|
void ElasticsearchWriter::Resume()
|
2017-09-07 15:11:57 +02:00
|
|
|
{
|
2018-10-24 13:20:03 +02:00
|
|
|
ObjectImpl<ElasticsearchWriter>::Resume();
|
2017-09-07 15:11:57 +02:00
|
|
|
|
|
|
|
m_EventPrefix = "icinga2.event.";
|
|
|
|
|
2017-12-19 15:50:05 +01:00
|
|
|
Log(LogInformation, "ElasticsearchWriter")
|
2018-10-24 13:20:03 +02:00
|
|
|
<< "'" << GetName() << "' resumed.";
|
2017-09-07 15:11:57 +02:00
|
|
|
|
2017-11-21 11:52:55 +01:00
|
|
|
m_WorkQueue.SetExceptionCallback(std::bind(&ElasticsearchWriter::ExceptionHandler, this, _1));
|
2017-09-07 15:11:57 +02:00
|
|
|
|
|
|
|
/* Setup timer for periodically flushing m_DataBuffer */
|
|
|
|
m_FlushTimer = new Timer();
|
|
|
|
m_FlushTimer->SetInterval(GetFlushInterval());
|
2017-11-21 11:52:55 +01:00
|
|
|
m_FlushTimer->OnTimerExpired.connect(std::bind(&ElasticsearchWriter::FlushTimeout, this));
|
2017-09-07 15:11:57 +02:00
|
|
|
m_FlushTimer->Start();
|
|
|
|
m_FlushTimer->Reschedule(0);
|
|
|
|
|
|
|
|
/* Register for new metrics. */
|
2017-11-21 11:52:55 +01:00
|
|
|
Checkable::OnNewCheckResult.connect(std::bind(&ElasticsearchWriter::CheckResultHandler, this, _1, _2));
|
|
|
|
Checkable::OnStateChange.connect(std::bind(&ElasticsearchWriter::StateChangeHandler, this, _1, _2, _3));
|
|
|
|
Checkable::OnNotificationSentToAllUsers.connect(std::bind(&ElasticsearchWriter::NotificationSentToAllUsersHandler, this, _1, _2, _3, _4, _5, _6, _7));
|
2017-09-07 15:11:57 +02:00
|
|
|
}
|
|
|
|
|
2019-02-20 17:11:39 +01:00
|
|
|
/* Pause is equivalent to Stop, but with HA capabilities to resume at runtime. */
|
2018-10-24 13:20:03 +02:00
|
|
|
void ElasticsearchWriter::Pause()
|
2017-09-07 15:11:57 +02:00
|
|
|
{
|
2019-02-20 17:11:39 +01:00
|
|
|
Flush();
|
|
|
|
m_WorkQueue.Join();
|
|
|
|
Flush();
|
|
|
|
|
2017-11-09 14:05:10 +01:00
|
|
|
Log(LogInformation, "ElasticsearchWriter")
|
2018-10-24 13:20:03 +02:00
|
|
|
<< "'" << GetName() << "' paused.";
|
2017-09-07 15:11:57 +02:00
|
|
|
|
2018-10-24 13:20:03 +02:00
|
|
|
ObjectImpl<ElasticsearchWriter>::Pause();
|
2017-09-07 15:11:57 +02:00
|
|
|
}
|
|
|
|
|
2017-11-09 14:05:10 +01:00
|
|
|
/**
 * Adds the attributes of a check result to an event document.
 *
 * All keys are prefixed with "check_result.". Performance data is only
 * added when GetEnableSendPerfdata() returns true.
 *
 * @param fields    Dictionary receiving the attributes.
 * @param checkable Checkable the result belongs to (used for logging).
 * @param cr        Check result to serialize; must not be null.
 */
void ElasticsearchWriter::AddCheckResult(const Dictionary::Ptr& fields, const Checkable::Ptr& checkable, const CheckResult::Ptr& cr)
{
	String prefix = "check_result.";

	fields->Set(prefix + "output", cr->GetOutput());
	fields->Set(prefix + "check_source", cr->GetCheckSource());
	fields->Set(prefix + "exit_status", cr->GetExitStatus());
	fields->Set(prefix + "command", cr->GetCommand());
	fields->Set(prefix + "state", cr->GetState());
	fields->Set(prefix + "vars_before", cr->GetVarsBefore());
	fields->Set(prefix + "vars_after", cr->GetVarsAfter());

	fields->Set(prefix + "execution_start", FormatTimestamp(cr->GetExecutionStart()));
	fields->Set(prefix + "execution_end", FormatTimestamp(cr->GetExecutionEnd()));
	fields->Set(prefix + "schedule_start", FormatTimestamp(cr->GetScheduleStart()));
	fields->Set(prefix + "schedule_end", FormatTimestamp(cr->GetScheduleEnd()));

	/* Add extra calculated field. */
	fields->Set(prefix + "latency", cr->CalculateLatency());
	fields->Set(prefix + "execution_time", cr->CalculateExecutionTime());

	if (!GetEnableSendPerfdata())
		return;

	Array::Ptr perfdata = cr->GetPerformanceData();

	if (!perfdata)
		return;

	/* May be null; the other handlers in this file guard against that too. */
	CheckCommand::Ptr checkCommand = checkable->GetCheckCommand();

	ObjectLock olock(perfdata);

	for (const Value& val : perfdata) {
		PerfdataValue::Ptr pdv;

		if (val.IsObjectType<PerfdataValue>()) {
			pdv = val;
		} else {
			/* Anything that is not a PerfdataValue object is parsed; unparsable entries are skipped. */
			try {
				pdv = PerfdataValue::Parse(val);
			} catch (const std::exception&) {
				Log(LogWarning, "ElasticsearchWriter")
					<< "Ignoring invalid perfdata for checkable '"
					<< checkable->GetName() << "' and command '"
					<< (checkCommand ? checkCommand->GetName() : String("<unknown>"))
					<< "' with value: " << val;
				continue;
			}
		}

		/* Spaces, dots and backslashes in the label become underscores;
		 * "::" becomes a dot afterwards.
		 */
		String escapedKey = pdv->GetLabel();
		boost::replace_all(escapedKey, " ", "_");
		boost::replace_all(escapedKey, ".", "_");
		boost::replace_all(escapedKey, "\\", "_");
		boost::algorithm::replace_all(escapedKey, "::", ".");

		String perfdataPrefix = prefix + "perfdata." + escapedKey;

		fields->Set(perfdataPrefix + ".value", pdv->GetValue());

		/* Optional attributes are only sent when they are set. */
		if (!pdv->GetMin().IsEmpty())
			fields->Set(perfdataPrefix + ".min", pdv->GetMin());
		if (!pdv->GetMax().IsEmpty())
			fields->Set(perfdataPrefix + ".max", pdv->GetMax());
		if (!pdv->GetWarn().IsEmpty())
			fields->Set(perfdataPrefix + ".warn", pdv->GetWarn());
		if (!pdv->GetCrit().IsEmpty())
			fields->Set(perfdataPrefix + ".crit", pdv->GetCrit());

		if (!pdv->GetUnit().IsEmpty())
			fields->Set(perfdataPrefix + ".unit", pdv->GetUnit());
	}
}
|
|
|
|
|
2017-11-09 14:05:10 +01:00
|
|
|
/**
 * Signal handler for new check results. Does nothing while the object is
 * paused; otherwise hands the event over to the work queue.
 */
void ElasticsearchWriter::CheckResultHandler(const Checkable::Ptr& checkable, const CheckResult::Ptr& cr)
{
	if (!IsPaused()) {
		m_WorkQueue.Enqueue(std::bind(&ElasticsearchWriter::InternalCheckResultHandler, this, checkable, cr));
	}
}
|
|
|
|
|
2017-11-09 14:05:10 +01:00
|
|
|
/**
 * Builds a "checkresult" event for the given checkable and buffers it.
 * Must run on the work queue thread.
 *
 * Nothing is sent when perfdata is disabled either globally or for the
 * checkable itself.
 */
void ElasticsearchWriter::InternalCheckResultHandler(const Checkable::Ptr& checkable, const CheckResult::Ptr& cr)
{
	AssertOnWorkQueue();

	CONTEXT("Elasticwriter processing check result for '" + checkable->GetName() + "'");

	bool perfdataEnabled = IcingaApplication::GetInstance()->GetEnablePerfdata() && checkable->GetEnablePerfdata();

	if (!perfdataEnabled)
		return;

	Host::Ptr host;
	Service::Ptr service;
	tie(host, service) = GetHostService(checkable);

	Dictionary::Ptr fields = new Dictionary();

	/* State attributes come from the service if there is one, else from the host. */
	if (!service) {
		fields->Set("state", host->GetState());
		fields->Set("last_state", host->GetLastState());
		fields->Set("last_hard_state", host->GetLastHardState());
	} else {
		fields->Set("service", service->GetShortName());
		fields->Set("state", service->GetState());
		fields->Set("last_state", service->GetLastState());
		fields->Set("last_hard_state", service->GetLastHardState());
	}

	fields->Set("host", host->GetName());
	fields->Set("state_type", checkable->GetStateType());

	fields->Set("current_check_attempt", checkable->GetCheckAttempt());
	fields->Set("max_check_attempts", checkable->GetMaxCheckAttempts());

	fields->Set("reachable", checkable->IsReachable());

	CheckCommand::Ptr commandObj = checkable->GetCheckCommand();

	if (commandObj) {
		fields->Set("check_command", commandObj->GetName());
	}

	/* The event is stamped with the execution end of the check result, or
	 * with the current time if there is no check result.
	 */
	double ts;

	if (cr) {
		AddCheckResult(fields, checkable, cr);
		ts = cr->GetExecutionEnd();
	} else {
		ts = Utility::GetTime();
	}

	Enqueue(checkable, "checkresult", fields, ts);
}
|
|
|
|
|
2017-11-09 14:05:10 +01:00
|
|
|
/**
 * Signal handler for state changes. Does nothing while the object is
 * paused; otherwise hands the event over to the work queue.
 */
void ElasticsearchWriter::StateChangeHandler(const Checkable::Ptr& checkable, const CheckResult::Ptr& cr, StateType type)
{
	if (!IsPaused()) {
		m_WorkQueue.Enqueue(std::bind(&ElasticsearchWriter::StateChangeHandlerInternal, this, checkable, cr, type));
	}
}
|
|
|
|
|
2017-11-09 14:05:10 +01:00
|
|
|
/**
 * Builds a "statechange" event for the given checkable and buffers it.
 * Must run on the work queue thread. The state type argument is not used
 * by this function.
 */
void ElasticsearchWriter::StateChangeHandlerInternal(const Checkable::Ptr& checkable, const CheckResult::Ptr& cr, StateType type)
{
	AssertOnWorkQueue();

	CONTEXT("Elasticwriter processing state change '" + checkable->GetName() + "'");

	Host::Ptr host;
	Service::Ptr service;
	tie(host, service) = GetHostService(checkable);

	Dictionary::Ptr fields = new Dictionary();

	fields->Set("current_check_attempt", checkable->GetCheckAttempt());
	fields->Set("max_check_attempts", checkable->GetMaxCheckAttempts());
	fields->Set("host", host->GetName());

	/* State attributes come from the service if there is one, else from the host. */
	if (!service) {
		fields->Set("state", host->GetState());
		fields->Set("last_state", host->GetLastState());
		fields->Set("last_hard_state", host->GetLastHardState());
	} else {
		fields->Set("service", service->GetShortName());
		fields->Set("state", service->GetState());
		fields->Set("last_state", service->GetLastState());
		fields->Set("last_hard_state", service->GetLastHardState());
	}

	CheckCommand::Ptr commandObj = checkable->GetCheckCommand();

	if (commandObj) {
		fields->Set("check_command", commandObj->GetName());
	}

	/* The event is stamped with the execution end of the check result, or
	 * with the current time if there is no check result.
	 */
	double ts;

	if (cr) {
		AddCheckResult(fields, checkable, cr);
		ts = cr->GetExecutionEnd();
	} else {
		ts = Utility::GetTime();
	}

	Enqueue(checkable, "statechange", fields, ts);
}
|
|
|
|
|
2017-11-09 14:05:10 +01:00
|
|
|
/**
 * Signal handler for sent notifications. Does nothing while the object is
 * paused; otherwise hands the event over to the work queue.
 */
void ElasticsearchWriter::NotificationSentToAllUsersHandler(const Notification::Ptr& notification,
	const Checkable::Ptr& checkable, const std::set<User::Ptr>& users, NotificationType type,
	const CheckResult::Ptr& cr, const String& author, const String& text)
{
	if (!IsPaused()) {
		m_WorkQueue.Enqueue(std::bind(&ElasticsearchWriter::NotificationSentToAllUsersHandlerInternal, this,
			notification, checkable, users, type, cr, author, text));
	}
}
|
|
|
|
|
2017-11-09 14:05:10 +01:00
|
|
|
/**
 * Builds a "notification" event for the given checkable and buffers it.
 * Must run on the work queue thread.
 *
 * The event carries the names of all notified users, the notification
 * type, author and text in addition to the host/service state.
 */
void ElasticsearchWriter::NotificationSentToAllUsersHandlerInternal(const Notification::Ptr& notification,
	const Checkable::Ptr& checkable, const std::set<User::Ptr>& users, NotificationType type,
	const CheckResult::Ptr& cr, const String& author, const String& text)
{
	AssertOnWorkQueue();

	CONTEXT("Elasticwriter processing notification to all users '" + checkable->GetName() + "'");

	Log(LogDebug, "ElasticsearchWriter")
		<< "Processing notification for '" << checkable->GetName() << "'";

	Host::Ptr host;
	Service::Ptr service;
	tie(host, service) = GetHostService(checkable);

	Dictionary::Ptr fields = new Dictionary();

	/* State attributes come from the service if there is one, else from the host. */
	if (!service) {
		fields->Set("state", host->GetState());
		fields->Set("last_state", host->GetLastState());
		fields->Set("last_hard_state", host->GetLastHardState());
	} else {
		fields->Set("service", service->GetShortName());
		fields->Set("state", service->GetState());
		fields->Set("last_state", service->GetLastState());
		fields->Set("last_hard_state", service->GetLastHardState());
	}

	fields->Set("host", host->GetName());

	ArrayData notifiedUsers;

	for (const User::Ptr& user : users) {
		notifiedUsers.push_back(user->GetName());
	}

	fields->Set("users", new Array(std::move(notifiedUsers)));

	//TODO: Change that to our own types.
	fields->Set("notification_type", Notification::NotificationTypeToStringCompat(type));
	fields->Set("author", author);
	fields->Set("text", text);

	CheckCommand::Ptr commandObj = checkable->GetCheckCommand();

	if (commandObj) {
		fields->Set("check_command", commandObj->GetName());
	}

	/* The event is stamped with the execution end of the check result, or
	 * with the current time if there is no check result.
	 */
	double ts;

	if (cr) {
		AddCheckResult(fields, checkable, cr);
		ts = cr->GetExecutionEnd();
	} else {
		ts = Utility::GetTime();
	}

	Enqueue(checkable, "notification", fields, ts);
}
|
|
|
|
|
2019-03-19 09:01:12 +01:00
|
|
|
/**
 * Finalizes an event document and appends it to the data buffer.
 *
 * @param checkable Checkable the event belongs to (used for logging).
 * @param type      Event type; appended to m_EventPrefix.
 * @param fields    Event attributes; timestamp and type fields are added here.
 * @param ts        Event timestamp passed to FormatTimestamp().
 */
void ElasticsearchWriter::Enqueue(const Checkable::Ptr& checkable, const String& type,
	const Dictionary::Ptr& fields, double ts)
{
	/* Buffer the data point atomically with regard to other buffer users. */
	boost::mutex::scoped_lock lock(m_DataBufferMutex);

	/* Formatted timestamps let the index dynamically select the date datatype. */
	String formattedTs = FormatTimestamp(ts);
	fields->Set("@timestamp", formattedTs);
	fields->Set("timestamp", formattedTs);

	fields->Set("type", m_EventPrefix + type);

	/* Every payload needs a line describing the index.
	 * We do it this way to avoid problems with a near full queue.
	 */
	const String indexLine = "{\"index\": {} }\n";
	String document = JsonEncode(fields);

	Log(LogDebug, "ElasticsearchWriter")
		<< "Checkable '" << checkable->GetName() << "' adds to metric list: '" << document << "'.";

	m_DataBuffer.emplace_back(indexLine + document);

	/* Only flush once the threshold is reached, to bound memory use. */
	if (static_cast<int>(m_DataBuffer.size()) < GetFlushThreshold())
		return;

	Log(LogDebug, "ElasticsearchWriter")
		<< "Data buffer overflow writing " << m_DataBuffer.size() << " data points";

	Flush();
}
|
|
|
|
|
2018-01-04 04:25:35 +01:00
|
|
|
void ElasticsearchWriter::FlushTimeout()
|
2017-09-07 15:11:57 +02:00
|
|
|
{
|
|
|
|
/* Prevent new data points from being added to the array, there is a
|
|
|
|
* race condition where they could disappear.
|
|
|
|
*/
|
|
|
|
boost::mutex::scoped_lock lock(m_DataBufferMutex);
|
|
|
|
|
|
|
|
/* Flush if there are any data available. */
|
|
|
|
if (m_DataBuffer.size() > 0) {
|
2017-11-09 14:05:10 +01:00
|
|
|
Log(LogDebug, "ElasticsearchWriter")
|
2017-12-19 15:50:05 +01:00
|
|
|
<< "Timer expired writing " << m_DataBuffer.size() << " data points";
|
2017-09-07 15:11:57 +02:00
|
|
|
Flush();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-01-04 04:25:35 +01:00
|
|
|
void ElasticsearchWriter::Flush()
|
2017-09-07 15:11:57 +02:00
|
|
|
{
|
2019-03-27 11:35:41 +01:00
|
|
|
/* Flush can be called from 1) Timeout 2) Threshold 3) on shutdown/reload. */
|
|
|
|
if (m_DataBuffer.empty())
|
|
|
|
return;
|
|
|
|
|
2017-09-07 15:11:57 +02:00
|
|
|
/* Ensure you hold a lock against m_DataBuffer so that things
|
|
|
|
* don't go missing after creating the body and clearing the buffer.
|
|
|
|
*/
|
|
|
|
String body = boost::algorithm::join(m_DataBuffer, "\n");
|
|
|
|
m_DataBuffer.clear();
|
|
|
|
|
2017-12-07 11:11:03 +01:00
|
|
|
/* Elasticsearch 6.x requires a new line. This is compatible to 5.x.
|
|
|
|
* Tested with 6.0.0 and 5.6.4.
|
|
|
|
*/
|
|
|
|
body += "\n";
|
|
|
|
|
2017-09-07 15:11:57 +02:00
|
|
|
SendRequest(body);
|
|
|
|
}
|
|
|
|
|
2017-11-09 14:05:10 +01:00
|
|
|
void ElasticsearchWriter::SendRequest(const String& body)
|
2017-09-07 15:11:57 +02:00
|
|
|
{
|
2019-04-23 13:15:38 +02:00
|
|
|
namespace beast = boost::beast;
|
|
|
|
namespace http = beast::http;
|
|
|
|
|
2017-09-07 15:11:57 +02:00
|
|
|
Url::Ptr url = new Url();
|
2017-09-11 17:28:41 +02:00
|
|
|
|
|
|
|
url->SetScheme(GetEnableTls() ? "https" : "http");
|
2017-09-07 15:11:57 +02:00
|
|
|
url->SetHost(GetHost());
|
|
|
|
url->SetPort(GetPort());
|
|
|
|
|
|
|
|
std::vector<String> path;
|
|
|
|
|
|
|
|
/* Specify the index path. Best practice is a daily rotation.
|
|
|
|
* Example: http://localhost:9200/icinga2-2017.09.11?pretty=1
|
|
|
|
*/
|
2017-11-30 08:19:58 +01:00
|
|
|
path.emplace_back(GetIndex() + "-" + Utility::FormatDateTime("%Y.%m.%d", Utility::GetTime()));
|
2017-09-07 15:11:57 +02:00
|
|
|
|
2018-04-06 15:24:43 +02:00
|
|
|
/* ES 6 removes multiple _type mappings: https://www.elastic.co/guide/en/elasticsearch/reference/6.x/removal-of-types.html
|
2018-04-11 14:04:39 +02:00
|
|
|
* Best practice is to statically define 'doc', as ES 5.X does not allow types starting with '_'.
|
2018-04-06 15:24:43 +02:00
|
|
|
*/
|
2018-04-11 14:04:39 +02:00
|
|
|
path.emplace_back("doc");
|
2018-04-06 15:24:43 +02:00
|
|
|
|
2017-09-07 15:11:57 +02:00
|
|
|
/* Use the bulk message format. */
|
2017-11-30 08:19:58 +01:00
|
|
|
path.emplace_back("_bulk");
|
2017-09-07 15:11:57 +02:00
|
|
|
|
|
|
|
url->SetPath(path);
|
|
|
|
|
2019-04-23 13:15:38 +02:00
|
|
|
OptionalTlsStream stream;
|
2018-06-21 15:41:40 +02:00
|
|
|
|
|
|
|
try {
|
|
|
|
stream = Connect();
|
|
|
|
} catch (const std::exception& ex) {
|
|
|
|
Log(LogWarning, "ElasticsearchWriter")
|
2018-09-06 15:58:42 +02:00
|
|
|
<< "Flush failed, cannot connect to Elasticsearch: " << DiagnosticInformation(ex, false);
|
2018-06-21 15:41:40 +02:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2019-04-23 13:15:38 +02:00
|
|
|
Defer s ([&stream]() {
|
|
|
|
if (stream.first) {
|
|
|
|
stream.first->next_layer().shutdown();
|
|
|
|
}
|
|
|
|
});
|
2018-06-21 15:41:40 +02:00
|
|
|
|
2019-04-23 13:15:38 +02:00
|
|
|
http::request<http::string_body> request (http::verb::post, std::string(url->Format(true)), 10);
|
2019-03-15 13:15:24 +01:00
|
|
|
|
2019-04-23 13:15:38 +02:00
|
|
|
request.set(http::field::user_agent, "Icinga/" + Application::GetAppVersion());
|
|
|
|
request.set(http::field::host, url->GetHost() + ":" + url->GetPort());
|
2017-09-07 15:11:57 +02:00
|
|
|
|
|
|
|
/* Specify required headers by Elasticsearch. */
|
2019-04-23 13:15:38 +02:00
|
|
|
request.set(http::field::accept, "application/json");
|
2019-03-20 10:13:38 +01:00
|
|
|
|
|
|
|
/* Use application/x-ndjson for bulk streams. While ES
|
|
|
|
* is able to handle application/json, the newline separator
|
|
|
|
* causes problems with Logstash (#6609).
|
|
|
|
*/
|
2019-04-23 13:15:38 +02:00
|
|
|
request.set(http::field::content_type, "application/x-ndjson");
|
2017-09-07 15:11:57 +02:00
|
|
|
|
2017-09-11 17:00:33 +02:00
|
|
|
/* Send authentication if configured. */
|
|
|
|
String username = GetUsername();
|
|
|
|
String password = GetPassword();
|
|
|
|
|
|
|
|
if (!username.IsEmpty() && !password.IsEmpty())
|
2019-04-23 13:15:38 +02:00
|
|
|
request.set(http::field::authorization, "Basic " + Base64::Encode(username + ":" + password));
|
2017-09-11 17:00:33 +02:00
|
|
|
|
2019-04-23 13:15:38 +02:00
|
|
|
request.body() = body;
|
|
|
|
request.set(http::field::content_length, request.body().size());
|
2017-09-07 15:11:57 +02:00
|
|
|
|
2017-09-11 17:28:41 +02:00
|
|
|
/* Don't log the request body to debug log, this is already done above. */
|
2017-11-09 14:05:10 +01:00
|
|
|
Log(LogDebug, "ElasticsearchWriter")
|
2019-04-23 13:15:38 +02:00
|
|
|
<< "Sending " << request.method_string() << " request" << ((!username.IsEmpty() && !password.IsEmpty()) ? " with basic auth" : "" )
|
2017-12-19 15:50:05 +01:00
|
|
|
<< " to '" << url->Format() << "'.";
|
2017-09-07 15:11:57 +02:00
|
|
|
|
|
|
|
try {
|
2019-04-23 13:15:38 +02:00
|
|
|
if (stream.first) {
|
|
|
|
http::write(*stream.first, request);
|
|
|
|
stream.first->flush();
|
|
|
|
} else {
|
|
|
|
http::write(*stream.second, request);
|
|
|
|
stream.second->flush();
|
|
|
|
}
|
|
|
|
} catch (const std::exception&) {
|
2017-11-09 14:05:10 +01:00
|
|
|
Log(LogWarning, "ElasticsearchWriter")
|
2017-09-07 15:11:57 +02:00
|
|
|
<< "Cannot write to HTTP API on host '" << GetHost() << "' port '" << GetPort() << "'.";
|
2019-04-23 13:15:38 +02:00
|
|
|
throw;
|
2017-09-07 15:11:57 +02:00
|
|
|
}
|
|
|
|
|
2019-04-23 13:15:38 +02:00
|
|
|
http::parser<false, http::string_body> parser;
|
|
|
|
beast::flat_buffer buf;
|
2017-09-07 15:11:57 +02:00
|
|
|
|
|
|
|
try {
|
2019-04-23 13:15:38 +02:00
|
|
|
if (stream.first) {
|
|
|
|
http::read(*stream.first, buf, parser);
|
|
|
|
} else {
|
|
|
|
http::read(*stream.second, buf, parser);
|
|
|
|
}
|
2017-09-07 15:11:57 +02:00
|
|
|
} catch (const std::exception& ex) {
|
2017-11-09 14:05:10 +01:00
|
|
|
Log(LogWarning, "ElasticsearchWriter")
|
2017-12-19 15:50:05 +01:00
|
|
|
<< "Failed to parse HTTP response from host '" << GetHost() << "' port '" << GetPort() << "': " << DiagnosticInformation(ex, false);
|
2019-04-23 13:15:38 +02:00
|
|
|
throw;
|
2017-09-07 15:11:57 +02:00
|
|
|
}
|
|
|
|
|
2019-04-23 13:15:38 +02:00
|
|
|
auto& response (parser.get());
|
2017-12-07 11:11:03 +01:00
|
|
|
|
2019-04-23 13:15:38 +02:00
|
|
|
if (response.result_int() > 299) {
|
|
|
|
if (response.result() == http::status::unauthorized) {
|
2017-09-11 17:00:33 +02:00
|
|
|
/* More verbose error logging with Elasticsearch is hidden behind a proxy. */
|
|
|
|
if (!username.IsEmpty() && !password.IsEmpty()) {
|
2017-11-09 14:05:10 +01:00
|
|
|
Log(LogCritical, "ElasticsearchWriter")
|
2017-12-19 15:50:05 +01:00
|
|
|
<< "401 Unauthorized. Please ensure that the user '" << username
|
|
|
|
<< "' is able to authenticate against the HTTP API/Proxy.";
|
2017-09-11 17:00:33 +02:00
|
|
|
} else {
|
2017-11-09 14:05:10 +01:00
|
|
|
Log(LogCritical, "ElasticsearchWriter")
|
2017-12-19 15:50:05 +01:00
|
|
|
<< "401 Unauthorized. The HTTP API requires authentication but no username/password has been configured.";
|
2017-09-11 17:00:33 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2019-03-18 16:41:01 +01:00
|
|
|
std::ostringstream msgbuf;
|
2019-04-23 13:15:38 +02:00
|
|
|
msgbuf << "Unexpected response code " << response.result_int() << " from URL '" << url->Format() << "'";
|
2017-09-07 15:11:57 +02:00
|
|
|
|
2019-04-23 13:15:38 +02:00
|
|
|
auto& contentType (response[http::field::content_type]);
|
2017-09-11 17:00:33 +02:00
|
|
|
|
2019-03-18 16:41:01 +01:00
|
|
|
if (contentType != "application/json" && contentType != "application/json; charset=utf-8") {
|
|
|
|
msgbuf << "; Unexpected Content-Type: '" << contentType << "'";
|
2017-09-07 15:11:57 +02:00
|
|
|
}
|
|
|
|
|
2019-04-23 13:15:38 +02:00
|
|
|
auto& body (response.body());
|
2017-09-07 15:11:57 +02:00
|
|
|
|
2019-03-18 16:41:01 +01:00
|
|
|
#ifdef I2_DEBUG
|
2019-04-23 13:15:38 +02:00
|
|
|
msgbuf << "; Response body: '" << body << "'";
|
2019-03-18 16:41:01 +01:00
|
|
|
#endif /* I2_DEBUG */
|
|
|
|
|
2017-09-07 15:11:57 +02:00
|
|
|
Dictionary::Ptr jsonResponse;
|
2019-04-23 13:15:38 +02:00
|
|
|
|
2017-09-07 15:11:57 +02:00
|
|
|
try {
|
2019-04-23 13:15:38 +02:00
|
|
|
jsonResponse = JsonDecode(body);
|
2017-09-07 15:11:57 +02:00
|
|
|
} catch (...) {
|
2017-11-09 14:05:10 +01:00
|
|
|
Log(LogWarning, "ElasticsearchWriter")
|
2019-04-23 13:15:38 +02:00
|
|
|
<< "Unable to parse JSON response:\n" << body;
|
2017-09-07 15:11:57 +02:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
String error = jsonResponse->Get("error");
|
|
|
|
|
2017-11-09 14:05:10 +01:00
|
|
|
Log(LogCritical, "ElasticsearchWriter")
|
2019-03-18 16:41:01 +01:00
|
|
|
<< "Error: '" << error << "'. " << msgbuf.str();
|
2017-09-07 15:11:57 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-04-23 13:15:38 +02:00
|
|
|
/**
 * Opens a connection to the configured Elasticsearch host and port.
 *
 * With TLS enabled the first member of the returned pair holds the TLS
 * stream (handshake already performed), otherwise the second member holds
 * the plain TCP stream.
 *
 * Failures while creating the SSL context, connecting or handshaking are
 * logged and rethrown.
 *
 * @return The connected stream pair.
 */
OptionalTlsStream ElasticsearchWriter::Connect()
{
	Log(LogNotice, "ElasticsearchWriter")
		<< "Connecting to Elasticsearch on host '" << GetHost() << "' port '" << GetPort() << "'.";

	OptionalTlsStream stream;
	bool tls = GetEnableTls();

	if (tls) {
		Shared<boost::asio::ssl::context>::Ptr sslContext;

		try {
			sslContext = MakeAsioSslContext(GetCertPath(), GetKeyPath(), GetCaPath());
		} catch (const std::exception&) {
			Log(LogWarning, "ElasticsearchWriter")
				<< "Unable to create SSL context.";
			throw;
		}

		stream.first = Shared<AsioTlsStream>::Make(IoEngine::Get().GetIoContext(), *sslContext, GetHost());
	} else {
		stream.second = Shared<AsioTcpStream>::Make(IoEngine::Get().GetIoContext());
	}

	try {
		icinga::Connect(tls ? stream.first->lowest_layer() : stream.second->lowest_layer(), GetHost(), GetPort());
	} catch (const std::exception&) {
		Log(LogWarning, "ElasticsearchWriter")
			<< "Can't connect to Elasticsearch on host '" << GetHost() << "' port '" << GetPort() << "'.";
		throw;
	}

	if (tls) {
		auto& tlsStream (stream.first->next_layer());

		try {
			tlsStream.handshake(tlsStream.client);
		} catch (const std::exception&) {
			Log(LogWarning, "ElasticsearchWriter")
				<< "TLS handshake with host '" << GetHost() << "' on port " << GetPort() << " failed.";
			throw;
		}
	}

	/* Return the local by name: an explicit std::move() here would only
	 * inhibit copy elision.
	 */
	return stream;
}
|
|
|
|
|
2018-01-04 04:25:35 +01:00
|
|
|
void ElasticsearchWriter::AssertOnWorkQueue()
|
2017-09-07 15:11:57 +02:00
|
|
|
{
|
|
|
|
ASSERT(m_WorkQueue.IsWorkerThread());
|
|
|
|
}
|
|
|
|
|
2017-11-09 14:05:10 +01:00
|
|
|
/**
 * Exception callback of the work queue: logs a generic critical message
 * and the exception details at debug level.
 *
 * @param exp The exception raised by a work queue task.
 */
void ElasticsearchWriter::ExceptionHandler(boost::exception_ptr exp)
{
	Log(LogCritical, "ElasticsearchWriter", "Exception during Elastic operation: Verify that your backend is operational!");

	/* The full diagnostic output is only written to the debug log. */
	String details = DiagnosticInformation(std::move(exp));

	Log(LogDebug, "ElasticsearchWriter")
		<< "Exception during Elasticsearch operation: " << details;
}
|
|
|
|
|
2017-11-09 14:05:10 +01:00
|
|
|
/**
 * Formats a timestamp for Elasticsearch.
 *
 * The date format must match the default dynamic date detection
 * pattern in indexes. This enables applications like Kibana to
 * detect a qualified timestamp index for time-series data.
 *
 * Example: 2017-09-11T10:56:21.463+0200
 *
 * References:
 * https://www.elastic.co/guide/en/elasticsearch/reference/current/dynamic-field-mapping.html#date-detection
 * https://www.elastic.co/guide/en/elasticsearch/reference/current/mapping-date-format.html
 * https://www.elastic.co/guide/en/elasticsearch/reference/current/date.html
 *
 * @param ts Timestamp in seconds, including a fractional part.
 * @return The formatted timestamp with a three digit millisecond part.
 */
String ElasticsearchWriter::FormatTimestamp(double ts)
{
	/* Use a 64 bit integer for the whole seconds: a plain int overflows for
	 * timestamps beyond 2^31-1.
	 */
	auto wholeSeconds = static_cast<long long>(ts);
	auto milliSeconds = static_cast<int>((ts - wholeSeconds) * 1000);

	/* Always emit three digits. Without the padding 5 ms would be written as
	 * ".5", which is read as half a second.
	 */
	const char *padding = "";

	if (milliSeconds < 10)
		padding = "00";
	else if (milliSeconds < 100)
		padding = "0";

	return Utility::FormatDateTime("%Y-%m-%dT%H:%M:%S", ts) + "." + padding + Convert::ToString(milliSeconds) + Utility::FormatDateTime("%z", ts);
}
|