2019-02-25 14:48:22 +01:00
|
|
|
/* Icinga 2 | (c) 2012 Icinga GmbH | GPLv2+ */
|
2015-01-28 10:57:34 +01:00
|
|
|
|
|
|
|
#include "perfdata/opentsdbwriter.hpp"
|
2018-01-18 13:50:38 +01:00
|
|
|
#include "perfdata/opentsdbwriter-ti.cpp"
|
2015-01-28 10:57:34 +01:00
|
|
|
#include "icinga/service.hpp"
|
2019-03-19 09:38:32 +01:00
|
|
|
#include "icinga/checkcommand.hpp"
|
2015-01-28 10:57:34 +01:00
|
|
|
#include "icinga/macroprocessor.hpp"
|
|
|
|
#include "icinga/icingaapplication.hpp"
|
|
|
|
#include "icinga/compatutility.hpp"
|
|
|
|
#include "base/tcpsocket.hpp"
|
2015-08-15 20:28:05 +02:00
|
|
|
#include "base/configtype.hpp"
|
2015-01-28 10:57:34 +01:00
|
|
|
#include "base/objectlock.hpp"
|
|
|
|
#include "base/logger.hpp"
|
|
|
|
#include "base/convert.hpp"
|
|
|
|
#include "base/utility.hpp"
|
2017-05-15 15:51:39 +02:00
|
|
|
#include "base/perfdatavalue.hpp"
|
2015-01-28 10:57:34 +01:00
|
|
|
#include "base/application.hpp"
|
|
|
|
#include "base/stream.hpp"
|
|
|
|
#include "base/networkstream.hpp"
|
|
|
|
#include "base/exception.hpp"
|
|
|
|
#include "base/statsfunction.hpp"
|
|
|
|
#include <boost/algorithm/string.hpp>
|
|
|
|
#include <boost/algorithm/string/replace.hpp>
|
|
|
|
|
|
|
|
using namespace icinga;
|
|
|
|
|
|
|
|
REGISTER_TYPE(OpenTsdbWriter);
|
|
|
|
|
2015-09-21 11:44:58 +02:00
|
|
|
REGISTER_STATSFUNCTION(OpenTsdbWriter, &OpenTsdbWriter::StatsFunc);
|
2015-01-28 10:57:34 +01:00
|
|
|
|
2019-05-27 15:09:26 +02:00
|
|
|
/*
|
|
|
|
* Enable HA capabilities once the config object is loaded.
|
|
|
|
*/
|
2018-10-24 13:55:19 +02:00
|
|
|
void OpenTsdbWriter::OnConfigLoaded()
|
|
|
|
{
|
|
|
|
ObjectImpl<OpenTsdbWriter>::OnConfigLoaded();
|
|
|
|
|
|
|
|
if (!GetEnableHa()) {
|
|
|
|
Log(LogDebug, "OpenTsdbWriter")
|
|
|
|
<< "HA functionality disabled. Won't pause connection: " << GetName();
|
|
|
|
|
|
|
|
SetHAMode(HARunEverywhere);
|
|
|
|
} else {
|
|
|
|
SetHAMode(HARunOnce);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-05-27 15:09:26 +02:00
|
|
|
/**
|
|
|
|
* Feature stats interface
|
|
|
|
*
|
|
|
|
* @param status Key value pairs for feature stats
|
|
|
|
*/
|
2015-02-07 22:36:17 +01:00
|
|
|
void OpenTsdbWriter::StatsFunc(const Dictionary::Ptr& status, const Array::Ptr&)
|
2015-01-28 10:57:34 +01:00
|
|
|
{
|
2018-01-11 11:17:38 +01:00
|
|
|
DictionaryData nodes;
|
2015-01-28 10:57:34 +01:00
|
|
|
|
2016-08-25 06:19:44 +02:00
|
|
|
for (const OpenTsdbWriter::Ptr& opentsdbwriter : ConfigType::GetObjectsByType<OpenTsdbWriter>()) {
|
2019-05-27 15:09:26 +02:00
|
|
|
nodes.emplace_back(opentsdbwriter->GetName(), new Dictionary({
|
|
|
|
{ "connected", opentsdbwriter->GetConnected() }
|
|
|
|
}));
|
2015-01-28 10:57:34 +01:00
|
|
|
}
|
|
|
|
|
2018-01-11 11:17:38 +01:00
|
|
|
status->Set("opentsdbwriter", new Dictionary(std::move(nodes)));
|
2015-01-28 10:57:34 +01:00
|
|
|
}
|
|
|
|
|
2019-05-27 15:09:26 +02:00
|
|
|
/**
|
|
|
|
* Resume is equivalent to Start, but with HA capabilities to resume at runtime.
|
|
|
|
*/
|
2018-10-24 13:55:19 +02:00
|
|
|
void OpenTsdbWriter::Resume()
|
2015-01-28 10:57:34 +01:00
|
|
|
{
|
2018-10-24 13:55:19 +02:00
|
|
|
ObjectImpl<OpenTsdbWriter>::Resume();
|
2015-01-28 10:57:34 +01:00
|
|
|
|
2017-02-08 14:53:52 +01:00
|
|
|
Log(LogInformation, "OpentsdbWriter")
|
2018-10-24 13:55:19 +02:00
|
|
|
<< "'" << GetName() << "' resumed.";
|
2017-02-08 14:53:52 +01:00
|
|
|
|
2015-01-28 10:57:34 +01:00
|
|
|
m_ReconnectTimer = new Timer();
|
|
|
|
m_ReconnectTimer->SetInterval(10);
|
2017-11-21 11:52:55 +01:00
|
|
|
m_ReconnectTimer->OnTimerExpired.connect(std::bind(&OpenTsdbWriter::ReconnectTimerHandler, this));
|
2015-01-28 10:57:34 +01:00
|
|
|
m_ReconnectTimer->Start();
|
|
|
|
m_ReconnectTimer->Reschedule(0);
|
|
|
|
|
2017-11-21 11:52:55 +01:00
|
|
|
Service::OnNewCheckResult.connect(std::bind(&OpenTsdbWriter::CheckResultHandler, this, _1, _2));
|
2015-01-28 10:57:34 +01:00
|
|
|
}
|
|
|
|
|
2019-05-27 15:09:26 +02:00
|
|
|
/**
|
|
|
|
* Pause is equivalent to Stop, but with HA capabilities to resume at runtime.
|
|
|
|
*/
|
2018-10-24 13:55:19 +02:00
|
|
|
void OpenTsdbWriter::Pause()
|
2017-02-08 14:53:52 +01:00
|
|
|
{
|
2019-02-20 17:17:45 +01:00
|
|
|
m_ReconnectTimer.reset();
|
|
|
|
|
2017-02-08 14:53:52 +01:00
|
|
|
Log(LogInformation, "OpentsdbWriter")
|
2018-10-24 13:55:19 +02:00
|
|
|
<< "'" << GetName() << "' paused.";
|
2017-02-08 14:53:52 +01:00
|
|
|
|
2019-05-27 15:09:26 +02:00
|
|
|
m_Stream->close();
|
|
|
|
|
|
|
|
SetConnected(false);
|
|
|
|
|
2018-10-24 13:55:19 +02:00
|
|
|
ObjectImpl<OpenTsdbWriter>::Pause();
|
2017-02-08 14:53:52 +01:00
|
|
|
}
|
|
|
|
|
2019-05-27 15:09:26 +02:00
|
|
|
/**
|
|
|
|
* Reconnect handler called by the timer.
|
|
|
|
* Handles TLS
|
|
|
|
*/
|
2018-01-04 04:25:35 +01:00
|
|
|
void OpenTsdbWriter::ReconnectTimerHandler()
|
2015-01-28 10:57:34 +01:00
|
|
|
{
|
2018-10-24 13:55:19 +02:00
|
|
|
if (IsPaused())
|
|
|
|
return;
|
|
|
|
|
2019-05-27 15:09:26 +02:00
|
|
|
SetShouldConnect(true);
|
2015-01-28 10:57:34 +01:00
|
|
|
|
2019-05-27 15:09:26 +02:00
|
|
|
if (GetConnected())
|
|
|
|
return;
|
2015-01-28 10:57:34 +01:00
|
|
|
|
|
|
|
Log(LogNotice, "OpenTsdbWriter")
|
|
|
|
<< "Reconnect to OpenTSDB TSD on host '" << GetHost() << "' port '" << GetPort() << "'.";
|
|
|
|
|
2019-05-27 15:09:26 +02:00
|
|
|
/*
|
|
|
|
* We're using telnet as input method. Future PRs may change this into using the HTTP API.
|
|
|
|
* http://opentsdb.net/docs/build/html/user_guide/writing/index.html#telnet
|
|
|
|
*/
|
|
|
|
|
|
|
|
m_Stream = std::make_shared<AsioTcpStream>(IoEngine::Get().GetIoService());
|
|
|
|
|
2015-01-28 10:57:34 +01:00
|
|
|
try {
|
2019-05-27 15:09:26 +02:00
|
|
|
icinga::Connect(m_Stream->lowest_layer(), GetHost(), GetPort());
|
|
|
|
} catch (const std::exception& ex) {
|
|
|
|
Log(LogWarning, "OpenTsdbWriter")
|
|
|
|
<< "Can't connect to OpenTSDB on host '" << GetHost() << "' port '" << GetPort() << ".'";
|
2015-01-28 10:57:34 +01:00
|
|
|
}
|
|
|
|
|
2019-05-27 15:09:26 +02:00
|
|
|
SetConnected(true);
|
2015-01-28 10:57:34 +01:00
|
|
|
}
|
|
|
|
|
2019-05-27 15:09:26 +02:00
|
|
|
/**
|
|
|
|
* Registered check result handler processing data.
|
|
|
|
* Calculates tags from the config.
|
|
|
|
*
|
|
|
|
* @param checkable Host/service object
|
|
|
|
* @param cr Check result
|
|
|
|
*/
|
2015-01-28 10:57:34 +01:00
|
|
|
void OpenTsdbWriter::CheckResultHandler(const Checkable::Ptr& checkable, const CheckResult::Ptr& cr)
|
|
|
|
{
|
2018-10-24 13:55:19 +02:00
|
|
|
if (IsPaused())
|
|
|
|
return;
|
|
|
|
|
2015-01-28 10:57:34 +01:00
|
|
|
CONTEXT("Processing check result for '" + checkable->GetName() + "'");
|
|
|
|
|
|
|
|
if (!IcingaApplication::GetInstance()->GetEnablePerfdata() || !checkable->GetEnablePerfdata())
|
|
|
|
return;
|
|
|
|
|
|
|
|
Service::Ptr service = dynamic_pointer_cast<Service>(checkable);
|
|
|
|
Host::Ptr host;
|
|
|
|
|
|
|
|
if (service)
|
|
|
|
host = service->GetHost();
|
|
|
|
else
|
|
|
|
host = static_pointer_cast<Host>(checkable);
|
|
|
|
|
|
|
|
String metric;
|
|
|
|
std::map<String, String> tags;
|
2015-07-17 18:37:46 +02:00
|
|
|
|
2018-01-10 15:07:11 +01:00
|
|
|
String escaped_hostName = EscapeTag(host->GetName());
|
2015-07-17 18:37:46 +02:00
|
|
|
tags["host"] = escaped_hostName;
|
2015-01-28 10:57:34 +01:00
|
|
|
|
2015-09-08 06:34:33 +02:00
|
|
|
double ts = cr->GetExecutionEnd();
|
|
|
|
|
2015-01-28 10:57:34 +01:00
|
|
|
if (service) {
|
|
|
|
String serviceName = service->GetShortName();
|
2015-07-17 18:37:46 +02:00
|
|
|
String escaped_serviceName = EscapeMetric(serviceName);
|
|
|
|
metric = "icinga.service." + escaped_serviceName;
|
2015-01-28 10:57:34 +01:00
|
|
|
|
2019-03-19 09:38:32 +01:00
|
|
|
SendMetric(checkable, metric + ".state", tags, service->GetState(), ts);
|
2015-01-28 10:57:34 +01:00
|
|
|
} else {
|
|
|
|
metric = "icinga.host";
|
2019-03-19 09:38:32 +01:00
|
|
|
SendMetric(checkable, metric + ".state", tags, host->GetState(), ts);
|
2015-01-28 10:57:34 +01:00
|
|
|
}
|
|
|
|
|
2019-03-19 09:38:32 +01:00
|
|
|
SendMetric(checkable, metric + ".state_type", tags, checkable->GetStateType(), ts);
|
|
|
|
SendMetric(checkable, metric + ".reachable", tags, checkable->IsReachable(), ts);
|
|
|
|
SendMetric(checkable, metric + ".downtime_depth", tags, checkable->GetDowntimeDepth(), ts);
|
|
|
|
SendMetric(checkable, metric + ".acknowledgement", tags, checkable->GetAcknowledgement(), ts);
|
2015-01-28 10:57:34 +01:00
|
|
|
|
2019-03-19 09:38:32 +01:00
|
|
|
SendPerfdata(checkable, metric, tags, cr, ts);
|
2015-01-28 10:57:34 +01:00
|
|
|
|
|
|
|
metric = "icinga.check";
|
|
|
|
|
|
|
|
if (service) {
|
|
|
|
tags["type"] = "service";
|
|
|
|
String serviceName = service->GetShortName();
|
2015-07-17 18:37:46 +02:00
|
|
|
String escaped_serviceName = EscapeTag(serviceName);
|
|
|
|
tags["service"] = escaped_serviceName;
|
2015-01-28 10:57:34 +01:00
|
|
|
} else {
|
|
|
|
tags["type"] = "host";
|
|
|
|
}
|
|
|
|
|
2019-03-19 09:38:32 +01:00
|
|
|
SendMetric(checkable, metric + ".current_attempt", tags, checkable->GetCheckAttempt(), ts);
|
|
|
|
SendMetric(checkable, metric + ".max_check_attempts", tags, checkable->GetMaxCheckAttempts(), ts);
|
|
|
|
SendMetric(checkable, metric + ".latency", tags, cr->CalculateLatency(), ts);
|
|
|
|
SendMetric(checkable, metric + ".execution_time", tags, cr->CalculateExecutionTime(), ts);
|
2015-01-28 10:57:34 +01:00
|
|
|
}
|
|
|
|
|
2019-05-27 15:09:26 +02:00
|
|
|
/**
|
|
|
|
* Parse and send performance data metrics to OpenTSDB
|
|
|
|
*
|
|
|
|
* @param checkable Host/service object
|
|
|
|
* @param metric Full metric name
|
|
|
|
* @param tags Tag key pairs
|
|
|
|
* @param cr Check result containing performance data
|
|
|
|
* @param ts Timestamp when the check result was received
|
|
|
|
*/
|
2019-03-19 09:38:32 +01:00
|
|
|
void OpenTsdbWriter::SendPerfdata(const Checkable::Ptr& checkable, const String& metric,
|
|
|
|
const std::map<String, String>& tags, const CheckResult::Ptr& cr, double ts)
|
2015-01-28 10:57:34 +01:00
|
|
|
{
|
|
|
|
Array::Ptr perfdata = cr->GetPerformanceData();
|
|
|
|
|
|
|
|
if (!perfdata)
|
|
|
|
return;
|
|
|
|
|
2019-03-19 09:38:32 +01:00
|
|
|
CheckCommand::Ptr checkCommand = checkable->GetCheckCommand();
|
|
|
|
|
2015-01-28 10:57:34 +01:00
|
|
|
ObjectLock olock(perfdata);
|
2016-08-25 06:19:44 +02:00
|
|
|
for (const Value& val : perfdata) {
|
2015-01-28 10:57:34 +01:00
|
|
|
PerfdataValue::Ptr pdv;
|
|
|
|
|
|
|
|
if (val.IsObjectType<PerfdataValue>())
|
|
|
|
pdv = val;
|
|
|
|
else {
|
|
|
|
try {
|
|
|
|
pdv = PerfdataValue::Parse(val);
|
|
|
|
} catch (const std::exception&) {
|
|
|
|
Log(LogWarning, "OpenTsdbWriter")
|
2019-03-19 09:38:32 +01:00
|
|
|
<< "Ignoring invalid perfdata for checkable '"
|
|
|
|
<< checkable->GetName() << "' and command '"
|
|
|
|
<< checkCommand->GetName() << "' with value: " << val;
|
2015-01-28 10:57:34 +01:00
|
|
|
continue;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-07-17 18:37:46 +02:00
|
|
|
String escaped_key = EscapeMetric(pdv->GetLabel());
|
2015-01-28 10:57:34 +01:00
|
|
|
boost::algorithm::replace_all(escaped_key, "::", ".");
|
|
|
|
|
2019-03-19 09:38:32 +01:00
|
|
|
SendMetric(checkable, metric + "." + escaped_key, tags, pdv->GetValue(), ts);
|
2015-01-28 10:57:34 +01:00
|
|
|
|
|
|
|
if (pdv->GetCrit())
|
2019-03-19 09:38:32 +01:00
|
|
|
SendMetric(checkable, metric + "." + escaped_key + "_crit", tags, pdv->GetCrit(), ts);
|
2015-01-28 10:57:34 +01:00
|
|
|
if (pdv->GetWarn())
|
2019-03-19 09:38:32 +01:00
|
|
|
SendMetric(checkable, metric + "." + escaped_key + "_warn", tags, pdv->GetWarn(), ts);
|
2015-01-28 10:57:34 +01:00
|
|
|
if (pdv->GetMin())
|
2019-03-19 09:38:32 +01:00
|
|
|
SendMetric(checkable, metric + "." + escaped_key + "_min", tags, pdv->GetMin(), ts);
|
2015-01-28 10:57:34 +01:00
|
|
|
if (pdv->GetMax())
|
2019-03-19 09:38:32 +01:00
|
|
|
SendMetric(checkable, metric + "." + escaped_key + "_max", tags, pdv->GetMax(), ts);
|
2015-01-28 10:57:34 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-05-27 15:09:26 +02:00
|
|
|
/**
|
|
|
|
* Send given metric to OpenTSDB
|
|
|
|
*
|
|
|
|
* @param checkable Host/service object
|
|
|
|
* @param metric Full metric name
|
|
|
|
* @param tags Tag key pairs
|
|
|
|
* @param value Floating point metric value
|
|
|
|
* @param ts Timestamp where the metric was received from the check result
|
|
|
|
*/
|
2019-03-19 09:38:32 +01:00
|
|
|
void OpenTsdbWriter::SendMetric(const Checkable::Ptr& checkable, const String& metric,
|
|
|
|
const std::map<String, String>& tags, double value, double ts)
|
2015-01-28 10:57:34 +01:00
|
|
|
{
|
|
|
|
String tags_string = "";
|
2019-03-19 09:38:32 +01:00
|
|
|
|
2016-08-25 06:19:44 +02:00
|
|
|
for (const Dictionary::Pair& tag : tags) {
|
2015-01-28 10:57:34 +01:00
|
|
|
tags_string += " " + tag.first + "=" + Convert::ToString(tag.second);
|
|
|
|
}
|
|
|
|
|
|
|
|
std::ostringstream msgbuf;
|
|
|
|
/*
|
2019-05-27 15:09:26 +02:00
|
|
|
* must be (http://opentsdb.net/docs/build/html/user_guide/query/timeseries.html)
|
2015-01-28 10:57:34 +01:00
|
|
|
* put <metric> <timestamp> <value> <tagk1=tagv1[ tagk2=tagv2 ...tagkN=tagvN]>
|
|
|
|
* "tags" must include at least one tag, we use "host=HOSTNAME"
|
|
|
|
*/
|
2015-09-08 06:34:33 +02:00
|
|
|
msgbuf << "put " << metric << " " << static_cast<long>(ts) << " " << Convert::ToString(value) << " " << tags_string;
|
2015-01-28 10:57:34 +01:00
|
|
|
|
|
|
|
Log(LogDebug, "OpenTsdbWriter")
|
2019-03-19 09:38:32 +01:00
|
|
|
<< "Checkable '" << checkable->GetName() << "' adds to metric list: '" << msgbuf.str() << "'.";
|
2015-01-28 10:57:34 +01:00
|
|
|
|
|
|
|
/* do not send \n to debug log */
|
|
|
|
msgbuf << "\n";
|
|
|
|
String put = msgbuf.str();
|
|
|
|
|
|
|
|
ObjectLock olock(this);
|
|
|
|
|
2019-05-27 15:09:26 +02:00
|
|
|
if (!GetConnected())
|
2015-01-28 10:57:34 +01:00
|
|
|
return;
|
|
|
|
|
|
|
|
try {
|
2019-05-27 15:09:26 +02:00
|
|
|
Log(LogDebug, "OpenTsdbWriter")
|
|
|
|
<< "Checkable '" << checkable->GetName() << "' sending message '" << put << "'.";
|
|
|
|
|
|
|
|
boost::asio::write(*m_Stream, boost::asio::buffer(msgbuf.str()));
|
|
|
|
m_Stream->flush();
|
2015-01-28 10:57:34 +01:00
|
|
|
} catch (const std::exception& ex) {
|
|
|
|
Log(LogCritical, "OpenTsdbWriter")
|
2019-05-27 15:09:26 +02:00
|
|
|
<< "Cannot write to TCP socket on host '" << GetHost() << "' port '" << GetPort() << "'.";
|
2015-01-28 10:57:34 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-05-27 15:09:26 +02:00
|
|
|
/**
|
|
|
|
* Escape tags for OpenTSDB
|
|
|
|
* http://opentsdb.net/docs/build/html/user_guide/query/timeseries.html#precisions-on-metrics-and-tags
|
|
|
|
*
|
|
|
|
* @param str Tag name
|
|
|
|
* @return Escaped tag
|
2015-01-28 10:57:34 +01:00
|
|
|
*/
|
|
|
|
String OpenTsdbWriter::EscapeTag(const String& str)
|
|
|
|
{
|
|
|
|
String result = str;
|
|
|
|
|
|
|
|
boost::replace_all(result, " ", "_");
|
|
|
|
boost::replace_all(result, "\\", "_");
|
|
|
|
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
2019-05-27 15:09:26 +02:00
|
|
|
/**
|
|
|
|
* Escape metric name for OpenTSDB
|
|
|
|
* http://opentsdb.net/docs/build/html/user_guide/query/timeseries.html#precisions-on-metrics-and-tags
|
|
|
|
*
|
|
|
|
* @param str Metric name
|
|
|
|
* @return Escaped metric
|
|
|
|
*/
|
2015-01-28 10:57:34 +01:00
|
|
|
String OpenTsdbWriter::EscapeMetric(const String& str)
|
|
|
|
{
|
|
|
|
String result = str;
|
|
|
|
|
|
|
|
boost::replace_all(result, " ", "_");
|
|
|
|
boost::replace_all(result, ".", "_");
|
|
|
|
boost::replace_all(result, "\\", "_");
|
2018-05-08 09:40:13 +02:00
|
|
|
boost::replace_all(result, ":", "_");
|
2015-01-28 10:57:34 +01:00
|
|
|
|
|
|
|
return result;
|
2019-05-27 15:09:26 +02:00
|
|
|
}
|