2019-02-25 14:48:22 +01:00
|
|
|
/* Icinga 2 | (c) 2012 Icinga GmbH | GPLv2+ */
|
2016-04-19 13:54:41 +02:00
|
|
|
|
|
|
|
#include "perfdata/influxdbwriter.hpp"
|
2018-01-18 13:50:38 +01:00
|
|
|
#include "perfdata/influxdbwriter-ti.cpp"
|
2016-04-19 13:54:41 +02:00
|
|
|
#include "remote/url.hpp"
|
|
|
|
#include "remote/httprequest.hpp"
|
|
|
|
#include "remote/httpresponse.hpp"
|
|
|
|
#include "icinga/service.hpp"
|
|
|
|
#include "icinga/macroprocessor.hpp"
|
|
|
|
#include "icinga/icingaapplication.hpp"
|
|
|
|
#include "icinga/checkcommand.hpp"
|
2019-03-01 14:30:49 +01:00
|
|
|
#include "base/defer.hpp"
|
2016-04-19 13:54:41 +02:00
|
|
|
#include "base/tcpsocket.hpp"
|
|
|
|
#include "base/configtype.hpp"
|
|
|
|
#include "base/objectlock.hpp"
|
|
|
|
#include "base/logger.hpp"
|
|
|
|
#include "base/convert.hpp"
|
|
|
|
#include "base/utility.hpp"
|
2017-05-15 15:51:39 +02:00
|
|
|
#include "base/perfdatavalue.hpp"
|
2016-04-19 13:54:41 +02:00
|
|
|
#include "base/stream.hpp"
|
2016-07-28 14:29:37 +02:00
|
|
|
#include "base/json.hpp"
|
2016-04-19 13:54:41 +02:00
|
|
|
#include "base/networkstream.hpp"
|
|
|
|
#include "base/exception.hpp"
|
|
|
|
#include "base/statsfunction.hpp"
|
|
|
|
#include "base/tlsutility.hpp"
|
|
|
|
#include <boost/algorithm/string.hpp>
|
|
|
|
#include <boost/algorithm/string/replace.hpp>
|
2017-05-26 17:03:49 +02:00
|
|
|
#include <boost/math/special_functions/fpclassify.hpp>
|
2016-06-07 14:35:16 +02:00
|
|
|
#include <boost/regex.hpp>
|
2016-07-28 14:29:37 +02:00
|
|
|
#include <boost/scoped_array.hpp>
|
2018-01-04 08:54:18 +01:00
|
|
|
#include <utility>
|
2016-04-19 13:54:41 +02:00
|
|
|
|
|
|
|
using namespace icinga;
|
|
|
|
|
2018-01-04 06:11:04 +01:00
|
|
|
class InfluxdbInteger final : public Object
|
2017-10-24 15:23:58 +02:00
|
|
|
{
|
|
|
|
public:
|
|
|
|
DECLARE_PTR_TYPEDEFS(InfluxdbInteger);
|
|
|
|
|
|
|
|
InfluxdbInteger(int value)
|
2017-12-19 15:50:05 +01:00
|
|
|
: m_Value(value)
|
2017-10-24 15:23:58 +02:00
|
|
|
{ }
|
|
|
|
|
2018-01-04 04:25:35 +01:00
|
|
|
int GetValue() const
|
2017-10-24 15:23:58 +02:00
|
|
|
{
|
|
|
|
return m_Value;
|
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
|
|
|
int m_Value;
|
|
|
|
};
|
|
|
|
|
2016-04-19 13:54:41 +02:00
|
|
|
/* Registration macros (defined outside this file): the first names the InfluxdbWriter type,
 * the second associates InfluxdbWriter::StatsFunc with it. */
REGISTER_TYPE(InfluxdbWriter);
|
|
|
|
|
|
|
|
REGISTER_STATSFUNCTION(InfluxdbWriter, &InfluxdbWriter::StatsFunc);
|
|
|
|
|
2018-01-04 04:25:35 +01:00
|
|
|
void InfluxdbWriter::OnConfigLoaded()
|
2017-05-04 10:29:49 +02:00
|
|
|
{
|
|
|
|
ObjectImpl<InfluxdbWriter>::OnConfigLoaded();
|
|
|
|
|
|
|
|
m_WorkQueue.SetName("InfluxdbWriter, " + GetName());
|
2018-10-24 13:38:06 +02:00
|
|
|
|
|
|
|
if (!GetEnableHa()) {
|
|
|
|
Log(LogDebug, "InfluxdbWriter")
|
|
|
|
<< "HA functionality disabled. Won't pause connection: " << GetName();
|
|
|
|
|
|
|
|
SetHAMode(HARunEverywhere);
|
|
|
|
} else {
|
|
|
|
SetHAMode(HARunOnce);
|
|
|
|
}
|
2017-05-04 10:29:49 +02:00
|
|
|
}
|
|
|
|
|
2017-05-26 17:03:49 +02:00
|
|
|
/**
 * Collects per-writer statistics.
 *
 * For every configured InfluxdbWriter the work queue length, the work queue
 * task rate over the last 60 seconds and the data buffer size are added to
 * `status` (under the "influxdbwriter" key) and appended to `perfdata`.
 *
 * @param status Dictionary receiving the per-writer status dictionaries.
 * @param perfdata Array receiving one PerfdataValue per metric.
 */
void InfluxdbWriter::StatsFunc(const Dictionary::Ptr& status, const Array::Ptr& perfdata)
{
	DictionaryData writerStats;

	for (const InfluxdbWriter::Ptr& writer : ConfigType::GetObjectsByType<InfluxdbWriter>()) {
		size_t queuedTasks = writer->m_WorkQueue.GetLength();
		double taskRate = writer->m_WorkQueue.GetTaskCount(60) / 60.0;
		size_t bufferedPoints = writer->m_DataBuffer.size();

		writerStats.emplace_back(writer->GetName(), new Dictionary({
			{ "work_queue_items", queuedTasks },
			{ "work_queue_item_rate", taskRate },
			{ "data_buffer_items", bufferedPoints }
		}));

		/* All perfdata labels of one writer share this prefix. */
		const String labelPrefix = "influxdbwriter_" + writer->GetName();

		perfdata->Add(new PerfdataValue(labelPrefix + "_work_queue_items", queuedTasks));
		perfdata->Add(new PerfdataValue(labelPrefix + "_work_queue_item_rate", taskRate));
		perfdata->Add(new PerfdataValue(labelPrefix + "_data_queue_items", bufferedPoints));
	}

	status->Set("influxdbwriter", new Dictionary(std::move(writerStats)));
}
|
|
|
|
|
2018-10-24 13:38:06 +02:00
|
|
|
void InfluxdbWriter::Resume()
|
2016-04-19 13:54:41 +02:00
|
|
|
{
|
2018-10-24 13:38:06 +02:00
|
|
|
ObjectImpl<InfluxdbWriter>::Resume();
|
2016-04-19 13:54:41 +02:00
|
|
|
|
2017-02-08 14:53:52 +01:00
|
|
|
Log(LogInformation, "InfluxdbWriter")
|
2018-10-24 13:38:06 +02:00
|
|
|
<< "'" << GetName() << "' resumed.";
|
2017-02-08 14:53:52 +01:00
|
|
|
|
2017-05-04 10:29:49 +02:00
|
|
|
/* Register exception handler for WQ tasks. */
|
2017-11-21 11:52:55 +01:00
|
|
|
m_WorkQueue.SetExceptionCallback(std::bind(&InfluxdbWriter::ExceptionHandler, this, _1));
|
2017-05-04 10:29:49 +02:00
|
|
|
|
|
|
|
/* Setup timer for periodically flushing m_DataBuffer */
|
2016-04-19 13:54:41 +02:00
|
|
|
m_FlushTimer = new Timer();
|
|
|
|
m_FlushTimer->SetInterval(GetFlushInterval());
|
2017-11-21 11:52:55 +01:00
|
|
|
m_FlushTimer->OnTimerExpired.connect(std::bind(&InfluxdbWriter::FlushTimeout, this));
|
2016-04-19 13:54:41 +02:00
|
|
|
m_FlushTimer->Start();
|
|
|
|
m_FlushTimer->Reschedule(0);
|
|
|
|
|
2017-05-04 10:29:49 +02:00
|
|
|
/* Register for new metrics. */
|
2017-10-24 15:23:58 +02:00
|
|
|
Checkable::OnNewCheckResult.connect(std::bind(&InfluxdbWriter::CheckResultHandler, this, _1, _2));
|
2016-04-19 13:54:41 +02:00
|
|
|
}
|
|
|
|
|
2019-02-20 15:21:24 +01:00
|
|
|
/* Pause is equivalent to Stop, but with HA capabilities to resume at runtime. */
|
2018-10-24 13:38:06 +02:00
|
|
|
void InfluxdbWriter::Pause()
|
2017-02-08 14:53:52 +01:00
|
|
|
{
|
2019-02-20 15:21:24 +01:00
|
|
|
/* Force a flush. */
|
|
|
|
Log(LogDebug, "InfluxdbWriter")
|
|
|
|
<< "Flushing pending data buffers.";
|
2017-02-08 14:53:52 +01:00
|
|
|
|
2019-02-20 15:21:24 +01:00
|
|
|
Flush();
|
2017-05-04 10:29:49 +02:00
|
|
|
|
2019-02-20 15:21:24 +01:00
|
|
|
/* Work on the missing tasks. TODO: Find a way to cache them on disk. */
|
|
|
|
Log(LogDebug, "InfluxdbWriter")
|
|
|
|
<< "Joining existing WQ tasks.";
|
2017-02-08 14:53:52 +01:00
|
|
|
|
2019-01-08 18:15:32 +01:00
|
|
|
m_WorkQueue.Join();
|
|
|
|
|
2019-02-20 15:21:24 +01:00
|
|
|
/* Flush again after the WQ tasks have filled the data buffer. */
|
|
|
|
Log(LogDebug, "InfluxdbWriter")
|
|
|
|
<< "Flushing data buffers from WQ tasks.";
|
|
|
|
|
|
|
|
Flush();
|
|
|
|
|
|
|
|
Log(LogInformation, "InfluxdbWriter")
|
|
|
|
<< "'" << GetName() << "' paused.";
|
|
|
|
|
2018-10-24 13:38:06 +02:00
|
|
|
ObjectImpl<InfluxdbWriter>::Pause();
|
2019-01-08 18:15:32 +01:00
|
|
|
}
|
|
|
|
|
2018-01-04 04:25:35 +01:00
|
|
|
void InfluxdbWriter::AssertOnWorkQueue()
|
2017-05-04 10:29:49 +02:00
|
|
|
{
|
|
|
|
ASSERT(m_WorkQueue.IsWorkerThread());
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
 * Exception callback registered on the work queue: logs a generic critical
 * message plus the diagnostic details at debug level.
 *
 * @param exp The exception raised by a work queue task.
 */
void InfluxdbWriter::ExceptionHandler(boost::exception_ptr exp)
{
	Log(LogCritical, "InfluxdbWriter")
		<< "Exception during InfluxDB operation: Verify that your backend is operational!";

	Log(LogDebug, "InfluxdbWriter")
		<< "Exception during InfluxDB operation: " << DiagnosticInformation(std::move(exp));

	//TODO: Close the connection, if we keep it open.
}
|
|
|
|
|
2018-01-04 04:25:35 +01:00
|
|
|
/**
 * Opens a new connection to the configured InfluxDB host and port.
 *
 * With ssl_enable set, the socket is wrapped in a TLS stream and the
 * handshake is performed before returning.
 *
 * @return A NetworkStream (plain) or TlsStream (SSL enabled) for the connection.
 * @throws Whatever the socket connect, SSL context creation or TLS handshake
 *         throws; a warning is logged and the original exception is rethrown.
 */
Stream::Ptr InfluxdbWriter::Connect()
{
	TcpSocket::Ptr socket = new TcpSocket();

	Log(LogNotice, "InfluxdbWriter")
		<< "Reconnecting to InfluxDB on host '" << GetHost() << "' port '" << GetPort() << "'.";

	try {
		socket->Connect(GetHost(), GetPort());
	} catch (const std::exception&) {
		Log(LogWarning, "InfluxdbWriter")
			<< "Can't connect to InfluxDB on host '" << GetHost() << "' port '" << GetPort() << "'.";

		/* Rethrow the original exception; `throw ex;` would slice it down to std::exception. */
		throw;
	}

	if (!GetSslEnable())
		return new NetworkStream(socket);

	std::shared_ptr<SSL_CTX> sslContext;

	try {
		sslContext = MakeSSLContext(GetSslCert(), GetSslKey(), GetSslCaCert());
	} catch (const std::exception&) {
		Log(LogWarning, "InfluxdbWriter")
			<< "Unable to create SSL context.";

		throw;
	}

	TlsStream::Ptr tlsStream = new TlsStream(socket, GetHost(), RoleClient, sslContext);

	try {
		tlsStream->Handshake();
	} catch (const std::exception&) {
		Log(LogWarning, "InfluxdbWriter")
			<< "TLS handshake with host '" << GetHost() << "' failed.";

		throw;
	}

	return tlsStream;
}
|
|
|
|
|
|
|
|
/**
 * Signal handler for new check results: unless the writer is paused, the
 * actual processing is queued on the work queue with low priority.
 *
 * @param checkable The checkable the result belongs to.
 * @param cr The new check result.
 */
void InfluxdbWriter::CheckResultHandler(const Checkable::Ptr& checkable, const CheckResult::Ptr& cr)
{
	if (!IsPaused()) {
		m_WorkQueue.Enqueue(std::bind(&InfluxdbWriter::CheckResultHandlerWQ, this, checkable, cr), PriorityLow);
	}
}
|
|
|
|
|
2017-10-24 15:23:58 +02:00
|
|
|
/**
 * Work queue task turning one check result into InfluxDB data points.
 *
 * Resolves the macros in the host/service template, then sends one metric
 * per performance data value and, if enable_send_metadata is set, one
 * additional metric carrying check metadata.
 *
 * Does nothing when performance data processing is disabled globally or for
 * the checkable.
 *
 * @param checkable The checkable the result belongs to.
 * @param cr The check result to process.
 */
void InfluxdbWriter::CheckResultHandlerWQ(const Checkable::Ptr& checkable, const CheckResult::Ptr& cr)
{
	AssertOnWorkQueue();

	CONTEXT("Processing check result for '" + checkable->GetName() + "'");

	if (!IcingaApplication::GetInstance()->GetEnablePerfdata() || !checkable->GetEnablePerfdata())
		return;

	Host::Ptr host;
	Service::Ptr service;
	tie(host, service) = GetHostService(checkable);

	MacroProcessor::ResolverList resolvers;
	if (service)
		resolvers.emplace_back("service", service);
	resolvers.emplace_back("host", host);
	resolvers.emplace_back("icinga", IcingaApplication::GetInstance());

	double ts = cr->GetExecutionEnd();

	// Clone the template and perform an in-place macro expansion of measurement and tag values
	Dictionary::Ptr tmpl_clean = service ? GetServiceTemplate() : GetHostTemplate();
	Dictionary::Ptr tmpl = static_pointer_cast<Dictionary>(tmpl_clean->Clone());
	tmpl->Set("measurement", MacroProcessor::ResolveMacros(tmpl->Get("measurement"), resolvers, cr));

	Dictionary::Ptr tags = tmpl->Get("tags");
	if (tags) {
		ObjectLock olock(tags);
		for (const Dictionary::Pair& pair : tags) {
			String missing_macro;
			Value value = MacroProcessor::ResolveMacros(pair.second, resolvers, cr, &missing_macro);

			// Tags referencing an unresolvable macro keep their unexpanded value
			if (!missing_macro.IsEmpty())
				continue;

			tags->Set(pair.first, value);
		}
	}

	CheckCommand::Ptr checkCommand = checkable->GetCheckCommand();

	Array::Ptr perfdata = cr->GetPerformanceData();

	if (perfdata) {
		ObjectLock olock(perfdata);
		for (const Value& val : perfdata) {
			PerfdataValue::Ptr pdv;

			if (val.IsObjectType<PerfdataValue>())
				pdv = val;
			else {
				try {
					pdv = PerfdataValue::Parse(val);
				} catch (const std::exception&) {
					Log(LogWarning, "InfluxdbWriter")
						<< "Ignoring invalid perfdata for checkable '"
						<< checkable->GetName() << "' and command '"
						<< checkCommand->GetName() << "' with value: " << val;
					continue;
				}
			}

			Dictionary::Ptr fields = new Dictionary();
			fields->Set("value", pdv->GetValue());

			if (GetEnableSendThresholds()) {
				// Test for presence, not truthiness: a threshold of 0 is valid and must be sent
				if (!pdv->GetCrit().IsEmpty())
					fields->Set("crit", pdv->GetCrit());
				if (!pdv->GetWarn().IsEmpty())
					fields->Set("warn", pdv->GetWarn());
				if (!pdv->GetMin().IsEmpty())
					fields->Set("min", pdv->GetMin());
				if (!pdv->GetMax().IsEmpty())
					fields->Set("max", pdv->GetMax());
			}

			if (!pdv->GetUnit().IsEmpty()) {
				fields->Set("unit", pdv->GetUnit());
			}

			SendMetric(checkable, tmpl, pdv->GetLabel(), fields, ts);
		}
	}

	if (GetEnableSendMetadata()) {
		// host/service were already resolved above; no need to look them up again
		Dictionary::Ptr fields = new Dictionary();

		if (service)
			fields->Set("state", new InfluxdbInteger(service->GetState()));
		else
			fields->Set("state", new InfluxdbInteger(host->GetState()));

		fields->Set("current_attempt", new InfluxdbInteger(checkable->GetCheckAttempt()));
		fields->Set("max_check_attempts", new InfluxdbInteger(checkable->GetMaxCheckAttempts()));
		fields->Set("state_type", new InfluxdbInteger(checkable->GetStateType()));
		fields->Set("reachable", checkable->IsReachable());
		fields->Set("downtime_depth", new InfluxdbInteger(checkable->GetDowntimeDepth()));
		fields->Set("acknowledgement", new InfluxdbInteger(checkable->GetAcknowledgement()));
		fields->Set("latency", cr->CalculateLatency());
		fields->Set("execution_time", cr->CalculateExecutionTime());

		// Metadata points carry no metric label
		SendMetric(checkable, tmpl, Empty, fields, ts);
	}
}
|
|
|
|
|
2017-10-24 15:23:58 +02:00
|
|
|
/**
 * Escapes a measurement name, tag key, tag value or field key.
 *
 * Double quotes, equal signs, commas and spaces are prefixed with a
 * backslash; a trailing backslash is replaced with an underscore.
 *
 * @param str The raw string; may be empty.
 * @return The escaped copy of str.
 */
String InfluxdbWriter::EscapeKeyOrTagValue(const String& str)
{
	// Escape double quotes, equal signs, commas and spaces with a backslash
	String result = str;
	boost::algorithm::replace_all(result, "\"", "\\\"");
	boost::algorithm::replace_all(result, "=", "\\=");
	boost::algorithm::replace_all(result, ",", "\\,");
	boost::algorithm::replace_all(result, " ", "\\ ");

	// InfluxDB 'feature': although backslashes are allowed in keys they also act
	// as escape sequences when followed by ',' or ' '. When your tag is like
	// 'metric=C:\' bad things happen. Backslashes themselves cannot be escaped
	// and through experimentation they also escape '='. To be safe we replace
	// trailing backslashes with an underscore.
	// See https://github.com/influxdata/influxdb/issues/8587 for more info
	size_t length = result.GetLength();

	// Guard against the empty string: length - 1 would wrap around and index out of bounds
	if (length > 0 && result[length - 1] == '\\')
		result[length - 1] = '_';

	return result;
}
|
|
|
|
|
2017-10-24 15:23:58 +02:00
|
|
|
/**
 * Renders a field value.
 *
 * - InfluxdbInteger objects become "<number>i"
 * - booleans become "true" / "false"
 * - strings are escaped via EscapeKeyOrTagValue() and wrapped in double quotes
 * - anything else goes through the plain Value-to-String conversion
 *
 * @param value The field value.
 * @return The rendered value.
 */
String InfluxdbWriter::EscapeValue(const Value& value)
{
	if (value.IsObjectType<InfluxdbInteger>()) {
		InfluxdbInteger::Ptr integer = value;

		std::ostringstream rendered;
		rendered << integer->GetValue() << "i";

		return rendered.str();
	}

	if (value.IsBoolean()) {
		if (value)
			return "true";

		return "false";
	}

	if (value.IsString()) {
		String escaped = EscapeKeyOrTagValue(value);

		return "\"" + escaped + "\"";
	}

	return value;
}
|
|
|
|
|
2019-03-19 08:35:55 +01:00
|
|
|
/**
 * Formats one data point as "<measurement>[,<tag>=<value>...] <field>=<value>[,...] <timestamp>"
 * and appends it to the data buffer, flushing once the flush threshold is reached.
 *
 * @param checkable The checkable the point belongs to (used for logging only).
 * @param tmpl Template dictionary providing "measurement" and optional "tags".
 * @param label Metric label added as "metric" tag; may be empty.
 * @param fields Field keys and values of the point.
 * @param ts Timestamp; written truncated to an unsigned integer.
 */
void InfluxdbWriter::SendMetric(const Checkable::Ptr& checkable, const Dictionary::Ptr& tmpl,
	const String& label, const Dictionary::Ptr& fields, double ts)
{
	std::ostringstream line;
	line << EscapeKeyOrTagValue(tmpl->Get("measurement"));

	Dictionary::Ptr tags = tmpl->Get("tags");
	if (tags) {
		ObjectLock tagLock(tags);
		for (const Dictionary::Pair& tag : tags) {
			// Empty macro expansion, no tag
			if (tag.second.IsEmpty())
				continue;

			line << "," << EscapeKeyOrTagValue(tag.first) << "=" << EscapeKeyOrTagValue(tag.second);
		}
	}

	// Label may be empty in the case of metadata
	if (!label.IsEmpty())
		line << ",metric=" << EscapeKeyOrTagValue(label);

	line << " ";

	{
		// Nothing precedes the first field, every later one is preceded by a comma
		const char *separator = "";

		ObjectLock fieldLock(fields);
		for (const Dictionary::Pair& field : fields) {
			line << separator << EscapeKeyOrTagValue(field.first) << "=" << EscapeValue(field.second);
			separator = ",";
		}
	}

	line << " " << static_cast<unsigned long>(ts);

	const std::string dataPoint = line.str();

	Log(LogDebug, "InfluxdbWriter")
		<< "Checkable '" << checkable->GetName() << "' adds to metric list:'" << dataPoint << "'.";

	// Buffer the data point
	m_DataBuffer.emplace_back(dataPoint);

	// Flush if we've buffered too much to prevent excessive memory use
	if (static_cast<int>(m_DataBuffer.size()) < GetFlushThreshold())
		return;

	Log(LogDebug, "InfluxdbWriter")
		<< "Data buffer overflow writing " << m_DataBuffer.size() << " data points";

	try {
		Flush();
	} catch (...) {
		/* Do nothing. */
	}
}
|
|
|
|
|
2018-01-04 04:25:35 +01:00
|
|
|
void InfluxdbWriter::FlushTimeout()
|
2016-04-19 13:54:41 +02:00
|
|
|
{
|
2017-10-24 15:23:58 +02:00
|
|
|
m_WorkQueue.Enqueue(boost::bind(&InfluxdbWriter::FlushTimeoutWQ, this), PriorityHigh);
|
|
|
|
}
|
|
|
|
|
2018-01-04 04:25:35 +01:00
|
|
|
void InfluxdbWriter::FlushTimeoutWQ()
|
2017-10-24 15:23:58 +02:00
|
|
|
{
|
|
|
|
AssertOnWorkQueue();
|
2016-04-19 13:54:41 +02:00
|
|
|
|
2017-10-24 15:23:58 +02:00
|
|
|
Log(LogDebug, "InfluxdbWriter")
|
2017-12-19 15:50:05 +01:00
|
|
|
<< "Timer expired writing " << m_DataBuffer.size() << " data points";
|
2017-10-24 15:23:58 +02:00
|
|
|
|
|
|
|
Flush();
|
2016-04-19 13:54:41 +02:00
|
|
|
}
|
|
|
|
|
2018-01-04 04:25:35 +01:00
|
|
|
void InfluxdbWriter::Flush()
|
2016-04-19 13:54:41 +02:00
|
|
|
{
|
2019-03-27 11:16:08 +01:00
|
|
|
/* Flush can be called from 1) Timeout 2) Threshold 3) on shutdown/reload. */
|
|
|
|
if (m_DataBuffer.empty())
|
|
|
|
return;
|
|
|
|
|
2019-02-20 15:21:24 +01:00
|
|
|
Log(LogDebug, "InfluxdbWriter")
|
|
|
|
<< "Flushing data buffer to InfluxDB.";
|
|
|
|
|
2017-05-04 10:29:49 +02:00
|
|
|
String body = boost::algorithm::join(m_DataBuffer, "\n");
|
|
|
|
m_DataBuffer.clear();
|
|
|
|
|
2018-06-21 15:41:40 +02:00
|
|
|
Stream::Ptr stream;
|
|
|
|
|
|
|
|
try {
|
|
|
|
stream = Connect();
|
|
|
|
} catch (const std::exception& ex) {
|
|
|
|
Log(LogWarning, "InfluxDbWriter")
|
2018-09-06 15:58:42 +02:00
|
|
|
<< "Flush failed, cannot connect to InfluxDB: " << DiagnosticInformation(ex, false);
|
2018-06-21 15:41:40 +02:00
|
|
|
return;
|
|
|
|
}
|
2016-04-19 13:54:41 +02:00
|
|
|
|
2017-05-04 10:29:49 +02:00
|
|
|
if (!stream)
|
2016-04-19 13:54:41 +02:00
|
|
|
return;
|
2017-05-04 10:29:49 +02:00
|
|
|
|
2019-03-01 14:30:49 +01:00
|
|
|
Defer close ([&stream]() { stream->Close(); });
|
|
|
|
|
2016-04-19 13:54:41 +02:00
|
|
|
Url::Ptr url = new Url();
|
|
|
|
url->SetScheme(GetSslEnable() ? "https" : "http");
|
|
|
|
url->SetHost(GetHost());
|
|
|
|
url->SetPort(GetPort());
|
|
|
|
|
|
|
|
std::vector<String> path;
|
2018-01-04 09:14:55 +01:00
|
|
|
path.emplace_back("write");
|
2016-04-19 13:54:41 +02:00
|
|
|
url->SetPath(path);
|
|
|
|
|
|
|
|
url->AddQueryElement("db", GetDatabase());
|
|
|
|
url->AddQueryElement("precision", "s");
|
|
|
|
if (!GetUsername().IsEmpty())
|
|
|
|
url->AddQueryElement("u", GetUsername());
|
|
|
|
if (!GetPassword().IsEmpty())
|
|
|
|
url->AddQueryElement("p", GetPassword());
|
|
|
|
|
|
|
|
HttpRequest req(stream);
|
|
|
|
req.RequestMethod = "POST";
|
|
|
|
req.RequestUrl = url;
|
|
|
|
|
|
|
|
try {
|
|
|
|
req.WriteBody(body.CStr(), body.GetLength());
|
|
|
|
req.Finish();
|
2017-05-04 10:29:49 +02:00
|
|
|
} catch (const std::exception& ex) {
|
2016-04-19 13:54:41 +02:00
|
|
|
Log(LogWarning, "InfluxdbWriter")
|
2017-12-19 15:50:05 +01:00
|
|
|
<< "Cannot write to TCP socket on host '" << GetHost() << "' port '" << GetPort() << "'.";
|
2017-05-04 10:29:49 +02:00
|
|
|
throw ex;
|
2016-04-19 13:54:41 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
HttpResponse resp(stream, req);
|
|
|
|
StreamReadContext context;
|
|
|
|
|
|
|
|
try {
|
2017-10-24 15:23:58 +02:00
|
|
|
while (resp.Parse(context, true) && !resp.Complete)
|
|
|
|
; /* Do nothing */
|
2017-05-04 10:29:49 +02:00
|
|
|
} catch (const std::exception& ex) {
|
2016-04-19 13:54:41 +02:00
|
|
|
Log(LogWarning, "InfluxdbWriter")
|
2017-12-19 15:50:05 +01:00
|
|
|
<< "Failed to parse HTTP response from host '" << GetHost() << "' port '" << GetPort() << "': " << DiagnosticInformation(ex);
|
2017-05-04 10:29:49 +02:00
|
|
|
throw ex;
|
2016-04-19 13:54:41 +02:00
|
|
|
}
|
|
|
|
|
2017-10-24 15:23:58 +02:00
|
|
|
if (!resp.Complete) {
|
2016-04-19 13:54:41 +02:00
|
|
|
Log(LogWarning, "InfluxdbWriter")
|
2017-12-19 15:50:05 +01:00
|
|
|
<< "Failed to read a complete HTTP response from the InfluxDB server.";
|
2017-10-24 15:23:58 +02:00
|
|
|
return;
|
|
|
|
}
|
2016-07-28 14:29:37 +02:00
|
|
|
|
2017-10-24 15:23:58 +02:00
|
|
|
if (resp.StatusCode != 204) {
|
|
|
|
Log(LogWarning, "InfluxdbWriter")
|
2017-12-19 15:50:05 +01:00
|
|
|
<< "Unexpected response code: " << resp.StatusCode;
|
2016-07-28 14:29:37 +02:00
|
|
|
|
|
|
|
String contentType = resp.Headers->Get("content-type");
|
|
|
|
if (contentType != "application/json") {
|
|
|
|
Log(LogWarning, "InfluxdbWriter")
|
2017-12-19 15:50:05 +01:00
|
|
|
<< "Unexpected Content-Type: " << contentType;
|
2016-07-28 14:29:37 +02:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
size_t responseSize = resp.GetBodySize();
|
|
|
|
boost::scoped_array<char> buffer(new char[responseSize + 1]);
|
|
|
|
resp.ReadBody(buffer.get(), responseSize);
|
|
|
|
buffer.get()[responseSize] = '\0';
|
|
|
|
|
|
|
|
Dictionary::Ptr jsonResponse;
|
|
|
|
try {
|
|
|
|
jsonResponse = JsonDecode(buffer.get());
|
|
|
|
} catch (...) {
|
|
|
|
Log(LogWarning, "InfluxdbWriter")
|
2017-12-19 15:50:05 +01:00
|
|
|
<< "Unable to parse JSON response:\n" << buffer.get();
|
2016-07-28 14:29:37 +02:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
String error = jsonResponse->Get("error");
|
|
|
|
|
|
|
|
Log(LogCritical, "InfluxdbWriter")
|
2017-12-19 15:50:05 +01:00
|
|
|
<< "InfluxDB error message:\n" << error;
|
2017-10-24 15:23:58 +02:00
|
|
|
|
|
|
|
return;
|
2016-04-19 13:54:41 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-01-11 07:08:09 +01:00
|
|
|
void InfluxdbWriter::ValidateHostTemplate(const Lazy<Dictionary::Ptr>& lvalue, const ValidationUtils& utils)
|
2016-04-19 13:54:41 +02:00
|
|
|
{
|
2018-01-11 07:08:09 +01:00
|
|
|
ObjectImpl<InfluxdbWriter>::ValidateHostTemplate(lvalue, utils);
|
2016-04-19 13:54:41 +02:00
|
|
|
|
2018-01-11 07:08:09 +01:00
|
|
|
String measurement = lvalue()->Get("measurement");
|
2016-04-19 13:54:41 +02:00
|
|
|
if (!MacroProcessor::ValidateMacroString(measurement))
|
2017-11-30 18:09:38 +01:00
|
|
|
BOOST_THROW_EXCEPTION(ValidationError(this, { "host_template", "measurement" }, "Closing $ not found in macro format string '" + measurement + "'."));
|
2016-04-19 13:54:41 +02:00
|
|
|
|
2018-01-11 07:08:09 +01:00
|
|
|
Dictionary::Ptr tags = lvalue()->Get("tags");
|
2016-04-19 13:54:41 +02:00
|
|
|
if (tags) {
|
|
|
|
ObjectLock olock(tags);
|
2016-08-25 06:19:44 +02:00
|
|
|
for (const Dictionary::Pair& pair : tags) {
|
2016-04-19 13:54:41 +02:00
|
|
|
if (!MacroProcessor::ValidateMacroString(pair.second))
|
2017-11-30 18:09:38 +01:00
|
|
|
BOOST_THROW_EXCEPTION(ValidationError(this, { "host_template", "tags", pair.first }, "Closing $ not found in macro format string '" + pair.second));
|
2016-04-19 13:54:41 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-01-11 07:08:09 +01:00
|
|
|
void InfluxdbWriter::ValidateServiceTemplate(const Lazy<Dictionary::Ptr>& lvalue, const ValidationUtils& utils)
|
2016-04-19 13:54:41 +02:00
|
|
|
{
|
2018-01-11 07:08:09 +01:00
|
|
|
ObjectImpl<InfluxdbWriter>::ValidateServiceTemplate(lvalue, utils);
|
2016-04-19 13:54:41 +02:00
|
|
|
|
2018-01-11 07:08:09 +01:00
|
|
|
String measurement = lvalue()->Get("measurement");
|
2016-04-19 13:54:41 +02:00
|
|
|
if (!MacroProcessor::ValidateMacroString(measurement))
|
2017-11-30 18:09:38 +01:00
|
|
|
BOOST_THROW_EXCEPTION(ValidationError(this, { "service_template", "measurement" }, "Closing $ not found in macro format string '" + measurement + "'."));
|
2016-04-19 13:54:41 +02:00
|
|
|
|
2018-01-11 07:08:09 +01:00
|
|
|
Dictionary::Ptr tags = lvalue()->Get("tags");
|
2016-04-19 13:54:41 +02:00
|
|
|
if (tags) {
|
|
|
|
ObjectLock olock(tags);
|
2016-08-25 06:19:44 +02:00
|
|
|
for (const Dictionary::Pair& pair : tags) {
|
2016-04-19 13:54:41 +02:00
|
|
|
if (!MacroProcessor::ValidateMacroString(pair.second))
|
2017-11-30 18:09:38 +01:00
|
|
|
BOOST_THROW_EXCEPTION(ValidationError(this, { "service_template", "tags", pair.first }, "Closing $ not found in macro format string '" + pair.second));
|
2016-04-19 13:54:41 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|