Don't use thread-local variable in coroutine & process final `cr` in global thread pool

This commit is contained in:
Yonas Habteab 2024-08-30 18:00:00 +02:00
parent c9159494c0
commit 74009f0fcb
1 changed files with 83 additions and 135 deletions

View File

@ -33,55 +33,6 @@ using namespace icinga;
REGISTER_FUNCTION_NONCONST(Internal, IfwApiCheck, &IfwApiCheckTask::ScriptFunc, "checkable:cr:resolvedMacros:useResolvedMacros"); REGISTER_FUNCTION_NONCONST(Internal, IfwApiCheck, &IfwApiCheckTask::ScriptFunc, "checkable:cr:resolvedMacros:useResolvedMacros");
static void ReportIfwCheckResult(
const Checkable::Ptr& checkable, const Value& cmdLine, const CheckResult::Ptr& cr,
const String& output, double start, double end, int exitcode = 3, const Array::Ptr& perfdata = nullptr
)
{
if (Checkable::ExecuteCommandProcessFinishedHandler) {
ProcessResult pr;
pr.PID = -1;
pr.Output = perfdata ? output + " |" + String(perfdata->Join(" ")) : output;
pr.ExecutionStart = start;
pr.ExecutionEnd = end;
pr.ExitStatus = exitcode;
Checkable::ExecuteCommandProcessFinishedHandler(cmdLine, pr);
} else {
auto splittedPerfdata (perfdata);
if (perfdata) {
splittedPerfdata = new Array();
ObjectLock oLock (perfdata);
for (String pv : perfdata) {
PluginUtility::SplitPerfdata(pv)->CopyTo(splittedPerfdata);
}
}
cr->SetOutput(output);
cr->SetPerformanceData(splittedPerfdata);
cr->SetState((ServiceState)exitcode);
cr->SetExitStatus(exitcode);
cr->SetExecutionStart(start);
cr->SetExecutionEnd(end);
cr->SetCommand(cmdLine);
checkable->ProcessCheckResult(cr);
}
}
static void ReportIfwCheckResult(
boost::asio::yield_context yc, const Checkable::Ptr& checkable, const Value& cmdLine,
const CheckResult::Ptr& cr, const String& output, double start
)
{
double end = Utility::GetTime();
CpuBoundWork cbw (yc);
ReportIfwCheckResult(checkable, cmdLine, cr, output, start, end);
}
static const char* GetUnderstandableError(const std::exception& ex) static const char* GetUnderstandableError(const std::exception& ex)
{ {
auto se (dynamic_cast<const boost::system::system_error*>(&ex)); auto se (dynamic_cast<const boost::system::system_error*>(&ex));
@ -93,10 +44,12 @@ static const char* GetUnderstandableError(const std::exception& ex)
return ex.what(); return ex.what();
} }
// Note: If DoIfwNetIo returns due to an error, the plugin output of the specified CheckResult (cr) will always be set,
// and if it was successful, the cr exit status, plugin state and performance data (if any) will also be overridden.
// Therefore, you have to take care yourself of setting all the other necessary fields for the check result.
static void DoIfwNetIo( static void DoIfwNetIo(
boost::asio::yield_context yc, const Checkable::Ptr& checkable, const Array::Ptr& cmdLine, boost::asio::yield_context yc, const CheckResult::Ptr& cr, const String& psCommand, const String& psHost, const String& san,
const CheckResult::Ptr& cr, const String& psCommand, const String& psHost, const String& san, const String& psPort, const String& psPort, AsioTlsStream& conn, boost::beast::http::request<boost::beast::http::string_body>& req
AsioTlsStream& conn, boost::beast::http::request<boost::beast::http::string_body>& req, double start
) )
{ {
namespace http = boost::beast::http; namespace http = boost::beast::http;
@ -107,11 +60,7 @@ static void DoIfwNetIo(
try { try {
Connect(conn.lowest_layer(), psHost, psPort, yc); Connect(conn.lowest_layer(), psHost, psPort, yc);
} catch (const std::exception& ex) { } catch (const std::exception& ex) {
ReportIfwCheckResult( cr->SetOutput("Can't connect to IfW API on host '" + psHost + "' port '" + psPort + "': " + GetUnderstandableError(ex));
yc, checkable, cmdLine, cr,
"Can't connect to IfW API on host '" + psHost + "' port '" + psPort + "': " + GetUnderstandableError(ex),
start
);
return; return;
} }
@ -120,12 +69,7 @@ static void DoIfwNetIo(
try { try {
sslConn.async_handshake(conn.next_layer().client, yc); sslConn.async_handshake(conn.next_layer().client, yc);
} catch (const std::exception& ex) { } catch (const std::exception& ex) {
ReportIfwCheckResult( cr->SetOutput("TLS handshake with IfW API on host '" + psHost + "' (SNI: '" + san+ "') port '" + psPort + "' failed: " + GetUnderstandableError(ex));
yc, checkable, cmdLine, cr,
"TLS handshake with IfW API on host '" + psHost + "' (SNI: '" + san
+ "') port '" + psPort + "' failed: " + GetUnderstandableError(ex),
start
);
return; return;
} }
@ -135,15 +79,10 @@ static void DoIfwNetIo(
try { try {
cn = GetCertificateCN(cert); cn = GetCertificateCN(cert);
} catch (const std::exception&) { } catch (const std::exception&) { }
}
ReportIfwCheckResult( cr->SetOutput("Certificate validation failed for IfW API on host '" + psHost + "' (SNI: '" + san + "'; CN: "
yc, checkable, cmdLine, cr, + (cn.IsString() ? "'" + cn + "'" : "N/A") + ") port '" + psPort + "': " + sslConn.GetVerifyError());
"Certificate validation failed for IfW API on host '" + psHost + "' (SNI: '" + san + "'; CN: "
+ (cn.IsString() ? "'" + cn + "'" : "N/A") + ") port '" + psPort + "': " + sslConn.GetVerifyError(),
start
);
return; return;
} }
@ -151,87 +90,56 @@ static void DoIfwNetIo(
http::async_write(conn, req, yc); http::async_write(conn, req, yc);
conn.async_flush(yc); conn.async_flush(yc);
} catch (const std::exception& ex) { } catch (const std::exception& ex) {
ReportIfwCheckResult( cr->SetOutput("Can't send HTTP request to IfW API on host '" + psHost + "' port '" + psPort + "': " + GetUnderstandableError(ex));
yc, checkable, cmdLine, cr,
"Can't send HTTP request to IfW API on host '" + psHost + "' port '" + psPort + "': " + GetUnderstandableError(ex),
start
);
return; return;
} }
try { try {
http::async_read(conn, buf, resp, yc); http::async_read(conn, buf, resp, yc);
} catch (const std::exception& ex) { } catch (const std::exception& ex) {
ReportIfwCheckResult( cr->SetOutput("Can't read HTTP response from IfW API on host '" + psHost + "' port '" + psPort + "': " + GetUnderstandableError(ex));
yc, checkable, cmdLine, cr,
"Can't read HTTP response from IfW API on host '" + psHost + "' port '" + psPort + "': " + GetUnderstandableError(ex),
start
);
return; return;
} }
double end = Utility::GetTime();
{ {
boost::system::error_code ec; boost::system::error_code ec;
sslConn.async_shutdown(yc[ec]); sslConn.async_shutdown(yc[ec]);
} }
CpuBoundWork cbw (yc);
Value jsonRoot; Value jsonRoot;
try { try {
jsonRoot = JsonDecode(resp.body()); jsonRoot = JsonDecode(resp.body());
} catch (const std::exception& ex) { } catch (const std::exception& ex) {
ReportIfwCheckResult( cr->SetOutput("Got bad JSON from IfW API on host '" + psHost + "' port '" + psPort + "': " + ex.what());
checkable, cmdLine, cr,
"Got bad JSON from IfW API on host '" + psHost + "' port '" + psPort + "': " + ex.what(), start, end
);
return; return;
} }
if (!jsonRoot.IsObjectType<Dictionary>()) { if (!jsonRoot.IsObjectType<Dictionary>()) {
ReportIfwCheckResult( cr->SetOutput("Got JSON, but not an object, from IfW API on host '"+ psHost + "' port '" + psPort + "': " + JsonEncode(jsonRoot));
checkable, cmdLine, cr,
"Got JSON, but not an object, from IfW API on host '"
+ psHost + "' port '" + psPort + "': " + JsonEncode(jsonRoot),
start, end
);
return; return;
} }
Value jsonBranch; Value jsonBranch;
if (!Dictionary::Ptr(jsonRoot)->Get(psCommand, &jsonBranch)) { if (!Dictionary::Ptr(jsonRoot)->Get(psCommand, &jsonBranch)) {
ReportIfwCheckResult( cr->SetOutput("Missing ." + psCommand + " in JSON object from IfW API on host '" + psHost + "' port '" + psPort + "': " + JsonEncode(jsonRoot));
checkable, cmdLine, cr,
"Missing ." + psCommand + " in JSON object from IfW API on host '"
+ psHost + "' port '" + psPort + "': " + JsonEncode(jsonRoot),
start, end
);
return; return;
} }
if (!jsonBranch.IsObjectType<Dictionary>()) { if (!jsonBranch.IsObjectType<Dictionary>()) {
ReportIfwCheckResult( cr->SetOutput("." + psCommand + " in JSON from IfW API on host '" + psHost + "' port '" + psPort + "' is not an object: " + JsonEncode(jsonBranch));
checkable, cmdLine, cr,
"." + psCommand + " in JSON from IfW API on host '"
+ psHost + "' port '" + psPort + "' is not an object: " + JsonEncode(jsonBranch),
start, end
);
return; return;
} }
Dictionary::Ptr result = jsonBranch; Dictionary::Ptr result = jsonBranch;
Value exitcode; Value rawExitcode;
if (!result->Get("exitcode", &exitcode)) { if (!result->Get("exitcode", &rawExitcode)) {
ReportIfwCheckResult( cr->SetOutput(
checkable, cmdLine, cr,
"Missing ." + psCommand + ".exitcode in JSON object from IfW API on host '" "Missing ." + psCommand + ".exitcode in JSON object from IfW API on host '"
+ psHost + "' port '" + psPort + "': " + JsonEncode(result), + psHost + "' port '" + psPort + "': " + JsonEncode(result)
start, end
); );
return; return;
} }
@ -239,27 +147,25 @@ static void DoIfwNetIo(
static const std::set<double> exitcodes {ServiceOK, ServiceWarning, ServiceCritical, ServiceUnknown}; static const std::set<double> exitcodes {ServiceOK, ServiceWarning, ServiceCritical, ServiceUnknown};
static const auto exitcodeList (Array::FromSet(exitcodes)->Join(", ")); static const auto exitcodeList (Array::FromSet(exitcodes)->Join(", "));
if (!exitcode.IsNumber() || exitcodes.find(exitcode) == exitcodes.end()) { if (!rawExitcode.IsNumber() || exitcodes.find(rawExitcode) == exitcodes.end()) {
ReportIfwCheckResult( cr->SetOutput(
checkable, cmdLine, cr, "Got bad exitcode " + JsonEncode(rawExitcode) + " from IfW API on host '" + psHost + "' port '" + psPort
"Got bad exitcode " + JsonEncode(exitcode) + " from IfW API on host '" + psHost + "' port '" + psPort + "', expected one of: " + exitcodeList
+ "', expected one of: " + exitcodeList,
start, end
); );
return; return;
} }
auto exitcode (static_cast<ServiceState>(rawExitcode.Get<double>()));
auto perfdataVal (result->Get("perfdata")); auto perfdataVal (result->Get("perfdata"));
Array::Ptr perfdata; Array::Ptr perfdata;
try { try {
perfdata = perfdataVal; perfdata = perfdataVal;
} catch (const std::exception&) { } catch (const std::exception&) {
ReportIfwCheckResult( cr->SetOutput(
checkable, cmdLine, cr,
"Got bad perfdata " + JsonEncode(perfdataVal) + " from IfW API on host '" "Got bad perfdata " + JsonEncode(perfdataVal) + " from IfW API on host '"
+ psHost + "' port '" + psPort + "', expected an array", + psHost + "' port '" + psPort + "', expected an array"
start, end
); );
return; return;
} }
@ -269,18 +175,20 @@ static void DoIfwNetIo(
for (auto& pv : perfdata) { for (auto& pv : perfdata) {
if (!pv.IsString()) { if (!pv.IsString()) {
ReportIfwCheckResult( cr->SetOutput(
checkable, cmdLine, cr,
"Got bad perfdata value " + JsonEncode(perfdata) + " from IfW API on host '" "Got bad perfdata value " + JsonEncode(perfdata) + " from IfW API on host '"
+ psHost + "' port '" + psPort + "', expected an array of strings", + psHost + "' port '" + psPort + "', expected an array of strings"
start, end
); );
return; return;
} }
} }
cr->SetPerformanceData(PluginUtility::SplitPerfdata(perfdata->Join(" ")));
} }
ReportIfwCheckResult(checkable, cmdLine, cr, result->Get("checkresult"), start, end, exitcode, perfdata); cr->SetState(exitcode);
cr->SetExitStatus(exitcode);
cr->SetOutput(result->Get("checkresult"));
} }
void IfwApiCheckTask::ScriptFunc(const Checkable::Ptr& checkable, const CheckResult::Ptr& cr, void IfwApiCheckTask::ScriptFunc(const Checkable::Ptr& checkable, const CheckResult::Ptr& cr,
@ -344,6 +252,34 @@ void IfwApiCheckTask::ScriptFunc(const Checkable::Ptr& checkable, const CheckRes
String username = resolveMacros("$ifw_api_username$"); String username = resolveMacros("$ifw_api_username$");
String password = resolveMacros("$ifw_api_password$"); String password = resolveMacros("$ifw_api_password$");
// Use this lambda to process the final Ifw check result. Callers don't need to pass the check result
// as an argument, as the lambda already captures the `cr` and notices all the `cr` changes made across
// the code. You just need to set the necessary cr fields when appropriated and then call this closure.
std::function<void()> reportResult;
if (auto callback = Checkable::ExecuteCommandProcessFinishedHandler; callback) {
reportResult = [cr, callback = std::move(callback)]() {
ProcessResult pr;
pr.PID = -1;
if (auto pd = cr->GetPerformanceData(); pd) {
pr.Output = cr->GetOutput() +" |" + String(pd->Join(" "));
} else {
pr.Output = cr->GetOutput();
}
pr.ExecutionStart = cr->GetExecutionStart();
pr.ExecutionEnd = cr->GetExecutionEnd();
pr.ExitStatus = cr->GetExitStatus();
callback(cr->GetCommand(), pr);
};
} else {
reportResult = [checkable, cr]() { checkable->ProcessCheckResult(cr); };
}
// Set the default check result state and exit code to unknown for the moment!
cr->SetExitStatus(ServiceUnknown);
cr->SetState(ServiceUnknown);
Dictionary::Ptr params = new Dictionary(); Dictionary::Ptr params = new Dictionary();
if (arguments) { if (arguments) {
@ -369,11 +305,12 @@ void IfwApiCheckTask::ScriptFunc(const Checkable::Ptr& checkable, const CheckRes
if (kv.second.GetType() == ValueObject) { if (kv.second.GetType() == ValueObject) {
auto now (Utility::GetTime()); auto now (Utility::GetTime());
ReportIfwCheckResult( cr->SetCommand(command->GetName());
checkable, command->GetName(), cr, cr->SetExecutionStart(now);
"$ifw_api_arguments$ may not directly contain objects (especially functions).", now, now cr->SetExecutionEnd(now);
); cr->SetOutput("$ifw_api_arguments$ may not directly contain objects (especially functions).");
reportResult();
return; return;
} }
} }
@ -498,12 +435,17 @@ void IfwApiCheckTask::ScriptFunc(const Checkable::Ptr& checkable, const CheckRes
auto& io (IoEngine::Get().GetIoContext()); auto& io (IoEngine::Get().GetIoContext());
auto strand (Shared<asio::io_context::strand>::Make(io)); auto strand (Shared<asio::io_context::strand>::Make(io));
Shared<asio::ssl::context>::Ptr ctx; Shared<asio::ssl::context>::Ptr ctx;
double start = Utility::GetTime();
cr->SetExecutionStart(Utility::GetTime());
cr->SetCommand(cmdLine);
try { try {
ctx = SetupSslContext(cert, key, ca, crl, DEFAULT_TLS_CIPHERS, DEFAULT_TLS_PROTOCOLMIN, DebugInfo()); ctx = SetupSslContext(cert, key, ca, crl, DEFAULT_TLS_CIPHERS, DEFAULT_TLS_PROTOCOLMIN, DebugInfo());
} catch (const std::exception& ex) { } catch (const std::exception& ex) {
ReportIfwCheckResult(checkable, cmdLine, cr, ex.what(), start, Utility::GetTime()); cr->SetOutput(ex.what());
cr->SetExecutionEnd(Utility::GetTime());
reportResult();
return; return;
} }
@ -511,7 +453,7 @@ void IfwApiCheckTask::ScriptFunc(const Checkable::Ptr& checkable, const CheckRes
IoEngine::SpawnCoroutine( IoEngine::SpawnCoroutine(
*strand, *strand,
[strand, checkable, cmdLine, cr, psCommand, psHost, expectedSan, psPort, conn, req, start, checkTimeout](asio::yield_context yc) { [strand, checkable, cr, psCommand, psHost, expectedSan, psPort, conn, req, checkTimeout, reportResult = std::move(reportResult)](asio::yield_context yc) {
Timeout::Ptr timeout = new Timeout(strand->context(), *strand, boost::posix_time::microseconds(int64_t(checkTimeout * 1e6)), Timeout::Ptr timeout = new Timeout(strand->context(), *strand, boost::posix_time::microseconds(int64_t(checkTimeout * 1e6)),
[&conn, &checkable](boost::asio::yield_context yc) { [&conn, &checkable](boost::asio::yield_context yc) {
Log(LogNotice, "IfwApiCheckTask") Log(LogNotice, "IfwApiCheckTask")
@ -525,7 +467,13 @@ void IfwApiCheckTask::ScriptFunc(const Checkable::Ptr& checkable, const CheckRes
Defer cancelTimeout ([&timeout]() { timeout->Cancel(); }); Defer cancelTimeout ([&timeout]() { timeout->Cancel(); });
DoIfwNetIo(yc, checkable, cmdLine, cr, psCommand, psHost, expectedSan, psPort, *conn, *req, start); DoIfwNetIo(yc, cr, psCommand, psHost, expectedSan, psPort, *conn, *req);
cr->SetExecutionEnd(Utility::GetTime());
// Post the check result processing to the global pool not to block the I/O threads,
// which could affect processing important RPC messages and HTTP connections.
Utility::QueueAsyncCallback(reportResult);
} }
); );
} }