2019-02-25 14:48:22 +01:00
|
|
|
/* Icinga 2 | (c) 2012 Icinga GmbH | GPLv2+ */
|
2014-10-06 14:21:18 +02:00
|
|
|
|
|
|
|
#include "cli/daemoncommand.hpp"
|
2015-01-22 12:10:32 +01:00
|
|
|
#include "cli/daemonutility.hpp"
|
2016-05-11 12:50:08 +02:00
|
|
|
#include "remote/apilistener.hpp"
|
2016-06-03 14:16:52 +02:00
|
|
|
#include "remote/configobjectutility.hpp"
|
2014-10-06 14:21:18 +02:00
|
|
|
#include "config/configcompiler.hpp"
|
2014-12-18 15:11:57 +01:00
|
|
|
#include "config/configcompilercontext.hpp"
|
2014-10-06 14:21:18 +02:00
|
|
|
#include "config/configitembuilder.hpp"
|
2019-07-16 11:28:20 +02:00
|
|
|
#include "base/atomic.hpp"
|
2019-07-15 16:08:08 +02:00
|
|
|
#include "base/defer.hpp"
|
2014-10-19 14:21:12 +02:00
|
|
|
#include "base/logger.hpp"
|
2014-10-06 14:21:18 +02:00
|
|
|
#include "base/application.hpp"
|
|
|
|
#include "base/timer.hpp"
|
|
|
|
#include "base/utility.hpp"
|
|
|
|
#include "base/exception.hpp"
|
|
|
|
#include "base/convert.hpp"
|
2014-12-14 11:33:45 +01:00
|
|
|
#include "base/scriptglobal.hpp"
|
2014-10-06 14:21:18 +02:00
|
|
|
#include "base/context.hpp"
|
|
|
|
#include "config.h"
|
2019-07-12 18:14:02 +02:00
|
|
|
#include <cstdint>
|
|
|
|
#include <cstring>
|
2014-10-06 14:21:18 +02:00
|
|
|
#include <boost/program_options.hpp>
|
|
|
|
#include <iostream>
|
2015-12-16 15:57:59 +01:00
|
|
|
#include <fstream>
|
2014-10-06 14:21:18 +02:00
|
|
|
|
2019-07-19 17:58:56 +02:00
|
|
|
#ifdef _WIN32
|
|
|
|
#include <windows.h>
|
|
|
|
#else /* _WIN32 */
|
2019-07-12 18:14:02 +02:00
|
|
|
#include <signal.h>
|
|
|
|
#include <sys/types.h>
|
|
|
|
#include <sys/wait.h>
|
|
|
|
#include <unistd.h>
|
|
|
|
#endif /* _WIN32 */
|
|
|
|
|
2019-07-15 16:58:34 +02:00
|
|
|
#ifdef HAVE_SYSTEMD
|
|
|
|
#include <systemd/sd-daemon.h>
|
|
|
|
#endif /* HAVE_SYSTEMD */
|
|
|
|
|
2014-10-06 14:21:18 +02:00
|
|
|
using namespace icinga;
|
|
|
|
namespace po = boost::program_options;
|
|
|
|
|
|
|
|
static po::variables_map g_AppParams;
|
|
|
|
|
|
|
|
REGISTER_CLICOMMAND("daemon", DaemonCommand);
|
|
|
|
|
2018-05-30 13:21:39 +02:00
|
|
|
/*
|
|
|
|
* Daemonize(). On error, this function logs by itself and exits (i.e. does not return).
|
|
|
|
*
|
|
|
|
* Implementation note: We're only supposed to call exit() in one of the forked processes.
|
|
|
|
* The other process calls _exit(). This prevents issues with exit handlers like atexit().
|
|
|
|
*/
|
|
|
|
static void Daemonize() noexcept
|
2014-10-06 14:21:18 +02:00
|
|
|
{
|
|
|
|
#ifndef _WIN32
|
2018-05-30 13:21:39 +02:00
|
|
|
try {
|
|
|
|
Application::UninitializeBase();
|
|
|
|
} catch (const std::exception& ex) {
|
|
|
|
Log(LogCritical, "cli")
|
|
|
|
<< "Failed to stop thread pool before daemonizing, unexpected error: " << DiagnosticInformation(ex);
|
|
|
|
exit(EXIT_FAILURE);
|
|
|
|
}
|
2014-11-27 08:04:07 +01:00
|
|
|
|
2014-10-06 14:21:18 +02:00
|
|
|
pid_t pid = fork();
|
|
|
|
if (pid == -1) {
|
2018-05-30 13:21:39 +02:00
|
|
|
Log(LogCritical, "cli")
|
|
|
|
<< "fork() failed with error code " << errno << ", \"" << Utility::FormatErrorNumber(errno) << "\"";
|
|
|
|
exit(EXIT_FAILURE);
|
2014-10-06 14:21:18 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
if (pid) {
|
|
|
|
// systemd requires that the pidfile of the daemon is written before the forking
|
|
|
|
// process terminates. So wait till either the forked daemon has written a pidfile or died.
|
|
|
|
|
|
|
|
int status;
|
|
|
|
int ret;
|
|
|
|
pid_t readpid;
|
|
|
|
do {
|
|
|
|
Utility::Sleep(0.1);
|
|
|
|
|
2018-08-09 15:37:23 +02:00
|
|
|
readpid = Application::ReadPidFile(Configuration::PidPath);
|
2014-10-06 14:21:18 +02:00
|
|
|
ret = waitpid(pid, &status, WNOHANG);
|
|
|
|
} while (readpid != pid && ret == 0);
|
|
|
|
|
|
|
|
if (ret == pid) {
|
|
|
|
Log(LogCritical, "cli", "The daemon could not be started. See log output for details.");
|
2015-02-26 17:09:45 +01:00
|
|
|
_exit(EXIT_FAILURE);
|
2014-10-06 14:21:18 +02:00
|
|
|
} else if (ret == -1) {
|
2014-10-19 17:52:17 +02:00
|
|
|
Log(LogCritical, "cli")
|
2017-12-19 15:50:05 +01:00
|
|
|
<< "waitpid() failed with error code " << errno << ", \"" << Utility::FormatErrorNumber(errno) << "\"";
|
2015-02-26 17:09:45 +01:00
|
|
|
_exit(EXIT_FAILURE);
|
2014-10-06 14:21:18 +02:00
|
|
|
}
|
|
|
|
|
2015-02-26 17:09:45 +01:00
|
|
|
_exit(EXIT_SUCCESS);
|
2014-10-06 14:21:18 +02:00
|
|
|
}
|
2014-11-27 08:04:07 +01:00
|
|
|
|
2018-07-19 13:34:12 +02:00
|
|
|
Log(LogDebug, "Daemonize()")
|
|
|
|
<< "Child process with PID " << Utility::GetPid() << " continues; re-initializing base.";
|
|
|
|
|
Fix logging under systemd
icinga2.service used `-e ${ICINGA2_ERROR_LOG}`, but this is documented
as having no effect without `-d`. Furthermore, icinga2 under systemd
unconditionally logged everything to the system log (but without setting
the log level etc), which contradicted the documentation. (Issue #6339)
Stop icinga2 on systemd from logging to stdout - and hence the system log -
once it has finished starting up. Just like when you start icinga2 from a
terminal using `-d`. And just like -d, we stop logging fatal errors to
stderr, and instead write to the log file passed with `-e`.
As per docs, mainlog (icinga2.log) is already enabled by default. And
pre-startup messages including config errors will still appear in the
system log.
This uses a new option --close-stdio, which has the same effect on logging as
--daemonize, but does not fork or call setsid().
For this purpose, I moved setsid() up and into Daemonize().
Consequence of that last point: if anyone is weird enough to specify a TTY
device file as the fatal error log (-e option), that will become icinga's
controlling terminal, which you generally don't want as a daemon. This
makes it consistent with the existing behaviour for icinga mainlog. For
this reason you're supposed to use O_NOCTTY in Linux daemons. But I wasn't
sure where icinga would want to put the ugly `#ifdef _WIN32 ... #else ...`.
2018-05-29 18:24:05 +02:00
|
|
|
// Detach from controlling terminal
|
|
|
|
pid_t sid = setsid();
|
|
|
|
if (sid == -1) {
|
|
|
|
Log(LogCritical, "cli")
|
|
|
|
<< "setsid() failed with error code " << errno << ", \"" << Utility::FormatErrorNumber(errno) << "\"";
|
|
|
|
exit(EXIT_FAILURE);
|
|
|
|
}
|
|
|
|
|
2018-05-30 13:21:39 +02:00
|
|
|
try {
|
|
|
|
Application::InitializeBase();
|
|
|
|
} catch (const std::exception& ex) {
|
|
|
|
Log(LogCritical, "cli")
|
|
|
|
<< "Failed to re-initialize thread pool after daemonizing: " << DiagnosticInformation(ex);
|
|
|
|
exit(EXIT_FAILURE);
|
|
|
|
}
|
2014-10-06 14:21:18 +02:00
|
|
|
#endif /* _WIN32 */
|
|
|
|
}
|
|
|
|
|
Fix logging under systemd
icinga2.service used `-e ${ICINGA2_ERROR_LOG}`, but this is documented
as having no effect without `-d`. Furthermore, icinga2 under systemd
unconditionally logged everything to the system log (but without setting
the log level etc), which contradicted the documentation. (Issue #6339)
Stop icinga2 on systemd from logging to stdout - and hence the system log -
once it has finished starting up. Just like when you start icinga2 from a
terminal using `-d`. And just like -d, we stop logging fatal errors to
stderr, and instead write to the log file passed with `-e`.
As per docs, mainlog (icinga2.log) is already enabled by default. And
pre-startup messages including config errors will still appear in the
system log.
This uses a new option --close-stdio, which has the same effect on logging as
--daemonize, but does not fork or call setsid().
For this purpose, I moved setsid() up and into Daemonize().
Consequence of that last point: if anyone is weird enough to specify a TTY
device file as the fatal error log (-e option), that will become icinga's
controlling terminal, which you generally don't want as a daemon. This
makes it consistent with the existing behaviour for icinga mainlog. For
this reason you're supposed to use O_NOCTTY in Linux daemons. But I wasn't
sure where icinga would want to put the ugly `#ifdef _WIN32 ... #else ...`.
2018-05-29 18:24:05 +02:00
|
|
|
static void CloseStdIO(const String& stderrFile)
|
2014-10-06 14:21:18 +02:00
|
|
|
{
|
|
|
|
#ifndef _WIN32
|
|
|
|
int fdnull = open("/dev/null", O_RDWR);
|
|
|
|
if (fdnull >= 0) {
|
|
|
|
if (fdnull != 0)
|
|
|
|
dup2(fdnull, 0);
|
|
|
|
|
|
|
|
if (fdnull != 1)
|
|
|
|
dup2(fdnull, 1);
|
|
|
|
|
|
|
|
if (fdnull > 1)
|
|
|
|
close(fdnull);
|
|
|
|
}
|
|
|
|
|
|
|
|
const char *errPath = "/dev/null";
|
|
|
|
|
|
|
|
if (!stderrFile.IsEmpty())
|
|
|
|
errPath = stderrFile.CStr();
|
|
|
|
|
|
|
|
int fderr = open(errPath, O_WRONLY | O_APPEND);
|
|
|
|
|
|
|
|
if (fderr < 0 && errno == ENOENT)
|
|
|
|
fderr = open(errPath, O_CREAT | O_WRONLY | O_APPEND, 0600);
|
|
|
|
|
2015-03-03 07:36:43 +01:00
|
|
|
if (fderr >= 0) {
|
2014-10-06 14:21:18 +02:00
|
|
|
if (fderr != 2)
|
|
|
|
dup2(fderr, 2);
|
|
|
|
|
|
|
|
if (fderr > 2)
|
|
|
|
close(fderr);
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
2018-01-04 04:25:35 +01:00
|
|
|
/**
 * @returns The description text of the "daemon" CLI command.
 */
String DaemonCommand::GetDescription() const
{
	return String("Starts Icinga 2.");
}
|
|
|
|
|
2018-01-04 04:25:35 +01:00
|
|
|
/**
 * @returns The short description text of the "daemon" CLI command.
 */
String DaemonCommand::GetShortDescription() const
{
	return String("starts Icinga 2");
}
|
|
|
|
|
2014-10-10 11:08:24 +02:00
|
|
|
void DaemonCommand::InitParameters(boost::program_options::options_description& visibleDesc,
|
2017-12-19 15:50:05 +01:00
|
|
|
boost::program_options::options_description& hiddenDesc) const
|
2014-10-06 14:21:18 +02:00
|
|
|
{
|
2014-10-10 11:08:24 +02:00
|
|
|
visibleDesc.add_options()
|
2014-10-06 14:21:18 +02:00
|
|
|
("config,c", po::value<std::vector<std::string> >(), "parse a configuration file")
|
|
|
|
("no-config,z", "start without a configuration file")
|
|
|
|
("validate,C", "exit after validating the configuration")
|
Fix logging under systemd
icinga2.service used `-e ${ICINGA2_ERROR_LOG}`, but this is documented
as having no effect without `-d`. Furthermore, icinga2 under systemd
unconditionally logged everything to the system log (but without setting
the log level etc), which contradicted the documentation. (Issue #6339)
Stop icinga2 on systemd from logging to stdout - and hence the system log -
once it has finished starting up. Just like when you start icinga2 from a
terminal using `-d`. And just like -d, we stop logging fatal errors to
stderr, and instead write to the log file passed with `-e`.
As per docs, mainlog (icinga2.log) is already enabled by default. And
pre-startup messages including config errors will still appear in the
system log.
This uses a new option --close-stdio, which has the same effect on logging as
--daemonize, but does not fork or call setsid().
For this purpose, I moved setsid() up and into Daemonize().
Consequence of that last point: if anyone is weird enough to specify a TTY
device file as the fatal error log (-e option), that will become icinga's
controlling terminal, which you generally don't want as a daemon. This
makes it consistent with the existing behaviour for icinga mainlog. For
this reason you're supposed to use O_NOCTTY in Linux daemons. But I wasn't
sure where icinga would want to put the ugly `#ifdef _WIN32 ... #else ...`.
2018-05-29 18:24:05 +02:00
|
|
|
("errorlog,e", po::value<std::string>(), "log fatal errors to the specified log file (only works in combination with --daemonize or --close-stdio)")
|
2014-10-06 14:21:18 +02:00
|
|
|
#ifndef _WIN32
|
|
|
|
("daemonize,d", "detach from the controlling terminal")
|
Fix logging under systemd
icinga2.service used `-e ${ICINGA2_ERROR_LOG}`, but this is documented
as having no effect without `-d`. Furthermore, icinga2 under systemd
unconditionally logged everything to the system log (but without setting
the log level etc), which contradicted the documentation. (Issue #6339)
Stop icinga2 on systemd from logging to stdout - and hence the system log -
once it has finished starting up. Just like when you start icinga2 from a
terminal using `-d`. And just like -d, we stop logging fatal errors to
stderr, and instead write to the log file passed with `-e`.
As per docs, mainlog (icinga2.log) is already enabled by default. And
pre-startup messages including config errors will still appear in the
system log.
This uses a new option --close-stdio, which has the same effect on logging as
--daemonize, but does not fork or call setsid().
For this purpose, I moved setsid() up and into Daemonize().
Consequence of that last point: if anyone is weird enough to specify a TTY
device file as the fatal error log (-e option), that will become icinga's
controlling terminal, which you generally don't want as a daemon. This
makes it consistent with the existing behaviour for icinga mainlog. For
this reason you're supposed to use O_NOCTTY in Linux daemons. But I wasn't
sure where icinga would want to put the ugly `#ifdef _WIN32 ... #else ...`.
2018-05-29 18:24:05 +02:00
|
|
|
("close-stdio", "do not log to stdout (or stderr) after startup")
|
2014-10-06 14:21:18 +02:00
|
|
|
#endif /* _WIN32 */
|
|
|
|
;
|
2014-10-17 15:54:46 +02:00
|
|
|
}
|
2014-10-14 16:45:00 +02:00
|
|
|
|
2014-10-17 15:54:46 +02:00
|
|
|
std::vector<String> DaemonCommand::GetArgumentSuggestions(const String& argument, const String& word) const
|
|
|
|
{
|
|
|
|
if (argument == "config" || argument == "errorlog")
|
|
|
|
return GetBashCompletionSuggestions("file", word);
|
|
|
|
else
|
|
|
|
return CLICommand::GetArgumentSuggestions(argument, word);
|
2014-10-06 14:21:18 +02:00
|
|
|
}
|
|
|
|
|
2019-07-12 18:14:02 +02:00
|
|
|
#ifndef _WIN32
|
2019-07-16 11:11:10 +02:00
|
|
|
// The PID of the Icinga umbrella process
|
2019-07-12 18:14:02 +02:00
|
|
|
pid_t l_UmbrellaPid = 0;
|
2019-07-16 11:11:10 +02:00
|
|
|
|
|
|
|
// Whether the umbrella process allowed us to continue working beyond config validation
|
2019-07-16 11:28:20 +02:00
|
|
|
static Atomic<bool> l_AllowedToWork (false);
|
2019-07-12 18:14:02 +02:00
|
|
|
#endif /* _WIN32 */
|
|
|
|
|
2020-01-29 12:38:12 +01:00
|
|
|
#ifdef I2_DEBUG
/**
 * Looks up how long the worker process should pause at startup so that
 * a developer can attach a debugger to it.
 *
 * @return Internal.DebugWorkerDelay as double, or 0.0 if the "Internal"
 *         namespace or that variable isn't available
 */
static double GetDebugWorkerDelay()
{
	Namespace::Ptr internalNs = ScriptGlobal::Get("Internal", &Empty);
	Value configuredDelay;

	if (!internalNs)
		return 0.0;

	if (!internalNs->Get("DebugWorkerDelay", &configuredDelay))
		return 0.0;

	return Convert::ToDouble(configuredDelay);
}
#endif /* I2_DEBUG */
|
|
|
|
|
2019-07-16 11:11:10 +02:00
|
|
|
/**
|
|
|
|
* Do the actual work (config loading, ...)
|
|
|
|
*
|
|
|
|
* @param configs Files to read config from
|
2019-08-05 18:30:45 +02:00
|
|
|
* @param closeConsoleLog Whether to close the console log after config loading
|
|
|
|
* @param stderrFile Where to log errors
|
2019-07-16 11:11:10 +02:00
|
|
|
*
|
|
|
|
* @return Exit code
|
|
|
|
*/
|
2019-07-12 18:14:02 +02:00
|
|
|
static inline
|
2019-08-05 18:30:45 +02:00
|
|
|
int RunWorker(const std::vector<std::string>& configs, bool closeConsoleLog = false, const String& stderrFile = String())
|
2019-07-12 18:14:02 +02:00
|
|
|
{
|
2020-01-29 12:38:12 +01:00
|
|
|
|
|
|
|
#ifdef I2_DEBUG
|
|
|
|
double delay = GetDebugWorkerDelay();
|
|
|
|
|
|
|
|
if (delay > 0.0) {
|
|
|
|
Log(LogInformation, "RunWorker")
|
|
|
|
<< "DEBUG: Current PID: " << Utility::GetPid() << ". Sleeping for " << delay << " seconds to allow lldb/gdb -p <PID> attachment.";
|
|
|
|
|
|
|
|
Utility::Sleep(delay);
|
|
|
|
}
|
|
|
|
#endif /* I2_DEBUG */
|
|
|
|
|
2019-07-12 18:14:02 +02:00
|
|
|
Log(LogInformation, "cli", "Loading configuration file(s).");
|
|
|
|
|
|
|
|
{
|
|
|
|
std::vector<ConfigItem::Ptr> newItems;
|
|
|
|
|
2019-08-07 12:03:17 +02:00
|
|
|
if (!DaemonUtility::LoadConfigFiles(configs, newItems, Configuration::ObjectsPath, Configuration::VarsPath)) {
|
|
|
|
Log(LogCritical, "cli", "Config validation failed. Re-run with 'icinga2 daemon -C' after fixing the config.");
|
2019-07-12 18:14:02 +02:00
|
|
|
return EXIT_FAILURE;
|
2019-08-07 12:03:17 +02:00
|
|
|
}
|
2019-07-12 18:14:02 +02:00
|
|
|
|
|
|
|
#ifndef _WIN32
|
2019-07-16 11:43:47 +02:00
|
|
|
Log(LogNotice, "cli")
|
|
|
|
<< "Notifying umbrella process (PID " << l_UmbrellaPid << ") about the config loading success";
|
2019-07-15 18:29:15 +02:00
|
|
|
|
2019-07-12 18:14:02 +02:00
|
|
|
(void)kill(l_UmbrellaPid, SIGUSR2);
|
2019-07-15 12:11:19 +02:00
|
|
|
|
2019-07-16 11:43:47 +02:00
|
|
|
Log(LogNotice, "cli")
|
|
|
|
<< "Waiting for the umbrella process to let us doing the actual work";
|
2019-07-15 18:29:15 +02:00
|
|
|
|
2019-08-05 18:30:45 +02:00
|
|
|
if (closeConsoleLog) {
|
|
|
|
CloseStdIO(stderrFile);
|
|
|
|
Logger::DisableConsoleLog();
|
|
|
|
}
|
|
|
|
|
2019-07-15 12:11:19 +02:00
|
|
|
while (!l_AllowedToWork.load()) {
|
|
|
|
Utility::Sleep(0.2);
|
|
|
|
}
|
2019-07-15 18:29:15 +02:00
|
|
|
|
2019-07-16 11:43:47 +02:00
|
|
|
Log(LogNotice, "cli")
|
|
|
|
<< "The umbrella process let us continuing";
|
2019-07-12 18:14:02 +02:00
|
|
|
#endif /* _WIN32 */
|
|
|
|
|
|
|
|
/* restore the previous program state */
|
|
|
|
try {
|
|
|
|
ConfigObject::RestoreObjects(Configuration::StatePath);
|
|
|
|
} catch (const std::exception& ex) {
|
|
|
|
Log(LogCritical, "cli")
|
|
|
|
<< "Failed to restore state file: " << DiagnosticInformation(ex);
|
|
|
|
return EXIT_FAILURE;
|
|
|
|
}
|
|
|
|
|
|
|
|
WorkQueue upq(25000, Configuration::Concurrency);
|
|
|
|
upq.SetName("DaemonCommand::Run");
|
|
|
|
|
|
|
|
// activate config only after daemonization: it starts threads and that is not compatible with fork()
|
|
|
|
if (!ConfigItem::ActivateItems(upq, newItems, false, false, true)) {
|
|
|
|
Log(LogCritical, "cli", "Error activating configuration.");
|
|
|
|
return EXIT_FAILURE;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Create the internal API object storage. Do this here too with setups without API. */
|
|
|
|
ConfigObjectUtility::CreateStorage();
|
|
|
|
|
|
|
|
/* Remove ignored Downtime/Comment objects. */
|
|
|
|
try {
|
|
|
|
String configDir = ConfigObjectUtility::GetConfigDir();
|
|
|
|
ConfigItem::RemoveIgnoredItems(configDir);
|
|
|
|
} catch (const std::exception& ex) {
|
|
|
|
Log(LogNotice, "cli")
|
|
|
|
<< "Cannot clean ignored downtimes/comments: " << ex.what();
|
|
|
|
}
|
|
|
|
|
|
|
|
ApiListener::UpdateObjectAuthority();
|
|
|
|
|
|
|
|
return Application::GetInstance()->Run();
|
|
|
|
}
|
|
|
|
|
|
|
|
#ifndef _WIN32
|
2019-07-16 11:11:10 +02:00
|
|
|
/**
 * The possible states of a seamless worker being started by StartUnixWorker().
 */
enum class UnixWorkerState : uint_fast8_t
{
	// Neither success nor failure has been reported yet
	Pending = 0,

	// The worker signalled (SIGUSR2) that it loaded its config
	LoadedConfig = 1,

	// The worker terminated (SIGCHLD) while still pending
	Failed = 2
};
|
|
|
|
|
2019-07-16 11:11:10 +02:00
|
|
|
// The signals to block temporarily in StartUnixWorker():
// SIGCHLD, SIGUSR1, SIGUSR2, SIGINT, SIGTERM and SIGHUP.
static const sigset_t l_UnixWorkerSignals = ([]() -> sigset_t {
	const int blockedSignals[] = { SIGCHLD, SIGUSR1, SIGUSR2, SIGINT, SIGTERM, SIGHUP };

	sigset_t signalSet;
	(void)sigemptyset(&signalSet);

	for (int signalNumber : blockedSignals) {
		(void)sigaddset(&signalSet, signalNumber);
	}

	return signalSet;
})();
|
|
|
|
|
2019-07-16 11:11:10 +02:00
|
|
|
// The PID of the seemless worker currently being started by StartUnixWorker()
|
2019-07-16 11:28:20 +02:00
|
|
|
static Atomic<pid_t> l_CurrentlyStartingUnixWorkerPid (-1);
|
2019-07-16 11:11:10 +02:00
|
|
|
|
|
|
|
// The state of the seemless worker currently being started by StartUnixWorker()
|
2019-07-16 11:28:20 +02:00
|
|
|
static Atomic<UnixWorkerState> l_CurrentlyStartingUnixWorkerState (UnixWorkerState::Pending);
|
2019-07-16 11:11:10 +02:00
|
|
|
|
|
|
|
// The last temination signal we received
|
2019-07-16 11:28:20 +02:00
|
|
|
static Atomic<int> l_TermSignal (-1);
|
2019-07-16 11:11:10 +02:00
|
|
|
|
|
|
|
// Whether someone requested to re-load config (and we didn't handle that request, yet)
|
2019-07-16 11:28:20 +02:00
|
|
|
static Atomic<bool> l_RequestedReload (false);
|
2019-07-16 11:11:10 +02:00
|
|
|
|
|
|
|
// Whether someone requested to re-open logs (and we didn't handle that request, yet)
|
2019-07-16 11:28:20 +02:00
|
|
|
static Atomic<bool> l_RequestedReopenLogs (false);
|
2019-07-12 18:14:02 +02:00
|
|
|
|
2019-07-16 11:11:10 +02:00
|
|
|
/**
|
|
|
|
* Umbrella process' signal handlers
|
|
|
|
*/
|
2019-07-12 18:14:02 +02:00
|
|
|
static void UmbrellaSignalHandler(int num, siginfo_t *info, void*)
|
|
|
|
{
|
|
|
|
switch (num) {
|
2019-07-15 18:36:34 +02:00
|
|
|
case SIGUSR1:
|
2019-07-16 11:11:10 +02:00
|
|
|
// Someone requested to re-open logs
|
2019-07-15 18:36:34 +02:00
|
|
|
l_RequestedReopenLogs.store(true);
|
|
|
|
break;
|
2019-07-12 18:14:02 +02:00
|
|
|
case SIGUSR2:
|
|
|
|
if (l_CurrentlyStartingUnixWorkerState.load() == UnixWorkerState::Pending
|
2020-01-07 23:08:38 +01:00
|
|
|
&& (info->si_pid == 0 || info->si_pid == l_CurrentlyStartingUnixWorkerPid.load()) ) {
|
2019-07-16 11:11:10 +02:00
|
|
|
// The seemless worker currently being started by StartUnixWorker() successfully loaded its config
|
2019-07-12 18:14:02 +02:00
|
|
|
l_CurrentlyStartingUnixWorkerState.store(UnixWorkerState::LoadedConfig);
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case SIGCHLD:
|
|
|
|
if (l_CurrentlyStartingUnixWorkerState.load() == UnixWorkerState::Pending
|
2020-01-07 23:08:38 +01:00
|
|
|
&& (info->si_pid == 0 || info->si_pid == l_CurrentlyStartingUnixWorkerPid.load()) ) {
|
2019-07-16 11:11:10 +02:00
|
|
|
// The seemless worker currently being started by StartUnixWorker() failed
|
2019-07-12 18:14:02 +02:00
|
|
|
l_CurrentlyStartingUnixWorkerState.store(UnixWorkerState::Failed);
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case SIGINT:
|
|
|
|
case SIGTERM:
|
2019-07-16 11:11:10 +02:00
|
|
|
// Someone requested our termination
|
|
|
|
|
2019-07-12 18:14:02 +02:00
|
|
|
{
|
|
|
|
struct sigaction sa;
|
|
|
|
memset(&sa, 0, sizeof(sa));
|
|
|
|
|
|
|
|
sa.sa_handler = SIG_DFL;
|
|
|
|
|
|
|
|
(void)sigaction(num, &sa, nullptr);
|
|
|
|
}
|
|
|
|
|
|
|
|
l_TermSignal.store(num);
|
2019-07-15 12:11:19 +02:00
|
|
|
break;
|
|
|
|
case SIGHUP:
|
2019-07-16 11:11:10 +02:00
|
|
|
// Someone requested to re-load config
|
2019-07-15 12:11:19 +02:00
|
|
|
l_RequestedReload.store(true);
|
2019-07-15 15:09:35 +02:00
|
|
|
break;
|
|
|
|
default:
|
2019-07-16 11:11:10 +02:00
|
|
|
// Programming error (or someone has broken the userspace)
|
2019-07-15 15:09:35 +02:00
|
|
|
VERIFY(!"Caught unexpected signal");
|
2019-07-12 18:14:02 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-07-16 11:11:10 +02:00
|
|
|
/**
|
|
|
|
* Seemless worker's signal handlers
|
|
|
|
*/
|
2019-07-12 18:14:02 +02:00
|
|
|
static void WorkerSignalHandler(int num, siginfo_t *info, void*)
|
|
|
|
{
|
|
|
|
switch (num) {
|
2019-07-15 12:11:19 +02:00
|
|
|
case SIGUSR2:
|
2020-01-07 23:08:38 +01:00
|
|
|
if (info->si_pid == 0 || info->si_pid == l_UmbrellaPid) {
|
2019-07-16 11:11:10 +02:00
|
|
|
// The umbrella process allowed us to continue working beyond config validation
|
2019-07-15 12:11:19 +02:00
|
|
|
l_AllowedToWork.store(true);
|
|
|
|
}
|
|
|
|
break;
|
2019-07-12 18:14:02 +02:00
|
|
|
case SIGINT:
|
|
|
|
case SIGTERM:
|
2020-01-07 23:08:38 +01:00
|
|
|
if (info->si_pid == 0 || info->si_pid == l_UmbrellaPid) {
|
2019-07-16 11:11:10 +02:00
|
|
|
// The umbrella process requested our termination
|
2019-07-12 18:14:02 +02:00
|
|
|
Application::RequestShutdown();
|
|
|
|
}
|
2019-07-15 15:09:35 +02:00
|
|
|
break;
|
|
|
|
default:
|
2019-07-16 11:11:10 +02:00
|
|
|
// Programming error (or someone has broken the userspace)
|
2019-07-15 15:09:35 +02:00
|
|
|
VERIFY(!"Caught unexpected signal");
|
2019-07-12 18:14:02 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-07-15 16:58:34 +02:00
|
|
|
#ifdef HAVE_SYSTEMD
// When we last notified the watchdog (as returned by Utility::GetTime()).
static Atomic<double> l_LastNotifiedWatchdog (0);

/**
 * Notify the watchdog if not notified during the last 2.5s.
 */
static void NotifyWatchdog()
{
	const double currentTime = Utility::GetTime();
	const double sinceLastNotification = currentTime - l_LastNotifiedWatchdog.load();

	if (sinceLastNotification >= 2.5) {
		sd_notify(0, "WATCHDOG=1");
		l_LastNotifiedWatchdog.store(currentTime);
	}
}
#endif /* HAVE_SYSTEMD */
|
|
|
|
|
2019-07-16 11:11:10 +02:00
|
|
|
/**
|
|
|
|
* Starts seemless worker process doing the actual work (config loading, ...)
|
|
|
|
*
|
|
|
|
* @param configs Files to read config from
|
2019-08-05 18:30:45 +02:00
|
|
|
* @param closeConsoleLog Whether to close the console log after config loading
|
|
|
|
* @param stderrFile Where to log errors
|
2019-07-16 11:11:10 +02:00
|
|
|
*
|
|
|
|
* @return The worker's PID on success, -1 on failure (if the worker couldn't load its config)
|
|
|
|
*/
|
2019-08-05 18:30:45 +02:00
|
|
|
static pid_t StartUnixWorker(const std::vector<std::string>& configs, bool closeConsoleLog = false, const String& stderrFile = String())
|
2019-07-12 18:14:02 +02:00
|
|
|
{
|
2019-07-16 11:43:47 +02:00
|
|
|
Log(LogNotice, "cli")
|
|
|
|
<< "Spawning seemless worker process doing the actual work";
|
2019-07-15 18:29:15 +02:00
|
|
|
|
2019-07-12 18:14:02 +02:00
|
|
|
try {
|
|
|
|
Application::UninitializeBase();
|
|
|
|
} catch (const std::exception& ex) {
|
|
|
|
Log(LogCritical, "cli")
|
|
|
|
<< "Failed to stop thread pool before forking, unexpected error: " << DiagnosticInformation(ex);
|
|
|
|
exit(EXIT_FAILURE);
|
|
|
|
}
|
|
|
|
|
2019-07-16 11:11:10 +02:00
|
|
|
/* Block the signal handlers we'd like to change in the child process until we changed them.
|
|
|
|
* Block SIGUSR2 and SIGCHLD handlers until we've set l_CurrentlyStartingUnixWorkerPid.
|
|
|
|
*/
|
2019-07-12 18:14:02 +02:00
|
|
|
(void)sigprocmask(SIG_BLOCK, &l_UnixWorkerSignals, nullptr);
|
|
|
|
|
|
|
|
pid_t pid = fork();
|
|
|
|
|
|
|
|
switch (pid) {
|
|
|
|
case -1:
|
|
|
|
Log(LogCritical, "cli")
|
|
|
|
<< "fork() failed with error code " << errno << ", \"" << Utility::FormatErrorNumber(errno) << "\"";
|
|
|
|
exit(EXIT_FAILURE);
|
|
|
|
|
|
|
|
case 0:
|
|
|
|
try {
|
|
|
|
{
|
|
|
|
struct sigaction sa;
|
|
|
|
memset(&sa, 0, sizeof(sa));
|
|
|
|
|
|
|
|
sa.sa_handler = SIG_DFL;
|
|
|
|
|
|
|
|
(void)sigaction(SIGCHLD, &sa, nullptr);
|
2019-07-15 18:36:34 +02:00
|
|
|
(void)sigaction(SIGUSR1, &sa, nullptr);
|
2019-07-15 12:11:19 +02:00
|
|
|
(void)sigaction(SIGHUP, &sa, nullptr);
|
2019-07-12 18:14:02 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
{
|
|
|
|
struct sigaction sa;
|
|
|
|
memset(&sa, 0, sizeof(sa));
|
|
|
|
|
|
|
|
sa.sa_sigaction = &WorkerSignalHandler;
|
|
|
|
sa.sa_flags = SA_RESTART | SA_SIGINFO;
|
|
|
|
|
2019-07-15 12:11:19 +02:00
|
|
|
(void)sigaction(SIGUSR2, &sa, nullptr);
|
2019-07-12 18:14:02 +02:00
|
|
|
(void)sigaction(SIGINT, &sa, nullptr);
|
|
|
|
(void)sigaction(SIGTERM, &sa, nullptr);
|
|
|
|
}
|
|
|
|
|
|
|
|
(void)sigprocmask(SIG_UNBLOCK, &l_UnixWorkerSignals, nullptr);
|
|
|
|
|
|
|
|
try {
|
|
|
|
Application::InitializeBase();
|
|
|
|
} catch (const std::exception& ex) {
|
|
|
|
Log(LogCritical, "cli")
|
|
|
|
<< "Failed to re-initialize thread pool after forking (child): " << DiagnosticInformation(ex);
|
|
|
|
_exit(EXIT_FAILURE);
|
|
|
|
}
|
|
|
|
|
2019-08-05 18:30:45 +02:00
|
|
|
_exit(RunWorker(configs, closeConsoleLog, stderrFile));
|
2019-07-12 18:14:02 +02:00
|
|
|
} catch (...) {
|
|
|
|
_exit(EXIT_FAILURE);
|
|
|
|
}
|
|
|
|
|
|
|
|
default:
|
|
|
|
l_CurrentlyStartingUnixWorkerPid.store(pid);
|
|
|
|
(void)sigprocmask(SIG_UNBLOCK, &l_UnixWorkerSignals, nullptr);
|
|
|
|
|
2019-07-16 11:43:47 +02:00
|
|
|
Log(LogNotice, "cli")
|
|
|
|
<< "Spawned worker process (PID " << pid << "), waiting for it to load its config";
|
2019-07-15 18:29:15 +02:00
|
|
|
|
2019-07-16 11:11:10 +02:00
|
|
|
// Wait for the newly spawned process to either load its config or fail.
|
2019-07-12 18:14:02 +02:00
|
|
|
for (;;) {
|
2019-07-15 16:58:34 +02:00
|
|
|
#ifdef HAVE_SYSTEMD
|
|
|
|
NotifyWatchdog();
|
|
|
|
#endif /* HAVE_SYSTEMD */
|
|
|
|
|
2019-07-12 18:14:02 +02:00
|
|
|
switch (l_CurrentlyStartingUnixWorkerState.load()) {
|
|
|
|
case UnixWorkerState::LoadedConfig:
|
2019-07-16 11:43:47 +02:00
|
|
|
Log(LogNotice, "cli")
|
|
|
|
<< "Worker process successfully loaded its config";
|
2019-07-12 18:14:02 +02:00
|
|
|
break;
|
|
|
|
case UnixWorkerState::Failed:
|
2019-07-16 11:43:47 +02:00
|
|
|
Log(LogNotice, "cli")
|
|
|
|
<< "Worker process couldn't load its config";
|
2019-07-15 18:29:15 +02:00
|
|
|
|
2019-07-12 18:14:02 +02:00
|
|
|
while (waitpid(pid, nullptr, 0) == -1 && errno == EINTR) {
|
2019-07-15 16:58:34 +02:00
|
|
|
#ifdef HAVE_SYSTEMD
|
|
|
|
NotifyWatchdog();
|
|
|
|
#endif /* HAVE_SYSTEMD */
|
2019-07-12 18:14:02 +02:00
|
|
|
}
|
|
|
|
pid = -1;
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
Utility::Sleep(0.2);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2019-07-16 11:11:10 +02:00
|
|
|
// Reset flags for the next time
|
2019-07-12 18:14:02 +02:00
|
|
|
l_CurrentlyStartingUnixWorkerPid.store(-1);
|
|
|
|
l_CurrentlyStartingUnixWorkerState.store(UnixWorkerState::Pending);
|
|
|
|
|
|
|
|
try {
|
|
|
|
Application::InitializeBase();
|
|
|
|
} catch (const std::exception& ex) {
|
|
|
|
Log(LogCritical, "cli")
|
|
|
|
<< "Failed to re-initialize thread pool after forking (parent): " << DiagnosticInformation(ex);
|
|
|
|
exit(EXIT_FAILURE);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return pid;
|
|
|
|
}
|
2019-07-15 16:08:08 +02:00
|
|
|
|
2019-07-16 11:11:10 +02:00
|
|
|
/**
|
|
|
|
* Workaround to instantiate Application (which is abstract) in DaemonCommand#Run()
|
|
|
|
*/
|
2019-07-15 16:08:08 +02:00
|
|
|
class PidFileManagementApp : public Application
|
|
|
|
{
|
|
|
|
public:
|
|
|
|
inline int Main() override
|
|
|
|
{
|
|
|
|
return EXIT_FAILURE;
|
|
|
|
}
|
|
|
|
};
|
2019-07-12 18:14:02 +02:00
|
|
|
#endif /* _WIN32 */
|
|
|
|
|
2014-10-06 14:21:18 +02:00
|
|
|
/**
|
|
|
|
* The entry point for the "daemon" CLI command.
|
|
|
|
*
|
|
|
|
* @returns An exit status.
|
|
|
|
*/
|
2014-10-13 18:07:52 +02:00
|
|
|
int DaemonCommand::Run(const po::variables_map& vm, const std::vector<std::string>& ap) const
|
2014-10-06 14:21:18 +02:00
|
|
|
{
|
2019-07-19 17:58:56 +02:00
|
|
|
#ifdef _WIN32
|
|
|
|
SetConsoleOutputCP(65001);
|
|
|
|
#endif /* _WIN32 */
|
|
|
|
|
2018-05-03 11:35:29 +02:00
|
|
|
Logger::EnableTimestamp();
|
2014-10-31 22:01:36 +01:00
|
|
|
|
2014-10-19 17:52:17 +02:00
|
|
|
Log(LogInformation, "cli")
|
2017-12-19 15:50:05 +01:00
|
|
|
<< "Icinga application loader (version: " << Application::GetAppVersion()
|
2014-12-19 12:19:28 +01:00
|
|
|
#ifdef I2_DEBUG
|
2017-12-19 15:50:05 +01:00
|
|
|
<< "; debug"
|
2014-12-19 12:19:28 +01:00
|
|
|
#endif /* I2_DEBUG */
|
2017-12-19 15:50:05 +01:00
|
|
|
<< ")";
|
2014-10-06 14:21:18 +02:00
|
|
|
|
2015-01-22 12:10:32 +01:00
|
|
|
std::vector<std::string> configs;
|
|
|
|
if (vm.count("config") > 0)
|
2017-11-30 08:19:58 +01:00
|
|
|
configs = vm["config"].as<std::vector<std::string> >();
|
2018-07-31 11:59:09 +02:00
|
|
|
else if (!vm.count("no-config")) {
|
2018-08-07 18:33:59 +02:00
|
|
|
/* The implicit string assignment is needed for Windows builds. */
|
2018-08-09 15:37:23 +02:00
|
|
|
String configDir = Configuration::ConfigDir;
|
2018-07-31 11:59:09 +02:00
|
|
|
configs.push_back(configDir + "/icinga2.conf");
|
|
|
|
}
|
2015-01-22 12:10:32 +01:00
|
|
|
|
2019-07-12 18:14:02 +02:00
|
|
|
if (vm.count("validate")) {
|
|
|
|
Log(LogInformation, "cli", "Loading configuration file(s).");
|
2016-07-05 15:43:48 +02:00
|
|
|
|
2019-07-12 18:14:02 +02:00
|
|
|
std::vector<ConfigItem::Ptr> newItems;
|
2015-11-19 19:38:20 +01:00
|
|
|
|
2019-08-07 12:03:17 +02:00
|
|
|
if (!DaemonUtility::LoadConfigFiles(configs, newItems, Configuration::ObjectsPath, Configuration::VarsPath)) {
|
|
|
|
Log(LogCritical, "cli", "Config validation failed. Re-run with 'icinga2 daemon -C' after fixing the config.");
|
2019-07-12 18:14:02 +02:00
|
|
|
return EXIT_FAILURE;
|
2019-08-07 12:03:17 +02:00
|
|
|
}
|
2014-10-06 14:21:18 +02:00
|
|
|
|
|
|
|
Log(LogInformation, "cli", "Finished validating the configuration file(s).");
|
|
|
|
return EXIT_SUCCESS;
|
|
|
|
}
|
|
|
|
|
2019-07-12 18:14:02 +02:00
|
|
|
{
|
|
|
|
pid_t runningpid = Application::ReadPidFile(Configuration::PidPath);
|
|
|
|
if (runningpid > 0) {
|
2018-03-14 10:01:11 +01:00
|
|
|
Log(LogCritical, "cli")
|
2019-07-12 18:14:02 +02:00
|
|
|
<< "Another instance of Icinga already running with PID " << runningpid;
|
2018-01-17 13:52:23 +01:00
|
|
|
return EXIT_FAILURE;
|
|
|
|
}
|
2014-10-06 14:21:18 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
if (vm.count("daemonize")) {
|
2019-07-12 18:14:02 +02:00
|
|
|
// this subroutine either succeeds, or logs an error
|
|
|
|
// and terminates the process (does not return).
|
|
|
|
Daemonize();
|
2014-10-06 14:21:18 +02:00
|
|
|
}
|
|
|
|
|
2019-07-15 16:08:08 +02:00
|
|
|
#ifndef _WIN32
|
2019-07-16 11:11:10 +02:00
|
|
|
/* The Application manages the PID file,
|
|
|
|
* but on *nix this process doesn't load any config
|
|
|
|
* so there's no central Application instance.
|
|
|
|
*/
|
2019-07-15 16:08:08 +02:00
|
|
|
PidFileManagementApp app;
|
|
|
|
|
|
|
|
try {
|
|
|
|
app.UpdatePidFile(Configuration::PidPath);
|
|
|
|
} catch (const std::exception&) {
|
|
|
|
Log(LogCritical, "Application")
|
|
|
|
<< "Cannot update PID file '" << Configuration::PidPath << "'. Aborting.";
|
|
|
|
return EXIT_FAILURE;
|
|
|
|
}
|
|
|
|
|
|
|
|
Defer closePidFile ([&app]() {
|
|
|
|
app.ClosePidFile(true);
|
|
|
|
});
|
|
|
|
#endif /* _WIN32 */
|
|
|
|
|
2019-08-05 18:30:45 +02:00
|
|
|
if (vm.count("daemonize")) {
|
Fix logging under systemd
icinga2.service used `-e ${ICINGA2_ERROR_LOG}`, but this is documented
as having no effect without `-d`. Furthermore, icinga2 under systemd
unconditionally logged everything to the system log (but without setting
the log level etc), which contradicted the documentation. (Issue #6339)
Stop icinga2 on systemd from logging to stdout - and hence the system log -
once it has finished starting up. Just like when you start icinga2 from a
terminal using `-d`. And just like -d, we stop logging fatal errors to
stderr, and instead write to the log file passed with `-e`.
As per docs, mainlog (icinga2.log) is already enabled by default. And
pre-startup messages including config errors will still appear in the
system log.
This uses a new option --close-stdio, which has the same effect on logging as
--daemonize, but does not fork or call setsid().
For this purpose, I moved setsid() up and into Daemonize().
Consequence of that last point: if anyone is weird enough to specify a TTY
device file as the fatal error log (-e option), that will become icinga's
controlling terminal, which you generally don't want as a daemon. This
makes it consistent with the existing behaviour for icinga mainlog. For
this reason you're supposed to use O_NOCTTY in Linux daemons. But I wasn't
sure where icinga would want to put the ugly `#ifdef _WIN32 ... #else ...`.
2018-05-29 18:24:05 +02:00
|
|
|
// After disabling the console log, any further errors will go to the configured log only.
|
|
|
|
// Let's try to make this clear and say good bye.
|
|
|
|
Log(LogInformation, "cli", "Closing console log.");
|
|
|
|
|
2014-10-06 14:21:18 +02:00
|
|
|
String errorLog;
|
|
|
|
if (vm.count("errorlog"))
|
|
|
|
errorLog = vm["errorlog"].as<std::string>();
|
|
|
|
|
Fix logging under systemd
icinga2.service used `-e ${ICINGA2_ERROR_LOG}`, but this is documented
as having no effect without `-d`. Furthermore, icinga2 under systemd
unconditionally logged everything to the system log (but without setting
the log level etc), which contradicted the documentation. (Issue #6339)
Stop icinga2 on systemd from logging to stdout - and hence the system log -
once it has finished starting up. Just like when you start icinga2 from a
terminal using `-d`. And just like -d, we stop logging fatal errors to
stderr, and instead write to the log file passed with `-e`.
As per docs, mainlog (icinga2.log) is already enabled by default. And
pre-startup messages including config errors will still appear in the
system log.
This uses a new option --close-stdio, which has the same effect on logging as
--daemonize, but does not fork or call setsid().
For this purpose, I moved setsid() up and into Daemonize().
Consequence of that last point: if anyone is weird enough to specify a TTY
device file as the fatal error log (-e option), that will become icinga's
controlling terminal, which you generally don't want as a daemon. This
makes it consistent with the existing behaviour for icinga mainlog. For
this reason you're supposed to use O_NOCTTY in Linux daemons. But I wasn't
sure where icinga would want to put the ugly `#ifdef _WIN32 ... #else ...`.
2018-05-29 18:24:05 +02:00
|
|
|
CloseStdIO(errorLog);
|
2014-10-06 14:21:18 +02:00
|
|
|
Logger::DisableConsoleLog();
|
|
|
|
}
|
2014-10-13 18:07:52 +02:00
|
|
|
|
2019-07-12 18:14:02 +02:00
|
|
|
#ifdef _WIN32
|
|
|
|
return RunWorker(configs);
|
|
|
|
#else /* _WIN32 */
|
|
|
|
l_UmbrellaPid = getpid();
|
2019-07-15 13:59:17 +02:00
|
|
|
Application::SetUmbrellaProcess(l_UmbrellaPid);
|
2019-05-10 12:48:34 +02:00
|
|
|
|
2019-07-12 18:14:02 +02:00
|
|
|
{
|
|
|
|
struct sigaction sa;
|
|
|
|
memset(&sa, 0, sizeof(sa));
|
|
|
|
|
|
|
|
sa.sa_sigaction = &UmbrellaSignalHandler;
|
|
|
|
sa.sa_flags = SA_NOCLDSTOP | SA_RESTART | SA_SIGINFO;
|
|
|
|
|
|
|
|
(void)sigaction(SIGCHLD, &sa, nullptr);
|
2019-07-15 18:36:34 +02:00
|
|
|
(void)sigaction(SIGUSR1, &sa, nullptr);
|
2019-07-12 18:14:02 +02:00
|
|
|
(void)sigaction(SIGUSR2, &sa, nullptr);
|
|
|
|
(void)sigaction(SIGINT, &sa, nullptr);
|
|
|
|
(void)sigaction(SIGTERM, &sa, nullptr);
|
2019-07-15 12:11:19 +02:00
|
|
|
(void)sigaction(SIGHUP, &sa, nullptr);
|
2019-04-26 14:43:10 +02:00
|
|
|
}
|
2016-06-03 14:16:52 +02:00
|
|
|
|
2019-08-05 18:30:45 +02:00
|
|
|
bool closeConsoleLog = !vm.count("daemonize") && vm.count("close-stdio");
|
|
|
|
|
|
|
|
String errorLog;
|
|
|
|
if (vm.count("errorlog"))
|
|
|
|
errorLog = vm["errorlog"].as<std::string>();
|
|
|
|
|
2019-07-16 11:11:10 +02:00
|
|
|
// The PID of the current seemless worker
|
2019-08-05 18:30:45 +02:00
|
|
|
pid_t currentWorker = StartUnixWorker(configs, closeConsoleLog, errorLog);
|
2016-05-11 12:50:08 +02:00
|
|
|
|
2019-07-12 18:14:02 +02:00
|
|
|
if (currentWorker == -1) {
|
|
|
|
return EXIT_FAILURE;
|
|
|
|
}
|
|
|
|
|
2019-08-05 18:30:45 +02:00
|
|
|
if (closeConsoleLog) {
|
|
|
|
// After disabling the console log, any further errors will go to the configured log only.
|
|
|
|
// Let's try to make this clear and say good bye.
|
|
|
|
Log(LogInformation, "cli", "Closing console log.");
|
|
|
|
|
|
|
|
CloseStdIO(errorLog);
|
|
|
|
Logger::DisableConsoleLog();
|
|
|
|
}
|
|
|
|
|
2019-07-16 11:11:10 +02:00
|
|
|
// Immediately allow the first (non-reload) worker to continue working beyond config validation
|
2019-07-15 12:11:19 +02:00
|
|
|
(void)kill(currentWorker, SIGUSR2);
|
|
|
|
|
2019-07-15 16:58:34 +02:00
|
|
|
#ifdef HAVE_SYSTEMD
|
|
|
|
sd_notify(0, "READY=1");
|
|
|
|
#endif /* HAVE_SYSTEMD */
|
|
|
|
|
2019-07-16 11:11:10 +02:00
|
|
|
// Whether we already forwarded a termination signal to the seemless worker
|
2019-07-12 18:14:02 +02:00
|
|
|
bool requestedTermination = false;
|
2019-07-16 11:11:10 +02:00
|
|
|
|
|
|
|
// Whether we already notified systemd about our termination
|
2019-07-15 16:58:34 +02:00
|
|
|
bool notifiedTermination = false;
|
2019-07-12 18:14:02 +02:00
|
|
|
|
|
|
|
for (;;) {
|
2019-07-15 16:58:34 +02:00
|
|
|
#ifdef HAVE_SYSTEMD
|
|
|
|
NotifyWatchdog();
|
|
|
|
#endif /* HAVE_SYSTEMD */
|
|
|
|
|
2019-07-12 18:14:02 +02:00
|
|
|
if (!requestedTermination) {
|
|
|
|
int termSig = l_TermSignal.load();
|
|
|
|
if (termSig != -1) {
|
2019-07-16 11:43:47 +02:00
|
|
|
Log(LogNotice, "cli")
|
|
|
|
<< "Got signal " << termSig << ", forwarding to seemless worker (PID " << currentWorker << ")";
|
2019-07-15 18:29:15 +02:00
|
|
|
|
2019-07-12 18:14:02 +02:00
|
|
|
(void)kill(currentWorker, termSig);
|
|
|
|
requestedTermination = true;
|
2019-07-15 16:58:34 +02:00
|
|
|
|
|
|
|
#ifdef HAVE_SYSTEMD
|
|
|
|
if (!notifiedTermination) {
|
|
|
|
notifiedTermination = true;
|
|
|
|
sd_notify(0, "STOPPING=1");
|
|
|
|
}
|
|
|
|
#endif /* HAVE_SYSTEMD */
|
2019-07-12 18:14:02 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-07-15 12:11:19 +02:00
|
|
|
if (l_RequestedReload.exchange(false)) {
|
2019-07-16 11:43:47 +02:00
|
|
|
Log(LogInformation, "Application")
|
|
|
|
<< "Got reload command: Starting new instance.";
|
2019-07-15 18:29:15 +02:00
|
|
|
|
2019-07-15 16:58:34 +02:00
|
|
|
#ifdef HAVE_SYSTEMD
|
|
|
|
sd_notify(0, "RELOADING=1");
|
|
|
|
#endif /* HAVE_SYSTEMD */
|
|
|
|
|
2019-07-15 12:11:19 +02:00
|
|
|
pid_t nextWorker = StartUnixWorker(configs);
|
|
|
|
|
2019-07-15 18:29:15 +02:00
|
|
|
if (nextWorker == -1) {
|
|
|
|
Log(LogCritical, "Application", "Found error in config: reloading aborted");
|
|
|
|
} else {
|
2019-07-16 11:43:47 +02:00
|
|
|
Log(LogInformation, "Application")
|
|
|
|
<< "Reload done, old process shutting down. Child process with PID '" << nextWorker << "' is taking over.";
|
2019-07-15 18:29:15 +02:00
|
|
|
|
2019-07-15 12:11:19 +02:00
|
|
|
(void)kill(currentWorker, SIGTERM);
|
2019-07-15 18:29:15 +02:00
|
|
|
|
|
|
|
{
|
|
|
|
double start = Utility::GetTime();
|
|
|
|
|
|
|
|
while (waitpid(currentWorker, nullptr, 0) == -1 && errno == EINTR) {
|
2019-07-15 16:58:34 +02:00
|
|
|
#ifdef HAVE_SYSTEMD
|
2019-07-15 18:29:15 +02:00
|
|
|
NotifyWatchdog();
|
2019-07-15 16:58:34 +02:00
|
|
|
#endif /* HAVE_SYSTEMD */
|
2019-07-15 18:29:15 +02:00
|
|
|
}
|
|
|
|
|
2019-07-16 11:43:47 +02:00
|
|
|
Log(LogNotice, "cli")
|
|
|
|
<< "Waited for " << Utility::FormatDuration(Utility::GetTime() - start) << " on old process to exit.";
|
2019-07-15 12:11:19 +02:00
|
|
|
}
|
|
|
|
|
2019-07-16 11:11:10 +02:00
|
|
|
// Old instance shut down, allow the new one to continue working beyond config validation
|
2019-07-15 12:11:19 +02:00
|
|
|
(void)kill(nextWorker, SIGUSR2);
|
|
|
|
|
|
|
|
currentWorker = nextWorker;
|
|
|
|
}
|
2019-07-15 16:58:34 +02:00
|
|
|
|
|
|
|
#ifdef HAVE_SYSTEMD
|
|
|
|
sd_notify(0, "READY=1");
|
|
|
|
#endif /* HAVE_SYSTEMD */
|
|
|
|
|
2019-07-15 12:11:19 +02:00
|
|
|
}
|
|
|
|
|
2019-07-15 18:36:34 +02:00
|
|
|
if (l_RequestedReopenLogs.exchange(false)) {
|
2019-07-16 11:43:47 +02:00
|
|
|
Log(LogNotice, "cli")
|
|
|
|
<< "Got signal " << SIGUSR1 << ", forwarding to seemless worker (PID " << currentWorker << ")";
|
2019-07-15 18:36:34 +02:00
|
|
|
|
|
|
|
(void)kill(currentWorker, SIGUSR1);
|
|
|
|
}
|
|
|
|
|
2019-07-12 18:14:02 +02:00
|
|
|
{
|
|
|
|
int status;
|
|
|
|
if (waitpid(currentWorker, &status, WNOHANG) > 0) {
|
2019-07-16 11:43:47 +02:00
|
|
|
Log(LogNotice, "cli")
|
|
|
|
<< "Seemless worker (PID " << currentWorker << ") stopped, stopping as well";
|
2019-07-15 18:29:15 +02:00
|
|
|
|
2019-07-15 16:58:34 +02:00
|
|
|
#ifdef HAVE_SYSTEMD
|
|
|
|
if (!notifiedTermination) {
|
|
|
|
notifiedTermination = true;
|
|
|
|
sd_notify(0, "STOPPING=1");
|
|
|
|
}
|
|
|
|
#endif /* HAVE_SYSTEMD */
|
|
|
|
|
2019-07-16 11:11:10 +02:00
|
|
|
// If killed by signal, forward it via the exit code (to be as seemless as possible)
|
2019-07-12 18:14:02 +02:00
|
|
|
return WIFSIGNALED(status) ? 128 + WTERMSIG(status) : WEXITSTATUS(status);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
Utility::Sleep(0.2);
|
|
|
|
}
|
|
|
|
#endif /* _WIN32 */
|
2014-10-06 14:21:18 +02:00
|
|
|
}
|