icinga2/lib/cli/daemoncommand.cpp

856 lines
23 KiB
C++
Raw Normal View History

/* Icinga 2 | (c) 2012 Icinga GmbH | GPLv2+ */
#include "cli/daemoncommand.hpp"
#include "cli/daemonutility.hpp"
#include "remote/apilistener.hpp"
#include "remote/configobjectutility.hpp"
#include "config/configcompiler.hpp"
#include "config/configcompilercontext.hpp"
#include "config/configitembuilder.hpp"
#include "base/atomic.hpp"
2019-07-15 16:08:08 +02:00
#include "base/defer.hpp"
2014-10-19 14:21:12 +02:00
#include "base/logger.hpp"
#include "base/application.hpp"
#include "base/process.hpp"
#include "base/timer.hpp"
#include "base/utility.hpp"
#include "base/exception.hpp"
#include "base/convert.hpp"
#include "base/scriptglobal.hpp"
#include "base/context.hpp"
#include "config.h"
#include <cstdint>
#include <cstring>
#include <boost/program_options.hpp>
#include <iostream>
#include <fstream>
#ifdef _WIN32
#include <windows.h>
#else /* _WIN32 */
#include <signal.h>
#include <sys/types.h>
#include <sys/wait.h>
#include <unistd.h>
#endif /* _WIN32 */
2019-07-15 16:58:34 +02:00
#ifdef HAVE_SYSTEMD
#include <systemd/sd-daemon.h>
#endif /* HAVE_SYSTEMD */
// Make the icinga namespace visible in this translation unit and
// abbreviate boost::program_options as `po`.
using namespace icinga;
namespace po = boost::program_options;
// Presumably meant to hold parsed command-line parameters; it is not
// referenced anywhere in the visible part of this file.
static po::variables_map g_AppParams;
// Associates the DaemonCommand class with the CLI command name "daemon"
// (the macro is defined elsewhere -- presumably in the CLI command framework).
REGISTER_CLICOMMAND("daemon", DaemonCommand);
/**
 * Reports a human-readable status text to systemd as "STATUS=<status>".
 *
 * Does nothing when built without HAVE_SYSTEMD.
 *
 * @param status The status text to report
 */
static inline void NotifyStatus(const char* status)
{
#ifndef HAVE_SYSTEMD
	(void)status; // nothing to report to without systemd support
#else /* HAVE_SYSTEMD */
	(void)sd_notifyf(0, "STATUS=%s", status);
#endif /* HAVE_SYSTEMD */
}
/*
* Daemonize(). On error, this function logs by itself and exits (i.e. does not return).
*
* Implementation note: We're only supposed to call exit() in one of the forked processes.
* The other process calls _exit(). This prevents issues with exit handlers like atexit().
*/
static void Daemonize() noexcept
{
#ifndef _WIN32
try {
Application::UninitializeBase();
} catch (const std::exception& ex) {
Log(LogCritical, "cli")
<< "Failed to stop thread pool before daemonizing, unexpected error: " << DiagnosticInformation(ex);
exit(EXIT_FAILURE);
}
pid_t pid = fork();
if (pid == -1) {
Log(LogCritical, "cli")
<< "fork() failed with error code " << errno << ", \"" << Utility::FormatErrorNumber(errno) << "\"";
exit(EXIT_FAILURE);
}
if (pid) {
// systemd requires that the pidfile of the daemon is written before the forking
// process terminates. So wait till either the forked daemon has written a pidfile or died.
int status;
int ret;
pid_t readpid;
do {
Utility::Sleep(0.1);
2018-08-09 15:37:23 +02:00
readpid = Application::ReadPidFile(Configuration::PidPath);
ret = waitpid(pid, &status, WNOHANG);
} while (readpid != pid && ret == 0);
if (ret == pid) {
Log(LogCritical, "cli", "The daemon could not be started. See log output for details.");
_exit(EXIT_FAILURE);
} else if (ret == -1) {
2014-10-19 17:52:17 +02:00
Log(LogCritical, "cli")
<< "waitpid() failed with error code " << errno << ", \"" << Utility::FormatErrorNumber(errno) << "\"";
_exit(EXIT_FAILURE);
}
_exit(EXIT_SUCCESS);
}
Log(LogDebug, "Daemonize()")
<< "Child process with PID " << Utility::GetPid() << " continues; re-initializing base.";
// Detach from controlling terminal
pid_t sid = setsid();
if (sid == -1) {
Log(LogCritical, "cli")
<< "setsid() failed with error code " << errno << ", \"" << Utility::FormatErrorNumber(errno) << "\"";
exit(EXIT_FAILURE);
}
try {
Application::InitializeBase();
} catch (const std::exception& ex) {
Log(LogCritical, "cli")
<< "Failed to re-initialize thread pool after daemonizing: " << DiagnosticInformation(ex);
exit(EXIT_FAILURE);
}
#endif /* _WIN32 */
}
/**
 * Redirects the standard streams of the current process (non-Windows only).
 *
 * stdin and stdout are pointed at /dev/null. stderr is pointed at stderrFile
 * (opened for appending, created with mode 0600 if it doesn't exist yet), or
 * at /dev/null if stderrFile is empty. If a file can't be opened, the
 * corresponding stream(s) are left untouched.
 *
 * @param stderrFile Path of the file stderr shall be appended to, may be empty
 */
static void CloseStdIO(const String& stderrFile)
{
#ifndef _WIN32
	const int nullFd = open("/dev/null", O_RDWR);

	if (nullFd >= 0) {
		// Duplicate onto stdin (0) and stdout (1), unless open() already returned that very descriptor.
		for (int target = 0; target <= 1; ++target) {
			if (nullFd != target)
				dup2(nullFd, target);
		}

		// Only drop the temporary descriptor if it isn't one of the standard ones itself.
		if (nullFd > 1)
			close(nullFd);
	}

	const char *stderrPath = stderrFile.IsEmpty() ? "/dev/null" : stderrFile.CStr();

	int stderrFd = open(stderrPath, O_WRONLY | O_APPEND);

	// The file doesn't exist yet: retry, this time creating it.
	if (stderrFd < 0 && errno == ENOENT)
		stderrFd = open(stderrPath, O_CREAT | O_WRONLY | O_APPEND, 0600);

	if (stderrFd >= 0) {
		if (stderrFd != 2)
			dup2(stderrFd, 2);

		if (stderrFd > 2)
			close(stderrFd);
	}
#endif
}
/**
 * @returns The long description of the "daemon" CLI command.
 */
String DaemonCommand::GetDescription() const
{
	return "Starts Icinga 2.";
}
/**
 * @returns The short description of the "daemon" CLI command.
 */
String DaemonCommand::GetShortDescription() const
{
	return "starts Icinga 2";
}
/**
 * Declares the command-line options of the "daemon" CLI command.
 *
 * All options are added to visibleDesc; hiddenDesc is not touched here.
 * --daemonize and --close-stdio are not offered on Windows.
 *
 * @param visibleDesc Receives the options of this command
 * @param hiddenDesc Unused by this command
 */
void DaemonCommand::InitParameters(boost::program_options::options_description& visibleDesc,
	boost::program_options::options_description& hiddenDesc) const
{
	auto addOption = visibleDesc.add_options();

	addOption("config,c", po::value<std::vector<std::string> >(), "parse a configuration file");
	addOption("no-config,z", "start without a configuration file");
	addOption("validate,C", "exit after validating the configuration");
	addOption("errorlog,e", po::value<std::string>(), "log fatal errors to the specified log file (only works in combination with --daemonize or --close-stdio)");

#ifndef _WIN32
	addOption("daemonize,d", "detach from the controlling terminal");
	addOption("close-stdio", "do not log to stdout (or stderr) after startup");
#endif /* _WIN32 */
}
/**
 * Provides shell completion suggestions for an option's argument.
 *
 * The "config" and "errorlog" options get file suggestions; every other
 * option is delegated to CLICommand::GetArgumentSuggestions().
 *
 * @param argument The name of the option being completed
 * @param word The word typed so far
 *
 * @returns The suggestions
 */
std::vector<String> DaemonCommand::GetArgumentSuggestions(const String& argument, const String& word) const
{
	const bool expectsFile = (argument == "config" || argument == "errorlog");

	if (!expectsFile)
		return CLICommand::GetArgumentSuggestions(argument, word);

	return GetBashCompletionSuggestions("file", word);
}
#ifndef _WIN32
2019-07-16 11:11:10 +02:00
// The PID of the Icinga umbrella process
pid_t l_UmbrellaPid = 0;
2019-07-16 11:11:10 +02:00
// Whether the umbrella process allowed us to continue working beyond config validation
static Atomic<bool> l_AllowedToWork (false);
#endif /* _WIN32 */
#ifdef I2_DEBUG
/**
 * Looks up how long the developer wants the worker process to pause
 * so that a debugger can be attached to it.
 *
 * @return The value of Internal.DebugWorkerDelay as double,
 *         or 0.0 if the Internal namespace or that entry is not available
 */
static double GetDebugWorkerDelay()
{
	Namespace::Ptr internalNs = ScriptGlobal::Get("Internal", &Empty);

	if (!internalNs)
		return 0.0;

	Value delay;

	if (!internalNs->Get("DebugWorkerDelay", &delay))
		return 0.0;

	return Convert::ToDouble(delay);
}
#endif /* I2_DEBUG */
2019-07-16 11:11:10 +02:00
/**
* Do the actual work (config loading, ...)
*
* @param configs Files to read config from
* @param closeConsoleLog Whether to close the console log after config loading
* @param stderrFile Where to log errors
2019-07-16 11:11:10 +02:00
*
* @return Exit code
*/
static inline
int RunWorker(const std::vector<std::string>& configs, bool closeConsoleLog = false, const String& stderrFile = String())
{
#ifdef I2_DEBUG
double delay = GetDebugWorkerDelay();
if (delay > 0.0) {
Log(LogInformation, "RunWorker")
<< "DEBUG: Current PID: " << Utility::GetPid() << ". Sleeping for " << delay << " seconds to allow lldb/gdb -p <PID> attachment.";
Utility::Sleep(delay);
}
#endif /* I2_DEBUG */
Log(LogInformation, "cli", "Loading configuration file(s).");
NotifyStatus("Loading configuration file(s)...");
{
std::vector<ConfigItem::Ptr> newItems;
if (!DaemonUtility::LoadConfigFiles(configs, newItems, Configuration::ObjectsPath, Configuration::VarsPath)) {
Log(LogCritical, "cli", "Config validation failed. Re-run with 'icinga2 daemon -C' after fixing the config.");
NotifyStatus("Config validation failed.");
return EXIT_FAILURE;
}
#ifndef _WIN32
2019-07-16 11:43:47 +02:00
Log(LogNotice, "cli")
<< "Notifying umbrella process (PID " << l_UmbrellaPid << ") about the config loading success";
2019-07-15 18:29:15 +02:00
(void)kill(l_UmbrellaPid, SIGUSR2);
2019-07-15 12:11:19 +02:00
2019-07-16 11:43:47 +02:00
Log(LogNotice, "cli")
<< "Waiting for the umbrella process to let us doing the actual work";
2019-07-15 18:29:15 +02:00
NotifyStatus("Waiting for the umbrella process to let us doing the actual work...");
if (closeConsoleLog) {
CloseStdIO(stderrFile);
Logger::DisableConsoleLog();
}
2019-07-15 12:11:19 +02:00
while (!l_AllowedToWork.load()) {
Utility::Sleep(0.2);
}
2019-07-15 18:29:15 +02:00
2019-07-16 11:43:47 +02:00
Log(LogNotice, "cli")
<< "The umbrella process let us continuing";
#endif /* _WIN32 */
NotifyStatus("Restoring the previous program state...");
/* restore the previous program state */
try {
ConfigObject::RestoreObjects(Configuration::StatePath);
} catch (const std::exception& ex) {
Log(LogCritical, "cli")
<< "Failed to restore state file: " << DiagnosticInformation(ex);
NotifyStatus("Failed to restore state file.");
return EXIT_FAILURE;
}
NotifyStatus("Activating config objects...");
// activate config only after daemonization: it starts threads and that is not compatible with fork()
if (!ConfigItem::ActivateItems(newItems, false, true, true)) {
Log(LogCritical, "cli", "Error activating configuration.");
NotifyStatus("Error activating configuration.");
return EXIT_FAILURE;
}
}
/* Create the internal API object storage. Do this here too with setups without API. */
ConfigObjectUtility::CreateStorage();
/* Remove ignored Downtime/Comment objects. */
try {
String configDir = ConfigObjectUtility::GetConfigDir();
ConfigItem::RemoveIgnoredItems(configDir);
} catch (const std::exception& ex) {
Log(LogNotice, "cli")
<< "Cannot clean ignored downtimes/comments: " << ex.what();
}
ApiListener::UpdateObjectAuthority();
NotifyStatus("Startup finished.");
return Application::GetInstance()->Run();
}
#ifndef _WIN32
2019-07-16 11:11:10 +02:00
// The signals to block temporarily in StartUnixWorker():
// SIGUSR1, SIGUSR2, SIGINT, SIGTERM and SIGHUP.
static const sigset_t l_UnixWorkerSignals = ([]() -> sigset_t {
	const int signals[] = { SIGUSR1, SIGUSR2, SIGINT, SIGTERM, SIGHUP };

	sigset_t s;

	(void)sigemptyset(&s);

	for (int sig : signals) {
		(void)sigaddset(&s, sig);
	}

	return s;
})();
2020-12-25 23:27:08 +01:00
// The PID of the seamless worker currently being started by StartUnixWorker() (-1 if none)
static Atomic<pid_t> l_CurrentlyStartingUnixWorkerPid (-1);

// The state of the seamless worker currently being started by StartUnixWorker():
// true once that worker signalled (SIGUSR2) that it loaded its config
static Atomic<bool> l_CurrentlyStartingUnixWorkerReady (false);

// The last termination signal we received (-1 if none)
static Atomic<int> l_TermSignal (-1);

// Whether someone requested to re-load config (and we didn't handle that request, yet)
static Atomic<bool> l_RequestedReload (false);

// Whether someone requested to re-open logs (and we didn't handle that request, yet)
static Atomic<bool> l_RequestedReopenLogs (false);
2019-07-16 11:11:10 +02:00
/**
* Umbrella process' signal handlers
*/
static void UmbrellaSignalHandler(int num, siginfo_t *info, void*)
{
switch (num) {
2019-07-15 18:36:34 +02:00
case SIGUSR1:
2019-07-16 11:11:10 +02:00
// Someone requested to re-open logs
2019-07-15 18:36:34 +02:00
l_RequestedReopenLogs.store(true);
break;
case SIGUSR2:
2022-10-07 15:14:33 +02:00
if (!l_CurrentlyStartingUnixWorkerReady.load()
&& (info->si_pid == 0 || info->si_pid == l_CurrentlyStartingUnixWorkerPid.load()) ) {
2020-12-25 23:27:08 +01:00
// The seamless worker currently being started by StartUnixWorker() successfully loaded its config
2022-10-07 15:14:33 +02:00
l_CurrentlyStartingUnixWorkerReady.store(true);
}
break;
case SIGINT:
case SIGTERM:
2019-07-16 11:11:10 +02:00
// Someone requested our termination
{
struct sigaction sa;
memset(&sa, 0, sizeof(sa));
sa.sa_handler = SIG_DFL;
(void)sigaction(num, &sa, nullptr);
}
l_TermSignal.store(num);
2019-07-15 12:11:19 +02:00
break;
case SIGHUP:
2019-07-16 11:11:10 +02:00
// Someone requested to re-load config
2019-07-15 12:11:19 +02:00
l_RequestedReload.store(true);
2019-07-15 15:09:35 +02:00
break;
default:
2019-07-16 11:11:10 +02:00
// Programming error (or someone has broken the userspace)
2019-07-15 15:09:35 +02:00
VERIFY(!"Caught unexpected signal");
}
}
2019-07-16 11:11:10 +02:00
/**
2020-12-25 23:27:08 +01:00
* Seamless worker's signal handlers
2019-07-16 11:11:10 +02:00
*/
static void WorkerSignalHandler(int num, siginfo_t *info, void*)
{
switch (num) {
case SIGUSR1:
// Catches SIGUSR1 as long as the actual handler (logrotate)
// has not been installed not to let SIGUSR1 terminate the process
break;
2019-07-15 12:11:19 +02:00
case SIGUSR2:
if (info->si_pid == 0 || info->si_pid == l_UmbrellaPid) {
2019-07-16 11:11:10 +02:00
// The umbrella process allowed us to continue working beyond config validation
2019-07-15 12:11:19 +02:00
l_AllowedToWork.store(true);
}
break;
case SIGINT:
case SIGTERM:
if (info->si_pid == 0 || info->si_pid == l_UmbrellaPid) {
2019-07-16 11:11:10 +02:00
// The umbrella process requested our termination
Application::RequestShutdown();
}
2019-07-15 15:09:35 +02:00
break;
default:
2019-07-16 11:11:10 +02:00
// Programming error (or someone has broken the userspace)
2019-07-15 15:09:35 +02:00
VERIFY(!"Caught unexpected signal");
}
}
2019-07-15 16:58:34 +02:00
#ifdef HAVE_SYSTEMD
// When we last notified the watchdog (as returned by Utility::GetTime(), 0 if never).
static Atomic<double> l_LastNotifiedWatchdog (0);

/**
 * Notify the watchdog if not notified during the last 2.5s.
 *
 * Meant to be called frequently from polling loops; the rate limit
 * keeps the number of sd_notify() calls low.
 */
static void NotifyWatchdog()
{
	double now = Utility::GetTime();

	if (now - l_LastNotifiedWatchdog.load() >= 2.5) {
		sd_notify(0, "WATCHDOG=1");
		l_LastNotifiedWatchdog.store(now);
	}
}
#endif /* HAVE_SYSTEMD */
2019-07-16 11:11:10 +02:00
/**
2020-12-25 23:27:08 +01:00
* Starts seamless worker process doing the actual work (config loading, ...)
2019-07-16 11:11:10 +02:00
*
* @param configs Files to read config from
* @param closeConsoleLog Whether to close the console log after config loading
* @param stderrFile Where to log errors
2019-07-16 11:11:10 +02:00
*
* @return The worker's PID on success, -1 on fork(2) failure, -2 if the worker couldn't load its config
2019-07-16 11:11:10 +02:00
*/
static pid_t StartUnixWorker(const std::vector<std::string>& configs, bool closeConsoleLog = false, const String& stderrFile = String())
{
2019-07-16 11:43:47 +02:00
Log(LogNotice, "cli")
2020-12-25 23:27:08 +01:00
<< "Spawning seamless worker process doing the actual work";
2019-07-15 18:29:15 +02:00
try {
Application::UninitializeBase();
} catch (const std::exception& ex) {
Log(LogCritical, "cli")
<< "Failed to stop thread pool before forking, unexpected error: " << DiagnosticInformation(ex);
exit(EXIT_FAILURE);
}
2019-07-16 11:11:10 +02:00
/* Block the signal handlers we'd like to change in the child process until we changed them.
* Block SIGUSR2 handler until we've set l_CurrentlyStartingUnixWorkerPid.
2019-07-16 11:11:10 +02:00
*/
(void)sigprocmask(SIG_BLOCK, &l_UnixWorkerSignals, nullptr);
pid_t pid = fork();
switch (pid) {
case -1:
Log(LogCritical, "cli")
<< "fork() failed with error code " << errno << ", \"" << Utility::FormatErrorNumber(errno) << "\"";
try {
Application::InitializeBase();
} catch (const std::exception& ex) {
Log(LogCritical, "cli")
<< "Failed to re-initialize thread pool after forking (parent): " << DiagnosticInformation(ex);
exit(EXIT_FAILURE);
}
(void)sigprocmask(SIG_UNBLOCK, &l_UnixWorkerSignals, nullptr);
return -1;
case 0:
try {
{
struct sigaction sa;
memset(&sa, 0, sizeof(sa));
sa.sa_handler = SIG_DFL;
2019-07-15 18:36:34 +02:00
(void)sigaction(SIGUSR1, &sa, nullptr);
2019-07-15 12:11:19 +02:00
(void)sigaction(SIGHUP, &sa, nullptr);
}
{
struct sigaction sa;
memset(&sa, 0, sizeof(sa));
sa.sa_sigaction = &WorkerSignalHandler;
sa.sa_flags = SA_RESTART | SA_SIGINFO;
(void)sigaction(SIGUSR1, &sa, nullptr);
2019-07-15 12:11:19 +02:00
(void)sigaction(SIGUSR2, &sa, nullptr);
(void)sigaction(SIGINT, &sa, nullptr);
(void)sigaction(SIGTERM, &sa, nullptr);
}
(void)sigprocmask(SIG_UNBLOCK, &l_UnixWorkerSignals, nullptr);
try {
Application::InitializeBase();
} catch (const std::exception& ex) {
Log(LogCritical, "cli")
<< "Failed to re-initialize thread pool after forking (child): " << DiagnosticInformation(ex);
_exit(EXIT_FAILURE);
}
try {
Process::InitializeSpawnHelper();
} catch (const std::exception& ex) {
Log(LogCritical, "cli")
<< "Failed to initialize process spawn helper after forking (child): " << DiagnosticInformation(ex);
_exit(EXIT_FAILURE);
}
_exit(RunWorker(configs, closeConsoleLog, stderrFile));
} catch (const std::exception& ex) {
Log(LogCritical, "cli") << "Exception in main process: " << DiagnosticInformation(ex);
_exit(EXIT_FAILURE);
} catch (...) {
_exit(EXIT_FAILURE);
}
default:
l_CurrentlyStartingUnixWorkerPid.store(pid);
(void)sigprocmask(SIG_UNBLOCK, &l_UnixWorkerSignals, nullptr);
2019-07-16 11:43:47 +02:00
Log(LogNotice, "cli")
<< "Spawned worker process (PID " << pid << "), waiting for it to load its config";
2019-07-15 18:29:15 +02:00
2019-07-16 11:11:10 +02:00
// Wait for the newly spawned process to either load its config or fail.
for (;;) {
2019-07-15 16:58:34 +02:00
#ifdef HAVE_SYSTEMD
NotifyWatchdog();
#endif /* HAVE_SYSTEMD */
if (waitpid(pid, nullptr, WNOHANG) > 0) {
Log(LogNotice, "cli")
<< "Worker process couldn't load its config";
2019-07-15 18:29:15 +02:00
pid = -2;
break;
}
2022-10-07 15:14:33 +02:00
if (l_CurrentlyStartingUnixWorkerReady.load()) {
Log(LogNotice, "cli")
<< "Worker process successfully loaded its config";
break;
}
Utility::Sleep(0.2);
}
2019-07-16 11:11:10 +02:00
// Reset flags for the next time
l_CurrentlyStartingUnixWorkerPid.store(-1);
2022-10-07 15:14:33 +02:00
l_CurrentlyStartingUnixWorkerReady.store(false);
try {
Application::InitializeBase();
} catch (const std::exception& ex) {
Log(LogCritical, "cli")
<< "Failed to re-initialize thread pool after forking (parent): " << DiagnosticInformation(ex);
exit(EXIT_FAILURE);
}
}
return pid;
}
2019-07-15 16:08:08 +02:00
2019-07-16 11:11:10 +02:00
/**
* Workaround to instantiate Application (which is abstract) in DaemonCommand#Run()
*/
2019-07-15 16:08:08 +02:00
class PidFileManagementApp : public Application
{
public:
inline int Main() override
{
return EXIT_FAILURE;
}
};
#endif /* _WIN32 */
/**
 * The entry point for the "daemon" CLI command.
 *
 * Overview:
 *  - With --validate: load the config files, report the result and return.
 *  - Refuse to start if the PID file refers to a running instance.
 *  - With --daemonize: detach via Daemonize() and close the console log.
 *  - On Windows: run the worker directly in this process.
 *  - Elsewhere: act as the umbrella process, i.e. install UmbrellaSignalHandler(),
 *    start a worker via StartUnixWorker() and loop, handling termination,
 *    reload (SIGHUP) and log re-opening (SIGUSR1) requests until the current worker exits.
 *
 * @param vm The parsed command-line options
 * @param ap Additional parameters (not used by this command)
 *
 * @returns An exit status.
 */
int DaemonCommand::Run(const po::variables_map& vm, const std::vector<std::string>& ap) const
{
#ifdef _WIN32
	// 65001 is the UTF-8 code page
	SetConsoleOutputCP(65001);
#endif /* _WIN32 */

	Logger::EnableTimestamp();

	Log(LogInformation, "cli")
		<< "Icinga application loader (version: " << Application::GetAppVersion()
#ifdef I2_DEBUG
		<< "; debug"
#endif /* I2_DEBUG */
		<< ")";

	std::vector<std::string> configs;
	if (vm.count("config") > 0)
		configs = vm["config"].as<std::vector<std::string> >();
	else if (!vm.count("no-config")) {
		/* The implicit string assignment is needed for Windows builds. */
		String configDir = Configuration::ConfigDir;
		configs.push_back(configDir + "/icinga2.conf");
	}

	if (vm.count("validate")) {
		Log(LogInformation, "cli", "Loading configuration file(s).");

		std::vector<ConfigItem::Ptr> newItems;

		if (!DaemonUtility::LoadConfigFiles(configs, newItems, Configuration::ObjectsPath, Configuration::VarsPath)) {
			Log(LogCritical, "cli", "Config validation failed. Re-run with 'icinga2 daemon -C' after fixing the config.");
			return EXIT_FAILURE;
		}

		Log(LogInformation, "cli", "Finished validating the configuration file(s).");
		return EXIT_SUCCESS;
	}

	{
		pid_t runningpid = Application::ReadPidFile(Configuration::PidPath);
		if (runningpid > 0) {
			Log(LogCritical, "cli")
				<< "Another instance of Icinga already running with PID " << runningpid;
			return EXIT_FAILURE;
		}
	}

	if (vm.count("daemonize")) {
		// this subroutine either succeeds, or logs an error
		// and terminates the process (does not return).
		Daemonize();
	}

#ifndef _WIN32
	/* The Application manages the PID file,
	 * but on *nix this process doesn't load any config
	 * so there's no central Application instance.
	 */
	PidFileManagementApp app;

	try {
		app.UpdatePidFile(Configuration::PidPath);
	} catch (const std::exception&) {
		Log(LogCritical, "Application")
			<< "Cannot update PID file '" << Configuration::PidPath << "'. Aborting.";
		return EXIT_FAILURE;
	}

	// Close the PID file again whenever this function is left.
	Defer closePidFile ([&app]() {
		app.ClosePidFile(true);
	});
#endif /* _WIN32 */

	if (vm.count("daemonize")) {
		// After disabling the console log, any further errors will go to the configured log only.
		// Let's try to make this clear and say good bye.
		Log(LogInformation, "cli", "Closing console log.");

		String errorLog;
		if (vm.count("errorlog"))
			errorLog = vm["errorlog"].as<std::string>();

		CloseStdIO(errorLog);
		Logger::DisableConsoleLog();
	}

#ifdef _WIN32
	try {
		return RunWorker(configs);
	} catch (const std::exception& ex) {
		Log(LogCritical, "cli") << "Exception in main process: " << DiagnosticInformation(ex);
		return EXIT_FAILURE;
	} catch (...) {
		return EXIT_FAILURE;
	}
#else /* _WIN32 */
	l_UmbrellaPid = getpid();
	Application::SetUmbrellaProcess(l_UmbrellaPid);

	{
		struct sigaction sa;
		memset(&sa, 0, sizeof(sa));

		sa.sa_sigaction = &UmbrellaSignalHandler;
		sa.sa_flags = SA_NOCLDSTOP | SA_RESTART | SA_SIGINFO;

		(void)sigaction(SIGUSR1, &sa, nullptr);
		(void)sigaction(SIGUSR2, &sa, nullptr);
		(void)sigaction(SIGINT, &sa, nullptr);
		(void)sigaction(SIGTERM, &sa, nullptr);
		(void)sigaction(SIGHUP, &sa, nullptr);
	}

	// With --daemonize the console log has already been closed above.
	bool closeConsoleLog = !vm.count("daemonize") && vm.count("close-stdio");

	String errorLog;
	if (vm.count("errorlog"))
		errorLog = vm["errorlog"].as<std::string>();

	// The PID of the current seamless worker
	pid_t currentWorker = StartUnixWorker(configs, closeConsoleLog, errorLog);

	if (currentWorker < 0) {
		return EXIT_FAILURE;
	}

	if (closeConsoleLog) {
		// After disabling the console log, any further errors will go to the configured log only.
		// Let's try to make this clear and say good bye.
		Log(LogInformation, "cli", "Closing console log.");

		CloseStdIO(errorLog);
		Logger::DisableConsoleLog();
	}

	// Immediately allow the first (non-reload) worker to continue working beyond config validation
	(void)kill(currentWorker, SIGUSR2);

#ifdef HAVE_SYSTEMD
	sd_notify(0, "READY=1");
#endif /* HAVE_SYSTEMD */

	// Whether we already forwarded a termination signal to the seamless worker
	bool requestedTermination = false;

	// Whether we already notified systemd about our termination
	bool notifiedTermination = false;

	// Main loop of the umbrella process: poll the flags set by UmbrellaSignalHandler() every 0.2s.
	for (;;) {
#ifdef HAVE_SYSTEMD
		NotifyWatchdog();
#endif /* HAVE_SYSTEMD */

		if (!requestedTermination) {
			int termSig = l_TermSignal.load();
			if (termSig != -1) {
				Log(LogNotice, "cli")
					<< "Got signal " << termSig << ", forwarding to seamless worker (PID " << currentWorker << ")";

				(void)kill(currentWorker, termSig);
				requestedTermination = true;

#ifdef HAVE_SYSTEMD
				if (!notifiedTermination) {
					notifiedTermination = true;
					sd_notify(0, "STOPPING=1");
				}
#endif /* HAVE_SYSTEMD */
			}
		}

		if (l_RequestedReload.exchange(false)) {
			Log(LogInformation, "Application")
				<< "Got reload command: Starting new instance.";

#ifdef HAVE_SYSTEMD
			sd_notify(0, "RELOADING=1");
#endif /* HAVE_SYSTEMD */

			pid_t nextWorker = StartUnixWorker(configs);

			switch (nextWorker) {
				case -1:
					// fork(2) failed, StartUnixWorker() already logged that. Keep the current worker.
					break;
				case -2:
					Log(LogCritical, "Application", "Found error in config: reloading aborted");
					break;
				default:
					Log(LogInformation, "Application")
						<< "Reload done, old process shutting down. Child process with PID '" << nextWorker << "' is taking over.";

					NotifyStatus("Shutting down old instance...");

					(void)kill(currentWorker, SIGTERM);

					{
						double start = Utility::GetTime();

						// Blocking wait for the old worker, retried if interrupted by a signal.
						while (waitpid(currentWorker, nullptr, 0) == -1 && errno == EINTR) {
#ifdef HAVE_SYSTEMD
							NotifyWatchdog();
#endif /* HAVE_SYSTEMD */
						}

						Log(LogNotice, "cli")
							<< "Waited for " << Utility::FormatDuration(Utility::GetTime() - start) << " on old process to exit.";
					}

					// Old instance shut down, allow the new one to continue working beyond config validation
					(void)kill(nextWorker, SIGUSR2);

					NotifyStatus("Shut down old instance.");

					currentWorker = nextWorker;
			}

#ifdef HAVE_SYSTEMD
			sd_notify(0, "READY=1");
#endif /* HAVE_SYSTEMD */
		}

		if (l_RequestedReopenLogs.exchange(false)) {
			Log(LogNotice, "cli")
				<< "Got signal " << SIGUSR1 << ", forwarding to seamless worker (PID " << currentWorker << ")";

			(void)kill(currentWorker, SIGUSR1);
		}

		{
			int status;
			if (waitpid(currentWorker, &status, WNOHANG) > 0) {
				Log(LogNotice, "cli")
					<< "Seamless worker (PID " << currentWorker << ") stopped, stopping as well";

#ifdef HAVE_SYSTEMD
				if (!notifiedTermination) {
					notifiedTermination = true;
					sd_notify(0, "STOPPING=1");
				}
#endif /* HAVE_SYSTEMD */

				// If killed by signal, forward it via the exit code (to be as seamless as possible)
				return WIFSIGNALED(status) ? 128 + WTERMSIG(status) : WEXITSTATUS(status);
			}
		}

		Utility::Sleep(0.2);
	}
#endif /* _WIN32 */
}