1
0
Fork 0
arangodb/lib/ApplicationFeatures/SupervisorFeature.cpp

241 lines
7.5 KiB
C++

////////////////////////////////////////////////////////////////////////////////
/// DISCLAIMER
///
/// Copyright 2016 ArangoDB GmbH, Cologne, Germany
///
/// Licensed under the Apache License, Version 2.0 (the "License");
/// you may not use this file except in compliance with the License.
/// You may obtain a copy of the License at
///
/// http://www.apache.org/licenses/LICENSE-2.0
///
/// Unless required by applicable law or agreed to in writing, software
/// distributed under the License is distributed on an "AS IS" BASIS,
/// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
/// See the License for the specific language governing permissions and
/// limitations under the License.
///
/// Copyright holder is ArangoDB GmbH, Cologne, Germany
///
/// @author Dr. Frank Celler
////////////////////////////////////////////////////////////////////////////////
#include "SupervisorFeature.h"
#include "ApplicationFeatures/LoggerFeature.h"
#include "ApplicationFeatures/DaemonFeature.h"
#include "Basics/ArangoGlobalContext.h"
#include "ProgramOptions/ProgramOptions.h"
#include "ProgramOptions/Section.h"
using namespace arangodb;
using namespace arangodb::application_features;
using namespace arangodb::basics;
using namespace arangodb::options;
SupervisorFeature::SupervisorFeature(
application_features::ApplicationServer* server)
: ApplicationFeature(server, "Supervisor"), _supervisor(false) {
setOptional(true);
requiresElevatedPrivileges(false);
startsAfter("Daemon");
startsAfter("Logger");
startsAfter("WorkMonitor");
}
void SupervisorFeature::collectOptions(
std::shared_ptr<ProgramOptions> options) {
LOG_TOPIC(TRACE, Logger::STARTUP) << name() << "::collectOptions";
options->addSection(
Section("", "Global configuration", "global options", false, false));
options->addHiddenOption("--supervisor",
"background the server, starts a supervisor",
new BooleanParameter(&_supervisor, false));
}
void SupervisorFeature::validateOptions(
std::shared_ptr<ProgramOptions> options) {
LOG_TOPIC(TRACE, Logger::STARTUP) << name() << "::validateOptions";
if (_supervisor) {
DaemonFeature* daemon = dynamic_cast<DaemonFeature*>(
ApplicationServer::lookupFeature("Daemon"));
if (daemon == nullptr) {
LOG(FATAL) << "daemon mode not available, cannot start supervisor";
FATAL_ERROR_EXIT();
}
// force daemon mode
daemon->setDaemon(true);
// revalidate options
daemon->validateOptions(options);
}
}
void SupervisorFeature::daemonize() {
LOG_TOPIC(TRACE, Logger::STARTUP) << name() << "::daemonize";
static time_t const MIN_TIME_ALIVE_IN_SEC = 30;
if (!_supervisor) {
return;
}
time_t startTime = time(0);
time_t t;
bool done = false;
int result = EXIT_SUCCESS;
std::vector<ApplicationFeature*> supervisorFeatures(_supervisorStart.size());
std::transform(_supervisorStart.begin(), _supervisorStart.end(),
supervisorFeatures.begin(), [](std::string const& name) {
ApplicationFeature* feature =
ApplicationServer::lookupFeature(name);
if (feature == nullptr) {
LOG_TOPIC(FATAL, Logger::STARTUP)
<< "unknown feature '" << name << "', giving up";
FATAL_ERROR_EXIT();
}
return feature;
});
while (!done) {
// fork of the server
_clientPid = fork();
if (_clientPid < 0) {
LOG_TOPIC(FATAL, Logger::STARTUP) << "fork failed, giving up";
FATAL_ERROR_EXIT();
}
// parent (supervisor)
if (0 < _clientPid) {
LOG_TOPIC(DEBUG, Logger::STARTUP) << "supervisor mode: within parent";
TRI_SetProcessTitle("arangodb [supervisor]");
ArangoGlobalContext::CONTEXT->unmaskStandardSignals();
std::for_each(supervisorFeatures.begin(), supervisorFeatures.end(),
[](ApplicationFeature* feature) {
LoggerFeature* logger =
dynamic_cast<LoggerFeature*>(feature);
if (logger != nullptr) {
logger->setSupervisor(true);
logger->setThreaded(false);
}
});
std::for_each(supervisorFeatures.begin(), supervisorFeatures.end(),
[](ApplicationFeature* feature) { feature->prepare(); });
std::for_each(supervisorFeatures.begin(), supervisorFeatures.end(),
[](ApplicationFeature* feature) { feature->start(); });
int status;
waitpid(_clientPid, &status, 0);
bool horrible = true;
if (WIFEXITED(status)) {
// give information about cause of death
if (WEXITSTATUS(status) == 0) {
LOG_TOPIC(INFO, Logger::STARTUP) << "child " << _clientPid
<< " died of natural causes";
done = true;
horrible = false;
} else {
t = time(0) - startTime;
LOG_TOPIC(ERR, Logger::STARTUP)
<< "child " << _clientPid
<< " died a horrible death, exit status " << WEXITSTATUS(status);
if (t < MIN_TIME_ALIVE_IN_SEC) {
LOG_TOPIC(ERR, Logger::STARTUP)
<< "child only survived for " << t
<< " seconds, this will not work - please fix the error "
"first";
done = true;
} else {
done = false;
}
}
} else if (WIFSIGNALED(status)) {
switch (WTERMSIG(status)) {
case 2:
case 9:
case 15:
LOG_TOPIC(INFO, Logger::STARTUP)
<< "child " << _clientPid
<< " died of natural causes, exit status " << WTERMSIG(status);
done = true;
horrible = false;
break;
default:
t = time(0) - startTime;
LOG_TOPIC(ERR, Logger::STARTUP) << "child " << _clientPid
<< " died a horrible death, signal "
<< WTERMSIG(status);
if (t < MIN_TIME_ALIVE_IN_SEC) {
LOG_TOPIC(ERR, Logger::STARTUP)
<< "child only survived for " << t
<< " seconds, this will not work - please fix the "
"error first";
done = true;
#ifdef WCOREDUMP
if (WCOREDUMP(status)) {
LOG_TOPIC(WARN, Logger::STARTUP) << "child process "
<< _clientPid
<< " produced a core dump";
}
#endif
} else {
done = false;
}
break;
}
} else {
LOG_TOPIC(ERR, Logger::STARTUP)
<< "child " << _clientPid
<< " died a horrible death, unknown cause";
done = false;
}
// remove pid file
if (horrible) {
result = EXIT_FAILURE;
}
}
// child - run the normal boot sequence
else {
LOG_TOPIC(DEBUG, Logger::STARTUP) << "supervisor mode: within child";
TRI_SetProcessTitle("arangodb [server]");
#ifdef TRI_HAVE_PRCTL
// force child to stop if supervisor dies
prctl(PR_SET_PDEATHSIG, SIGTERM, 0, 0, 0);
#endif
return;
}
}
std::for_each(supervisorFeatures.rbegin(), supervisorFeatures.rend(),
[](ApplicationFeature* feature) { feature->stop(); });
exit(result);
}