2016-02-09 17:06:50 +00:00
|
|
|
#include <daemon/BaseDaemon.h>
|
2020-05-27 19:11:04 +00:00
|
|
|
#include <daemon/SentryWriter.h>
|
2019-12-22 17:20:33 +00:00
|
|
|
|
2016-01-15 03:55:07 +00:00
|
|
|
#include <sys/stat.h>
|
|
|
|
#include <sys/types.h>
|
|
|
|
#include <sys/time.h>
|
2020-12-22 02:57:22 +00:00
|
|
|
#include <sys/wait.h>
|
|
|
|
#include <sys/resource.h>
|
2020-12-22 03:17:31 +00:00
|
|
|
#if defined(__linux__)
|
|
|
|
#include <sys/prctl.h>
|
|
|
|
#endif
|
2019-01-19 21:05:20 +00:00
|
|
|
#include <fcntl.h>
|
2016-01-15 03:55:07 +00:00
|
|
|
#include <errno.h>
|
|
|
|
#include <string.h>
|
|
|
|
#include <signal.h>
|
|
|
|
#include <cxxabi.h>
|
2018-08-12 12:23:22 +00:00
|
|
|
#include <unistd.h>
|
2017-06-23 05:16:34 +00:00
|
|
|
|
2016-01-15 03:55:07 +00:00
|
|
|
#include <typeinfo>
|
|
|
|
#include <iostream>
|
2017-11-16 19:09:08 +00:00
|
|
|
#include <fstream>
|
2017-08-18 01:00:13 +00:00
|
|
|
#include <sstream>
|
2017-03-21 19:08:09 +00:00
|
|
|
#include <memory>
|
2020-01-10 18:35:39 +00:00
|
|
|
#include <ext/scope_guard.h>
|
2019-12-22 17:20:33 +00:00
|
|
|
|
2016-01-15 03:55:07 +00:00
|
|
|
#include <Poco/Observer.h>
|
|
|
|
#include <Poco/AutoPtr.h>
|
|
|
|
#include <Poco/PatternFormatter.h>
|
|
|
|
#include <Poco/File.h>
|
|
|
|
#include <Poco/Path.h>
|
|
|
|
#include <Poco/Message.h>
|
2018-02-08 19:12:37 +00:00
|
|
|
#include <Poco/Util/Application.h>
|
2016-01-15 03:55:07 +00:00
|
|
|
#include <Poco/Exception.h>
|
|
|
|
#include <Poco/ErrorHandler.h>
|
|
|
|
#include <Poco/Condition.h>
|
|
|
|
#include <Poco/SyslogChannel.h>
|
2018-08-12 12:23:22 +00:00
|
|
|
#include <Poco/DirectoryIterator.h>
|
2019-12-22 17:20:33 +00:00
|
|
|
|
|
|
|
#include <common/logger_useful.h>
|
|
|
|
#include <common/ErrorHandlers.h>
|
|
|
|
#include <common/argsToConfig.h>
|
2020-02-02 02:35:47 +00:00
|
|
|
#include <common/getThreadId.h>
|
2019-12-23 16:41:23 +00:00
|
|
|
#include <common/coverage.h>
|
2020-06-20 10:15:53 +00:00
|
|
|
#include <common/sleep.h>
|
2019-12-22 17:20:33 +00:00
|
|
|
|
2019-07-25 12:49:14 +00:00
|
|
|
#include <IO/WriteBufferFromFile.h>
|
2019-08-17 20:33:50 +00:00
|
|
|
#include <IO/WriteBufferFromFileDescriptorDiscardOnFailure.h>
|
2017-04-01 09:19:00 +00:00
|
|
|
#include <IO/ReadBufferFromFileDescriptor.h>
|
|
|
|
#include <IO/ReadHelpers.h>
|
|
|
|
#include <IO/WriteHelpers.h>
|
2019-12-22 17:20:33 +00:00
|
|
|
#include <Common/Exception.h>
|
|
|
|
#include <Common/PipeFDs.h>
|
|
|
|
#include <Common/StackTrace.h>
|
2017-04-01 09:19:00 +00:00
|
|
|
#include <Common/getMultipleKeysFromConfig.h>
|
|
|
|
#include <Common/ClickHouseRevision.h>
|
2019-12-22 17:20:33 +00:00
|
|
|
#include <Common/Config/ConfigProcessor.h>
|
2020-07-31 14:53:41 +00:00
|
|
|
#include <Common/MemorySanitizer.h>
|
2020-06-20 09:07:05 +00:00
|
|
|
#include <Common/SymbolIndex.h>
|
2016-01-15 03:55:07 +00:00
|
|
|
|
2020-04-16 12:31:57 +00:00
|
|
|
#if !defined(ARCADIA_BUILD)
|
2020-05-10 22:17:28 +00:00
|
|
|
# include <Common/config_version.h>
|
2020-04-16 12:31:57 +00:00
|
|
|
#endif
|
|
|
|
|
|
|
|
#if defined(OS_DARWIN)
|
2020-05-10 22:17:28 +00:00
|
|
|
# pragma GCC diagnostic ignored "-Wunused-macros"
|
|
|
|
# define _XOPEN_SOURCE 700 // ucontext is not available without _XOPEN_SOURCE
|
2019-03-27 15:42:24 +00:00
|
|
|
#endif
|
|
|
|
#include <ucontext.h>
|
|
|
|
|
|
|
|
|
2019-12-22 17:20:33 +00:00
|
|
|
DB::PipeFDs signal_pipe;
|
2016-01-15 03:55:07 +00:00
|
|
|
|
|
|
|
|
2018-01-17 18:06:39 +00:00
|
|
|
/** Reset signal handler to the default and send signal to itself.
|
|
|
|
* It's called from user signal handler to write core dump.
|
2016-01-15 03:55:07 +00:00
|
|
|
*/
|
|
|
|
static void call_default_signal_handler(int sig)
|
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
signal(sig, SIG_DFL);
|
2018-08-20 23:16:50 +00:00
|
|
|
raise(sig);
|
2016-01-15 03:55:07 +00:00
|
|
|
}
|
|
|
|
|
2021-01-05 13:19:27 +00:00
|
|
|
// Apparently strsignal is not instrumented by MemorySanitizer, so we
|
|
|
|
// have to unpoison it to avoid msan reports inside fmt library when we
|
|
|
|
// print it.
|
2020-07-31 14:53:41 +00:00
|
|
|
const char * msan_strsignal(int sig)
|
|
|
|
{
|
2021-01-05 13:19:27 +00:00
|
|
|
// no glibc in osx/freebsd
|
|
|
|
#if !defined(__GLIBC_PREREQ)
|
|
|
|
#define __GLIBC_PREREQ(x, y) 0
|
|
|
|
#endif
|
|
|
|
|
|
|
|
// glibc 2.32+ deprecates sys_siglist[]
|
|
|
|
// newer glibc is a problem only for unbundled build.
|
|
|
|
#if __GLIBC_PREREQ(2, 32)
|
|
|
|
const char * signal_name = sigdescr_np(sig);
|
|
|
|
#else
|
2020-12-21 00:28:19 +00:00
|
|
|
const char * signal_name = sys_siglist[sig];
|
2021-01-05 13:19:27 +00:00
|
|
|
#endif
|
|
|
|
|
2020-07-31 14:53:41 +00:00
|
|
|
__msan_unpoison_string(signal_name);
|
|
|
|
return signal_name;
|
|
|
|
}
|
2016-01-15 03:55:07 +00:00
|
|
|
|
2019-12-23 20:19:49 +00:00
|
|
|
static constexpr size_t max_query_id_size = 127;
|
|
|
|
|
2020-05-09 23:22:51 +00:00
|
|
|
static const size_t signal_pipe_buf_size =
|
2019-12-23 20:19:49 +00:00
|
|
|
sizeof(int)
|
|
|
|
+ sizeof(siginfo_t)
|
|
|
|
+ sizeof(ucontext_t)
|
|
|
|
+ sizeof(StackTrace)
|
|
|
|
+ sizeof(UInt32)
|
2020-06-20 10:10:18 +00:00
|
|
|
+ max_query_id_size + 1 /// query_id + varint encoded length
|
|
|
|
+ sizeof(void*);
|
2019-12-22 17:20:33 +00:00
|
|
|
|
2016-01-15 03:55:07 +00:00
|
|
|
|
2016-06-08 14:39:19 +00:00
|
|
|
using signal_function = void(int, siginfo_t*, void*);
|
2016-01-15 03:55:07 +00:00
|
|
|
|
2016-06-08 14:39:19 +00:00
|
|
|
static void writeSignalIDtoSignalPipe(int sig)
|
2016-01-15 03:55:07 +00:00
|
|
|
{
|
2020-03-01 14:23:43 +00:00
|
|
|
auto saved_errno = errno; /// We must restore previous value of errno in signal handler.
|
|
|
|
|
2020-05-09 23:22:51 +00:00
|
|
|
char buf[signal_pipe_buf_size];
|
|
|
|
DB::WriteBufferFromFileDescriptor out(signal_pipe.fds_rw[1], signal_pipe_buf_size, buf);
|
2017-04-01 07:20:54 +00:00
|
|
|
DB::writeBinary(sig, out);
|
|
|
|
out.next();
|
2020-03-01 14:23:43 +00:00
|
|
|
|
|
|
|
errno = saved_errno;
|
2016-01-15 03:55:07 +00:00
|
|
|
}
|
|
|
|
|
2018-01-17 18:06:39 +00:00
|
|
|
/** Signal handler for HUP / USR1 */
|
2020-03-18 03:27:32 +00:00
|
|
|
static void closeLogsSignalHandler(int sig, siginfo_t *, void *)
|
2016-06-08 14:39:19 +00:00
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
writeSignalIDtoSignalPipe(sig);
|
2016-06-08 14:39:19 +00:00
|
|
|
}
|
|
|
|
|
2020-03-18 03:27:32 +00:00
|
|
|
static void terminateRequestedSignalHandler(int sig, siginfo_t *, void *)
|
2016-06-08 14:39:19 +00:00
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
writeSignalIDtoSignalPipe(sig);
|
2016-06-08 14:39:19 +00:00
|
|
|
}
|
|
|
|
|
2016-01-15 03:55:07 +00:00
|
|
|
|
2019-12-22 17:20:33 +00:00
|
|
|
/** Handler for "fault" or diagnostic signals. Send data about fault to separate thread to write into log.
|
2016-01-15 03:55:07 +00:00
|
|
|
*/
|
2019-12-22 17:20:33 +00:00
|
|
|
static void signalHandler(int sig, siginfo_t * info, void * context)
|
2016-01-15 03:55:07 +00:00
|
|
|
{
|
2020-03-01 14:23:43 +00:00
|
|
|
auto saved_errno = errno; /// We must restore previous value of errno in signal handler.
|
|
|
|
|
2020-05-09 23:22:51 +00:00
|
|
|
char buf[signal_pipe_buf_size];
|
|
|
|
DB::WriteBufferFromFileDescriptorDiscardOnFailure out(signal_pipe.fds_rw[1], signal_pipe_buf_size, buf);
|
2016-01-15 03:55:07 +00:00
|
|
|
|
2019-06-28 18:06:38 +00:00
|
|
|
const ucontext_t signal_context = *reinterpret_cast<ucontext_t *>(context);
|
2019-07-02 00:19:56 +00:00
|
|
|
const StackTrace stack_trace(signal_context);
|
2019-03-27 20:37:39 +00:00
|
|
|
|
2020-05-30 21:57:37 +00:00
|
|
|
StringRef query_id = DB::CurrentThread::getQueryId(); /// This is signal safe.
|
2019-12-23 20:19:49 +00:00
|
|
|
query_id.size = std::min(query_id.size, max_query_id_size);
|
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
DB::writeBinary(sig, out);
|
|
|
|
DB::writePODBinary(*info, out);
|
2019-06-28 18:06:38 +00:00
|
|
|
DB::writePODBinary(signal_context, out);
|
2019-07-02 00:19:56 +00:00
|
|
|
DB::writePODBinary(stack_trace, out);
|
2020-02-02 02:35:47 +00:00
|
|
|
DB::writeBinary(UInt32(getThreadId()), out);
|
2019-12-23 20:19:49 +00:00
|
|
|
DB::writeStringBinary(query_id, out);
|
2020-06-20 11:17:15 +00:00
|
|
|
DB::writePODBinary(DB::current_thread, out);
|
2016-01-15 03:55:07 +00:00
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
out.next();
|
2016-01-15 03:55:07 +00:00
|
|
|
|
2019-12-02 17:29:19 +00:00
|
|
|
if (sig != SIGTSTP) /// This signal is used for debugging.
|
2019-08-17 21:13:38 +00:00
|
|
|
{
|
|
|
|
/// The time that is usually enough for separate thread to print info into log.
|
2020-06-20 10:15:53 +00:00
|
|
|
sleepForSeconds(10);
|
2019-08-17 21:13:38 +00:00
|
|
|
call_default_signal_handler(sig);
|
|
|
|
}
|
2020-03-01 14:23:43 +00:00
|
|
|
|
|
|
|
errno = saved_errno;
|
2016-01-15 03:55:07 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
|
2020-08-01 15:54:44 +00:00
|
|
|
/// Avoid link time dependency on DB/Interpreters - will use this function only when linked.
|
|
|
|
__attribute__((__weak__)) void collectCrashLog(
|
|
|
|
Int32 signal, UInt64 thread_id, const String & query_id, const StackTrace & stack_trace);
|
|
|
|
|
|
|
|
|
2018-01-17 18:06:39 +00:00
|
|
|
/** The thread that read info about signal or std::terminate from pipe.
|
|
|
|
* On HUP / USR1, close log files (for new files to be opened later).
|
|
|
|
* On information about std::terminate, write it to log.
|
|
|
|
* On other signals, write info to log.
|
2016-01-15 03:55:07 +00:00
|
|
|
*/
|
|
|
|
class SignalListener : public Poco::Runnable
|
|
|
|
{
|
|
|
|
public:
|
2017-04-01 07:20:54 +00:00
|
|
|
enum Signals : int
|
|
|
|
{
|
|
|
|
StdTerminate = -1,
|
2020-07-09 02:00:48 +00:00
|
|
|
StopThread = -2,
|
|
|
|
SanitizerTrap = -3,
|
2017-04-01 07:20:54 +00:00
|
|
|
};
|
|
|
|
|
2017-09-07 21:04:48 +00:00
|
|
|
explicit SignalListener(BaseDaemon & daemon_)
|
2020-05-30 21:57:37 +00:00
|
|
|
: log(&Poco::Logger::get("BaseDaemon"))
|
2017-09-07 21:04:48 +00:00
|
|
|
, daemon(daemon_)
|
2017-04-01 07:20:54 +00:00
|
|
|
{
|
|
|
|
}
|
|
|
|
|
2020-05-09 23:22:51 +00:00
|
|
|
void run() override
|
2017-04-01 07:20:54 +00:00
|
|
|
{
|
2020-05-09 23:22:51 +00:00
|
|
|
char buf[signal_pipe_buf_size];
|
|
|
|
DB::ReadBufferFromFileDescriptor in(signal_pipe.fds_rw[0], signal_pipe_buf_size, buf);
|
2017-04-01 07:20:54 +00:00
|
|
|
|
|
|
|
while (!in.eof())
|
|
|
|
{
|
|
|
|
int sig = 0;
|
|
|
|
DB::readBinary(sig, in);
|
2019-12-09 13:52:52 +00:00
|
|
|
// We may log some specific signals afterwards, with different log
|
|
|
|
// levels and more info, but for completeness we log all signals
|
|
|
|
// here at trace level.
|
2020-03-26 09:59:25 +00:00
|
|
|
// Don't use strsignal here, because it's not thread-safe.
|
2020-05-23 22:24:01 +00:00
|
|
|
LOG_TRACE(log, "Received signal {}", sig);
|
2017-04-01 07:20:54 +00:00
|
|
|
|
|
|
|
if (sig == Signals::StopThread)
|
|
|
|
{
|
2020-05-23 22:24:01 +00:00
|
|
|
LOG_INFO(log, "Stop SignalListener thread");
|
2017-04-01 07:20:54 +00:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
else if (sig == SIGHUP || sig == SIGUSR1)
|
|
|
|
{
|
2020-05-23 22:24:01 +00:00
|
|
|
LOG_DEBUG(log, "Received signal to close logs.");
|
2019-06-14 14:00:37 +00:00
|
|
|
BaseDaemon::instance().closeLogs(BaseDaemon::instance().logger());
|
2020-05-23 22:24:01 +00:00
|
|
|
LOG_INFO(log, "Opened new log file after received signal.");
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
|
|
|
else if (sig == Signals::StdTerminate)
|
|
|
|
{
|
2019-12-22 17:20:33 +00:00
|
|
|
UInt32 thread_num;
|
2017-04-01 07:20:54 +00:00
|
|
|
std::string message;
|
|
|
|
|
|
|
|
DB::readBinary(thread_num, in);
|
|
|
|
DB::readBinary(message, in);
|
|
|
|
|
|
|
|
onTerminate(message, thread_num);
|
|
|
|
}
|
|
|
|
else if (sig == SIGINT ||
|
|
|
|
sig == SIGQUIT ||
|
|
|
|
sig == SIGTERM)
|
|
|
|
{
|
|
|
|
daemon.handleSignal(sig);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
siginfo_t info;
|
|
|
|
ucontext_t context;
|
2019-07-02 00:19:56 +00:00
|
|
|
StackTrace stack_trace(NoCapture{});
|
2019-12-22 17:20:33 +00:00
|
|
|
UInt32 thread_num;
|
2019-12-23 20:19:49 +00:00
|
|
|
std::string query_id;
|
2020-06-20 11:17:15 +00:00
|
|
|
DB::ThreadStatus * thread_ptr{};
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-07-09 02:00:48 +00:00
|
|
|
if (sig != SanitizerTrap)
|
|
|
|
{
|
|
|
|
DB::readPODBinary(info, in);
|
|
|
|
DB::readPODBinary(context, in);
|
|
|
|
}
|
|
|
|
|
2019-07-02 00:19:56 +00:00
|
|
|
DB::readPODBinary(stack_trace, in);
|
2017-04-01 07:20:54 +00:00
|
|
|
DB::readBinary(thread_num, in);
|
2019-12-23 20:19:49 +00:00
|
|
|
DB::readBinary(query_id, in);
|
2020-06-20 11:17:15 +00:00
|
|
|
DB::readPODBinary(thread_ptr, in);
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2019-08-17 21:42:47 +00:00
|
|
|
/// This allows to receive more signals if failure happens inside onFault function.
|
|
|
|
/// Example: segfault while symbolizing stack trace.
|
2020-06-20 10:10:18 +00:00
|
|
|
std::thread([=, this] { onFault(sig, info, context, stack_trace, thread_num, query_id, thread_ptr); }).detach();
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2016-01-15 03:55:07 +00:00
|
|
|
|
|
|
|
private:
|
2020-05-30 21:57:37 +00:00
|
|
|
Poco::Logger * log;
|
2017-04-01 07:20:54 +00:00
|
|
|
BaseDaemon & daemon;
|
2016-01-15 03:55:07 +00:00
|
|
|
|
2019-12-22 17:20:33 +00:00
|
|
|
void onTerminate(const std::string & message, UInt32 thread_num) const
|
2017-04-01 07:20:54 +00:00
|
|
|
{
|
2020-06-20 09:07:05 +00:00
|
|
|
LOG_FATAL(log, "(version {}{}, {}) (from thread {}) {}",
|
|
|
|
VERSION_STRING, VERSION_OFFICIAL, daemon.build_id_info, thread_num, message);
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
|
|
|
|
2019-12-23 20:19:49 +00:00
|
|
|
void onFault(
|
|
|
|
int sig,
|
|
|
|
const siginfo_t & info,
|
|
|
|
const ucontext_t & context,
|
|
|
|
const StackTrace & stack_trace,
|
|
|
|
UInt32 thread_num,
|
2020-06-20 10:10:18 +00:00
|
|
|
const std::string & query_id,
|
2020-06-20 11:17:15 +00:00
|
|
|
DB::ThreadStatus * thread_ptr) const
|
2017-04-01 07:20:54 +00:00
|
|
|
{
|
2020-06-20 11:17:15 +00:00
|
|
|
DB::ThreadStatus thread_status;
|
2019-12-23 20:19:49 +00:00
|
|
|
|
2020-06-20 10:10:18 +00:00
|
|
|
/// Send logs from this thread to client if possible.
|
|
|
|
/// It will allow client to see failure messages directly.
|
2020-06-20 11:17:15 +00:00
|
|
|
if (thread_ptr)
|
2019-12-23 20:19:49 +00:00
|
|
|
{
|
2020-06-20 10:10:18 +00:00
|
|
|
if (auto logs_queue = thread_ptr->getInternalTextLogsQueue())
|
|
|
|
DB::CurrentThread::attachInternalTextLogsQueue(logs_queue, DB::LogsLevel::trace);
|
2020-06-20 11:17:15 +00:00
|
|
|
}
|
2020-06-20 10:10:18 +00:00
|
|
|
|
2020-05-23 22:24:01 +00:00
|
|
|
LOG_FATAL(log, "########################################");
|
2019-12-23 20:19:49 +00:00
|
|
|
|
2020-06-20 09:07:05 +00:00
|
|
|
if (query_id.empty())
|
2019-12-23 20:19:49 +00:00
|
|
|
{
|
2020-06-20 09:07:05 +00:00
|
|
|
LOG_FATAL(log, "(version {}{}, {}) (from thread {}) (no query) Received signal {} ({})",
|
2020-07-31 14:53:41 +00:00
|
|
|
VERSION_STRING, VERSION_OFFICIAL, daemon.build_id_info,
|
|
|
|
thread_num, msan_strsignal(sig), sig);
|
2020-06-20 09:07:05 +00:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
LOG_FATAL(log, "(version {}{}, {}) (from thread {}) (query_id: {}) Received signal {} ({})",
|
2020-07-31 14:53:41 +00:00
|
|
|
VERSION_STRING, VERSION_OFFICIAL, daemon.build_id_info,
|
|
|
|
thread_num, query_id, msan_strsignal(sig), sig);
|
2019-12-23 20:19:49 +00:00
|
|
|
}
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-07-09 02:00:48 +00:00
|
|
|
String error_message;
|
|
|
|
|
|
|
|
if (sig != SanitizerTrap)
|
|
|
|
error_message = signalToErrorMessage(sig, info, context);
|
|
|
|
else
|
|
|
|
error_message = "Sanitizer trap.";
|
|
|
|
|
|
|
|
LOG_FATAL(log, error_message);
|
2019-08-17 21:27:25 +00:00
|
|
|
|
|
|
|
if (stack_trace.getSize())
|
|
|
|
{
|
2020-05-12 03:36:09 +00:00
|
|
|
/// Write bare stack trace (addresses) just in case if we will fail to print symbolized stack trace.
|
|
|
|
/// NOTE This still require memory allocations and mutex lock inside logger. BTW we can also print it to stderr using write syscalls.
|
|
|
|
|
2019-08-17 21:27:25 +00:00
|
|
|
std::stringstream bare_stacktrace;
|
|
|
|
bare_stacktrace << "Stack trace:";
|
|
|
|
for (size_t i = stack_trace.getOffset(); i < stack_trace.getSize(); ++i)
|
2020-05-27 19:11:04 +00:00
|
|
|
bare_stacktrace << ' ' << stack_trace.getFramePointers()[i];
|
2019-08-17 21:27:25 +00:00
|
|
|
|
2020-05-23 22:24:01 +00:00
|
|
|
LOG_FATAL(log, bare_stacktrace.str());
|
2019-08-17 21:27:25 +00:00
|
|
|
}
|
|
|
|
|
2019-08-17 22:39:26 +00:00
|
|
|
/// Write symbolized stack trace line by line for better grep-ability.
|
2020-05-23 22:24:01 +00:00
|
|
|
stack_trace.toStringEveryLine([&](const std::string & s) { LOG_FATAL(log, s); });
|
2020-05-29 21:28:55 +00:00
|
|
|
|
2020-07-31 20:16:31 +00:00
|
|
|
/// Write crash to system.crash_log table if available.
|
2020-08-01 15:54:44 +00:00
|
|
|
if (collectCrashLog)
|
|
|
|
collectCrashLog(sig, thread_num, query_id, stack_trace);
|
2020-06-23 21:27:04 +00:00
|
|
|
|
2020-07-31 20:16:31 +00:00
|
|
|
/// Send crash report to developers (if configured)
|
2020-07-09 02:00:48 +00:00
|
|
|
if (sig != SanitizerTrap)
|
2020-07-31 20:16:31 +00:00
|
|
|
SentryWriter::onFault(sig, error_message, stack_trace);
|
2020-06-23 21:18:16 +00:00
|
|
|
|
2020-06-20 11:17:15 +00:00
|
|
|
/// When everything is done, we will try to send these error messages to client.
|
|
|
|
if (thread_ptr)
|
|
|
|
thread_ptr->onFatalError();
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
2016-01-15 03:55:07 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
|
2020-05-12 03:31:53 +00:00
|
|
|
#if defined(SANITIZER)
|
|
|
|
extern "C" void __sanitizer_set_death_callback(void (*)());
|
|
|
|
|
|
|
|
static void sanitizerDeathCallback()
|
|
|
|
{
|
2020-07-09 02:00:48 +00:00
|
|
|
/// Also need to send data via pipe. Otherwise it may lead to deadlocks or failures in printing diagnostic info.
|
2020-05-12 03:31:53 +00:00
|
|
|
|
2020-07-09 02:00:48 +00:00
|
|
|
char buf[signal_pipe_buf_size];
|
|
|
|
DB::WriteBufferFromFileDescriptorDiscardOnFailure out(signal_pipe.fds_rw[1], signal_pipe_buf_size, buf);
|
2020-05-12 03:31:53 +00:00
|
|
|
|
2020-07-09 02:00:48 +00:00
|
|
|
const StackTrace stack_trace;
|
2020-05-12 03:31:53 +00:00
|
|
|
|
2020-07-09 02:00:48 +00:00
|
|
|
StringRef query_id = DB::CurrentThread::getQueryId();
|
|
|
|
query_id.size = std::min(query_id.size, max_query_id_size);
|
2020-05-12 03:31:53 +00:00
|
|
|
|
2020-07-09 02:00:48 +00:00
|
|
|
int sig = SignalListener::SanitizerTrap;
|
|
|
|
DB::writeBinary(sig, out);
|
|
|
|
DB::writePODBinary(stack_trace, out);
|
|
|
|
DB::writeBinary(UInt32(getThreadId()), out);
|
|
|
|
DB::writeStringBinary(query_id, out);
|
|
|
|
DB::writePODBinary(DB::current_thread, out);
|
|
|
|
|
|
|
|
out.next();
|
2020-05-12 03:31:53 +00:00
|
|
|
|
2020-07-09 02:00:48 +00:00
|
|
|
/// The time that is usually enough for separate thread to print info into log.
|
|
|
|
sleepForSeconds(10);
|
2020-05-12 03:31:53 +00:00
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
2018-01-17 18:06:39 +00:00
|
|
|
/** To use with std::set_terminate.
|
|
|
|
* Collects slightly more info than __gnu_cxx::__verbose_terminate_handler,
|
|
|
|
* and send it to pipe. Other thread will read this info from pipe and asynchronously write it to log.
|
|
|
|
* Look at libstdc++-v3/libsupc++/vterminate.cc for example.
|
2016-01-15 03:55:07 +00:00
|
|
|
*/
|
2020-05-09 22:59:34 +00:00
|
|
|
[[noreturn]] static void terminate_handler()
|
2016-01-15 03:55:07 +00:00
|
|
|
{
|
2017-10-19 19:36:37 +00:00
|
|
|
static thread_local bool terminating = false;
|
2017-04-01 07:20:54 +00:00
|
|
|
if (terminating)
|
|
|
|
abort();
|
|
|
|
|
|
|
|
terminating = true;
|
|
|
|
|
2018-08-29 18:35:46 +00:00
|
|
|
std::string log_message;
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2018-08-29 18:35:46 +00:00
|
|
|
if (std::current_exception())
|
|
|
|
log_message = "Terminate called for uncaught exception:\n" + DB::getCurrentExceptionMessage(true);
|
2017-04-01 07:20:54 +00:00
|
|
|
else
|
2018-08-29 18:35:46 +00:00
|
|
|
log_message = "Terminate called without an active exception";
|
2017-04-01 07:20:54 +00:00
|
|
|
|
|
|
|
static const size_t buf_size = 1024;
|
|
|
|
|
|
|
|
if (log_message.size() > buf_size - 16)
|
|
|
|
log_message.resize(buf_size - 16);
|
|
|
|
|
|
|
|
char buf[buf_size];
|
2019-02-09 21:40:10 +00:00
|
|
|
DB::WriteBufferFromFileDescriptor out(signal_pipe.fds_rw[1], buf_size, buf);
|
2017-04-01 07:20:54 +00:00
|
|
|
|
|
|
|
DB::writeBinary(static_cast<int>(SignalListener::StdTerminate), out);
|
2020-02-02 02:35:47 +00:00
|
|
|
DB::writeBinary(UInt32(getThreadId()), out);
|
2017-04-01 07:20:54 +00:00
|
|
|
DB::writeBinary(log_message, out);
|
|
|
|
out.next();
|
2016-01-15 03:55:07 +00:00
|
|
|
|
|
|
|
abort();
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2018-02-14 20:41:46 +00:00
|
|
|
static std::string createDirectory(const std::string & file)
|
2016-01-15 03:55:07 +00:00
|
|
|
{
|
2018-02-14 20:41:46 +00:00
|
|
|
auto path = Poco::Path(file).makeParent();
|
|
|
|
if (path.toString().empty())
|
|
|
|
return "";
|
2018-02-08 19:12:37 +00:00
|
|
|
Poco::File(path).createDirectories();
|
|
|
|
return path.toString();
|
2016-01-15 03:55:07 +00:00
|
|
|
};
|
|
|
|
|
2019-06-14 14:00:37 +00:00
|
|
|
|
2017-02-14 12:11:46 +00:00
|
|
|
static bool tryCreateDirectories(Poco::Logger * logger, const std::string & path)
|
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
try
|
|
|
|
{
|
|
|
|
Poco::File(path).createDirectories();
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
catch (...)
|
|
|
|
{
|
2020-05-23 22:24:01 +00:00
|
|
|
LOG_WARNING(logger, "{}: when creating {}, {}", __PRETTY_FUNCTION__, path, DB::getCurrentExceptionMessage(true));
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
|
|
|
return false;
|
2017-02-14 12:11:46 +00:00
|
|
|
}
|
|
|
|
|
2016-01-15 03:55:07 +00:00
|
|
|
|
2016-02-09 17:06:50 +00:00
|
|
|
void BaseDaemon::reloadConfiguration()
|
2016-01-15 03:55:07 +00:00
|
|
|
{
|
2018-01-17 18:06:39 +00:00
|
|
|
/** If the program is not run in daemon mode and 'config-file' is not specified,
|
|
|
|
* then we use config from 'config.xml' file in current directory,
|
|
|
|
* but will log to console (or use parameters --log-file, --errorlog-file from command line)
|
|
|
|
* instead of using files specified in config.xml.
|
|
|
|
* (It's convenient to log in console when you start server without any command line parameters.)
|
2017-04-01 07:20:54 +00:00
|
|
|
*/
|
|
|
|
config_path = config().getString("config-file", "config.xml");
|
2018-11-27 16:11:46 +00:00
|
|
|
DB::ConfigProcessor config_processor(config_path, false, true);
|
|
|
|
config_processor.setConfigPath(Poco::Path(config_path).makeParent().toString());
|
|
|
|
loaded_config = config_processor.loadConfig(/* allow_zk_includes = */ true);
|
|
|
|
|
2017-06-19 13:31:55 +00:00
|
|
|
if (last_configuration != nullptr)
|
|
|
|
config().removeConfiguration(last_configuration);
|
|
|
|
last_configuration = loaded_config.configuration.duplicate();
|
|
|
|
config().add(last_configuration, PRIO_DEFAULT, false);
|
2016-01-15 03:55:07 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
|
2020-03-26 21:03:02 +00:00
|
|
|
BaseDaemon::BaseDaemon() = default;
|
2020-03-18 00:57:00 +00:00
|
|
|
|
|
|
|
|
|
|
|
BaseDaemon::~BaseDaemon()
|
|
|
|
{
|
|
|
|
writeSignalIDtoSignalPipe(SignalListener::StopThread);
|
|
|
|
signal_listener_thread.join();
|
Reset signal handlers just before closing signal pipe to avoid EBADF after
stack trace:
(gdb) bt
0 0x00007ffff7dda355 in raise () from /usr/lib/libc.so.6
1 0x00007ffff7dc3853 in abort () from /usr/lib/libc.so.6
2 0x0000000013a78180 in abort_message (format=format@entry=0x5781e10 "terminate_handler unexpectedly threw an exception") at abort_message.cpp:76
3 0x0000000013a899ff in std::__terminate (func=<optimized out>) at cxa_handlers.cpp:67
4 0x0000000013a771a1 in __cxxabiv1::call_terminate (native_exception=native_exception@entry=true, unwind_exception=unwind_exception@entry=0x7ffff70e9060) at cxa_personality.cpp:323
5 0x0000000013a77669 in __cxxabiv1::scan_eh_tab (results=..., actions=<optimized out>, native_exception=native_exception@entry=true, unwind_exception=0x7ffff70e9060, context=context@entry=0x7fffffffc3a0) at cxa_personality.cpp:887
6 0x0000000013a77bde in __cxxabiv1::__gxx_personality_v0 (version=<optimized out>, actions=<optimized out>, exceptionClass=<optimized out>, unwind_exception=0x7ffff70e9060, context=0x7fffffffc3a0) at cxa_personality.cpp:969
7 0x0000000013a962d7 in unwind_phase1 (exception_object=0x7ffff70e9060, cursor=0x7fffffffc3a0, uc=0x7fffffffc2f0) at UnwindLevel1.c:98
8 _Unwind_RaiseException (exception_object=exception_object@entry=0x7ffff70e9060) at UnwindLevel1.c:363
9 0x0000000013a8929b in __cxxabiv1::__cxa_rethrow () at cxa_exception.cpp:607
10 0x000000000f170ad2 in DB::WriteBuffer::next (this=0x7fffffffc510) at WriteBuffer.h:52
11 writeSignalIDtoSignalPipe (sig=<optimized out>) at BaseDaemon.cpp:111
12 <signal handler called>
13 0x00007ffff7e9895b in munmap () from /usr/lib/libc.so.6
14 0x00007ffff7f7e255 in free_stacks () from /usr/lib/libpthread.so.0
15 0x00007ffff7f7e6aa in __deallocate_stack () from /usr/lib/libpthread.so.0
16 0x00007ffff7f80898 in __pthread_clockjoin_ex () from /usr/lib/libpthread.so.0
17 0x0000000013a759f7 in std::__1::__libcpp_thread_join (__t=0x7fff0aa2b090) at __threading_support:409
18 std::__1::thread::join (this=this@entry=0x7fff0aa2b090) at thread.cpp:56
19 0x000000000a4c9399 in ThreadPoolImpl<std::__1::thread>::finalize (this=this@entry=0x7ffff7053900) at list:355
20 0x000000000a4c9426 in ThreadPoolImpl<std::__1::thread>::~ThreadPoolImpl (this=0x7ffff7053900, __in_chrg=<optimized out>) at ThreadPool.cpp:172
21 0x000000000a4c8a9c in GlobalThreadPool::~GlobalThreadPool (this=0x7ffff7053900, __in_chrg=<optimized out>) at ThreadPool.h:132
22 std::__1::default_delete<GlobalThreadPool>::operator() (__ptr=0x7ffff7053900, this=<optimized out>) at memory:2363
23 std::__1::unique_ptr<GlobalThreadPool, std::__1::default_delete<GlobalThreadPool> >::reset (__p=0x0, this=<optimized out>) at memory:2618
24 std::__1::unique_ptr<GlobalThreadPool, std::__1::default_delete<GlobalThreadPool> >::~unique_ptr (this=<optimized out>, __in_chrg=<optimized out>) at memory:2572
25 0x00007ffff7ddcc57 in __run_exit_handlers () from /usr/lib/libc.so.6
26 0x00007ffff7ddcdfe in exit () from /usr/lib/libc.so.6
27 0x00007ffff7dc5009 in __libc_start_main () from /usr/lib/libc.so.6
28 0x000000000a48702e in _start () at new:340
2020-08-13 19:51:41 +00:00
|
|
|
/// Reset signals to SIG_DFL to avoid trying to write to the signal_pipe that will be closed after.
|
|
|
|
for (int sig : handled_signals)
|
|
|
|
{
|
|
|
|
signal(sig, SIG_DFL);
|
|
|
|
}
|
2020-03-18 00:57:00 +00:00
|
|
|
signal_pipe.close();
|
|
|
|
}
|
|
|
|
|
2019-02-02 12:26:07 +00:00
|
|
|
|
2016-02-09 17:06:50 +00:00
|
|
|
void BaseDaemon::terminate()
|
2016-01-15 03:55:07 +00:00
|
|
|
{
|
2018-08-20 23:16:50 +00:00
|
|
|
if (::raise(SIGTERM) != 0)
|
2017-04-01 07:20:54 +00:00
|
|
|
throw Poco::SystemException("cannot terminate process");
|
2016-01-15 03:55:07 +00:00
|
|
|
}
|
|
|
|
|
2016-02-09 17:06:50 +00:00
|
|
|
void BaseDaemon::kill()
|
2016-01-15 03:55:07 +00:00
|
|
|
{
|
2019-12-18 10:43:40 +00:00
|
|
|
dumpCoverageReportIfPossible();
|
2020-12-22 02:57:22 +00:00
|
|
|
pid_file.reset();
|
2018-08-20 23:16:50 +00:00
|
|
|
if (::raise(SIGKILL) != 0)
|
|
|
|
throw Poco::SystemException("cannot kill process");
|
2016-01-15 03:55:07 +00:00
|
|
|
}
|
|
|
|
|
2017-02-14 12:12:23 +00:00
|
|
|
std::string BaseDaemon::getDefaultCorePath() const
|
2017-01-09 13:42:29 +00:00
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
return "/opt/cores/";
|
2017-01-09 13:42:29 +00:00
|
|
|
}
|
|
|
|
|
2018-08-12 12:23:22 +00:00
|
|
|
void BaseDaemon::closeFDs()
|
|
|
|
{
|
2020-04-16 12:31:57 +00:00
|
|
|
#if defined(OS_FREEBSD) || defined(OS_DARWIN)
|
2018-08-12 12:23:22 +00:00
|
|
|
Poco::File proc_path{"/dev/fd"};
|
|
|
|
#else
|
|
|
|
Poco::File proc_path{"/proc/self/fd"};
|
|
|
|
#endif
|
|
|
|
if (proc_path.isDirectory()) /// Hooray, proc exists
|
|
|
|
{
|
2019-01-22 14:37:28 +00:00
|
|
|
std::vector<std::string> fds;
|
|
|
|
/// in /proc/self/fd directory filenames are numeric file descriptors
|
|
|
|
proc_path.list(fds);
|
|
|
|
for (const auto & fd_str : fds)
|
2018-08-12 12:23:22 +00:00
|
|
|
{
|
2019-01-22 16:28:05 +00:00
|
|
|
int fd = DB::parse<int>(fd_str);
|
2019-02-09 21:40:10 +00:00
|
|
|
if (fd > 2 && fd != signal_pipe.fds_rw[0] && fd != signal_pipe.fds_rw[1])
|
2018-08-12 12:23:22 +00:00
|
|
|
::close(fd);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2019-01-22 16:28:05 +00:00
|
|
|
int max_fd = -1;
|
2020-04-16 12:31:57 +00:00
|
|
|
#if defined(_SC_OPEN_MAX)
|
2018-08-12 12:23:22 +00:00
|
|
|
max_fd = sysconf(_SC_OPEN_MAX);
|
|
|
|
if (max_fd == -1)
|
|
|
|
#endif
|
|
|
|
max_fd = 256; /// bad fallback
|
2019-01-22 16:28:05 +00:00
|
|
|
for (int fd = 3; fd < max_fd; ++fd)
|
2019-02-09 21:40:10 +00:00
|
|
|
if (fd != signal_pipe.fds_rw[0] && fd != signal_pipe.fds_rw[1])
|
2018-08-12 12:23:22 +00:00
|
|
|
::close(fd);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-07-25 12:49:14 +00:00
|
|
|
namespace
|
|
|
|
{
|
|
|
|
/// In debug version on Linux, increase oom score so that clickhouse is killed
|
|
|
|
/// first, instead of some service. Use a carefully chosen random score of 555:
|
|
|
|
/// the maximum is 1000, and chromium uses 300 for its tab processes. Ignore
|
|
|
|
/// whatever errors that occur, because it's just a debugging aid and we don't
|
|
|
|
/// care if it breaks.
|
2020-04-16 12:31:57 +00:00
|
|
|
#if defined(OS_LINUX) && !defined(NDEBUG)
|
2019-07-25 12:49:14 +00:00
|
|
|
void debugIncreaseOOMScore()
|
|
|
|
{
|
|
|
|
const std::string new_score = "555";
|
2019-07-25 20:17:17 +00:00
|
|
|
try
|
|
|
|
{
|
2019-07-25 12:49:14 +00:00
|
|
|
DB::WriteBufferFromFile buf("/proc/self/oom_score_adj");
|
|
|
|
buf.write(new_score.c_str(), new_score.size());
|
|
|
|
}
|
2019-07-25 20:17:17 +00:00
|
|
|
catch (const Poco::Exception & e)
|
2019-07-25 12:49:14 +00:00
|
|
|
{
|
2020-05-31 13:50:40 +00:00
|
|
|
LOG_WARNING(&Poco::Logger::root(), "Failed to adjust OOM score: '{}'.", e.displayText());
|
2019-07-25 12:49:14 +00:00
|
|
|
return;
|
|
|
|
}
|
2020-05-31 13:50:40 +00:00
|
|
|
LOG_INFO(&Poco::Logger::root(), "Set OOM score adjustment to {}", new_score);
|
2019-07-25 12:49:14 +00:00
|
|
|
}
|
|
|
|
#else
|
|
|
|
void debugIncreaseOOMScore() {}
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
2017-08-18 01:00:13 +00:00
|
|
|
void BaseDaemon::initialize(Application & self)
|
2016-01-15 03:55:07 +00:00
|
|
|
{
|
2018-08-12 12:23:22 +00:00
|
|
|
closeFDs();
|
2020-05-27 19:11:04 +00:00
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
ServerApplication::initialize(self);
|
|
|
|
|
2019-06-14 14:00:37 +00:00
|
|
|
/// now highest priority (lowest value) is PRIO_APPLICATION = -100, we want higher!
|
|
|
|
argsToConfig(argv(), config(), PRIO_APPLICATION - 100);
|
2018-02-08 19:12:37 +00:00
|
|
|
|
2018-05-15 16:22:00 +00:00
|
|
|
bool is_daemon = config().getBool("application.runAsDaemon", false);
|
2017-04-01 07:20:54 +00:00
|
|
|
if (is_daemon)
|
|
|
|
{
|
2018-01-17 18:06:39 +00:00
|
|
|
/** When creating pid file and looking for config, will search for paths relative to the working path of the program when started.
|
2017-04-01 07:20:54 +00:00
|
|
|
*/
|
|
|
|
std::string path = Poco::Path(config().getString("application.path")).setFileName("").toString();
|
|
|
|
if (0 != chdir(path.c_str()))
|
|
|
|
throw Poco::Exception("Cannot change directory to " + path);
|
|
|
|
}
|
|
|
|
|
|
|
|
reloadConfiguration();
|
|
|
|
|
2017-11-21 16:54:25 +00:00
|
|
|
/// This must be done before creation of any files (including logs).
|
2019-01-30 21:29:50 +00:00
|
|
|
mode_t umask_num = 0027;
|
2017-11-21 16:54:25 +00:00
|
|
|
if (config().has("umask"))
|
|
|
|
{
|
|
|
|
std::string umask_str = config().getString("umask");
|
|
|
|
std::stringstream stream;
|
|
|
|
stream << umask_str;
|
|
|
|
stream >> std::oct >> umask_num;
|
|
|
|
}
|
2019-01-30 21:29:50 +00:00
|
|
|
umask(umask_num);
|
2017-11-21 16:54:25 +00:00
|
|
|
|
2018-11-27 16:11:46 +00:00
|
|
|
DB::ConfigProcessor(config_path).savePreprocessedConfig(loaded_config, "");
|
2017-11-21 16:54:25 +00:00
|
|
|
|
2018-01-17 18:06:39 +00:00
|
|
|
/// Write core dump on crash.
|
2017-04-01 07:20:54 +00:00
|
|
|
{
|
|
|
|
struct rlimit rlim;
|
|
|
|
if (getrlimit(RLIMIT_CORE, &rlim))
|
|
|
|
throw Poco::Exception("Cannot getrlimit");
|
2018-01-17 18:06:39 +00:00
|
|
|
/// 1 GiB by default. If more - it writes to disk too long.
|
2017-04-01 07:20:54 +00:00
|
|
|
rlim.rlim_cur = config().getUInt64("core_dump.size_limit", 1024 * 1024 * 1024);
|
|
|
|
|
2019-02-21 18:51:43 +00:00
|
|
|
if (rlim.rlim_cur && setrlimit(RLIMIT_CORE, &rlim))
|
2017-04-01 07:20:54 +00:00
|
|
|
{
|
2018-01-17 18:06:39 +00:00
|
|
|
/// It doesn't work under address/thread sanitizer. http://lists.llvm.org/pipermail/llvm-bugs/2013-April/027880.html
|
2019-02-21 18:51:43 +00:00
|
|
|
std::cerr << "Cannot set max size of core file to " + std::to_string(rlim.rlim_cur) << std::endl;
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// This must be done before any usage of DateLUT. In particular, before any logging.
|
|
|
|
if (config().has("timezone"))
|
|
|
|
{
|
2020-05-09 22:59:34 +00:00
|
|
|
const std::string config_timezone = config().getString("timezone");
|
|
|
|
if (0 != setenv("TZ", config_timezone.data(), 1))
|
2017-04-01 07:20:54 +00:00
|
|
|
throw Poco::Exception("Cannot setenv TZ variable");
|
|
|
|
|
|
|
|
tzset();
|
2020-05-09 22:59:34 +00:00
|
|
|
DateLUT::setDefaultTimezone(config_timezone);
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
std::string log_path = config().getString("logger.log", "");
|
|
|
|
if (!log_path.empty())
|
|
|
|
log_path = Poco::Path(log_path).setFileName("").toString();
|
|
|
|
|
2018-05-15 17:05:13 +00:00
|
|
|
/** Redirect stdout, stderr to separate files in the log directory (or in the specified file).
|
|
|
|
* Some libraries write to stderr in case of errors in debug mode,
|
|
|
|
* and this output makes sense even if the program is run in daemon mode.
|
|
|
|
* We have to do it before buildLoggers, for errors on logger initialization will be written to these files.
|
|
|
|
* If logger.stderr is specified then stderr will be forcibly redirected to that file.
|
|
|
|
*/
|
2018-05-15 18:10:50 +00:00
|
|
|
if ((!log_path.empty() && is_daemon) || config().has("logger.stderr"))
|
2017-04-01 07:20:54 +00:00
|
|
|
{
|
2018-08-29 18:48:14 +00:00
|
|
|
std::string stderr_path = config().getString("logger.stderr", log_path + "/stderr.log");
|
2018-05-15 17:05:13 +00:00
|
|
|
if (!freopen(stderr_path.c_str(), "a+", stderr))
|
|
|
|
throw Poco::OpenFileException("Cannot attach stderr to " + stderr_path);
|
2020-05-04 14:57:09 +00:00
|
|
|
|
|
|
|
/// Disable buffering for stderr
|
|
|
|
setbuf(stderr, nullptr);
|
2018-05-15 17:05:13 +00:00
|
|
|
}
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2018-05-15 18:10:50 +00:00
|
|
|
if ((!log_path.empty() && is_daemon) || config().has("logger.stdout"))
|
2018-05-15 17:05:13 +00:00
|
|
|
{
|
2018-08-29 18:48:14 +00:00
|
|
|
std::string stdout_path = config().getString("logger.stdout", log_path + "/stdout.log");
|
2018-05-15 17:05:13 +00:00
|
|
|
if (!freopen(stdout_path.c_str(), "a+", stdout))
|
|
|
|
throw Poco::OpenFileException("Cannot attach stdout to " + stdout_path);
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
|
|
|
|
2018-02-28 20:34:25 +00:00
|
|
|
/// Change path for logging.
|
2018-04-19 18:19:12 +00:00
|
|
|
if (!log_path.empty())
|
2018-02-28 20:34:25 +00:00
|
|
|
{
|
2018-04-19 18:19:12 +00:00
|
|
|
std::string path = createDirectory(log_path);
|
2018-02-28 20:34:25 +00:00
|
|
|
if (is_daemon
|
|
|
|
&& chdir(path.c_str()) != 0)
|
|
|
|
throw Poco::Exception("Cannot change directory to " + path);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
if (is_daemon
|
|
|
|
&& chdir("/tmp") != 0)
|
|
|
|
throw Poco::Exception("Cannot change directory to /tmp");
|
|
|
|
}
|
|
|
|
|
2020-12-22 02:57:22 +00:00
|
|
|
/// sensitive data masking rules are not used here
|
2019-12-29 13:08:33 +00:00
|
|
|
buildLoggers(config(), logger(), self.commandName());
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-12-22 02:57:22 +00:00
|
|
|
/// After initialized loggers but before initialized signal handling.
|
|
|
|
if (should_setup_watchdog)
|
|
|
|
setupWatchdog();
|
|
|
|
|
|
|
|
/// Create pid file.
|
|
|
|
if (config().has("pid"))
|
|
|
|
pid_file.emplace(config().getString("pid"), DB::StatusFile::write_pid);
|
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
if (is_daemon)
|
|
|
|
{
|
2018-01-17 18:06:39 +00:00
|
|
|
/** Change working directory to the directory to write core dumps.
|
|
|
|
* We have to do it after buildLoggers, because there is the case when config files was in current directory.
|
2017-04-01 07:20:54 +00:00
|
|
|
*/
|
|
|
|
|
|
|
|
std::string core_path = config().getString("core_path", "");
|
|
|
|
if (core_path.empty())
|
|
|
|
core_path = getDefaultCorePath();
|
|
|
|
|
|
|
|
tryCreateDirectories(&logger(), core_path);
|
|
|
|
|
|
|
|
Poco::File cores = core_path;
|
|
|
|
if (!(cores.exists() && cores.isDirectory()))
|
|
|
|
{
|
|
|
|
core_path = !log_path.empty() ? log_path : "/opt/";
|
|
|
|
tryCreateDirectories(&logger(), core_path);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (0 != chdir(core_path.c_str()))
|
|
|
|
throw Poco::Exception("Cannot change directory to " + core_path);
|
|
|
|
}
|
|
|
|
|
2018-08-07 17:57:44 +00:00
|
|
|
initializeTerminationAndSignalProcessing();
|
|
|
|
logRevision();
|
2019-07-25 12:49:14 +00:00
|
|
|
debugIncreaseOOMScore();
|
2018-08-07 17:57:44 +00:00
|
|
|
|
|
|
|
for (const auto & key : DB::getMultipleKeysFromConfig(config(), "", "graphite"))
|
|
|
|
{
|
|
|
|
graphite_writers.emplace(key, std::make_unique<GraphiteWriter>(key));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2020-12-22 02:57:22 +00:00
|
|
|
static void addSignalHandler(const std::vector<int> & signals, signal_function handler, std::vector<int> * out_handled_signals)
|
2018-08-07 17:57:44 +00:00
|
|
|
{
|
2020-12-22 02:57:22 +00:00
|
|
|
struct sigaction sa;
|
|
|
|
memset(&sa, 0, sizeof(sa));
|
|
|
|
sa.sa_sigaction = handler;
|
|
|
|
sa.sa_flags = SA_SIGINFO;
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-05-10 22:17:28 +00:00
|
|
|
#if defined(OS_DARWIN)
|
2020-12-22 02:57:22 +00:00
|
|
|
sigemptyset(&sa.sa_mask);
|
|
|
|
for (auto signal : signals)
|
|
|
|
sigaddset(&sa.sa_mask, signal);
|
2020-05-10 22:17:28 +00:00
|
|
|
#else
|
2020-12-22 02:57:22 +00:00
|
|
|
if (sigemptyset(&sa.sa_mask))
|
|
|
|
throw Poco::Exception("Cannot set signal handler.");
|
2017-10-13 18:58:19 +00:00
|
|
|
|
2020-12-22 02:57:22 +00:00
|
|
|
for (auto signal : signals)
|
|
|
|
if (sigaddset(&sa.sa_mask, signal))
|
|
|
|
throw Poco::Exception("Cannot set signal handler.");
|
2020-05-10 22:17:28 +00:00
|
|
|
#endif
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-12-22 02:57:22 +00:00
|
|
|
for (auto signal : signals)
|
|
|
|
if (sigaction(signal, &sa, nullptr))
|
|
|
|
throw Poco::Exception("Cannot set signal handler.");
|
Reset signal handlers just before closing signal pipe to avoid EBADF after
stack trace:
(gdb) bt
0 0x00007ffff7dda355 in raise () from /usr/lib/libc.so.6
1 0x00007ffff7dc3853 in abort () from /usr/lib/libc.so.6
2 0x0000000013a78180 in abort_message (format=format@entry=0x5781e10 "terminate_handler unexpectedly threw an exception") at abort_message.cpp:76
3 0x0000000013a899ff in std::__terminate (func=<optimized out>) at cxa_handlers.cpp:67
4 0x0000000013a771a1 in __cxxabiv1::call_terminate (native_exception=native_exception@entry=true, unwind_exception=unwind_exception@entry=0x7ffff70e9060) at cxa_personality.cpp:323
5 0x0000000013a77669 in __cxxabiv1::scan_eh_tab (results=..., actions=<optimized out>, native_exception=native_exception@entry=true, unwind_exception=0x7ffff70e9060, context=context@entry=0x7fffffffc3a0) at cxa_personality.cpp:887
6 0x0000000013a77bde in __cxxabiv1::__gxx_personality_v0 (version=<optimized out>, actions=<optimized out>, exceptionClass=<optimized out>, unwind_exception=0x7ffff70e9060, context=0x7fffffffc3a0) at cxa_personality.cpp:969
7 0x0000000013a962d7 in unwind_phase1 (exception_object=0x7ffff70e9060, cursor=0x7fffffffc3a0, uc=0x7fffffffc2f0) at UnwindLevel1.c:98
8 _Unwind_RaiseException (exception_object=exception_object@entry=0x7ffff70e9060) at UnwindLevel1.c:363
9 0x0000000013a8929b in __cxxabiv1::__cxa_rethrow () at cxa_exception.cpp:607
10 0x000000000f170ad2 in DB::WriteBuffer::next (this=0x7fffffffc510) at WriteBuffer.h:52
11 writeSignalIDtoSignalPipe (sig=<optimized out>) at BaseDaemon.cpp:111
12 <signal handler called>
13 0x00007ffff7e9895b in munmap () from /usr/lib/libc.so.6
14 0x00007ffff7f7e255 in free_stacks () from /usr/lib/libpthread.so.0
15 0x00007ffff7f7e6aa in __deallocate_stack () from /usr/lib/libpthread.so.0
16 0x00007ffff7f80898 in __pthread_clockjoin_ex () from /usr/lib/libpthread.so.0
17 0x0000000013a759f7 in std::__1::__libcpp_thread_join (__t=0x7fff0aa2b090) at __threading_support:409
18 std::__1::thread::join (this=this@entry=0x7fff0aa2b090) at thread.cpp:56
19 0x000000000a4c9399 in ThreadPoolImpl<std::__1::thread>::finalize (this=this@entry=0x7ffff7053900) at list:355
20 0x000000000a4c9426 in ThreadPoolImpl<std::__1::thread>::~ThreadPoolImpl (this=0x7ffff7053900, __in_chrg=<optimized out>) at ThreadPool.cpp:172
21 0x000000000a4c8a9c in GlobalThreadPool::~GlobalThreadPool (this=0x7ffff7053900, __in_chrg=<optimized out>) at ThreadPool.h:132
22 std::__1::default_delete<GlobalThreadPool>::operator() (__ptr=0x7ffff7053900, this=<optimized out>) at memory:2363
23 std::__1::unique_ptr<GlobalThreadPool, std::__1::default_delete<GlobalThreadPool> >::reset (__p=0x0, this=<optimized out>) at memory:2618
24 std::__1::unique_ptr<GlobalThreadPool, std::__1::default_delete<GlobalThreadPool> >::~unique_ptr (this=<optimized out>, __in_chrg=<optimized out>) at memory:2572
25 0x00007ffff7ddcc57 in __run_exit_handlers () from /usr/lib/libc.so.6
26 0x00007ffff7ddcdfe in exit () from /usr/lib/libc.so.6
27 0x00007ffff7dc5009 in __libc_start_main () from /usr/lib/libc.so.6
28 0x000000000a48702e in _start () at new:340
2020-08-13 19:51:41 +00:00
|
|
|
|
2020-12-22 02:57:22 +00:00
|
|
|
if (out_handled_signals)
|
|
|
|
std::copy(signals.begin(), signals.end(), std::back_inserter(*out_handled_signals));
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
|
|
static void blockSignals(const std::vector<int> & signals)
|
|
|
|
{
|
|
|
|
sigset_t sig_set;
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-05-10 22:17:28 +00:00
|
|
|
#if defined(OS_DARWIN)
|
2020-12-22 17:13:18 +00:00
|
|
|
sigemptyset(&sig_set);
|
|
|
|
for (auto signal : signals)
|
|
|
|
sigaddset(&sig_set, signal);
|
2020-05-10 22:17:28 +00:00
|
|
|
#else
|
2020-12-22 02:57:22 +00:00
|
|
|
if (sigemptyset(&sig_set))
|
|
|
|
throw Poco::Exception("Cannot block signal.");
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-12-22 02:57:22 +00:00
|
|
|
for (auto signal : signals)
|
|
|
|
if (sigaddset(&sig_set, signal))
|
|
|
|
throw Poco::Exception("Cannot block signal.");
|
2020-05-10 22:17:28 +00:00
|
|
|
#endif
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-12-22 02:57:22 +00:00
|
|
|
if (pthread_sigmask(SIG_BLOCK, &sig_set, nullptr))
|
|
|
|
throw Poco::Exception("Cannot block signal.");
|
|
|
|
};
|
|
|
|
|
Reset signal handlers just before closing signal pipe to avoid EBADF after
stack trace:
(gdb) bt
0 0x00007ffff7dda355 in raise () from /usr/lib/libc.so.6
1 0x00007ffff7dc3853 in abort () from /usr/lib/libc.so.6
2 0x0000000013a78180 in abort_message (format=format@entry=0x5781e10 "terminate_handler unexpectedly threw an exception") at abort_message.cpp:76
3 0x0000000013a899ff in std::__terminate (func=<optimized out>) at cxa_handlers.cpp:67
4 0x0000000013a771a1 in __cxxabiv1::call_terminate (native_exception=native_exception@entry=true, unwind_exception=unwind_exception@entry=0x7ffff70e9060) at cxa_personality.cpp:323
5 0x0000000013a77669 in __cxxabiv1::scan_eh_tab (results=..., actions=<optimized out>, native_exception=native_exception@entry=true, unwind_exception=0x7ffff70e9060, context=context@entry=0x7fffffffc3a0) at cxa_personality.cpp:887
6 0x0000000013a77bde in __cxxabiv1::__gxx_personality_v0 (version=<optimized out>, actions=<optimized out>, exceptionClass=<optimized out>, unwind_exception=0x7ffff70e9060, context=0x7fffffffc3a0) at cxa_personality.cpp:969
7 0x0000000013a962d7 in unwind_phase1 (exception_object=0x7ffff70e9060, cursor=0x7fffffffc3a0, uc=0x7fffffffc2f0) at UnwindLevel1.c:98
8 _Unwind_RaiseException (exception_object=exception_object@entry=0x7ffff70e9060) at UnwindLevel1.c:363
9 0x0000000013a8929b in __cxxabiv1::__cxa_rethrow () at cxa_exception.cpp:607
10 0x000000000f170ad2 in DB::WriteBuffer::next (this=0x7fffffffc510) at WriteBuffer.h:52
11 writeSignalIDtoSignalPipe (sig=<optimized out>) at BaseDaemon.cpp:111
12 <signal handler called>
13 0x00007ffff7e9895b in munmap () from /usr/lib/libc.so.6
14 0x00007ffff7f7e255 in free_stacks () from /usr/lib/libpthread.so.0
15 0x00007ffff7f7e6aa in __deallocate_stack () from /usr/lib/libpthread.so.0
16 0x00007ffff7f80898 in __pthread_clockjoin_ex () from /usr/lib/libpthread.so.0
17 0x0000000013a759f7 in std::__1::__libcpp_thread_join (__t=0x7fff0aa2b090) at __threading_support:409
18 std::__1::thread::join (this=this@entry=0x7fff0aa2b090) at thread.cpp:56
19 0x000000000a4c9399 in ThreadPoolImpl<std::__1::thread>::finalize (this=this@entry=0x7ffff7053900) at list:355
20 0x000000000a4c9426 in ThreadPoolImpl<std::__1::thread>::~ThreadPoolImpl (this=0x7ffff7053900, __in_chrg=<optimized out>) at ThreadPool.cpp:172
21 0x000000000a4c8a9c in GlobalThreadPool::~GlobalThreadPool (this=0x7ffff7053900, __in_chrg=<optimized out>) at ThreadPool.h:132
22 std::__1::default_delete<GlobalThreadPool>::operator() (__ptr=0x7ffff7053900, this=<optimized out>) at memory:2363
23 std::__1::unique_ptr<GlobalThreadPool, std::__1::default_delete<GlobalThreadPool> >::reset (__p=0x0, this=<optimized out>) at memory:2618
24 std::__1::unique_ptr<GlobalThreadPool, std::__1::default_delete<GlobalThreadPool> >::~unique_ptr (this=<optimized out>, __in_chrg=<optimized out>) at memory:2572
25 0x00007ffff7ddcc57 in __run_exit_handlers () from /usr/lib/libc.so.6
26 0x00007ffff7ddcdfe in exit () from /usr/lib/libc.so.6
27 0x00007ffff7dc5009 in __libc_start_main () from /usr/lib/libc.so.6
28 0x000000000a48702e in _start () at new:340
2020-08-13 19:51:41 +00:00
|
|
|
|
2020-12-22 02:57:22 +00:00
|
|
|
void BaseDaemon::initializeTerminationAndSignalProcessing()
|
|
|
|
{
|
|
|
|
SentryWriter::initialize(config());
|
|
|
|
std::set_terminate(terminate_handler);
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-12-22 02:57:22 +00:00
|
|
|
/// We want to avoid SIGPIPE when working with sockets and pipes, and just handle return value/errno instead.
|
|
|
|
blockSignals({SIGPIPE});
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-12-22 02:57:22 +00:00
|
|
|
/// Setup signal handlers.
|
2019-12-02 17:29:19 +00:00
|
|
|
/// SIGTSTP is added for debugging purposes. To output a stack trace of any running thread at anytime.
|
2019-08-17 21:13:38 +00:00
|
|
|
|
2020-12-22 02:57:22 +00:00
|
|
|
addSignalHandler({SIGABRT, SIGSEGV, SIGILL, SIGBUS, SIGSYS, SIGFPE, SIGPIPE, SIGTSTP}, signalHandler, &handled_signals);
|
|
|
|
addSignalHandler({SIGHUP, SIGUSR1}, closeLogsSignalHandler, &handled_signals);
|
|
|
|
addSignalHandler({SIGINT, SIGQUIT, SIGTERM}, terminateRequestedSignalHandler, &handled_signals);
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-05-12 03:31:53 +00:00
|
|
|
#if defined(SANITIZER)
|
|
|
|
__sanitizer_set_death_callback(sanitizerDeathCallback);
|
|
|
|
#endif
|
|
|
|
|
2018-01-17 18:06:39 +00:00
|
|
|
/// Set up Poco ErrorHandler for Poco Threads.
|
2017-04-01 07:20:54 +00:00
|
|
|
static KillingErrorHandler killing_error_handler;
|
|
|
|
Poco::ErrorHandler::set(&killing_error_handler);
|
|
|
|
|
2020-11-27 10:12:11 +00:00
|
|
|
signal_pipe.setNonBlockingWrite();
|
2019-12-22 17:20:33 +00:00
|
|
|
signal_pipe.tryIncreaseSize(1 << 20);
|
|
|
|
|
2020-03-08 21:04:10 +00:00
|
|
|
signal_listener = std::make_unique<SignalListener>(*this);
|
2017-04-01 07:20:54 +00:00
|
|
|
signal_listener_thread.start(*signal_listener);
|
2020-06-20 09:07:05 +00:00
|
|
|
|
2020-06-20 09:17:31 +00:00
|
|
|
#if defined(__ELF__) && !defined(__FreeBSD__)
|
2020-11-30 14:30:55 +00:00
|
|
|
String build_id_hex = DB::SymbolIndex::instance()->getBuildIDHex();
|
2020-06-20 09:07:05 +00:00
|
|
|
if (build_id_hex.empty())
|
|
|
|
build_id_info = "no build id";
|
|
|
|
else
|
|
|
|
build_id_info = "build id: " + build_id_hex;
|
2020-06-20 09:17:31 +00:00
|
|
|
#else
|
|
|
|
build_id_info = "no build id";
|
|
|
|
#endif
|
2016-01-15 03:55:07 +00:00
|
|
|
}
|
|
|
|
|
2016-02-10 07:54:22 +00:00
|
|
|
void BaseDaemon::logRevision() const
|
2016-02-09 17:06:50 +00:00
|
|
|
{
|
2020-05-30 21:57:37 +00:00
|
|
|
Poco::Logger::root().information("Starting " + std::string{VERSION_FULL}
|
2020-09-17 12:15:05 +00:00
|
|
|
+ " with revision " + std::to_string(ClickHouseRevision::getVersionRevision())
|
2020-06-20 09:13:11 +00:00
|
|
|
+ ", " + build_id_info
|
2019-09-26 12:08:24 +00:00
|
|
|
+ ", PID " + std::to_string(getpid()));
|
2016-02-09 17:06:50 +00:00
|
|
|
}
|
2016-01-15 03:55:07 +00:00
|
|
|
|
2020-05-09 23:22:51 +00:00
|
|
|
void BaseDaemon::defineOptions(Poco::Util::OptionSet & new_options)
|
2016-01-15 03:55:07 +00:00
|
|
|
{
|
2020-05-09 23:22:51 +00:00
|
|
|
new_options.addOption(
|
2018-01-17 16:39:56 +00:00
|
|
|
Poco::Util::Option("config-file", "C", "load configuration from a given file")
|
|
|
|
.required(false)
|
|
|
|
.repeatable(false)
|
|
|
|
.argument("<file>")
|
|
|
|
.binding("config-file"));
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-05-09 23:22:51 +00:00
|
|
|
new_options.addOption(
|
2018-01-17 16:39:56 +00:00
|
|
|
Poco::Util::Option("log-file", "L", "use given log file")
|
|
|
|
.required(false)
|
|
|
|
.repeatable(false)
|
|
|
|
.argument("<file>")
|
|
|
|
.binding("logger.log"));
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-05-09 23:22:51 +00:00
|
|
|
new_options.addOption(
|
2018-01-17 16:39:56 +00:00
|
|
|
Poco::Util::Option("errorlog-file", "E", "use given log file for errors only")
|
|
|
|
.required(false)
|
|
|
|
.repeatable(false)
|
|
|
|
.argument("<file>")
|
|
|
|
.binding("logger.errorlog"));
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2020-05-09 23:22:51 +00:00
|
|
|
new_options.addOption(
|
2018-01-17 16:39:56 +00:00
|
|
|
Poco::Util::Option("pid-file", "P", "use given pidfile")
|
|
|
|
.required(false)
|
|
|
|
.repeatable(false)
|
|
|
|
.argument("<file>")
|
|
|
|
.binding("pid"));
|
2020-05-09 23:22:51 +00:00
|
|
|
|
|
|
|
Poco::Util::ServerApplication::defineOptions(new_options);
|
2016-01-15 03:55:07 +00:00
|
|
|
}
|
|
|
|
|
2016-06-08 14:39:19 +00:00
|
|
|
void BaseDaemon::handleSignal(int signal_id)
|
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
if (signal_id == SIGINT ||
|
|
|
|
signal_id == SIGQUIT ||
|
|
|
|
signal_id == SIGTERM)
|
|
|
|
{
|
|
|
|
std::unique_lock<std::mutex> lock(signal_handler_mutex);
|
|
|
|
{
|
|
|
|
++terminate_signals_counter;
|
|
|
|
sigint_signals_counter += signal_id == SIGINT;
|
|
|
|
signal_event.notify_all();
|
|
|
|
}
|
|
|
|
|
|
|
|
onInterruptSignals(signal_id);
|
|
|
|
}
|
|
|
|
else
|
2020-07-31 14:53:41 +00:00
|
|
|
throw DB::Exception(std::string("Unsupported signal: ") + msan_strsignal(signal_id), 0);
|
2016-06-08 14:39:19 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void BaseDaemon::onInterruptSignals(int signal_id)
|
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
is_cancelled = true;
|
2020-07-31 14:53:41 +00:00
|
|
|
LOG_INFO(&logger(), "Received termination signal ({})", msan_strsignal(signal_id));
|
2017-04-01 07:20:54 +00:00
|
|
|
|
|
|
|
if (sigint_signals_counter >= 2)
|
|
|
|
{
|
2020-05-23 22:24:01 +00:00
|
|
|
LOG_INFO(&logger(), "Received second signal Interrupt. Immediately terminate.");
|
2020-12-22 02:57:22 +00:00
|
|
|
call_default_signal_handler(signal_id);
|
|
|
|
/// If the above did not help.
|
|
|
|
_exit(128 + signal_id);
|
2017-04-01 07:20:54 +00:00
|
|
|
}
|
2016-06-08 14:39:19 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
void BaseDaemon::waitForTerminationRequest()
|
|
|
|
{
|
2020-12-22 17:10:10 +00:00
|
|
|
/// NOTE: as we already process signals via pipe, we don't have to block them with sigprocmask in threads
|
2017-04-01 07:20:54 +00:00
|
|
|
std::unique_lock<std::mutex> lock(signal_handler_mutex);
|
|
|
|
signal_event.wait(lock, [this](){ return terminate_signals_counter > 0; });
|
2016-06-08 14:39:19 +00:00
|
|
|
}
|
2020-12-22 02:57:22 +00:00
|
|
|
|
|
|
|
|
|
|
|
void BaseDaemon::shouldSetupWatchdog(char * argv0_)
|
|
|
|
{
|
|
|
|
should_setup_watchdog = true;
|
|
|
|
argv0 = argv0_;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
void BaseDaemon::setupWatchdog()
|
|
|
|
{
|
2020-12-22 07:38:39 +00:00
|
|
|
/// Initialize in advance to avoid double initialization in forked processes.
|
|
|
|
DateLUT::instance();
|
|
|
|
|
2020-12-22 02:57:22 +00:00
|
|
|
std::string original_process_name;
|
|
|
|
if (argv0)
|
|
|
|
original_process_name = argv0;
|
|
|
|
|
|
|
|
while (true)
|
|
|
|
{
|
2020-12-22 03:17:31 +00:00
|
|
|
static pid_t pid = -1;
|
|
|
|
pid = fork();
|
2020-12-22 02:57:22 +00:00
|
|
|
|
|
|
|
if (-1 == pid)
|
|
|
|
throw Poco::Exception("Cannot fork");
|
|
|
|
|
|
|
|
if (0 == pid)
|
|
|
|
{
|
|
|
|
logger().information("Forked a child process to watch");
|
2020-12-22 03:17:31 +00:00
|
|
|
#if defined(__linux__)
|
|
|
|
if (0 != prctl(PR_SET_PDEATHSIG, SIGKILL))
|
|
|
|
logger().warning("Cannot do prctl to ask termination with parent.");
|
|
|
|
#endif
|
2020-12-22 02:57:22 +00:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Change short thread name and process name.
|
|
|
|
setThreadName("clckhouse-watch"); /// 15 characters
|
|
|
|
|
|
|
|
if (argv0)
|
|
|
|
{
|
|
|
|
const char * new_process_name = "clickhouse-watchdog";
|
|
|
|
memset(argv0, 0, original_process_name.size());
|
|
|
|
memcpy(argv0, new_process_name, std::min(strlen(new_process_name), original_process_name.size()));
|
|
|
|
}
|
|
|
|
|
|
|
|
logger().information(fmt::format("Will watch for the process with pid {}", pid));
|
|
|
|
|
2020-12-22 03:17:31 +00:00
|
|
|
/// Forward signals to the child process.
|
2020-12-22 02:57:22 +00:00
|
|
|
addSignalHandler(
|
|
|
|
{SIGHUP, SIGUSR1, SIGINT, SIGQUIT, SIGTERM},
|
2020-12-22 03:17:31 +00:00
|
|
|
[](int sig, siginfo_t *, void *)
|
|
|
|
{
|
2020-12-22 06:45:08 +00:00
|
|
|
/// Forward all signals except INT as it can be send by terminal to the process group when user press Ctrl+C,
|
|
|
|
/// and we process double delivery of this signal as immediate termination.
|
2020-12-22 03:17:31 +00:00
|
|
|
if (sig == SIGINT)
|
|
|
|
return;
|
|
|
|
|
|
|
|
const char * error_message = "Cannot forward signal to the child process.\n";
|
|
|
|
if (0 != ::kill(pid, sig))
|
2020-12-22 06:45:08 +00:00
|
|
|
{
|
|
|
|
auto res = write(STDERR_FILENO, error_message, strlen(error_message));
|
|
|
|
(void)res;
|
|
|
|
}
|
2020-12-22 03:17:31 +00:00
|
|
|
},
|
|
|
|
nullptr);
|
2020-12-22 02:57:22 +00:00
|
|
|
|
|
|
|
int status = 0;
|
|
|
|
do
|
|
|
|
{
|
|
|
|
if (-1 != waitpid(pid, &status, WUNTRACED | WCONTINUED) || errno == ECHILD)
|
|
|
|
{
|
|
|
|
if (WIFSTOPPED(status))
|
|
|
|
logger().warning(fmt::format("Child process was stopped by signal {}.", WSTOPSIG(status)));
|
|
|
|
else if (WIFCONTINUED(status))
|
|
|
|
logger().warning(fmt::format("Child process was continued."));
|
|
|
|
else
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
else if (errno != EINTR)
|
|
|
|
throw Poco::Exception("Cannot waitpid, errno: " + std::string(strerror(errno)));
|
|
|
|
} while (true);
|
|
|
|
|
|
|
|
if (errno == ECHILD)
|
|
|
|
{
|
|
|
|
logger().information("Child process no longer exists.");
|
|
|
|
_exit(status);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (WIFEXITED(status))
|
|
|
|
{
|
|
|
|
logger().information(fmt::format("Child process exited normally with code {}.", WEXITSTATUS(status)));
|
2020-12-29 17:36:10 +00:00
|
|
|
_exit(WEXITSTATUS(status));
|
2020-12-22 02:57:22 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
if (WIFSIGNALED(status))
|
|
|
|
{
|
|
|
|
int sig = WTERMSIG(status);
|
|
|
|
|
|
|
|
if (sig == SIGKILL)
|
|
|
|
{
|
|
|
|
logger().fatal(fmt::format("Child process was terminated by signal {} (KILL)."
|
|
|
|
" If it is not done by 'forcestop' command or manually,"
|
|
|
|
" the possible cause is OOM Killer (see 'dmesg' and look at the '/var/log/kern.log' for the details).", sig));
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
logger().fatal(fmt::format("Child process was terminated by signal {}.", sig));
|
|
|
|
|
|
|
|
if (sig == SIGINT || sig == SIGTERM || sig == SIGQUIT)
|
2020-12-29 17:36:10 +00:00
|
|
|
_exit(128 + sig);
|
2020-12-22 02:57:22 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
logger().fatal("Child process was not exited normally by unknown reason.");
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Automatic restart is not enabled but you can play with it.
|
|
|
|
#if 1
|
|
|
|
_exit(status);
|
|
|
|
#else
|
|
|
|
logger().information("Will restart.");
|
|
|
|
if (argv0)
|
|
|
|
memcpy(argv0, original_process_name.c_str(), original_process_name.size());
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
}
|