Kazu Hirata ea88634764
[Support] Remove an unnecessary cast (NFC) (#146810)
We don't need to cast std::string to std::string.
2025-07-03 12:02:26 -07:00

358 lines
14 KiB
C++

//===- Signals.cpp - Signal Handling support --------------------*- C++ -*-===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This file defines some helpful functions for dealing with the possibility of
// Unix signals occurring while your program is running.
//
//===----------------------------------------------------------------------===//
#include "llvm/Support/Signals.h"
#include "DebugOptions.h"
#include "llvm/ADT/StringRef.h"
#include "llvm/Config/llvm-config.h"
#include "llvm/Support/CommandLine.h"
#include "llvm/Support/ErrorOr.h"
#include "llvm/Support/FileSystem.h"
#include "llvm/Support/FileUtilities.h"
#include "llvm/Support/Format.h"
#include "llvm/Support/FormatVariadic.h"
#include "llvm/Support/ManagedStatic.h"
#include "llvm/Support/MemoryBuffer.h"
#include "llvm/Support/Path.h"
#include "llvm/Support/Program.h"
#include "llvm/Support/StringSaver.h"
#include "llvm/Support/raw_ostream.h"
#include <array>
#include <cmath>
//===----------------------------------------------------------------------===//
//=== WARNING: Implementation here must contain only TRULY operating system
//=== independent code.
//===----------------------------------------------------------------------===//
using namespace llvm;
// Use explicit storage to avoid accessing cl::opt in a signal handler.
static bool DisableSymbolicationFlag = false;
static ManagedStatic<std::string> CrashDiagnosticsDirectory;
namespace {
struct CreateDisableSymbolication {
static void *call() {
return new cl::opt<bool, true>(
"disable-symbolication",
cl::desc("Disable symbolizing crash backtraces."),
cl::location(DisableSymbolicationFlag), cl::Hidden);
}
};
struct CreateCrashDiagnosticsDir {
static void *call() {
return new cl::opt<std::string, true>(
"crash-diagnostics-dir", cl::value_desc("directory"),
cl::desc("Directory for crash diagnostic files."),
cl::location(*CrashDiagnosticsDirectory), cl::Hidden);
}
};
} // namespace
void llvm::initSignalsOptions() {
static ManagedStatic<cl::opt<bool, true>, CreateDisableSymbolication>
DisableSymbolication;
static ManagedStatic<cl::opt<std::string, true>, CreateCrashDiagnosticsDir>
CrashDiagnosticsDir;
*DisableSymbolication;
*CrashDiagnosticsDir;
}
constexpr char DisableSymbolizationEnv[] = "LLVM_DISABLE_SYMBOLIZATION";
constexpr char LLVMSymbolizerPathEnv[] = "LLVM_SYMBOLIZER_PATH";
constexpr char EnableSymbolizerMarkupEnv[] = "LLVM_ENABLE_SYMBOLIZER_MARKUP";
// Callbacks to run in signal handler must be lock-free because a signal handler
// could be running as we add new callbacks. We don't add unbounded numbers of
// callbacks, an array is therefore sufficient.
struct CallbackAndCookie {
sys::SignalHandlerCallback Callback;
void *Cookie;
enum class Status { Empty, Initializing, Initialized, Executing };
std::atomic<Status> Flag;
};
static constexpr size_t MaxSignalHandlerCallbacks = 8;
// A global array of CallbackAndCookie may not compile with
// -Werror=global-constructors in c++20 and above
static std::array<CallbackAndCookie, MaxSignalHandlerCallbacks> &
CallBacksToRun() {
static std::array<CallbackAndCookie, MaxSignalHandlerCallbacks> callbacks;
return callbacks;
}
// Signal-safe.
void sys::RunSignalHandlers() {
for (CallbackAndCookie &RunMe : CallBacksToRun()) {
auto Expected = CallbackAndCookie::Status::Initialized;
auto Desired = CallbackAndCookie::Status::Executing;
if (!RunMe.Flag.compare_exchange_strong(Expected, Desired))
continue;
(*RunMe.Callback)(RunMe.Cookie);
RunMe.Callback = nullptr;
RunMe.Cookie = nullptr;
RunMe.Flag.store(CallbackAndCookie::Status::Empty);
}
}
// Signal-safe.
static void insertSignalHandler(sys::SignalHandlerCallback FnPtr,
void *Cookie) {
for (CallbackAndCookie &SetMe : CallBacksToRun()) {
auto Expected = CallbackAndCookie::Status::Empty;
auto Desired = CallbackAndCookie::Status::Initializing;
if (!SetMe.Flag.compare_exchange_strong(Expected, Desired))
continue;
SetMe.Callback = FnPtr;
SetMe.Cookie = Cookie;
SetMe.Flag.store(CallbackAndCookie::Status::Initialized);
return;
}
report_fatal_error("too many signal callbacks already registered");
}
static bool findModulesAndOffsets(void **StackTrace, int Depth,
const char **Modules, intptr_t *Offsets,
const char *MainExecutableName,
StringSaver &StrPool);
/// Format a pointer value as hexadecimal. Zero pad it out so its always the
/// same width.
static FormattedNumber format_ptr(void *PC) {
// Each byte is two hex digits plus 2 for the 0x prefix.
unsigned PtrWidth = 2 + 2 * sizeof(void *);
return format_hex((uint64_t)PC, PtrWidth);
}
/// Reads a file \p Filename written by llvm-symbolizer containing function
/// names and source locations for the addresses in \p AddressList and returns
/// the strings in a vector of pairs, where the first pair element is the index
/// of the corresponding entry in AddressList and the second is the symbolized
/// frame, in a format based on the sanitizer stack trace printer, with the
/// exception that it does not write out frame numbers (i.e. "#2 " for the
/// third address), as it is not assumed that \p AddressList corresponds to a
/// single stack trace.
/// There may be multiple returned entries for a single \p AddressList entry if
/// that frame address corresponds to one or more inlined frames; in this case,
/// all frames for an address will appear contiguously and in-order.
std::optional<SmallVector<std::pair<unsigned, std::string>, 0>>
collectAddressSymbols(void **AddressList, unsigned AddressCount,
const char *MainExecutableName,
const std::string &LLVMSymbolizerPath) {
BumpPtrAllocator Allocator;
StringSaver StrPool(Allocator);
SmallVector<const char *, 0> Modules(AddressCount, nullptr);
SmallVector<intptr_t, 0> Offsets(AddressCount, 0);
if (!findModulesAndOffsets(AddressList, AddressCount, Modules.data(),
Offsets.data(), MainExecutableName, StrPool))
return {};
int InputFD;
SmallString<32> InputFile, OutputFile;
sys::fs::createTemporaryFile("symbolizer-input", "", InputFD, InputFile);
sys::fs::createTemporaryFile("symbolizer-output", "", OutputFile);
FileRemover InputRemover(InputFile.c_str());
FileRemover OutputRemover(OutputFile.c_str());
{
raw_fd_ostream Input(InputFD, true);
for (unsigned AddrIdx = 0; AddrIdx < AddressCount; AddrIdx++) {
if (Modules[AddrIdx])
Input << Modules[AddrIdx] << " " << (void *)Offsets[AddrIdx] << "\n";
}
}
std::optional<StringRef> Redirects[] = {InputFile.str(), OutputFile.str(),
StringRef("")};
StringRef Args[] = {"llvm-symbolizer", "--functions=linkage", "--inlining",
#ifdef _WIN32
// Pass --relative-address on Windows so that we don't
// have to add ImageBase from PE file.
// FIXME: Make this the default for llvm-symbolizer.
"--relative-address",
#endif
"--demangle"};
int RunResult =
sys::ExecuteAndWait(LLVMSymbolizerPath, Args, std::nullopt, Redirects);
if (RunResult != 0)
return {};
SmallVector<std::pair<unsigned, std::string>, 0> Result;
auto OutputBuf = MemoryBuffer::getFile(OutputFile.c_str());
if (!OutputBuf)
return {};
StringRef Output = OutputBuf.get()->getBuffer();
SmallVector<StringRef, 32> Lines;
Output.split(Lines, "\n");
auto *CurLine = Lines.begin();
// Lines contains the output from llvm-symbolizer, which should contain for
// each address with a module in order of appearance, one or more lines
// containing the function name and line associated with that address,
// followed by an empty line.
// For each address, adds an output entry for every real or inlined frame at
// that address. For addresses without known modules, we have a single entry
// containing just the formatted address; for all other output entries, we
// output the function entry if it is known, and either the line number if it
// is known or the module+address offset otherwise.
for (unsigned AddrIdx = 0; AddrIdx < AddressCount; AddrIdx++) {
if (!Modules[AddrIdx]) {
auto &SymbolizedFrame = Result.emplace_back(std::make_pair(AddrIdx, ""));
raw_string_ostream OS(SymbolizedFrame.second);
OS << format_ptr(AddressList[AddrIdx]);
continue;
}
// Read pairs of lines (function name and file/line info) until we
// encounter empty line.
for (;;) {
if (CurLine == Lines.end())
return {};
StringRef FunctionName = *CurLine++;
if (FunctionName.empty())
break;
auto &SymbolizedFrame = Result.emplace_back(std::make_pair(AddrIdx, ""));
raw_string_ostream OS(SymbolizedFrame.second);
OS << format_ptr(AddressList[AddrIdx]) << ' ';
if (!FunctionName.starts_with("??"))
OS << FunctionName << ' ';
if (CurLine == Lines.end())
return {};
StringRef FileLineInfo = *CurLine++;
if (!FileLineInfo.starts_with("??")) {
OS << FileLineInfo;
} else {
OS << "(" << Modules[AddrIdx] << '+' << format_hex(Offsets[AddrIdx], 0)
<< ")";
}
}
}
return Result;
}
ErrorOr<std::string> getLLVMSymbolizerPath(StringRef Argv0 = {}) {
ErrorOr<std::string> LLVMSymbolizerPathOrErr = std::error_code();
if (const char *Path = getenv(LLVMSymbolizerPathEnv)) {
LLVMSymbolizerPathOrErr = sys::findProgramByName(Path);
} else if (!Argv0.empty()) {
StringRef Parent = llvm::sys::path::parent_path(Argv0);
if (!Parent.empty())
LLVMSymbolizerPathOrErr =
sys::findProgramByName("llvm-symbolizer", Parent);
}
if (!LLVMSymbolizerPathOrErr)
LLVMSymbolizerPathOrErr = sys::findProgramByName("llvm-symbolizer");
return LLVMSymbolizerPathOrErr;
}
/// Helper that launches llvm-symbolizer and symbolizes a backtrace.
LLVM_ATTRIBUTE_USED
static bool printSymbolizedStackTrace(StringRef Argv0, void **StackTrace,
int Depth, llvm::raw_ostream &OS) {
if (DisableSymbolicationFlag || getenv(DisableSymbolizationEnv))
return false;
// Don't recursively invoke the llvm-symbolizer binary.
if (Argv0.contains("llvm-symbolizer"))
return false;
// FIXME: Subtract necessary number from StackTrace entries to turn return
// addresses into actual instruction addresses.
// Use llvm-symbolizer tool to symbolize the stack traces. First look for it
// alongside our binary, then in $PATH.
ErrorOr<std::string> LLVMSymbolizerPathOrErr = getLLVMSymbolizerPath(Argv0);
if (!LLVMSymbolizerPathOrErr)
return false;
const std::string &LLVMSymbolizerPath = *LLVMSymbolizerPathOrErr;
// If we don't know argv0 or the address of main() at this point, try
// to guess it anyway (it's possible on some platforms).
std::string MainExecutableName =
sys::fs::exists(Argv0) ? std::string(Argv0)
: sys::fs::getMainExecutable(nullptr, nullptr);
auto SymbolizedAddressesOpt = collectAddressSymbols(
StackTrace, Depth, MainExecutableName.c_str(), LLVMSymbolizerPath);
if (!SymbolizedAddressesOpt)
return false;
for (unsigned FrameNo = 0; FrameNo < SymbolizedAddressesOpt->size();
++FrameNo) {
OS << right_justify(formatv("#{0}", FrameNo).str(), std::log10(Depth) + 2)
<< ' ' << (*SymbolizedAddressesOpt)[FrameNo].second << '\n';
}
return true;
}
#if LLVM_ENABLE_DEBUGLOC_TRACKING_ORIGIN
void sys::symbolizeAddresses(AddressSet &Addresses,
SymbolizedAddressMap &SymbolizedAddresses) {
assert(!DisableSymbolicationFlag && !getenv(DisableSymbolizationEnv) &&
"Debugify origin stacktraces require symbolization to be enabled.");
// Convert Set of Addresses to ordered list.
SmallVector<void *, 0> AddressList(Addresses.begin(), Addresses.end());
if (AddressList.empty())
return;
llvm::sort(AddressList);
// Use llvm-symbolizer tool to symbolize the stack traces. First look for it
// alongside our binary, then in $PATH.
ErrorOr<std::string> LLVMSymbolizerPathOrErr = getLLVMSymbolizerPath();
if (!LLVMSymbolizerPathOrErr)
report_fatal_error("Debugify origin stacktraces require llvm-symbolizer");
const std::string &LLVMSymbolizerPath = *LLVMSymbolizerPathOrErr;
// Try to guess the main executable name, since we don't have argv0 available
// here.
std::string MainExecutableName = sys::fs::getMainExecutable(nullptr, nullptr);
auto SymbolizedAddressesOpt =
collectAddressSymbols(AddressList.begin(), AddressList.size(),
MainExecutableName.c_str(), LLVMSymbolizerPath);
if (!SymbolizedAddressesOpt)
return;
for (auto SymbolizedFrame : *SymbolizedAddressesOpt) {
SmallVector<std::string, 0> &SymbolizedAddrs =
SymbolizedAddresses[AddressList[SymbolizedFrame.first]];
SymbolizedAddrs.push_back(SymbolizedFrame.second);
}
return;
}
#endif
static bool printMarkupContext(raw_ostream &OS, const char *MainExecutableName);
LLVM_ATTRIBUTE_USED
static bool printMarkupStackTrace(StringRef Argv0, void **StackTrace, int Depth,
raw_ostream &OS) {
const char *Env = getenv(EnableSymbolizerMarkupEnv);
if (!Env || !*Env)
return false;
std::string MainExecutableName =
sys::fs::exists(Argv0) ? std::string(Argv0)
: sys::fs::getMainExecutable(nullptr, nullptr);
if (!printMarkupContext(OS, MainExecutableName.c_str()))
return false;
for (int I = 0; I < Depth; I++)
OS << format("{{{bt:%d:%#016x}}}\n", I, StackTrace[I]);
return true;
}
// Include the platform-specific parts of this class.
#ifdef LLVM_ON_UNIX
#include "Unix/Signals.inc"
#endif
#ifdef _WIN32
#include "Windows/Signals.inc"
#endif