BOLT uses `MCAsmLayout` to calculate the output values of functions and basic blocks. This means output values are calculated based on a pre-linking state and any changes to symbol values during linking will cause incorrect values to be used. This issue can be triggered by enabling linker relaxation on RISC-V. Since linker relaxation can remove instructions, symbol values may change. This causes, among other things, the symbol table created by BOLT in the output executable to be incorrect. This patch solves this issue by using `BOLTLinker` to get symbol values instead of `MCAsmLayout`. This way, output values are calculated based on a post-linking state. To make sure the linker can update all necessary symbols, this patch also makes sure all these symbols are not marked as temporary so that they end-up in the object file's symbol table. Note that this patch only deals with symbols of binary functions (`BinaryFunction::updateOutputValues`). The technique described above turned out to be too expensive for basic block symbols so those are handled differently in D155604. Reviewed By: maksfb Differential Revision: https://reviews.llvm.org/D154604
614 lines
21 KiB
C++
614 lines
21 KiB
C++
//===- bolt/Rewrite/MachORewriteInstance.cpp - MachO rewriter -------------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "bolt/Rewrite/MachORewriteInstance.h"
|
|
#include "bolt/Core/BinaryContext.h"
|
|
#include "bolt/Core/BinaryEmitter.h"
|
|
#include "bolt/Core/BinaryFunction.h"
|
|
#include "bolt/Core/JumpTable.h"
|
|
#include "bolt/Core/MCPlusBuilder.h"
|
|
#include "bolt/Passes/Instrumentation.h"
|
|
#include "bolt/Passes/PatchEntries.h"
|
|
#include "bolt/Profile/DataReader.h"
|
|
#include "bolt/Rewrite/BinaryPassManager.h"
|
|
#include "bolt/Rewrite/ExecutableFileMemoryManager.h"
|
|
#include "bolt/Rewrite/JITLinkLinker.h"
|
|
#include "bolt/RuntimeLibs/InstrumentationRuntimeLibrary.h"
|
|
#include "bolt/Utils/Utils.h"
|
|
#include "llvm/MC/MCObjectStreamer.h"
|
|
#include "llvm/Support/Errc.h"
|
|
#include "llvm/Support/FileSystem.h"
|
|
#include "llvm/Support/ToolOutputFile.h"
|
|
#include <memory>
|
|
#include <optional>
|
|
|
|
namespace opts {
|
|
|
|
using namespace llvm;
|
|
extern cl::opt<unsigned> AlignText;
|
|
//FIXME! Upstream change
|
|
//extern cl::opt<bool> CheckOverlappingElements;
|
|
extern cl::opt<bool> ForcePatch;
|
|
extern cl::opt<bool> Instrument;
|
|
extern cl::opt<bool> InstrumentCalls;
|
|
extern cl::opt<bolt::JumpTableSupportLevel> JumpTables;
|
|
extern cl::opt<bool> KeepTmp;
|
|
extern cl::opt<bool> NeverPrint;
|
|
extern cl::opt<std::string> OutputFilename;
|
|
extern cl::opt<bool> PrintAfterBranchFixup;
|
|
extern cl::opt<bool> PrintFinalized;
|
|
extern cl::opt<bool> PrintNormalized;
|
|
extern cl::opt<bool> PrintReordered;
|
|
extern cl::opt<bool> PrintSections;
|
|
extern cl::opt<bool> PrintDisasm;
|
|
extern cl::opt<bool> PrintCFG;
|
|
extern cl::opt<std::string> RuntimeInstrumentationLib;
|
|
extern cl::opt<unsigned> Verbosity;
|
|
} // namespace opts
|
|
|
|
namespace llvm {
|
|
namespace bolt {
|
|
|
|
extern MCPlusBuilder *createX86MCPlusBuilder(const MCInstrAnalysis *,
|
|
const MCInstrInfo *,
|
|
const MCRegisterInfo *);
|
|
extern MCPlusBuilder *createAArch64MCPlusBuilder(const MCInstrAnalysis *,
|
|
const MCInstrInfo *,
|
|
const MCRegisterInfo *);
|
|
|
|
namespace {
|
|
|
|
MCPlusBuilder *createMCPlusBuilder(const Triple::ArchType Arch,
|
|
const MCInstrAnalysis *Analysis,
|
|
const MCInstrInfo *Info,
|
|
const MCRegisterInfo *RegInfo) {
|
|
#ifdef X86_AVAILABLE
|
|
if (Arch == Triple::x86_64)
|
|
return createX86MCPlusBuilder(Analysis, Info, RegInfo);
|
|
#endif
|
|
|
|
#ifdef AARCH64_AVAILABLE
|
|
if (Arch == Triple::aarch64)
|
|
return createAArch64MCPlusBuilder(Analysis, Info, RegInfo);
|
|
#endif
|
|
|
|
llvm_unreachable("architecture unsupported by MCPlusBuilder");
|
|
}
|
|
|
|
} // anonymous namespace
|
|
|
|
#define DEBUG_TYPE "bolt"
|
|
|
|
Expected<std::unique_ptr<MachORewriteInstance>>
|
|
MachORewriteInstance::create(object::MachOObjectFile *InputFile,
|
|
StringRef ToolPath) {
|
|
Error Err = Error::success();
|
|
auto MachORI =
|
|
std::make_unique<MachORewriteInstance>(InputFile, ToolPath, Err);
|
|
if (Err)
|
|
return std::move(Err);
|
|
return std::move(MachORI);
|
|
}
|
|
|
|
MachORewriteInstance::MachORewriteInstance(object::MachOObjectFile *InputFile,
|
|
StringRef ToolPath, Error &Err)
|
|
: InputFile(InputFile), ToolPath(ToolPath) {
|
|
ErrorAsOutParameter EAO(&Err);
|
|
auto BCOrErr = BinaryContext::createBinaryContext(
|
|
InputFile, /* IsPIC */ true, DWARFContext::create(*InputFile));
|
|
if (Error E = BCOrErr.takeError()) {
|
|
Err = std::move(E);
|
|
return;
|
|
}
|
|
BC = std::move(BCOrErr.get());
|
|
BC->initializeTarget(std::unique_ptr<MCPlusBuilder>(createMCPlusBuilder(
|
|
BC->TheTriple->getArch(), BC->MIA.get(), BC->MII.get(), BC->MRI.get())));
|
|
if (opts::Instrument)
|
|
BC->setRuntimeLibrary(std::make_unique<InstrumentationRuntimeLibrary>());
|
|
}
|
|
|
|
Error MachORewriteInstance::setProfile(StringRef Filename) {
|
|
if (!sys::fs::exists(Filename))
|
|
return errorCodeToError(make_error_code(errc::no_such_file_or_directory));
|
|
|
|
if (ProfileReader) {
|
|
// Already exists
|
|
return make_error<StringError>(
|
|
Twine("multiple profiles specified: ") + ProfileReader->getFilename() +
|
|
" and " + Filename, inconvertibleErrorCode());
|
|
}
|
|
|
|
ProfileReader = std::make_unique<DataReader>(Filename);
|
|
return Error::success();
|
|
}
|
|
|
|
void MachORewriteInstance::preprocessProfileData() {
|
|
if (!ProfileReader)
|
|
return;
|
|
if (Error E = ProfileReader->preprocessProfile(*BC.get()))
|
|
report_error("cannot pre-process profile", std::move(E));
|
|
}
|
|
|
|
void MachORewriteInstance::processProfileDataPreCFG() {
|
|
if (!ProfileReader)
|
|
return;
|
|
if (Error E = ProfileReader->readProfilePreCFG(*BC.get()))
|
|
report_error("cannot read profile pre-CFG", std::move(E));
|
|
}
|
|
|
|
void MachORewriteInstance::processProfileData() {
|
|
if (!ProfileReader)
|
|
return;
|
|
if (Error E = ProfileReader->readProfile(*BC.get()))
|
|
report_error("cannot read profile", std::move(E));
|
|
}
|
|
|
|
void MachORewriteInstance::readSpecialSections() {
|
|
for (const object::SectionRef &Section : InputFile->sections()) {
|
|
Expected<StringRef> SectionName = Section.getName();;
|
|
check_error(SectionName.takeError(), "cannot get section name");
|
|
// Only register sections with names.
|
|
if (!SectionName->empty()) {
|
|
BC->registerSection(Section);
|
|
LLVM_DEBUG(
|
|
dbgs() << "BOLT-DEBUG: registering section " << *SectionName
|
|
<< " @ 0x" << Twine::utohexstr(Section.getAddress()) << ":0x"
|
|
<< Twine::utohexstr(Section.getAddress() + Section.getSize())
|
|
<< "\n");
|
|
}
|
|
}
|
|
|
|
if (opts::PrintSections) {
|
|
outs() << "BOLT-INFO: Sections from original binary:\n";
|
|
BC->printSections(outs());
|
|
}
|
|
}
|
|
|
|
namespace {
|
|
|
|
struct DataInCodeRegion {
|
|
explicit DataInCodeRegion(DiceRef D) {
|
|
D.getOffset(Offset);
|
|
D.getLength(Length);
|
|
D.getKind(Kind);
|
|
}
|
|
|
|
uint32_t Offset;
|
|
uint16_t Length;
|
|
uint16_t Kind;
|
|
};
|
|
|
|
std::vector<DataInCodeRegion> readDataInCode(const MachOObjectFile &O) {
|
|
const MachO::linkedit_data_command DataInCodeLC =
|
|
O.getDataInCodeLoadCommand();
|
|
const uint32_t NumberOfEntries =
|
|
DataInCodeLC.datasize / sizeof(MachO::data_in_code_entry);
|
|
std::vector<DataInCodeRegion> DataInCode;
|
|
DataInCode.reserve(NumberOfEntries);
|
|
for (auto I = O.begin_dices(), E = O.end_dices(); I != E; ++I)
|
|
DataInCode.emplace_back(*I);
|
|
llvm::stable_sort(DataInCode, [](DataInCodeRegion LHS, DataInCodeRegion RHS) {
|
|
return LHS.Offset < RHS.Offset;
|
|
});
|
|
return DataInCode;
|
|
}
|
|
|
|
std::optional<uint64_t> readStartAddress(const MachOObjectFile &O) {
|
|
std::optional<uint64_t> StartOffset;
|
|
std::optional<uint64_t> TextVMAddr;
|
|
for (const object::MachOObjectFile::LoadCommandInfo &LC : O.load_commands()) {
|
|
switch (LC.C.cmd) {
|
|
case MachO::LC_MAIN: {
|
|
MachO::entry_point_command LCMain = O.getEntryPointCommand(LC);
|
|
StartOffset = LCMain.entryoff;
|
|
break;
|
|
}
|
|
case MachO::LC_SEGMENT: {
|
|
MachO::segment_command LCSeg = O.getSegmentLoadCommand(LC);
|
|
StringRef SegmentName(LCSeg.segname,
|
|
strnlen(LCSeg.segname, sizeof(LCSeg.segname)));
|
|
if (SegmentName == "__TEXT")
|
|
TextVMAddr = LCSeg.vmaddr;
|
|
break;
|
|
}
|
|
case MachO::LC_SEGMENT_64: {
|
|
MachO::segment_command_64 LCSeg = O.getSegment64LoadCommand(LC);
|
|
StringRef SegmentName(LCSeg.segname,
|
|
strnlen(LCSeg.segname, sizeof(LCSeg.segname)));
|
|
if (SegmentName == "__TEXT")
|
|
TextVMAddr = LCSeg.vmaddr;
|
|
break;
|
|
}
|
|
default:
|
|
continue;
|
|
}
|
|
}
|
|
return (TextVMAddr && StartOffset)
|
|
? std::optional<uint64_t>(*TextVMAddr + *StartOffset)
|
|
: std::nullopt;
|
|
}
|
|
|
|
} // anonymous namespace
|
|
|
|
void MachORewriteInstance::discoverFileObjects() {
|
|
std::vector<SymbolRef> FunctionSymbols;
|
|
for (const SymbolRef &S : InputFile->symbols()) {
|
|
SymbolRef::Type Type = cantFail(S.getType(), "cannot get symbol type");
|
|
if (Type == SymbolRef::ST_Function)
|
|
FunctionSymbols.push_back(S);
|
|
}
|
|
if (FunctionSymbols.empty())
|
|
return;
|
|
llvm::stable_sort(
|
|
FunctionSymbols, [](const SymbolRef &LHS, const SymbolRef &RHS) {
|
|
return cantFail(LHS.getValue()) < cantFail(RHS.getValue());
|
|
});
|
|
for (size_t Index = 0; Index < FunctionSymbols.size(); ++Index) {
|
|
const uint64_t Address = cantFail(FunctionSymbols[Index].getValue());
|
|
ErrorOr<BinarySection &> Section = BC->getSectionForAddress(Address);
|
|
// TODO: It happens for some symbols (e.g. __mh_execute_header).
|
|
// Add proper logic to handle them correctly.
|
|
if (!Section) {
|
|
errs() << "BOLT-WARNING: no section found for address " << Address
|
|
<< "\n";
|
|
continue;
|
|
}
|
|
|
|
std::string SymbolName =
|
|
cantFail(FunctionSymbols[Index].getName(), "cannot get symbol name")
|
|
.str();
|
|
// Uniquify names of local symbols.
|
|
if (!(cantFail(FunctionSymbols[Index].getFlags()) & SymbolRef::SF_Global))
|
|
SymbolName = NR.uniquify(SymbolName);
|
|
|
|
section_iterator S = cantFail(FunctionSymbols[Index].getSection());
|
|
uint64_t EndAddress = S->getAddress() + S->getSize();
|
|
|
|
size_t NFIndex = Index + 1;
|
|
// Skip aliases.
|
|
while (NFIndex < FunctionSymbols.size() &&
|
|
cantFail(FunctionSymbols[NFIndex].getValue()) == Address)
|
|
++NFIndex;
|
|
if (NFIndex < FunctionSymbols.size() &&
|
|
S == cantFail(FunctionSymbols[NFIndex].getSection()))
|
|
EndAddress = cantFail(FunctionSymbols[NFIndex].getValue());
|
|
|
|
const uint64_t SymbolSize = EndAddress - Address;
|
|
const auto It = BC->getBinaryFunctions().find(Address);
|
|
if (It == BC->getBinaryFunctions().end()) {
|
|
BinaryFunction *Function = BC->createBinaryFunction(
|
|
std::move(SymbolName), *Section, Address, SymbolSize);
|
|
if (!opts::Instrument)
|
|
Function->setOutputAddress(Function->getAddress());
|
|
|
|
} else {
|
|
It->second.addAlternativeName(std::move(SymbolName));
|
|
}
|
|
}
|
|
|
|
const std::vector<DataInCodeRegion> DataInCode = readDataInCode(*InputFile);
|
|
|
|
for (auto &BFI : BC->getBinaryFunctions()) {
|
|
BinaryFunction &Function = BFI.second;
|
|
Function.setMaxSize(Function.getSize());
|
|
|
|
ErrorOr<ArrayRef<uint8_t>> FunctionData = Function.getData();
|
|
if (!FunctionData) {
|
|
errs() << "BOLT-ERROR: corresponding section is non-executable or "
|
|
<< "empty for function " << Function << '\n';
|
|
continue;
|
|
}
|
|
|
|
// Treat zero-sized functions as non-simple ones.
|
|
if (Function.getSize() == 0) {
|
|
Function.setSimple(false);
|
|
continue;
|
|
}
|
|
|
|
// Offset of the function in the file.
|
|
const auto *FileBegin =
|
|
reinterpret_cast<const uint8_t *>(InputFile->getData().data());
|
|
Function.setFileOffset(FunctionData->begin() - FileBegin);
|
|
|
|
// Treat functions which contain data in code as non-simple ones.
|
|
const auto It = std::lower_bound(
|
|
DataInCode.cbegin(), DataInCode.cend(), Function.getFileOffset(),
|
|
[](DataInCodeRegion D, uint64_t Offset) { return D.Offset < Offset; });
|
|
if (It != DataInCode.cend() &&
|
|
It->Offset + It->Length <=
|
|
Function.getFileOffset() + Function.getMaxSize())
|
|
Function.setSimple(false);
|
|
}
|
|
|
|
BC->StartFunctionAddress = readStartAddress(*InputFile);
|
|
}
|
|
|
|
void MachORewriteInstance::disassembleFunctions() {
|
|
for (auto &BFI : BC->getBinaryFunctions()) {
|
|
BinaryFunction &Function = BFI.second;
|
|
if (!Function.isSimple())
|
|
continue;
|
|
Function.disassemble();
|
|
if (opts::PrintDisasm)
|
|
Function.print(outs(), "after disassembly");
|
|
}
|
|
}
|
|
|
|
void MachORewriteInstance::buildFunctionsCFG() {
|
|
for (auto &BFI : BC->getBinaryFunctions()) {
|
|
BinaryFunction &Function = BFI.second;
|
|
if (!Function.isSimple())
|
|
continue;
|
|
if (!Function.buildCFG(/*AllocId*/ 0)) {
|
|
errs() << "BOLT-WARNING: failed to build CFG for the function "
|
|
<< Function << "\n";
|
|
}
|
|
}
|
|
}
|
|
|
|
void MachORewriteInstance::postProcessFunctions() {
|
|
for (auto &BFI : BC->getBinaryFunctions()) {
|
|
BinaryFunction &Function = BFI.second;
|
|
if (Function.empty())
|
|
continue;
|
|
Function.postProcessCFG();
|
|
if (opts::PrintCFG)
|
|
Function.print(outs(), "after building cfg");
|
|
}
|
|
}
|
|
|
|
void MachORewriteInstance::runOptimizationPasses() {
|
|
BinaryFunctionPassManager Manager(*BC);
|
|
if (opts::Instrument) {
|
|
Manager.registerPass(std::make_unique<PatchEntries>());
|
|
Manager.registerPass(std::make_unique<Instrumentation>(opts::NeverPrint));
|
|
}
|
|
|
|
Manager.registerPass(std::make_unique<ShortenInstructions>(opts::NeverPrint));
|
|
|
|
Manager.registerPass(std::make_unique<RemoveNops>(opts::NeverPrint));
|
|
|
|
Manager.registerPass(std::make_unique<NormalizeCFG>(opts::PrintNormalized));
|
|
|
|
Manager.registerPass(
|
|
std::make_unique<ReorderBasicBlocks>(opts::PrintReordered));
|
|
Manager.registerPass(
|
|
std::make_unique<FixupBranches>(opts::PrintAfterBranchFixup));
|
|
// This pass should always run last.*
|
|
Manager.registerPass(
|
|
std::make_unique<FinalizeFunctions>(opts::PrintFinalized));
|
|
|
|
Manager.runPasses();
|
|
}
|
|
|
|
void MachORewriteInstance::mapInstrumentationSection(
|
|
StringRef SectionName, BOLTLinker::SectionMapper MapSection) {
|
|
if (!opts::Instrument)
|
|
return;
|
|
ErrorOr<BinarySection &> Section = BC->getUniqueSectionByName(SectionName);
|
|
if (!Section) {
|
|
llvm::errs() << "Cannot find " + SectionName + " section\n";
|
|
exit(1);
|
|
}
|
|
if (!Section->hasValidSectionID())
|
|
return;
|
|
MapSection(*Section, Section->getAddress());
|
|
}
|
|
|
|
void MachORewriteInstance::mapCodeSections(
|
|
BOLTLinker::SectionMapper MapSection) {
|
|
for (BinaryFunction *Function : BC->getAllBinaryFunctions()) {
|
|
if (!Function->isEmitted())
|
|
continue;
|
|
if (Function->getOutputAddress() == 0)
|
|
continue;
|
|
ErrorOr<BinarySection &> FuncSection = Function->getCodeSection();
|
|
if (!FuncSection)
|
|
report_error(
|
|
(Twine("Cannot find section for function ") + Function->getOneName())
|
|
.str(),
|
|
FuncSection.getError());
|
|
|
|
FuncSection->setOutputAddress(Function->getOutputAddress());
|
|
LLVM_DEBUG(dbgs() << "BOLT: mapping 0x"
|
|
<< Twine::utohexstr(FuncSection->getAllocAddress()) << " to 0x"
|
|
<< Twine::utohexstr(Function->getOutputAddress()) << '\n');
|
|
MapSection(*FuncSection, Function->getOutputAddress());
|
|
Function->setImageAddress(FuncSection->getAllocAddress());
|
|
Function->setImageSize(FuncSection->getOutputSize());
|
|
}
|
|
|
|
if (opts::Instrument) {
|
|
ErrorOr<BinarySection &> BOLT = BC->getUniqueSectionByName("__bolt");
|
|
if (!BOLT) {
|
|
llvm::errs() << "Cannot find __bolt section\n";
|
|
exit(1);
|
|
}
|
|
uint64_t Addr = BOLT->getAddress();
|
|
for (BinaryFunction *Function : BC->getAllBinaryFunctions()) {
|
|
if (!Function->isEmitted())
|
|
continue;
|
|
if (Function->getOutputAddress() != 0)
|
|
continue;
|
|
ErrorOr<BinarySection &> FuncSection = Function->getCodeSection();
|
|
assert(FuncSection && "cannot find section for function");
|
|
Addr = llvm::alignTo(Addr, 4);
|
|
FuncSection->setOutputAddress(Addr);
|
|
MapSection(*FuncSection, Addr);
|
|
Function->setFileOffset(Addr - BOLT->getAddress() +
|
|
BOLT->getInputFileOffset());
|
|
Function->setImageAddress(FuncSection->getAllocAddress());
|
|
Function->setImageSize(FuncSection->getOutputSize());
|
|
BC->registerNameAtAddress(Function->getOneName(), Addr, 0, 0);
|
|
Addr += FuncSection->getOutputSize();
|
|
}
|
|
}
|
|
}
|
|
|
|
void MachORewriteInstance::emitAndLink() {
|
|
std::error_code EC;
|
|
std::unique_ptr<::llvm::ToolOutputFile> TempOut =
|
|
std::make_unique<::llvm::ToolOutputFile>(
|
|
opts::OutputFilename + ".bolt.o", EC, sys::fs::OF_None);
|
|
check_error(EC, "cannot create output object file");
|
|
|
|
if (opts::KeepTmp)
|
|
TempOut->keep();
|
|
|
|
std::unique_ptr<buffer_ostream> BOS =
|
|
std::make_unique<buffer_ostream>(TempOut->os());
|
|
raw_pwrite_stream *OS = BOS.get();
|
|
auto Streamer = BC->createStreamer(*OS);
|
|
|
|
emitBinaryContext(*Streamer, *BC, getOrgSecPrefix());
|
|
Streamer->finish();
|
|
|
|
std::unique_ptr<MemoryBuffer> ObjectMemBuffer =
|
|
MemoryBuffer::getMemBuffer(BOS->str(), "in-memory object file", false);
|
|
std::unique_ptr<object::ObjectFile> Obj = cantFail(
|
|
object::ObjectFile::createObjectFile(ObjectMemBuffer->getMemBufferRef()),
|
|
"error creating in-memory object");
|
|
assert(Obj && "createObjectFile cannot return nullptr");
|
|
|
|
auto EFMM = std::make_unique<ExecutableFileMemoryManager>(*BC);
|
|
EFMM->setNewSecPrefix(getNewSecPrefix());
|
|
EFMM->setOrgSecPrefix(getOrgSecPrefix());
|
|
|
|
Linker = std::make_unique<JITLinkLinker>(*BC, std::move(EFMM));
|
|
Linker->loadObject(ObjectMemBuffer->getMemBufferRef(),
|
|
[this](auto MapSection) {
|
|
// Assign addresses to all sections. If key corresponds
|
|
// to the object created by ourselves, call our regular
|
|
// mapping function. If we are loading additional objects
|
|
// as part of runtime libraries for instrumentation,
|
|
// treat them as extra sections.
|
|
mapCodeSections(MapSection);
|
|
mapInstrumentationSection("__counters", MapSection);
|
|
mapInstrumentationSection("__tables", MapSection);
|
|
});
|
|
|
|
// TODO: Refactor addRuntimeLibSections to work properly on Mach-O
|
|
// and use it here.
|
|
// if (auto *RtLibrary = BC->getRuntimeLibrary()) {
|
|
// RtLibrary->link(*BC, ToolPath, *Linker, [this](auto MapSection) {
|
|
// mapInstrumentationSection("I__setup", MapSection);
|
|
// mapInstrumentationSection("I__fini", MapSection);
|
|
// mapInstrumentationSection("I__data", MapSection);
|
|
// mapInstrumentationSection("I__text", MapSection);
|
|
// mapInstrumentationSection("I__cstring", MapSection);
|
|
// mapInstrumentationSection("I__literal16", MapSection);
|
|
// });
|
|
// }
|
|
}
|
|
|
|
void MachORewriteInstance::writeInstrumentationSection(StringRef SectionName,
|
|
raw_pwrite_stream &OS) {
|
|
if (!opts::Instrument)
|
|
return;
|
|
ErrorOr<BinarySection &> Section = BC->getUniqueSectionByName(SectionName);
|
|
if (!Section) {
|
|
llvm::errs() << "Cannot find " + SectionName + " section\n";
|
|
exit(1);
|
|
}
|
|
if (!Section->hasValidSectionID())
|
|
return;
|
|
assert(Section->getInputFileOffset() &&
|
|
"Section input offset cannot be zero");
|
|
assert(Section->getAllocAddress() && "Section alloc address cannot be zero");
|
|
assert(Section->getOutputSize() && "Section output size cannot be zero");
|
|
OS.pwrite(reinterpret_cast<char *>(Section->getAllocAddress()),
|
|
Section->getOutputSize(), Section->getInputFileOffset());
|
|
}
|
|
|
|
void MachORewriteInstance::rewriteFile() {
|
|
std::error_code EC;
|
|
Out = std::make_unique<ToolOutputFile>(opts::OutputFilename, EC,
|
|
sys::fs::OF_None);
|
|
check_error(EC, "cannot create output executable file");
|
|
raw_fd_ostream &OS = Out->os();
|
|
OS << InputFile->getData();
|
|
|
|
for (auto &BFI : BC->getBinaryFunctions()) {
|
|
BinaryFunction &Function = BFI.second;
|
|
if (!Function.isSimple())
|
|
continue;
|
|
assert(Function.isEmitted() && "Simple function has not been emitted");
|
|
if (!opts::Instrument && (Function.getImageSize() > Function.getMaxSize()))
|
|
continue;
|
|
if (opts::Verbosity >= 2)
|
|
outs() << "BOLT: rewriting function \"" << Function << "\"\n";
|
|
OS.pwrite(reinterpret_cast<char *>(Function.getImageAddress()),
|
|
Function.getImageSize(), Function.getFileOffset());
|
|
}
|
|
|
|
for (const BinaryFunction *Function : BC->getInjectedBinaryFunctions()) {
|
|
OS.pwrite(reinterpret_cast<char *>(Function->getImageAddress()),
|
|
Function->getImageSize(), Function->getFileOffset());
|
|
}
|
|
|
|
writeInstrumentationSection("__counters", OS);
|
|
writeInstrumentationSection("__tables", OS);
|
|
|
|
// TODO: Refactor addRuntimeLibSections to work properly on Mach-O and
|
|
// use it here.
|
|
writeInstrumentationSection("I__setup", OS);
|
|
writeInstrumentationSection("I__fini", OS);
|
|
writeInstrumentationSection("I__data", OS);
|
|
writeInstrumentationSection("I__text", OS);
|
|
writeInstrumentationSection("I__cstring", OS);
|
|
writeInstrumentationSection("I__literal16", OS);
|
|
|
|
Out->keep();
|
|
EC = sys::fs::setPermissions(opts::OutputFilename,
|
|
sys::fs::perms::all_all);
|
|
check_error(EC, "cannot set permissions of output file");
|
|
}
|
|
|
|
void MachORewriteInstance::adjustCommandLineOptions() {
|
|
//FIXME! Upstream change
|
|
// opts::CheckOverlappingElements = false;
|
|
if (!opts::AlignText.getNumOccurrences())
|
|
opts::AlignText = BC->PageAlign;
|
|
if (opts::Instrument.getNumOccurrences())
|
|
opts::ForcePatch = true;
|
|
opts::JumpTables = JTS_MOVE;
|
|
opts::InstrumentCalls = false;
|
|
opts::RuntimeInstrumentationLib = "libbolt_rt_instr_osx.a";
|
|
}
|
|
|
|
void MachORewriteInstance::run() {
|
|
adjustCommandLineOptions();
|
|
|
|
readSpecialSections();
|
|
|
|
discoverFileObjects();
|
|
|
|
preprocessProfileData();
|
|
|
|
disassembleFunctions();
|
|
|
|
processProfileDataPreCFG();
|
|
|
|
buildFunctionsCFG();
|
|
|
|
processProfileData();
|
|
|
|
postProcessFunctions();
|
|
|
|
runOptimizationPasses();
|
|
|
|
emitAndLink();
|
|
|
|
rewriteFile();
|
|
}
|
|
|
|
MachORewriteInstance::~MachORewriteInstance() {}
|
|
|
|
} // namespace bolt
|
|
} // namespace llvm
|