
This adds the basic assembly generation support for the final EH proposal, which was newly adopted in Sep 2023 and advanced into Phase 4 in Jul 2024: https://github.com/WebAssembly/exception-handling/blob/main/proposals/exception-handling/Exceptions.md This adds support for the generation of new `try_table` and `throw_ref` instruction in .s asesmbly format. This does NOT yet include - Block annotation comment generation for .s format - .o object file generation - .s assembly parsing - Type checking (AsmTypeCheck) - Disassembler - Fixing unwind mismatches in CFGStackify These will be added as follow-up PRs. --- The format for `TRY_TABLE`, both for `MachineInstr` and `MCInst`, is as follows: ``` TRY_TABLE type number_of_catches catch_clauses* ``` where `catch_clause` is ``` catch_opcode tag+ destination ``` `catch_opcode` should be one of 0/1/2/3, which denotes `CATCH`/`CATCH_REF`/`CATCH_ALL`/`CATCH_ALL_REF` respectively. (See `BinaryFormat/Wasm.h`) `tag` exists when the catch is one of `CATCH` or `CATCH_REF`. The MIR format is printed as just the list of raw operands. The (stack-based) assembly instruction supports pretty-printing, including printing `catch` clauses by name, in InstPrinter. In addition to the new instructions `TRY_TABLE` and `THROW_REF`, this adds four pseudo instructions: `CATCH`, `CATCH_REF`, `CATCH_ALL`, and `CATCH_ALL_REF`. These are pseudo instructions to simulate block return values of `catch`, `catch_ref`, `catch_all`, `catch_all_ref` clauses in `try_table` respectively, given that we don't support block return values except for one case (`fixEndsAtEndOfFunction` in CFGStackify). These will be omitted when we lower the instructions to `MCInst` at the end. LateEHPrepare now will have one more stage to covert `CATCH`/`CATCH_ALL`s to `CATCH_REF`/`CATCH_ALL_REF`s when there is a `RETHROW` to rethrow its exception. The pass also converts `RETHROW`s into `THROW_REF`. Note that we still use `RETHROW` as an interim pseudo instruction until we convert them to `THROW_REF` in LateEHPrepare. CFGStackify has a new `placeTryTableMarker` function, which places `try_table`/`end_try_table` markers with a necessary `catch` clause and also `block`/`end_block` markers for the destination of the `catch` clause. In MCInstLower, now we need to support one more case for the multivalue block signature (`catch_ref`'s destination's `(i32, exnref)` return type). InstPrinter has a new routine to print the `catch_list` type, which is used to print `try_table` instructions. The new test, `exception.ll`'s source is the same as `exception-legacy.ll`, with the FileCheck expectations changed. One difference is the commands in this file have `-wasm-enable-exnref` to test the new format, and don't have `-wasm-disable-explicit-locals -wasm-keep-registers`, because the new custom InstPrinter routine to print `catch_list` only works for the stack-based instructions (`_S`), and we can't use `-wasm-keep-registers` for them. As in `exception-legacy.ll`, the FileCheck lines for the new tests do not contain the whole program; they mostly contain only the control flow instructions for readability.
199 lines
6.9 KiB
C++
199 lines
6.9 KiB
C++
//===-- WebAssemblyUtilities.cpp - WebAssembly Utility Functions ----------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
///
|
|
/// \file
|
|
/// This file implements several utility functions for WebAssembly.
|
|
///
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "WebAssemblyUtilities.h"
|
|
#include "WebAssemblyMachineFunctionInfo.h"
|
|
#include "WebAssemblyTargetMachine.h"
|
|
#include "llvm/CodeGen/MachineInstr.h"
|
|
#include "llvm/CodeGen/MachineLoopInfo.h"
|
|
#include "llvm/IR/Function.h"
|
|
#include "llvm/MC/MCContext.h"
|
|
using namespace llvm;
|
|
|
|
// Function names in libc++abi and libunwind
|
|
const char *const WebAssembly::CxaBeginCatchFn = "__cxa_begin_catch";
|
|
const char *const WebAssembly::CxaRethrowFn = "__cxa_rethrow";
|
|
const char *const WebAssembly::StdTerminateFn = "_ZSt9terminatev";
|
|
const char *const WebAssembly::PersonalityWrapperFn =
|
|
"_Unwind_Wasm_CallPersonality";
|
|
|
|
/// Test whether MI is a child of some other node in an expression tree.
|
|
bool WebAssembly::isChild(const MachineInstr &MI,
|
|
const WebAssemblyFunctionInfo &MFI) {
|
|
if (MI.getNumOperands() == 0)
|
|
return false;
|
|
const MachineOperand &MO = MI.getOperand(0);
|
|
if (!MO.isReg() || MO.isImplicit() || !MO.isDef())
|
|
return false;
|
|
Register Reg = MO.getReg();
|
|
return Reg.isVirtual() && MFI.isVRegStackified(Reg);
|
|
}
|
|
|
|
bool WebAssembly::mayThrow(const MachineInstr &MI) {
|
|
switch (MI.getOpcode()) {
|
|
case WebAssembly::THROW:
|
|
case WebAssembly::THROW_S:
|
|
case WebAssembly::THROW_REF:
|
|
case WebAssembly::THROW_REF_S:
|
|
case WebAssembly::RETHROW:
|
|
case WebAssembly::RETHROW_S:
|
|
return true;
|
|
}
|
|
if (isCallIndirect(MI.getOpcode()))
|
|
return true;
|
|
if (!MI.isCall())
|
|
return false;
|
|
|
|
const MachineOperand &MO = getCalleeOp(MI);
|
|
assert(MO.isGlobal() || MO.isSymbol());
|
|
|
|
if (MO.isSymbol()) {
|
|
// Some intrinsics are lowered to calls to external symbols, which are then
|
|
// lowered to calls to library functions. Most of libcalls don't throw, but
|
|
// we only list some of them here now.
|
|
// TODO Consider adding 'nounwind' info in TargetLowering::CallLoweringInfo
|
|
// instead for more accurate info.
|
|
const char *Name = MO.getSymbolName();
|
|
if (strcmp(Name, "memcpy") == 0 || strcmp(Name, "memmove") == 0 ||
|
|
strcmp(Name, "memset") == 0)
|
|
return false;
|
|
return true;
|
|
}
|
|
|
|
const auto *F = dyn_cast<Function>(MO.getGlobal());
|
|
if (!F)
|
|
return true;
|
|
if (F->doesNotThrow())
|
|
return false;
|
|
// These functions never throw
|
|
if (F->getName() == CxaBeginCatchFn || F->getName() == PersonalityWrapperFn ||
|
|
F->getName() == StdTerminateFn)
|
|
return false;
|
|
|
|
// TODO Can we exclude call instructions that are marked as 'nounwind' in the
|
|
// original LLVm IR? (Even when the callee may throw)
|
|
return true;
|
|
}
|
|
|
|
const MachineOperand &WebAssembly::getCalleeOp(const MachineInstr &MI) {
|
|
switch (MI.getOpcode()) {
|
|
case WebAssembly::CALL:
|
|
case WebAssembly::CALL_S:
|
|
case WebAssembly::RET_CALL:
|
|
case WebAssembly::RET_CALL_S:
|
|
return MI.getOperand(MI.getNumExplicitDefs());
|
|
case WebAssembly::CALL_INDIRECT:
|
|
case WebAssembly::CALL_INDIRECT_S:
|
|
case WebAssembly::RET_CALL_INDIRECT:
|
|
case WebAssembly::RET_CALL_INDIRECT_S:
|
|
return MI.getOperand(MI.getNumExplicitOperands() - 1);
|
|
default:
|
|
llvm_unreachable("Not a call instruction");
|
|
}
|
|
}
|
|
|
|
MCSymbolWasm *WebAssembly::getOrCreateFunctionTableSymbol(
|
|
MCContext &Ctx, const WebAssemblySubtarget *Subtarget) {
|
|
StringRef Name = "__indirect_function_table";
|
|
MCSymbolWasm *Sym = cast_or_null<MCSymbolWasm>(Ctx.lookupSymbol(Name));
|
|
if (Sym) {
|
|
if (!Sym->isFunctionTable())
|
|
Ctx.reportError(SMLoc(), "symbol is not a wasm funcref table");
|
|
} else {
|
|
bool is64 = Subtarget && Subtarget->getTargetTriple().isArch64Bit();
|
|
Sym = cast<MCSymbolWasm>(Ctx.getOrCreateSymbol(Name));
|
|
Sym->setFunctionTable(is64);
|
|
// The default function table is synthesized by the linker.
|
|
Sym->setUndefined();
|
|
}
|
|
// MVP object files can't have symtab entries for tables.
|
|
if (!(Subtarget && Subtarget->hasReferenceTypes()))
|
|
Sym->setOmitFromLinkingSection();
|
|
return Sym;
|
|
}
|
|
|
|
MCSymbolWasm *WebAssembly::getOrCreateFuncrefCallTableSymbol(
|
|
MCContext &Ctx, const WebAssemblySubtarget *Subtarget) {
|
|
StringRef Name = "__funcref_call_table";
|
|
MCSymbolWasm *Sym = cast_or_null<MCSymbolWasm>(Ctx.lookupSymbol(Name));
|
|
if (Sym) {
|
|
if (!Sym->isFunctionTable())
|
|
Ctx.reportError(SMLoc(), "symbol is not a wasm funcref table");
|
|
} else {
|
|
Sym = cast<MCSymbolWasm>(Ctx.getOrCreateSymbol(Name));
|
|
|
|
// Setting Weak ensure only one table is left after linking when multiple
|
|
// modules define the table.
|
|
Sym->setWeak(true);
|
|
|
|
wasm::WasmLimits Limits = {0, 1, 1};
|
|
wasm::WasmTableType TableType = {wasm::ValType::FUNCREF, Limits};
|
|
Sym->setType(wasm::WASM_SYMBOL_TYPE_TABLE);
|
|
Sym->setTableType(TableType);
|
|
}
|
|
// MVP object files can't have symtab entries for tables.
|
|
if (!(Subtarget && Subtarget->hasReferenceTypes()))
|
|
Sym->setOmitFromLinkingSection();
|
|
return Sym;
|
|
}
|
|
|
|
// Find a catch instruction from an EH pad.
|
|
MachineInstr *WebAssembly::findCatch(MachineBasicBlock *EHPad) {
|
|
assert(EHPad->isEHPad());
|
|
auto Pos = EHPad->begin();
|
|
// Skip any label or debug instructions. Also skip 'end' marker instructions
|
|
// that may exist after marker placement in CFGStackify.
|
|
while (Pos != EHPad->end() &&
|
|
(Pos->isLabel() || Pos->isDebugInstr() || isMarker(Pos->getOpcode())))
|
|
Pos++;
|
|
if (Pos != EHPad->end() && WebAssembly::isCatch(Pos->getOpcode()))
|
|
return &*Pos;
|
|
return nullptr;
|
|
}
|
|
|
|
unsigned WebAssembly::getCopyOpcodeForRegClass(const TargetRegisterClass *RC) {
|
|
assert(RC != nullptr);
|
|
switch (RC->getID()) {
|
|
case WebAssembly::I32RegClassID:
|
|
return WebAssembly::COPY_I32;
|
|
case WebAssembly::I64RegClassID:
|
|
return WebAssembly::COPY_I64;
|
|
case WebAssembly::F32RegClassID:
|
|
return WebAssembly::COPY_F32;
|
|
case WebAssembly::F64RegClassID:
|
|
return WebAssembly::COPY_F64;
|
|
case WebAssembly::V128RegClassID:
|
|
return WebAssembly::COPY_V128;
|
|
case WebAssembly::FUNCREFRegClassID:
|
|
return WebAssembly::COPY_FUNCREF;
|
|
case WebAssembly::EXTERNREFRegClassID:
|
|
return WebAssembly::COPY_EXTERNREF;
|
|
case WebAssembly::EXNREFRegClassID:
|
|
return WebAssembly::COPY_EXNREF;
|
|
default:
|
|
llvm_unreachable("Unexpected register class");
|
|
}
|
|
}
|
|
|
|
bool WebAssembly::canLowerMultivalueReturn(
|
|
const WebAssemblySubtarget *Subtarget) {
|
|
const auto &TM = static_cast<const WebAssemblyTargetMachine &>(
|
|
Subtarget->getTargetLowering()->getTargetMachine());
|
|
return Subtarget->hasMultivalue() && TM.usesMultivalueABI();
|
|
}
|
|
|
|
bool WebAssembly::canLowerReturn(size_t ResultSize,
|
|
const WebAssemblySubtarget *Subtarget) {
|
|
return ResultSize <= 1 || canLowerMultivalueReturn(Subtarget);
|
|
}
|