This commit adds support for WebAssembly's custom-page-sizes proposal to `wasm-ld`. An overview of the proposal can be found [here](https://github.com/WebAssembly/custom-page-sizes/blob/main/proposals/custom-page-sizes/Overview.md). In a sentence, it allows customizing a Wasm memory's page size, enabling Wasm to target environments with less than 64KiB of memory (the default Wasm page size) available for Wasm memories. This commit contains the following: * Adds a `--page-size=N` CLI flag to `wasm-ld` for configuring the linked Wasm binary's linear memory's page size. * When the page size is configured to a non-default value, then the final Wasm binary will use the encodings defined in the custom-page-sizes proposal to declare the linear memory's page size. * Defines a `__wasm_first_page_end` symbol, whose address points to the first page in the Wasm linear memory, a.k.a. is the Wasm memory's page size. This allows writing code that is compatible with any page size, and doesn't require re-compiling its object code. At the same time, because it just lowers to a constant rather than a memory access or something, it enables link-time optimization. * Adds tests for these new features. r? @sbc100 cc @sunfishcode
198 lines
6.9 KiB
C++
198 lines
6.9 KiB
C++
//===-- WebAssemblyUtilities.cpp - WebAssembly Utility Functions ----------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
///
|
|
/// \file
|
|
/// This file implements several utility functions for WebAssembly.
|
|
///
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "WebAssemblyUtilities.h"
|
|
#include "WebAssemblyMachineFunctionInfo.h"
|
|
#include "WebAssemblyTargetMachine.h"
|
|
#include "llvm/CodeGen/MachineInstr.h"
|
|
#include "llvm/IR/Function.h"
|
|
#include "llvm/MC/MCContext.h"
|
|
using namespace llvm;
|
|
|
|
// Function names in libc++abi and libunwind
|
|
const char *const WebAssembly::CxaBeginCatchFn = "__cxa_begin_catch";
|
|
const char *const WebAssembly::CxaRethrowFn = "__cxa_rethrow";
|
|
const char *const WebAssembly::StdTerminateFn = "_ZSt9terminatev";
|
|
const char *const WebAssembly::PersonalityWrapperFn =
|
|
"_Unwind_Wasm_CallPersonality";
|
|
|
|
/// Test whether MI is a child of some other node in an expression tree.
|
|
bool WebAssembly::isChild(const MachineInstr &MI,
|
|
const WebAssemblyFunctionInfo &MFI) {
|
|
if (MI.getNumOperands() == 0)
|
|
return false;
|
|
const MachineOperand &MO = MI.getOperand(0);
|
|
if (!MO.isReg() || MO.isImplicit() || !MO.isDef())
|
|
return false;
|
|
Register Reg = MO.getReg();
|
|
return Reg.isVirtual() && MFI.isVRegStackified(Reg);
|
|
}
|
|
|
|
bool WebAssembly::mayThrow(const MachineInstr &MI) {
|
|
switch (MI.getOpcode()) {
|
|
case WebAssembly::THROW:
|
|
case WebAssembly::THROW_S:
|
|
case WebAssembly::THROW_REF:
|
|
case WebAssembly::THROW_REF_S:
|
|
case WebAssembly::RETHROW:
|
|
case WebAssembly::RETHROW_S:
|
|
return true;
|
|
}
|
|
if (isCallIndirect(MI.getOpcode()))
|
|
return true;
|
|
if (!MI.isCall())
|
|
return false;
|
|
|
|
const MachineOperand &MO = getCalleeOp(MI);
|
|
assert(MO.isGlobal() || MO.isSymbol());
|
|
|
|
if (MO.isSymbol()) {
|
|
// Some intrinsics are lowered to calls to external symbols, which are then
|
|
// lowered to calls to library functions. Most of libcalls don't throw, but
|
|
// we only list some of them here now.
|
|
// TODO Consider adding 'nounwind' info in TargetLowering::CallLoweringInfo
|
|
// instead for more accurate info.
|
|
const char *Name = MO.getSymbolName();
|
|
if (strcmp(Name, "memcpy") == 0 || strcmp(Name, "memmove") == 0 ||
|
|
strcmp(Name, "memset") == 0)
|
|
return false;
|
|
return true;
|
|
}
|
|
|
|
const auto *F = dyn_cast<Function>(MO.getGlobal());
|
|
if (!F)
|
|
return true;
|
|
if (F->doesNotThrow())
|
|
return false;
|
|
// These functions never throw
|
|
if (F->getName() == CxaBeginCatchFn || F->getName() == PersonalityWrapperFn ||
|
|
F->getName() == StdTerminateFn)
|
|
return false;
|
|
|
|
// TODO Can we exclude call instructions that are marked as 'nounwind' in the
|
|
// original LLVm IR? (Even when the callee may throw)
|
|
return true;
|
|
}
|
|
|
|
const MachineOperand &WebAssembly::getCalleeOp(const MachineInstr &MI) {
|
|
switch (MI.getOpcode()) {
|
|
case WebAssembly::CALL:
|
|
case WebAssembly::CALL_S:
|
|
case WebAssembly::RET_CALL:
|
|
case WebAssembly::RET_CALL_S:
|
|
return MI.getOperand(MI.getNumExplicitDefs());
|
|
case WebAssembly::CALL_INDIRECT:
|
|
case WebAssembly::CALL_INDIRECT_S:
|
|
case WebAssembly::RET_CALL_INDIRECT:
|
|
case WebAssembly::RET_CALL_INDIRECT_S:
|
|
return MI.getOperand(MI.getNumExplicitOperands() - 1);
|
|
default:
|
|
llvm_unreachable("Not a call instruction");
|
|
}
|
|
}
|
|
|
|
MCSymbolWasm *WebAssembly::getOrCreateFunctionTableSymbol(
|
|
MCContext &Ctx, const WebAssemblySubtarget *Subtarget) {
|
|
StringRef Name = "__indirect_function_table";
|
|
MCSymbolWasm *Sym = cast_or_null<MCSymbolWasm>(Ctx.lookupSymbol(Name));
|
|
if (Sym) {
|
|
if (!Sym->isFunctionTable())
|
|
Ctx.reportError(SMLoc(), "symbol is not a wasm funcref table");
|
|
} else {
|
|
bool is64 = Subtarget && Subtarget->getTargetTriple().isArch64Bit();
|
|
Sym = cast<MCSymbolWasm>(Ctx.getOrCreateSymbol(Name));
|
|
Sym->setFunctionTable(is64);
|
|
// The default function table is synthesized by the linker.
|
|
Sym->setUndefined();
|
|
}
|
|
// MVP object files can't have symtab entries for tables.
|
|
if (!(Subtarget && Subtarget->hasCallIndirectOverlong()))
|
|
Sym->setOmitFromLinkingSection();
|
|
return Sym;
|
|
}
|
|
|
|
MCSymbolWasm *WebAssembly::getOrCreateFuncrefCallTableSymbol(
|
|
MCContext &Ctx, const WebAssemblySubtarget *Subtarget) {
|
|
StringRef Name = "__funcref_call_table";
|
|
MCSymbolWasm *Sym = cast_or_null<MCSymbolWasm>(Ctx.lookupSymbol(Name));
|
|
if (Sym) {
|
|
if (!Sym->isFunctionTable())
|
|
Ctx.reportError(SMLoc(), "symbol is not a wasm funcref table");
|
|
} else {
|
|
Sym = cast<MCSymbolWasm>(Ctx.getOrCreateSymbol(Name));
|
|
|
|
// Setting Weak ensure only one table is left after linking when multiple
|
|
// modules define the table.
|
|
Sym->setWeak(true);
|
|
|
|
wasm::WasmLimits Limits = {0, 1, 1, 0};
|
|
wasm::WasmTableType TableType = {wasm::ValType::FUNCREF, Limits};
|
|
Sym->setType(wasm::WASM_SYMBOL_TYPE_TABLE);
|
|
Sym->setTableType(TableType);
|
|
}
|
|
// MVP object files can't have symtab entries for tables.
|
|
if (!(Subtarget && Subtarget->hasCallIndirectOverlong()))
|
|
Sym->setOmitFromLinkingSection();
|
|
return Sym;
|
|
}
|
|
|
|
// Find a catch instruction from an EH pad.
|
|
MachineInstr *WebAssembly::findCatch(MachineBasicBlock *EHPad) {
|
|
assert(EHPad->isEHPad());
|
|
auto Pos = EHPad->begin();
|
|
// Skip any label or debug instructions. Also skip 'end' marker instructions
|
|
// that may exist after marker placement in CFGStackify.
|
|
while (Pos != EHPad->end() &&
|
|
(Pos->isLabel() || Pos->isDebugInstr() || isMarker(Pos->getOpcode())))
|
|
Pos++;
|
|
if (Pos != EHPad->end() && WebAssembly::isCatch(Pos->getOpcode()))
|
|
return &*Pos;
|
|
return nullptr;
|
|
}
|
|
|
|
unsigned WebAssembly::getCopyOpcodeForRegClass(const TargetRegisterClass *RC) {
|
|
assert(RC != nullptr);
|
|
switch (RC->getID()) {
|
|
case WebAssembly::I32RegClassID:
|
|
return WebAssembly::COPY_I32;
|
|
case WebAssembly::I64RegClassID:
|
|
return WebAssembly::COPY_I64;
|
|
case WebAssembly::F32RegClassID:
|
|
return WebAssembly::COPY_F32;
|
|
case WebAssembly::F64RegClassID:
|
|
return WebAssembly::COPY_F64;
|
|
case WebAssembly::V128RegClassID:
|
|
return WebAssembly::COPY_V128;
|
|
case WebAssembly::FUNCREFRegClassID:
|
|
return WebAssembly::COPY_FUNCREF;
|
|
case WebAssembly::EXTERNREFRegClassID:
|
|
return WebAssembly::COPY_EXTERNREF;
|
|
case WebAssembly::EXNREFRegClassID:
|
|
return WebAssembly::COPY_EXNREF;
|
|
default:
|
|
llvm_unreachable("Unexpected register class");
|
|
}
|
|
}
|
|
|
|
bool WebAssembly::canLowerMultivalueReturn(
|
|
const WebAssemblySubtarget *Subtarget) {
|
|
const auto &TM = static_cast<const WebAssemblyTargetMachine &>(
|
|
Subtarget->getTargetLowering()->getTargetMachine());
|
|
return Subtarget->hasMultivalue() && TM.usesMultivalueABI();
|
|
}
|
|
|
|
bool WebAssembly::canLowerReturn(size_t ResultSize,
|
|
const WebAssemblySubtarget *Subtarget) {
|
|
return ResultSize <= 1 || canLowerMultivalueReturn(Subtarget);
|
|
}
|