As discussed in [1], introduce BPF instructions with load-acquire and
store-release semantics under -mcpu=v4. Define 2 new flags:
BPF_LOAD_ACQ 0x100
BPF_STORE_REL 0x110
A "load-acquire" is a BPF_STX | BPF_ATOMIC instruction with the 'imm'
field set to BPF_LOAD_ACQ (0x100).
Similarly, a "store-release" is a BPF_STX | BPF_ATOMIC instruction with
the 'imm' field set to BPF_STORE_REL (0x110).
Unlike existing atomic read-modify-write operations that only support
BPF_W (32-bit) and BPF_DW (64-bit) size modifiers, load-acquires and
store-releases also support BPF_B (8-bit) and BPF_H (16-bit). An 8- or
16-bit load-acquire zero-extends the value before writing it to a 32-bit
register, just like ARM64 instruction LDAPRH and friends.
As an example (assuming little-endian):
long foo(long *ptr) {
return __atomic_load_n(ptr, __ATOMIC_ACQUIRE);
}
foo() can be compiled to:
db 10 00 00 00 01 00 00 r0 = load_acquire((u64 *)(r1 + 0x0))
95 00 00 00 00 00 00 00 exit
opcode (0xdb): BPF_ATOMIC | BPF_DW | BPF_STX
imm (0x00000100): BPF_LOAD_ACQ
Similarly:
void bar(short *ptr, short val) {
__atomic_store_n(ptr, val, __ATOMIC_RELEASE);
}
bar() can be compiled to:
cb 21 00 00 10 01 00 00 store_release((u16 *)(r1 + 0x0), w2)
95 00 00 00 00 00 00 00 exit
opcode (0xcb): BPF_ATOMIC | BPF_H | BPF_STX
imm (0x00000110): BPF_STORE_REL
Inline assembly is also supported.
Add a pre-defined macro, __BPF_FEATURE_LOAD_ACQ_STORE_REL, to let
developers detect this new feature. It can also be disabled using a new
llc option, -disable-load-acq-store-rel.
Using __ATOMIC_RELAXED for __atomic_store{,_n}() will generate a "plain"
store (BPF_MEM | BPF_STX) instruction:
void foo(short *ptr, short val) {
__atomic_store_n(ptr, val, __ATOMIC_RELAXED);
}
6b 21 00 00 00 00 00 00 *(u16 *)(r1 + 0x0) = w2
95 00 00 00 00 00 00 00 exit
Similarly, using __ATOMIC_RELAXED for __atomic_load{,_n}() will generate
a zero-extending, "plain" load (BPF_MEM | BPF_LDX) instruction:
int foo(char *ptr) {
return __atomic_load_n(ptr, __ATOMIC_RELAXED);
}
71 11 00 00 00 00 00 00 w1 = *(u8 *)(r1 + 0x0)
bc 10 08 00 00 00 00 00 w0 = (s8)w1
95 00 00 00 00 00 00 00 exit
Currently __ATOMIC_CONSUME is an alias for __ATOMIC_ACQUIRE. Using
__ATOMIC_SEQ_CST ("sequentially consistent") is not supported yet and
will cause an error:
$ clang --target=bpf -mcpu=v4 -c bar.c > /dev/null
bar.c:1:5: error: sequentially consistent (seq_cst) atomic load/store is
not supported
1 | int foo(int *ptr) { return __atomic_load_n(ptr, __ATOMIC_SEQ_CST); }
| ^
...
Finally, rename those isST*() and isLD*() helper functions in
BPFMISimplifyPatchable.cpp based on what the instructions actually do,
rather than their instruction class.
[1]
https://lore.kernel.org/all/20240729183246.4110549-1-yepeilin@google.com/
108 lines
3.2 KiB
C++
108 lines
3.2 KiB
C++
//===--- BPF.cpp - Implement BPF target feature support -------------------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This file implements BPF TargetInfo objects.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "BPF.h"
|
|
#include "Targets.h"
|
|
#include "clang/Basic/MacroBuilder.h"
|
|
#include "clang/Basic/TargetBuiltins.h"
|
|
#include "llvm/ADT/StringRef.h"
|
|
|
|
using namespace clang;
|
|
using namespace clang::targets;
|
|
|
|
static constexpr int NumBuiltins =
|
|
clang::BPF::LastTSBuiltin - Builtin::FirstTSBuiltin;
|
|
|
|
#define GET_BUILTIN_STR_TABLE
|
|
#include "clang/Basic/BuiltinsBPF.inc"
|
|
#undef GET_BUILTIN_STR_TABLE
|
|
|
|
static constexpr Builtin::Info BuiltinInfos[] = {
|
|
#define GET_BUILTIN_INFOS
|
|
#include "clang/Basic/BuiltinsBPF.inc"
|
|
#undef GET_BUILTIN_INFOS
|
|
};
|
|
static_assert(std::size(BuiltinInfos) == NumBuiltins);
|
|
|
|
void BPFTargetInfo::getTargetDefines(const LangOptions &Opts,
|
|
MacroBuilder &Builder) const {
|
|
Builder.defineMacro("__bpf__");
|
|
Builder.defineMacro("__BPF__");
|
|
|
|
std::string CPU = getTargetOpts().CPU;
|
|
if (CPU == "probe") {
|
|
Builder.defineMacro("__BPF_CPU_VERSION__", "0");
|
|
return;
|
|
}
|
|
|
|
Builder.defineMacro("__BPF_FEATURE_ADDR_SPACE_CAST");
|
|
Builder.defineMacro("__BPF_FEATURE_MAY_GOTO");
|
|
Builder.defineMacro("__BPF_FEATURE_ATOMIC_MEM_ORDERING");
|
|
|
|
if (CPU.empty())
|
|
CPU = "v3";
|
|
|
|
if (CPU == "generic" || CPU == "v1") {
|
|
Builder.defineMacro("__BPF_CPU_VERSION__", "1");
|
|
return;
|
|
}
|
|
|
|
std::string CpuVerNumStr = CPU.substr(1);
|
|
Builder.defineMacro("__BPF_CPU_VERSION__", CpuVerNumStr);
|
|
|
|
int CpuVerNum = std::stoi(CpuVerNumStr);
|
|
if (CpuVerNum >= 2)
|
|
Builder.defineMacro("__BPF_FEATURE_JMP_EXT");
|
|
|
|
if (CpuVerNum >= 3) {
|
|
Builder.defineMacro("__BPF_FEATURE_JMP32");
|
|
Builder.defineMacro("__BPF_FEATURE_ALU32");
|
|
}
|
|
|
|
if (CpuVerNum >= 4) {
|
|
Builder.defineMacro("__BPF_FEATURE_LDSX");
|
|
Builder.defineMacro("__BPF_FEATURE_MOVSX");
|
|
Builder.defineMacro("__BPF_FEATURE_BSWAP");
|
|
Builder.defineMacro("__BPF_FEATURE_SDIV_SMOD");
|
|
Builder.defineMacro("__BPF_FEATURE_GOTOL");
|
|
Builder.defineMacro("__BPF_FEATURE_ST");
|
|
Builder.defineMacro("__BPF_FEATURE_LOAD_ACQ_STORE_REL");
|
|
}
|
|
}
|
|
|
|
static constexpr llvm::StringLiteral ValidCPUNames[] = {"generic", "v1", "v2",
|
|
"v3", "v4", "probe"};
|
|
|
|
bool BPFTargetInfo::isValidCPUName(StringRef Name) const {
|
|
return llvm::is_contained(ValidCPUNames, Name);
|
|
}
|
|
|
|
void BPFTargetInfo::fillValidCPUList(SmallVectorImpl<StringRef> &Values) const {
|
|
Values.append(std::begin(ValidCPUNames), std::end(ValidCPUNames));
|
|
}
|
|
|
|
llvm::SmallVector<Builtin::InfosShard>
|
|
BPFTargetInfo::getTargetBuiltins() const {
|
|
return {{&BuiltinStrings, BuiltinInfos}};
|
|
}
|
|
|
|
bool BPFTargetInfo::handleTargetFeatures(std::vector<std::string> &Features,
|
|
DiagnosticsEngine &Diags) {
|
|
for (const auto &Feature : Features) {
|
|
if (Feature == "+alu32") {
|
|
HasAlu32 = true;
|
|
}
|
|
}
|
|
|
|
return true;
|
|
}
|