Skip to content

Commit

Permalink
hwasan: Implement lazy thread initialization for the interceptor ABI.
Browse files Browse the repository at this point in the history
The problem is similar to D55986 but for threads: a process with the
interceptor hwasan library loaded might have some threads started by
instrumented libraries and some by uninstrumented libraries, and we
need to be able to run instrumented code on the latter.

The solution is to perform per-thread initialization lazily. If a
function needs to access shadow memory or add itself to the per-thread
ring buffer its prologue checks to see whether the value in the
sanitizer TLS slot is null, and if so it calls __hwasan_thread_enter
and reloads from the TLS slot. The runtime does the same thing if it
needs to access this data structure.

This change means that the code generator needs to know whether we
are targeting the interceptor runtime, since we don't want to pay
the cost of lazy initialization when targeting a platform with native
hwasan support. A flag -fsanitize-hwaddress-abi={interceptor,platform}
has been introduced for selecting the runtime ABI to target. The
default ABI is set to interceptor since it's assumed that it will
be more common that users will be compiling application code than
platform code.

Because we can no longer assume that the TLS slot is initialized,
the pthread_create interceptor is no longer necessary, so it has
been removed.

Ideally, lazy initialization should only cost one instruction in the
hot path, but at present the call may cause us to spill arguments
to the stack, which means more instructions in the hot path (or
theoretically in the cold path if the spills are moved with shrink
wrapping). With an appropriately chosen calling convention for
the per-thread initialization function (TODO) the hot path should
always need just one instruction and the cold path should need two
instructions with no spilling required.

Differential Revision: https://reviews.llvm.org/D56038

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@350429 91177308-0d34-0410-b5e6-96231b3b80d8
  • Loading branch information
pcc committed Jan 4, 2019
1 parent 1f63024 commit 1011e42
Show file tree
Hide file tree
Showing 2 changed files with 52 additions and 2 deletions.
29 changes: 27 additions & 2 deletions lib/Transforms/Instrumentation/HWAddressSanitizer.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -264,6 +264,7 @@ class HWAddressSanitizer : public FunctionPass {

Function *HwasanTagMemoryFunc;
Function *HwasanGenerateTagFunc;
Function *HwasanThreadEnterFunc;

Constant *ShadowGlobal;

Expand Down Expand Up @@ -391,6 +392,9 @@ void HWAddressSanitizer::initializeCallbacks(Module &M) {
HWAsanMemset = checkSanitizerInterfaceFunction(M.getOrInsertFunction(
MemIntrinCallbackPrefix + "memset", IRB.getInt8PtrTy(),
IRB.getInt8PtrTy(), IRB.getInt32Ty(), IntptrTy));

HwasanThreadEnterFunc = checkSanitizerInterfaceFunction(
M.getOrInsertFunction("__hwasan_thread_enter", IRB.getVoidTy()));
}

Value *HWAddressSanitizer::getDynamicShadowNonTls(IRBuilder<> &IRB) {
Expand Down Expand Up @@ -806,14 +810,35 @@ Value *HWAddressSanitizer::emitPrologue(IRBuilder<> &IRB,
Value *SlotPtr = getHwasanThreadSlotPtr(IRB, IntptrTy);
assert(SlotPtr);

Value *ThreadLong = IRB.CreateLoad(SlotPtr);
Instruction *ThreadLong = IRB.CreateLoad(SlotPtr);

Function *F = IRB.GetInsertBlock()->getParent();
if (F->getFnAttribute("hwasan-abi").getValueAsString() == "interceptor") {
Value *ThreadLongEqZero =
IRB.CreateICmpEQ(ThreadLong, ConstantInt::get(IntptrTy, 0));
auto *Br = cast<BranchInst>(SplitBlockAndInsertIfThen(
ThreadLongEqZero, cast<Instruction>(ThreadLongEqZero)->getNextNode(),
false, MDBuilder(*C).createBranchWeights(1, 100000)));

IRB.SetInsertPoint(Br);
// FIXME: This should call a new runtime function with a custom calling
// convention to avoid needing to spill all arguments here.
IRB.CreateCall(HwasanThreadEnterFunc);
LoadInst *ReloadThreadLong = IRB.CreateLoad(SlotPtr);

IRB.SetInsertPoint(&*Br->getSuccessor(0)->begin());
PHINode *ThreadLongPhi = IRB.CreatePHI(IntptrTy, 2);
ThreadLongPhi->addIncoming(ThreadLong, ThreadLong->getParent());
ThreadLongPhi->addIncoming(ReloadThreadLong, ReloadThreadLong->getParent());
ThreadLong = ThreadLongPhi;
}

// Extract the address field from ThreadLong. Unnecessary on AArch64 with TBI.
Value *ThreadLongMaybeUntagged =
TargetTriple.isAArch64() ? ThreadLong : untagPointer(IRB, ThreadLong);

if (WithFrameRecord) {
// Prepare ring buffer data.
Function *F = IRB.GetInsertBlock()->getParent();
auto PC = IRB.CreatePtrToInt(F, IntptrTy);
auto GetStackPointerFn =
Intrinsic::getDeclaration(F->getParent(), Intrinsic::frameaddress);
Expand Down
25 changes: 25 additions & 0 deletions test/Instrumentation/HWAddressSanitizer/lazy-thread-init.ll
Original file line number Diff line number Diff line change
@@ -0,0 +1,25 @@
; RUN: opt -S -hwasan < %s | FileCheck %s

target triple = "x86_64-unknown-linux-gnu"

declare void @bar([16 x i32]* %p)

define void @foo() sanitize_hwaddress "hwasan-abi"="interceptor" {
; CHECK: [[LOAD:%[^ ]*]] = load i64, i64* @__hwasan_tls
; CHECK: [[ICMP:%[^ ]*]] = icmp eq i64 [[LOAD]], 0
; CHECK: br i1 [[ICMP]], label %[[INIT:[^,]*]], label %[[CONT:[^,]*]], !prof [[PROF:![0-9]+]]

; CHECK: [[INIT]]:
; CHECK: call void @__hwasan_thread_enter()
; CHECK: [[RELOAD:%[^ ]*]] = load i64, i64* @__hwasan_tls
; CHECK: br label %[[CONT]]

; CHECK: [[CONT]]:
; CHECK: phi i64 [ [[LOAD]], %0 ], [ [[RELOAD]], %[[INIT]] ]

%p = alloca [16 x i32]
call void @bar([16 x i32]* %p)
ret void
}

; CHECK: [[PROF]] = !{!"branch_weights", i32 1, i32 100000}

0 comments on commit 1011e42

Please sign in to comment.