From 0f8f086e21ed1852884dfc281248fcba72059f49 Mon Sep 17 00:00:00 2001 From: Reid Kleckner Date: Thu, 2 Apr 2015 21:44:55 +0000 Subject: [PATCH] [ASan] Don't use stack malloc for 32-bit functions using inline asm This prevents us from running out of registers in the backend. Introducing stack malloc calls prevents the backend from recognizing the inline asm operands as stack objects. When the backend recognizes a stack object, it doesn't need to materialize the address of the memory in a physical register. Instead it generates a simple SP-based memory operand. Introducing a stack malloc forces the backend to find a free register for every memory operand. 32-bit x86 simply doesn't have enough registers for this to succeed in most cases. Reviewers: kcc, samsonov Differential Revision: http://reviews.llvm.org/D8790 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@233979 91177308-0d34-0410-b5e6-96231b3b80d8 --- .../Instrumentation/AddressSanitizer.cpp | 6 ++- .../AddressSanitizer/X86/asm_cpuid.ll | 53 +++++++++++++++++++ 2 files changed, 57 insertions(+), 2 deletions(-) create mode 100644 test/Instrumentation/AddressSanitizer/X86/asm_cpuid.ll diff --git a/lib/Transforms/Instrumentation/AddressSanitizer.cpp b/lib/Transforms/Instrumentation/AddressSanitizer.cpp index e483d6f9e3b..9ccb82b759f 100644 --- a/lib/Transforms/Instrumentation/AddressSanitizer.cpp +++ b/lib/Transforms/Instrumentation/AddressSanitizer.cpp @@ -1766,9 +1766,11 @@ void FunctionStackPoisoner::poisonStack() { uint64_t LocalStackSize = L.FrameSize; bool DoStackMalloc = ClUseAfterReturn && LocalStackSize <= kMaxStackMallocSize; - // Don't do dynamic alloca in presence of inline asm: too often it - // makes assumptions on which registers are available. + // Don't do dynamic alloca in presence of inline asm: too often it makes + // assumptions on which registers are available. Don't do stack malloc in the + // presence of inline asm on 32-bit platforms for the same reason. bool DoDynamicAlloca = ClDynamicAllocaStack && !HasNonEmptyInlineAsm; + DoStackMalloc &= !HasNonEmptyInlineAsm || ASan.LongSize != 32; Value *StaticAlloca = DoDynamicAlloca ? nullptr : createAllocaForLayout(IRB, L, false); diff --git a/test/Instrumentation/AddressSanitizer/X86/asm_cpuid.ll b/test/Instrumentation/AddressSanitizer/X86/asm_cpuid.ll new file mode 100644 index 00000000000..cfa91d4da63 --- /dev/null +++ b/test/Instrumentation/AddressSanitizer/X86/asm_cpuid.ll @@ -0,0 +1,53 @@ +; RUN: opt < %s -asan -S -o %t.ll +; RUN: FileCheck %s < %t.ll +; RUN: llc < %t.ll | FileCheck %s --check-prefix=ASM + +target datalayout = "e-m:x-p:32:32-i64:64-f80:32-n8:16:32-S32" +target triple = "i386-pc-windows-msvc" + +define void @MyCPUID(i32 %fxn, i32* %out) sanitize_address { + %fxn.ptr = alloca i32 + %a.ptr = alloca i32 + %b.ptr = alloca i32 + %c.ptr = alloca i32 + %d.ptr = alloca i32 + store i32 %fxn, i32* %fxn.ptr + call void asm sideeffect inteldialect "xchg ebx, esi\0A\09mov eax, dword ptr $4\0A\09cpuid\0A\09mov dword ptr $0, eax\0A\09mov dword ptr $1, ebx\0A\09mov dword ptr $2, ecx\0A\09mov dword ptr $3, edx\0A\09xchg ebx, esi", "=*m,=*m,=*m,=*m,*m,~{eax},~{ebx},~{ecx},~{edx},~{esi},~{dirflag},~{fpsr},~{flags}"(i32* %a.ptr, i32* %b.ptr, i32* %c.ptr, i32* %d.ptr, i32* %fxn.ptr) + + %a = load i32, i32* %a.ptr + %a.out = getelementptr inbounds i32, i32* %out, i32 0 + store i32 %a, i32* %a.out + + %b = load i32, i32* %b.ptr + %b.out = getelementptr inbounds i32, i32* %out, i32 1 + store i32 %b, i32* %b.out + + %c = load i32, i32* %c.ptr + %c.out = getelementptr inbounds i32, i32* %out, i32 2 + store i32 %c, i32* %c.out + + %d = load i32, i32* %d.ptr + %d.out = getelementptr inbounds i32, i32* %out, i32 3 + store i32 %d, i32* %d.out + + ret void +} + +; We used to introduce stack mallocs for UAR detection, but that makes LLVM run +; out of registers on 32-bit platforms. Therefore, we don't do stack malloc on +; such functions. + +; CHECK-LABEL: define void @MyCPUID(i32 %fxn, i32* %out) +; CHECK: %MyAlloca = alloca [96 x i8], align 32 +; CHECK-NOT: call {{.*}} @__asan_stack_malloc + +; The code generator should recognize that all operands are just stack memory. +; This is important with MS inline asm where operand lists are implicit and all +; local variables can be referenced freely. + +; ASM-LABEL: MyCPUID: +; ASM: cpuid +; ASM-NEXT: movl %eax, {{[0-9]+}}(%esp) +; ASM-NEXT: movl %ebx, {{[0-9]+}}(%esp) +; ASM-NEXT: movl %ecx, {{[0-9]+}}(%esp) +; ASM-NEXT: movl %edx, {{[0-9]+}}(%esp) -- 2.34.1