It's currently ambiguous in IR whether the source language explicitly did not want a stack protector (in C, via the function attribute no_stack_protector) or simply doesn't care, for any given function. It's common for code that manipulates the stack via inline assembly, or that has to set up its own stack canary (such as the Linux kernel), to want to avoid stack protectors in certain functions. In this case, we've been bitten by numerous bugs where a callee with a stack protector is inlined into an __attribute__((__no_stack_protector__)) caller, which generally breaks the caller's assumptions about not having a stack protector. LTO exacerbates the issue. While developers can avoid this by putting all no_stack_protector functions in one translation unit together and compiling those with -fno-stack-protector, that is generally not as ergonomic as a function attribute, and it still doesn't work for LTO. See also: https://lore.kernel.org/linux-pm/20200915172658.1432732-1-rkir@google.com/ https://lore.kernel.org/lkml/20200918201436.2932360-30-samitolvanen@google.com/T/#u Typically, when inlining a callee into a caller, the caller will be upgraded in its level of stack protection (see adjustCallerSSPLevel()). By adding an explicit attribute in the IR when the function attribute is used in the source language, we can now identify such cases and prevent inlining. Block inlining when the callee and caller differ such that one has `nossp` while the other has `ssp`, `sspstrong`, or `sspreq`. Fixes pr/47479. Reviewed By: void Differential Revision: https://reviews.llvm.org/D87956
86 lines
2.5 KiB
LLVM
86 lines
2.5 KiB
LLVM
; RUN: opt < %s -S -partial-inliner -skip-partial-inlining-cost-analysis=true | FileCheck %s
|
|
|
|
|
|
; Callee that carries both attribute groups of this test: #0 holds the
; attributes expected to show up on the function outlined from it, #1 holds
; the ones that are absent from that expected attribute list.
;
; Returns (%v > 2000 ? %v - 10 : %v) + 200, with a signed comparison.
;
; The value, block and parameter names are matched textually by the FileCheck
; expectations in this file (%v, %sub.out, .if.then), so they must not be
; renamed.
define i32 @callee_most(i32 %v) unnamed_addr #0 #1 {
entry:
  %cmp = icmp sgt i32 %v, 2000
  br i1 %cmp, label %if.then, label %if.end

if.then:
  br label %if.then2

if.then2:
  ; %sub is consumed by the phi in if.end; the expected outlined function
  ; takes an extra i32* parameter named %sub.out.
  %sub = sub i32 %v, 10
  br label %if.end

if.end:
  ; %v unchanged when coming straight from entry, %v - 10 otherwise.
  %v2 = phi i32 [ %v, %entry ], [ %sub, %if.then2 ]
  %add = add nsw i32 %v2, 200
  ret i32 %add
}
|
|
|
|
; Same body as the other callees in this file, but marked optnone noinline.
; The expectations for @caller require the direct call to this function to
; still be present in the output.
;
; Returns (%v > 2000 ? %v - 10 : %v) + 200, with a signed comparison.
define i32 @callee_noinline(i32 %v) optnone noinline {
entry:
  %cmp = icmp sgt i32 %v, 2000
  br i1 %cmp, label %if.then, label %if.end

if.then:
  br label %if.then2

if.then2:
  %sub = sub i32 %v, 10
  br label %if.end

if.end:
  ; %v unchanged when coming straight from entry, %v - 10 otherwise.
  %v2 = phi i32 [ %v, %entry ], [ %sub, %if.then2 ]
  %add = add nsw i32 %v2, 200
  ret i32 %add
}
|
|
|
|
; Same body as the other callees in this file, but marked writeonly.
; The expected definition of the function outlined from it,
; @callee_writeonly.1.if.then, has its opening brace directly after the
; parameter list, i.e. no attribute group reference.
;
; Returns (%v > 2000 ? %v - 10 : %v) + 200, with a signed comparison.
;
; The value, block and parameter names are matched textually by the FileCheck
; expectations in this file (%v, %sub.out, .if.then), so they must not be
; renamed.
define i32 @callee_writeonly(i32 %v) writeonly {
entry:
  %cmp = icmp sgt i32 %v, 2000
  br i1 %cmp, label %if.then, label %if.end

if.then:
  br label %if.then2

if.then2:
  ; %sub is consumed by the phi in if.end; the expected outlined function
  ; takes an extra i32* parameter named %sub.out.
  %sub = sub i32 %v, 10
  br label %if.end

if.end:
  ; %v unchanged when coming straight from entry, %v - 10 otherwise.
  %v2 = phi i32 [ %v, %entry ], [ %sub, %if.then2 ]
  %add = add nsw i32 %v2, 200
  ret i32 %add
}
|
|
; Calls each of the three callees once with the same argument and returns the
; result of the last call only.
;
; The expectations require that the output for this function contains, in
; this order: a call to the region outlined from @callee_most, the direct
; call to @callee_noinline, and a call to the region outlined from
; @callee_writeonly.
; CHECK-LABEL: @caller
; CHECK: call void @callee_most.2.if.then(i32 %v
; CHECK: call i32 @callee_noinline(i32 %v)
; CHECK: call void @callee_writeonly.1.if.then(i32 %v
define i32 @caller(i32 %v) {
entry:
  %c1 = call i32 @callee_most(i32 %v)
  %c2 = call i32 @callee_noinline(i32 %v)
  %c3 = call i32 @callee_writeonly(i32 %v)
  ret i32 %c3
}
|
|
|
|
; Expected definitions of the two outlined functions, matched in this order.
; The one outlined from @callee_writeonly must have its opening brace directly
; after the parameter list (no attribute group). The one outlined from
; @callee_most must reference an attribute group, whose number is captured as
; FN_ATTRS and matched against the expected list further down.
; CHECK: define internal void @callee_writeonly.1.if.then(i32 %v, i32* %sub.out) {
; CHECK: define internal void @callee_most.2.if.then(i32 %v, i32* %sub.out) [[FN_ATTRS:#[0-9]+]]

; attributes to preserve
; Attached to @callee_most. The expected FN_ATTRS list below repeats every
; entry of this group in the same order.
attributes #0 = {
  inlinehint minsize noduplicate noimplicitfloat norecurse noredzone nounwind
  nonlazybind optsize safestack sanitize_address sanitize_hwaddress sanitize_memory
  sanitize_thread sspstrong strictfp uwtable "foo"="bar"
  "patchable-function"="prologue-short-redirect" "probe-stack"="_foo_guard" "stack-probe-size"="4096" }

; CHECK: attributes [[FN_ATTRS]] = { inlinehint minsize noduplicate noimplicitfloat norecurse noredzone nounwind nonlazybind optsize safestack sanitize_address sanitize_hwaddress sanitize_memory sanitize_thread sspstrong strictfp uwtable "foo"="bar" "patchable-function"="prologue-short-redirect" "probe-stack"="_foo_guard" "stack-probe-size"="4096" }
|
|
|
|
; attributes to drop
; Attached to @callee_most alongside #0. None of the entries below appear in
; the attribute list this test expects on the function outlined from
; @callee_most.
attributes #1 = {
  alignstack=16 convergent inaccessiblememonly inaccessiblemem_or_argmemonly naked
  noreturn readonly argmemonly returns_twice speculatable "thunk"
}
|