116 lines
4.7 KiB
LLVM
116 lines
4.7 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --function-signature --check-attributes --check-globals
|
|
; RUN: opt -aa-pipeline=basic-aa -passes=openmp-opt -attributor-manifest-internal -attributor-annotate-decl-cs -S < %s | FileCheck %s --check-prefixes=CHECK,TUNIT
|
|
; RUN: opt -aa-pipeline=basic-aa -passes=openmp-opt-cgscc -attributor-manifest-internal -attributor-annotate-decl-cs -S < %s | FileCheck %s --check-prefixes=CHECK,CGSCC
|
|
|
|
; Target triple for the module (amdgcn architecture).
target triple = "amdgcn-amd-amdhsa"
|
|
|
|
; Named struct type. No visible line in this file references it; the runtime
; calls in @kernel pass `ptr undef` instead of a pointer to such a struct.
%struct.ident_t = type { i32, i32, i32, i32, ptr }
|
|
|
|
; The global under test: an internal i32 in address space 3 with an undef
; initializer. @kernel stores to it twice and loads from it once.
; (Address space 3 is presumably workgroup-local memory on this target -- TODO
; confirm against the AMDGPU address-space documentation.)
@G = internal addrspace(3) global i32 undef, align 4
|
|
|
|
; Make sure we do not delete the stores to @G without also replacing the load with `1`.
|
|
;.
|
|
; CHECK: @[[G:[a-zA-Z0-9_$"\\.-]+]] = internal addrspace(3) global i32 undef, align 4
|
|
;.
|
|
; @kernel is the only function defined in this test. It calls
; @__kmpc_target_init, compares the result against -1, and uses that single
; condition (%cmp) for two separate branches:
;   if.then  (%cmp true):  store 1 to @G
;   if.else  (%cmp false): call @barrier, load @G, pass the value to @use1
;   if.then2 (%cmp true):  store 2 to @G, then call @barrier
; The first two paths rejoin in if.merge; the function ends in if.end with a
; call to @__kmpc_target_deinit. The autogenerated assertions for both run
; lines expect the two stores and the load to still be present in the output.
; (Presumably a -1 result identifies the thread that runs the sequential part
; of the kernel -- TODO confirm against the OpenMP device runtime.)
define void @kernel() "kernel" {
|
|
; TUNIT: Function Attrs: norecurse
|
|
; TUNIT-LABEL: define {{[^@]+}}@kernel
|
|
; TUNIT-SAME: () #[[ATTR0:[0-9]+]] {
|
|
; TUNIT-NEXT: [[CALL:%.*]] = call i32 @__kmpc_target_init(ptr undef, i8 1, i1 false)
|
|
; TUNIT-NEXT: [[CMP:%.*]] = icmp eq i32 [[CALL]], -1
|
|
; TUNIT-NEXT: br i1 [[CMP]], label [[IF_THEN:%.*]], label [[IF_ELSE:%.*]]
|
|
; TUNIT: if.then:
|
|
; TUNIT-NEXT: store i32 1, ptr addrspace(3) @G, align 4
|
|
; TUNIT-NEXT: br label [[IF_MERGE:%.*]]
|
|
; TUNIT: if.else:
|
|
; TUNIT-NEXT: call void @barrier() #[[ATTR4:[0-9]+]]
|
|
; TUNIT-NEXT: [[L:%.*]] = load i32, ptr addrspace(3) @G, align 4
|
|
; TUNIT-NEXT: call void @use1(i32 [[L]]) #[[ATTR4]]
|
|
; TUNIT-NEXT: br label [[IF_MERGE]]
|
|
; TUNIT: if.merge:
|
|
; TUNIT-NEXT: br i1 [[CMP]], label [[IF_THEN2:%.*]], label [[IF_END:%.*]]
|
|
; TUNIT: if.then2:
|
|
; TUNIT-NEXT: store i32 2, ptr addrspace(3) @G, align 4
|
|
; TUNIT-NEXT: call void @barrier() #[[ATTR4]]
|
|
; TUNIT-NEXT: br label [[IF_END]]
|
|
; TUNIT: if.end:
|
|
; TUNIT-NEXT: call void @__kmpc_target_deinit(ptr undef, i8 1)
|
|
; TUNIT-NEXT: ret void
|
|
;
|
|
; CGSCC: Function Attrs: norecurse
|
|
; CGSCC-LABEL: define {{[^@]+}}@kernel
|
|
; CGSCC-SAME: () #[[ATTR0:[0-9]+]] {
|
|
; CGSCC-NEXT: [[CALL:%.*]] = call i32 @__kmpc_target_init(ptr undef, i8 1, i1 false)
|
|
; CGSCC-NEXT: [[CMP:%.*]] = icmp eq i32 [[CALL]], -1
|
|
; CGSCC-NEXT: br i1 [[CMP]], label [[IF_THEN:%.*]], label [[IF_ELSE:%.*]]
|
|
; CGSCC: if.then:
|
|
; CGSCC-NEXT: store i32 1, ptr addrspace(3) @G, align 4
|
|
; CGSCC-NEXT: br label [[IF_MERGE:%.*]]
|
|
; CGSCC: if.else:
|
|
; CGSCC-NEXT: call void @barrier()
|
|
; CGSCC-NEXT: [[L:%.*]] = load i32, ptr addrspace(3) @G, align 4
|
|
; CGSCC-NEXT: call void @use1(i32 [[L]])
|
|
; CGSCC-NEXT: br label [[IF_MERGE]]
|
|
; CGSCC: if.merge:
|
|
; CGSCC-NEXT: br i1 [[CMP]], label [[IF_THEN2:%.*]], label [[IF_END:%.*]]
|
|
; CGSCC: if.then2:
|
|
; CGSCC-NEXT: store i32 2, ptr addrspace(3) @G, align 4
|
|
; CGSCC-NEXT: call void @barrier()
|
|
; CGSCC-NEXT: br label [[IF_END]]
|
|
; CGSCC: if.end:
|
|
; CGSCC-NEXT: call void @__kmpc_target_deinit(ptr undef, i8 1)
|
|
; CGSCC-NEXT: ret void
|
|
;
|
|
; The input IR starts here; the comment lines above inside this function are
; the autogenerated expectations for the two run lines.
%call = call i32 @__kmpc_target_init(ptr undef, i8 1, i1 false)
|
|
; %cmp is computed once and reused by the branch in if.merge.
%cmp = icmp eq i32 %call, -1
|
|
br i1 %cmp, label %if.then, label %if.else
|
|
if.then:
|
|
; First store to @G; reached only when %cmp is true.
store i32 1, ptr addrspace(3) @G
|
|
br label %if.merge
|
|
if.else:
|
|
; The trailing ';' after the call starts an empty IR comment; it is not part
; of the instruction.
call void @barrier();
|
|
; The only load of @G in the function; reached only when %cmp is false.
%l = load i32, ptr addrspace(3) @G
|
|
call void @use1(i32 %l)
|
|
br label %if.merge
|
|
if.merge:
|
|
; Branches again on the same %cmp that selected if.then / if.else.
br i1 %cmp, label %if.then2, label %if.end
|
|
if.then2:
|
|
; Second store to @G, on the %cmp-true path, followed by a barrier call.
store i32 2, ptr addrspace(3) @G
|
|
call void @barrier();
|
|
br label %if.end
|
|
if.end:
|
|
call void @__kmpc_target_deinit(ptr undef, i8 1)
|
|
ret void
|
|
}
|
|
|
|
; External functions called by @kernel. All four are nocallback; @barrier and
; @use1 are also norecurse and nounwind, and only @use1 is nosync.
declare void @barrier() norecurse nounwind nocallback
|
|
declare void @use1(i32) nosync norecurse nounwind nocallback
|
|
; Called as the first instruction of @kernel; its i32 result is compared
; against -1 there.
declare i32 @__kmpc_target_init(ptr, i8, i1) nocallback
|
|
; Called in @kernel's final block, immediately before `ret void`.
declare void @__kmpc_target_deinit(ptr, i8) nocallback
|
|
|
|
; Module flags: !0 and !1 give "openmp" and "openmp-device" the value 50.
!llvm.module.flags = !{!0, !1}
|
|
; Annotation list holding !2, which pairs @kernel with the string "kernel"
; and the value 1.
!nvvm.annotations = !{!2}
|
|
|
|
!0 = !{i32 7, !"openmp", i32 50}
|
|
!1 = !{i32 7, !"openmp-device", i32 50}
|
|
!2 = !{ptr @kernel, !"kernel", i32 1}
|
|
|
|
;.
|
|
; TUNIT: attributes #[[ATTR0]] = { norecurse "kernel" }
|
|
; TUNIT: attributes #[[ATTR1:[0-9]+]] = { nocallback norecurse nounwind }
|
|
; TUNIT: attributes #[[ATTR2:[0-9]+]] = { nocallback norecurse nosync nounwind }
|
|
; TUNIT: attributes #[[ATTR3:[0-9]+]] = { nocallback }
|
|
; TUNIT: attributes #[[ATTR4]] = { nounwind }
|
|
;.
|
|
; CGSCC: attributes #[[ATTR0]] = { norecurse "kernel" }
|
|
; CGSCC: attributes #[[ATTR1:[0-9]+]] = { nocallback norecurse nounwind }
|
|
; CGSCC: attributes #[[ATTR2:[0-9]+]] = { nocallback norecurse nosync nounwind }
|
|
; CGSCC: attributes #[[ATTR3:[0-9]+]] = { nocallback }
|
|
;.
|
|
; CHECK: [[META0:![0-9]+]] = !{i32 7, !"openmp", i32 50}
|
|
; CHECK: [[META1:![0-9]+]] = !{i32 7, !"openmp-device", i32 50}
|
|
; CHECK: [[META2:![0-9]+]] = !{ptr @kernel, !"kernel", i32 1}
|
|
;.
|
|
;; NOTE: These prefixes are unused and the list is autogenerated. Do not add tests below this line:
|
|
; CHECK: {{.*}}
|