xref: /llvm-project/clang/test/OpenMP/amdgcn_target_global_constructor.cpp (revision 68bcba6d7a1cc18996c0bcb7c62267c62d2040d0)
1 // NOTE: Assertions have been autogenerated by utils/update_cc_test_checks.py UTC_ARGS: --function-signature --check-globals --include-generated-funcs --replace-value-regex "__omp_offloading_[0-9a-z]+_[0-9a-z]+" "reduction_size[.].+[.]" "pl_cond[.].+[.|,]" --prefix-filecheck-ir-name _
2 // REQUIRES: amdgpu-registered-target
3 
4 // RUN: %clang_cc1 -fopenmp -x c++ -std=c++11 -triple x86_64-unknown-unknown -fopenmp-targets=amdgcn-amd-amdhsa -emit-llvm-bc %s -o %t-ppc-host.bc
5 // RUN: %clang_cc1 -fopenmp -x c++ -std=c++11 -triple amdgcn-amd-amdhsa -fopenmp-targets=amdgcn-amd-amdhsa -emit-llvm %s -fopenmp-is-target-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - | FileCheck %s
6 // expected-no-diagnostics
7 #ifndef HEADER
8 #define HEADER
9 
10 void foo(void);
11 
12 struct S {
13   int a;
14   S() : a(1) {}
15   ~S() { foo(); }
16 };
17 
18 #pragma omp declare target
19 S A;
20 #pragma omp end declare target
21 
22 #endif
23 //.
24 // CHECK: @__omp_rtl_debug_kind = weak_odr hidden addrspace(1) constant i32 0
25 // CHECK: @__omp_rtl_assume_teams_oversubscription = weak_odr hidden addrspace(1) constant i32 0
26 // CHECK: @__omp_rtl_assume_threads_oversubscription = weak_odr hidden addrspace(1) constant i32 0
27 // CHECK: @__omp_rtl_assume_no_thread_state = weak_odr hidden addrspace(1) constant i32 0
28 // CHECK: @__omp_rtl_assume_no_nested_parallelism = weak_odr hidden addrspace(1) constant i32 0
29 // CHECK: @A = addrspace(1) global %struct.S zeroinitializer, align 4
30 // CHECK: @llvm.global_ctors = appending global [1 x { i32, ptr, ptr }] [{ i32, ptr, ptr } { i32 65535, ptr @_GLOBAL__sub_I_amdgcn_target_global_constructor.cpp, ptr null }]
31 // CHECK: @llvm.global_dtors = appending global [1 x { i32, ptr, ptr }] [{ i32, ptr, ptr } { i32 65535, ptr @__dtor_A, ptr null }]
32 // CHECK: @__oclc_ABI_version = weak_odr hidden local_unnamed_addr addrspace(4) constant i32 500
33 //.
34 // CHECK-LABEL: define {{[^@]+}}@__cxx_global_var_init
35 // CHECK-SAME: () #[[ATTR0:[0-9]+]] {
36 // CHECK-NEXT:  entry:
37 // CHECK-NEXT:    call void @_ZN1SC1Ev(ptr noundef nonnull align 4 dereferenceable(4) addrspacecast (ptr addrspace(1) @A to ptr)) #[[ATTR3:[0-9]+]]
38 // CHECK-NEXT:    ret void
39 //
40 //
41 // CHECK-LABEL: define {{[^@]+}}@_ZN1SC1Ev
42 // CHECK-SAME: (ptr noundef nonnull align 4 dereferenceable(4) [[THIS:%.*]]) unnamed_addr #[[ATTR1:[0-9]+]] comdat align 2 {
43 // CHECK-NEXT:  entry:
44 // CHECK-NEXT:    [[THIS_ADDR:%.*]] = alloca ptr, align 8, addrspace(5)
45 // CHECK-NEXT:    [[THIS_ADDR_ASCAST:%.*]] = addrspacecast ptr addrspace(5) [[THIS_ADDR]] to ptr
46 // CHECK-NEXT:    store ptr [[THIS]], ptr [[THIS_ADDR_ASCAST]], align 8
47 // CHECK-NEXT:    [[THIS1:%.*]] = load ptr, ptr [[THIS_ADDR_ASCAST]], align 8
48 // CHECK-NEXT:    call void @_ZN1SC2Ev(ptr noundef nonnull align 4 dereferenceable(4) [[THIS1]]) #[[ATTR3]]
49 // CHECK-NEXT:    ret void
50 //
51 //
52 // CHECK-LABEL: define {{[^@]+}}@_ZN1SD1Ev
53 // CHECK-SAME: (ptr noundef nonnull align 4 dereferenceable(4) [[THIS:%.*]]) unnamed_addr #[[ATTR1]] comdat align 2 {
54 // CHECK-NEXT:  entry:
55 // CHECK-NEXT:    [[THIS_ADDR:%.*]] = alloca ptr, align 8, addrspace(5)
56 // CHECK-NEXT:    [[THIS_ADDR_ASCAST:%.*]] = addrspacecast ptr addrspace(5) [[THIS_ADDR]] to ptr
57 // CHECK-NEXT:    store ptr [[THIS]], ptr [[THIS_ADDR_ASCAST]], align 8
58 // CHECK-NEXT:    [[THIS1:%.*]] = load ptr, ptr [[THIS_ADDR_ASCAST]], align 8
59 // CHECK-NEXT:    call void @_ZN1SD2Ev(ptr noundef nonnull align 4 dereferenceable(4) [[THIS1]]) #[[ATTR4:[0-9]+]]
60 // CHECK-NEXT:    ret void
61 //
62 //
63 // CHECK-LABEL: define {{[^@]+}}@__dtor_A
64 // CHECK-SAME: () #[[ATTR0]] {
65 // CHECK-NEXT:  entry:
66 // CHECK-NEXT:    call void @_ZN1SD1Ev(ptr addrspacecast (ptr addrspace(1) @A to ptr))
67 // CHECK-NEXT:    ret void
68 //
69 //
70 // CHECK-LABEL: define {{[^@]+}}@_ZN1SC2Ev
71 // CHECK-SAME: (ptr noundef nonnull align 4 dereferenceable(4) [[THIS:%.*]]) unnamed_addr #[[ATTR1]] comdat align 2 {
72 // CHECK-NEXT:  entry:
73 // CHECK-NEXT:    [[THIS_ADDR:%.*]] = alloca ptr, align 8, addrspace(5)
74 // CHECK-NEXT:    [[THIS_ADDR_ASCAST:%.*]] = addrspacecast ptr addrspace(5) [[THIS_ADDR]] to ptr
75 // CHECK-NEXT:    store ptr [[THIS]], ptr [[THIS_ADDR_ASCAST]], align 8
76 // CHECK-NEXT:    [[THIS1:%.*]] = load ptr, ptr [[THIS_ADDR_ASCAST]], align 8
77 // CHECK-NEXT:    [[A:%.*]] = getelementptr inbounds nuw [[STRUCT_S:%.*]], ptr [[THIS1]], i32 0, i32 0
78 // CHECK-NEXT:    store i32 1, ptr [[A]], align 4
79 // CHECK-NEXT:    ret void
80 //
81 //
82 // CHECK-LABEL: define {{[^@]+}}@_ZN1SD2Ev
83 // CHECK-SAME: (ptr noundef nonnull align 4 dereferenceable(4) [[THIS:%.*]]) unnamed_addr #[[ATTR1]] comdat align 2 {
84 // CHECK-NEXT:  entry:
85 // CHECK-NEXT:    [[THIS_ADDR:%.*]] = alloca ptr, align 8, addrspace(5)
86 // CHECK-NEXT:    [[THIS_ADDR_ASCAST:%.*]] = addrspacecast ptr addrspace(5) [[THIS_ADDR]] to ptr
87 // CHECK-NEXT:    store ptr [[THIS]], ptr [[THIS_ADDR_ASCAST]], align 8
88 // CHECK-NEXT:    [[THIS1:%.*]] = load ptr, ptr [[THIS_ADDR_ASCAST]], align 8
89 // CHECK-NEXT:    call void @_Z3foov() #[[ATTR3]]
90 // CHECK-NEXT:    ret void
91 //
92 //
93 // CHECK-LABEL: define {{[^@]+}}@_GLOBAL__sub_I_amdgcn_target_global_constructor.cpp
94 // CHECK-SAME: () #[[ATTR0]] {
95 // CHECK-NEXT:  entry:
96 // CHECK-NEXT:    call void @__cxx_global_var_init()
97 // CHECK-NEXT:    ret void
98 //
99 //.
100 // CHECK: attributes #[[ATTR0]] = { convergent noinline nounwind "no-trapping-math"="true" "stack-protector-buffer-size"="8" }
101 // CHECK: attributes #[[ATTR1]] = { convergent mustprogress noinline nounwind optnone "no-trapping-math"="true" "stack-protector-buffer-size"="8" }
102 // CHECK: attributes #[[ATTR2:[0-9]+]] = { convergent "no-trapping-math"="true" "stack-protector-buffer-size"="8" }
103 // CHECK: attributes #[[ATTR3]] = { convergent }
104 // CHECK: attributes #[[ATTR4]] = { convergent nounwind }
105 //.
106 // CHECK: [[META0:![0-9]+]] = !{i32 1, !"A", i32 0, i32 0}
107 // CHECK: [[META1:![0-9]+]] = !{i32 1, !"amdhsa_code_object_version", i32 500}
108 // CHECK: [[META2:![0-9]+]] = !{i32 1, !"wchar_size", i32 4}
109 // CHECK: [[META3:![0-9]+]] = !{i32 7, !"openmp", i32 51}
110 // CHECK: [[META4:![0-9]+]] = !{i32 7, !"openmp-device", i32 51}
111 // CHECK: [[META5:![0-9]+]] = !{!"{{.*}}clang version {{.*}}"}
112 //.
113