1 // RUN: %clang_cc1 -verify -fopenmp -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck %s --check-prefix CHECK --check-prefix OMP45
2 // RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -std=c++11 -triple x86_64-unknown-unknown -emit-pch -o %t %s
3 // RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple x86_64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix CHECK --check-prefix OMP45
4 // RUN: %clang_cc1 -verify -fopenmp -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck %s --check-prefix CHECK --check-prefix OMP50
5 // RUN: %clang_cc1 -fopenmp -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -std=c++11 -triple x86_64-unknown-unknown -emit-pch -o %t %s
6 // RUN: %clang_cc1 -fopenmp -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple x86_64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix CHECK --check-prefix OMP50
7
8 // RUN: %clang_cc1 -verify -fopenmp-simd -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck %s --check-prefix SIMD-ONLY
9 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -std=c++11 -triple x86_64-unknown-unknown -emit-pch -o %t %s
10 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple x86_64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix SIMD-ONLY
11 // RUN: %clang_cc1 -verify -fopenmp-simd -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck %s --check-prefix SIMD-ONLY
12 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -std=c++11 -triple x86_64-unknown-unknown -emit-pch -o %t %s
13 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple x86_64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix SIMD-ONLY
14 // SIMD-ONLY-NOT: {{__kmpc|__tgt}}
15
16 // RUN: %clang_cc1 -verify -fopenmp -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple aarch64-unknown-unknown -emit-llvm %s -o - | FileCheck %s --check-prefix CHECK --check-prefix OMP45
17 // RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -std=c++11 -triple aarch64-unknown-unknown -emit-pch -o %t %s
18 // RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple aarch64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix CHECK --check-prefix OMP45
19 // RUN: %clang_cc1 -verify -fopenmp -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple aarch64-unknown-unknown -emit-llvm %s -o - | FileCheck %s --check-prefix CHECK --check-prefix OMP50
20 // RUN: %clang_cc1 -fopenmp -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -std=c++11 -triple aarch64-unknown-unknown -emit-pch -o %t %s
21 // RUN: %clang_cc1 -fopenmp -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple aarch64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix CHECK --check-prefix OMP50
22
23 // RUN: %clang_cc1 -verify -fopenmp-simd -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple aarch64-unknown-unknown -emit-llvm %s -o - | FileCheck %s --check-prefix SIMD-ONLY
24 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -std=c++11 -triple aarch64-unknown-unknown -emit-pch -o %t %s
25 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple aarch64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix SIMD-ONLY
26 // RUN: %clang_cc1 -verify -fopenmp-simd -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple aarch64-unknown-unknown -emit-llvm %s -o - | FileCheck %s --check-prefix SIMD-ONLY
27 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -std=c++11 -triple aarch64-unknown-unknown -emit-pch -o %t %s
28 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple aarch64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix SIMD-ONLY
29 // SIMD-ONLY-NOT: {{__kmpc|__tgt}}
30
31 // expected-no-diagnostics
32 #ifndef HEADER
33 #define HEADER
34
// Callees used inside the offloaded loop bodies below: fn1-fn3 are called from
// tmain, fn4-fn6 from main. No definitions are visible in this file
// (presumably so the calls stay as named calls in the emitted IR - confirm).
35 void fn1();
36 void fn2();
37 void fn3();
38 void fn4();
39 void fn5();
40 void fn6();
41
// File-scope integer: stored to by the first loop in gtid_test, used as the
// if-clause condition of the last region in main, and passed to tmain.
42 int Arg;
43
44 // CHECK-LABEL: define {{.*}}void @{{.+}}gtid_test
gtid_test()45 void gtid_test() {
46 // CHECK: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @{{.+}}, i64 -1, i64 100)
47 // CHECK: call i{{[0-9]+}} @__tgt_target_teams_mapper(%struct.ident_t* @{{.+}},
48 // CHECK: call void [[OFFLOADING_FUN_0:@.+]](
49 // CHECK: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @{{.+}}, i64 -1, i64 100)
50 // CHECK: call i{{[0-9]+}} @__tgt_target_teams_mapper(%struct.ident_t* @{{.+}},
51 // CHECK: call void [[OFFLOADING_FUN_1:@.+]](
52 #ifdef OMP5
53 #pragma omp target teams distribute parallel for simd if(simd: true) nontemporal(Arg)
54 #else
55 #pragma omp target teams distribute parallel for simd
56 #endif // OMP5
57 for (int i = 0; i < 100; i++) {
58 Arg = 0;
59 }
60 // CHECK: define internal void [[OFFLOADING_FUN_0]](
61 // CHECK: call {{.*}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 1, {{.+}}* [[OMP_TEAMS_OUTLINED_0:@.+]] to {{.+}})
62 // CHECK: define{{.+}} void [[OMP_TEAMS_OUTLINED_0]](
63 // CHECK: call void @__kmpc_for_static_init_4(
64 // OMP50: load i32,{{.*}}!nontemporal
65 // CHECK: call void {{.+}} @__kmpc_fork_call(%{{.+}}* @{{.+}}, i{{.+}} 3, {{.+}}* [[OMP_OUTLINED_0:@.+]] to void
66 // CHECK: call void @__kmpc_for_static_fini(
67
68 // CHECK: define{{.+}} void [[OMP_OUTLINED_0]](
69 // CHECK: call void @__kmpc_for_static_init_4(
70 // OMP45-NOT: !nontemporal
71 // OMP50: store i32 0,{{.*}}!nontemporal
72 // CHECK: call void @__kmpc_for_static_fini(
73 // CHECK: ret
74 #pragma omp target teams distribute parallel for simd if (parallel: false)
75 for(int i = 0 ; i < 100; i++) {
76 // CHECK: define internal void [[OFFLOADING_FUN_1]](
77 // CHECK: call {{.*}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 0, {{.+}}* [[OMP_TEAMS_OUTLINED_1:@.+]] to {{.+}})
78 // CHECK: define{{.+}} void [[OMP_TEAMS_OUTLINED_1]](
79 // CHECK: call void @__kmpc_for_static_init_4(
80 // CHECK: call void @__kmpc_serialized_parallel(
81 // CHECK: call void [[OMP_OUTLINED_1:@.+]](
82 // CHECK: call void @__kmpc_end_serialized_parallel(
83 // CHECK: call void @__kmpc_for_static_fini(
84 // CHECK: define{{.+}} void [[OMP_OUTLINED_1]](
85 // CHECK: call void @__kmpc_for_static_init_4(
86 // CHECK: call void @{{.+}}gtid_test
87 // CHECK: call void @__kmpc_for_static_fini(
88 // CHECK: ret
89 gtid_test();
90 }
91 }
92
93
// tmain: function template with three offloaded
// `target teams distribute parallel for simd` loops of 100 iterations, one per
// if-clause form: constant true, constant false, and a `parallel`-modified
// condition taken from the parameter Arg. Each loop body calls a distinct
// callee (fn1, fn2, fn3). Always returns 0. The FileCheck directives for the
// instantiation are located after main() in this file.
94 template <typename T>
95 int tmain(T Arg) {
// if (true): no directive-name modifier on the clause.
96 #pragma omp target teams distribute parallel for simd if (true)
97 for(int i = 0 ; i < 100; i++) {
98 fn1();
99 }
// if (false): no directive-name modifier on the clause.
100 #pragma omp target teams distribute parallel for simd if (false)
101 for(int i = 0 ; i < 100; i++) {
102 fn2();
103 }
// if (parallel: Arg): the condition is the function parameter, so it is not a
// literal constant in the source.
104 #pragma omp target teams distribute parallel for simd if (parallel: Arg)
105 for(int i = 0 ; i < 100; i++) {
106 fn3();
107 }
108 return 0;
109 }
110
111 // CHECK-LABEL: define {{.*}}i{{[0-9]+}} @main()
main()112 int main() {
113 // CHECK: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @{{.+}}, i64 -1, i64 100)
114 // CHECK: call i{{[0-9]+}} @__tgt_target_teams_mapper(%struct.ident_t* @{{.+}},
115 // CHECK: call void [[OFFLOADING_FUN_0:@.+]](
116 // CHECK-NOT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @{{.+}}, i64 -1, i64 100)
117 // CHECK: call void [[OFFLOADING_FUN_1:@.+]](
118 // CHECK: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @{{.+}}, i64 -1, i64 100)
119 // CHECK: call i{{[0-9]+}} @__tgt_target_teams_mapper(%struct.ident_t* @{{.+}},
120 // CHECK: call void [[OFFLOADING_FUN_2:@.+]](
121 // CHECK: = call {{.*}}i{{.+}} @{{.+}}tmain
122 #pragma omp target teams distribute parallel for simd if (true)
123 for(int i = 0 ; i < 100; i++) {
124 // CHECK: define internal void [[OFFLOADING_FUN_0]](
125 // CHECK: call {{.*}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 0, {{.+}}* [[OMP_TEAMS_OUTLINED_0:@.+]] to {{.+}})
126 // CHECK: define{{.+}} void [[OMP_TEAMS_OUTLINED_0]](
127
128 // CHECK: call void @__kmpc_for_static_init_4(
129 // CHECK: call void {{.+}} @__kmpc_fork_call(%{{.+}}* @{{.+}}, i{{.+}} 2, {{.+}}* [[OMP_OUTLINED_2:@.+]] to void
130 // CHECK: call void @__kmpc_for_static_fini(
131 // CHECK: define{{.+}} void [[OMP_OUTLINED_2]](
132 // CHECK: call void @__kmpc_for_static_init_4(
133 // CHECK: call {{.*}}void @{{.+}}fn4
134 // CHECK: call void @__kmpc_for_static_fini(
135
136 fn4();
137 }
138
139 #pragma omp target teams distribute parallel for simd if (false)
140 for(int i = 0 ; i < 100; i++) {
141 // CHECK: define internal void [[OFFLOADING_FUN_1]](
142 // CHECK: call {{.*}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 0, {{.+}}* [[OMP_TEAMS_OUTLINED_1:@.+]] to {{.+}})
143 // CHECK: define{{.+}} void [[OMP_TEAMS_OUTLINED_1]](
144
145 // CHECK: call void @__kmpc_for_static_init_4(
146 // CHECK: call void @__kmpc_serialized_parallel(
147 // CHECK: call void [[OMP_OUTLINED_3:@.+]](
148 // CHECK: call void @__kmpc_end_serialized_parallel(
149 // CHECK: call void @__kmpc_for_static_fini(
150
151 // CHECK: define{{.+}} void [[OMP_OUTLINED_3]](
152 // CHECK: call void @__kmpc_for_static_init_4(
153 // CHECK: call {{.*}}void @{{.+}}fn5
154 // CHECK: call void @__kmpc_for_static_fini(
155 fn5();
156 }
157
158 #pragma omp target teams distribute parallel for simd if (Arg)
159 for(int i = 0 ; i < 100; i++) {
160 // CHECK: define internal void [[OFFLOADING_FUN_2]](
161 // CHECK: call {{.*}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 1, {{.+}}* [[OMP_TEAMS_OUTLINED_2:@.+]] to {{.+}})
162 // CHECK: define{{.+}} void [[OMP_TEAMS_OUTLINED_2]](
163
164 // CHECK: call void @__kmpc_for_static_init_4(
165 // OMP45: call void {{.+}} @__kmpc_fork_call(%{{.+}}* @{{.+}}, i{{.+}} 2, {{.+}}* [[OMP_OUTLINED_4:@.+]] to void
166 // OMP50: call void {{.+}} @__kmpc_fork_call(%{{.+}}* @{{.+}}, i{{.+}} 3, {{.+}}* [[OMP_OUTLINED_4:@.+]] to void
167 // CHECK: call void @__kmpc_serialized_parallel(
168 // CHECK: call void [[OMP_OUTLINED_4:@.+]](
169 // CHECK: call void @__kmpc_end_serialized_parallel(
170 // CHECK: call void @__kmpc_for_static_fini(
171
172 // CHECK: define{{.+}} void [[OMP_OUTLINED_4]](
173 // CHECK: call void @__kmpc_for_static_init_4(
174 // CHECK: call {{.*}}void @{{.+}}fn6
175 // CHECK: call void @__kmpc_for_static_fini(
176 fn6();
177 }
178
179 return tmain(Arg);
180 }
181
182 // CHECK-LABEL: define {{.+}} @{{.+}}tmain
183
184 // CHECK: call void @__kmpc_for_static_init_4(
185 // CHECK: call {{.*}}void {{.+}} @__kmpc_fork_call(%{{.+}}* @{{.+}}, i{{.+}} 2, void {{.+}}* [[T_OUTLINE_FUN_1:@.+]] to void
186 // CHECK: call void @__kmpc_for_static_fini(
187
188 // CHECK: define internal {{.*}}void [[T_OUTLINE_FUN_1]]
189 // CHECK: call void @__kmpc_for_static_init_4(
190 // CHECK: call {{.*}}void @{{.+}}fn1
191 // CHECK: call void @__kmpc_for_static_fini(
192 // CHECK: ret void
193
194 // CHECK: call void @__kmpc_for_static_init_4(
195 // CHECK: call {{.*}}void @__kmpc_serialized_parallel(
196 // CHECK: call void [[T_OUTLINE_FUN_2:@.+]](
197 // CHECK: call {{.*}}void @__kmpc_end_serialized_parallel(
198 // CHECK: call void @__kmpc_for_static_fini(
199
200 // CHECK: define internal {{.*}}void [[T_OUTLINE_FUN_2]]
201 // CHECK: call void @__kmpc_for_static_init_4(
202 // CHECK: call {{.*}}void @{{.+}}fn2
203 // CHECK: call void @__kmpc_for_static_fini(
204 // CHECK: ret void
205
206 // CHECK: call void @__kmpc_for_static_init_4(
207 // CHECK: call {{.*}}void {{.+}} @__kmpc_fork_call(%{{.+}}* @{{.+}}, i{{.+}} 2, void {{.+}}* [[T_OUTLINE_FUN_3:@.+]] to void
208 // CHECK: call {{.*}}void @__kmpc_serialized_parallel(
209 // CHECK: call void [[T_OUTLINE_FUN_3]](
210 // CHECK: call {{.*}}void @__kmpc_end_serialized_parallel(
211
212 // CHECK: define internal {{.*}}void [[T_OUTLINE_FUN_3]]
213 // CHECK: call void @__kmpc_for_static_init_4(
214 // CHECK: call {{.*}}void @{{.+}}fn3
215 // CHECK: call void @__kmpc_for_static_fini(
216 // CHECK: ret void
217 #endif
218
219 // OMP45-NOT: !{!"llvm.loop.vectorize.enable", i1 false}
220 // CHECK-DAG: !{!"llvm.loop.vectorize.enable", i1 true}
221 // OMP45-NOT: !{!"llvm.loop.vectorize.enable", i1 false}
222 // OMP50-DAG: !{!"llvm.loop.vectorize.enable", i1 false}
223