1 // RUN: %clang_cc1 -verify -fopenmp -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck %s --check-prefix CHECK --check-prefix OMP45
2 // RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -std=c++11 -triple x86_64-unknown-unknown -emit-pch -o %t %s
3 // RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple x86_64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix CHECK --check-prefix OMP45
4 // RUN: %clang_cc1 -verify -fopenmp -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck %s --check-prefix CHECK --check-prefix OMP50
5 // RUN: %clang_cc1 -fopenmp -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -std=c++11 -triple x86_64-unknown-unknown -emit-pch -o %t %s
6 // RUN: %clang_cc1 -fopenmp -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple x86_64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix CHECK --check-prefix OMP50
7 
8 // RUN: %clang_cc1 -verify -fopenmp-simd -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck %s --check-prefix SIMD-ONLY
9 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -std=c++11 -triple x86_64-unknown-unknown -emit-pch -o %t %s
10 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple x86_64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix SIMD-ONLY
11 // RUN: %clang_cc1 -verify -fopenmp-simd -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck %s --check-prefix SIMD-ONLY
12 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -std=c++11 -triple x86_64-unknown-unknown -emit-pch -o %t %s
13 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple x86_64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix SIMD-ONLY
14 // SIMD-ONLY-NOT: {{__kmpc|__tgt}}
15 
16 // RUN: %clang_cc1 -verify -fopenmp -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple aarch64-unknown-unknown -emit-llvm %s -o - | FileCheck %s --check-prefix CHECK --check-prefix OMP45
17 // RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -std=c++11 -triple aarch64-unknown-unknown -emit-pch -o %t %s
18 // RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple aarch64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix CHECK --check-prefix OMP45
19 // RUN: %clang_cc1 -verify -fopenmp -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple aarch64-unknown-unknown -emit-llvm %s -o - | FileCheck %s --check-prefix CHECK --check-prefix OMP50
20 // RUN: %clang_cc1 -fopenmp -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -std=c++11 -triple aarch64-unknown-unknown -emit-pch -o %t %s
21 // RUN: %clang_cc1 -fopenmp -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple aarch64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix CHECK --check-prefix OMP50
22 
23 // RUN: %clang_cc1 -verify -fopenmp-simd -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple aarch64-unknown-unknown -emit-llvm %s -o - | FileCheck %s --check-prefix SIMD-ONLY
24 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -std=c++11 -triple aarch64-unknown-unknown -emit-pch -o %t %s
25 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple aarch64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix SIMD-ONLY
26 // RUN: %clang_cc1 -verify -fopenmp-simd -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple aarch64-unknown-unknown -emit-llvm %s -o - | FileCheck %s --check-prefix SIMD-ONLY
27 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -std=c++11 -triple aarch64-unknown-unknown -emit-pch -o %t %s
28 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=50 -DOMP5 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple aarch64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix SIMD-ONLY
29 // SIMD-ONLY-NOT: {{__kmpc|__tgt}}
30 
31 // expected-no-diagnostics
32 #ifndef HEADER
33 #define HEADER
34 
35 void fn1();
36 void fn2();
37 void fn3();
38 void fn4();
39 void fn5();
40 void fn6();
41 
42 int Arg;
43 
44 // CHECK-LABEL: define {{.*}}void @{{.+}}gtid_test
// Host function containing two `target teams distribute parallel for simd`
// regions over 100 iterations each. The FileCheck directives at the top of
// the body expect, per region, a trip-count push with the constant 100, a
// target-teams launch, and a call to the host fallback offloading function.
gtid_test()45 void gtid_test() {
46 // CHECK: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @{{.+}}, i64 -1, i64 100)
47 // CHECK: call i{{[0-9]+}} @__tgt_target_teams_mapper(%struct.ident_t* @{{.+}},
48 // CHECK: call void [[OFFLOADING_FUN_0:@.+]](
49 // CHECK: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @{{.+}}, i64 -1, i64 100)
50 // CHECK: call i{{[0-9]+}} @__tgt_target_teams_mapper(%struct.ident_t* @{{.+}},
51 // CHECK: call void [[OFFLOADING_FUN_1:@.+]](
// Region 1: when OMP5 is defined the directive carries `if(simd: true)` and
// `nontemporal(Arg)`; otherwise it has no clauses. The directives after the
// loop expect a forked parallel region, and !nontemporal metadata on the
// accesses only in the 5.0 runs.
52 #ifdef OMP5
53 #pragma omp target teams distribute parallel for simd if(simd: true) nontemporal(Arg)
54 #else
55 #pragma omp target teams distribute parallel for simd
56 #endif // OMP5
57   for (int i = 0; i < 100; i++) {
58     Arg = 0;
59   }
60   // CHECK: define internal void [[OFFLOADING_FUN_0]](
61   // CHECK: call {{.*}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 1, {{.+}}* [[OMP_TEAMS_OUTLINED_0:@.+]] to {{.+}})
62   // CHECK: define{{.+}} void [[OMP_TEAMS_OUTLINED_0]](
63   // CHECK: call void @__kmpc_for_static_init_4(
64   // OMP50: load i32,{{.*}}!nontemporal
65   // CHECK: call void {{.+}} @__kmpc_fork_call(%{{.+}}* @{{.+}}, i{{.+}} 3, {{.+}}* [[OMP_OUTLINED_0:@.+]] to void
66   // CHECK: call void @__kmpc_for_static_fini(
67 
68   // CHECK: define{{.+}} void [[OMP_OUTLINED_0]](
69   // CHECK: call void @__kmpc_for_static_init_4(
70   // OMP45-NOT: !nontemporal
71   // OMP50: store i32 0,{{.*}}!nontemporal
72   // CHECK: call void @__kmpc_for_static_fini(
73   // CHECK: ret
// Region 2: `if (parallel: false)`. The directives inside the loop body
// expect the parallel region to be bracketed by the serialized-parallel
// runtime calls rather than forked. The loop body calls gtid_test() itself.
74 #pragma omp target teams distribute parallel for simd if (parallel: false)
75   for(int i = 0 ; i < 100; i++) {
76   // CHECK: define internal void [[OFFLOADING_FUN_1]](
77   // CHECK: call {{.*}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 0, {{.+}}* [[OMP_TEAMS_OUTLINED_1:@.+]] to {{.+}})
78   // CHECK: define{{.+}} void [[OMP_TEAMS_OUTLINED_1]](
79   // CHECK: call void @__kmpc_for_static_init_4(
80   // CHECK: call void @__kmpc_serialized_parallel(
81   // CHECK: call void [[OMP_OUTLINED_1:@.+]](
82   // CHECK: call void @__kmpc_end_serialized_parallel(
83   // CHECK: call void @__kmpc_for_static_fini(
84   // CHECK: define{{.+}} void [[OMP_OUTLINED_1]](
85   // CHECK: call void @__kmpc_for_static_init_4(
86   // CHECK: call void @{{.+}}gtid_test
87   // CHECK: call void @__kmpc_for_static_fini(
88   // CHECK: ret
89     gtid_test();
90   }
91 }
92 
93 
// Template variant of the test: three `target teams distribute parallel for
// simd` loops of 100 iterations, using an unqualified `if (true)`, an
// unqualified `if (false)`, and `if (parallel: Arg)` where Arg is the
// function parameter. The loop bodies call fn1, fn2 and fn3 respectively so
// the outlined functions can be told apart in the IR. The FileCheck
// directives for this function are placed after main().
94 template <typename T>
tmain(T Arg)95 int tmain(T Arg) {
96 #pragma omp target teams distribute parallel for simd if (true)
97   for(int i = 0 ; i < 100; i++) {
98     fn1();
99   }
100 #pragma omp target teams distribute parallel for simd if (false)
101   for(int i = 0 ; i < 100; i++) {
102     fn2();
103   }
// The condition is a runtime value here, so the directives after main()
// look for both the fork call and the serialized-parallel calls.
104 #pragma omp target teams distribute parallel for simd if (parallel: Arg)
105   for(int i = 0 ; i < 100; i++) {
106     fn3();
107   }
108   return 0;
109 }
110 
111 // CHECK-LABEL: define {{.*}}i{{[0-9]+}} @main()
// Entry point of the test: three `target teams distribute parallel for simd`
// regions with unqualified `if (true)`, `if (false)` and `if (Arg)` (Arg is
// the global int), followed by a call to tmain(Arg). The directives at the
// top of the body check the host-side launch sequence in main; the directives
// inside each loop body check that region's outlined functions.
main()112 int main() {
113 // CHECK: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @{{.+}}, i64 -1, i64 100)
114 // CHECK: call i{{[0-9]+}} @__tgt_target_teams_mapper(%struct.ident_t* @{{.+}},
115 // CHECK: call void [[OFFLOADING_FUN_0:@.+]](
116 // CHECK-NOT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @{{.+}}, i64 -1, i64 100)
117 // CHECK: call void [[OFFLOADING_FUN_1:@.+]](
118 // CHECK: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @{{.+}}, i64 -1, i64 100)
119 // CHECK: call i{{[0-9]+}} @__tgt_target_teams_mapper(%struct.ident_t* @{{.+}},
120 // CHECK: call void [[OFFLOADING_FUN_2:@.+]](
121 // CHECK: = call {{.*}}i{{.+}} @{{.+}}tmain
// `if (true)`: a forked parallel region is expected; the body calls fn4.
122 #pragma omp target teams distribute parallel for simd if (true)
123   for(int i = 0 ; i < 100; i++) {
124     // CHECK: define internal void [[OFFLOADING_FUN_0]](
125     // CHECK: call {{.*}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 0, {{.+}}* [[OMP_TEAMS_OUTLINED_0:@.+]] to {{.+}})
126     // CHECK: define{{.+}} void [[OMP_TEAMS_OUTLINED_0]](
127 
128     // CHECK: call void @__kmpc_for_static_init_4(
129     // CHECK: call void {{.+}} @__kmpc_fork_call(%{{.+}}* @{{.+}}, i{{.+}} 2, {{.+}}* [[OMP_OUTLINED_2:@.+]] to void
130     // CHECK: call void @__kmpc_for_static_fini(
131     // CHECK: define{{.+}} void [[OMP_OUTLINED_2]](
132     // CHECK: call void @__kmpc_for_static_init_4(
133     // CHECK: call {{.*}}void @{{.+}}fn4
134     // CHECK: call void @__kmpc_for_static_fini(
135 
136     fn4();
137   }
138 
// `if (false)`: the host-side directives above expect no trip-count push
// before this region's offloading call, and the directives below expect the
// parallel region to go through the serialized-parallel runtime calls. The
// body calls fn5.
139 #pragma omp target teams distribute parallel for simd if (false)
140   for(int i = 0 ; i < 100; i++) {
141     // CHECK: define internal void [[OFFLOADING_FUN_1]](
142     // CHECK: call {{.*}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 0, {{.+}}* [[OMP_TEAMS_OUTLINED_1:@.+]] to {{.+}})
143     // CHECK: define{{.+}} void [[OMP_TEAMS_OUTLINED_1]](
144 
145     // CHECK: call void @__kmpc_for_static_init_4(
146     // CHECK: call void @__kmpc_serialized_parallel(
147     // CHECK: call void [[OMP_OUTLINED_3:@.+]](
148     // CHECK: call void @__kmpc_end_serialized_parallel(
149     // CHECK: call void @__kmpc_for_static_fini(
150 
151     // CHECK: define{{.+}} void [[OMP_OUTLINED_3]](
152     // CHECK: call void @__kmpc_for_static_init_4(
153     // CHECK: call {{.*}}void @{{.+}}fn5
154     // CHECK: call void @__kmpc_for_static_fini(
155     fn5();
156   }
157 
// `if (Arg)`: the condition is a runtime value, so the directives below look
// for both the fork call and the serialized-parallel calls. The expected
// fork-call argument count differs between the 4.5 runs (2) and the 5.0
// runs (3). The body calls fn6.
158 #pragma omp target teams distribute parallel for simd if (Arg)
159   for(int i = 0 ; i < 100; i++) {
160     // CHECK: define internal void [[OFFLOADING_FUN_2]](
161     // CHECK: call {{.*}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 1, {{.+}}* [[OMP_TEAMS_OUTLINED_2:@.+]] to {{.+}})
162     // CHECK: define{{.+}} void [[OMP_TEAMS_OUTLINED_2]](
163 
164     // CHECK: call void @__kmpc_for_static_init_4(
165     // OMP45: call void {{.+}} @__kmpc_fork_call(%{{.+}}* @{{.+}}, i{{.+}} 2, {{.+}}* [[OMP_OUTLINED_4:@.+]] to void
166     // OMP50: call void {{.+}} @__kmpc_fork_call(%{{.+}}* @{{.+}}, i{{.+}} 3, {{.+}}* [[OMP_OUTLINED_4:@.+]] to void
167     // CHECK: call void @__kmpc_serialized_parallel(
168     // CHECK: call void [[OMP_OUTLINED_4:@.+]](
169     // CHECK: call void @__kmpc_end_serialized_parallel(
170     // CHECK: call void @__kmpc_for_static_fini(
171 
172     // CHECK: define{{.+}} void [[OMP_OUTLINED_4]](
173     // CHECK: call void @__kmpc_for_static_init_4(
174     // CHECK: call {{.*}}void @{{.+}}fn6
175     // CHECK: call void @__kmpc_for_static_fini(
176     fn6();
177   }
178 
179   return tmain(Arg);
180 }
181 
182 // CHECK-LABEL: define {{.+}} @{{.+}}tmain
183 
184 // CHECK: call void @__kmpc_for_static_init_4(
185 // CHECK: call {{.*}}void {{.+}} @__kmpc_fork_call(%{{.+}}* @{{.+}}, i{{.+}} 2, void {{.+}}* [[T_OUTLINE_FUN_1:@.+]] to void
186 // CHECK: call void @__kmpc_for_static_fini(
187 
188 // CHECK: define internal {{.*}}void [[T_OUTLINE_FUN_1]]
189 // CHECK: call void @__kmpc_for_static_init_4(
190 // CHECK: call {{.*}}void @{{.+}}fn1
191 // CHECK: call void @__kmpc_for_static_fini(
192 // CHECK: ret void
193 
194 // CHECK: call void @__kmpc_for_static_init_4(
195 // CHECK: call {{.*}}void @__kmpc_serialized_parallel(
196 // CHECK: call void [[T_OUTLINE_FUN_2:@.+]](
197 // CHECK: call {{.*}}void @__kmpc_end_serialized_parallel(
198 // CHECK: call void @__kmpc_for_static_fini(
199 
200 // CHECK: define internal {{.*}}void [[T_OUTLINE_FUN_2]]
201 // CHECK: call void @__kmpc_for_static_init_4(
202 // CHECK: call {{.*}}void @{{.+}}fn2
203 // CHECK: call void @__kmpc_for_static_fini(
204 // CHECK: ret void
205 
206 // CHECK: call void @__kmpc_for_static_init_4(
207 // CHECK: call {{.*}}void {{.+}} @__kmpc_fork_call(%{{.+}}* @{{.+}}, i{{.+}} 2, void {{.+}}* [[T_OUTLINE_FUN_3:@.+]] to void
208 // CHECK: call {{.*}}void @__kmpc_serialized_parallel(
209 // CHECK: call void [[T_OUTLINE_FUN_3]](
210 // CHECK: call {{.*}}void @__kmpc_end_serialized_parallel(
211 
212 // CHECK: define internal {{.*}}void [[T_OUTLINE_FUN_3]]
213 // CHECK: call void @__kmpc_for_static_init_4(
214 // CHECK: call {{.*}}void @{{.+}}fn3
215 // CHECK: call void @__kmpc_for_static_fini(
216 // CHECK: ret void
217 #endif
218 
219 // OMP45-NOT: !{!"llvm.loop.vectorize.enable", i1 false}
220 // CHECK-DAG: !{!"llvm.loop.vectorize.enable", i1 true}
221 // OMP45-NOT: !{!"llvm.loop.vectorize.enable", i1 false}
222 // OMP50-DAG: !{!"llvm.loop.vectorize.enable", i1 false}
223