// RUN: %clang_cc1 -verify -fopenmp -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple powerpc64le-ibm-linux-gnu -emit-llvm %s -fexceptions -fcxx-exceptions -o - | FileCheck %s
// RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -std=c++11 -triple powerpc64le-ibm-linux-gnu -fexceptions -fcxx-exceptions -emit-pch -o %t %s
// RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple powerpc64le-ibm-linux-gnu -fexceptions -fcxx-exceptions -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s

// RUN: %clang_cc1 -verify -fopenmp-simd -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple powerpc64le-ibm-linux-gnu -emit-llvm %s -fexceptions -fcxx-exceptions -o - | FileCheck --check-prefix SIMD-ONLY0 %s
// RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -std=c++11 -triple powerpc64le-ibm-linux-gnu -fexceptions -fcxx-exceptions -emit-pch -o %t %s
// RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple powerpc64le-ibm-linux-gnu -fexceptions -fcxx-exceptions -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck --check-prefix SIMD-ONLY0 %s
// SIMD-ONLY0-NOT: {{__kmpc|__tgt}}

// RUN: %clang_cc1 -verify -fopenmp -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple powerpc64le-ibm-linux-gnu -emit-llvm %s -fexceptions -fcxx-exceptions -o - | FileCheck %s
// RUN: %clang_cc1 -fopenmp -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -std=c++11 -triple powerpc64le-ibm-linux-gnu -fexceptions -fcxx-exceptions -emit-pch -o %t %s
// RUN: %clang_cc1 -fopenmp -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple powerpc64le-ibm-linux-gnu -fexceptions -fcxx-exceptions -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s

// RUN: %clang_cc1 -verify -fopenmp-simd -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple powerpc64le-ibm-linux-gnu -emit-llvm %s -fexceptions -fcxx-exceptions -o - | FileCheck --check-prefix SIMD-ONLY0 %s
// RUN: %clang_cc1 -fopenmp-simd -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -std=c++11 -triple powerpc64le-ibm-linux-gnu -fexceptions -fcxx-exceptions -emit-pch -o %t %s
// RUN: %clang_cc1 -fopenmp-simd -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple powerpc64le-ibm-linux-gnu -fexceptions -fcxx-exceptions -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck --check-prefix SIMD-ONLY0 %s
// SIMD-ONLY0-NOT: {{__kmpc|__tgt}}

// expected-no-diagnostics
20 #ifndef HEADER
21 #define HEADER
22 
// Pointer-sized signed integer, spelled through the compiler-provided
// __INTPTR_TYPE__ macro so that this test needs no system header.
// NOTE(review): kept as a plain typedef because some of the compile commands at
// the top of this file pass no -std flag and the file is verified to be
// diagnostic-free - confirm before switching to an alias-declaration.
typedef __INTPTR_TYPE__ intptr_t;

// CHECK-DAG: [[IDENT_T_TY:%.+]] = type { i32, i32, i32, i32, i8* }
// CHECK-DAG: [[S_TY:%.+]] = type { [[INTPTR_T_TY:i[0-9]+]], [[INTPTR_T_TY]], [[INTPTR_T_TY]] }
// CHECK-DAG: [[STR:@.+]] = private unnamed_addr constant [23 x i8] c";unknown;unknown;0;0;;\00"
// CHECK-DAG: [[DEF_LOC_2:@.+]] = private unnamed_addr constant [[IDENT_T_TY]] { i32 0, i32 2, i32 0, i32 0, i8* getelementptr inbounds ([23 x i8], [23 x i8]* [[STR]], i32 0, i32 0) }

// Declared only; no definition appears in this file. It is the statement
// executed by every offloaded loop iteration in tmain() and main().
void foo();
31 
// Helper class type for the num_threads tests: three pointer-sized integer
// members (matching the three-field struct pattern checked above), of which
// only `a` is ever initialized or read.
struct S {
  intptr_t a, b, c;
  // Converting constructor, intentionally not `explicit`: the file constructs
  // S directly from integer literals (`S s(0)` in main, `T(23)` in tmain with
  // T = S). Only `a` is set; `b` and `c` are left uninitialized.
  S(intptr_t a) : a(a) {}
  // Implicit conversion to char (narrows `a`). Used by `char a = s;` in main
  // and to turn `T(23)` into a num_threads argument when T = S.
  operator char() { return a; }
  // User-provided (empty) destructor, so S is not trivially destructible.
  ~S() {}
};
38 
39 template <typename T, int C>
tmain()40 int tmain() {
41 #pragma omp target
42 #pragma omp teams distribute parallel for num_threads(C)
43   for (int i = 0; i < 100; i++)
44     foo();
45 #pragma omp target
46 #pragma omp teams distribute parallel for num_threads(T(23))
47   for (int i = 0; i < 100; i++)
48     foo();
49   return 0;
50 }
51 
main()52 int main() {
53   S s(0);
54   char a = s;
55 // CHECK: call i{{[0-9]+}} @__tgt_target_teams_mapper(%struct.ident_t* @{{.+}},
56 // CHECK: call void [[OFFLOADING_FUN_0:@.+]](
57 // CHECK: call i{{[0-9]+}} @__tgt_target_teams_mapper(%struct.ident_t* @{{.+}},
58 // CHECK: call void [[OFFLOADING_FUN_1:@.+]](
59 // CHECK: invoke{{.+}} [[TMAIN_5:@.+]]()
60 // CHECK: invoke{{.+}} [[TMAIN_1:@.+]]()
61 #pragma omp target
62   // CHECK: define internal void [[OFFLOADING_FUN_0]](
63   // CHECK: call {{.*}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 0, {{.+}}* [[OMP_TEAMS_OUTLINED_0:@.+]] to {{.+}})
64 #pragma omp teams distribute parallel for num_threads(2)
65   for (int i = 0; i < 100; i++) {
66     // CHECK: define{{.+}} void [[OMP_TEAMS_OUTLINED_0]](
67     // CHECK:       call {{.*}}void @__kmpc_push_num_threads([[IDENT_T_TY]]* [[DEF_LOC_2]], i32 {{.+}}, i32 2)
68     // CHECK:       call {{.*}}void {{.*}} @__kmpc_fork_call(
69     foo();
70   }
71 #pragma omp target
72   // CHECK: define internal void [[OFFLOADING_FUN_1]](
73 
74   // CHECK: call {{.*}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 1, {{.+}}* [[OMP_TEAMS_OUTLINED_1:@.+]] to {{.+}})
75 #pragma omp teams distribute parallel for num_threads(a)
76   for (int i = 0; i < 100; i++) {
77     // CHECK: define{{.+}} void [[OMP_TEAMS_OUTLINED_1]](
78     // CHECK-DAG: [[A_ADDR:%.+]] = alloca i64,
79     // CHECK-DAG: [[A_REF:%.+]] = bitcast i64* [[A_ADDR]] to i8*
80     // CHECK-DAG: [[A_VAL:%.+]] = load i8, i8* [[A_REF]],
81     // CHECK-DAG: [[A_EXT:%.+]] = sext i8 [[A_VAL]] to {{.+}}
82     // CHECK: call {{.*}}void @__kmpc_push_num_threads([[IDENT_T_TY]]* [[DEF_LOC_2]], i32 {{.+}}, i32 [[A_EXT]])
83     // CHECK: call {{.*}}void {{.*}} @__kmpc_fork_call(
84     foo();
85   }
86   return a + tmain<char, 5>() + tmain<S, 1>();
87 }
88 
// tmain 5
// CHECK-DAG: define {{.*}}i{{[0-9]+}} [[TMAIN_5]]()
// CHECK: call i{{[0-9]+}} @__tgt_target_teams_mapper(%struct.ident_t* @{{.+}},
// CHECK: call void [[T_OFFLOADING_FUN_0:@.+]](
// CHECK: call i{{[0-9]+}} @__tgt_target_teams_mapper(%struct.ident_t* @{{.+}},
// CHECK: call void [[T_OFFLOADING_FUN_1:@.+]](

// tmain 1
// CHECK-DAG: define {{.*}}i{{[0-9]+}} [[TMAIN_1]]()
// CHECK: call i{{[0-9]+}} @__tgt_target_teams_mapper(%struct.ident_t* @{{.+}},
// CHECK: call void [[T_OFFLOADING_FUN_2:@.+]](
// CHECK: call i{{[0-9]+}} @__tgt_target_teams_mapper(%struct.ident_t* @{{.+}},
// CHECK: call void [[T_OFFLOADING_FUN_3:@.+]](

// CHECK: define internal void [[T_OFFLOADING_FUN_0]](
// CHECK: call {{.*}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 0, {{.+}}* [[T_OMP_TEAMS_OUTLINED_0:@.+]] to {{.+}})

// CHECK: define{{.+}} void [[T_OMP_TEAMS_OUTLINED_0]](
// CHECK:       call {{.*}}void @__kmpc_push_num_threads([[IDENT_T_TY]]* [[DEF_LOC_2]], i32 {{.+}}, i32 5)
// CHECK:       call {{.*}}void {{.*}} @__kmpc_fork_call(

// CHECK: define internal void [[T_OFFLOADING_FUN_1]](
// CHECK: call {{.*}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 0, {{.+}}* [[T_OMP_TEAMS_OUTLINED_1:@.+]] to {{.+}})

// CHECK: define{{.+}} void [[T_OMP_TEAMS_OUTLINED_1]](
// CHECK:       call {{.*}}void @__kmpc_push_num_threads([[IDENT_T_TY]]* [[DEF_LOC_2]], i32 {{.+}}, i32 23)
// CHECK:       call {{.*}}void {{.*}} @__kmpc_fork_call(

// CHECK: define internal void [[T_OFFLOADING_FUN_2]](
// CHECK: call {{.*}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 0, {{.+}}* [[T_OMP_TEAMS_OUTLINED_2:@.+]] to {{.+}})

// CHECK: define{{.+}} void [[T_OMP_TEAMS_OUTLINED_2]](
// CHECK:       call {{.*}}void @__kmpc_push_num_threads([[IDENT_T_TY]]* [[DEF_LOC_2]], i32 {{.+}}, i32 1)
// CHECK:       call {{.*}}void {{.*}} @__kmpc_fork_call(

// CHECK: define internal void [[T_OFFLOADING_FUN_3]](
// CHECK: call {{.*}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 {{.+}}, {{.+}}* [[T_OMP_TEAMS_OUTLINED_3:@.+]] to {{.+}})

// CHECK: define{{.+}} void [[T_OMP_TEAMS_OUTLINED_3]]({{.+}}, {{.+}}, {{.+}} [[NUM_TH_CPT_IN:%.+]])
// CHECK: [[NUM_TH_CPT:%.+]] = alloca i64,
// CHECK: store {{.+}} [[NUM_TH_CPT_IN]], {{.+}} [[NUM_TH_CPT]],
// CHECK: [[NUM_TH_REF:%.+]] = bitcast i64* [[NUM_TH_CPT]] to i8*
// CHECK-DAG:   [[NUM_TH_VAL:%.+]] = load {{.+}}, {{.+}} [[NUM_TH_REF]],
// CHECK-DAG:   [[NUM_TH_SEXT:%.+]] = sext i8 [[NUM_TH_VAL]] to {{.+}}
// CHECK:       call {{.*}}void @__kmpc_push_num_threads([[IDENT_T_TY]]* [[DEF_LOC_2]], i32 {{.+}}, i32 [[NUM_TH_SEXT]])
// CHECK:       call {{.*}}void {{.*}} @__kmpc_fork_call(
135 #endif
136