/clang/test/OpenMP/taskgroup_task_reduction_codegen.cpp

https://github.com/hfinkel/llvm-project-cxxjit · C++ · 233 lines · 23 code · 18 blank · 192 comment · 0 complexity · 9c73a25405b97aaa5bb680fb862da450 MD5 · raw file

  1. // RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp -x c++ -emit-llvm %s -o - | FileCheck %s
  2. // RUN: %clang_cc1 -fopenmp -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
  3. // RUN: %clang_cc1 -fopenmp -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s
  4. // RUN: %clang_cc1 -fopenmp -x c++ %s -verify -debug-info-kind=limited -emit-llvm -o - -triple x86_64-apple-darwin10 | FileCheck %s --check-prefix=CHECK --check-prefix=DEBUG
  5. // RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp-simd -x c++ -emit-llvm %s -o - | FileCheck --check-prefix SIMD-ONLY0 %s
  6. // RUN: %clang_cc1 -fopenmp-simd -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
  7. // RUN: %clang_cc1 -fopenmp-simd -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - | FileCheck --check-prefix SIMD-ONLY0 %s
  8. // RUN: %clang_cc1 -fopenmp-simd -x c++ %s -verify -debug-info-kind=limited -emit-llvm -o - -triple x86_64-apple-darwin10 | FileCheck --check-prefix SIMD-ONLY0 %s
  9. // SIMD-ONLY0-NOT: {{__kmpc|__tgt}}
  10. // expected-no-diagnostics
  11. #ifndef HEADER
  12. #define HEADER
  13. // CHECK-DAG: @reduction_size.[[ID:.+]]_[[CID:[0-9]+]].artificial.
  14. // CHECK-DAG: @reduction_size.[[ID]]_[[CID]].artificial..cache.
  15. struct S {
  16. int a;
  17. S() : a(0) {}
  18. S(const S&) {}
  19. S& operator=(const S&) {return *this;}
  20. ~S() {}
  21. friend S operator+(const S&a, const S&b) {return a;}
  22. };
  23. int main(int argc, char **argv) {
  24. int a;
  25. float b;
  26. S c[5];
  27. short d[argc];
  28. #pragma omp taskgroup task_reduction(+: a, b, argc)
  29. {
  30. #pragma omp taskgroup task_reduction(-:c, d)
  31. ;
  32. }
  33. return 0;
  34. }
  35. // CHECK-LABEL: @main
  36. // CHECK: alloca i32,
  37. // CHECK: [[ARGC_ADDR:%.+]] = alloca i32,
  38. // CHECK: [[ARGV_ADDR:%.+]] = alloca i8**,
  39. // CHECK: [[A:%.+]] = alloca i32,
  40. // CHECK: [[B:%.+]] = alloca float,
  41. // CHECK: [[C:%.+]] = alloca [5 x %struct.S],
  42. // CHECK: [[RD_IN1:%.+]] = alloca [3 x [[T1:%[^,]+]]],
  43. // CHECK: [[TD1:%.+]] = alloca i8*,
  44. // CHECK: [[RD_IN2:%.+]] = alloca [2 x [[T2:%[^,]+]]],
  45. // CHECK: [[TD2:%.+]] = alloca i8*,
  46. // CHECK: [[GTID:%.+]] = call i32 @__kmpc_global_thread_num(%struct.ident_t*
  47. // CHECK: [[VLA:%.+]] = alloca i16, i64 [[VLA_SIZE:%[^,]+]],
  48. // CHECK: call void @__kmpc_taskgroup(%struct.ident_t* {{[^,]+}}, i32 [[GTID]])
  49. // CHECK-DAG: [[BC_A:%.+]] = bitcast i32* [[A]] to i8*
  50. // CHECK-DAG: store i8* [[BC_A]], i8** [[A_REF:[^,]+]],
  51. // CHECK-DAG: [[A_REF]] = getelementptr inbounds [[T1]], [[T1]]* [[GEPA:%[^,]+]], i32 0, i32 0
  52. // CHECK-DAG: [[GEPA]] = getelementptr inbounds [3 x [[T1]]], [3 x [[T1]]]* [[RD_IN1]], i64 0, i64
  53. // CHECK-DAG: [[TMP6:%.+]] = getelementptr inbounds [[T1]], [[T1]]* [[GEPA]], i32 0, i32 1
  54. // CHECK-DAG: store i64 4, i64* [[TMP6]],
  55. // CHECK-DAG: [[TMP7:%.+]] = getelementptr inbounds [[T1]], [[T1]]* [[GEPA]], i32 0, i32 2
  56. // CHECK-DAG: store i8* bitcast (void (i8*)* @[[AINIT:.+]] to i8*), i8** [[TMP7]],
  57. // CHECK-DAG: [[TMP8:%.+]] = getelementptr inbounds [[T1]], [[T1]]* [[GEPA]], i32 0, i32 3
  58. // CHECK-DAG: store i8* null, i8** [[TMP8]],
  59. // CHECK-DAG: [[TMP9:%.+]] = getelementptr inbounds [[T1]], [[T1]]* [[GEPA]], i32 0, i32 4
  60. // CHECK-DAG: store i8* bitcast (void (i8*, i8*)* @[[ACOMB:.+]] to i8*), i8** [[TMP9]],
  61. // CHECK-DAG: [[TMP10:%.+]] = getelementptr inbounds [[T1]], [[T1]]* [[GEPA]], i32 0, i32 5
  62. // CHECK-DAG: [[TMP11:%.+]] = bitcast i32* [[TMP10]] to i8*
  63. // CHECK-DAG: call void @llvm.memset.p0i8.i64(i8* align 8 [[TMP11]], i8 0, i64 4, i1 false)
  64. // CHECK-DAG: [[TMP13:%.+]] = bitcast float* [[B]] to i8*
  65. // CHECK-DAG: store i8* [[TMP13]], i8** [[TMP12:%[^,]+]],
  66. // CHECK-DAG: [[TMP12]] = getelementptr inbounds [[T1]], [[T1]]* [[GEPB:%[^,]+]], i32 0, i32 0
  67. // CHECK-DAG: [[GEPB]] = getelementptr inbounds [3 x [[T1]]], [3 x [[T1]]]* [[RD_IN1]], i64 0, i64
  68. // CHECK-DAG: [[TMP14:%.+]] = getelementptr inbounds [[T1]], [[T1]]* [[GEPB]], i32 0, i32 1
  69. // CHECK-DAG: store i64 4, i64* [[TMP14]],
  70. // CHECK-DAG: [[TMP15:%.+]] = getelementptr inbounds [[T1]], [[T1]]* [[GEPB]], i32 0, i32 2
  71. // CHECK-DAG: store i8* bitcast (void (i8*)* @[[BINIT:.+]] to i8*), i8** [[TMP15]],
  72. // CHECK-DAG: [[TMP16:%.+]] = getelementptr inbounds [[T1]], [[T1]]* [[GEPB]], i32 0, i32 3
  73. // CHECK-DAG: store i8* null, i8** [[TMP16]],
  74. // CHECK-DAG: [[TMP17:%.+]] = getelementptr inbounds [[T1]], [[T1]]* [[GEPB]], i32 0, i32 4
  75. // CHECK-DAG: store i8* bitcast (void (i8*, i8*)* @[[BCOMB:.+]] to i8*), i8** [[TMP17]],
  76. // CHECK-DAG: [[TMP18:%.+]] = getelementptr inbounds [[T1]], [[T1]]* [[GEPB]], i32 0, i32 5
  77. // CHECK-DAG: [[TMP19:%.+]] = bitcast i32* [[TMP18]] to i8*
  78. // CHECK-DAG: call void @llvm.memset.p0i8.i64(i8* align 8 [[TMP19]], i8 0, i64 4, i1 false)
  79. // CHECK-DAG: [[TMP21:%.+]] = bitcast i32* [[ARGC_ADDR]] to i8*
  80. // CHECK-DAG: store i8* [[TMP21]], i8** [[TMP20:%[^,]+]],
  81. // CHECK-DAG: [[TMP20]] = getelementptr inbounds [[T1]], [[T1]]* [[GEPARGC:%[^,]+]], i32 0, i32 0
  82. // CHECK-DAG: [[GEPARGC]] = getelementptr inbounds [3 x [[T1]]], [3 x [[T1]]]* [[RD_IN1]], i64 0, i64
  83. // CHECK-DAG: [[TMP22:%.+]] = getelementptr inbounds [[T1]], [[T1]]* [[GEPARGC]], i32 0, i32 1
  84. // CHECK-DAG: store i64 4, i64* [[TMP22]],
  85. // CHECK-DAG: [[TMP23:%.+]] = getelementptr inbounds [[T1]], [[T1]]* [[GEPARGC]], i32 0, i32 2
  86. // CHECK-DAG: store i8* bitcast (void (i8*)* @[[ARGCINIT:.+]] to i8*), i8** [[TMP23]],
  87. // CHECK-DAG: [[TMP24:%.+]] = getelementptr inbounds [[T1]], [[T1]]* [[GEPARGC]], i32 0, i32 3
  88. // CHECK-DAG: store i8* null, i8** [[TMP24]],
  89. // CHECK-DAG: [[TMP25:%.+]] = getelementptr inbounds [[T1]], [[T1]]* [[GEPARGC]], i32 0, i32 4
  90. // CHECK-DAG: store i8* bitcast (void (i8*, i8*)* @[[ARGCCOMB:.+]] to i8*), i8** [[TMP25]],
  91. // CHECK-DAG: [[TMP26:%.+]] = getelementptr inbounds [[T1]], [[T1]]* [[GEPARGC]], i32 0, i32 5
  92. // CHECK-DAG: [[TMP27:%.+]] = bitcast i32* [[TMP26]] to i8*
  93. // CHECK-DAG: call void @llvm.memset.p0i8.i64(i8* align 8 [[TMP27]], i8 0, i64 4, i1 false)
  94. // CHECK-DAG: [[TMP28:%.+]] = bitcast [3 x [[T1]]]* [[RD_IN1]] to i8*
  95. // CHECK-DAG: [[TMP29:%.+]] = call i8* @__kmpc_task_reduction_init(i32 [[GTID]], i32 3, i8* [[TMP28]])
  96. // DEBUG-DAG: call void @llvm.dbg.declare(metadata i8** [[TD1]],
  97. // CHECK-DAG: store i8* [[TMP29]], i8** [[TD1]],
  98. // CHECK-DAG: call void @__kmpc_taskgroup(%struct.ident_t* {{[^,]+}}, i32 [[GTID]])
  99. // CHECK-DAG: [[TMP31:%.+]] = bitcast [5 x %struct.S]* [[C]] to i8*
  100. // CHECK-DAG: store i8* [[TMP31]], i8** [[TMP30:%[^,]+]],
  101. // CHECK-DAG: [[TMP30]] = getelementptr inbounds [[T2]], [[T2]]* [[GEPC:%[^,]+]], i32 0, i32 0
  102. // CHECK-DAG: [[GEPC]] = getelementptr inbounds [2 x [[T2]]], [2 x [[T2]]]* [[RD_IN2]], i64 0, i64
  103. // CHECK-DAG: [[TMP32:%.+]] = getelementptr inbounds [[T2]], [[T2]]* [[GEPC]], i32 0, i32 1
  104. // CHECK-DAG: store i64 20, i64* [[TMP32]],
  105. // CHECK-DAG: [[TMP33:%.+]] = getelementptr inbounds [[T2]], [[T2]]* [[GEPC]], i32 0, i32 2
  106. // CHECK-DAG: store i8* bitcast (void (i8*)* @[[CINIT:.+]] to i8*), i8** [[TMP33]],
  107. // CHECK-DAG: [[TMP34:%.+]] = getelementptr inbounds [[T2]], [[T2]]* [[GEPC]], i32 0, i32 3
  108. // CHECK-DAG: store i8* bitcast (void (i8*)* @[[CFINI:.+]] to i8*), i8** [[TMP34]],
  109. // CHECK-DAG: [[TMP35:%.+]] = getelementptr inbounds [[T2]], [[T2]]* [[GEPC]], i32 0, i32 4
  110. // CHECK-DAG: store i8* bitcast (void (i8*, i8*)* @[[CCOMB:.+]] to i8*), i8** [[TMP35]],
  111. // CHECK-DAG: [[TMP36:%.+]] = getelementptr inbounds [[T2]], [[T2]]* [[GEPC]], i32 0, i32 5
  112. // CHECK-DAG: [[TMP37:%.+]] = bitcast i32* [[TMP36]] to i8*
  113. // CHECK-DAG: call void @llvm.memset.p0i8.i64(i8* align 8 [[TMP37]], i8 0, i64 4, i1 false)
  114. // CHECK-DAG: [[TMP39:%.+]] = bitcast i16* [[VLA]] to i8*
  115. // CHECK-DAG: store i8* [[TMP39]], i8** [[TMP38:%[^,]+]],
  116. // CHECK-DAG: [[TMP38]] = getelementptr inbounds [[T2]], [[T2]]* [[GEPVLA:%[^,]+]], i32 0, i32 0
  117. // CHECK-DAG: [[GEPVLA]] = getelementptr inbounds [2 x [[T2]]], [2 x [[T2]]]* [[RD_IN2]], i64 0, i64
  118. // CHECK-DAG: [[TMP40:%.+]] = mul nuw i64 [[VLA_SIZE]], 2
  119. // CHECK-DAG: [[TMP41:%.+]] = udiv exact i64 [[TMP40]], ptrtoint (i16* getelementptr (i16, i16* null, i32 1) to i64)
  120. // CHECK-DAG: [[TMP42:%.+]] = getelementptr inbounds [[T2]], [[T2]]* [[GEPVLA]], i32 0, i32 1
  121. // CHECK-DAG: store i64 [[TMP40]], i64* [[TMP42]],
  122. // CHECK-DAG: [[TMP43:%.+]] = getelementptr inbounds [[T2]], [[T2]]* [[GEPVLA]], i32 0, i32 2
  123. // CHECK-DAG: store i8* bitcast (void (i8*)* @[[VLAINIT:.+]] to i8*), i8** [[TMP43]],
  124. // CHECK-DAG: [[TMP44:%.+]] = getelementptr inbounds [[T2]], [[T2]]* [[GEPVLA]], i32 0, i32 3
  125. // CHECK-DAG: store i8* null, i8** [[TMP44]],
  126. // CHECK-DAG: [[TMP45:%.+]] = getelementptr inbounds [[T2]], [[T2]]* [[GEPVLA]], i32 0, i32 4
  127. // CHECK-DAG: store i8* bitcast (void (i8*, i8*)* @[[VLACOMB:.+]] to i8*), i8** [[TMP45]],
  128. // CHECK-DAG: [[TMP46:%.+]] = getelementptr inbounds [[T2]], [[T2]]* [[GEPVLA]], i32 0, i32 5
  129. // CHECK-DAG: store i32 1, i32* [[TMP46]],
  130. // CHECK: [[TMP47:%.+]] = bitcast [2 x [[T2]]]* [[RD_IN2]] to i8*
  131. // CHECK: [[TMP48:%.+]] = call i8* @__kmpc_task_reduction_init(i32 [[GTID]], i32 2, i8* [[TMP47]])
  132. // CHECK: store i8* [[TMP48]], i8** [[TD2]],
  133. // CHECK: call void @__kmpc_end_taskgroup(%struct.ident_t* {{[^,]+}}, i32 [[GTID]])
  134. // CHECK: call void @__kmpc_end_taskgroup(%struct.ident_t* {{[^,]+}}, i32 [[GTID]])
  135. // CHECK-DAG: define internal void @[[AINIT]](i8*)
  136. // CHECK-DAG: store i32 0, i32* %
  137. // CHECK-DAG: ret void
  138. // CHECK-DAG: }
  139. // CHECK-DAG: define internal void @[[ACOMB]](i8*, i8*)
  140. // CHECK-DAG: add nsw i32 %
  141. // CHECK-DAG: store i32 %
  142. // CHECK-DAG: ret void
  143. // CHECK-DAG: }
  144. // CHECK-DAG: define internal void @[[BINIT]](i8*)
  145. // CHECK-DAG: store float 0.000000e+00, float* %
  146. // CHECK-DAG: ret void
  147. // CHECK-DAG: }
  148. // CHECK-DAG: define internal void @[[BCOMB]](i8*, i8*)
  149. // CHECK-DAG: fadd float %
  150. // CHECK-DAG: store float %
  151. // CHECK-DAG: ret void
  152. // CHECK-DAG: }
  153. // CHECK-DAG: define internal void @[[ARGCINIT]](i8*)
  154. // CHECK-DAG: store i32 0, i32* %
  155. // CHECK-DAG: ret void
  156. // CHECK-DAG: }
  157. // CHECK-DAG: define internal void @[[ARGCCOMB]](i8*, i8*)
  158. // CHECK-DAG: add nsw i32 %
  159. // CHECK-DAG: store i32 %
  160. // CHECK-DAG: ret void
  161. // CHECK-DAG: }
  162. // CHECK-DAG: define internal void @[[CINIT]](i8*)
  163. // CHECK-DAG: phi %struct.S* [
  164. // CHECK-DAG: call {{.+}}(%struct.S* {{.+}})
  165. // CHECK-DAG: br i1 %
  166. // CHECK-DAG: ret void
  167. // CHECK-DAG: }
  168. // CHECK-DAG: define internal void @[[CFINI]](i8*)
  169. // CHECK-DAG: phi %struct.S* [
  170. // CHECK-DAG: call {{.+}}(%struct.S* {{.+}})
  171. // CHECK-DAG: br i1 %
  172. // CHECK-DAG: ret void
  173. // CHECK-DAG: }
  174. // CHECK-DAG: define internal void @[[CCOMB]](i8*, i8*)
  175. // CHECK-DAG: phi %struct.S* [
  176. // CHECK-DAG: phi %struct.S* [
  177. // CHECK-DAG: call {{.+}}(%struct.S* {{.+}}, %struct.S* {{.+}}, %struct.S* {{.+}})
  178. // CHECK-DAG: call {{.+}}(%struct.S* {{.+}}, %struct.S* {{.+}})
  179. // CHECK-DAG: call {{.+}}(%struct.S* {{.+}})
  180. // CHECK-DAG: br i1 %
  181. // CHECK-DAG: ret void
  182. // CHECK_DAG: }
  183. // CHECK-DAG: define internal void @[[VLAINIT]](i8*)
  184. // CHECK-DAG: call i32 @__kmpc_global_thread_num(%struct.ident_t* {{[^,]+}})
  185. // CHECK-DAG: call i8* @__kmpc_threadprivate_cached(%struct.ident_t*
  186. // CHECK-DAG: phi i16* [
  187. // CHECK-DAG: store i16 0, i16* %
  188. // CHECK-DAG: br i1 %
  189. // CHECK-DAG: ret void
  190. // CHECK-DAG: }
  191. // CHECK-DAG: define internal void @[[VLACOMB]](i8*, i8*)
  192. // CHECK-DAG: call i32 @__kmpc_global_thread_num(%struct.ident_t* {{[^,]+}})
  193. // CHECK-DAG: call i8* @__kmpc_threadprivate_cached(%struct.ident_t*
  194. // CHECK-DAG: phi i16* [
  195. // CHECK-DAG: phi i16* [
  196. // CHECK-DAG: sext i16 %{{.+}} to i32
  197. // CHECK-DAG: add nsw i32 %
  198. // CHECK-DAG: trunc i32 %{{.+}} to i16
  199. // CHECK-DAG: store i16 %
  200. // CHECK_DAG: br i1 %
  201. // CHECK-DAG: ret void
  202. // CHECK-DAG: }
  203. #endif
  204. // DEBUG-LABEL: distinct !DICompileUnit
  205. // DEBUG-DAG: distinct !DISubprogram(linkageName: "[[AINIT]]",
  206. // DEBUG-DAG: distinct !DISubprogram(linkageName: "[[ACOMB]]",
  207. // DEBUG-DAG: distinct !DISubprogram(linkageName: "[[BINIT]]",
  208. // DEBUG-DAG: distinct !DISubprogram(linkageName: "[[BCOMB]]",
  209. // DEBUG-DAG: distinct !DISubprogram(linkageName: "[[ARGCINIT]]",
  210. // DEBUG-DAG: distinct !DISubprogram(linkageName: "[[ARGCCOMB]]",
  211. // DEBUG-DAG: distinct !DISubprogram(linkageName: "[[CINIT]]",
  212. // DEBUG-DAG: distinct !DISubprogram(linkageName: "[[CFINI]]",
  213. // DEBUG-DAG: distinct !DISubprogram(linkageName: "[[CCOMB]]",
  214. // DEBUG-DAG: distinct !DISubprogram(linkageName: "[[VLAINIT]]",
  215. // DEBUG-DAG: distinct !DISubprogram(linkageName: "[[VLACOMB]]",