master_taskloop_codegen.cpp 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225
  1. // RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp -x c++ -emit-llvm %s -o - -femit-all-decls | FileCheck %s
  2. // RUN: %clang_cc1 -fopenmp -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
  3. // RUN: %clang_cc1 -fopenmp -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - -femit-all-decls | FileCheck %s
  4. // RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp-simd -x c++ -emit-llvm %s -o - -femit-all-decls | FileCheck --check-prefix SIMD-ONLY0 %s
  5. // RUN: %clang_cc1 -fopenmp-simd -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
  6. // RUN: %clang_cc1 -fopenmp-simd -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - -femit-all-decls | FileCheck --check-prefix SIMD-ONLY0 %s
  7. // SIMD-ONLY0-NOT: {{__kmpc|__tgt}}
  8. // expected-no-diagnostics
  9. #ifndef HEADER
  10. #define HEADER
  11. // CHECK-LABEL: @main
  // Test driver: one plain task followed by three `master taskloop` regions,
  // each using a different clause set. The FileCheck directives placed just
  // before each pragma describe the IR that region is required to produce.
  12. int main(int argc, char **argv) {
  // Region 0: a plain `omp task` with an empty body. The directives only
  // require the thread-id lookup, a task allocation and the task enqueue call.
  13. // CHECK: [[GTID:%.+]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* [[DEFLOC:@.+]])
  14. // CHECK: call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]],
  15. // CHECK: call i32 @__kmpc_omp_task(%struct.ident_t* [[DEFLOC]], i32 [[GTID]],
  16. #pragma omp task
  17. ;
  // Region 1: `priority(argc)` over a constant 10-iteration loop. Required IR:
  // a __kmpc_master guard branching on a non-zero result, taskgroup begin/end
  // around the taskloop call, task allocation with flags value 33 (the other
  // regions use 1; presumably this reflects the priority clause - confirm
  // against the runtime), bounds 0..9 with stride 1, and trailing taskloop
  // arguments `i32 0, i64 0`.
  18. // CHECK: [[RES:%.+]] = call {{.*}}i32 @__kmpc_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
  19. // CHECK-NEXT: [[IS_MASTER:%.+]] = icmp ne i32 [[RES]], 0
  20. // CHECK-NEXT: br i1 [[IS_MASTER]], label {{%?}}[[THEN:.+]], label {{%?}}[[EXIT:.+]]
  21. // CHECK: [[THEN]]
  22. // CHECK: call void @__kmpc_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
  23. // CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 33, i64 80, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK1:@.+]] to i32 (i32, i8*)*))
  24. // CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
  25. // CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
  26. // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
  27. // CHECK: store i64 0, i64* [[DOWN]],
  28. // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
  29. // CHECK: store i64 9, i64* [[UP]],
  30. // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
  31. // CHECK: store i64 1, i64* [[ST]],
  32. // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
  33. // CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 0, i64 0, i8* null)
  34. // CHECK: call void @__kmpc_end_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
  35. // CHECK-NEXT: call {{.*}}void @__kmpc_end_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
  36. // CHECK-NEXT: br label {{%?}}[[EXIT]]
  37. // CHECK: [[EXIT]]
  38. #pragma omp master taskloop priority(argc)
  39. for (int i = 0; i < 10; ++i)
  40. ;
  // Region 2: `nogroup grainsize(argc)` over the same constant loop. No
  // taskgroup calls are matched here, and the end-master call must be the very
  // next IR line after the taskloop call. The grainsize is zero-extended from
  // i32 to i64 and passed as the taskloop's i64 argument, preceded by `i32 1`.
  41. // CHECK: [[RES:%.+]] = call {{.*}}i32 @__kmpc_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
  42. // CHECK-NEXT: [[IS_MASTER:%.+]] = icmp ne i32 [[RES]], 0
  43. // CHECK-NEXT: br i1 [[IS_MASTER]], label {{%?}}[[THEN:.+]], label {{%?}}[[EXIT:.+]]
  44. // CHECK: [[THEN]]
  45. // CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 80, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK2:@.+]] to i32 (i32, i8*)*))
  46. // CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
  47. // CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
  48. // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
  49. // CHECK: store i64 0, i64* [[DOWN]],
  50. // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
  51. // CHECK: store i64 9, i64* [[UP]],
  52. // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
  53. // CHECK: store i64 1, i64* [[ST]],
  54. // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
  55. // CHECK: [[GRAINSIZE:%.+]] = zext i32 %{{.+}} to i64
  56. // CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 1, i64 [[GRAINSIZE]], i8* null)
  57. // CHECK-NEXT: call {{.*}}void @__kmpc_end_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
  58. // CHECK-NEXT: br label {{%?}}[[EXIT]]
  59. // CHECK: [[EXIT]]
  60. #pragma omp master taskloop nogroup grainsize(argc)
  61. for (int i = 0; i < 10; ++i)
  62. ;
  // Region 3: `if(argc) shared(argc, argv) collapse(2) num_tasks(4)` over a
  // two-level nest whose bounds depend on argc/argv. Required IR: the if
  // condition is computed as `icmp ne ..., 0`, sign-extended to i32 and passed
  // as the taskloop's fourth argument; the upper bound is a runtime value
  // rather than a constant; the task allocation uses `i64 16` where the earlier
  // regions use `i64 1`; the taskloop call ends with `i32 2, i64 4`.
  63. // CHECK: [[RES:%.+]] = call {{.*}}i32 @__kmpc_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
  64. // CHECK-NEXT: [[IS_MASTER:%.+]] = icmp ne i32 [[RES]], 0
  65. // CHECK-NEXT: br i1 [[IS_MASTER]], label {{%?}}[[THEN:.+]], label {{%?}}[[EXIT:.+]]
  66. // CHECK: [[THEN]]
  67. // CHECK: call void @__kmpc_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
  68. // CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 80, i64 16, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK3:@.+]] to i32 (i32, i8*)*))
  69. // CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
  70. // CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
  71. // CHECK: [[IF:%.+]] = icmp ne i32 %{{.+}}, 0
  72. // CHECK: [[IF_INT:%.+]] = sext i1 [[IF]] to i32
  73. // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
  74. // CHECK: store i64 0, i64* [[DOWN]],
  75. // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
  76. // CHECK: store i64 %{{.+}}, i64* [[UP]],
  77. // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
  78. // CHECK: store i64 1, i64* [[ST]],
  79. // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
  80. // CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 [[IF_INT]], i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 2, i64 4, i8* null)
  81. // CHECK: call void @__kmpc_end_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
  82. // CHECK-NEXT: call {{.*}}void @__kmpc_end_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
  83. // CHECK-NEXT: br label {{%?}}[[EXIT]]
  84. // CHECK: [[EXIT]]
  // `i` is declared outside the directive so the outer loop reuses an
  // existing variable instead of declaring its own induction variable.
  85. int i;
  86. #pragma omp master taskloop if(argc) shared(argc, argv) collapse(2) num_tasks(4)
  87. for (i = 0; i < argc; ++i)
  88. for (int j = argc; j < argv[argc][argc]; ++j)
  89. ;
  90. }
  91. // CHECK: define internal i32 [[TASK1]](
  92. // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
  93. // CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
  94. // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
  95. // CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
  96. // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
  97. // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
  98. // CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
  99. // CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
  100. // CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
  101. // CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
  102. // CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
  103. // CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
  104. // CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
  105. // CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
  106. // CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
  107. // CHECK: br label
  108. // CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],
  109. // CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
  110. // CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],
  111. // CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
  112. // CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
  113. // CHECK: load i32, i32* %
  114. // CHECK: store i32 %
  115. // CHECK: load i32, i32* %
  116. // CHECK: add nsw i32 %{{.+}}, 1
  117. // CHECK: store i32 %{{.+}}, i32* %
  118. // CHECK: br label %
  119. // CHECK: ret i32 0
  120. // CHECK: define internal i32 [[TASK2]](
  121. // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
  122. // CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
  123. // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
  124. // CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
  125. // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
  126. // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
  127. // CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
  128. // CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
  129. // CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
  130. // CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
  131. // CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
  132. // CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
  133. // CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
  134. // CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
  135. // CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
  136. // CHECK: br label
  137. // CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],
  138. // CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
  139. // CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],
  140. // CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
  141. // CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
  142. // CHECK: load i32, i32* %
  143. // CHECK: store i32 %
  144. // CHECK: load i32, i32* %
  145. // CHECK: add nsw i32 %{{.+}}, 1
  146. // CHECK: store i32 %{{.+}}, i32* %
  147. // CHECK: br label %
  148. // CHECK: ret i32 0
  149. // CHECK: define internal i32 [[TASK3]](
  150. // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
  151. // CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
  152. // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
  153. // CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
  154. // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
  155. // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
  156. // CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
  157. // CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
  158. // CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
  159. // CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
  160. // CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
  161. // CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
  162. // CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
  163. // CHECK: store i64 [[LB_VAL]], i64* [[CNT:%.+]],
  164. // CHECK: br label
  165. // CHECK: ret i32 0
  166. // CHECK-LABEL: @_ZN1SC2Ei
  // Struct whose constructor holds a `master taskloop` region that uses the
  // data member `a` both as the loop counter and as the num_tasks expression.
  // A global instance `s(1)` is defined together with the struct.
  167. struct S {
  168. int a;
  169. S(int c) {
  // Required IR inside the constructor: thread-id lookup, task allocation
  // referring to the outlined function captured as TASK4, lower bound 0, a
  // runtime upper bound, stride 1, and a taskloop call whose trailing
  // arguments are `i32 2` plus the num_tasks value zero-extended to i64.
  // The directives here do not match the master guard or any taskgroup calls.
  170. // CHECK: [[GTID:%.+]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* [[DEFLOC:@.+]])
  171. // CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 80, i64 16, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK4:@.+]] to i32 (i32, i8*)*))
  172. // CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
  173. // CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
  174. // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
  175. // CHECK: store i64 0, i64* [[DOWN]],
  176. // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
  177. // CHECK: store i64 %{{.+}}, i64* [[UP]],
  178. // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
  179. // CHECK: store i64 1, i64* [[ST]],
  180. // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
  181. // CHECK: [[NUM_TASKS:%.+]] = zext i32 %{{.+}} to i64
  182. // CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 2, i64 [[NUM_TASKS]], i8* null)
  183. #pragma omp master taskloop shared(c) num_tasks(a)
  184. for (a = 0; a < c; ++a)
  185. ;
  186. }
  187. } s(1);
  188. // CHECK: define internal i32 [[TASK4]](
  189. // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
  190. // CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
  191. // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
  192. // CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
  193. // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
  194. // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
  195. // CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
  196. // CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
  197. // CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
  198. // CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
  199. // CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
  200. // CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
  201. // CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
  202. // CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
  203. // CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
  204. // CHECK: br label
  205. // CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],
  206. // CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
  207. // CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],
  208. // CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
  209. // CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
  210. // CHECK: load i32, i32* %
  211. // CHECK: store i32 %
  212. // CHECK: load i32, i32* %
  213. // CHECK: add nsw i32 %{{.+}}, 1
  214. // CHECK: store i32 %{{.+}}, i32* %
  215. // CHECK: br label %
  216. // CHECK: ret i32 0
  217. #endif