parallel_master_taskloop_codegen.cpp 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250
  1. // RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp -x c++ -emit-llvm %s -o - -femit-all-decls | FileCheck %s
  2. // RUN: %clang_cc1 -fopenmp -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
  3. // RUN: %clang_cc1 -fopenmp -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - -femit-all-decls | FileCheck %s
  4. // RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp-simd -x c++ -emit-llvm %s -o - -femit-all-decls | FileCheck --check-prefix SIMD-ONLY0 %s
  5. // RUN: %clang_cc1 -fopenmp-simd -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
  6. // RUN: %clang_cc1 -fopenmp-simd -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - -femit-all-decls | FileCheck --check-prefix SIMD-ONLY0 %s
  7. // SIMD-ONLY0-NOT: {{__kmpc|__tgt}}
  8. // expected-no-diagnostics
  9. #ifndef HEADER
  10. #define HEADER
  11. // CHECK-LABEL: @main
  // Test driver. The body holds three `#pragma omp parallel master taskloop`
  // loops, each with a different clause set (priority; nogroup + grainsize;
  // if + shared + collapse(2) + num_tasks). The FileCheck directives that are
  // interleaved with the code describe the LLVM IR required for each loop:
  // the fork-call site in main, the outlined parallel function, and the task
  // entry function. The loop bodies are empty statements; only the generated
  // runtime calls are under test.
  12. int main(int argc, char **argv) {
  // Call sites in main: one __kmpc_fork_call per construct, in source order.
  // The third one is followed by a serialized-parallel sequence that calls the
  // same outlined function directly (presumably the path taken when the
  // if(argc) condition is false -- confirm against the emitted IR).
  13. // CHECK: [[GTID:%.+]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* [[DEFLOC:@.+]])
  14. // CHECK: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* [[DEFLOC]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64)* [[OMP_OUTLINED1:@.+]] to void (i32*, i32*, ...)*), i64 [[PRIORITY:%.+]])
  15. // CHECK: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* [[DEFLOC]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64)* [[OMP_OUTLINED2:@.+]] to void (i32*, i32*, ...)*), i64 [[GRAINSIZE:%.+]])
  16. // CHECK: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* [[DEFLOC]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i8***, i64, i64)* [[OMP_OUTLINED3:@.+]] to void (i32*, i32*, ...)*), i32* [[ARGC:%.+]], i8*** [[ARGV:%.+]], i64 [[COND:%.+]], i64 [[NUM_TASKS:%.+]])
  17. // CHECK: call void @__kmpc_serialized_parallel(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
  18. // CHECK: call void [[OMP_OUTLINED3]](i32* %{{.+}}, i32* %{{.+}}, i32* [[ARGC]], i8*** [[ARGV]], i64 [[COND]], i64 [[NUM_TASKS]])
  19. // CHECK: call void @__kmpc_end_serialized_parallel(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
  // Outlined parallel function of the first construct (priority clause).
  20. // CHECK: define internal void [[OMP_OUTLINED1]](i32* noalias %{{.+}}, i32* noalias %{{.+}}, i64 %{{.+}})
  21. // CHECK: [[PRIO_ADDR:%.+]] = bitcast i64* %{{.+}} to i32*
  22. // CHECK: [[RES:%.+]] = call {{.*}}i32 @__kmpc_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID:%.+]])
  23. // CHECK-NEXT: [[IS_MASTER:%.+]] = icmp ne i32 [[RES]], 0
  24. // CHECK-NEXT: br i1 [[IS_MASTER]], label {{%?}}[[THEN:.+]], label {{%?}}[[EXIT:.+]]
  25. // CHECK: [[THEN]]
  26. // CHECK: call void @__kmpc_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
  27. // CHECK: [[PRIO:%.+]] = load i32, i32* [[PRIO_ADDR]],
  28. // CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 33, i64 80, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK1:@.+]] to i32 (i32, i8*)*))
  29. // CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
  30. // CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
  31. // CHECK: [[PRIO_ADDR:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 4
  32. // CHECK: [[PRIO_ADDR_CAST:%.+]] = bitcast %{{.+}}* [[PRIO_ADDR]] to i32*
  33. // CHECK: store i32 [[PRIO]], i32* [[PRIO_ADDR_CAST]],
  34. // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
  35. // CHECK: store i64 0, i64* [[DOWN]],
  36. // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
  37. // CHECK: store i64 9, i64* [[UP]],
  38. // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
  39. // CHECK: store i64 1, i64* [[ST]],
  40. // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
  41. // CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 0, i64 0, i8* null)
  42. // CHECK: call void @__kmpc_end_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
  43. // CHECK-NEXT: call {{.*}}void @__kmpc_end_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
  44. // CHECK-NEXT: br label {{%?}}[[EXIT]]
  45. // CHECK: [[EXIT]]
  // Task entry of the first construct: reads task-data fields 5 through 8
  // (captured as DOWN, UP, ST, LITER), copies them to locals, then runs an
  // i32 counter loop from the truncated lower bound up to the upper bound.
  46. // CHECK: define internal i32 [[TASK1]](
  47. // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
  48. // CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
  49. // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
  50. // CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
  51. // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
  52. // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
  53. // CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
  54. // CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
  55. // CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
  56. // CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
  57. // CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
  58. // CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
  59. // CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
  60. // CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
  61. // CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
  62. // CHECK: br label
  63. // CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],
  64. // CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
  65. // CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],
  66. // CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
  67. // CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
  68. // CHECK: load i32, i32* %
  69. // CHECK: store i32 %
  70. // CHECK: load i32, i32* %
  71. // CHECK: add nsw i32 %{{.+}}, 1
  72. // CHECK: store i32 %{{.+}}, i32* %
  73. // CHECK: br label %
  74. // CHECK: ret i32 0
  // Construct 1: priority(argc) over a constant 10-iteration loop. The
  // directives above require a taskgroup begin/end pair around the
  // __kmpc_taskloop call, bounds 0 and 9 with stride 1, and the priority
  // value stored into task-data field 4.
  75. #pragma omp parallel master taskloop priority(argc)
  76. for (int i = 0; i < 10; ++i)
  77. ;
  // Outlined parallel function of the second construct (nogroup + grainsize).
  78. // CHECK: define internal void [[OMP_OUTLINED2]](i32* noalias %{{.+}}, i32* noalias %{{.+}}, i64 %{{.+}})
  79. // CHECK: [[RES:%.+]] = call {{.*}}i32 @__kmpc_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID:%.+]])
  80. // CHECK-NEXT: [[IS_MASTER:%.+]] = icmp ne i32 [[RES]], 0
  81. // CHECK-NEXT: br i1 [[IS_MASTER]], label {{%?}}[[THEN:.+]], label {{%?}}[[EXIT:.+]]
  82. // CHECK: [[THEN]]
  83. // CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 80, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK2:@.+]] to i32 (i32, i8*)*))
  84. // CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
  85. // CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
  86. // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
  87. // CHECK: store i64 0, i64* [[DOWN]],
  88. // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
  89. // CHECK: store i64 9, i64* [[UP]],
  90. // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
  91. // CHECK: store i64 1, i64* [[ST]],
  92. // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
  93. // CHECK: [[GRAINSIZE:%.+]] = zext i32 %{{.+}} to i64
  94. // CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 1, i64 [[GRAINSIZE]], i8* null)
  95. // CHECK-NEXT: call {{.*}}void @__kmpc_end_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
  96. // CHECK-NEXT: br label {{%?}}[[EXIT]]
  97. // CHECK: [[EXIT]]
  // Task entry of the second construct; same shape as the first task entry.
  98. // CHECK: define internal i32 [[TASK2]](
  99. // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
  100. // CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
  101. // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
  102. // CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
  103. // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
  104. // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
  105. // CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
  106. // CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
  107. // CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
  108. // CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
  109. // CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
  110. // CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
  111. // CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
  112. // CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
  113. // CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
  114. // CHECK: br label
  115. // CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],
  116. // CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
  117. // CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],
  118. // CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
  119. // CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
  120. // CHECK: load i32, i32* %
  121. // CHECK: store i32 %
  122. // CHECK: load i32, i32* %
  123. // CHECK: add nsw i32 %{{.+}}, 1
  124. // CHECK: store i32 %{{.+}}, i32* %
  125. // CHECK: br label %
  126. // CHECK: ret i32 0
  // Construct 2: nogroup grainsize(argc) over the same 10-iteration loop. The
  // directives above list no taskgroup calls between __kmpc_master and
  // __kmpc_end_master, and require __kmpc_taskloop to receive the
  // zero-extended grainsize with the preceding i32 argument equal to 1
  // (it is 0 for the first construct and 2 for the num_tasks constructs).
  127. #pragma omp parallel master taskloop nogroup grainsize(argc)
  128. for (int i = 0; i < 10; ++i)
  129. ;
  // Outlined parallel function of the third construct. It additionally takes
  // argc and argv by reference plus two i64 values (captured at the call site
  // as COND and NUM_TASKS).
  130. // CHECK: define internal void [[OMP_OUTLINED3]](i32* noalias %{{.+}}, i32* noalias %{{.+}}, i32* dereferenceable(4) %{{.+}}, i8*** dereferenceable(8) %{{.+}}, i64 %{{.+}}, i64 %{{.+}})
  131. // CHECK: [[RES:%.+]] = call {{.*}}i32 @__kmpc_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID:%.+]])
  132. // CHECK-NEXT: [[IS_MASTER:%.+]] = icmp ne i32 [[RES]], 0
  133. // CHECK-NEXT: br i1 [[IS_MASTER]], label {{%?}}[[THEN:.+]], label {{%?}}[[EXIT:.+]]
  134. // CHECK: [[THEN]]
  135. // CHECK: call void @__kmpc_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
  136. // CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 80, i64 16, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK3:@.+]] to i32 (i32, i8*)*))
  137. // CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
  138. // CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
  139. // CHECK: [[COND_VAL:%.+]] = load i8, i8* %{{.+}},
  140. // CHECK: [[COND_BOOL:%.+]] = trunc i8 [[COND_VAL]] to i1
  141. // CHECK: [[IF_INT:%.+]] = sext i1 [[COND_BOOL]] to i32
  142. // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
  143. // CHECK: store i64 0, i64* [[DOWN]],
  144. // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
  145. // CHECK: store i64 %{{.+}}, i64* [[UP]],
  146. // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
  147. // CHECK: store i64 1, i64* [[ST]],
  148. // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
  149. // CHECK: [[NUM_TASKS:%.+]] = zext i32 %{{.+}} to i64
  150. // CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 [[IF_INT]], i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 2, i64 [[NUM_TASKS]], i8* null)
  151. // CHECK: call void @__kmpc_end_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
  152. // CHECK-NEXT: call {{.*}}void @__kmpc_end_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
  153. // CHECK-NEXT: br label {{%?}}[[EXIT]]
  154. // CHECK: [[EXIT]]
  // Task entry of the third construct: the counter is i64 here, so the lower
  // bound is stored without the trunc seen in the other task entries.
  155. // CHECK: define internal i32 [[TASK3]](
  156. // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
  157. // CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
  158. // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
  159. // CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
  160. // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
  161. // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
  162. // CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
  163. // CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
  164. // CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
  165. // CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
  166. // CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
  167. // CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
  168. // CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
  169. // CHECK: store i64 [[LB_VAL]], i64* [[CNT:%.+]],
  170. // CHECK: br label
  171. // CHECK: ret i32 0
  // Construct 3: if(argc) shared(argc, argv) collapse(2) num_tasks(argc) over
  // a two-level nest whose bounds depend on argc and argv. The outer counter
  // `i` is declared outside the loop. The directives above require the if
  // condition to be sign-extended to i32 and passed to __kmpc_taskloop, a
  // computed (non-constant) upper bound, and the zero-extended num_tasks
  // value with the preceding i32 argument equal to 2.
  172. int i;
  173. #pragma omp parallel master taskloop if(argc) shared(argc, argv) collapse(2) num_tasks(argc)
  174. for (i = 0; i < argc; ++i)
  175. for (int j = argc; j < argv[argc][argc]; ++j)
  176. ;
  177. }
  178. // CHECK-LABEL: @_ZN1SC2Ei
  // Test fixture: the constructor of S runs a parallel master taskloop whose
  // loop counter is the data member `a` and whose bound is the constructor
  // parameter `c`. `c` is also the condition of the final clause, and the
  // loop uses num_tasks(4). The object `s(1)` declared right after the struct
  // instantiates the constructor with c == 1.
  179. struct S {
  180. int a;
  181. S(int c) {
  // IR required for the constructor: a fork call passing three captured
  // values, then in the outlined function a flags word built as
  // (cond ? 2 : 0) | 1 for __kmpc_omp_task_alloc, and a __kmpc_taskloop call
  // whose last integer arguments are i32 2 and the constant i64 4.
  182. // CHECK: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* [[DEFLOC]], i32 3, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, %struct.S*, i32*, i64)* [[OMP_OUTLINED4:@.+]] to void (i32*, i32*, ...)*), %struct.S* %{{.+}}, i32* %{{.+}}, i64 %{{.+}})
  183. // CHECK: define internal void [[OMP_OUTLINED4]](i32* noalias %{{.+}}, i32* noalias %{{.+}}, %struct.S* %{{.+}}, i32* dereferenceable(4) %{{.+}}, i64 %{{.+}})
  184. // CHECK: [[CONV:%.+]] = bitcast i64* %{{.+}} to i8*
  185. // CHECK: [[CONDI8:%.+]] = load i8, i8* [[CONV]],
  // NOTE(review): the select directive two lines below re-binds COND with a
  // fresh pattern instead of reusing the value captured on the trunc line, so
  // it does not verify that the select consumes the truncated flag. Confirm
  // whether that looseness is intended before tightening it.
  186. // CHECK: [[COND:%.+]] = trunc i8 [[CONDI8]] to i1
  187. // CHECK: [[IS_FINAL:%.+]] = select i1 [[COND:%.+]], i32 2, i32 0
  188. // CHECK: [[FLAGS:%.+]] = or i32 [[IS_FINAL]], 1
  189. // CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID:%.+]], i32 [[FLAGS]], i64 80, i64 16, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK4:@.+]] to i32 (i32, i8*)*))
  190. // CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
  191. // CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
  192. // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
  193. // CHECK: store i64 0, i64* [[DOWN]],
  194. // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
  195. // CHECK: store i64 %{{.+}}, i64* [[UP]],
  196. // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
  197. // CHECK: store i64 1, i64* [[ST]],
  198. // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
  199. // CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 2, i64 4, i8* null)
  // Construct 4: shared(c) num_tasks(4) final(c); the loop body is empty.
  200. #pragma omp parallel master taskloop shared(c) num_tasks(4) final(c)
  201. for (a = 0; a < c; ++a)
  202. ;
  203. }
  204. } s(1);
  205. // CHECK: define internal i32 [[TASK4]](
  206. // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
  207. // CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
  208. // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
  209. // CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
  210. // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
  211. // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
  212. // CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
  213. // CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
  214. // CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
  215. // CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
  216. // CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
  217. // CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
  218. // CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
  219. // CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
  220. // CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
  221. // CHECK: br label
  222. // CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],
  223. // CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
  224. // CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],
  225. // CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
  226. // CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
  227. // CHECK: load i32, i32* %
  228. // CHECK: store i32 %
  229. // CHECK: load i32, i32* %
  230. // CHECK: add nsw i32 %{{.+}}, 1
  231. // CHECK: store i32 %{{.+}}, i32* %
  232. // CHECK: br label %
  233. // CHECK: ret i32 0
  234. #endif