xref: /llvm-project/clang/test/OpenMP/for_non_rectangular_codegen.c (revision 1c9ec74e3f2a55b4a74ad54e60b58b03baf896d9)
10cfe5ae0SAlexey Bataev // NOTE: Assertions have been autogenerated by utils/update_cc_test_checks.py UTC_ARGS: --function-signature --include-generated-funcs --replace-value-regex "__omp_offloading_[0-9a-z]+_[0-9a-z]+" "reduction_size[.].+[.]" "pl_cond[.].+[.|,]" --prefix-filecheck-ir-name _
20cfe5ae0SAlexey Bataev // RUN: %clang_cc1 -verify -fopenmp -x c -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck %s
30cfe5ae0SAlexey Bataev // RUN: %clang_cc1 -fopenmp -x c -triple x86_64-unknown-unknown -emit-pch -o %t %s
40cfe5ae0SAlexey Bataev // RUN: %clang_cc1 -fopenmp -x c -triple x86_64-unknown-unknown -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s
50cfe5ae0SAlexey Bataev 
60cfe5ae0SAlexey Bataev // RUN: %clang_cc1 -verify -fopenmp-simd -x c -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck --check-prefix SIMD-ONLY0 %s
70cfe5ae0SAlexey Bataev // RUN: %clang_cc1 -fopenmp-simd -x c -triple x86_64-unknown-unknown -emit-pch -o %t %s
80cfe5ae0SAlexey Bataev // RUN: %clang_cc1 -fopenmp-simd -x c -triple x86_64-unknown-unknown -include-pch %t -verify %s -emit-llvm -o - | FileCheck --check-prefix SIMD-ONLY0 %s
90cfe5ae0SAlexey Bataev // expected-no-diagnostics
100cfe5ae0SAlexey Bataev #ifndef HEADER
110cfe5ae0SAlexey Bataev #define HEADER
120cfe5ae0SAlexey Bataev 
collapsed(int mp)130cfe5ae0SAlexey Bataev void collapsed(int mp) {
140cfe5ae0SAlexey Bataev #pragma omp for collapse(3)
150cfe5ae0SAlexey Bataev   for (int j = 0; j < mp; ++j) {
160cfe5ae0SAlexey Bataev     for (int i = j; i < mp; ++i) {
170cfe5ae0SAlexey Bataev       for (int i0 = 0; i0 < 10; ++i0) {
180cfe5ae0SAlexey Bataev         ;
190cfe5ae0SAlexey Bataev       }
200cfe5ae0SAlexey Bataev     }
210cfe5ae0SAlexey Bataev   }
220cfe5ae0SAlexey Bataev }
230cfe5ae0SAlexey Bataev 
240cfe5ae0SAlexey Bataev #endif // HEADER
250cfe5ae0SAlexey Bataev // CHECK-LABEL: define {{[^@]+}}@collapsed
260cfe5ae0SAlexey Bataev // CHECK-SAME: (i32 noundef [[MP:%.*]]) #[[ATTR0:[0-9]+]] {
270cfe5ae0SAlexey Bataev // CHECK-NEXT:  entry:
280cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MP_ADDR:%.*]] = alloca i32, align 4
290cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DOTOMP_IV:%.*]] = alloca i64, align 8
300cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP:%.*]] = alloca i32, align 4
310cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[_TMP1:%.*]] = alloca i32, align 4
320cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[_TMP2:%.*]] = alloca i32, align 4
330cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4
340cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DOTLB_MIN:%.*]] = alloca i32, align 4
350cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DOTLB_MAX:%.*]] = alloca i32, align 4
360cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DOTMIN_LESS_MAX:%.*]] = alloca i32, align 4
370cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DOTUPPER:%.*]] = alloca i32, align 4
380cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DOTLOWER:%.*]] = alloca i32, align 4
390cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DOTCAPTURE_EXPR_3:%.*]] = alloca i64, align 8
400cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[J:%.*]] = alloca i32, align 4
410cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[I:%.*]] = alloca i32, align 4
420cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[I0:%.*]] = alloca i32, align 4
430cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[_TMP15:%.*]] = alloca i32, align 4
440cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DOTOMP_LB:%.*]] = alloca i64, align 8
450cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DOTOMP_UB:%.*]] = alloca i64, align 8
460cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DOTOMP_STRIDE:%.*]] = alloca i64, align 8
470cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4
480cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[J19:%.*]] = alloca i32, align 4
490cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[I20:%.*]] = alloca i32, align 4
500cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[I021:%.*]] = alloca i32, align 4
510cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(ptr @[[GLOB2:[0-9]+]])
520cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i32 [[MP]], ptr [[MP_ADDR]], align 4
530cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP1:%.*]] = load i32, ptr [[MP_ADDR]], align 4
540cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i32 [[TMP1]], ptr [[DOTCAPTURE_EXPR_]], align 4
550cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i32 0, ptr [[TMP]], align 4
560cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP2:%.*]] = load i32, ptr [[TMP]], align 4
570cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i32 [[TMP2]], ptr [[DOTLB_MIN]], align 4
580cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP3:%.*]] = load i32, ptr [[DOTCAPTURE_EXPR_]], align 4
590cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB:%.*]] = sub nsw i32 [[TMP3]], 1
600cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DIV:%.*]] = sdiv i32 [[SUB]], 1
610cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL:%.*]] = mul nsw i32 [[DIV]], 1
620cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[ADD:%.*]] = add nsw i32 0, [[MUL]]
630cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i32 [[ADD]], ptr [[TMP]], align 4
640cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP4:%.*]] = load i32, ptr [[TMP]], align 4
650cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i32 [[TMP4]], ptr [[DOTLB_MAX]], align 4
660cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP5:%.*]] = load i32, ptr [[DOTLB_MIN]], align 4
670cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP6:%.*]] = load i32, ptr [[DOTLB_MAX]], align 4
680cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[CMP:%.*]] = icmp slt i32 [[TMP5]], [[TMP6]]
690cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[CONV:%.*]] = zext i1 [[CMP]] to i32
700cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i32 [[CONV]], ptr [[DOTMIN_LESS_MAX]], align 4
710cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP7:%.*]] = load i32, ptr [[MP_ADDR]], align 4
720cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i32 [[TMP7]], ptr [[DOTUPPER]], align 4
730cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP8:%.*]] = load i32, ptr [[DOTMIN_LESS_MAX]], align 4
740cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TOBOOL:%.*]] = icmp ne i32 [[TMP8]], 0
750cfe5ae0SAlexey Bataev // CHECK-NEXT:    br i1 [[TOBOOL]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]]
760cfe5ae0SAlexey Bataev // CHECK:       cond.true:
770cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP9:%.*]] = load i32, ptr [[DOTLB_MIN]], align 4
780cfe5ae0SAlexey Bataev // CHECK-NEXT:    br label [[COND_END:%.*]]
790cfe5ae0SAlexey Bataev // CHECK:       cond.false:
800cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP10:%.*]] = load i32, ptr [[DOTLB_MAX]], align 4
810cfe5ae0SAlexey Bataev // CHECK-NEXT:    br label [[COND_END]]
820cfe5ae0SAlexey Bataev // CHECK:       cond.end:
830cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[COND:%.*]] = phi i32 [ [[TMP9]], [[COND_TRUE]] ], [ [[TMP10]], [[COND_FALSE]] ]
840cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i32 [[COND]], ptr [[TMP]], align 4
850cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i32 [[COND]], ptr [[DOTLOWER]], align 4
860cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP11:%.*]] = load i32, ptr [[DOTCAPTURE_EXPR_]], align 4
870cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB4:%.*]] = sub nsw i32 [[TMP11]], 0
880cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DIV5:%.*]] = sdiv i32 [[SUB4]], 1
890cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[CONV6:%.*]] = sext i32 [[DIV5]] to i64
900cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP12:%.*]] = load i32, ptr [[DOTUPPER]], align 4
910cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP13:%.*]] = load i32, ptr [[DOTLOWER]], align 4
920cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB7:%.*]] = sub i32 [[TMP12]], [[TMP13]]
930cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB8:%.*]] = sub i32 [[SUB7]], 1
940cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[ADD9:%.*]] = add i32 [[SUB8]], 1
950cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DIV10:%.*]] = udiv i32 [[ADD9]], 1
960cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[CONV11:%.*]] = zext i32 [[DIV10]] to i64
970cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL12:%.*]] = mul nsw i64 [[CONV6]], [[CONV11]]
980cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL13:%.*]] = mul nsw i64 [[MUL12]], 10
990cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB14:%.*]] = sub nsw i64 [[MUL13]], 1
1000cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i64 [[SUB14]], ptr [[DOTCAPTURE_EXPR_3]], align 8
1010cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i32 0, ptr [[J]], align 4
1020cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP14:%.*]] = load i32, ptr [[J]], align 4
1030cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i32 [[TMP14]], ptr [[I]], align 4
1040cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i32 0, ptr [[I0]], align 4
1050cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i32 0, ptr [[_TMP15]], align 4
1060cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP15:%.*]] = load i32, ptr [[DOTCAPTURE_EXPR_]], align 4
1070cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[CMP16:%.*]] = icmp slt i32 0, [[TMP15]]
1080cfe5ae0SAlexey Bataev // CHECK-NEXT:    br i1 [[CMP16]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]]
1090cfe5ae0SAlexey Bataev // CHECK:       omp.precond.then:
1100cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i64 0, ptr [[DOTOMP_LB]], align 8
1110cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP16:%.*]] = load i64, ptr [[DOTCAPTURE_EXPR_3]], align 8
1120cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i64 [[TMP16]], ptr [[DOTOMP_UB]], align 8
1130cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i64 1, ptr [[DOTOMP_STRIDE]], align 8
1140cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i32 0, ptr [[DOTOMP_IS_LAST]], align 4
1150cfe5ae0SAlexey Bataev // CHECK-NEXT:    call void @__kmpc_for_static_init_8(ptr @[[GLOB1:[0-9]+]], i32 [[TMP0]], i32 34, ptr [[DOTOMP_IS_LAST]], ptr [[DOTOMP_LB]], ptr [[DOTOMP_UB]], ptr [[DOTOMP_STRIDE]], i64 1, i64 1)
1160cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP17:%.*]] = load i64, ptr [[DOTOMP_UB]], align 8
1170cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP18:%.*]] = load i64, ptr [[DOTCAPTURE_EXPR_3]], align 8
1180cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[CMP22:%.*]] = icmp sgt i64 [[TMP17]], [[TMP18]]
1190cfe5ae0SAlexey Bataev // CHECK-NEXT:    br i1 [[CMP22]], label [[COND_TRUE24:%.*]], label [[COND_FALSE25:%.*]]
1200cfe5ae0SAlexey Bataev // CHECK:       cond.true24:
1210cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP19:%.*]] = load i64, ptr [[DOTCAPTURE_EXPR_3]], align 8
1220cfe5ae0SAlexey Bataev // CHECK-NEXT:    br label [[COND_END26:%.*]]
1230cfe5ae0SAlexey Bataev // CHECK:       cond.false25:
1240cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP20:%.*]] = load i64, ptr [[DOTOMP_UB]], align 8
1250cfe5ae0SAlexey Bataev // CHECK-NEXT:    br label [[COND_END26]]
1260cfe5ae0SAlexey Bataev // CHECK:       cond.end26:
1270cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[COND27:%.*]] = phi i64 [ [[TMP19]], [[COND_TRUE24]] ], [ [[TMP20]], [[COND_FALSE25]] ]
1280cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i64 [[COND27]], ptr [[DOTOMP_UB]], align 8
1290cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP21:%.*]] = load i64, ptr [[DOTOMP_LB]], align 8
1300cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i64 [[TMP21]], ptr [[DOTOMP_IV]], align 8
1310cfe5ae0SAlexey Bataev // CHECK-NEXT:    br label [[OMP_INNER_FOR_COND:%.*]]
1320cfe5ae0SAlexey Bataev // CHECK:       omp.inner.for.cond:
1330cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP22:%.*]] = load i64, ptr [[DOTOMP_IV]], align 8
1340cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP23:%.*]] = load i64, ptr [[DOTOMP_UB]], align 8
1350cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[CMP28:%.*]] = icmp sle i64 [[TMP22]], [[TMP23]]
1360cfe5ae0SAlexey Bataev // CHECK-NEXT:    br i1 [[CMP28]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]]
1370cfe5ae0SAlexey Bataev // CHECK:       omp.inner.for.body:
1380cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP24:%.*]] = load i64, ptr [[DOTOMP_IV]], align 8
1390cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP25:%.*]] = load i32, ptr [[DOTUPPER]], align 4
1400cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP26:%.*]] = load i32, ptr [[DOTLOWER]], align 4
1410cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB30:%.*]] = sub i32 [[TMP25]], [[TMP26]]
1420cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB31:%.*]] = sub i32 [[SUB30]], 1
1430cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[ADD32:%.*]] = add i32 [[SUB31]], 1
1440cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DIV33:%.*]] = udiv i32 [[ADD32]], 1
1450cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL34:%.*]] = mul i32 1, [[DIV33]]
1460cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL35:%.*]] = mul i32 [[MUL34]], 10
1470cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[CONV36:%.*]] = zext i32 [[MUL35]] to i64
1480cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DIV37:%.*]] = sdiv i64 [[TMP24]], [[CONV36]]
1490cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL38:%.*]] = mul nsw i64 [[DIV37]], 1
1500cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[ADD39:%.*]] = add nsw i64 0, [[MUL38]]
1510cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[CONV40:%.*]] = trunc i64 [[ADD39]] to i32
1520cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i32 [[CONV40]], ptr [[J19]], align 4
1530cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP27:%.*]] = load i32, ptr [[J19]], align 4
1540cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[CONV41:%.*]] = sext i32 [[TMP27]] to i64
1550cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP28:%.*]] = load i64, ptr [[DOTOMP_IV]], align 8
1560cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP29:%.*]] = load i64, ptr [[DOTOMP_IV]], align 8
1570cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP30:%.*]] = load i32, ptr [[DOTUPPER]], align 4
1580cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP31:%.*]] = load i32, ptr [[DOTLOWER]], align 4
1590cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB42:%.*]] = sub i32 [[TMP30]], [[TMP31]]
1600cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB43:%.*]] = sub i32 [[SUB42]], 1
1610cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[ADD44:%.*]] = add i32 [[SUB43]], 1
1620cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DIV45:%.*]] = udiv i32 [[ADD44]], 1
1630cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL46:%.*]] = mul i32 1, [[DIV45]]
1640cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL47:%.*]] = mul i32 [[MUL46]], 10
1650cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[CONV48:%.*]] = zext i32 [[MUL47]] to i64
1660cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DIV49:%.*]] = sdiv i64 [[TMP29]], [[CONV48]]
1670cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP32:%.*]] = load i32, ptr [[DOTUPPER]], align 4
1680cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP33:%.*]] = load i32, ptr [[DOTLOWER]], align 4
1690cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB50:%.*]] = sub i32 [[TMP32]], [[TMP33]]
1700cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB51:%.*]] = sub i32 [[SUB50]], 1
1710cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[ADD52:%.*]] = add i32 [[SUB51]], 1
1720cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DIV53:%.*]] = udiv i32 [[ADD52]], 1
1730cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL54:%.*]] = mul i32 1, [[DIV53]]
1740cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL55:%.*]] = mul i32 [[MUL54]], 10
1750cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[CONV56:%.*]] = zext i32 [[MUL55]] to i64
1760cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL57:%.*]] = mul nsw i64 [[DIV49]], [[CONV56]]
1770cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB58:%.*]] = sub nsw i64 [[TMP28]], [[MUL57]]
1780cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DIV59:%.*]] = sdiv i64 [[SUB58]], 10
1790cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL60:%.*]] = mul nsw i64 [[DIV59]], 1
1800cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[ADD61:%.*]] = add nsw i64 [[CONV41]], [[MUL60]]
1810cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[CONV62:%.*]] = trunc i64 [[ADD61]] to i32
1820cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i32 [[CONV62]], ptr [[I20]], align 4
1830cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP34:%.*]] = load i64, ptr [[DOTOMP_IV]], align 8
1840cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP35:%.*]] = load i64, ptr [[DOTOMP_IV]], align 8
1850cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP36:%.*]] = load i32, ptr [[DOTUPPER]], align 4
1860cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP37:%.*]] = load i32, ptr [[DOTLOWER]], align 4
1870cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB63:%.*]] = sub i32 [[TMP36]], [[TMP37]]
1880cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB64:%.*]] = sub i32 [[SUB63]], 1
1890cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[ADD65:%.*]] = add i32 [[SUB64]], 1
1900cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DIV66:%.*]] = udiv i32 [[ADD65]], 1
1910cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL67:%.*]] = mul i32 1, [[DIV66]]
1920cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL68:%.*]] = mul i32 [[MUL67]], 10
1930cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[CONV69:%.*]] = zext i32 [[MUL68]] to i64
1940cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DIV70:%.*]] = sdiv i64 [[TMP35]], [[CONV69]]
1950cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP38:%.*]] = load i32, ptr [[DOTUPPER]], align 4
1960cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP39:%.*]] = load i32, ptr [[DOTLOWER]], align 4
1970cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB71:%.*]] = sub i32 [[TMP38]], [[TMP39]]
1980cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB72:%.*]] = sub i32 [[SUB71]], 1
1990cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[ADD73:%.*]] = add i32 [[SUB72]], 1
2000cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DIV74:%.*]] = udiv i32 [[ADD73]], 1
2010cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL75:%.*]] = mul i32 1, [[DIV74]]
2020cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL76:%.*]] = mul i32 [[MUL75]], 10
2030cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[CONV77:%.*]] = zext i32 [[MUL76]] to i64
2040cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL78:%.*]] = mul nsw i64 [[DIV70]], [[CONV77]]
2050cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB79:%.*]] = sub nsw i64 [[TMP34]], [[MUL78]]
2060cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP40:%.*]] = load i64, ptr [[DOTOMP_IV]], align 8
2070cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP41:%.*]] = load i64, ptr [[DOTOMP_IV]], align 8
2080cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP42:%.*]] = load i32, ptr [[DOTUPPER]], align 4
2090cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP43:%.*]] = load i32, ptr [[DOTLOWER]], align 4
2100cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB80:%.*]] = sub i32 [[TMP42]], [[TMP43]]
2110cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB81:%.*]] = sub i32 [[SUB80]], 1
2120cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[ADD82:%.*]] = add i32 [[SUB81]], 1
2130cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DIV83:%.*]] = udiv i32 [[ADD82]], 1
2140cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL84:%.*]] = mul i32 1, [[DIV83]]
2150cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL85:%.*]] = mul i32 [[MUL84]], 10
2160cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[CONV86:%.*]] = zext i32 [[MUL85]] to i64
2170cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DIV87:%.*]] = sdiv i64 [[TMP41]], [[CONV86]]
2180cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP44:%.*]] = load i32, ptr [[DOTUPPER]], align 4
2190cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP45:%.*]] = load i32, ptr [[DOTLOWER]], align 4
2200cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB88:%.*]] = sub i32 [[TMP44]], [[TMP45]]
2210cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB89:%.*]] = sub i32 [[SUB88]], 1
2220cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[ADD90:%.*]] = add i32 [[SUB89]], 1
2230cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DIV91:%.*]] = udiv i32 [[ADD90]], 1
2240cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL92:%.*]] = mul i32 1, [[DIV91]]
2250cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL93:%.*]] = mul i32 [[MUL92]], 10
2260cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[CONV94:%.*]] = zext i32 [[MUL93]] to i64
2270cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL95:%.*]] = mul nsw i64 [[DIV87]], [[CONV94]]
2280cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB96:%.*]] = sub nsw i64 [[TMP40]], [[MUL95]]
2290cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[DIV97:%.*]] = sdiv i64 [[SUB96]], 10
2300cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL98:%.*]] = mul nsw i64 [[DIV97]], 10
2310cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[SUB99:%.*]] = sub nsw i64 [[SUB79]], [[MUL98]]
2320cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[MUL100:%.*]] = mul nsw i64 [[SUB99]], 1
2330cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[ADD101:%.*]] = add nsw i64 0, [[MUL100]]
2340cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[CONV102:%.*]] = trunc i64 [[ADD101]] to i32
2350cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i32 [[CONV102]], ptr [[I021]], align 4
2360cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP46:%.*]] = load i32, ptr [[I20]], align 4
2370cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP47:%.*]] = load i32, ptr [[MP_ADDR]], align 4
2380cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[CMP103:%.*]] = icmp slt i32 [[TMP46]], [[TMP47]]
2390cfe5ae0SAlexey Bataev // CHECK-NEXT:    br i1 [[CMP103]], label [[OMP_BODY_NEXT:%.*]], label [[OMP_BODY_CONTINUE:%.*]]
2400cfe5ae0SAlexey Bataev // CHECK:       omp.body.next:
2410cfe5ae0SAlexey Bataev // CHECK-NEXT:    br label [[OMP_BODY_CONTINUE]]
2420cfe5ae0SAlexey Bataev // CHECK:       omp.body.continue:
2430cfe5ae0SAlexey Bataev // CHECK-NEXT:    br label [[OMP_INNER_FOR_INC:%.*]]
2440cfe5ae0SAlexey Bataev // CHECK:       omp.inner.for.inc:
2450cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[TMP48:%.*]] = load i64, ptr [[DOTOMP_IV]], align 8
2460cfe5ae0SAlexey Bataev // CHECK-NEXT:    [[ADD105:%.*]] = add nsw i64 [[TMP48]], 1
2470cfe5ae0SAlexey Bataev // CHECK-NEXT:    store i64 [[ADD105]], ptr [[DOTOMP_IV]], align 8
2480cfe5ae0SAlexey Bataev // CHECK-NEXT:    br label [[OMP_INNER_FOR_COND]]
2490cfe5ae0SAlexey Bataev // CHECK:       omp.inner.for.end:
2500cfe5ae0SAlexey Bataev // CHECK-NEXT:    br label [[OMP_LOOP_EXIT:%.*]]
2510cfe5ae0SAlexey Bataev // CHECK:       omp.loop.exit:
2520cfe5ae0SAlexey Bataev // CHECK-NEXT:    call void @__kmpc_for_static_fini(ptr @[[GLOB1]], i32 [[TMP0]])
2530cfe5ae0SAlexey Bataev // CHECK-NEXT:    br label [[OMP_PRECOND_END]]
2540cfe5ae0SAlexey Bataev // CHECK:       omp.precond.end:
2550cfe5ae0SAlexey Bataev // CHECK-NEXT:    call void @__kmpc_barrier(ptr @[[GLOB3:[0-9]+]], i32 [[TMP0]])
2560cfe5ae0SAlexey Bataev // CHECK-NEXT:    ret void
2570cfe5ae0SAlexey Bataev //
258*1c9ec74eSDhruva Chakrabarti //
259*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-LABEL: define {{[^@]+}}@collapsed
260*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-SAME: (i32 noundef [[MP:%.*]]) #[[ATTR0:[0-9]+]] {
261*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:  entry:
262*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    [[MP_ADDR:%.*]] = alloca i32, align 4
263*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    [[J:%.*]] = alloca i32, align 4
264*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    [[I:%.*]] = alloca i32, align 4
265*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    [[I0:%.*]] = alloca i32, align 4
266*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    store i32 [[MP]], ptr [[MP_ADDR]], align 4
267*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    store i32 0, ptr [[J]], align 4
268*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    br label [[FOR_COND:%.*]]
269*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0:       for.cond:
270*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    [[TMP0:%.*]] = load i32, ptr [[J]], align 4
271*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    [[TMP1:%.*]] = load i32, ptr [[MP_ADDR]], align 4
272*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    [[CMP:%.*]] = icmp slt i32 [[TMP0]], [[TMP1]]
273*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    br i1 [[CMP]], label [[FOR_BODY:%.*]], label [[FOR_END12:%.*]]
274*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0:       for.body:
275*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    [[TMP2:%.*]] = load i32, ptr [[J]], align 4
276*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    store i32 [[TMP2]], ptr [[I]], align 4
277*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    br label [[FOR_COND1:%.*]]
278*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0:       for.cond1:
279*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    [[TMP3:%.*]] = load i32, ptr [[I]], align 4
280*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    [[TMP4:%.*]] = load i32, ptr [[MP_ADDR]], align 4
281*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    [[CMP2:%.*]] = icmp slt i32 [[TMP3]], [[TMP4]]
282*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    br i1 [[CMP2]], label [[FOR_BODY3:%.*]], label [[FOR_END9:%.*]]
283*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0:       for.body3:
284*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    store i32 0, ptr [[I0]], align 4
285*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    br label [[FOR_COND4:%.*]]
286*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0:       for.cond4:
287*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    [[TMP5:%.*]] = load i32, ptr [[I0]], align 4
288*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    [[CMP5:%.*]] = icmp slt i32 [[TMP5]], 10
289*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    br i1 [[CMP5]], label [[FOR_BODY6:%.*]], label [[FOR_END:%.*]]
290*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0:       for.body6:
291*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    br label [[FOR_INC:%.*]]
292*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0:       for.inc:
293*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    [[TMP6:%.*]] = load i32, ptr [[I0]], align 4
294*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    [[INC:%.*]] = add nsw i32 [[TMP6]], 1
295*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    store i32 [[INC]], ptr [[I0]], align 4
296*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    br label [[FOR_COND4]], !llvm.loop [[LOOP2:![0-9]+]]
297*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0:       for.end:
298*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    br label [[FOR_INC7:%.*]]
299*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0:       for.inc7:
300*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    [[TMP7:%.*]] = load i32, ptr [[I]], align 4
301*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    [[INC8:%.*]] = add nsw i32 [[TMP7]], 1
302*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    store i32 [[INC8]], ptr [[I]], align 4
303*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    br label [[FOR_COND1]], !llvm.loop [[LOOP4:![0-9]+]]
304*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0:       for.end9:
305*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    br label [[FOR_INC10:%.*]]
306*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0:       for.inc10:
307*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    [[TMP8:%.*]] = load i32, ptr [[J]], align 4
308*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    [[INC11:%.*]] = add nsw i32 [[TMP8]], 1
309*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    store i32 [[INC11]], ptr [[J]], align 4
310*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    br label [[FOR_COND]], !llvm.loop [[LOOP5:![0-9]+]]
311*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0:       for.end12:
312*1c9ec74eSDhruva Chakrabarti // SIMD-ONLY0-NEXT:    ret void
313*1c9ec74eSDhruva Chakrabarti //
314