xref: /llvm-project/llvm/test/Transforms/LoopIdiom/X86/memset-size-compute.ll (revision f8742b8d6a3489dc8974f4166d413a66cb8d9c21)
1; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
2; RUN: opt -passes=loop-idiom -S %s | FileCheck %s
3
; Module-level target configuration: the triple pins this test to x86-64 macOS.
; In the datalayout string, "n8:16:32:64" lists the native integer widths and
; "i64:64" gives i64 a 64-bit ABI alignment (see the LLVM Language Reference).
4target datalayout = "e-m:o-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128"
5target triple = "x86_64-apple-macosx11.0.0"
6
7; Make sure the number of bytes is computed correctly in the presence of zero
8; extensions and preserved add flags.
;
; The loop in this function stores an i64 zero to %ptr[iv] for iv = 1, 2, ...
; and is bottom-tested, so its body always executes at least once. The
; autogenerated assertions inside the function expect the store to be replaced
; by a single memset in for.body.preheader that starts 8 bytes past %ptr and
; whose length is (umax(%lim.0, 2) - 1), zero-extended to i64 and shifted left
; by 3, i.e. the iteration count times the 8-byte store size.
9define void @test(ptr %ptr) {
10; CHECK-LABEL: @test(
11; CHECK-NEXT:  entry:
12; CHECK-NEXT:    br label [[FOR_BODY_PREHEADER:%.*]]
13; CHECK:       dead:
14; CHECK-NEXT:    br label [[FOR_BODY_PREHEADER]]
15; CHECK:       for.body.preheader:
16; CHECK-NEXT:    [[LIM_0:%.*]] = phi i32 [ 65, [[ENTRY:%.*]] ], [ 1, [[DEAD:%.*]] ]
17; CHECK-NEXT:    [[SCEVGEP:%.*]] = getelementptr i8, ptr [[PTR:%.*]], i64 8
18; CHECK-NEXT:    [[UMAX:%.*]] = call i32 @llvm.umax.i32(i32 [[LIM_0]], i32 2)
19; CHECK-NEXT:    [[TMP0:%.*]] = add nsw i32 [[UMAX]], -1
20; CHECK-NEXT:    [[TMP1:%.*]] = zext nneg i32 [[TMP0]] to i64
21; CHECK-NEXT:    [[TMP2:%.*]] = shl nuw nsw i64 [[TMP1]], 3
22; CHECK-NEXT:    call void @llvm.memset.p0.i64(ptr align 8 [[SCEVGEP]], i8 0, i64 [[TMP2]], i1 false)
23; CHECK-NEXT:    br label [[FOR_BODY:%.*]]
24; CHECK:       for.body:
25; CHECK-NEXT:    [[IV:%.*]] = phi i32 [ [[IV_NEXT:%.*]], [[FOR_BODY]] ], [ 1, [[FOR_BODY_PREHEADER]] ]
26; CHECK-NEXT:    [[IV_EXT:%.*]] = zext i32 [[IV]] to i64
27; CHECK-NEXT:    [[GEP:%.*]] = getelementptr inbounds i64, ptr [[PTR]], i64 [[IV_EXT]]
28; CHECK-NEXT:    [[IV_NEXT]] = add nuw nsw i32 [[IV]], 1
29; CHECK-NEXT:    [[CMP64:%.*]] = icmp ult i32 [[IV_NEXT]], [[LIM_0]]
30; CHECK-NEXT:    br i1 [[CMP64]], label [[FOR_BODY]], label [[EXIT:%.*]]
31; CHECK:       exit:
32; CHECK-NEXT:    ret void
33;
34entry:
35  br label %for.body.preheader
36
; No branch in this function targets this block; it only supplies the second
; incoming value (1) of the %lim.0 phi below.
37dead:
38  br label %for.body.preheader
39
40for.body.preheader:
  ; Loop limit expressed as a phi of 65 (from entry) and 1 (from dead) rather
  ; than a literal constant. NOTE(review): presumably this forces the byte
  ; count to be derived symbolically from %lim.0 - confirm against the
  ; original bug report.
41  %lim.0 = phi i32 [ 65, %entry ], [ 1, %dead ]
42  br label %for.body
43
44for.body:
  ; The induction variable starts at 1, so the first element written is
  ; %ptr[1], i.e. byte offset 8 from %ptr.
45  %iv = phi i32 [ %iv.next, %for.body ], [ 1, %for.body.preheader ]
  ; Zero extension of the 32-bit index to the 64-bit GEP index: the "zero
  ; extensions" named in the comment at the top of this function.
46  %iv.ext = zext i32 %iv to i64
47  %gep = getelementptr inbounds i64, ptr %ptr, i64 %iv.ext
  ; The store the pass is expected to fold into the memset; the expected loop
  ; body listed above no longer contains it.
48  store i64 0, ptr %gep, align 8
  ; Increment carrying nuw and nsw: the "preserved add flags" named in the
  ; comment at the top of this function.
49  %iv.next = add nuw nsw i32 %iv, 1
  ; Unsigned exit test on the incremented value, evaluated after the store.
  ; For %lim.0 <= 2 the loop therefore runs exactly once, which matches the
  ; umax(%lim.0, 2) in the expected length computation.
50  %cmp64 = icmp ult i32 %iv.next, %lim.0
51  br i1 %cmp64, label %for.body, label %exit
52
53exit:
54  ret void
55}
56