xref: /llvm-project/llvm/test/Transforms/InstCombine/memcmp-3.ll (revision 90ba33099cbb17e7c159e9ebc5a512037db99d6d)
1; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
2; Verify that calls to memcmp with arrays of elements larger than char
3; are folded correctly.
4; RUN: opt < %s -passes=instcombine -S -data-layout="E" | FileCheck %s --check-prefixes=BE
5; RUN: opt < %s -passes=instcombine -S -data-layout="e" | FileCheck %s --check-prefixes=LE
6
7declare i32 @memcmp(ptr, ptr, i64)
8
9; BE representation: { 'a', 'b', 'c', ..., 'f', 'g', 'h' }
10; LE representation: { 'b', 'a', 'd', ..., 'e', 'h', 'g' }
11@ia16a = constant [4 x i16] [i16 24930, i16 25444, i16 25958, i16 26472]
12
13; Same as the BE representation above except ending in "gg".
14@i8a = constant [8 x i8] c"abcdefgg"
15
16; Fold memcmp(ia16a, i8a, N) for N in [0, 8].
17
18define void @fold_memcmp_ia16a_i8a(ptr %pcmp) {
19; BE-LABEL: @fold_memcmp_ia16a_i8a(
20; BE-NEXT:    store i32 0, ptr [[PCMP:%.*]], align 4
21; BE-NEXT:    [[PSTOR1:%.*]] = getelementptr i8, ptr [[PCMP]], i64 4
22; BE-NEXT:    store i32 0, ptr [[PSTOR1]], align 4
23; BE-NEXT:    [[PSTOR2:%.*]] = getelementptr i8, ptr [[PCMP]], i64 8
24; BE-NEXT:    store i32 0, ptr [[PSTOR2]], align 4
25; BE-NEXT:    [[PSTOR3:%.*]] = getelementptr i8, ptr [[PCMP]], i64 12
26; BE-NEXT:    store i32 0, ptr [[PSTOR3]], align 4
27; BE-NEXT:    [[PSTOR4:%.*]] = getelementptr i8, ptr [[PCMP]], i64 16
28; BE-NEXT:    store i32 0, ptr [[PSTOR4]], align 4
29; BE-NEXT:    [[PSTOR5:%.*]] = getelementptr i8, ptr [[PCMP]], i64 20
30; BE-NEXT:    store i32 0, ptr [[PSTOR5]], align 4
31; BE-NEXT:    [[PSTOR6:%.*]] = getelementptr i8, ptr [[PCMP]], i64 24
32; BE-NEXT:    store i32 0, ptr [[PSTOR6]], align 4
33; BE-NEXT:    [[PSTOR7:%.*]] = getelementptr i8, ptr [[PCMP]], i64 28
34; BE-NEXT:    store i32 0, ptr [[PSTOR7]], align 4
35; BE-NEXT:    [[PSTOR8:%.*]] = getelementptr i8, ptr [[PCMP]], i64 32
36; BE-NEXT:    store i32 1, ptr [[PSTOR8]], align 4
37; BE-NEXT:    ret void
38;
39; LE-LABEL: @fold_memcmp_ia16a_i8a(
40; LE-NEXT:    store i32 0, ptr [[PCMP:%.*]], align 4
41; LE-NEXT:    [[PSTOR1:%.*]] = getelementptr i8, ptr [[PCMP]], i64 4
42; LE-NEXT:    store i32 1, ptr [[PSTOR1]], align 4
43; LE-NEXT:    [[PSTOR2:%.*]] = getelementptr i8, ptr [[PCMP]], i64 8
44; LE-NEXT:    store i32 1, ptr [[PSTOR2]], align 4
45; LE-NEXT:    [[PSTOR3:%.*]] = getelementptr i8, ptr [[PCMP]], i64 12
46; LE-NEXT:    store i32 1, ptr [[PSTOR3]], align 4
47; LE-NEXT:    [[PSTOR4:%.*]] = getelementptr i8, ptr [[PCMP]], i64 16
48; LE-NEXT:    store i32 1, ptr [[PSTOR4]], align 4
49; LE-NEXT:    [[PSTOR5:%.*]] = getelementptr i8, ptr [[PCMP]], i64 20
50; LE-NEXT:    store i32 1, ptr [[PSTOR5]], align 4
51; LE-NEXT:    [[PSTOR6:%.*]] = getelementptr i8, ptr [[PCMP]], i64 24
52; LE-NEXT:    store i32 1, ptr [[PSTOR6]], align 4
53; LE-NEXT:    [[PSTOR7:%.*]] = getelementptr i8, ptr [[PCMP]], i64 28
54; LE-NEXT:    store i32 1, ptr [[PSTOR7]], align 4
55; LE-NEXT:    [[PSTOR8:%.*]] = getelementptr i8, ptr [[PCMP]], i64 32
56; LE-NEXT:    store i32 1, ptr [[PSTOR8]], align 4
57; LE-NEXT:    ret void
58;
59
60  %cmp0 = call i32 @memcmp(ptr @ia16a, ptr @i8a, i64 0)
61  store i32 %cmp0, ptr %pcmp
62
63  %cmp1 = call i32 @memcmp(ptr @ia16a, ptr @i8a, i64 1)
64  %pstor1 = getelementptr i32, ptr %pcmp, i64 1
65  store i32 %cmp1, ptr %pstor1
66
67  %cmp2 = call i32 @memcmp(ptr @ia16a, ptr @i8a, i64 2)
68  %pstor2 = getelementptr i32, ptr %pcmp, i64 2
69  store i32 %cmp2, ptr %pstor2
70
71  %cmp3 = call i32 @memcmp(ptr @ia16a, ptr @i8a, i64 3)
72  %pstor3 = getelementptr i32, ptr %pcmp, i64 3
73  store i32 %cmp3, ptr %pstor3
74
75  %cmp4 = call i32 @memcmp(ptr @ia16a, ptr @i8a, i64 4)
76  %pstor4 = getelementptr i32, ptr %pcmp, i64 4
77  store i32 %cmp4, ptr %pstor4
78
79  %cmp5 = call i32 @memcmp(ptr @ia16a, ptr @i8a, i64 5)
80  %pstor5 = getelementptr i32, ptr %pcmp, i64 5
81  store i32 %cmp5, ptr %pstor5
82
83  %cmp6 = call i32 @memcmp(ptr @ia16a, ptr @i8a, i64 6)
84  %pstor6 = getelementptr i32, ptr %pcmp, i64 6
85  store i32 %cmp6, ptr %pstor6
86
87  %cmp7 = call i32 @memcmp(ptr @ia16a, ptr @i8a, i64 7)
88  %pstor7 = getelementptr i32, ptr %pcmp, i64 7
89  store i32 %cmp7, ptr %pstor7
90
91  %cmp8 = call i32 @memcmp(ptr @ia16a, ptr @i8a, i64 8)
92  %pstor8 = getelementptr i32, ptr %pcmp, i64 8
93  store i32 %cmp8, ptr %pstor8
94
95  ret void
96}
97
98
99; Fold memcmp(ia16a + 1, i8a + 2, N) for N in [0, 6].
100
101define void @fold_memcmp_ia16a_p1_i8a_p1(ptr %pcmp) {
102; BE-LABEL: @fold_memcmp_ia16a_p1_i8a_p1(
103; BE-NEXT:    store i32 0, ptr [[PCMP:%.*]], align 4
104; BE-NEXT:    [[PSTOR1:%.*]] = getelementptr i8, ptr [[PCMP]], i64 4
105; BE-NEXT:    store i32 1, ptr [[PSTOR1]], align 4
106; BE-NEXT:    [[PSTOR2:%.*]] = getelementptr i8, ptr [[PCMP]], i64 8
107; BE-NEXT:    store i32 1, ptr [[PSTOR2]], align 4
108; BE-NEXT:    [[PSTOR3:%.*]] = getelementptr i8, ptr [[PCMP]], i64 12
109; BE-NEXT:    store i32 1, ptr [[PSTOR3]], align 4
110; BE-NEXT:    [[PSTOR4:%.*]] = getelementptr i8, ptr [[PCMP]], i64 16
111; BE-NEXT:    store i32 1, ptr [[PSTOR4]], align 4
112; BE-NEXT:    [[PSTOR5:%.*]] = getelementptr i8, ptr [[PCMP]], i64 20
113; BE-NEXT:    store i32 1, ptr [[PSTOR5]], align 4
114; BE-NEXT:    [[PSTOR6:%.*]] = getelementptr i8, ptr [[PCMP]], i64 24
115; BE-NEXT:    store i32 1, ptr [[PSTOR6]], align 4
116; BE-NEXT:    ret void
117;
118; LE-LABEL: @fold_memcmp_ia16a_p1_i8a_p1(
119; LE-NEXT:    store i32 0, ptr [[PCMP:%.*]], align 4
120; LE-NEXT:    [[PSTOR1:%.*]] = getelementptr i8, ptr [[PCMP]], i64 4
121; LE-NEXT:    store i32 1, ptr [[PSTOR1]], align 4
122; LE-NEXT:    [[PSTOR2:%.*]] = getelementptr i8, ptr [[PCMP]], i64 8
123; LE-NEXT:    store i32 1, ptr [[PSTOR2]], align 4
124; LE-NEXT:    [[PSTOR3:%.*]] = getelementptr i8, ptr [[PCMP]], i64 12
125; LE-NEXT:    store i32 1, ptr [[PSTOR3]], align 4
126; LE-NEXT:    [[PSTOR4:%.*]] = getelementptr i8, ptr [[PCMP]], i64 16
127; LE-NEXT:    store i32 1, ptr [[PSTOR4]], align 4
128; LE-NEXT:    [[PSTOR5:%.*]] = getelementptr i8, ptr [[PCMP]], i64 20
129; LE-NEXT:    store i32 1, ptr [[PSTOR5]], align 4
130; LE-NEXT:    [[PSTOR6:%.*]] = getelementptr i8, ptr [[PCMP]], i64 24
131; LE-NEXT:    store i32 1, ptr [[PSTOR6]], align 4
132; LE-NEXT:    ret void
133;
134  %p0 = getelementptr [4 x i16], ptr @ia16a, i64 0, i64 1
135  %q = getelementptr [8 x i8], ptr @i8a, i64 0, i64 1
136
137  %cmp0 = call i32 @memcmp(ptr %p0, ptr %q, i64 0)
138  store i32 %cmp0, ptr %pcmp
139
140  %cmp1 = call i32 @memcmp(ptr %p0, ptr %q, i64 1)
141  %pstor1 = getelementptr i32, ptr %pcmp, i64 1
142  store i32 %cmp1, ptr %pstor1
143
144  %cmp2 = call i32 @memcmp(ptr %p0, ptr %q, i64 2)
145  %pstor2 = getelementptr i32, ptr %pcmp, i64 2
146  store i32 %cmp2, ptr %pstor2
147
148  %cmp3 = call i32 @memcmp(ptr %p0, ptr %q, i64 3)
149  %pstor3 = getelementptr i32, ptr %pcmp, i64 3
150  store i32 %cmp3, ptr %pstor3
151
152  %cmp4 = call i32 @memcmp(ptr %p0, ptr %q, i64 4)
153  %pstor4 = getelementptr i32, ptr %pcmp, i64 4
154  store i32 %cmp4, ptr %pstor4
155
156  %cmp5 = call i32 @memcmp(ptr %p0, ptr %q, i64 5)
157  %pstor5 = getelementptr i32, ptr %pcmp, i64 5
158  store i32 %cmp5, ptr %pstor5
159
160  %cmp6 = call i32 @memcmp(ptr %p0, ptr %q, i64 6)
161  %pstor6 = getelementptr i32, ptr %pcmp, i64 6
162  store i32 %cmp6, ptr %pstor6
163
164  ret void
165}
166