; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
; RUN: opt < %s -passes=div-rem-pairs -S -mtriple=powerpc64-unknown-unknown | FileCheck %s

; External function; the two tests below pass it the remainder and the quotient.
declare void @foo(i32, i32)

; Signed quotient plus a remainder that is already written out as
; a - (a / b) * b, all in a single basic block.
; The assertions expect the instructions to come out unchanged.
define void @decompose_illegal_srem_same_block(i32 %a, i32 %b) {
; CHECK-LABEL: @decompose_illegal_srem_same_block(
; CHECK-NEXT:    [[DIV:%.*]] = sdiv i32 [[A:%.*]], [[B:%.*]]
; CHECK-NEXT:    [[T0:%.*]] = mul i32 [[DIV]], [[B]]
; CHECK-NEXT:    [[REM:%.*]] = sub i32 [[A]], [[T0]]
; CHECK-NEXT:    call void @foo(i32 [[REM]], i32 [[DIV]])
; CHECK-NEXT:    ret void
;
  %div = sdiv i32 %a, %b
  %t0 = mul i32 %div, %b
  %rem = sub i32 %a, %t0
  call void @foo(i32 %rem, i32 %div)
  ret void
}

; Unsigned counterpart of the test above (udiv instead of sdiv).
; The assertions again expect the instructions to come out unchanged.
define void @decompose_illegal_urem_same_block(i32 %a, i32 %b) {
; CHECK-LABEL: @decompose_illegal_urem_same_block(
; CHECK-NEXT:    [[DIV:%.*]] = udiv i32 [[A:%.*]], [[B:%.*]]
; CHECK-NEXT:    [[T0:%.*]] = mul i32 [[DIV]], [[B]]
; CHECK-NEXT:    [[REM:%.*]] = sub i32 [[A]], [[T0]]
; CHECK-NEXT:    call void @foo(i32 [[REM]], i32 [[DIV]])
; CHECK-NEXT:    ret void
;
  %div = udiv i32 %a, %b
  %t0 = mul i32 %div, %b
  %rem = sub i32 %a, %t0
  call void @foo(i32 %rem, i32 %div)
  ret void
}

; Recompose and hoist the srem if it's safe and free, otherwise keep as-is.
; The sdiv lives in the entry block and the expanded remainder (mul + sub) in
; the conditional `if` block. The assertions expect the mul/sub to stay in
; `if`, i.e. the output is identical to the input.
define i16 @hoist_srem(i16 %a, i16 %b) {
; CHECK-LABEL: @hoist_srem(
; CHECK-NEXT:  entry:
; CHECK-NEXT:    [[DIV:%.*]] = sdiv i16 [[A:%.*]], [[B:%.*]]
; CHECK-NEXT:    [[CMP:%.*]] = icmp eq i16 [[DIV]], 42
; CHECK-NEXT:    br i1 [[CMP]], label [[IF:%.*]], label [[END:%.*]]
; CHECK:       if:
; CHECK-NEXT:    [[T0:%.*]] = mul i16 [[DIV]], [[B]]
; CHECK-NEXT:    [[REM:%.*]] = sub i16 [[A]], [[T0]]
; CHECK-NEXT:    br label [[END]]
; CHECK:       end:
; CHECK-NEXT:    [[RET:%.*]] = phi i16 [ [[REM]], [[IF]] ], [ 3, [[ENTRY:%.*]] ]
; CHECK-NEXT:    ret i16 [[RET]]
;
entry:
  %div = sdiv i16 %a, %b
  %cmp = icmp eq i16 %div, 42
  br i1 %cmp, label %if, label %end

if:
  %t0 = mul i16 %div, %b
  %rem = sub i16 %a, %t0
  br label %end

end:
  %ret = phi i16 [ %rem, %if ], [ 3, %entry ]
  ret i16 %ret
}

; Recompose and hoist the urem if it's safe and free, otherwise keep as-is.
; Unsigned i8 variant of @hoist_srem; the assertions likewise expect the
; expanded remainder to stay in the `if` block.

define i8 @hoist_urem(i8 %a, i8 %b) {
; CHECK-LABEL: @hoist_urem(
; CHECK-NEXT:  entry:
; CHECK-NEXT:    [[DIV:%.*]] = udiv i8 [[A:%.*]], [[B:%.*]]
; CHECK-NEXT:    [[CMP:%.*]] = icmp eq i8 [[DIV]], 42
; CHECK-NEXT:    br i1 [[CMP]], label [[IF:%.*]], label [[END:%.*]]
; CHECK:       if:
; CHECK-NEXT:    [[T0:%.*]] = mul i8 [[DIV]], [[B]]
; CHECK-NEXT:    [[REM:%.*]] = sub i8 [[A]], [[T0]]
; CHECK-NEXT:    br label [[END]]
; CHECK:       end:
; CHECK-NEXT:    [[RET:%.*]] = phi i8 [ [[REM]], [[IF]] ], [ 3, [[ENTRY:%.*]] ]
; CHECK-NEXT:    ret i8 [[RET]]
;
entry:
  %div = udiv i8 %a, %b
  %cmp = icmp eq i8 %div, 42
  br i1 %cmp, label %if, label %end

if:
  %t0 = mul i8 %div, %b
  %rem = sub i8 %a, %t0
  br label %end

end:
  %ret = phi i8 [ %rem, %if ], [ 3, %entry ]
  ret i8 %ret
}

; Be careful with RAUW/invalidation if this is a srem-of-srem.
; Two sdiv/srem pairs, where the dividend of the second pair is the first
; srem (%t3). The assertions expect each srem to be replaced by a mul + sub
; built from frozen operands: %X, the %t0 product and %Y each get a freeze,
; and the sdivs consume the frozen values. The original %t2/%t5 multiplies
; remain in the output.
define i32 @srem_of_srem_unexpanded(i32 %X, i32 %Y, i32 %Z) {
; CHECK-LABEL: @srem_of_srem_unexpanded(
; CHECK-NEXT:    [[T0:%.*]] = mul nsw i32 [[Z:%.*]], [[Y:%.*]]
; CHECK-NEXT:    [[X_FROZEN:%.*]] = freeze i32 [[X:%.*]]
; CHECK-NEXT:    [[T0_FROZEN:%.*]] = freeze i32 [[T0]]
; CHECK-NEXT:    [[T1:%.*]] = sdiv i32 [[X_FROZEN]], [[T0_FROZEN]]
; CHECK-NEXT:    [[T2:%.*]] = mul nsw i32 [[T0]], [[T1]]
; CHECK-NEXT:    [[TMP1:%.*]] = mul i32 [[T1]], [[T0_FROZEN]]
; CHECK-NEXT:    [[T3_DECOMPOSED:%.*]] = sub i32 [[X_FROZEN]], [[TMP1]]
; CHECK-NEXT:    [[Y_FROZEN:%.*]] = freeze i32 [[Y]]
; CHECK-NEXT:    [[T4:%.*]] = sdiv i32 [[T3_DECOMPOSED]], [[Y_FROZEN]]
; CHECK-NEXT:    [[T5:%.*]] = mul nsw i32 [[T4]], [[Y]]
; CHECK-NEXT:    [[TMP2:%.*]] = mul i32 [[T4]], [[Y_FROZEN]]
; CHECK-NEXT:    [[T6_DECOMPOSED:%.*]] = sub i32 [[T3_DECOMPOSED]], [[TMP2]]
; CHECK-NEXT:    ret i32 [[T6_DECOMPOSED]]
;
  %t0 = mul nsw i32 %Z, %Y
  %t1 = sdiv i32 %X, %t0
  %t2 = mul nsw i32 %t0, %t1
  %t3 = srem i32 %X, %t0
  %t4 = sdiv i32 %t3, %Y
  %t5 = mul nsw i32 %t4, %Y
  %t6 = srem i32 %t3, %Y
  ret i32 %t6
}
; Same chain as @srem_of_srem_unexpanded, but both remainders are already
; written as `sub nsw` of the corresponding `mul nsw`. The assertions expect
; the instructions to come out unchanged (no freeze, no extra mul/sub).
define i32 @srem_of_srem_expanded(i32 %X, i32 %Y, i32 %Z) {
; CHECK-LABEL: @srem_of_srem_expanded(
; CHECK-NEXT:    [[T0:%.*]] = mul nsw i32 [[Z:%.*]], [[Y:%.*]]
; CHECK-NEXT:    [[T1:%.*]] = sdiv i32 [[X:%.*]], [[T0]]
; CHECK-NEXT:    [[T2:%.*]] = mul nsw i32 [[T0]], [[T1]]
; CHECK-NEXT:    [[T3:%.*]] = sub nsw i32 [[X]], [[T2]]
; CHECK-NEXT:    [[T4:%.*]] = sdiv i32 [[T3]], [[Y]]
; CHECK-NEXT:    [[T5:%.*]] = mul nsw i32 [[T4]], [[Y]]
; CHECK-NEXT:    [[T6:%.*]] = sub nsw i32 [[T3]], [[T5]]
; CHECK-NEXT:    ret i32 [[T6]]
;
  %t0 = mul nsw i32 %Z, %Y
  %t1 = sdiv i32 %X, %t0
  %t2 = mul nsw i32 %t0, %t1
  %t3 = sub nsw i32 %X, %t2
  %t4 = sdiv i32 %t3, %Y
  %t5 = mul nsw i32 %t4, %Y
  %t6 = sub nsw i32 %t3, %t5
  ret i32 %t6
}

; If the target doesn't have a unified div/rem op for the type, keep the
; decomposed rem.

; i128 udiv in the entry block with its expanded remainder (mul + sub) in the
; conditional `if` block. The assertions expect the mul/sub to remain in `if`,
; i.e. the output is identical to the input.
define i128 @dont_hoist_urem(i128 %a, i128 %b) {
; CHECK-LABEL: @dont_hoist_urem(
; CHECK-NEXT:  entry:
; CHECK-NEXT:    [[DIV:%.*]] = udiv i128 [[A:%.*]], [[B:%.*]]
; CHECK-NEXT:    [[CMP:%.*]] = icmp eq i128 [[DIV]], 42
; CHECK-NEXT:    br i1 [[CMP]], label [[IF:%.*]], label [[END:%.*]]
; CHECK:       if:
; CHECK-NEXT:    [[T0:%.*]] = mul i128 [[DIV]], [[B]]
; CHECK-NEXT:    [[REM:%.*]] = sub i128 [[A]], [[T0]]
; CHECK-NEXT:    br label [[END]]
; CHECK:       end:
; CHECK-NEXT:    [[RET:%.*]] = phi i128 [ [[REM]], [[IF]] ], [ 3, [[ENTRY:%.*]] ]
; CHECK-NEXT:    ret i128 [[RET]]
;
entry:
  %div = udiv i128 %a, %b
  %cmp = icmp eq i128 %div, 42
  br i1 %cmp, label %if, label %end

if:
  %t0 = mul i128 %div, %b
  %rem = sub i128 %a, %t0
  br label %end

end:
  %ret = phi i128 [ %rem, %if ], [ 3, %entry ]
  ret i128 %ret
}