; RUN: llc -verify-machineinstrs < %s | FileCheck %s
;
; Regression test for PowerPC hardware-loop (CTR loop) formation.
;
; @halide_double_to_string already contains a hardware loop that is written
; directly with the @llvm.set.loop.iterations / @llvm.loop.decrement intrinsics
; (blocks for.body.116.preheader and for.body.116). That loop is nested inside
; another counted loop (for.cond.112.preheader .. if.end.138). The backend must
; not turn any further loop of this function into a hardware loop, so the
; generated assembly is expected to contain exactly one counter-register setup.
;
; ModuleID = 'new.bc'
target datalayout = "e-m:e-i64:64-n32:64"
target triple = "powerpc64le--linux-gnu"

; String constants passed to @halide_string_to_string. They are external, so
; their contents are not visible in this file.
@.str.87 = external hidden unnamed_addr constant [5 x i8], align 1
@.str.1.88 = external hidden unnamed_addr constant [4 x i8], align 1
@.str.2.89 = external hidden unnamed_addr constant [5 x i8], align 1
@.str.3.90 = external hidden unnamed_addr constant [4 x i8], align 1
@.str.4.91 = external hidden unnamed_addr constant [14 x i8], align 1
@.str.5.92 = external hidden unnamed_addr constant [13 x i8], align 1
@.str.6.93 = external hidden unnamed_addr constant [10 x i8], align 1
@.str.7.94 = external hidden unnamed_addr constant [9 x i8], align 1
@.str.8.95 = external hidden unnamed_addr constant [2 x i8], align 1
@.str.9.96 = external hidden unnamed_addr constant [2 x i8], align 1
@.str.10.97 = external hidden unnamed_addr constant [3 x i8], align 1
@.str.11.98 = external hidden unnamed_addr constant [3 x i8], align 1

; Function Attrs: nounwind
declare void @llvm.lifetime.start.p0(i64, ptr nocapture) #0

; Function Attrs: nounwind
declare void @llvm.lifetime.end.p0(i64, ptr nocapture) #0

; Function Attrs: nounwind
declare ptr @halide_string_to_string(ptr, ptr, ptr) #1

; Function Attrs: nounwind
declare ptr @halide_int64_to_string(ptr, ptr, i64, i32) #1

;; Hardware loop should not be generated in the loop that already has a user
;; defined hardware loop. Only one mtctr should be in the final assembly.
;; The counted directive alone only requires at least one match, so it is
;; followed by a negative directive that rejects any additional occurrence.
; CHECK-LABEL: halide_double_to_string
; CHECK-COUNT-1: mtctr
; CHECK-NOT: mtctr

; Function Attrs: nounwind
define weak ptr @halide_double_to_string(ptr %dst, ptr %end, double %arg, i32 %scientific) #1 {
entry:
  %arg.addr = alloca double, align 8
  %bits = alloca i64, align 8
  %buf = alloca [512 x i8], align 1
  store double %arg, ptr %arg.addr, align 8, !tbaa !4
  call void @llvm.lifetime.start.p0(i64 8, ptr %bits) #0
  store i64 0, ptr %bits, align 8, !tbaa !8
  ; Copy the 8 bytes of %arg into %bits and split the resulting i64 into its
  ; low 52 bits (%and), the 11 bits above them (%conv) and the top bit (%conv3).
  %call = call ptr @memcpy(ptr %bits, ptr %arg.addr, i64 8) #2
  %0 = load i64, ptr %bits, align 8, !tbaa !8
  %and = and i64 %0, 4503599627370495
  %shr = lshr i64 %0, 52
  %shr.tr = trunc i64 %shr to i32
  %conv = and i32 %shr.tr, 2047
  %shr2 = lshr i64 %0, 63
  %conv3 = trunc i64 %shr2 to i32
  ; All-ones 11-bit field: emit one of four fixed strings and return.
  %cmp = icmp eq i32 %conv, 2047
  br i1 %cmp, label %if.then, label %if.else.15

if.then:  ; preds = %entry
  %tobool = icmp eq i64 %and, 0
  %tobool5 = icmp ne i32 %conv3, 0
  br i1 %tobool, label %if.else.9, label %if.then.4

if.then.4:  ; preds = %if.then
  br i1 %tobool5, label %if.then.6, label %if.else

if.then.6:  ; preds = %if.then.4
  %call7 = call ptr @halide_string_to_string(ptr %dst, ptr %end, ptr @.str.87) #3
  br label %cleanup.148

if.else:  ; preds = %if.then.4
  %call8 = call ptr @halide_string_to_string(ptr %dst, ptr %end, ptr @.str.1.88) #3
  br label %cleanup.148

if.else.9:  ; preds = %if.then
  br i1 %tobool5, label %if.then.11, label %if.else.13

if.then.11:  ; preds = %if.else.9
  %call12 = call ptr @halide_string_to_string(ptr %dst, ptr %end, ptr @.str.2.89) #3
  br label %cleanup.148

if.else.13:  ; preds = %if.else.9
  %call14 = call ptr @halide_string_to_string(ptr %dst, ptr %end, ptr @.str.3.90) #3
  br label %cleanup.148

if.else.15:  ; preds = %entry
  ; Both bit fields zero: emit one of four fixed strings, selected by
  ; %scientific and the top bit, and return.
  %cmp16 = icmp eq i32 %conv, 0
  %cmp17 = icmp eq i64 %and, 0
  %or.cond = and i1 %cmp17, %cmp16
  br i1 %or.cond, label %if.then.18, label %if.end.32

if.then.18:  ; preds = %if.else.15
  %tobool19 = icmp eq i32 %scientific, 0
  %tobool21 = icmp ne i32 %conv3, 0
  br i1 %tobool19, label %if.else.26, label %if.then.20

if.then.20:  ; preds = %if.then.18
  br i1 %tobool21, label %if.then.22, label %if.else.24

if.then.22:  ; preds = %if.then.20
  %call23 = call ptr @halide_string_to_string(ptr %dst, ptr %end, ptr @.str.4.91) #3
  br label %cleanup.148

if.else.24:  ; preds = %if.then.20
  %call25 = call ptr @halide_string_to_string(ptr %dst, ptr %end, ptr @.str.5.92) #3
  br label %cleanup.148

if.else.26:  ; preds = %if.then.18
  br i1 %tobool21, label %if.then.28, label %if.else.30

if.then.28:  ; preds = %if.else.26
  %call29 = call ptr @halide_string_to_string(ptr %dst, ptr %end, ptr @.str.6.93) #3
  br label %cleanup.148

if.else.30:  ; preds = %if.else.26
  %call31 = call ptr @halide_string_to_string(ptr %dst, ptr %end, ptr @.str.7.94) #3
  br label %cleanup.148

if.end.32:  ; preds = %if.else.15
  %tobool33 = icmp eq i32 %conv3, 0
  br i1 %tobool33, label %if.end.37, label %if.then.34

if.then.34:  ; preds = %if.end.32
  ; Top bit set: emit @.str.8.95 and continue with the negated value.
  %call35 = call ptr @halide_string_to_string(ptr %dst, ptr %end, ptr @.str.8.95) #3
  %sub36 = fsub double -0.000000e+00, %arg
  store double %sub36, ptr %arg.addr, align 8, !tbaa !4
  br label %if.end.37

if.end.37:  ; preds = %if.then.34, %if.end.32
  %.pr = phi double [ %sub36, %if.then.34 ], [ %arg, %if.end.32 ]
  %dst.addr.0 = phi ptr [ %call35, %if.then.34 ], [ %dst, %if.end.32 ]
  %tobool38 = icmp eq i32 %scientific, 0
  br i1 %tobool38, label %if.else.62, label %while.condthread-pre-split

while.condthread-pre-split:  ; preds = %if.end.37
  %cmp40.261 = fcmp olt double %.pr, 1.000000e+00
  br i1 %cmp40.261, label %while.body, label %while.cond.41thread-pre-split

; Loop 1: multiply by 10 while the value is below 1.0, counting the exponent
; down. The exit condition is a floating-point compare.
while.body:  ; preds = %while.body, %while.condthread-pre-split
  %exponent_base_10.0262 = phi i32 [ %dec, %while.body ], [ 0, %while.condthread-pre-split ]
  %1 = phi double [ %mul, %while.body ], [ %.pr, %while.condthread-pre-split ]
  %mul = fmul double %1, 1.000000e+01
  %dec = add nsw i32 %exponent_base_10.0262, -1
  %cmp40 = fcmp olt double %mul, 1.000000e+00
  br i1 %cmp40, label %while.body, label %while.cond.while.cond.41thread-pre-split_crit_edge

while.cond.while.cond.41thread-pre-split_crit_edge:  ; preds = %while.body
  store double %mul, ptr %arg.addr, align 8, !tbaa !4
  br label %while.cond.41thread-pre-split

while.cond.41thread-pre-split:  ; preds = %while.cond.while.cond.41thread-pre-split_crit_edge, %while.condthread-pre-split
  %.pr246 = phi double [ %mul, %while.cond.while.cond.41thread-pre-split_crit_edge ], [ %.pr, %while.condthread-pre-split ]
  %exponent_base_10.0.lcssa = phi i32 [ %dec, %while.cond.while.cond.41thread-pre-split_crit_edge ], [ 0, %while.condthread-pre-split ]
  %cmp42.257 = fcmp ult double %.pr246, 1.000000e+01
  br i1 %cmp42.257, label %while.end.44, label %while.body.43

; Loop 2: divide by 10 until the value compares (unordered or) below 10.0,
; counting the exponent up. The exit condition is a floating-point compare.
while.body.43:  ; preds = %while.body.43, %while.cond.41thread-pre-split
  %exponent_base_10.1258 = phi i32 [ %inc, %while.body.43 ], [ %exponent_base_10.0.lcssa, %while.cond.41thread-pre-split ]
  %2 = phi double [ %div, %while.body.43 ], [ %.pr246, %while.cond.41thread-pre-split ]
  %div = fdiv double %2, 1.000000e+01
  %inc = add nsw i32 %exponent_base_10.1258, 1
  %cmp42 = fcmp ult double %div, 1.000000e+01
  br i1 %cmp42, label %while.cond.41.while.end.44_crit_edge, label %while.body.43

while.cond.41.while.end.44_crit_edge:  ; preds = %while.body.43
  store double %div, ptr %arg.addr, align 8, !tbaa !4
  br label %while.end.44

while.end.44:  ; preds = %while.cond.41.while.end.44_crit_edge, %while.cond.41thread-pre-split
  %exponent_base_10.1.lcssa = phi i32 [ %inc, %while.cond.41.while.end.44_crit_edge ], [ %exponent_base_10.0.lcssa, %while.cond.41thread-pre-split ]
  %.lcssa = phi double [ %div, %while.cond.41.while.end.44_crit_edge ], [ %.pr246, %while.cond.41thread-pre-split ]
  ; Scale by 1e6, round by adding 0.5, then split into quotient and remainder
  ; modulo 1000000 and print both parts separated by @.str.9.96.
  %mul45 = fmul double %.lcssa, 1.000000e+06
  %add = fadd double %mul45, 5.000000e-01
  %conv46 = fptoui double %add to i64
  %div47 = udiv i64 %conv46, 1000000
  %3 = mul i64 %div47, -1000000
  %sub49 = add i64 %conv46, %3
  %call50 = call ptr @halide_int64_to_string(ptr %dst.addr.0, ptr %end, i64 %div47, i32 1) #3
  %call51 = call ptr @halide_string_to_string(ptr %call50, ptr %end, ptr @.str.9.96) #3
  %call52 = call ptr @halide_int64_to_string(ptr %call51, ptr %end, i64 %sub49, i32 6) #3
  %cmp53 = icmp sgt i32 %exponent_base_10.1.lcssa, -1
  br i1 %cmp53, label %if.then.54, label %if.else.56

if.then.54:  ; preds = %while.end.44
  %call55 = call ptr @halide_string_to_string(ptr %call52, ptr %end, ptr @.str.10.97) #3
  br label %if.end.59

if.else.56:  ; preds = %while.end.44
  %call57 = call ptr @halide_string_to_string(ptr %call52, ptr %end, ptr @.str.11.98) #3
  %sub58 = sub nsw i32 0, %exponent_base_10.1.lcssa
  br label %if.end.59

if.end.59:  ; preds = %if.else.56, %if.then.54
  %exponent_base_10.2 = phi i32 [ %exponent_base_10.1.lcssa, %if.then.54 ], [ %sub58, %if.else.56 ]
  %dst.addr.1 = phi ptr [ %call55, %if.then.54 ], [ %call57, %if.else.56 ]
  %conv60 = sext i32 %exponent_base_10.2 to i64
  %call61 = call ptr @halide_int64_to_string(ptr %dst.addr.1, ptr %end, i64 %conv60, i32 2) #3
  br label %cleanup.148

if.else.62:  ; preds = %if.end.37
  br i1 %cmp16, label %if.then.64, label %if.end.66

if.then.64:  ; preds = %if.else.62
  ; 11-bit field is zero: recurse with the constant 0.0 in non-scientific mode.
  %call65 = call ptr @halide_double_to_string(ptr %dst.addr.0, ptr %end, double 0.000000e+00, i32 0) #3
  br label %cleanup.148

if.end.66:  ; preds = %if.else.62
  %add68 = or i64 %and, 4503599627370496
  %sub70 = add nsw i32 %conv, -1075
  %cmp71 = icmp ult i32 %conv, 1075
  br i1 %cmp71, label %if.then.72, label %if.end.105

if.then.72:  ; preds = %if.end.66
  %cmp73 = icmp slt i32 %sub70, -52
  br i1 %cmp73, label %if.end.84, label %if.else.76

if.else.76:  ; preds = %if.then.72
  %sub77 = sub nsw i32 1075, %conv
  %sh_prom = zext i32 %sub77 to i64
  %shr78 = lshr i64 %add68, %sh_prom
  %shl81 = shl i64 %shr78, %sh_prom
  %sub82 = sub i64 %add68, %shl81
  br label %if.end.84

if.end.84:  ; preds = %if.else.76, %if.then.72
  %integer_part.0 = phi i64 [ %shr78, %if.else.76 ], [ 0, %if.then.72 ]
  %f.0.in = phi i64 [ %sub82, %if.else.76 ], [ %add68, %if.then.72 ]
  %f.0 = uitofp i64 %f.0.in to double
  %conv85.244 = zext i32 %sub70 to i64
  %shl86 = shl i64 %conv85.244, 52
  %add88 = add i64 %shl86, 4696837146684686336
  %4 = bitcast i64 %add88 to double
  %mul90 = fmul double %4, %f.0
  %add91 = fadd double %mul90, 5.000000e-01
  %conv92 = fptoui double %add91 to i64
  %conv93 = uitofp i64 %conv92 to double
  %and96 = and i64 %conv92, 1
  ; Subtract one when the rounded value is exact and odd.
  %notlhs = fcmp oeq double %conv93, %add91
  %notrhs = icmp ne i64 %and96, 0
  %not.or.cond245 = and i1 %notrhs, %notlhs
  %dec99 = sext i1 %not.or.cond245 to i64
  %fractional_part.0 = add i64 %dec99, %conv92
  ; A fractional part of exactly 1000000 carries into the integer part.
  %cmp101 = icmp eq i64 %fractional_part.0, 1000000
  %inc103 = zext i1 %cmp101 to i64
  %inc103.integer_part.0 = add i64 %inc103, %integer_part.0
  %.fractional_part.0 = select i1 %cmp101, i64 0, i64 %fractional_part.0
  br label %if.end.105

if.end.105:  ; preds = %if.end.84, %if.end.66
  %integer_part.2 = phi i64 [ %inc103.integer_part.0, %if.end.84 ], [ %add68, %if.end.66 ]
  %integer_exponent.0 = phi i32 [ 0, %if.end.84 ], [ %sub70, %if.end.66 ]
  %fractional_part.2 = phi i64 [ %.fractional_part.0, %if.end.84 ], [ 0, %if.end.66 ]
  call void @llvm.lifetime.start.p0(i64 512, ptr %buf) #0
  %add.ptr = getelementptr inbounds [512 x i8], ptr %buf, i64 0, i64 512
  %add.ptr106 = getelementptr inbounds [512 x i8], ptr %buf, i64 0, i64 480
  ; Print the integer part into %buf starting at offset 480.
  %call109 = call ptr @halide_int64_to_string(ptr %add.ptr106, ptr %add.ptr, i64 %integer_part.2, i32 1) #3
  %cmp110.252 = icmp sgt i32 %integer_exponent.0, 0
  br i1 %cmp110.252, label %for.cond.112.preheader, label %for.cond.cleanup

; Outer loop: runs %integer_exponent.0 times; each iteration doubles the decimal
; digit string in %buf in place using the inner loop below.
for.cond.112.preheader:  ; preds = %if.end.138, %if.end.105
  %i.0255 = phi i32 [ %inc140, %if.end.138 ], [ 0, %if.end.105 ]
  %int_part_ptr.0253 = phi ptr [ %int_part_ptr.1, %if.end.138 ], [ %add.ptr106, %if.end.105 ]
  %int_part_ptr.02534 = ptrtoint ptr %int_part_ptr.0253 to i64
  %cmp114.249 = icmp eq ptr %call109, %int_part_ptr.0253
  br i1 %cmp114.249, label %if.end.138, label %for.body.116.preheader

for.body.116.preheader:  ; preds = %for.cond.112.preheader
  ; User-defined hardware loop setup: the trip count is the byte distance
  ; %call109 - %int_part_ptr.0253.
  %5 = sub i64 0, %int_part_ptr.02534
  %scevgep5 = getelementptr i8, ptr %call109, i64 %5
  %scevgep56 = ptrtoint ptr %scevgep5 to i64
  call void @llvm.set.loop.iterations.i64(i64 %scevgep56)
  br label %for.body.116

for.cond.cleanup:  ; preds = %if.end.138, %if.end.105
  %int_part_ptr.0.lcssa = phi ptr [ %add.ptr106, %if.end.105 ], [ %int_part_ptr.1, %if.end.138 ]
  %call142 = call ptr @halide_string_to_string(ptr %dst.addr.0, ptr %end, ptr %int_part_ptr.0.lcssa) #3
  %call143 = call ptr @halide_string_to_string(ptr %call142, ptr %end, ptr @.str.9.96) #3
  %call144 = call ptr @halide_int64_to_string(ptr %call143, ptr %end, i64 %fractional_part.2, i32 6) #3
  call void @llvm.lifetime.end.p0(i64 512, ptr %buf) #0
  br label %cleanup.148

for.cond.cleanup.115:  ; preds = %for.body.116
  ; A carry out of the most significant digit prepends a new leading digit.
  br i1 %cmp125, label %if.then.136, label %if.end.138

; Inner loop (the pre-existing hardware loop): walks the digits from the last
; one towards the first, doubling each digit and propagating the carry. The
; back edge is controlled by @llvm.loop.decrement.
for.body.116:  ; preds = %for.body.116, %for.body.116.preheader
  %call109.pn = phi ptr [ %p.0251, %for.body.116 ], [ %call109, %for.body.116.preheader ]
  %carry.0250 = phi i32 [ %carry.1, %for.body.116 ], [ 0, %for.body.116.preheader ]
  %call109.pn2 = ptrtoint ptr %call109.pn to i64
  %p.0251 = getelementptr inbounds i8, ptr %call109.pn, i64 -1
  %scevgep3 = getelementptr i8, ptr inttoptr (i64 -1 to ptr), i64 %call109.pn2
  %6 = load i8, ptr %scevgep3, align 1, !tbaa !10
  %sub118 = add i8 %6, -48
  %conv120 = sext i8 %sub118 to i32
  %mul121 = shl nsw i32 %conv120, 1
  %add122 = or i32 %mul121, %carry.0250
  %7 = trunc i32 %add122 to i8
  %cmp125 = icmp sgt i8 %7, 9
  ; Adding 246 equals subtracting 10 once the result is truncated to i8 below.
  %sub128 = add nsw i32 %add122, 246
  %carry.1 = zext i1 %cmp125 to i32
  %new_digit.0.in = select i1 %cmp125, i32 %sub128, i32 %add122
  %add133 = add nsw i32 %new_digit.0.in, 48
  %conv134 = trunc i32 %add133 to i8
  %scevgep = getelementptr i8, ptr inttoptr (i64 -1 to ptr), i64 %call109.pn2
  store i8 %conv134, ptr %scevgep, align 1, !tbaa !10
  %8 = call i1 @llvm.loop.decrement(i64 1)
  br i1 %8, label %for.body.116, label %for.cond.cleanup.115

if.then.136:  ; preds = %for.cond.cleanup.115
  ; Store the byte 49 one position before the current start of the string.
  %incdec.ptr137 = getelementptr inbounds i8, ptr %int_part_ptr.0253, i64 -1
  store i8 49, ptr %incdec.ptr137, align 1, !tbaa !10
  br label %if.end.138

if.end.138:  ; preds = %if.then.136, %for.cond.cleanup.115, %for.cond.112.preheader
  %int_part_ptr.1 = phi ptr [ %incdec.ptr137, %if.then.136 ], [ %call109, %for.cond.112.preheader ], [ %int_part_ptr.0253, %for.cond.cleanup.115 ]
  %inc140 = add nuw nsw i32 %i.0255, 1
  %exitcond = icmp eq i32 %inc140, %integer_exponent.0
  br i1 %exitcond, label %for.cond.cleanup, label %for.cond.112.preheader

; Common exit: return the pointer produced by whichever path was taken.
cleanup.148:  ; preds = %for.cond.cleanup, %if.then.64, %if.end.59, %if.else.30, %if.then.28, %if.else.24, %if.then.22, %if.else.13, %if.then.11, %if.else, %if.then.6
  %retval.1 = phi ptr [ %call7, %if.then.6 ], [ %call8, %if.else ], [ %call12, %if.then.11 ], [ %call14, %if.else.13 ], [ %call23, %if.then.22 ], [ %call25, %if.else.24 ], [ %call29, %if.then.28 ], [ %call31, %if.else.30 ], [ %call65, %if.then.64 ], [ %call61, %if.end.59 ], [ %call144, %for.cond.cleanup ]
  call void @llvm.lifetime.end.p0(i64 8, ptr %bits) #0
  ret ptr %retval.1
}

; Function Attrs: nounwind
declare ptr @memcpy(ptr, ptr nocapture readonly, i64) #1

; Function Attrs: nounwind
declare void @llvm.set.loop.iterations.i64(i64) #0

; Function Attrs: nounwind
declare i1 @llvm.loop.decrement(i64) #0

attributes #0 = { nounwind }
attributes #1 = { nounwind "disable-tail-calls"="false" "less-precise-fpmad"="false" "frame-pointer"="all" "no-infs-fp-math"="false" "no-nans-fp-math"="false" "stack-protector-buffer-size"="8" "unsafe-fp-math"="false" "use-soft-float"="false" }
attributes #2 = { nounwind }
attributes #3 = { nounwind }

!llvm.ident = !{!0, !0, !0, !0, !0, !0, !0, !0, !0, !0, !0, !0, !0, !0, !0, !0, !0, !0, !0, !0}
!llvm.module.flags = !{!1, !2, !3}

!0 = !{!"clang version 3.7.0 (branches/release_37 246867) (llvm/branches/release_37 246866)"}
!1 = !{i32 2, !"halide_use_soft_float_abi", i32 0}
!2 = !{i32 2, !"halide_mcpu", !"pwr8"}
!3 = !{i32 2, !"halide_mattrs", !"+altivec,+vsx,+power8-altivec,+direct-move"}
!4 = !{!5, !5, i64 0}
!5 = !{!"double", !6, i64 0}
!6 = !{!"omnipotent char", !7, i64 0}
!7 = !{!"Simple C/C++ TBAA"}
!8 = !{!9, !9, i64 0}
!9 = !{!"long long", !6, i64 0}
!10 = !{!6, !6, i64 0}