; Test basic memory profiler instrumentation.
;
; Each function below is run through the memprof function pass followed by the
; memprof module pass, and the output is checked for the shadow-counter update
; sequence emitted in front of each instrumented memory access.
;
; Two check prefixes distinguish the shadow shift amount: the S3 prefix is used
; by the runs without -memprof-mapping-scale (a shift of 3 is expected), and
; the S5 prefix by the runs that pass -memprof-mapping-scale=5.
;
; RUN: opt < %s -passes='function(memprof),memprof-module' -S | FileCheck --check-prefixes=CHECK,CHECK-S3 %s
; RUN: opt < %s -passes='function(memprof),memprof-module' -memprof-mapping-scale=5 -S | FileCheck --check-prefixes=CHECK,CHECK-S5 %s

; Same pipelines again, with memprof-module spelled inside an explicit
; module(...) pass manager; the instrumented output must be identical.
; RUN: opt < %s -passes='function(memprof),module(memprof-module)' -S | FileCheck --check-prefixes=CHECK,CHECK-S3 %s
; RUN: opt < %s -passes='function(memprof),module(memprof-module)' -memprof-mapping-scale=5 -S | FileCheck --check-prefixes=CHECK,CHECK-S5 %s

target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64"
target triple = "x86_64-unknown-linux-gnu"

; The module constructor must be registered and kept alive.
; CHECK: @llvm.used = appending global [1 x ptr] [ptr @memprof.module_ctor]
; CHECK: @llvm.global_ctors = appending global [1 x { i32, ptr, ptr }] [{ i32, ptr, ptr } { i32 1, ptr @memprof.module_ctor, ptr null }]

; A simple i32 load: the full shadow update sequence is checked instruction by
; instruction.
define i32 @test_load(ptr %a) {
entry:
  %tmp1 = load i32, ptr %a, align 4
  ret i32 %tmp1
}
; CHECK-LABEL: @test_load
; CHECK: %[[SHADOW_OFFSET:[^ ]*]] = load i64, ptr @__memprof_shadow_memory_dynamic_address
; CHECK-NEXT: %[[LOAD_ADDR:[^ ]*]] = ptrtoint ptr %a to i64
; CHECK-NEXT: %[[MASKED_ADDR:[^ ]*]] = and i64 %[[LOAD_ADDR]], -64
; CHECK-S3-NEXT: %[[SHIFTED_ADDR:[^ ]*]] = lshr i64 %[[MASKED_ADDR]], 3
; CHECK-S5-NEXT: %[[SHIFTED_ADDR:[^ ]*]] = lshr i64 %[[MASKED_ADDR]], 5
; CHECK-NEXT: add i64 %[[SHIFTED_ADDR]], %[[SHADOW_OFFSET]]
; CHECK-NEXT: %[[LOAD_SHADOW_PTR:[^ ]*]] = inttoptr
; CHECK-NEXT: %[[LOAD_SHADOW:[^ ]*]] = load i64, ptr %[[LOAD_SHADOW_PTR]]
; CHECK-NEXT: %[[NEW_SHADOW:[^ ]*]] = add i64 %[[LOAD_SHADOW]], 1
; CHECK-NEXT: store i64 %[[NEW_SHADOW]], ptr %[[LOAD_SHADOW_PTR]]
; The actual load.
; CHECK-NEXT: %tmp1 = load i32, ptr %a
; CHECK-NEXT: ret i32 %tmp1

; A simple i32 store: same sequence as for the load, followed by the store.
define void @test_store(ptr %a) {
entry:
  store i32 42, ptr %a, align 4
  ret void
}
; CHECK-LABEL: @test_store
; CHECK: %[[SHADOW_OFFSET:[^ ]*]] = load i64, ptr @__memprof_shadow_memory_dynamic_address
; CHECK-NEXT: %[[STORE_ADDR:[^ ]*]] = ptrtoint ptr %a to i64
; CHECK-NEXT: %[[MASKED_ADDR:[^ ]*]] = and i64 %[[STORE_ADDR]], -64
; CHECK-S3-NEXT: %[[SHIFTED_ADDR:[^ ]*]] = lshr i64 %[[MASKED_ADDR]], 3
; CHECK-S5-NEXT: %[[SHIFTED_ADDR:[^ ]*]] = lshr i64 %[[MASKED_ADDR]], 5
; CHECK-NEXT: add i64 %[[SHIFTED_ADDR]], %[[SHADOW_OFFSET]]
; CHECK-NEXT: %[[STORE_SHADOW_PTR:[^ ]*]] = inttoptr
; CHECK-NEXT: %[[STORE_SHADOW:[^ ]*]] = load i64, ptr %[[STORE_SHADOW_PTR]]
; CHECK-NEXT: %[[NEW_SHADOW:[^ ]*]] = add i64 %[[STORE_SHADOW]], 1
; CHECK-NEXT: store i64 %[[NEW_SHADOW]], ptr %[[STORE_SHADOW_PTR]]
; The actual store.
; CHECK-NEXT: store i32 42, ptr %a
; CHECK-NEXT: ret void

; An x86_fp80 store must produce a single shadow update.
define void @FP80Test(ptr nocapture %a) nounwind uwtable {
entry:
  store x86_fp80 0xK3FFF8000000000000000, ptr %a, align 16
  ret void
}
; CHECK-LABEL: @FP80Test
; Exactly one shadow update for store access.
; CHECK-NOT: store i64
; CHECK: %[[NEW_ST_SHADOW:[^ ]*]] = add i64 %{{.*}}, 1
; CHECK-NEXT: store i64 %[[NEW_ST_SHADOW]]
; CHECK-NOT: store i64
; The actual store.
; CHECK: store x86_fp80 0xK3FFF8000000000000000, ptr %a
; CHECK: ret void

; A non-power-of-two integer (i40) load and store: one shadow update each.
define void @i40test(ptr %a, ptr %b) nounwind uwtable {
entry:
  %t = load i40, ptr %a
  store i40 %t, ptr %b, align 8
  ret void
}
; CHECK-LABEL: @i40test
; Exactly one shadow update for load access.
; CHECK-NOT: store i64
; CHECK: %[[NEW_LD_SHADOW:[^ ]*]] = add i64 %{{.*}}, 1
; CHECK-NEXT: store i64 %[[NEW_LD_SHADOW]]
; CHECK-NOT: store i64
; The actual load.
; CHECK: %t = load i40, ptr %a
; Exactly one shadow update for store access.
; CHECK-NOT: store i64
; CHECK: %[[NEW_ST_SHADOW:[^ ]*]] = add i64 %{{.*}}, 1
; CHECK-NEXT: store i64 %[[NEW_ST_SHADOW]]
; CHECK-NOT: store i64
; The actual store.
; CHECK: store i40 %t, ptr %b
; CHECK: ret void

; An under-aligned (align 1) i64 store: still exactly one shadow update.
define void @i64test_align1(ptr %b) nounwind uwtable {
entry:
  store i64 0, ptr %b, align 1
  ret void
}
; CHECK-LABEL: @i64test_align1
; Exactly one shadow update for store access.
; CHECK-NOT: store i64
; CHECK: %[[NEW_ST_SHADOW:[^ ]*]] = add i64 %{{.*}}, 1
; CHECK-NEXT: store i64 %[[NEW_ST_SHADOW]]
; CHECK-NOT: store i64
; The actual store.
; CHECK: store i64 0, ptr %b
; CHECK: ret void

; An i80 load and store: one shadow update each.
define void @i80test(ptr %a, ptr %b) nounwind uwtable {
entry:
  %t = load i80, ptr %a
  store i80 %t, ptr %b, align 8
  ret void
}
; CHECK-LABEL: @i80test
; Exactly one shadow update for load access.
; CHECK-NOT: store i64
; CHECK: %[[NEW_LD_SHADOW:[^ ]*]] = add i64 %{{.*}}, 1
; CHECK-NEXT: store i64 %[[NEW_LD_SHADOW]]
; CHECK-NOT: store i64
; The actual load.
; CHECK: %t = load i80, ptr %a
; Exactly one shadow update for store access.
; CHECK-NOT: store i64
; CHECK: %[[NEW_ST_SHADOW:[^ ]*]] = add i64 %{{.*}}, 1
; CHECK-NEXT: store i64 %[[NEW_ST_SHADOW]]
; CHECK-NOT: store i64
; The actual store.
; CHECK: store i80 %t, ptr %b
; CHECK: ret void

; memprof should not instrument functions with available_externally linkage.
define available_externally i32 @f_available_externally(ptr %a) {
entry:
  %tmp1 = load i32, ptr %a
  ret i32 %tmp1
}
; CHECK-LABEL: @f_available_externally
; CHECK-NOT: __memprof_shadow_memory_dynamic_address
; CHECK: ret i32

declare void @llvm.memset.p0.i64(ptr nocapture, i8, i64, i1) nounwind
declare void @llvm.memmove.p0.p0.i64(ptr nocapture, ptr nocapture readonly, i64, i1) nounwind
declare void @llvm.memcpy.p0.p0.i64(ptr nocapture, ptr nocapture readonly, i64, i1) nounwind

; Plain memory intrinsics are expected to be replaced by __memprof_* calls.
define void @memintr_test(ptr %a, ptr %b) nounwind uwtable {
entry:
  tail call void @llvm.memset.p0.i64(ptr %a, i8 0, i64 100, i1 false)
  tail call void @llvm.memmove.p0.p0.i64(ptr %a, ptr %b, i64 100, i1 false)
  tail call void @llvm.memcpy.p0.p0.i64(ptr %a, ptr %b, i64 100, i1 false)
  ret void
}

; CHECK-LABEL: @memintr_test
; CHECK: __memprof_memset
; CHECK: __memprof_memmove
; CHECK: __memprof_memcpy
; CHECK: ret void

declare void @llvm.memset.element.unordered.atomic.p0.i64(ptr nocapture writeonly, i8, i64, i32) nounwind
declare void @llvm.memmove.element.unordered.atomic.p0.p0.i64(ptr nocapture writeonly, ptr nocapture readonly, i64, i32) nounwind
declare void @llvm.memcpy.element.unordered.atomic.p0.p0.i64(ptr nocapture writeonly, ptr nocapture readonly, i64, i32) nounwind

define void @memintr_element_atomic_test(ptr %a, ptr %b) nounwind uwtable {
  ; This is a canary test to make sure that these don't get lowered into calls that don't
  ; have the element-atomic property. Eventually, memprof will have to be enhanced to lower
  ; these properly.
  ; CHECK-LABEL: @memintr_element_atomic_test
  ; CHECK: tail call void @llvm.memset.element.unordered.atomic.p0.i64(ptr align 1 %a, i8 0, i64 100, i32 1)
  ; CHECK: tail call void @llvm.memmove.element.unordered.atomic.p0.p0.i64(ptr align 1 %a, ptr align 1 %b, i64 100, i32 1)
  ; CHECK: tail call void @llvm.memcpy.element.unordered.atomic.p0.p0.i64(ptr align 1 %a, ptr align 1 %b, i64 100, i32 1)
  ; CHECK: ret void
  tail call void @llvm.memset.element.unordered.atomic.p0.i64(ptr align 1 %a, i8 0, i64 100, i32 1)
  tail call void @llvm.memmove.element.unordered.atomic.p0.p0.i64(ptr align 1 %a, ptr align 1 %b, i64 100, i32 1)
  tail call void @llvm.memcpy.element.unordered.atomic.p0.p0.i64(ptr align 1 %a, ptr align 1 %b, i64 100, i32 1)
  ret void
}


; The module pass must emit the constructor that initialises the runtime.
; CHECK: define internal void @memprof.module_ctor()
; CHECK: call void @__memprof_init()