1faa2c678SKrzysztof Drewniak; NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py 2faa2c678SKrzysztof Drewniak; RUN: llc -global-isel -mtriple=amdgcn-mesa-mesa3d -mcpu=fiji -stop-after=instruction-select -verify-machineinstrs -o - %s | FileCheck -check-prefix=UNPACKED %s 3faa2c678SKrzysztof Drewniak; RUN: llc -global-isel -mtriple=amdgcn-mesa-mesa3d -mcpu=gfx810 -stop-after=instruction-select -verify-machineinstrs -o - %s | FileCheck -check-prefix=PACKED %s 4faa2c678SKrzysztof Drewniak 5faa2c678SKrzysztof Drewniakdefine amdgpu_ps half @raw_tbuffer_load_f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset(ptr addrspace(8) inreg %rsrc, i32 %voffset, i32 inreg %soffset) { 6faa2c678SKrzysztof Drewniak ; UNPACKED-LABEL: name: raw_tbuffer_load_f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset 7faa2c678SKrzysztof Drewniak ; UNPACKED: bb.1 (%ir-block.0): 8faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: liveins: $sgpr2, $sgpr3, $sgpr4, $sgpr5, $sgpr6, $vgpr0 9faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: {{ $}} 10faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY:%[0-9]+]]:sreg_32 = COPY $sgpr2 11faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY1:%[0-9]+]]:sreg_32 = COPY $sgpr3 12faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY2:%[0-9]+]]:sreg_32 = COPY $sgpr4 13faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY3:%[0-9]+]]:sreg_32 = COPY $sgpr5 14faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY4:%[0-9]+]]:vgpr_32 = COPY $vgpr0 15faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY5:%[0-9]+]]:sreg_32 = COPY $sgpr6 16faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[REG_SEQUENCE:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3 17ab379378SKrzysztof Drewniak ; UNPACKED-NEXT: [[TBUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN:%[0-9]+]]:vgpr_32 = TBUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN [[COPY4]], [[REG_SEQUENCE]], [[COPY5]], 0, 78, 0, 0, implicit $exec :: (dereferenceable load (s16) from %ir.rsrc, align 1, addrspace 8) 18faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: $vgpr0 = COPY [[TBUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN]] 19faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: SI_RETURN_TO_EPILOG implicit $vgpr0 20*c3cfbbc4Spvanhout ; 21faa2c678SKrzysztof Drewniak ; PACKED-LABEL: name: raw_tbuffer_load_f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset 22faa2c678SKrzysztof Drewniak ; PACKED: bb.1 (%ir-block.0): 23faa2c678SKrzysztof Drewniak ; PACKED-NEXT: liveins: $sgpr2, $sgpr3, $sgpr4, $sgpr5, $sgpr6, $vgpr0 24faa2c678SKrzysztof Drewniak ; PACKED-NEXT: {{ $}} 25faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY:%[0-9]+]]:sreg_32 = COPY $sgpr2 26faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY1:%[0-9]+]]:sreg_32 = COPY $sgpr3 27faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY2:%[0-9]+]]:sreg_32 = COPY $sgpr4 28faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY3:%[0-9]+]]:sreg_32 = COPY $sgpr5 29faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY4:%[0-9]+]]:vgpr_32 = COPY $vgpr0 30faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY5:%[0-9]+]]:sreg_32 = COPY $sgpr6 31faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[REG_SEQUENCE:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3 32ab379378SKrzysztof Drewniak ; PACKED-NEXT: [[TBUFFER_LOAD_FORMAT_D16_X_OFFEN:%[0-9]+]]:vgpr_32 = TBUFFER_LOAD_FORMAT_D16_X_OFFEN [[COPY4]], [[REG_SEQUENCE]], [[COPY5]], 0, 78, 0, 0, implicit $exec :: (dereferenceable load (s16) from %ir.rsrc, align 1, addrspace 8) 33faa2c678SKrzysztof Drewniak ; PACKED-NEXT: $vgpr0 = COPY [[TBUFFER_LOAD_FORMAT_D16_X_OFFEN]] 34faa2c678SKrzysztof Drewniak ; PACKED-NEXT: SI_RETURN_TO_EPILOG implicit $vgpr0 35faa2c678SKrzysztof Drewniak %val = call half @llvm.amdgcn.raw.ptr.tbuffer.load.f16(ptr addrspace(8) %rsrc, i32 %voffset, i32 %soffset, i32 78, i32 0) 36faa2c678SKrzysztof Drewniak ret half %val 37faa2c678SKrzysztof Drewniak} 38faa2c678SKrzysztof Drewniak 39faa2c678SKrzysztof Drewniakdefine amdgpu_ps <2 x half> @raw_tbuffer_load_v2f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset(ptr addrspace(8) inreg %rsrc, i32 %voffset, i32 inreg %soffset) { 40faa2c678SKrzysztof Drewniak ; UNPACKED-LABEL: name: raw_tbuffer_load_v2f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset 41faa2c678SKrzysztof Drewniak ; UNPACKED: bb.1 (%ir-block.0): 42faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: liveins: $sgpr2, $sgpr3, $sgpr4, $sgpr5, $sgpr6, $vgpr0 43faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: {{ $}} 44faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY:%[0-9]+]]:sreg_32 = COPY $sgpr2 45faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY1:%[0-9]+]]:sreg_32 = COPY $sgpr3 46faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY2:%[0-9]+]]:sreg_32 = COPY $sgpr4 47faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY3:%[0-9]+]]:sreg_32 = COPY $sgpr5 48faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY4:%[0-9]+]]:vgpr_32 = COPY $vgpr0 49faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY5:%[0-9]+]]:sreg_32 = COPY $sgpr6 50faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[REG_SEQUENCE:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3 51ab379378SKrzysztof Drewniak ; UNPACKED-NEXT: [[TBUFFER_LOAD_FORMAT_D16_XY_gfx80_OFFEN:%[0-9]+]]:vreg_64 = TBUFFER_LOAD_FORMAT_D16_XY_gfx80_OFFEN [[COPY4]], [[REG_SEQUENCE]], [[COPY5]], 0, 78, 0, 0, implicit $exec :: (dereferenceable load (<2 x s16>) from %ir.rsrc, align 1, addrspace 8) 52faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY6:%[0-9]+]]:vgpr_32 = COPY [[TBUFFER_LOAD_FORMAT_D16_XY_gfx80_OFFEN]].sub0 53faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY7:%[0-9]+]]:vgpr_32 = COPY [[TBUFFER_LOAD_FORMAT_D16_XY_gfx80_OFFEN]].sub1 54faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[S_MOV_B32_:%[0-9]+]]:sreg_32 = S_MOV_B32 65535 55faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY8:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_]] 56faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[V_AND_B32_e64_:%[0-9]+]]:vgpr_32 = V_AND_B32_e64 [[COPY6]], [[COPY8]], implicit $exec 57faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY9:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_]] 58faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[V_AND_B32_e64_1:%[0-9]+]]:vgpr_32 = V_AND_B32_e64 [[COPY7]], [[COPY9]], implicit $exec 59faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[S_MOV_B32_1:%[0-9]+]]:sreg_32 = S_MOV_B32 16 60faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY10:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_1]] 61faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[V_LSHLREV_B32_e64_:%[0-9]+]]:vgpr_32 = V_LSHLREV_B32_e64 [[COPY10]], [[V_AND_B32_e64_1]], implicit $exec 62faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[V_OR_B32_e64_:%[0-9]+]]:vgpr_32 = V_OR_B32_e64 [[V_AND_B32_e64_]], [[V_LSHLREV_B32_e64_]], implicit $exec 63faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: $vgpr0 = COPY [[V_OR_B32_e64_]] 64faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: SI_RETURN_TO_EPILOG implicit $vgpr0 65*c3cfbbc4Spvanhout ; 66faa2c678SKrzysztof Drewniak ; PACKED-LABEL: name: raw_tbuffer_load_v2f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset 67faa2c678SKrzysztof Drewniak ; PACKED: bb.1 (%ir-block.0): 68faa2c678SKrzysztof Drewniak ; PACKED-NEXT: liveins: $sgpr2, $sgpr3, $sgpr4, $sgpr5, $sgpr6, $vgpr0 69faa2c678SKrzysztof Drewniak ; PACKED-NEXT: {{ $}} 70faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY:%[0-9]+]]:sreg_32 = COPY $sgpr2 71faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY1:%[0-9]+]]:sreg_32 = COPY $sgpr3 72faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY2:%[0-9]+]]:sreg_32 = COPY $sgpr4 73faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY3:%[0-9]+]]:sreg_32 = COPY $sgpr5 74faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY4:%[0-9]+]]:vgpr_32 = COPY $vgpr0 75faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY5:%[0-9]+]]:sreg_32 = COPY $sgpr6 76faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[REG_SEQUENCE:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3 77ab379378SKrzysztof Drewniak ; PACKED-NEXT: [[TBUFFER_LOAD_FORMAT_D16_XY_OFFEN:%[0-9]+]]:vgpr_32 = TBUFFER_LOAD_FORMAT_D16_XY_OFFEN [[COPY4]], [[REG_SEQUENCE]], [[COPY5]], 0, 78, 0, 0, implicit $exec :: (dereferenceable load (<2 x s16>) from %ir.rsrc, align 1, addrspace 8) 78faa2c678SKrzysztof Drewniak ; PACKED-NEXT: $vgpr0 = COPY [[TBUFFER_LOAD_FORMAT_D16_XY_OFFEN]] 79faa2c678SKrzysztof Drewniak ; PACKED-NEXT: SI_RETURN_TO_EPILOG implicit $vgpr0 80faa2c678SKrzysztof Drewniak %val = call <2 x half> @llvm.amdgcn.raw.ptr.tbuffer.load.v2f16(ptr addrspace(8) %rsrc, i32 %voffset, i32 %soffset, i32 78, i32 0) 81faa2c678SKrzysztof Drewniak ret <2 x half> %val 82faa2c678SKrzysztof Drewniak} 83faa2c678SKrzysztof Drewniak 84faa2c678SKrzysztof Drewniak; FIXME: Crashes 85faa2c678SKrzysztof Drewniak; define amdgpu_ps <3 x half> @raw_tbuffer_load_v3f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset(ptr addrspace(8) inreg %rsrc, i32 %voffset, i32 inreg %soffset) { 86faa2c678SKrzysztof Drewniak; %val = call <3 x half> @llvm.amdgcn.raw.ptr.tbuffer.load.v3f16(ptr addrspace(8) %rsrc, i32 %voffset, i32 %soffset, i32 78, i32 0) 87faa2c678SKrzysztof Drewniak; ret <3 x half> %val 88faa2c678SKrzysztof Drewniak; } 89faa2c678SKrzysztof Drewniak 90faa2c678SKrzysztof Drewniakdefine amdgpu_ps <4 x half> @raw_tbuffer_load_v4f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset(ptr addrspace(8) inreg %rsrc, i32 %voffset, i32 inreg %soffset) { 91faa2c678SKrzysztof Drewniak ; UNPACKED-LABEL: name: raw_tbuffer_load_v4f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset 92faa2c678SKrzysztof Drewniak ; UNPACKED: bb.1 (%ir-block.0): 93faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: liveins: $sgpr2, $sgpr3, $sgpr4, $sgpr5, $sgpr6, $vgpr0 94faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: {{ $}} 95faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY:%[0-9]+]]:sreg_32 = COPY $sgpr2 96faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY1:%[0-9]+]]:sreg_32 = COPY $sgpr3 97faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY2:%[0-9]+]]:sreg_32 = COPY $sgpr4 98faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY3:%[0-9]+]]:sreg_32 = COPY $sgpr5 99faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY4:%[0-9]+]]:vgpr_32 = COPY $vgpr0 100faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY5:%[0-9]+]]:sreg_32 = COPY $sgpr6 101faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[REG_SEQUENCE:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3 102ab379378SKrzysztof Drewniak ; UNPACKED-NEXT: [[TBUFFER_LOAD_FORMAT_D16_XYZW_gfx80_OFFEN:%[0-9]+]]:vreg_128 = TBUFFER_LOAD_FORMAT_D16_XYZW_gfx80_OFFEN [[COPY4]], [[REG_SEQUENCE]], [[COPY5]], 0, 78, 0, 0, implicit $exec :: (dereferenceable load (<4 x s16>) from %ir.rsrc, align 1, addrspace 8) 103faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY6:%[0-9]+]]:vgpr_32 = COPY [[TBUFFER_LOAD_FORMAT_D16_XYZW_gfx80_OFFEN]].sub0 104faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY7:%[0-9]+]]:vgpr_32 = COPY [[TBUFFER_LOAD_FORMAT_D16_XYZW_gfx80_OFFEN]].sub1 105faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY8:%[0-9]+]]:vgpr_32 = COPY [[TBUFFER_LOAD_FORMAT_D16_XYZW_gfx80_OFFEN]].sub2 106faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY9:%[0-9]+]]:vgpr_32 = COPY [[TBUFFER_LOAD_FORMAT_D16_XYZW_gfx80_OFFEN]].sub3 107faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[S_MOV_B32_:%[0-9]+]]:sreg_32 = S_MOV_B32 65535 108faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY10:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_]] 109faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[V_AND_B32_e64_:%[0-9]+]]:vgpr_32 = V_AND_B32_e64 [[COPY6]], [[COPY10]], implicit $exec 110faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY11:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_]] 111faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[V_AND_B32_e64_1:%[0-9]+]]:vgpr_32 = V_AND_B32_e64 [[COPY7]], [[COPY11]], implicit $exec 112faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[S_MOV_B32_1:%[0-9]+]]:sreg_32 = S_MOV_B32 16 113faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY12:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_1]] 114faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[V_LSHLREV_B32_e64_:%[0-9]+]]:vgpr_32 = V_LSHLREV_B32_e64 [[COPY12]], [[V_AND_B32_e64_1]], implicit $exec 115faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[V_OR_B32_e64_:%[0-9]+]]:vgpr_32 = V_OR_B32_e64 [[V_AND_B32_e64_]], [[V_LSHLREV_B32_e64_]], implicit $exec 116faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY13:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_]] 117faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[V_AND_B32_e64_2:%[0-9]+]]:vgpr_32 = V_AND_B32_e64 [[COPY8]], [[COPY13]], implicit $exec 118faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY14:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_]] 119faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[V_AND_B32_e64_3:%[0-9]+]]:vgpr_32 = V_AND_B32_e64 [[COPY9]], [[COPY14]], implicit $exec 120faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY15:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_1]] 121faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[V_LSHLREV_B32_e64_1:%[0-9]+]]:vgpr_32 = V_LSHLREV_B32_e64 [[COPY15]], [[V_AND_B32_e64_3]], implicit $exec 122faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[V_OR_B32_e64_1:%[0-9]+]]:vgpr_32 = V_OR_B32_e64 [[V_AND_B32_e64_2]], [[V_LSHLREV_B32_e64_1]], implicit $exec 123faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: $vgpr0 = COPY [[V_OR_B32_e64_]] 124faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: $vgpr1 = COPY [[V_OR_B32_e64_1]] 125faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: SI_RETURN_TO_EPILOG implicit $vgpr0, implicit $vgpr1 126*c3cfbbc4Spvanhout ; 127faa2c678SKrzysztof Drewniak ; PACKED-LABEL: name: raw_tbuffer_load_v4f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset 128faa2c678SKrzysztof Drewniak ; PACKED: bb.1 (%ir-block.0): 129faa2c678SKrzysztof Drewniak ; PACKED-NEXT: liveins: $sgpr2, $sgpr3, $sgpr4, $sgpr5, $sgpr6, $vgpr0 130faa2c678SKrzysztof Drewniak ; PACKED-NEXT: {{ $}} 131faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY:%[0-9]+]]:sreg_32 = COPY $sgpr2 132faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY1:%[0-9]+]]:sreg_32 = COPY $sgpr3 133faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY2:%[0-9]+]]:sreg_32 = COPY $sgpr4 134faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY3:%[0-9]+]]:sreg_32 = COPY $sgpr5 135faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY4:%[0-9]+]]:vgpr_32 = COPY $vgpr0 136faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY5:%[0-9]+]]:sreg_32 = COPY $sgpr6 137faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[REG_SEQUENCE:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3 138ab379378SKrzysztof Drewniak ; PACKED-NEXT: [[TBUFFER_LOAD_FORMAT_D16_XYZW_OFFEN:%[0-9]+]]:vreg_64 = TBUFFER_LOAD_FORMAT_D16_XYZW_OFFEN [[COPY4]], [[REG_SEQUENCE]], [[COPY5]], 0, 78, 0, 0, implicit $exec :: (dereferenceable load (<4 x s16>) from %ir.rsrc, align 1, addrspace 8) 139faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY6:%[0-9]+]]:vgpr_32 = COPY [[TBUFFER_LOAD_FORMAT_D16_XYZW_OFFEN]].sub0 140faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY7:%[0-9]+]]:vgpr_32 = COPY [[TBUFFER_LOAD_FORMAT_D16_XYZW_OFFEN]].sub1 141faa2c678SKrzysztof Drewniak ; PACKED-NEXT: $vgpr0 = COPY [[COPY6]] 142faa2c678SKrzysztof Drewniak ; PACKED-NEXT: $vgpr1 = COPY [[COPY7]] 143faa2c678SKrzysztof Drewniak ; PACKED-NEXT: SI_RETURN_TO_EPILOG implicit $vgpr0, implicit $vgpr1 144faa2c678SKrzysztof Drewniak %val = call <4 x half> @llvm.amdgcn.raw.ptr.tbuffer.load.v4f16(ptr addrspace(8) %rsrc, i32 %voffset, i32 %soffset, i32 78, i32 0) 145faa2c678SKrzysztof Drewniak ret <4 x half> %val 146faa2c678SKrzysztof Drewniak} 147faa2c678SKrzysztof Drewniak 148faa2c678SKrzysztof Drewniakdefine amdgpu_ps half @raw_tbuffer_load_f16__vgpr_rsrc__sgpr_voffset__vgpr_soffset(ptr addrspace(8) %rsrc, i32 inreg %voffset, i32 %soffset) { 149faa2c678SKrzysztof Drewniak ; UNPACKED-LABEL: name: raw_tbuffer_load_f16__vgpr_rsrc__sgpr_voffset__vgpr_soffset 150faa2c678SKrzysztof Drewniak ; UNPACKED: bb.1 (%ir-block.0): 151faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: successors: %bb.2(0x80000000) 152faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: liveins: $sgpr2, $vgpr0, $vgpr1, $vgpr2, $vgpr3, $vgpr4 153faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: {{ $}} 154faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY:%[0-9]+]]:vgpr_32 = COPY $vgpr0 155faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY1:%[0-9]+]]:vgpr_32 = COPY $vgpr1 156faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY2:%[0-9]+]]:vgpr_32 = COPY $vgpr2 157faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY3:%[0-9]+]]:vgpr_32 = COPY $vgpr3 158faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY4:%[0-9]+]]:sreg_32 = COPY $sgpr2 159faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY5:%[0-9]+]]:vgpr_32 = COPY $vgpr4 160faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[REG_SEQUENCE:%[0-9]+]]:vreg_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3 161faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY6:%[0-9]+]]:vgpr_32 = COPY [[COPY4]] 162faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[S_MOV_B64_:%[0-9]+]]:sreg_64_xexec = S_MOV_B64 $exec 163faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: {{ $}} 164faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: bb.2: 165faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: successors: %bb.3(0x80000000) 166faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: {{ $}} 167faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[V_READFIRSTLANE_B32_:%[0-9]+]]:sreg_32 = V_READFIRSTLANE_B32 [[COPY]], implicit $exec 168faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[V_READFIRSTLANE_B32_1:%[0-9]+]]:sreg_32 = V_READFIRSTLANE_B32 [[COPY1]], implicit $exec 169faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[V_READFIRSTLANE_B32_2:%[0-9]+]]:sreg_32 = V_READFIRSTLANE_B32 [[COPY2]], implicit $exec 170faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[V_READFIRSTLANE_B32_3:%[0-9]+]]:sreg_32 = V_READFIRSTLANE_B32 [[COPY3]], implicit $exec 171faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[REG_SEQUENCE1:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[V_READFIRSTLANE_B32_]], %subreg.sub0, [[V_READFIRSTLANE_B32_1]], %subreg.sub1, [[V_READFIRSTLANE_B32_2]], %subreg.sub2, [[V_READFIRSTLANE_B32_3]], %subreg.sub3 172faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY7:%[0-9]+]]:vreg_64 = COPY [[REG_SEQUENCE]].sub0_sub1 173faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY8:%[0-9]+]]:vreg_64 = COPY [[REG_SEQUENCE]].sub2_sub3 174faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY9:%[0-9]+]]:sreg_64 = COPY [[REG_SEQUENCE1]].sub0_sub1 175faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY10:%[0-9]+]]:sreg_64 = COPY [[REG_SEQUENCE1]].sub2_sub3 176faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[V_CMP_EQ_U64_e64_:%[0-9]+]]:sreg_64_xexec = V_CMP_EQ_U64_e64 [[COPY9]], [[COPY7]], implicit $exec 177faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[V_CMP_EQ_U64_e64_1:%[0-9]+]]:sreg_64_xexec = V_CMP_EQ_U64_e64 [[COPY10]], [[COPY8]], implicit $exec 178*c3cfbbc4Spvanhout ; UNPACKED-NEXT: [[S_AND_B64_:%[0-9]+]]:sreg_64_xexec = S_AND_B64 [[V_CMP_EQ_U64_e64_]], [[V_CMP_EQ_U64_e64_1]], implicit-def dead $scc 179faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[V_READFIRSTLANE_B32_4:%[0-9]+]]:sreg_32 = V_READFIRSTLANE_B32 [[COPY5]], implicit $exec 180faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[V_CMP_EQ_U32_e64_:%[0-9]+]]:sreg_64_xexec = V_CMP_EQ_U32_e64 [[V_READFIRSTLANE_B32_4]], [[COPY5]], implicit $exec 181*c3cfbbc4Spvanhout ; UNPACKED-NEXT: [[S_AND_B64_1:%[0-9]+]]:sreg_64_xexec = S_AND_B64 [[S_AND_B64_]], [[V_CMP_EQ_U32_e64_]], implicit-def dead $scc 182faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[S_AND_SAVEEXEC_B64_:%[0-9]+]]:sreg_64_xexec = S_AND_SAVEEXEC_B64 killed [[S_AND_B64_1]], implicit-def $exec, implicit-def $scc, implicit $exec 183faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: {{ $}} 184faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: bb.3: 185faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: successors: %bb.4(0x40000000), %bb.2(0x40000000) 186faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: {{ $}} 187ab379378SKrzysztof Drewniak ; UNPACKED-NEXT: [[TBUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN:%[0-9]+]]:vgpr_32 = TBUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN [[COPY6]], [[REG_SEQUENCE1]], [[V_READFIRSTLANE_B32_4]], 0, 78, 0, 0, implicit $exec :: (dereferenceable load (s16) from %ir.rsrc, align 1, addrspace 8) 188faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: $exec = S_XOR_B64_term $exec, [[S_AND_SAVEEXEC_B64_]], implicit-def $scc 189faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: SI_WATERFALL_LOOP %bb.2, implicit $exec 190faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: {{ $}} 191faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: bb.4: 192faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: successors: %bb.5(0x80000000) 193faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: {{ $}} 194faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: $exec = S_MOV_B64_term [[S_MOV_B64_]] 195faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: {{ $}} 196faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: bb.5: 197faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: $vgpr0 = COPY [[TBUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN]] 198faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: SI_RETURN_TO_EPILOG implicit $vgpr0 199*c3cfbbc4Spvanhout ; 200faa2c678SKrzysztof Drewniak ; PACKED-LABEL: name: raw_tbuffer_load_f16__vgpr_rsrc__sgpr_voffset__vgpr_soffset 201faa2c678SKrzysztof Drewniak ; PACKED: bb.1 (%ir-block.0): 202faa2c678SKrzysztof Drewniak ; PACKED-NEXT: successors: %bb.2(0x80000000) 203faa2c678SKrzysztof Drewniak ; PACKED-NEXT: liveins: $sgpr2, $vgpr0, $vgpr1, $vgpr2, $vgpr3, $vgpr4 204faa2c678SKrzysztof Drewniak ; PACKED-NEXT: {{ $}} 205faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY:%[0-9]+]]:vgpr_32 = COPY $vgpr0 206faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY1:%[0-9]+]]:vgpr_32 = COPY $vgpr1 207faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY2:%[0-9]+]]:vgpr_32 = COPY $vgpr2 208faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY3:%[0-9]+]]:vgpr_32 = COPY $vgpr3 209faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY4:%[0-9]+]]:sreg_32 = COPY $sgpr2 210faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY5:%[0-9]+]]:vgpr_32 = COPY $vgpr4 211faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[REG_SEQUENCE:%[0-9]+]]:vreg_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3 212faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY6:%[0-9]+]]:vgpr_32 = COPY [[COPY4]] 213faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[S_MOV_B64_:%[0-9]+]]:sreg_64_xexec = S_MOV_B64 $exec 214faa2c678SKrzysztof Drewniak ; PACKED-NEXT: {{ $}} 215faa2c678SKrzysztof Drewniak ; PACKED-NEXT: bb.2: 216faa2c678SKrzysztof Drewniak ; PACKED-NEXT: successors: %bb.3(0x80000000) 217faa2c678SKrzysztof Drewniak ; PACKED-NEXT: {{ $}} 218faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[V_READFIRSTLANE_B32_:%[0-9]+]]:sreg_32 = V_READFIRSTLANE_B32 [[COPY]], implicit $exec 219faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[V_READFIRSTLANE_B32_1:%[0-9]+]]:sreg_32 = V_READFIRSTLANE_B32 [[COPY1]], implicit $exec 220faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[V_READFIRSTLANE_B32_2:%[0-9]+]]:sreg_32 = V_READFIRSTLANE_B32 [[COPY2]], implicit $exec 221faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[V_READFIRSTLANE_B32_3:%[0-9]+]]:sreg_32 = V_READFIRSTLANE_B32 [[COPY3]], implicit $exec 222faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[REG_SEQUENCE1:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[V_READFIRSTLANE_B32_]], %subreg.sub0, [[V_READFIRSTLANE_B32_1]], %subreg.sub1, [[V_READFIRSTLANE_B32_2]], %subreg.sub2, [[V_READFIRSTLANE_B32_3]], %subreg.sub3 223faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY7:%[0-9]+]]:vreg_64 = COPY [[REG_SEQUENCE]].sub0_sub1 224faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY8:%[0-9]+]]:vreg_64 = COPY [[REG_SEQUENCE]].sub2_sub3 225faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY9:%[0-9]+]]:sreg_64 = COPY [[REG_SEQUENCE1]].sub0_sub1 226faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY10:%[0-9]+]]:sreg_64 = COPY [[REG_SEQUENCE1]].sub2_sub3 227faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[V_CMP_EQ_U64_e64_:%[0-9]+]]:sreg_64_xexec = V_CMP_EQ_U64_e64 [[COPY9]], [[COPY7]], implicit $exec 228faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[V_CMP_EQ_U64_e64_1:%[0-9]+]]:sreg_64_xexec = V_CMP_EQ_U64_e64 [[COPY10]], [[COPY8]], implicit $exec 229*c3cfbbc4Spvanhout ; PACKED-NEXT: [[S_AND_B64_:%[0-9]+]]:sreg_64_xexec = S_AND_B64 [[V_CMP_EQ_U64_e64_]], [[V_CMP_EQ_U64_e64_1]], implicit-def dead $scc 230faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[V_READFIRSTLANE_B32_4:%[0-9]+]]:sreg_32 = V_READFIRSTLANE_B32 [[COPY5]], implicit $exec 231faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[V_CMP_EQ_U32_e64_:%[0-9]+]]:sreg_64_xexec = V_CMP_EQ_U32_e64 [[V_READFIRSTLANE_B32_4]], [[COPY5]], implicit $exec 232*c3cfbbc4Spvanhout ; PACKED-NEXT: [[S_AND_B64_1:%[0-9]+]]:sreg_64_xexec = S_AND_B64 [[S_AND_B64_]], [[V_CMP_EQ_U32_e64_]], implicit-def dead $scc 233faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[S_AND_SAVEEXEC_B64_:%[0-9]+]]:sreg_64_xexec = S_AND_SAVEEXEC_B64 killed [[S_AND_B64_1]], implicit-def $exec, implicit-def $scc, implicit $exec 234faa2c678SKrzysztof Drewniak ; PACKED-NEXT: {{ $}} 235faa2c678SKrzysztof Drewniak ; PACKED-NEXT: bb.3: 236faa2c678SKrzysztof Drewniak ; PACKED-NEXT: successors: %bb.4(0x40000000), %bb.2(0x40000000) 237faa2c678SKrzysztof Drewniak ; PACKED-NEXT: {{ $}} 238ab379378SKrzysztof Drewniak ; PACKED-NEXT: [[TBUFFER_LOAD_FORMAT_D16_X_OFFEN:%[0-9]+]]:vgpr_32 = TBUFFER_LOAD_FORMAT_D16_X_OFFEN [[COPY6]], [[REG_SEQUENCE1]], [[V_READFIRSTLANE_B32_4]], 0, 78, 0, 0, implicit $exec :: (dereferenceable load (s16) from %ir.rsrc, align 1, addrspace 8) 239faa2c678SKrzysztof Drewniak ; PACKED-NEXT: $exec = S_XOR_B64_term $exec, [[S_AND_SAVEEXEC_B64_]], implicit-def $scc 240faa2c678SKrzysztof Drewniak ; PACKED-NEXT: SI_WATERFALL_LOOP %bb.2, implicit $exec 241faa2c678SKrzysztof Drewniak ; PACKED-NEXT: {{ $}} 242faa2c678SKrzysztof Drewniak ; PACKED-NEXT: bb.4: 243faa2c678SKrzysztof Drewniak ; PACKED-NEXT: successors: %bb.5(0x80000000) 244faa2c678SKrzysztof Drewniak ; PACKED-NEXT: {{ $}} 245faa2c678SKrzysztof Drewniak ; PACKED-NEXT: $exec = S_MOV_B64_term [[S_MOV_B64_]] 246faa2c678SKrzysztof Drewniak ; PACKED-NEXT: {{ $}} 247faa2c678SKrzysztof Drewniak ; PACKED-NEXT: bb.5: 248faa2c678SKrzysztof Drewniak ; PACKED-NEXT: $vgpr0 = COPY [[TBUFFER_LOAD_FORMAT_D16_X_OFFEN]] 249faa2c678SKrzysztof Drewniak ; PACKED-NEXT: SI_RETURN_TO_EPILOG implicit $vgpr0 250faa2c678SKrzysztof Drewniak %val = call half @llvm.amdgcn.raw.ptr.tbuffer.load.f16(ptr addrspace(8) %rsrc, i32 %voffset, i32 %soffset, i32 78, i32 0) 251faa2c678SKrzysztof Drewniak ret half %val 252faa2c678SKrzysztof Drewniak} 253faa2c678SKrzysztof Drewniak 254faa2c678SKrzysztof Drewniakdefine amdgpu_ps half @raw_tbuffer_load_f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset_glc(ptr addrspace(8) inreg %rsrc, i32 %voffset, i32 inreg %soffset) { 255faa2c678SKrzysztof Drewniak ; UNPACKED-LABEL: name: raw_tbuffer_load_f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset_glc 256faa2c678SKrzysztof Drewniak ; UNPACKED: bb.1 (%ir-block.0): 257faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: liveins: $sgpr2, $sgpr3, $sgpr4, $sgpr5, $sgpr6, $vgpr0 258faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: {{ $}} 259faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY:%[0-9]+]]:sreg_32 = COPY $sgpr2 260faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY1:%[0-9]+]]:sreg_32 = COPY $sgpr3 261faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY2:%[0-9]+]]:sreg_32 = COPY $sgpr4 262faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY3:%[0-9]+]]:sreg_32 = COPY $sgpr5 263faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY4:%[0-9]+]]:vgpr_32 = COPY $vgpr0 264faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY5:%[0-9]+]]:sreg_32 = COPY $sgpr6 265faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[REG_SEQUENCE:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3 266ab379378SKrzysztof Drewniak ; UNPACKED-NEXT: [[TBUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN:%[0-9]+]]:vgpr_32 = TBUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN [[COPY4]], [[REG_SEQUENCE]], [[COPY5]], 0, 78, 1, 0, implicit $exec :: (dereferenceable load (s16) from %ir.rsrc, align 1, addrspace 8) 267faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: $vgpr0 = COPY [[TBUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN]] 268faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: SI_RETURN_TO_EPILOG implicit $vgpr0 269*c3cfbbc4Spvanhout ; 270faa2c678SKrzysztof Drewniak ; PACKED-LABEL: name: raw_tbuffer_load_f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset_glc 271faa2c678SKrzysztof Drewniak ; PACKED: bb.1 (%ir-block.0): 272faa2c678SKrzysztof Drewniak ; PACKED-NEXT: liveins: $sgpr2, $sgpr3, $sgpr4, $sgpr5, $sgpr6, $vgpr0 273faa2c678SKrzysztof Drewniak ; PACKED-NEXT: {{ $}} 274faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY:%[0-9]+]]:sreg_32 = COPY $sgpr2 275faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY1:%[0-9]+]]:sreg_32 = COPY $sgpr3 276faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY2:%[0-9]+]]:sreg_32 = COPY $sgpr4 277faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY3:%[0-9]+]]:sreg_32 = COPY $sgpr5 278faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY4:%[0-9]+]]:vgpr_32 = COPY $vgpr0 279faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY5:%[0-9]+]]:sreg_32 = COPY $sgpr6 280faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[REG_SEQUENCE:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3 281ab379378SKrzysztof Drewniak ; PACKED-NEXT: [[TBUFFER_LOAD_FORMAT_D16_X_OFFEN:%[0-9]+]]:vgpr_32 = TBUFFER_LOAD_FORMAT_D16_X_OFFEN [[COPY4]], [[REG_SEQUENCE]], [[COPY5]], 0, 78, 1, 0, implicit $exec :: (dereferenceable load (s16) from %ir.rsrc, align 1, addrspace 8) 282faa2c678SKrzysztof Drewniak ; PACKED-NEXT: $vgpr0 = COPY [[TBUFFER_LOAD_FORMAT_D16_X_OFFEN]] 283faa2c678SKrzysztof Drewniak ; PACKED-NEXT: SI_RETURN_TO_EPILOG implicit $vgpr0 284faa2c678SKrzysztof Drewniak %val = call half @llvm.amdgcn.raw.ptr.tbuffer.load.f16(ptr addrspace(8) %rsrc, i32 %voffset, i32 %soffset, i32 78, i32 1) 285faa2c678SKrzysztof Drewniak ret half %val 286faa2c678SKrzysztof Drewniak} 287faa2c678SKrzysztof Drewniak 288faa2c678SKrzysztof Drewniakdefine amdgpu_ps half @raw_tbuffer_load_f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset_slc(ptr addrspace(8) inreg %rsrc, i32 %voffset, i32 inreg %soffset) { 289faa2c678SKrzysztof Drewniak ; UNPACKED-LABEL: name: raw_tbuffer_load_f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset_slc 290faa2c678SKrzysztof Drewniak ; UNPACKED: bb.1 (%ir-block.0): 291faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: liveins: $sgpr2, $sgpr3, $sgpr4, $sgpr5, $sgpr6, $vgpr0 292faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: {{ $}} 293faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY:%[0-9]+]]:sreg_32 = COPY $sgpr2 294faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY1:%[0-9]+]]:sreg_32 = COPY $sgpr3 295faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY2:%[0-9]+]]:sreg_32 = COPY $sgpr4 296faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY3:%[0-9]+]]:sreg_32 = COPY $sgpr5 297faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY4:%[0-9]+]]:vgpr_32 = COPY $vgpr0 298faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY5:%[0-9]+]]:sreg_32 = COPY $sgpr6 299faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[REG_SEQUENCE:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3 300ab379378SKrzysztof Drewniak ; UNPACKED-NEXT: [[TBUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN:%[0-9]+]]:vgpr_32 = TBUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN [[COPY4]], [[REG_SEQUENCE]], [[COPY5]], 0, 78, 2, 0, implicit $exec :: (dereferenceable load (s16) from %ir.rsrc, align 1, addrspace 8) 301faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: $vgpr0 = COPY [[TBUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN]] 302faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: SI_RETURN_TO_EPILOG implicit $vgpr0 303*c3cfbbc4Spvanhout ; 304faa2c678SKrzysztof Drewniak ; PACKED-LABEL: name: raw_tbuffer_load_f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset_slc 305faa2c678SKrzysztof Drewniak ; PACKED: bb.1 (%ir-block.0): 306faa2c678SKrzysztof Drewniak ; PACKED-NEXT: liveins: $sgpr2, $sgpr3, $sgpr4, $sgpr5, $sgpr6, $vgpr0 307faa2c678SKrzysztof Drewniak ; PACKED-NEXT: {{ $}} 308faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY:%[0-9]+]]:sreg_32 = COPY $sgpr2 309faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY1:%[0-9]+]]:sreg_32 = COPY $sgpr3 310faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY2:%[0-9]+]]:sreg_32 = COPY $sgpr4 311faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY3:%[0-9]+]]:sreg_32 = COPY $sgpr5 312faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY4:%[0-9]+]]:vgpr_32 = COPY $vgpr0 313faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY5:%[0-9]+]]:sreg_32 = COPY $sgpr6 314faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[REG_SEQUENCE:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3 315ab379378SKrzysztof Drewniak ; PACKED-NEXT: [[TBUFFER_LOAD_FORMAT_D16_X_OFFEN:%[0-9]+]]:vgpr_32 = TBUFFER_LOAD_FORMAT_D16_X_OFFEN [[COPY4]], [[REG_SEQUENCE]], [[COPY5]], 0, 78, 2, 0, implicit $exec :: (dereferenceable load (s16) from %ir.rsrc, align 1, addrspace 8) 316faa2c678SKrzysztof Drewniak ; PACKED-NEXT: $vgpr0 = COPY [[TBUFFER_LOAD_FORMAT_D16_X_OFFEN]] 317faa2c678SKrzysztof Drewniak ; PACKED-NEXT: SI_RETURN_TO_EPILOG implicit $vgpr0 318faa2c678SKrzysztof Drewniak %val = call half @llvm.amdgcn.raw.ptr.tbuffer.load.f16(ptr addrspace(8) %rsrc, i32 %voffset, i32 %soffset, i32 78, i32 2) 319faa2c678SKrzysztof Drewniak ret half %val 320faa2c678SKrzysztof Drewniak} 321faa2c678SKrzysztof Drewniak 322faa2c678SKrzysztof Drewniakdefine amdgpu_ps half @raw_tbuffer_load_f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset_slc_glc(ptr addrspace(8) inreg %rsrc, i32 %voffset, i32 inreg %soffset) { 323faa2c678SKrzysztof Drewniak ; UNPACKED-LABEL: name: raw_tbuffer_load_f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset_slc_glc 324faa2c678SKrzysztof Drewniak ; UNPACKED: bb.1 (%ir-block.0): 325faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: liveins: $sgpr2, $sgpr3, $sgpr4, $sgpr5, $sgpr6, $vgpr0 326faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: {{ $}} 327faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY:%[0-9]+]]:sreg_32 = COPY $sgpr2 328faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY1:%[0-9]+]]:sreg_32 = COPY $sgpr3 329faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY2:%[0-9]+]]:sreg_32 = COPY $sgpr4 330faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY3:%[0-9]+]]:sreg_32 = COPY $sgpr5 331faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY4:%[0-9]+]]:vgpr_32 = COPY $vgpr0 332faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY5:%[0-9]+]]:sreg_32 = COPY $sgpr6 333faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[REG_SEQUENCE:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3 334ab379378SKrzysztof Drewniak ; UNPACKED-NEXT: [[TBUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN:%[0-9]+]]:vgpr_32 = TBUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN [[COPY4]], [[REG_SEQUENCE]], [[COPY5]], 0, 78, 3, 0, implicit $exec :: (dereferenceable load (s16) from %ir.rsrc, align 1, addrspace 8) 335faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: $vgpr0 = COPY [[TBUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN]] 336faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: SI_RETURN_TO_EPILOG implicit $vgpr0 337*c3cfbbc4Spvanhout ; 338faa2c678SKrzysztof Drewniak ; PACKED-LABEL: name: raw_tbuffer_load_f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset_slc_glc 339faa2c678SKrzysztof Drewniak ; PACKED: bb.1 (%ir-block.0): 340faa2c678SKrzysztof Drewniak ; PACKED-NEXT: liveins: $sgpr2, $sgpr3, $sgpr4, $sgpr5, $sgpr6, $vgpr0 341faa2c678SKrzysztof Drewniak ; PACKED-NEXT: {{ $}} 342faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY:%[0-9]+]]:sreg_32 = COPY $sgpr2 343faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY1:%[0-9]+]]:sreg_32 = COPY $sgpr3 344faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY2:%[0-9]+]]:sreg_32 = COPY $sgpr4 345faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY3:%[0-9]+]]:sreg_32 = COPY $sgpr5 346faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY4:%[0-9]+]]:vgpr_32 = COPY $vgpr0 347faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY5:%[0-9]+]]:sreg_32 = COPY $sgpr6 348faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[REG_SEQUENCE:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3 349ab379378SKrzysztof Drewniak ; PACKED-NEXT: [[TBUFFER_LOAD_FORMAT_D16_X_OFFEN:%[0-9]+]]:vgpr_32 = TBUFFER_LOAD_FORMAT_D16_X_OFFEN [[COPY4]], [[REG_SEQUENCE]], [[COPY5]], 0, 78, 3, 0, implicit $exec :: (dereferenceable load (s16) from %ir.rsrc, align 1, addrspace 8) 350faa2c678SKrzysztof Drewniak ; PACKED-NEXT: $vgpr0 = COPY [[TBUFFER_LOAD_FORMAT_D16_X_OFFEN]] 351faa2c678SKrzysztof Drewniak ; PACKED-NEXT: SI_RETURN_TO_EPILOG implicit $vgpr0 352faa2c678SKrzysztof Drewniak %val = call half @llvm.amdgcn.raw.ptr.tbuffer.load.f16(ptr addrspace(8) %rsrc, i32 %voffset, i32 %soffset, i32 78, i32 3) 353faa2c678SKrzysztof Drewniak ret half %val 354faa2c678SKrzysztof Drewniak} 355faa2c678SKrzysztof Drewniak 356faa2c678SKrzysztof Drewniakdefine amdgpu_ps half @raw_tbuffer_load_f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset_dlc(ptr addrspace(8) inreg %rsrc, i32 %voffset, i32 inreg %soffset) { 357faa2c678SKrzysztof Drewniak ; UNPACKED-LABEL: name: raw_tbuffer_load_f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset_dlc 358faa2c678SKrzysztof Drewniak ; UNPACKED: bb.1 (%ir-block.0): 359faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: liveins: $sgpr2, $sgpr3, $sgpr4, $sgpr5, $sgpr6, $vgpr0 360faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: {{ $}} 361faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY:%[0-9]+]]:sreg_32 = COPY $sgpr2 362faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY1:%[0-9]+]]:sreg_32 = COPY $sgpr3 363faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY2:%[0-9]+]]:sreg_32 = COPY $sgpr4 364faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY3:%[0-9]+]]:sreg_32 = COPY $sgpr5 365faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY4:%[0-9]+]]:vgpr_32 = COPY $vgpr0 366faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[COPY5:%[0-9]+]]:sreg_32 = COPY $sgpr6 367faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: [[REG_SEQUENCE:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3 368ab379378SKrzysztof Drewniak ; UNPACKED-NEXT: [[TBUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN:%[0-9]+]]:vgpr_32 = TBUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN [[COPY4]], [[REG_SEQUENCE]], [[COPY5]], 0, 78, 4, 0, implicit $exec :: (dereferenceable load (s16) from %ir.rsrc, align 1, addrspace 8) 369faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: $vgpr0 = COPY [[TBUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN]] 370faa2c678SKrzysztof Drewniak ; UNPACKED-NEXT: SI_RETURN_TO_EPILOG implicit $vgpr0 371*c3cfbbc4Spvanhout ; 372faa2c678SKrzysztof Drewniak ; PACKED-LABEL: name: raw_tbuffer_load_f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset_dlc 373faa2c678SKrzysztof Drewniak ; PACKED: bb.1 (%ir-block.0): 374faa2c678SKrzysztof Drewniak ; PACKED-NEXT: liveins: $sgpr2, $sgpr3, $sgpr4, $sgpr5, $sgpr6, $vgpr0 375faa2c678SKrzysztof Drewniak ; PACKED-NEXT: {{ $}} 376faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY:%[0-9]+]]:sreg_32 = COPY $sgpr2 377faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY1:%[0-9]+]]:sreg_32 = COPY $sgpr3 378faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY2:%[0-9]+]]:sreg_32 = COPY $sgpr4 379faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY3:%[0-9]+]]:sreg_32 = COPY $sgpr5 380faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY4:%[0-9]+]]:vgpr_32 = COPY $vgpr0 381faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[COPY5:%[0-9]+]]:sreg_32 = COPY $sgpr6 382faa2c678SKrzysztof Drewniak ; PACKED-NEXT: [[REG_SEQUENCE:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3 383ab379378SKrzysztof Drewniak ; PACKED-NEXT: [[TBUFFER_LOAD_FORMAT_D16_X_OFFEN:%[0-9]+]]:vgpr_32 = TBUFFER_LOAD_FORMAT_D16_X_OFFEN [[COPY4]], [[REG_SEQUENCE]], [[COPY5]], 0, 78, 4, 0, implicit $exec :: (dereferenceable load (s16) from %ir.rsrc, align 1, addrspace 8) 384faa2c678SKrzysztof Drewniak ; PACKED-NEXT: $vgpr0 = COPY [[TBUFFER_LOAD_FORMAT_D16_X_OFFEN]] 385faa2c678SKrzysztof Drewniak ; PACKED-NEXT: SI_RETURN_TO_EPILOG implicit $vgpr0 386faa2c678SKrzysztof Drewniak %val = call half @llvm.amdgcn.raw.ptr.tbuffer.load.f16(ptr addrspace(8) %rsrc, i32 %voffset, i32 %soffset, i32 78, i32 4) 387faa2c678SKrzysztof Drewniak ret half %val 388faa2c678SKrzysztof Drewniak} 389faa2c678SKrzysztof Drewniak 390faa2c678SKrzysztof Drewniakdeclare half @llvm.amdgcn.raw.ptr.tbuffer.load.f16(ptr addrspace(8), i32, i32, i32 immarg, i32 immarg) #0 391faa2c678SKrzysztof Drewniakdeclare <2 x half> @llvm.amdgcn.raw.ptr.tbuffer.load.v2f16(ptr addrspace(8), i32, i32, i32 immarg, i32 immarg) #0 392faa2c678SKrzysztof Drewniakdeclare <3 x half> @llvm.amdgcn.raw.ptr.tbuffer.load.v3f16(ptr addrspace(8), i32, i32, i32 immarg, i32 immarg) #0 393faa2c678SKrzysztof Drewniakdeclare <4 x half> @llvm.amdgcn.raw.ptr.tbuffer.load.v4f16(ptr addrspace(8), i32, i32, i32 immarg, i32 immarg) #0 394faa2c678SKrzysztof Drewniak 395faa2c678SKrzysztof Drewniakattributes #0 = { nounwind readonly } 396