; NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
; RUN: llc -global-isel -mtriple=amdgcn-mesa-mesa3d -mcpu=gfx810 -stop-after=instruction-select -verify-machineinstrs -o - %s | FileCheck -check-prefix=PACKED %s
; RUN: llc -global-isel -mtriple=amdgcn-mesa-mesa3d -mcpu=tonga -stop-after=instruction-select -verify-machineinstrs -o - %s | FileCheck -check-prefix=UNPACKED %s

; The two RUN lines select the same IR for two subtargets:
;   PACKED   (gfx810) - expects the BUFFER_LOAD_FORMAT_D16_* opcodes.
;   UNPACKED (tonga)  - expects the BUFFER_LOAD_FORMAT_D16_*_gfx80 opcodes.
; Do not hand-edit the CHECK lines; regenerate them with
; utils/update_mir_test_checks.py.

; Natural mapping: rsrc and soffset are passed inreg (SGPR liveins) and voffset
; in a VGPR, so the checks contain only COPYs, a REG_SEQUENCE and the load.
define amdgpu_ps half @raw_ptr_buffer_load_format_f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset(ptr addrspace(8) inreg %rsrc, i32 %voffset, i32 inreg %soffset) {
  ; PACKED-LABEL: name: raw_ptr_buffer_load_format_f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset
  ; PACKED: bb.1 (%ir-block.0):
  ; PACKED-NEXT:   liveins: $sgpr2, $sgpr3, $sgpr4, $sgpr5, $sgpr6, $vgpr0
  ; PACKED-NEXT: {{  $}}
  ; PACKED-NEXT:   [[COPY:%[0-9]+]]:sreg_32 = COPY $sgpr2
  ; PACKED-NEXT:   [[COPY1:%[0-9]+]]:sreg_32 = COPY $sgpr3
  ; PACKED-NEXT:   [[COPY2:%[0-9]+]]:sreg_32 = COPY $sgpr4
  ; PACKED-NEXT:   [[COPY3:%[0-9]+]]:sreg_32 = COPY $sgpr5
  ; PACKED-NEXT:   [[COPY4:%[0-9]+]]:vgpr_32 = COPY $vgpr0
  ; PACKED-NEXT:   [[COPY5:%[0-9]+]]:sreg_32 = COPY $sgpr6
  ; PACKED-NEXT:   [[REG_SEQUENCE:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3
  ; PACKED-NEXT:   [[BUFFER_LOAD_FORMAT_D16_X_OFFEN:%[0-9]+]]:vgpr_32 = BUFFER_LOAD_FORMAT_D16_X_OFFEN [[COPY4]], [[REG_SEQUENCE]], [[COPY5]], 0, 0, 0, implicit $exec :: (dereferenceable load (s16) from %ir.rsrc, align 1, addrspace 8)
  ; PACKED-NEXT:   $vgpr0 = COPY [[BUFFER_LOAD_FORMAT_D16_X_OFFEN]]
  ; PACKED-NEXT:   SI_RETURN_TO_EPILOG implicit $vgpr0
  ;
  ; UNPACKED-LABEL: name: raw_ptr_buffer_load_format_f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset
  ; UNPACKED: bb.1 (%ir-block.0):
  ; UNPACKED-NEXT:   liveins: $sgpr2, $sgpr3, $sgpr4, $sgpr5, $sgpr6, $vgpr0
  ; UNPACKED-NEXT: {{  $}}
  ; UNPACKED-NEXT:   [[COPY:%[0-9]+]]:sreg_32 = COPY $sgpr2
  ; UNPACKED-NEXT:   [[COPY1:%[0-9]+]]:sreg_32 = COPY $sgpr3
  ; UNPACKED-NEXT:   [[COPY2:%[0-9]+]]:sreg_32 = COPY $sgpr4
  ; UNPACKED-NEXT:   [[COPY3:%[0-9]+]]:sreg_32 = COPY $sgpr5
  ; UNPACKED-NEXT:   [[COPY4:%[0-9]+]]:vgpr_32 = COPY $vgpr0
  ; UNPACKED-NEXT:   [[COPY5:%[0-9]+]]:sreg_32 = COPY $sgpr6
  ; UNPACKED-NEXT:   [[REG_SEQUENCE:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3
  ; UNPACKED-NEXT:   [[BUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN:%[0-9]+]]:vgpr_32 = BUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN [[COPY4]], [[REG_SEQUENCE]], [[COPY5]], 0, 0, 0, implicit $exec :: (dereferenceable load (s16) from %ir.rsrc, align 1, addrspace 8)
  ; UNPACKED-NEXT:   $vgpr0 = COPY [[BUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN]]
  ; UNPACKED-NEXT:   SI_RETURN_TO_EPILOG implicit $vgpr0
  %val = call half @llvm.amdgcn.raw.ptr.buffer.load.format.f16(ptr addrspace(8) %rsrc, i32 %voffset, i32 %soffset, i32 0)
  ret half %val
}
; <2 x half> result, natural register mapping. In the PACKED checks the load
; result is a single vgpr_32 copied straight to $vgpr0; in the UNPACKED checks
; it is a vreg_64 whose two sub-registers are masked with 65535, shifted by 16
; and OR'd together before being returned.
define amdgpu_ps <2 x half> @raw_ptr_buffer_load_format_v2f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset(ptr addrspace(8) inreg %rsrc, i32 %voffset, i32 inreg %soffset) {
  ; PACKED-LABEL: name: raw_ptr_buffer_load_format_v2f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset
  ; PACKED: bb.1 (%ir-block.0):
  ; PACKED-NEXT:   liveins: $sgpr2, $sgpr3, $sgpr4, $sgpr5, $sgpr6, $vgpr0
  ; PACKED-NEXT: {{  $}}
  ; PACKED-NEXT:   [[COPY:%[0-9]+]]:sreg_32 = COPY $sgpr2
  ; PACKED-NEXT:   [[COPY1:%[0-9]+]]:sreg_32 = COPY $sgpr3
  ; PACKED-NEXT:   [[COPY2:%[0-9]+]]:sreg_32 = COPY $sgpr4
  ; PACKED-NEXT:   [[COPY3:%[0-9]+]]:sreg_32 = COPY $sgpr5
  ; PACKED-NEXT:   [[COPY4:%[0-9]+]]:vgpr_32 = COPY $vgpr0
  ; PACKED-NEXT:   [[COPY5:%[0-9]+]]:sreg_32 = COPY $sgpr6
  ; PACKED-NEXT:   [[REG_SEQUENCE:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3
  ; PACKED-NEXT:   [[BUFFER_LOAD_FORMAT_D16_XY_OFFEN:%[0-9]+]]:vgpr_32 = BUFFER_LOAD_FORMAT_D16_XY_OFFEN [[COPY4]], [[REG_SEQUENCE]], [[COPY5]], 0, 0, 0, implicit $exec :: (dereferenceable load (<2 x s16>) from %ir.rsrc, align 1, addrspace 8)
  ; PACKED-NEXT:   $vgpr0 = COPY [[BUFFER_LOAD_FORMAT_D16_XY_OFFEN]]
  ; PACKED-NEXT:   SI_RETURN_TO_EPILOG implicit $vgpr0
  ;
  ; UNPACKED-LABEL: name: raw_ptr_buffer_load_format_v2f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset
  ; UNPACKED: bb.1 (%ir-block.0):
  ; UNPACKED-NEXT:   liveins: $sgpr2, $sgpr3, $sgpr4, $sgpr5, $sgpr6, $vgpr0
  ; UNPACKED-NEXT: {{  $}}
  ; UNPACKED-NEXT:   [[COPY:%[0-9]+]]:sreg_32 = COPY $sgpr2
  ; UNPACKED-NEXT:   [[COPY1:%[0-9]+]]:sreg_32 = COPY $sgpr3
  ; UNPACKED-NEXT:   [[COPY2:%[0-9]+]]:sreg_32 = COPY $sgpr4
  ; UNPACKED-NEXT:   [[COPY3:%[0-9]+]]:sreg_32 = COPY $sgpr5
  ; UNPACKED-NEXT:   [[COPY4:%[0-9]+]]:vgpr_32 = COPY $vgpr0
  ; UNPACKED-NEXT:   [[COPY5:%[0-9]+]]:sreg_32 = COPY $sgpr6
  ; UNPACKED-NEXT:   [[REG_SEQUENCE:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3
  ; UNPACKED-NEXT:   [[BUFFER_LOAD_FORMAT_D16_XY_gfx80_OFFEN:%[0-9]+]]:vreg_64 = BUFFER_LOAD_FORMAT_D16_XY_gfx80_OFFEN [[COPY4]], [[REG_SEQUENCE]], [[COPY5]], 0, 0, 0, implicit $exec :: (dereferenceable load (<2 x s16>) from %ir.rsrc, align 1, addrspace 8)
  ; UNPACKED-NEXT:   [[COPY6:%[0-9]+]]:vgpr_32 = COPY [[BUFFER_LOAD_FORMAT_D16_XY_gfx80_OFFEN]].sub0
  ; UNPACKED-NEXT:   [[COPY7:%[0-9]+]]:vgpr_32 = COPY [[BUFFER_LOAD_FORMAT_D16_XY_gfx80_OFFEN]].sub1
  ; UNPACKED-NEXT:   [[S_MOV_B32_:%[0-9]+]]:sreg_32 = S_MOV_B32 65535
  ; UNPACKED-NEXT:   [[COPY8:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_]]
  ; UNPACKED-NEXT:   [[V_AND_B32_e64_:%[0-9]+]]:vgpr_32 = V_AND_B32_e64 [[COPY6]], [[COPY8]], implicit $exec
  ; UNPACKED-NEXT:   [[COPY9:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_]]
  ; UNPACKED-NEXT:   [[V_AND_B32_e64_1:%[0-9]+]]:vgpr_32 = V_AND_B32_e64 [[COPY7]], [[COPY9]], implicit $exec
  ; UNPACKED-NEXT:   [[S_MOV_B32_1:%[0-9]+]]:sreg_32 = S_MOV_B32 16
  ; UNPACKED-NEXT:   [[COPY10:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_1]]
  ; UNPACKED-NEXT:   [[V_LSHLREV_B32_e64_:%[0-9]+]]:vgpr_32 = V_LSHLREV_B32_e64 [[COPY10]], [[V_AND_B32_e64_1]], implicit $exec
  ; UNPACKED-NEXT:   [[V_OR_B32_e64_:%[0-9]+]]:vgpr_32 = V_OR_B32_e64 [[V_AND_B32_e64_]], [[V_LSHLREV_B32_e64_]], implicit $exec
  ; UNPACKED-NEXT:   $vgpr0 = COPY [[V_OR_B32_e64_]]
  ; UNPACKED-NEXT:   SI_RETURN_TO_EPILOG implicit $vgpr0
  %val = call <2 x half> @llvm.amdgcn.raw.ptr.buffer.load.format.v2f16(ptr addrspace(8) %rsrc, i32 %voffset, i32 %soffset, i32 0)
  ret <2 x half> %val
}

; FIXME: the <3 x half> variant below is commented out, so it is not exercised
; by this test. The reason is not recorded in this file.
; define amdgpu_ps <3 x half> @raw_ptr_buffer_load_format_v3f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset(ptr addrspace(8) inreg %rsrc, i32 %voffset, i32 inreg %soffset) {
;   %val = call <3 x half> @llvm.amdgcn.raw.ptr.buffer.load.format.v3f16(ptr addrspace(8) %rsrc, i32 %voffset, i32 %soffset, i32 0)
;   ret <3 x half> %val
; }

; <4 x half> result, natural register mapping. PACKED expects a vreg_64 result
; returned via its two sub-registers; UNPACKED expects a vreg_128 result whose
; four sub-registers are pairwise masked, shifted and OR'd into $vgpr0/$vgpr1.
define amdgpu_ps <4 x half> @raw_ptr_buffer_load_format_v4f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset(ptr addrspace(8) inreg %rsrc, i32 %voffset, i32 inreg %soffset) {
  ; PACKED-LABEL: name: raw_ptr_buffer_load_format_v4f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset
  ; PACKED: bb.1 (%ir-block.0):
  ; PACKED-NEXT:   liveins: $sgpr2, $sgpr3, $sgpr4, $sgpr5, $sgpr6, $vgpr0
  ; PACKED-NEXT: {{  $}}
  ; PACKED-NEXT:   [[COPY:%[0-9]+]]:sreg_32 = COPY $sgpr2
  ; PACKED-NEXT:   [[COPY1:%[0-9]+]]:sreg_32 = COPY $sgpr3
  ; PACKED-NEXT:   [[COPY2:%[0-9]+]]:sreg_32 = COPY $sgpr4
  ; PACKED-NEXT:   [[COPY3:%[0-9]+]]:sreg_32 = COPY $sgpr5
  ; PACKED-NEXT:   [[COPY4:%[0-9]+]]:vgpr_32 = COPY $vgpr0
  ; PACKED-NEXT:   [[COPY5:%[0-9]+]]:sreg_32 = COPY $sgpr6
  ; PACKED-NEXT:   [[REG_SEQUENCE:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3
  ; PACKED-NEXT:   [[BUFFER_LOAD_FORMAT_D16_XYZW_OFFEN:%[0-9]+]]:vreg_64 = BUFFER_LOAD_FORMAT_D16_XYZW_OFFEN [[COPY4]], [[REG_SEQUENCE]], [[COPY5]], 0, 0, 0, implicit $exec :: (dereferenceable load (<4 x s16>) from %ir.rsrc, align 1, addrspace 8)
  ; PACKED-NEXT:   [[COPY6:%[0-9]+]]:vgpr_32 = COPY [[BUFFER_LOAD_FORMAT_D16_XYZW_OFFEN]].sub0
  ; PACKED-NEXT:   [[COPY7:%[0-9]+]]:vgpr_32 = COPY [[BUFFER_LOAD_FORMAT_D16_XYZW_OFFEN]].sub1
  ; PACKED-NEXT:   $vgpr0 = COPY [[COPY6]]
  ; PACKED-NEXT:   $vgpr1 = COPY [[COPY7]]
  ; PACKED-NEXT:   SI_RETURN_TO_EPILOG implicit $vgpr0, implicit $vgpr1
  ;
  ; UNPACKED-LABEL: name: raw_ptr_buffer_load_format_v4f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset
  ; UNPACKED: bb.1 (%ir-block.0):
  ; UNPACKED-NEXT:   liveins: $sgpr2, $sgpr3, $sgpr4, $sgpr5, $sgpr6, $vgpr0
  ; UNPACKED-NEXT: {{  $}}
  ; UNPACKED-NEXT:   [[COPY:%[0-9]+]]:sreg_32 = COPY $sgpr2
  ; UNPACKED-NEXT:   [[COPY1:%[0-9]+]]:sreg_32 = COPY $sgpr3
  ; UNPACKED-NEXT:   [[COPY2:%[0-9]+]]:sreg_32 = COPY $sgpr4
  ; UNPACKED-NEXT:   [[COPY3:%[0-9]+]]:sreg_32 = COPY $sgpr5
  ; UNPACKED-NEXT:   [[COPY4:%[0-9]+]]:vgpr_32 = COPY $vgpr0
  ; UNPACKED-NEXT:   [[COPY5:%[0-9]+]]:sreg_32 = COPY $sgpr6
  ; UNPACKED-NEXT:   [[REG_SEQUENCE:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3
  ; UNPACKED-NEXT:   [[BUFFER_LOAD_FORMAT_D16_XYZW_gfx80_OFFEN:%[0-9]+]]:vreg_128 = BUFFER_LOAD_FORMAT_D16_XYZW_gfx80_OFFEN [[COPY4]], [[REG_SEQUENCE]], [[COPY5]], 0, 0, 0, implicit $exec :: (dereferenceable load (<4 x s16>) from %ir.rsrc, align 1, addrspace 8)
  ; UNPACKED-NEXT:   [[COPY6:%[0-9]+]]:vgpr_32 = COPY [[BUFFER_LOAD_FORMAT_D16_XYZW_gfx80_OFFEN]].sub0
  ; UNPACKED-NEXT:   [[COPY7:%[0-9]+]]:vgpr_32 = COPY [[BUFFER_LOAD_FORMAT_D16_XYZW_gfx80_OFFEN]].sub1
  ; UNPACKED-NEXT:   [[COPY8:%[0-9]+]]:vgpr_32 = COPY [[BUFFER_LOAD_FORMAT_D16_XYZW_gfx80_OFFEN]].sub2
  ; UNPACKED-NEXT:   [[COPY9:%[0-9]+]]:vgpr_32 = COPY [[BUFFER_LOAD_FORMAT_D16_XYZW_gfx80_OFFEN]].sub3
  ; UNPACKED-NEXT:   [[S_MOV_B32_:%[0-9]+]]:sreg_32 = S_MOV_B32 65535
  ; UNPACKED-NEXT:   [[COPY10:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_]]
  ; UNPACKED-NEXT:   [[V_AND_B32_e64_:%[0-9]+]]:vgpr_32 = V_AND_B32_e64 [[COPY6]], [[COPY10]], implicit $exec
  ; UNPACKED-NEXT:   [[COPY11:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_]]
  ; UNPACKED-NEXT:   [[V_AND_B32_e64_1:%[0-9]+]]:vgpr_32 = V_AND_B32_e64 [[COPY7]], [[COPY11]], implicit $exec
  ; UNPACKED-NEXT:   [[S_MOV_B32_1:%[0-9]+]]:sreg_32 = S_MOV_B32 16
  ; UNPACKED-NEXT:   [[COPY12:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_1]]
  ; UNPACKED-NEXT:   [[V_LSHLREV_B32_e64_:%[0-9]+]]:vgpr_32 = V_LSHLREV_B32_e64 [[COPY12]], [[V_AND_B32_e64_1]], implicit $exec
  ; UNPACKED-NEXT:   [[V_OR_B32_e64_:%[0-9]+]]:vgpr_32 = V_OR_B32_e64 [[V_AND_B32_e64_]], [[V_LSHLREV_B32_e64_]], implicit $exec
  ; UNPACKED-NEXT:   [[COPY13:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_]]
  ; UNPACKED-NEXT:   [[V_AND_B32_e64_2:%[0-9]+]]:vgpr_32 = V_AND_B32_e64 [[COPY8]], [[COPY13]], implicit $exec
  ; UNPACKED-NEXT:   [[COPY14:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_]]
  ; UNPACKED-NEXT:   [[V_AND_B32_e64_3:%[0-9]+]]:vgpr_32 = V_AND_B32_e64 [[COPY9]], [[COPY14]], implicit $exec
  ; UNPACKED-NEXT:   [[COPY15:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_1]]
  ; UNPACKED-NEXT:   [[V_LSHLREV_B32_e64_1:%[0-9]+]]:vgpr_32 = V_LSHLREV_B32_e64 [[COPY15]], [[V_AND_B32_e64_3]], implicit $exec
  ; UNPACKED-NEXT:   [[V_OR_B32_e64_1:%[0-9]+]]:vgpr_32 = V_OR_B32_e64 [[V_AND_B32_e64_2]], [[V_LSHLREV_B32_e64_1]], implicit $exec
  ; UNPACKED-NEXT:   $vgpr0 = COPY [[V_OR_B32_e64_]]
  ; UNPACKED-NEXT:   $vgpr1 = COPY [[V_OR_B32_e64_1]]
  ; UNPACKED-NEXT:   SI_RETURN_TO_EPILOG implicit $vgpr0, implicit $vgpr1
  %val = call <4 x half> @llvm.amdgcn.raw.ptr.buffer.load.format.v4f16(ptr addrspace(8) %rsrc, i32 %voffset, i32 %soffset, i32 0)
  ret <4 x half> %val
}

; Waterfall for rsrc and soffset, copy for voffset.
; Here rsrc and soffset are not inreg (VGPR liveins) and voffset is inreg
; (SGPR livein). The checks expect a V_READFIRSTLANE_B32 / V_CMP_EQ /
; S_AND_SAVEEXEC_B64 loop (bb.2-bb.3, closed by SI_WATERFALL_LOOP) around the
; load, with $exec restored in bb.4, and a plain SGPR-to-VGPR COPY for voffset.
define amdgpu_ps half @raw_ptr_buffer_load_format_f16__vgpr_rsrc__sgpr_voffset__vgpr_soffset(ptr addrspace(8) %rsrc, i32 inreg %voffset, i32 %soffset) {
  ; PACKED-LABEL: name: raw_ptr_buffer_load_format_f16__vgpr_rsrc__sgpr_voffset__vgpr_soffset
  ; PACKED: bb.1 (%ir-block.0):
  ; PACKED-NEXT:   successors: %bb.2(0x80000000)
  ; PACKED-NEXT:   liveins: $sgpr2, $vgpr0, $vgpr1, $vgpr2, $vgpr3, $vgpr4
  ; PACKED-NEXT: {{  $}}
  ; PACKED-NEXT:   [[COPY:%[0-9]+]]:vgpr_32 = COPY $vgpr0
  ; PACKED-NEXT:   [[COPY1:%[0-9]+]]:vgpr_32 = COPY $vgpr1
  ; PACKED-NEXT:   [[COPY2:%[0-9]+]]:vgpr_32 = COPY $vgpr2
  ; PACKED-NEXT:   [[COPY3:%[0-9]+]]:vgpr_32 = COPY $vgpr3
  ; PACKED-NEXT:   [[COPY4:%[0-9]+]]:sreg_32 = COPY $sgpr2
  ; PACKED-NEXT:   [[COPY5:%[0-9]+]]:vgpr_32 = COPY $vgpr4
  ; PACKED-NEXT:   [[REG_SEQUENCE:%[0-9]+]]:vreg_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3
  ; PACKED-NEXT:   [[COPY6:%[0-9]+]]:vgpr_32 = COPY [[COPY4]]
  ; PACKED-NEXT:   [[S_MOV_B64_:%[0-9]+]]:sreg_64_xexec = S_MOV_B64 $exec
  ; PACKED-NEXT: {{  $}}
  ; PACKED-NEXT: bb.2:
  ; PACKED-NEXT:   successors: %bb.3(0x80000000)
  ; PACKED-NEXT: {{  $}}
  ; PACKED-NEXT:   [[V_READFIRSTLANE_B32_:%[0-9]+]]:sreg_32 = V_READFIRSTLANE_B32 [[COPY]], implicit $exec
  ; PACKED-NEXT:   [[V_READFIRSTLANE_B32_1:%[0-9]+]]:sreg_32 = V_READFIRSTLANE_B32 [[COPY1]], implicit $exec
  ; PACKED-NEXT:   [[V_READFIRSTLANE_B32_2:%[0-9]+]]:sreg_32 = V_READFIRSTLANE_B32 [[COPY2]], implicit $exec
  ; PACKED-NEXT:   [[V_READFIRSTLANE_B32_3:%[0-9]+]]:sreg_32 = V_READFIRSTLANE_B32 [[COPY3]], implicit $exec
  ; PACKED-NEXT:   [[REG_SEQUENCE1:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[V_READFIRSTLANE_B32_]], %subreg.sub0, [[V_READFIRSTLANE_B32_1]], %subreg.sub1, [[V_READFIRSTLANE_B32_2]], %subreg.sub2, [[V_READFIRSTLANE_B32_3]], %subreg.sub3
  ; PACKED-NEXT:   [[COPY7:%[0-9]+]]:vreg_64 = COPY [[REG_SEQUENCE]].sub0_sub1
  ; PACKED-NEXT:   [[COPY8:%[0-9]+]]:vreg_64 = COPY [[REG_SEQUENCE]].sub2_sub3
  ; PACKED-NEXT:   [[COPY9:%[0-9]+]]:sreg_64 = COPY [[REG_SEQUENCE1]].sub0_sub1
  ; PACKED-NEXT:   [[COPY10:%[0-9]+]]:sreg_64 = COPY [[REG_SEQUENCE1]].sub2_sub3
  ; PACKED-NEXT:   [[V_CMP_EQ_U64_e64_:%[0-9]+]]:sreg_64_xexec = V_CMP_EQ_U64_e64 [[COPY9]], [[COPY7]], implicit $exec
  ; PACKED-NEXT:   [[V_CMP_EQ_U64_e64_1:%[0-9]+]]:sreg_64_xexec = V_CMP_EQ_U64_e64 [[COPY10]], [[COPY8]], implicit $exec
  ; PACKED-NEXT:   [[S_AND_B64_:%[0-9]+]]:sreg_64_xexec = S_AND_B64 [[V_CMP_EQ_U64_e64_]], [[V_CMP_EQ_U64_e64_1]], implicit-def dead $scc
  ; PACKED-NEXT:   [[V_READFIRSTLANE_B32_4:%[0-9]+]]:sreg_32 = V_READFIRSTLANE_B32 [[COPY5]], implicit $exec
  ; PACKED-NEXT:   [[V_CMP_EQ_U32_e64_:%[0-9]+]]:sreg_64_xexec = V_CMP_EQ_U32_e64 [[V_READFIRSTLANE_B32_4]], [[COPY5]], implicit $exec
  ; PACKED-NEXT:   [[S_AND_B64_1:%[0-9]+]]:sreg_64_xexec = S_AND_B64 [[S_AND_B64_]], [[V_CMP_EQ_U32_e64_]], implicit-def dead $scc
  ; PACKED-NEXT:   [[S_AND_SAVEEXEC_B64_:%[0-9]+]]:sreg_64_xexec = S_AND_SAVEEXEC_B64 killed [[S_AND_B64_1]], implicit-def $exec, implicit-def $scc, implicit $exec
  ; PACKED-NEXT: {{  $}}
  ; PACKED-NEXT: bb.3:
  ; PACKED-NEXT:   successors: %bb.4(0x40000000), %bb.2(0x40000000)
  ; PACKED-NEXT: {{  $}}
  ; PACKED-NEXT:   [[BUFFER_LOAD_FORMAT_D16_X_OFFEN:%[0-9]+]]:vgpr_32 = BUFFER_LOAD_FORMAT_D16_X_OFFEN [[COPY6]], [[REG_SEQUENCE1]], [[V_READFIRSTLANE_B32_4]], 0, 0, 0, implicit $exec :: (dereferenceable load (s16) from %ir.rsrc, align 1, addrspace 8)
  ; PACKED-NEXT:   $exec = S_XOR_B64_term $exec, [[S_AND_SAVEEXEC_B64_]], implicit-def $scc
  ; PACKED-NEXT:   SI_WATERFALL_LOOP %bb.2, implicit $exec
  ; PACKED-NEXT: {{  $}}
  ; PACKED-NEXT: bb.4:
  ; PACKED-NEXT:   successors: %bb.5(0x80000000)
  ; PACKED-NEXT: {{  $}}
  ; PACKED-NEXT:   $exec = S_MOV_B64_term [[S_MOV_B64_]]
  ; PACKED-NEXT: {{  $}}
  ; PACKED-NEXT: bb.5:
  ; PACKED-NEXT:   $vgpr0 = COPY [[BUFFER_LOAD_FORMAT_D16_X_OFFEN]]
  ; PACKED-NEXT:   SI_RETURN_TO_EPILOG implicit $vgpr0
  ;
  ; UNPACKED-LABEL: name: raw_ptr_buffer_load_format_f16__vgpr_rsrc__sgpr_voffset__vgpr_soffset
  ; UNPACKED: bb.1 (%ir-block.0):
  ; UNPACKED-NEXT:   successors: %bb.2(0x80000000)
  ; UNPACKED-NEXT:   liveins: $sgpr2, $vgpr0, $vgpr1, $vgpr2, $vgpr3, $vgpr4
  ; UNPACKED-NEXT: {{  $}}
  ; UNPACKED-NEXT:   [[COPY:%[0-9]+]]:vgpr_32 = COPY $vgpr0
  ; UNPACKED-NEXT:   [[COPY1:%[0-9]+]]:vgpr_32 = COPY $vgpr1
  ; UNPACKED-NEXT:   [[COPY2:%[0-9]+]]:vgpr_32 = COPY $vgpr2
  ; UNPACKED-NEXT:   [[COPY3:%[0-9]+]]:vgpr_32 = COPY $vgpr3
  ; UNPACKED-NEXT:   [[COPY4:%[0-9]+]]:sreg_32 = COPY $sgpr2
  ; UNPACKED-NEXT:   [[COPY5:%[0-9]+]]:vgpr_32 = COPY $vgpr4
  ; UNPACKED-NEXT:   [[REG_SEQUENCE:%[0-9]+]]:vreg_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3
  ; UNPACKED-NEXT:   [[COPY6:%[0-9]+]]:vgpr_32 = COPY [[COPY4]]
  ; UNPACKED-NEXT:   [[S_MOV_B64_:%[0-9]+]]:sreg_64_xexec = S_MOV_B64 $exec
  ; UNPACKED-NEXT: {{  $}}
  ; UNPACKED-NEXT: bb.2:
  ; UNPACKED-NEXT:   successors: %bb.3(0x80000000)
  ; UNPACKED-NEXT: {{  $}}
  ; UNPACKED-NEXT:   [[V_READFIRSTLANE_B32_:%[0-9]+]]:sreg_32 = V_READFIRSTLANE_B32 [[COPY]], implicit $exec
  ; UNPACKED-NEXT:   [[V_READFIRSTLANE_B32_1:%[0-9]+]]:sreg_32 = V_READFIRSTLANE_B32 [[COPY1]], implicit $exec
  ; UNPACKED-NEXT:   [[V_READFIRSTLANE_B32_2:%[0-9]+]]:sreg_32 = V_READFIRSTLANE_B32 [[COPY2]], implicit $exec
  ; UNPACKED-NEXT:   [[V_READFIRSTLANE_B32_3:%[0-9]+]]:sreg_32 = V_READFIRSTLANE_B32 [[COPY3]], implicit $exec
  ; UNPACKED-NEXT:   [[REG_SEQUENCE1:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[V_READFIRSTLANE_B32_]], %subreg.sub0, [[V_READFIRSTLANE_B32_1]], %subreg.sub1, [[V_READFIRSTLANE_B32_2]], %subreg.sub2, [[V_READFIRSTLANE_B32_3]], %subreg.sub3
  ; UNPACKED-NEXT:   [[COPY7:%[0-9]+]]:vreg_64 = COPY [[REG_SEQUENCE]].sub0_sub1
  ; UNPACKED-NEXT:   [[COPY8:%[0-9]+]]:vreg_64 = COPY [[REG_SEQUENCE]].sub2_sub3
  ; UNPACKED-NEXT:   [[COPY9:%[0-9]+]]:sreg_64 = COPY [[REG_SEQUENCE1]].sub0_sub1
  ; UNPACKED-NEXT:   [[COPY10:%[0-9]+]]:sreg_64 = COPY [[REG_SEQUENCE1]].sub2_sub3
  ; UNPACKED-NEXT:   [[V_CMP_EQ_U64_e64_:%[0-9]+]]:sreg_64_xexec = V_CMP_EQ_U64_e64 [[COPY9]], [[COPY7]], implicit $exec
  ; UNPACKED-NEXT:   [[V_CMP_EQ_U64_e64_1:%[0-9]+]]:sreg_64_xexec = V_CMP_EQ_U64_e64 [[COPY10]], [[COPY8]], implicit $exec
  ; UNPACKED-NEXT:   [[S_AND_B64_:%[0-9]+]]:sreg_64_xexec = S_AND_B64 [[V_CMP_EQ_U64_e64_]], [[V_CMP_EQ_U64_e64_1]], implicit-def dead $scc
  ; UNPACKED-NEXT:   [[V_READFIRSTLANE_B32_4:%[0-9]+]]:sreg_32 = V_READFIRSTLANE_B32 [[COPY5]], implicit $exec
  ; UNPACKED-NEXT:   [[V_CMP_EQ_U32_e64_:%[0-9]+]]:sreg_64_xexec = V_CMP_EQ_U32_e64 [[V_READFIRSTLANE_B32_4]], [[COPY5]], implicit $exec
  ; UNPACKED-NEXT:   [[S_AND_B64_1:%[0-9]+]]:sreg_64_xexec = S_AND_B64 [[S_AND_B64_]], [[V_CMP_EQ_U32_e64_]], implicit-def dead $scc
  ; UNPACKED-NEXT:   [[S_AND_SAVEEXEC_B64_:%[0-9]+]]:sreg_64_xexec = S_AND_SAVEEXEC_B64 killed [[S_AND_B64_1]], implicit-def $exec, implicit-def $scc, implicit $exec
  ; UNPACKED-NEXT: {{  $}}
  ; UNPACKED-NEXT: bb.3:
  ; UNPACKED-NEXT:   successors: %bb.4(0x40000000), %bb.2(0x40000000)
  ; UNPACKED-NEXT: {{  $}}
  ; UNPACKED-NEXT:   [[BUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN:%[0-9]+]]:vgpr_32 = BUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN [[COPY6]], [[REG_SEQUENCE1]], [[V_READFIRSTLANE_B32_4]], 0, 0, 0, implicit $exec :: (dereferenceable load (s16) from %ir.rsrc, align 1, addrspace 8)
  ; UNPACKED-NEXT:   $exec = S_XOR_B64_term $exec, [[S_AND_SAVEEXEC_B64_]], implicit-def $scc
  ; UNPACKED-NEXT:   SI_WATERFALL_LOOP %bb.2, implicit $exec
  ; UNPACKED-NEXT: {{  $}}
  ; UNPACKED-NEXT: bb.4:
  ; UNPACKED-NEXT:   successors: %bb.5(0x80000000)
  ; UNPACKED-NEXT: {{  $}}
  ; UNPACKED-NEXT:   $exec = S_MOV_B64_term [[S_MOV_B64_]]
  ; UNPACKED-NEXT: {{  $}}
  ; UNPACKED-NEXT: bb.5:
  ; UNPACKED-NEXT:   $vgpr0 = COPY [[BUFFER_LOAD_FORMAT_D16_X_gfx80_OFFEN]]
  ; UNPACKED-NEXT:   SI_RETURN_TO_EPILOG implicit $vgpr0
  %val = call half @llvm.amdgcn.raw.ptr.buffer.load.format.f16(ptr addrspace(8) %rsrc, i32 %voffset, i32 %soffset, i32 0)
  ret half %val
}

; voffset is computed as %voffset.base + 4095. The checks expect no separate
; add instruction: 4095 appears as the first immediate operand of the load and
; the base value ([[COPY4]]) is used directly as the VGPR offset.
define amdgpu_ps <4 x half> @raw_ptr_buffer_load_format_v4f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset_voffset_add_4095(ptr addrspace(8) inreg %rsrc, i32 %voffset.base, i32 inreg %soffset) {
  ; PACKED-LABEL: name: raw_ptr_buffer_load_format_v4f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset_voffset_add_4095
  ; PACKED: bb.1 (%ir-block.0):
  ; PACKED-NEXT:   liveins: $sgpr2, $sgpr3, $sgpr4, $sgpr5, $sgpr6, $vgpr0
  ; PACKED-NEXT: {{  $}}
  ; PACKED-NEXT:   [[COPY:%[0-9]+]]:sreg_32 = COPY $sgpr2
  ; PACKED-NEXT:   [[COPY1:%[0-9]+]]:sreg_32 = COPY $sgpr3
  ; PACKED-NEXT:   [[COPY2:%[0-9]+]]:sreg_32 = COPY $sgpr4
  ; PACKED-NEXT:   [[COPY3:%[0-9]+]]:sreg_32 = COPY $sgpr5
  ; PACKED-NEXT:   [[COPY4:%[0-9]+]]:vgpr_32 = COPY $vgpr0
  ; PACKED-NEXT:   [[COPY5:%[0-9]+]]:sreg_32 = COPY $sgpr6
  ; PACKED-NEXT:   [[REG_SEQUENCE:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3
  ; PACKED-NEXT:   [[BUFFER_LOAD_FORMAT_D16_XYZW_OFFEN:%[0-9]+]]:vreg_64 = BUFFER_LOAD_FORMAT_D16_XYZW_OFFEN [[COPY4]], [[REG_SEQUENCE]], [[COPY5]], 4095, 0, 0, implicit $exec :: (dereferenceable load (<4 x s16>) from %ir.rsrc, align 1, addrspace 8)
  ; PACKED-NEXT:   [[COPY6:%[0-9]+]]:vgpr_32 = COPY [[BUFFER_LOAD_FORMAT_D16_XYZW_OFFEN]].sub0
  ; PACKED-NEXT:   [[COPY7:%[0-9]+]]:vgpr_32 = COPY [[BUFFER_LOAD_FORMAT_D16_XYZW_OFFEN]].sub1
  ; PACKED-NEXT:   $vgpr0 = COPY [[COPY6]]
  ; PACKED-NEXT:   $vgpr1 = COPY [[COPY7]]
  ; PACKED-NEXT:   SI_RETURN_TO_EPILOG implicit $vgpr0, implicit $vgpr1
  ;
  ; UNPACKED-LABEL: name: raw_ptr_buffer_load_format_v4f16__sgpr_rsrc__vgpr_voffset__sgpr_soffset_voffset_add_4095
  ; UNPACKED: bb.1 (%ir-block.0):
  ; UNPACKED-NEXT:   liveins: $sgpr2, $sgpr3, $sgpr4, $sgpr5, $sgpr6, $vgpr0
  ; UNPACKED-NEXT: {{  $}}
  ; UNPACKED-NEXT:   [[COPY:%[0-9]+]]:sreg_32 = COPY $sgpr2
  ; UNPACKED-NEXT:   [[COPY1:%[0-9]+]]:sreg_32 = COPY $sgpr3
  ; UNPACKED-NEXT:   [[COPY2:%[0-9]+]]:sreg_32 = COPY $sgpr4
  ; UNPACKED-NEXT:   [[COPY3:%[0-9]+]]:sreg_32 = COPY $sgpr5
  ; UNPACKED-NEXT:   [[COPY4:%[0-9]+]]:vgpr_32 = COPY $vgpr0
  ; UNPACKED-NEXT:   [[COPY5:%[0-9]+]]:sreg_32 = COPY $sgpr6
  ; UNPACKED-NEXT:   [[REG_SEQUENCE:%[0-9]+]]:sgpr_128 = REG_SEQUENCE [[COPY]], %subreg.sub0, [[COPY1]], %subreg.sub1, [[COPY2]], %subreg.sub2, [[COPY3]], %subreg.sub3
  ; UNPACKED-NEXT:   [[BUFFER_LOAD_FORMAT_D16_XYZW_gfx80_OFFEN:%[0-9]+]]:vreg_128 = BUFFER_LOAD_FORMAT_D16_XYZW_gfx80_OFFEN [[COPY4]], [[REG_SEQUENCE]], [[COPY5]], 4095, 0, 0, implicit $exec :: (dereferenceable load (<4 x s16>) from %ir.rsrc, align 1, addrspace 8)
  ; UNPACKED-NEXT:   [[COPY6:%[0-9]+]]:vgpr_32 = COPY [[BUFFER_LOAD_FORMAT_D16_XYZW_gfx80_OFFEN]].sub0
  ; UNPACKED-NEXT:   [[COPY7:%[0-9]+]]:vgpr_32 = COPY [[BUFFER_LOAD_FORMAT_D16_XYZW_gfx80_OFFEN]].sub1
  ; UNPACKED-NEXT:   [[COPY8:%[0-9]+]]:vgpr_32 = COPY [[BUFFER_LOAD_FORMAT_D16_XYZW_gfx80_OFFEN]].sub2
  ; UNPACKED-NEXT:   [[COPY9:%[0-9]+]]:vgpr_32 = COPY [[BUFFER_LOAD_FORMAT_D16_XYZW_gfx80_OFFEN]].sub3
  ; UNPACKED-NEXT:   [[S_MOV_B32_:%[0-9]+]]:sreg_32 = S_MOV_B32 65535
  ; UNPACKED-NEXT:   [[COPY10:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_]]
  ; UNPACKED-NEXT:   [[V_AND_B32_e64_:%[0-9]+]]:vgpr_32 = V_AND_B32_e64 [[COPY6]], [[COPY10]], implicit $exec
  ; UNPACKED-NEXT:   [[COPY11:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_]]
  ; UNPACKED-NEXT:   [[V_AND_B32_e64_1:%[0-9]+]]:vgpr_32 = V_AND_B32_e64 [[COPY7]], [[COPY11]], implicit $exec
  ; UNPACKED-NEXT:   [[S_MOV_B32_1:%[0-9]+]]:sreg_32 = S_MOV_B32 16
  ; UNPACKED-NEXT:   [[COPY12:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_1]]
  ; UNPACKED-NEXT:   [[V_LSHLREV_B32_e64_:%[0-9]+]]:vgpr_32 = V_LSHLREV_B32_e64 [[COPY12]], [[V_AND_B32_e64_1]], implicit $exec
  ; UNPACKED-NEXT:   [[V_OR_B32_e64_:%[0-9]+]]:vgpr_32 = V_OR_B32_e64 [[V_AND_B32_e64_]], [[V_LSHLREV_B32_e64_]], implicit $exec
  ; UNPACKED-NEXT:   [[COPY13:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_]]
  ; UNPACKED-NEXT:   [[V_AND_B32_e64_2:%[0-9]+]]:vgpr_32 = V_AND_B32_e64 [[COPY8]], [[COPY13]], implicit $exec
  ; UNPACKED-NEXT:   [[COPY14:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_]]
  ; UNPACKED-NEXT:   [[V_AND_B32_e64_3:%[0-9]+]]:vgpr_32 = V_AND_B32_e64 [[COPY9]], [[COPY14]], implicit $exec
  ; UNPACKED-NEXT:   [[COPY15:%[0-9]+]]:vgpr_32 = COPY [[S_MOV_B32_1]]
  ; UNPACKED-NEXT:   [[V_LSHLREV_B32_e64_1:%[0-9]+]]:vgpr_32 = V_LSHLREV_B32_e64 [[COPY15]], [[V_AND_B32_e64_3]], implicit $exec
  ; UNPACKED-NEXT:   [[V_OR_B32_e64_1:%[0-9]+]]:vgpr_32 = V_OR_B32_e64 [[V_AND_B32_e64_2]], [[V_LSHLREV_B32_e64_1]], implicit $exec
  ; UNPACKED-NEXT:   $vgpr0 = COPY [[V_OR_B32_e64_]]
  ; UNPACKED-NEXT:   $vgpr1 = COPY [[V_OR_B32_e64_1]]
  ; UNPACKED-NEXT:   SI_RETURN_TO_EPILOG implicit $vgpr0, implicit $vgpr1
  %voffset = add i32 %voffset.base, 4095
  %val = call <4 x half> @llvm.amdgcn.raw.ptr.buffer.load.format.v4f16(ptr addrspace(8) %rsrc, i32 %voffset, i32 %soffset, i32 0)
  ret <4 x half> %val
}

; Intrinsic declarations used above. The v3f16 declaration is referenced only
; by the commented-out FIXME test.
declare half @llvm.amdgcn.raw.ptr.buffer.load.format.f16(ptr addrspace(8), i32, i32, i32 immarg) #0
declare <2 x half> @llvm.amdgcn.raw.ptr.buffer.load.format.v2f16(ptr addrspace(8), i32, i32, i32 immarg) #0
declare <3 x half> @llvm.amdgcn.raw.ptr.buffer.load.format.v3f16(ptr addrspace(8), i32, i32, i32 immarg) #0
declare <4 x half> @llvm.amdgcn.raw.ptr.buffer.load.format.v4f16(ptr addrspace(8), i32, i32, i32 immarg) #0

attributes #0 = { nounwind readonly }