|
| 1 | +; NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py |
| 2 | +; RUN: llc -global-isel -march=amdgcn -mcpu=gfx900 -verify-machineinstrs -stop-after twoaddressinstruction < %s | FileCheck %s |
| 3 | + |
| 4 | +; Loads a <3 x i32> through an inreg addrspace(4) pointer with align 4 and checks the MIR after the twoaddressinstruction pass. |
| 5 | +; FIXME: the operand "undef %16.sub0_sub1:sgpr_96" will fail machine verification because sgpr_96 does not fully support sub0_sub1. |
| 6 | +define amdgpu_ps <3 x i32> @s_load_constant_v3i32_align4(<3 x i32> addrspace(4)* inreg %ptr) { |
| 7 | + ; CHECK-LABEL: name: s_load_constant_v3i32_align4 |
| 8 | + ; CHECK: bb.0 (%ir-block.0): |
| 9 | + ; CHECK-NEXT: liveins: $sgpr0, $sgpr1 |
| 10 | + ; CHECK-NEXT: {{ $}} |
| 11 | + ; CHECK-NEXT: [[COPY:%[0-9]+]]:sreg_32 = COPY killed $sgpr0 |
| 12 | + ; CHECK-NEXT: [[COPY1:%[0-9]+]]:sreg_32 = COPY killed $sgpr1 |
| 13 | + ; CHECK-NEXT: undef %0.sub0:sreg_64 = COPY killed [[COPY]] |
| 14 | + ; CHECK-NEXT: %0.sub1:sreg_64 = COPY killed [[COPY1]] |
| 15 | + ; CHECK-NEXT: [[S_LOAD_DWORDX2_IMM:%[0-9]+]]:sreg_64_xexec = S_LOAD_DWORDX2_IMM %0, 0, 0 :: (load (<2 x s32>) from %ir.ptr, align 4, addrspace 4) |
| 16 | + ; CHECK-NEXT: [[S_LOAD_DWORD_IMM:%[0-9]+]]:sreg_32_xm0_xexec = S_LOAD_DWORD_IMM killed %0, 8, 0 :: (load (s32) from %ir.ptr + 8, addrspace 4) |
| 17 | + ; CHECK-NEXT: undef %16.sub0_sub1:sgpr_96 = COPY killed [[S_LOAD_DWORDX2_IMM]] |
| 18 | + ; CHECK-NEXT: [[COPY2:%[0-9]+]]:sgpr_96 = COPY killed %16 |
| 19 | + ; CHECK-NEXT: [[COPY2]].sub2:sgpr_96 = COPY undef [[S_LOAD_DWORD_IMM]] |
| 20 | + ; CHECK-NEXT: [[COPY3:%[0-9]+]]:sreg_32 = COPY [[COPY2]].sub0 |
| 21 | + ; CHECK-NEXT: $sgpr0 = COPY killed [[COPY3]] |
| 22 | + ; CHECK-NEXT: [[COPY4:%[0-9]+]]:sreg_32 = COPY killed [[COPY2]].sub1 |
| 23 | + ; CHECK-NEXT: $sgpr1 = COPY killed [[COPY4]] |
| 24 | + ; CHECK-NEXT: [[COPY5:%[0-9]+]]:sreg_32 = COPY killed [[S_LOAD_DWORD_IMM]] |
| 25 | + ; CHECK-NEXT: $sgpr2 = COPY killed [[COPY5]] |
| 26 | + ; CHECK-NEXT: SI_RETURN_TO_EPILOG implicit killed $sgpr0, implicit killed $sgpr1, implicit killed $sgpr2 |
| 27 | + %load = load <3 x i32>, <3 x i32> addrspace(4)* %ptr, align 4 |
| 28 | + ret <3 x i32> %load |
| 29 | +} |
0 commit comments