diff options
Diffstat (limited to 'llvm/test/CodeGen/AMDGPU/ds-alignment.ll')
| -rw-r--r-- | llvm/test/CodeGen/AMDGPU/ds-alignment.ll | 84 |
1 files changed, 42 insertions, 42 deletions
diff --git a/llvm/test/CodeGen/AMDGPU/ds-alignment.ll b/llvm/test/CodeGen/AMDGPU/ds-alignment.ll index b1664c59a7e4..93422e259b82 100644 --- a/llvm/test/CodeGen/AMDGPU/ds-alignment.ll +++ b/llvm/test/CodeGen/AMDGPU/ds-alignment.ll @@ -209,27 +209,28 @@ define amdgpu_kernel void @ds8align1(ptr addrspace(3) %in, ptr addrspace(3) %out ; ALIGNED-SDAG-NEXT: s_load_dwordx2 s[0:1], s[4:5], 0x24 ; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(0) ; ALIGNED-SDAG-NEXT: v_mov_b32_e32 v0, s0 -; ALIGNED-SDAG-NEXT: ds_read_u8 v1, v0 -; ALIGNED-SDAG-NEXT: ds_read_u8 v2, v0 offset:1 -; ALIGNED-SDAG-NEXT: ds_read_u8 v3, v0 offset:2 -; ALIGNED-SDAG-NEXT: ds_read_u8 v4, v0 offset:3 +; ALIGNED-SDAG-NEXT: ds_read_u8 v2, v0 +; ALIGNED-SDAG-NEXT: ds_read_u8 v3, v0 offset:1 +; ALIGNED-SDAG-NEXT: ds_read_u8 v4, v0 offset:2 ; ALIGNED-SDAG-NEXT: ds_read_u8 v5, v0 offset:4 ; ALIGNED-SDAG-NEXT: ds_read_u8 v6, v0 offset:5 +; ALIGNED-SDAG-NEXT: ds_read_u8 v7, v0 offset:3 ; ALIGNED-SDAG-NEXT: ds_read_u8 v8, v0 offset:6 ; ALIGNED-SDAG-NEXT: ds_read_u8 v0, v0 offset:7 -; ALIGNED-SDAG-NEXT: v_mov_b32_e32 v7, s1 -; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(3) -; ALIGNED-SDAG-NEXT: ds_write_b8 v7, v5 offset:4 -; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(3) -; ALIGNED-SDAG-NEXT: ds_write_b8 v7, v6 offset:5 -; ALIGNED-SDAG-NEXT: ds_write_b8 v7, v1 -; ALIGNED-SDAG-NEXT: ds_write_b8 v7, v2 offset:1 -; ALIGNED-SDAG-NEXT: ds_write_b8 v7, v3 offset:2 -; ALIGNED-SDAG-NEXT: ds_write_b8 v7, v4 offset:3 +; ALIGNED-SDAG-NEXT: v_mov_b32_e32 v1, s1 +; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(4) +; ALIGNED-SDAG-NEXT: ds_write_b8 v1, v5 offset:4 +; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(4) +; ALIGNED-SDAG-NEXT: ds_write_b8 v1, v6 offset:5 +; ALIGNED-SDAG-NEXT: ds_write_b8 v1, v2 +; ALIGNED-SDAG-NEXT: ds_write_b8 v1, v3 offset:1 +; ALIGNED-SDAG-NEXT: ds_write_b8 v1, v4 offset:2 ; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(7) -; ALIGNED-SDAG-NEXT: ds_write_b8 v7, v8 offset:6 +; ALIGNED-SDAG-NEXT: ds_write_b8 v1, v7 offset:3 ; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(7) -; ALIGNED-SDAG-NEXT: ds_write_b8 v7, v0 offset:7 +; ALIGNED-SDAG-NEXT: ds_write_b8 v1, v8 offset:6 +; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(7) +; ALIGNED-SDAG-NEXT: ds_write_b8 v1, v0 offset:7 ; ALIGNED-SDAG-NEXT: s_endpgm ; ; ALIGNED-GISEL-LABEL: ds8align1: @@ -492,23 +493,24 @@ define amdgpu_kernel void @ds12align2(ptr addrspace(3) %in, ptr addrspace(3) %ou ; ALIGNED-SDAG-NEXT: s_load_dwordx2 s[0:1], s[4:5], 0x24 ; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(0) ; ALIGNED-SDAG-NEXT: v_mov_b32_e32 v0, s0 -; ALIGNED-SDAG-NEXT: ds_read_u16 v1, v0 offset:8 ; ALIGNED-SDAG-NEXT: ds_read_u16 v2, v0 -; ALIGNED-SDAG-NEXT: ds_read_u16 v3, v0 offset:2 +; ALIGNED-SDAG-NEXT: ds_read_u16 v3, v0 offset:8 ; ALIGNED-SDAG-NEXT: ds_read_u16 v4, v0 offset:4 -; ALIGNED-SDAG-NEXT: ds_read_u16 v5, v0 offset:6 -; ALIGNED-SDAG-NEXT: v_mov_b32_e32 v6, s1 +; ALIGNED-SDAG-NEXT: ds_read_u16 v5, v0 offset:2 +; ALIGNED-SDAG-NEXT: ds_read_u16 v6, v0 offset:6 ; ALIGNED-SDAG-NEXT: ds_read_u16 v0, v0 offset:10 +; ALIGNED-SDAG-NEXT: v_mov_b32_e32 v1, s1 +; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(4) +; ALIGNED-SDAG-NEXT: ds_write_b16 v1, v3 offset:8 +; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(4) +; ALIGNED-SDAG-NEXT: ds_write_b16 v1, v4 offset:4 +; ALIGNED-SDAG-NEXT: ds_write_b16 v1, v2 ; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(5) -; ALIGNED-SDAG-NEXT: ds_write_b16 v6, v1 offset:8 -; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(3) -; ALIGNED-SDAG-NEXT: ds_write_b16 v6, v4 offset:4 -; ALIGNED-SDAG-NEXT: ds_write_b16 v6, v2 -; ALIGNED-SDAG-NEXT: ds_write_b16 v6, v3 offset:2 +; ALIGNED-SDAG-NEXT: ds_write_b16 v1, v5 offset:2 ; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(5) -; ALIGNED-SDAG-NEXT: ds_write_b16 v6, v5 offset:6 +; ALIGNED-SDAG-NEXT: ds_write_b16 v1, v6 offset:6 ; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(5) -; ALIGNED-SDAG-NEXT: ds_write_b16 v6, v0 offset:10 +; ALIGNED-SDAG-NEXT: ds_write_b16 v1, v0 offset:10 ; ALIGNED-SDAG-NEXT: s_endpgm ; ; ALIGNED-GISEL-LABEL: ds12align2: @@ -808,29 +810,27 @@ define amdgpu_kernel void @ds16align2(ptr addrspace(3) %in, ptr addrspace(3) %ou ; ALIGNED-SDAG-NEXT: s_load_dwordx2 s[0:1], s[4:5], 0x24 ; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(0) ; ALIGNED-SDAG-NEXT: v_mov_b32_e32 v0, s0 -; ALIGNED-SDAG-NEXT: ds_read_u16 v1, v0 offset:12 ; ALIGNED-SDAG-NEXT: ds_read_u16 v2, v0 ; ALIGNED-SDAG-NEXT: ds_read_u16 v3, v0 offset:2 ; ALIGNED-SDAG-NEXT: ds_read_u16 v4, v0 offset:4 -; ALIGNED-SDAG-NEXT: ds_read_u16 v5, v0 offset:6 -; ALIGNED-SDAG-NEXT: ds_read_u16 v6, v0 offset:8 -; ALIGNED-SDAG-NEXT: ds_read_u16 v7, v0 offset:10 -; ALIGNED-SDAG-NEXT: v_mov_b32_e32 v8, s1 +; ALIGNED-SDAG-NEXT: ds_read_u16 v5, v0 offset:12 +; ALIGNED-SDAG-NEXT: ds_read_u16 v6, v0 offset:6 +; ALIGNED-SDAG-NEXT: ds_read_u16 v7, v0 offset:8 +; ALIGNED-SDAG-NEXT: ds_read_u16 v8, v0 offset:10 ; ALIGNED-SDAG-NEXT: ds_read_u16 v0, v0 offset:14 -; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(7) -; ALIGNED-SDAG-NEXT: ds_write_b16 v8, v1 offset:12 -; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(7) -; ALIGNED-SDAG-NEXT: ds_write_b16 v8, v2 -; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(6) -; ALIGNED-SDAG-NEXT: ds_write_b16 v8, v4 offset:4 +; ALIGNED-SDAG-NEXT: v_mov_b32_e32 v1, s1 +; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(4) +; ALIGNED-SDAG-NEXT: ds_write_b16 v1, v5 offset:12 +; ALIGNED-SDAG-NEXT: ds_write_b16 v1, v2 +; ALIGNED-SDAG-NEXT: ds_write_b16 v1, v4 offset:4 ; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(5) -; ALIGNED-SDAG-NEXT: ds_write_b16 v8, v6 offset:8 -; ALIGNED-SDAG-NEXT: ds_write_b16 v8, v3 offset:2 -; ALIGNED-SDAG-NEXT: ds_write_b16 v8, v5 offset:6 +; ALIGNED-SDAG-NEXT: ds_write_b16 v1, v7 offset:8 +; ALIGNED-SDAG-NEXT: ds_write_b16 v1, v3 offset:2 +; ALIGNED-SDAG-NEXT: ds_write_b16 v1, v6 offset:6 ; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(7) -; ALIGNED-SDAG-NEXT: ds_write_b16 v8, v7 offset:10 +; ALIGNED-SDAG-NEXT: ds_write_b16 v1, v8 offset:10 ; ALIGNED-SDAG-NEXT: s_waitcnt lgkmcnt(7) -; ALIGNED-SDAG-NEXT: ds_write_b16 v8, v0 offset:14 +; ALIGNED-SDAG-NEXT: ds_write_b16 v1, v0 offset:14 ; ALIGNED-SDAG-NEXT: s_endpgm ; ; ALIGNED-GISEL-LABEL: ds16align2: |
