From 5aee09da12a1ba8553792d9017785e51199e38c2 Mon Sep 17 00:00:00 2001 From: Tom Stellard Date: Sat, 15 Jun 2013 00:09:31 +0000 Subject: [PATCH] R600: Add SI load support for v[24]i32 and store for v2i32 Also add a separate vector lit test file, since r600 doesn't seem to handle v2i32 load/store yet, but we can test both for SI. Patch by: Aaron Watry Reviewed-by: Tom Stellard Signed-off-by: Aaron Watry git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@184021 91177308-0d34-0410-b5e6-96231b3b80d8 --- lib/Target/R600/SIInstructions.td | 5 +++++ test/CodeGen/R600/load.vec.ll | 19 +++++++++++++++++++ 2 files changed, 24 insertions(+) create mode 100644 test/CodeGen/R600/load.vec.ll diff --git a/lib/Target/R600/SIInstructions.td b/lib/Target/R600/SIInstructions.td index e8ed2dd5da4..9c96c080c08 100644 --- a/lib/Target/R600/SIInstructions.td +++ b/lib/Target/R600/SIInstructions.td @@ -1638,6 +1638,10 @@ defm : MUBUFLoad_Pattern ; defm : MUBUFLoad_Pattern ; +defm : MUBUFLoad_Pattern ; +defm : MUBUFLoad_Pattern ; multiclass MUBUFStore_Pattern { @@ -1654,6 +1658,7 @@ multiclass MUBUFStore_Pattern { defm : MUBUFStore_Pattern ; defm : MUBUFStore_Pattern ; +defm : MUBUFStore_Pattern ; defm : MUBUFStore_Pattern ; /********** ====================== **********/ diff --git a/test/CodeGen/R600/load.vec.ll b/test/CodeGen/R600/load.vec.ll new file mode 100644 index 00000000000..08e034e4562 --- /dev/null +++ b/test/CodeGen/R600/load.vec.ll @@ -0,0 +1,19 @@ +; RUN: llc < %s -march=r600 -mcpu=SI | FileCheck --check-prefix=SI-CHECK %s + +; load a v2i32 value from the global address space. +; SI-CHECK: @load_v2i32 +; SI-CHECK: BUFFER_LOAD_DWORDX2 VGPR{{[0-9]+}} +define void @load_v2i32(<2 x i32> addrspace(1)* %out, <2 x i32> addrspace(1)* %in) { + %a = load <2 x i32> addrspace(1) * %in + store <2 x i32> %a, <2 x i32> addrspace(1)* %out + ret void +} + +; load a v4i32 value from the global address space.
+; SI-CHECK: @load_v4i32
+; SI-CHECK: BUFFER_LOAD_DWORDX4 VGPR{{[0-9]+}}
+define void @load_v4i32(<4 x i32> addrspace(1)* %out, <4 x i32> addrspace(1)* %in) {
+  %a = load <4 x i32> addrspace(1) * %in ; read one <4 x i32> through the addrspace(1) pointer %in
+  store <4 x i32> %a, <4 x i32> addrspace(1)* %out ; write the loaded value through the addrspace(1) pointer %out
+  ret void
+}