mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-01-08 03:30:22 +00:00
dab5145cb3
Summary: Constant stores of f16 vectors can create NvCast nodes from various operand types to v4f16 or v8f16 depending on patterns in the stored constants. This patch adds nvcast rules with v4f16 and v8f16 values. AArchISelLowering::LowerBUILD_VECTOR has the details on which constant patterns generate the nvcast nodes. Reviewers: jmolloy, srhines, ab Subscribers: rengolin, aemerson, llvm-commits Differential Revision: http://reviews.llvm.org/D9201 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@235610 91177308-0d34-0410-b5e6-96231b3b80d8
90 lines
2.9 KiB
LLVM
90 lines
2.9 KiB
LLVM
; RUN: llc < %s -asm-verbose=false -mtriple=aarch64-none-eabi | FileCheck %s
|
|
|
|
; Test pattern (v4f16 (AArch64NvCast (v2i32 FPR64:$src)))
|
|
define void @nvcast_v2i32(<4 x half>* %a) #0 {
|
|
; CHECK-LABEL: nvcast_v2i32:
|
|
; CHECK-NEXT: movi v[[REG:[0-9]+]].2s, #0xab, lsl #16
|
|
; CHECK-NEXT: str d[[REG]], [x0]
|
|
; CHECK-NEXT: ret
|
|
store volatile <4 x half> <half 0xH0000, half 0xH00AB, half 0xH0000, half 0xH00AB>, <4 x half>* %a
|
|
ret void
|
|
}
|
|
|
|
|
|
; Test pattern (v4f16 (AArch64NvCast (v4i16 FPR64:$src)))
|
|
define void @nvcast_v4i16(<4 x half>* %a) #0 {
|
|
; CHECK-LABEL: nvcast_v4i16:
|
|
; CHECK-NEXT: movi v[[REG:[0-9]+]].4h, #0xab
|
|
; CHECK-NEXT: str d[[REG]], [x0]
|
|
; CHECK-NEXT: ret
|
|
store volatile <4 x half> <half 0xH00AB, half 0xH00AB, half 0xH00AB, half 0xH00AB>, <4 x half>* %a
|
|
ret void
|
|
}
|
|
|
|
|
|
; Test pattern (v4f16 (AArch64NvCast (v8i8 FPR64:$src)))
|
|
define void @nvcast_v8i8(<4 x half>* %a) #0 {
|
|
; CHECK-LABEL: nvcast_v8i8:
|
|
; CHECK-NEXT: movi v[[REG:[0-9]+]].8b, #0xab
|
|
; CHECK-NEXT: str d[[REG]], [x0]
|
|
; CHECK-NEXT: ret
|
|
store volatile <4 x half> <half 0xHABAB, half 0xHABAB, half 0xHABAB, half 0xHABAB>, <4 x half>* %a
|
|
ret void
|
|
}
|
|
|
|
|
|
; Test pattern (v4f16 (AArch64NvCast (f64 FPR64:$src)))
|
|
define void @nvcast_f64(<4 x half>* %a) #0 {
|
|
; CHECK-LABEL: nvcast_f64:
|
|
; CHECK-NEXT: movi d[[REG:[0-9]+]], #0000000000000000
|
|
; CHECK-NEXT: str d[[REG]], [x0]
|
|
; CHECK-NEXT: ret
|
|
store volatile <4 x half> zeroinitializer, <4 x half>* %a
|
|
ret void
|
|
}
|
|
|
|
; Test pattern (v8f16 (AArch64NvCast (v4i32 FPR128:$src)))
|
|
define void @nvcast_v4i32(<8 x half>* %a) #0 {
|
|
; CHECK-LABEL: nvcast_v4i32:
|
|
; CHECK-NEXT: movi v[[REG:[0-9]+]].4s, #0xab, lsl #16
|
|
; CHECK-NEXT: str q[[REG]], [x0]
|
|
; CHECK-NEXT: ret
|
|
store volatile <8 x half> <half 0xH0000, half 0xH00AB, half 0xH0000, half 0xH00AB, half 0xH0000, half 0xH00AB, half 0xH0000, half 0xH00AB>, <8 x half>* %a
|
|
ret void
|
|
}
|
|
|
|
|
|
; Test pattern (v8f16 (AArch64NvCast (v8i16 FPR128:$src)))
|
|
define void @nvcast_v8i16(<8 x half>* %a) #0 {
|
|
; CHECK-LABEL: nvcast_v8i16:
|
|
; CHECK-NEXT: movi v[[REG:[0-9]+]].8h, #0xab
|
|
; CHECK-NEXT: str q[[REG]], [x0]
|
|
; CHECK-NEXT: ret
|
|
store volatile <8 x half> <half 0xH00AB, half 0xH00AB, half 0xH00AB, half 0xH00AB, half 0xH00AB, half 0xH00AB, half 0xH00AB, half 0xH00AB>, <8 x half>* %a
|
|
ret void
|
|
}
|
|
|
|
|
|
; Test pattern (v8f16 (AArch64NvCast (v16i8 FPR128:$src)))
|
|
define void @nvcast_v16i8(<8 x half>* %a) #0 {
|
|
; CHECK-LABEL: nvcast_v16i8:
|
|
; CHECK-NEXT: movi v[[REG:[0-9]+]].16b, #0xab
|
|
; CHECK-NEXT: str q[[REG]], [x0]
|
|
; CHECK-NEXT: ret
|
|
store volatile <8 x half> <half 0xHABAB, half 0xHABAB, half 0xHABAB, half 0xHABAB, half 0xHABAB, half 0xHABAB, half 0xHABAB, half 0xHABAB>, <8 x half>* %a
|
|
ret void
|
|
}
|
|
|
|
|
|
; Test pattern (v8f16 (AArch64NvCast (v2i64 FPR128:$src)))
|
|
define void @nvcast_v2i64(<8 x half>* %a) #0 {
|
|
; CHECK-LABEL: nvcast_v2i64:
|
|
; CHECK-NEXT: movi v[[REG:[0-9]+]].2d, #0000000000000000
|
|
; CHECK-NEXT: str q[[REG]], [x0]
|
|
; CHECK-NEXT: ret
|
|
store volatile <8 x half> zeroinitializer, <8 x half>* %a
|
|
ret void
|
|
}
|
|
|
|
attributes #0 = { nounwind }
|