mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-11-23 00:20:25 +00:00
ARM: ensure fixed-point conversions have sane types
We were generating intrinsics for NEON fixed-point conversions that didn't
exist (e.g. float -> i16). There are two cases to consider:
+ iN is smaller than float. In this case we can do the conversion but need an
extend or truncate as well.
+ iN is larger than float. In this case using the NEON conversion would be
incorrect so we don't perform any combining.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@185158 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
@@ -156,3 +156,44 @@ define <4 x i16> @vcvt_f32tof16(<4 x float>* %A) nounwind {
|
||||
|
||||
declare <4 x float> @llvm.arm.neon.vcvthf2fp(<4 x i16>) nounwind readnone
|
||||
declare <4 x i16> @llvm.arm.neon.vcvtfp2hf(<4 x float>) nounwind readnone
|
||||
|
||||
|
||||
define <4 x i16> @fix_float_to_i16(<4 x float> %in) {
|
||||
; CHECK: fix_float_to_i16:
|
||||
; CHECK: vcvt.u32.f32 [[TMP:q[0-9]+]], {{q[0-9]+}}, #1
|
||||
; CHECK: vmovn.i32 {{d[0-9]+}}, [[TMP]]
|
||||
|
||||
%scale = fmul <4 x float> %in, <float 2.0, float 2.0, float 2.0, float 2.0>
|
||||
%conv = fptoui <4 x float> %scale to <4 x i16>
|
||||
ret <4 x i16> %conv
|
||||
}
|
||||
|
||||
define <2 x i64> @fix_float_to_i64(<2 x float> %in) {
|
||||
; CHECK: fix_float_to_i64:
|
||||
; CHECK: bl
|
||||
; CHECK: bl
|
||||
|
||||
%scale = fmul <2 x float> %in, <float 2.0, float 2.0>
|
||||
%conv = fptoui <2 x float> %scale to <2 x i64>
|
||||
ret <2 x i64> %conv
|
||||
}
|
||||
|
||||
define <4 x i16> @fix_double_to_i16(<4 x double> %in) {
|
||||
; CHECK: fix_double_to_i16:
|
||||
; CHECK: vcvt.s32.f64
|
||||
; CHECK: vcvt.s32.f64
|
||||
|
||||
%scale = fmul <4 x double> %in, <double 2.0, double 2.0, double 2.0, double 2.0>
|
||||
%conv = fptoui <4 x double> %scale to <4 x i16>
|
||||
ret <4 x i16> %conv
|
||||
}
|
||||
|
||||
define <2 x i64> @fix_double_to_i64(<2 x double> %in) {
|
||||
; CHECK: fix_double_to_i64:
|
||||
; CHECK: bl
|
||||
; CHECK: bl
|
||||
%scale = fmul <2 x double> %in, <double 2.0, double 2.0>
|
||||
%conv = fptoui <2 x double> %scale to <2 x i64>
|
||||
ret <2 x i64> %conv
|
||||
}
|
||||
|
||||
|
||||
@@ -95,3 +95,44 @@ entry:
|
||||
}
|
||||
|
||||
declare void @foo_float32x4_t(<4 x float>)
|
||||
|
||||
define <4 x float> @fix_unsigned_i16_to_float(<4 x i16> %in) {
|
||||
; CHECK: fix_unsigned_i16_to_float:
|
||||
; CHECK: vmovl.u16 [[TMP:q[0-9]+]], {{d[0-9]+}}
|
||||
; CHECK: vcvt.f32.u32 {{q[0-9]+}}, [[TMP]], #1
|
||||
|
||||
%conv = uitofp <4 x i16> %in to <4 x float>
|
||||
%shift = fdiv <4 x float> %conv, <float 2.0, float 2.0, float 2.0, float 2.0>
|
||||
ret <4 x float> %shift
|
||||
}
|
||||
|
||||
define <4 x float> @fix_signed_i16_to_float(<4 x i16> %in) {
|
||||
; CHECK: fix_signed_i16_to_float:
|
||||
; CHECK: vmovl.s16 [[TMP:q[0-9]+]], {{d[0-9]+}}
|
||||
; CHECK: vcvt.f32.s32 {{q[0-9]+}}, [[TMP]], #1
|
||||
|
||||
%conv = sitofp <4 x i16> %in to <4 x float>
|
||||
%shift = fdiv <4 x float> %conv, <float 2.0, float 2.0, float 2.0, float 2.0>
|
||||
ret <4 x float> %shift
|
||||
}
|
||||
|
||||
define <2 x float> @fix_i64_to_float(<2 x i64> %in) {
|
||||
; CHECK: fix_i64_to_float:
|
||||
; CHECK: bl
|
||||
; CHECK: bl
|
||||
|
||||
%conv = uitofp <2 x i64> %in to <2 x float>
|
||||
%shift = fdiv <2 x float> %conv, <float 2.0, float 2.0>
|
||||
ret <2 x float> %shift
|
||||
}
|
||||
|
||||
define <2 x double> @fix_i64_to_double(<2 x i64> %in) {
|
||||
; CHECK: fix_i64_to_double:
|
||||
; CHECK: bl
|
||||
; CHECK: bl
|
||||
|
||||
%conv = uitofp <2 x i64> %in to <2 x double>
|
||||
%shift = fdiv <2 x double> %conv, <double 2.0, double 2.0>
|
||||
ret <2 x double> %shift
|
||||
}
|
||||
|
||||
|
||||
Reference in New Issue
Block a user