mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-02-23 20:29:30 +00:00
This is a follow-up to the FIXME that was added with D7474 ( http://reviews.llvm.org/rL229531 ). I thought this load folding bug had been made hard-to-hit, but it turns out to be very easy when targeting 32-bit x86 and causes a miscompile/crash in Wine: https://bugs.winehq.org/show_bug.cgi?id=38826 https://llvm.org/bugs/show_bug.cgi?id=22371#c25 The quick fix is to simply remove the scalar FP logical instructions from the load folding table in X86InstrInfo, but that causes us to miss load folds that should be possible when lowering fabs, fneg, fcopysign. So the majority of this patch is altering those lowerings to use *vector* FP logical instructions (because that's all x86 gives us anyway). That lets us do the load folding legally. Differential Revision: http://reviews.llvm.org/D11477 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@243361 91177308-0d34-0410-b5e6-96231b3b80d8
76 lines
2.3 KiB
LLVM
76 lines
2.3 KiB
LLVM
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=avx | FileCheck %s
|
|
|
|
|
|
define <2 x double> @fabs_v2f64(<2 x double> %p)
|
|
{
|
|
; CHECK-LABEL: fabs_v2f64
|
|
; CHECK: vandpd
|
|
%t = call <2 x double> @llvm.fabs.v2f64(<2 x double> %p)
|
|
ret <2 x double> %t
|
|
}
|
|
declare <2 x double> @llvm.fabs.v2f64(<2 x double> %p)
|
|
|
|
define <4 x float> @fabs_v4f32(<4 x float> %p)
|
|
{
|
|
; CHECK-LABEL: fabs_v4f32
|
|
; CHECK: vandps
|
|
%t = call <4 x float> @llvm.fabs.v4f32(<4 x float> %p)
|
|
ret <4 x float> %t
|
|
}
|
|
declare <4 x float> @llvm.fabs.v4f32(<4 x float> %p)
|
|
|
|
define <4 x double> @fabs_v4f64(<4 x double> %p)
|
|
{
|
|
; CHECK-LABEL: fabs_v4f64
|
|
; CHECK: vandpd
|
|
%t = call <4 x double> @llvm.fabs.v4f64(<4 x double> %p)
|
|
ret <4 x double> %t
|
|
}
|
|
declare <4 x double> @llvm.fabs.v4f64(<4 x double> %p)
|
|
|
|
define <8 x float> @fabs_v8f32(<8 x float> %p)
|
|
{
|
|
; CHECK-LABEL: fabs_v8f32
|
|
; CHECK: vandps
|
|
%t = call <8 x float> @llvm.fabs.v8f32(<8 x float> %p)
|
|
ret <8 x float> %t
|
|
}
|
|
declare <8 x float> @llvm.fabs.v8f32(<8 x float> %p)
|
|
|
|
; PR20354: when generating code for a vector fabs op,
|
|
; make sure that we're only turning off the sign bit of each float value.
|
|
; No constant pool loads or vector ops are needed for the fabs of a
|
|
; bitcasted integer constant; we should just return an integer constant
|
|
; that has the sign bits turned off.
|
|
;
|
|
; So instead of something like this:
|
|
; movabsq (constant pool load of mask for sign bits)
|
|
; vmovq (move from integer register to vector/fp register)
|
|
; vandps (mask off sign bits)
|
|
; vmovq (move vector/fp register back to integer return register)
|
|
;
|
|
; We should generate:
|
|
; mov (put constant value in return register)
|
|
|
|
define i64 @fabs_v2f32_1() {
|
|
; CHECK-LABEL: fabs_v2f32_1:
|
|
; CHECK: movabsq $9223372032559808512, %rax # imm = 0x7FFFFFFF00000000
|
|
; CHECK-NEXT: retq
|
|
%bitcast = bitcast i64 18446744069414584320 to <2 x float> ; 0xFFFF_FFFF_0000_0000
|
|
%fabs = call <2 x float> @llvm.fabs.v2f32(<2 x float> %bitcast)
|
|
%ret = bitcast <2 x float> %fabs to i64
|
|
ret i64 %ret
|
|
}
|
|
|
|
define i64 @fabs_v2f32_2() {
|
|
; CHECK-LABEL: fabs_v2f32_2:
|
|
; CHECK: movl $2147483647, %eax # imm = 0x7FFFFFFF
|
|
; CHECK-NEXT: retq
|
|
%bitcast = bitcast i64 4294967295 to <2 x float> ; 0x0000_0000_FFFF_FFFF
|
|
%fabs = call <2 x float> @llvm.fabs.v2f32(<2 x float> %bitcast)
|
|
%ret = bitcast <2 x float> %fabs to i64
|
|
ret i64 %ret
|
|
}
|
|
|
|
declare <2 x float> @llvm.fabs.v2f32(<2 x float> %p)
|