mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-01-17 21:35:07 +00:00
e573fb3255
The previous codegen for the slow path (when values are in VFP / NEON registers) was incorrect if the source is NaN. The new codegen uses NEON vbsl instruction to copy the sign bit. e.g. vmov.i32 d1, #0x80000000 vbsl d1, d2, d0 If NEON is not available, it uses integer instructions to copy the sign bit. rdar://9034702 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@126295 91177308-0d34-0410-b5e6-96231b3b80d8
45 lines
1.2 KiB
LLVM
45 lines
1.2 KiB
LLVM
; RUN: llc < %s -mtriple=armv7-apple-darwin -mcpu=cortex-a8 | FileCheck %s -check-prefix=SOFT
|
|
; RUN: llc < %s -mtriple=armv7-gnueabi -float-abi=hard -mcpu=cortex-a8 | FileCheck %s -check-prefix=HARD
|
|
|
|
; rdar://8984306
|
|
define float @test1(float %x, float %y) nounwind {
|
|
entry:
|
|
; SOFT: test1:
|
|
; SOFT: lsr r1, r1, #31
|
|
; SOFT: bfi r0, r1, #31, #1
|
|
|
|
; HARD: test1:
|
|
; HARD: vmov.i32 [[REG1:(d[0-9]+)]], #0x80000000
|
|
; HARD: vbsl [[REG1]], d2, d0
|
|
%0 = tail call float @copysignf(float %x, float %y) nounwind
|
|
ret float %0
|
|
}
|
|
|
|
define double @test2(double %x, double %y) nounwind {
|
|
entry:
|
|
; SOFT: test2:
|
|
; SOFT: lsr r2, r3, #31
|
|
; SOFT: bfi r1, r2, #31, #1
|
|
|
|
; HARD: test2:
|
|
; HARD: vmov.i32 [[REG2:(d[0-9]+)]], #0x80000000
|
|
; HARD: vshl.i64 [[REG2]], [[REG2]], #32
|
|
; HARD: vbsl [[REG2]], d1, d0
|
|
%0 = tail call double @copysign(double %x, double %y) nounwind
|
|
ret double %0
|
|
}
|
|
|
|
define double @test3(double %x, double %y, double %z) nounwind {
|
|
entry:
|
|
; SOFT: test3:
|
|
; SOFT: vmov.i32 [[REG3:(d[0-9]+)]], #0x80000000
|
|
; SOFT: vshl.i64 [[REG3]], [[REG3]], #32
|
|
; SOFT: vbsl [[REG3]],
|
|
%0 = fmul double %x, %y
|
|
%1 = tail call double @copysign(double %0, double %z) nounwind
|
|
ret double %1
|
|
}
|
|
|
|
declare double @copysign(double, double) nounwind
|
|
declare float @copysignf(float, float) nounwind
|