mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-01-17 21:35:07 +00:00
d7d003c2b7
Machine CSE and other optimizations can remove instructions, so folding may be possible at peephole time even when it was not possible at ISel. This patch is a rework of r160919 and was tested with a clang self-host on my local machine. rdar://10554090 and rdar://11873276. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@161152 91177308-0d34-0410-b5e6-96231b3b80d8
63 lines
1.5 KiB
LLVM
63 lines
1.5 KiB
LLVM
; RUN: llc < %s -mtriple=x86_64-linux -mattr=+sse2 -mcpu=nehalem | FileCheck %s
; RUN: llc < %s -mtriple=x86_64-win32 -mattr=+sse2 -mcpu=nehalem | FileCheck %s
;
; Exercises x86-64 scalar SSE code generation for fpext, fptrunc and sqrt of a
; value loaded from memory. Each function's FileCheck patterns state whether
; the load is expected as a separate movss or folded into the instruction's
; memory operand. The same patterns are run against a Linux and a Win32 triple.
|
|
|
|
; t1: load a float through %x and extend it to double. The function is not
; marked optsize, and the FileCheck patterns expect a separate movss load
; followed by a register-to-register cvtss2sd. The movss pattern also binds A0
; to the register holding the pointer argument (%rdi or %rcx, depending on the
; triple being run) so that later patterns in this file can refer to it.
define double @t1(float* nocapture %x) nounwind readonly ssp {
entry:
; CHECK: t1:
; CHECK: movss ([[A0:%rdi|%rcx]]), %xmm0
; CHECK: cvtss2sd %xmm0, %xmm0

  %0 = load float* %x, align 4
  %1 = fpext float %0 to double
  ret double %1
}
|
|
|
|
; t2: load a double through %x and truncate it to float. The function is
; marked optsize, and the FileCheck pattern expects the load to be folded into
; cvtsd2ss as a memory operand. A0 is the register bound by the movss pattern
; in @t1.
define float @t2(double* nocapture %x) nounwind readonly ssp optsize {
entry:
; CHECK: t2:
; CHECK: cvtsd2ss ([[A0]]), %xmm0
  %0 = load double* %x, align 8
  %1 = fptrunc double %0 to float
  ret float %1
}
|
|
|
|
; squirtf: single-precision square root of the float loaded through %x. The
; function is not marked optsize, and the FileCheck patterns expect a separate
; movss load followed by a register-to-register sqrtss. A0 is the register
; bound by the movss pattern in @t1.
define float @squirtf(float* %x) nounwind {
entry:
; CHECK: squirtf:
; CHECK: movss ([[A0]]), %xmm0
; CHECK: sqrtss %xmm0, %xmm0
  %z = load float* %x
  %t = call float @llvm.sqrt.f32(float %z)
  ret float %t
}
|
|
|
|
; squirt: double-precision square root of the double loaded through %x. The
; function is not marked optsize; the FileCheck pattern nevertheless expects
; the load to appear as the memory operand of sqrtsd. A0 is the register bound
; by the movss pattern in @t1.
define double @squirt(double* %x) nounwind {
entry:
; CHECK: squirt:
; CHECK: sqrtsd ([[A0]]), %xmm0
  %z = load double* %x
  %t = call double @llvm.sqrt.f64(double %z)
  ret double %t
}
|
|
|
|
; squirtf_size: same body as @squirtf but marked optsize. Here the FileCheck
; pattern expects the load to be folded into sqrtss as a memory operand rather
; than emitted as a separate movss. A0 is the register bound by the movss
; pattern in @t1.
define float @squirtf_size(float* %x) nounwind optsize {
entry:
; CHECK: squirtf_size:
; CHECK: sqrtss ([[A0]]), %xmm0
  %z = load float* %x
  %t = call float @llvm.sqrt.f32(float %z)
  ret float %t
}
|
|
|
|
; squirt_size: same body as @squirt but marked optsize. The FileCheck pattern
; expects the load to appear as the memory operand of sqrtsd. A0 is the
; register bound by the movss pattern in @t1.
define double @squirt_size(double* %x) nounwind optsize {
entry:
; CHECK: squirt_size:
; CHECK: sqrtsd ([[A0]]), %xmm0
  %z = load double* %x
  %t = call double @llvm.sqrt.f64(double %z)
  ret double %t
}
|
|
|
|
; Declarations of the sqrt intrinsics called by the squirt* functions.
declare float @llvm.sqrt.f32(float)
declare double @llvm.sqrt.f64(double)
|