mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-01-15 23:31:37 +00:00
8603a3d1c5
Only do for f32 since I'm unclear on both what this is expecting for the refinement steps in terms of accuracy, and what f64 instruction actually provides. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@225827 91177308-0d34-0410-b5e6-96231b3b80d8
28 lines
964 B
LLVM
28 lines
964 B
LLVM
; RUN: llc -march=amdgcn -mcpu=tahiti -verify-machineinstrs < %s | FileCheck %s
|
|
; RUN: llc -march=amdgcn -mcpu=tahiti -verify-machineinstrs -enable-unsafe-fp-math < %s | FileCheck %s
|
|
|
|
; Run with unsafe-fp-math to make sure nothing tries to turn this into 1 / rsqrt(x)
|
|
|
|
; CHECK: {{^}}fsqrt_f32:
|
|
; CHECK: v_sqrt_f32_e32 {{v[0-9]+, v[0-9]+}}
|
|
|
|
; Single-precision case: read one float through %in, take its square root
; with the llvm.sqrt.f32 intrinsic, and write the result through %out.
; Both pointers are in address space 1.
define void @fsqrt_f32(float addrspace(1)* %out, float addrspace(1)* %in) {
  %x = load float addrspace(1)* %in
  %root = call float @llvm.sqrt.f32(float %x)
  store float %root, float addrspace(1)* %out
  ret void
}
|
|
|
|
; CHECK: {{^}}fsqrt_f64:
|
|
; CHECK: v_sqrt_f64_e32 {{v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\]}}
|
|
|
|
; Double-precision case: read one double through %in, take its square root
; with the llvm.sqrt.f64 intrinsic, and write the result through %out.
; Both pointers are in address space 1.
define void @fsqrt_f64(double addrspace(1)* %out, double addrspace(1)* %in) {
  %x = load double addrspace(1)* %in
  %root = call double @llvm.sqrt.f64(double %x)
  store double %root, double addrspace(1)* %out
  ret void
}
|
|
|
|
; Square-root intrinsics called by the two test functions in this file.
declare float @llvm.sqrt.f32(float)
declare double @llvm.sqrt.f64(double)
|