mirror of
				https://github.com/c64scene-ar/llvm-6502.git
				synced 2025-10-30 16:17:05 +00:00 
			
		
		
		
	r238842 added the TargetRecip system for controlling use of reciprocal estimates for sqrt and division using a set of parameters that can be set by the frontend. Clang now supports a sophisticated -mrecip option, and this will allow that option to effectively control the relevant code-generation functionality of the PPC backend. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@241985 91177308-0d34-0410-b5e6-96231b3b80d8
		
			
				
	
	
		
			255 lines
		
	
	
		
			5.1 KiB
		
	
	
	
		
			LLVM
		
	
	
	
	
	
			
		
		
	
	
			255 lines
		
	
	
		
			5.1 KiB
		
	
	
	
		
			LLVM
		
	
	
	
	
	
; Reciprocal-estimate lowering tests for sqrt and fdiv on powerpc64 (pwr7, VSX
; disabled). llc is invoked three times; each invocation is verified under its
; own FileCheck prefix:
;   CHECK       -enable-unsafe-fp-math
;   CHECK-NONR  -enable-unsafe-fp-math together with -recip=sqrtf:0,sqrtd:0
;               (presumably zero refinement steps; the checks under this prefix
;               expect the estimate instruction and no fmadd)
;   CHECK-SAFE  no unsafe-fp-math flag; the checks expect real sqrt/div
;               instructions and no estimate instructions
; RUN: llc < %s -mtriple=powerpc64-unknown-linux-gnu -mcpu=pwr7 -enable-unsafe-fp-math -mattr=-vsx | FileCheck %s
; RUN: llc < %s -mtriple=powerpc64-unknown-linux-gnu -mcpu=pwr7 -enable-unsafe-fp-math -mattr=-vsx -recip=sqrtf:0,sqrtd:0 | FileCheck %s -check-prefix=CHECK-NONR
; RUN: llc < %s -mtriple=powerpc64-unknown-linux-gnu -mcpu=pwr7 -mattr=-vsx | FileCheck -check-prefix=CHECK-SAFE %s

target datalayout = "E-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-f128:128:128-v128:128:128-n32:64"
target triple = "powerpc64-unknown-linux-gnu"

; Square-root intrinsics used by the functions in this file.
declare float @llvm.sqrt.f32(float)
declare double @llvm.sqrt.f64(double)
declare <4 x float> @llvm.sqrt.v4f32(<4 x float>)
 | |
| 
 | |
; foo: double-precision a / sqrt(b).
;   default prefix - frsqrte plus a chain of fmul/fmadd instructions
;   NONR prefix    - frsqrte and fmul, with no fmadd on either side of the fmul
;   SAFE prefix    - an fsqrt followed by an fdiv
define double @foo(double %a, double %b) nounwind {
  %root = call double @llvm.sqrt.f64(double %b)
  %quot = fdiv double %a, %root
  ret double %quot

; CHECK: @foo
; CHECK-DAG: frsqrte
; CHECK-DAG: fnmsub
; CHECK: fmul
; CHECK-NEXT: fmadd
; CHECK-NEXT: fmul
; CHECK-NEXT: fmul
; CHECK-NEXT: fmadd
; CHECK-NEXT: fmul
; CHECK-NEXT: fmul
; CHECK: blr

; CHECK-NONR: @foo
; CHECK-NONR: frsqrte
; CHECK-NONR-NOT: fmadd
; CHECK-NONR: fmul
; CHECK-NONR-NOT: fmadd
; CHECK-NONR: blr

; CHECK-SAFE: @foo
; CHECK-SAFE: fsqrt
; CHECK-SAFE: fdiv
; CHECK-SAFE: blr
}
 | |
| 
 | |
; foof: the square root is taken in single precision, widened to double with
; fpext, and then used as the divisor of a double-precision fdiv.
;   default prefix - single-precision estimate sequence (frsqrtes, fnmsubs,
;                    fmuls, fmadds) finished by a double-precision fmul
;   SAFE prefix    - an fsqrts followed by an fdiv
define double @foof(double %a, float %b) nounwind {
  %root = call float @llvm.sqrt.f32(float %b)
  %wide = fpext float %root to double
  %quot = fdiv double %a, %wide
  ret double %quot

; CHECK: @foof
; CHECK-DAG: frsqrtes
; CHECK-DAG: fnmsubs
; CHECK: fmuls
; CHECK-NEXT: fmadds
; CHECK-NEXT: fmuls
; CHECK-NEXT: fmul
; CHECK-NEXT: blr

; CHECK-SAFE: @foof
; CHECK-SAFE: fsqrts
; CHECK-SAFE: fdiv
; CHECK-SAFE: blr
}
 | |
| 
 | |
; food: the square root is taken in double precision, narrowed to float with
; fptrunc, and then used as the divisor of a single-precision fdiv.
;   default prefix - double-precision estimate sequence (frsqrte, fnmsub, fmul,
;                    fmadd), then frsp and a final fmuls
;   SAFE prefix    - an fsqrt followed by an fdivs
;
; The function-anchor checks below name @food in full. They previously looked
; for "@foo", which only matched here because it is a substring of "@food";
; that left the anchor not tied to this function.
define float @food(float %a, double %b) nounwind {
  %x = call double @llvm.sqrt.f64(double %b)
  %y = fptrunc double %x to float
  %r = fdiv float %a, %y
  ret float %r

; CHECK: @food
; CHECK-DAG: frsqrte
; CHECK-DAG: fnmsub
; CHECK: fmul
; CHECK-NEXT: fmadd
; CHECK-NEXT: fmul
; CHECK-NEXT: fmul
; CHECK-NEXT: fmadd
; CHECK-NEXT: fmul
; CHECK-NEXT: frsp
; CHECK-NEXT: fmuls
; CHECK-NEXT: blr

; CHECK-SAFE: @food
; CHECK-SAFE: fsqrt
; CHECK-SAFE: fdivs
; CHECK-SAFE: blr
}
 | |
| 
 | |
; goo: single-precision a / sqrt(b).
;   default prefix - frsqrtes plus fnmsubs/fmuls/fmadds, ending in blr
;   NONR prefix    - frsqrtes and fmuls, with no fmadds on either side
;   SAFE prefix    - an fsqrts followed by an fdivs
define float @goo(float %a, float %b) nounwind {
  %root = call float @llvm.sqrt.f32(float %b)
  %quot = fdiv float %a, %root
  ret float %quot

; CHECK: @goo
; CHECK-DAG: frsqrtes
; CHECK-DAG: fnmsubs
; CHECK: fmuls
; CHECK-NEXT: fmadds
; CHECK-NEXT: fmuls
; CHECK-NEXT: fmuls
; CHECK-NEXT: blr

; CHECK-NONR: @goo
; CHECK-NONR: frsqrtes
; CHECK-NONR-NOT: fmadds
; CHECK-NONR: fmuls
; CHECK-NONR-NOT: fmadds
; CHECK-NONR: blr

; CHECK-SAFE: @goo
; CHECK-SAFE: fsqrts
; CHECK-SAFE: fdivs
; CHECK-SAFE: blr
}
 | |
| 
 | |
; rsqrt_fmul: computes c / (sqrt(a) * b).
; This should be recognized as rsqrt(a) * rcp(b) * c,
; not as 1 / ( 1 / sqrt(a)) * rcp(b) * c.
;   default prefix - both estimate instructions (frsqrtes and fres) with their
;                    fnmsubs/fmadds/fmuls companions, then three fmuls and blr
;   SAFE prefix    - fsqrts, fmuls and fdivs
define float @rsqrt_fmul(float %a, float %b, float %c) {
  %root = call float @llvm.sqrt.f32(float %a)
  %denom = fmul float %root, %b
  %quot = fdiv float %c, %denom
  ret float %quot

; CHECK: @rsqrt_fmul
; CHECK-DAG: frsqrtes
; CHECK-DAG: fres
; CHECK-DAG: fnmsubs
; CHECK-DAG: fmuls
; CHECK-DAG: fnmsubs
; CHECK-DAG: fmadds
; CHECK-DAG: fmadds
; CHECK: fmuls
; CHECK-NEXT: fmuls
; CHECK-NEXT: fmuls
; CHECK-NEXT: blr

; CHECK-SAFE: @rsqrt_fmul
; CHECK-SAFE: fsqrts
; CHECK-SAFE: fmuls
; CHECK-SAFE: fdivs
; CHECK-SAFE: blr
}
 | |
| 
 | |
; hoo: <4 x float> a / sqrt(b).
;   default prefix - the vector estimate instruction vrsqrtefp must appear
;   SAFE prefix    - vrsqrtefp must not appear before the blr
define <4 x float> @hoo(<4 x float> %a, <4 x float> %b) nounwind {
  %root = call <4 x float> @llvm.sqrt.v4f32(<4 x float> %b)
  %quot = fdiv <4 x float> %a, %root
  ret <4 x float> %quot

; CHECK: @hoo
; CHECK: vrsqrtefp

; CHECK-SAFE: @hoo
; CHECK-SAFE-NOT: vrsqrtefp
; CHECK-SAFE: blr
}
 | |
| 
 | |
; foo2: plain double-precision division a / b (no square root involved).
;   default prefix - fre with an fnmsub/fmadd sequence, a final fmul, then blr
;   SAFE prefix    - an fdiv
define double @foo2(double %a, double %b) nounwind {
  %quot = fdiv double %a, %b
  ret double %quot

; CHECK: @foo2
; CHECK-DAG: fre
; CHECK-DAG: fnmsub
; CHECK: fmadd
; CHECK-NEXT: fnmsub
; CHECK-NEXT: fmadd
; CHECK-NEXT: fmul
; CHECK-NEXT: blr

; CHECK-SAFE: @foo2
; CHECK-SAFE: fdiv
; CHECK-SAFE: blr
}
 | |
| 
 | |
; goo2: plain single-precision division a / b (no square root involved).
;   default prefix - fres and fnmsubs, then fmadds, fmuls and blr
;   SAFE prefix    - an fdivs
define float @goo2(float %a, float %b) nounwind {
  %quot = fdiv float %a, %b
  ret float %quot

; CHECK: @goo2
; CHECK-DAG: fres
; CHECK-DAG: fnmsubs
; CHECK: fmadds
; CHECK-NEXT: fmuls
; CHECK-NEXT: blr

; CHECK-SAFE: @goo2
; CHECK-SAFE: fdivs
; CHECK-SAFE: blr
}
 | |
| 
 | |
; hoo2: plain <4 x float> division a / b (no square root involved).
;   default prefix - the vector estimate instruction vrefp must appear
;   SAFE prefix    - vrefp must not appear before the blr
define <4 x float> @hoo2(<4 x float> %a, <4 x float> %b) nounwind {
  %quot = fdiv <4 x float> %a, %b
  ret <4 x float> %quot

; CHECK: @hoo2
; CHECK: vrefp

; CHECK-SAFE: @hoo2
; CHECK-SAFE-NOT: vrefp
; CHECK-SAFE: blr
}
 | |
| 
 | |
; foo3: double-precision sqrt(a) on its own (no division).
;   default prefix - an fcmpu, then frsqrte with a chain of fmul/fmadd
;   SAFE prefix    - an fsqrt
define double @foo3(double %a) nounwind {
  %root = call double @llvm.sqrt.f64(double %a)
  ret double %root

; CHECK: @foo3
; CHECK: fcmpu
; CHECK-DAG: frsqrte
; CHECK-DAG: fnmsub
; CHECK: fmul
; CHECK-NEXT: fmadd
; CHECK-NEXT: fmul
; CHECK-NEXT: fmul
; CHECK-NEXT: fmadd
; CHECK-NEXT: fmul
; CHECK-NEXT: fmul
; CHECK: blr

; CHECK-SAFE: @foo3
; CHECK-SAFE: fsqrt
; CHECK-SAFE: blr
}
 | |
| 
 | |
; goo3: single-precision sqrt(a) on its own (no division).
;   default prefix - an fcmpu, then frsqrtes with fnmsubs/fmuls/fmadds
;   SAFE prefix    - an fsqrts
define float @goo3(float %a) nounwind {
  %root = call float @llvm.sqrt.f32(float %a)
  ret float %root

; CHECK: @goo3
; CHECK: fcmpu
; CHECK-DAG: frsqrtes
; CHECK-DAG: fnmsubs
; CHECK: fmuls
; CHECK-NEXT: fmadds
; CHECK-NEXT: fmuls
; CHECK-NEXT: fmuls
; CHECK: blr

; CHECK-SAFE: @goo3
; CHECK-SAFE: fsqrts
; CHECK-SAFE: blr
}
 | |
| 
 | |
; hoo3: <4 x float> sqrt(a) on its own (no division).
;   default prefix - vrsqrtefp and a vcmpeqfp must appear
;   SAFE prefix    - vrsqrtefp must not appear before the blr
define <4 x float> @hoo3(<4 x float> %a) nounwind {
  %root = call <4 x float> @llvm.sqrt.v4f32(<4 x float> %a)
  ret <4 x float> %root

; CHECK: @hoo3
; CHECK: vrsqrtefp
; CHECK-DAG: vcmpeqfp

; CHECK-SAFE: @hoo3
; CHECK-SAFE-NOT: vrsqrtefp
; CHECK-SAFE: blr
}
 | |
| 
 |