mirror of
				https://github.com/c64scene-ar/llvm-6502.git
				synced 2025-11-04 05:17:07 +00:00 
			
		
		
		
	what it does. Enhance it to return false for vector sign extensions of vector comparisons, which is the idiom used to get a splatted vector for a vector comparison. Doing this breaks vector-casts.ll, so add some compensating transformations to handle the important case they cover without depending on this canonicalization. This fixes rdar://7434900, a serious pessimization of vector compares. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@95855 91177308-0d34-0410-b5e6-96231b3b80d8
		
			
				
	
	
		
			124 lines
		
	
	
		
			3.4 KiB
		
	
	
	
		
			LLVM
		
	
	
	
	
	
			
		
		
	
	
			124 lines
		
	
	
		
			3.4 KiB
		
	
	
	
		
			LLVM
		
	
	
	
	
	
; RUN: opt < %s -instcombine -S | FileCheck %s
 | 
						|
 | 
						|
; test1: truncate each i64 lane of %a to i1.
; The FileCheck directives inside the body expect this to turn into
; (a & 1) != 0: an 'and' with a splat of 1 followed by an 'icmp ne'
; against zeroinitializer.
 | 
						|
define <2 x i1> @test1(<2 x i64> %a) {
 | 
						|
  %t = trunc <2 x i64> %a to <2 x i1>
 | 
						|
  ret <2 x i1> %t
 | 
						|
 | 
						|
; CHECK: @test1
 | 
						|
; CHECK:   and <2 x i64> %a, <i64 1, i64 1>
 | 
						|
; CHECK:   icmp ne <2 x i64> %tmp, zeroinitializer
 | 
						|
}
 | 
						|
 | 
						|
; test2: %a is masked with a splat of 65535 before being shifted right by 1.
; The FileCheck directives expect the mask to be kept and the ashr to be
; emitted as an lshr.
 | 
						|
define <2 x i64> @test2(<2 x i64> %a) {
 | 
						|
  %b = and <2 x i64> %a, <i64 65535, i64 65535>
 | 
						|
  %t = ashr <2 x i64> %b, <i64 1, i64 1>
 | 
						|
  ret <2 x i64> %t
 | 
						|
 | 
						|
; CHECK: @test2
 | 
						|
; CHECK:   and <2 x i64> %a, <i64 65535, i64 65535>
 | 
						|
; CHECK:   lshr <2 x i64> %b, <i64 1, i64 1>
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
 | 
						|
; test3: %a and %b are each compared 'fcmp ord' against zero, the two i1
; vectors are sign-extended to <4 x i32>, and-ed together, and the result is
; bitcast to <2 x i64>.
; The FileCheck directive expects a single 'fcmp ord' of %a against %b.
define <2 x i64> @test3(<4 x float> %a, <4 x float> %b) nounwind readnone {
 | 
						|
entry:
 | 
						|
	%cmp = fcmp ord <4 x float> %a, zeroinitializer	
 | 
						|
	%sext = sext <4 x i1> %cmp to <4 x i32>	
 | 
						|
	%cmp4 = fcmp ord <4 x float> %b, zeroinitializer
 | 
						|
	%sext5 = sext <4 x i1> %cmp4 to <4 x i32>
 | 
						|
	%and = and <4 x i32> %sext, %sext5
 | 
						|
	%conv = bitcast <4 x i32> %and to <2 x i64>
 | 
						|
	ret <2 x i64> %conv
 | 
						|
        
 | 
						|
; CHECK: @test3
 | 
						|
; CHECK:   fcmp ord <4 x float> %a, %b
 | 
						|
}
 | 
						|
 | 
						|
; test4: %a and %b are each compared 'fcmp uno' against zero, the two i1
; vectors are sign-extended to <4 x i32>, or-ed together, and the result is
; bitcast to <2 x i64>.
; The FileCheck directive expects a single 'fcmp uno' of %a against %b.
define <2 x i64> @test4(<4 x float> %a, <4 x float> %b) nounwind readnone {
 | 
						|
entry:
 | 
						|
	%cmp = fcmp uno <4 x float> %a, zeroinitializer
 | 
						|
	%sext = sext <4 x i1> %cmp to <4 x i32>
 | 
						|
	%cmp4 = fcmp uno <4 x float> %b, zeroinitializer
 | 
						|
	%sext5 = sext <4 x i1> %cmp4 to <4 x i32>
 | 
						|
	%or = or <4 x i32> %sext, %sext5
 | 
						|
	%conv = bitcast <4 x i32> %or to <2 x i64>
 | 
						|
	ret <2 x i64> %conv
 | 
						|
; CHECK: @test4
 | 
						|
; CHECK:   fcmp uno <4 x float> %a, %b
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
; rdar://7434900
; test5: same instruction sequence as test3 (compare against zero, sext,
; and, bitcast) but with the 'ult' predicate.
; The FileCheck directives expect both sext-of-compare instructions to be
; present in the output, in the order %cmp then %cmp4.
 | 
						|
define <2 x i64> @test5(<4 x float> %a, <4 x float> %b) nounwind readnone {
 | 
						|
entry:
 | 
						|
	%cmp = fcmp ult <4 x float> %a, zeroinitializer	
 | 
						|
	%sext = sext <4 x i1> %cmp to <4 x i32>	
 | 
						|
	%cmp4 = fcmp ult <4 x float> %b, zeroinitializer
 | 
						|
	%sext5 = sext <4 x i1> %cmp4 to <4 x i32>
 | 
						|
	%and = and <4 x i32> %sext, %sext5
 | 
						|
	%conv = bitcast <4 x i32> %and to <2 x i64>
 | 
						|
	ret <2 x i64> %conv
 | 
						|
        
 | 
						|
; CHECK: @test5
 | 
						|
; CHECK:   sext <4 x i1> %cmp to <4 x i32>	
 | 
						|
; CHECK:   sext <4 x i1> %cmp4 to <4 x i32>	
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
; convert: truncates %src from <2 x i64> to <2 x i32>, adds 1 to each lane,
; and stores the result through %dst.addr.
; No FileCheck directives are attached to this function, so its output is not
; pattern-matched.
; NOTE(review): presumably a "does not crash" regression case - confirm
; against the commit that introduced it.
define void @convert(<2 x i32>* %dst.addr, <2 x i64> %src) nounwind {
 | 
						|
entry:
 | 
						|
  %val = trunc <2 x i64> %src to <2 x i32>
 | 
						|
  %add = add <2 x i32> %val, <i32 1, i32 1>
 | 
						|
  store <2 x i32> %add, <2 x i32>* %dst.addr
 | 
						|
  ret void
 | 
						|
}
 | 
						|
 | 
						|
; foo: trunc <2 x i64> to <2 x i32>, then zext to <2 x i65>, so the result
; element type is wider than the source element type.
; No FileCheck directives are attached; the output is not pattern-matched.
define <2 x i65> @foo(<2 x i64> %t) {
 | 
						|
  %a = trunc <2 x i64> %t to <2 x i32>
 | 
						|
  %b = zext <2 x i32> %a to <2 x i65>
 | 
						|
  ret <2 x i65> %b
 | 
						|
}
 | 
						|
; bar: trunc <2 x i65> to <2 x i32>, then zext to <2 x i64>, so the result
; element type is narrower than the source element type.
; No FileCheck directives are attached; the output is not pattern-matched.
define <2 x i64> @bar(<2 x i65> %t) {
 | 
						|
  %a = trunc <2 x i65> %t to <2 x i32>
 | 
						|
  %b = zext <2 x i32> %a to <2 x i64>
 | 
						|
  ret <2 x i64> %b
 | 
						|
}
 | 
						|
; foos: signed counterpart of @foo - trunc <2 x i64> to <2 x i32>, then sext
; to <2 x i65>.
; No FileCheck directives are attached; the output is not pattern-matched.
define <2 x i65> @foos(<2 x i64> %t) {
 | 
						|
  %a = trunc <2 x i64> %t to <2 x i32>
 | 
						|
  %b = sext <2 x i32> %a to <2 x i65>
 | 
						|
  ret <2 x i65> %b
 | 
						|
}
 | 
						|
; bars: signed counterpart of @bar - trunc <2 x i65> to <2 x i32>, then sext
; to <2 x i64>.
; No FileCheck directives are attached; the output is not pattern-matched.
define <2 x i64> @bars(<2 x i65> %t) {
 | 
						|
  %a = trunc <2 x i65> %t to <2 x i32>
 | 
						|
  %b = sext <2 x i32> %a to <2 x i64>
 | 
						|
  ret <2 x i64> %b
 | 
						|
}
 | 
						|
; quxs: trunc <2 x i64> to <2 x i32>, then sext back to <2 x i64>; source and
; result element types are the same width.
; No FileCheck directives are attached; the output is not pattern-matched.
define <2 x i64> @quxs(<2 x i64> %t) {
 | 
						|
  %a = trunc <2 x i64> %t to <2 x i32>
 | 
						|
  %b = sext <2 x i32> %a to <2 x i64>
 | 
						|
  ret <2 x i64> %b
 | 
						|
}
 | 
						|
; quxt: shifts each i64 lane left by 32 and then arithmetic-shifts it right
; by 32, i.e. the shift-pair form of sign-extending the low 32 bits.
; No FileCheck directives are attached; the output is not pattern-matched.
define <2 x i64> @quxt(<2 x i64> %t) {
 | 
						|
  %a = shl <2 x i64> %t, <i64 32, i64 32>
 | 
						|
  %b = ashr <2 x i64> %a, <i64 32, i64 32>
 | 
						|
  ret <2 x i64> %b
 | 
						|
}
 | 
						|
; fa: fptrunc <2 x double> to <2 x float>, then fpext back to <2 x double>.
; No FileCheck directives are attached; the output is not pattern-matched.
define <2 x double> @fa(<2 x double> %t) {
 | 
						|
  %a = fptrunc <2 x double> %t to <2 x float>
 | 
						|
  %b = fpext <2 x float> %a to <2 x double>
 | 
						|
  ret <2 x double> %b
 | 
						|
}
 | 
						|
; fb: fptoui <2 x double> to <2 x i64>, then uitofp back to <2 x double>.
; No FileCheck directives are attached; the output is not pattern-matched.
define <2 x double> @fb(<2 x double> %t) {
 | 
						|
  %a = fptoui <2 x double> %t to <2 x i64>
 | 
						|
  %b = uitofp <2 x i64> %a to <2 x double>
 | 
						|
  ret <2 x double> %b
 | 
						|
}
 | 
						|
; fc: signed counterpart of @fb - fptosi <2 x double> to <2 x i64>, then
; sitofp back to <2 x double>.
; No FileCheck directives are attached; the output is not pattern-matched.
define <2 x double> @fc(<2 x double> %t) {
 | 
						|
  %a = fptosi <2 x double> %t to <2 x i64>
 | 
						|
  %b = sitofp <2 x i64> %a to <2 x double>
 | 
						|
  ret <2 x double> %b
 | 
						|
}
 |