mirror of
				https://github.com/c64scene-ar/llvm-6502.git
				synced 2025-11-03 14:21:30 +00:00 
			
		
		
		
	The C and C++ semantics for compare_exchange require it to return a bool
indicating success. This gets mapped to LLVM IR which follows each cmpxchg with
an icmp of the value loaded against the expected (comparison) value.
When lowered to ldxr/stxr loops, this extra comparison is redundant: its
results are implicit in the control-flow of the function.
This commit makes two changes: it replaces that icmp with appropriate PHI
nodes, and then makes sure earlyCSE is called after expansion to actually make
use of the opportunities revealed.
I've also added -{arm,aarch64}-enable-atomic-tidy options (the ARM RUN lines in this test spell the flag -arm-atomic-cfg-tidy), so that
existing fragile tests aren't perturbed too much by the change. Many
of them either rely on undef/unreachable too pervasively to be
restored to something well-defined (particularly while making sure
they test the same obscure assert from many years ago), or depend on a
particular CFG shape, which is disrupted by SimplifyCFG.
rdar://problem/16227836
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@209883 91177308-0d34-0410-b5e6-96231b3b80d8
		
	
		
			
				
	
	
		
			182 lines
		
	
	
		
			4.8 KiB
		
	
	
	
		
			LLVM
		
	
	
	
	
	
			
		
		
	
	
			182 lines
		
	
	
		
			4.8 KiB
		
	
	
	
		
			LLVM
		
	
	
	
	
	
; RUN: llc < %s -mtriple=armv6-apple-ios5.0 -mattr=+vfp2 -arm-atomic-cfg-tidy=0 | FileCheck %s -check-prefix=CHECKV6
 | 
						|
; RUN: llc < %s -mtriple=thumbv7-apple-ios5.0 -arm-atomic-cfg-tidy=0 | FileCheck %s -check-prefix=CHECKT2D
 | 
						|
; RUN: llc < %s -mtriple=armv6-linux-gnueabi -relocation-model=pic -mattr=+vfp2 -arm-atomic-cfg-tidy=0 \
 | 
						|
; RUN:    | FileCheck %s -check-prefix=CHECKELF
 | 
						|
 | 
						|
; Enable tailcall optimization for iOS 5.0
 | 
						|
; rdar://9120031
 | 
						|
 | 
						|
; Weak global holding a pointer to an `i32 ()` function, initialised to null.
; @t2 loads this pointer and tail-calls through it.
@t = weak global i32 ()* null           ; <i32 ()**> [#uses=1]
 | 
						|
 | 
						|
; External callee taking four i32 arguments; called (not tail-called) by @t1.
declare void @g(i32, i32, i32, i32)
 | 
						|
 | 
						|
; t1 makes a plain (non-tail) call to @g with four i32 constants and then
; returns void. Only the CHECKELF prefix inspects this function; it expects
; the call to be emitted as `bl g(PLT)`.
define void @t1() {
 | 
						|
; CHECKELF-LABEL: t1:
 | 
						|
; CHECKELF: bl g(PLT)
 | 
						|
        call void @g( i32 1, i32 2, i32 3, i32 4 )
 | 
						|
        ret void
 | 
						|
}
 | 
						|
 | 
						|
; t2 loads the function pointer stored in @t and tail-calls it, discarding the
; i32 result before returning void. The CHECKV6 prefix expects an indirect
; branch `bx r0`; the CHECKT2D prefix expects two `ldr` instructions on
; consecutive lines immediately followed by `bx r0`.
define void @t2() {
 | 
						|
; CHECKV6-LABEL: t2:
 | 
						|
; CHECKV6: bx r0
 | 
						|
; CHECKT2D-LABEL: t2:
 | 
						|
; CHECKT2D: ldr
 | 
						|
; CHECKT2D-NEXT: ldr
 | 
						|
; CHECKT2D-NEXT: bx r0
 | 
						|
        %tmp = load i32 ()** @t         ; <i32 ()*> [#uses=1]
 | 
						|
        %tmp.upgrd.2 = tail call i32 %tmp( )            ; <i32> [#uses=0]
 | 
						|
        ret void
 | 
						|
}
 | 
						|
 | 
						|
; t3 makes a direct tail call to @t2 and returns void. Every prefix expects a
; branch rather than a call: `b _t2` for CHECKV6, `b t2(PLT)` for CHECKELF and
; `b.w _t2` for CHECKT2D.
define void @t3() {
 | 
						|
; CHECKV6-LABEL: t3:
 | 
						|
; CHECKV6: b _t2
 | 
						|
; CHECKELF-LABEL: t3:
 | 
						|
; CHECKELF: b t2(PLT)
 | 
						|
; CHECKT2D-LABEL: t3:
 | 
						|
; CHECKT2D: b.w _t2
 | 
						|
 | 
						|
        tail call void @t2( )            ; <void> [#uses=0]
 | 
						|
        ret void
 | 
						|
}
 | 
						|
 | 
						|
; Sibcall optimization of expanded libcalls. rdar://8707777
 | 
						|
; t4 returns the result of a tail call to @sin on its double argument.
; The expected output branches to the routine instead of calling it:
; `b _sin` for CHECKV6 and `b sin(PLT)` for CHECKELF.
define double @t4(double %a) nounwind readonly ssp {
 | 
						|
entry:
 | 
						|
; CHECKV6-LABEL: t4:
 | 
						|
; CHECKV6: b _sin
 | 
						|
; CHECKELF-LABEL: t4:
 | 
						|
; CHECKELF: b sin(PLT)
 | 
						|
  %0 = tail call double @sin(double %a) nounwind readonly ; <double> [#uses=1]
 | 
						|
  ret double %0
 | 
						|
}
 | 
						|
 | 
						|
; t5 is the single-precision counterpart of @t4: it returns the result of a
; tail call to @sinf. The expected output is `b _sinf` for CHECKV6 and
; `b sinf(PLT)` for CHECKELF.
define float @t5(float %a) nounwind readonly ssp {
 | 
						|
entry:
 | 
						|
; CHECKV6-LABEL: t5:
 | 
						|
; CHECKV6: b _sinf
 | 
						|
; CHECKELF-LABEL: t5:
 | 
						|
; CHECKELF: b sinf(PLT)
 | 
						|
  %0 = tail call float @sinf(float %a) nounwind readonly ; <float> [#uses=1]
 | 
						|
  ret float %0
 | 
						|
}
 | 
						|
 | 
						|
; External math routines tail-called by @t5 (@sinf) and @t4 (@sin).
declare float @sinf(float) nounwind readonly
 | 
						|
 | 
						|
declare double @sin(double) nounwind readonly
 | 
						|
 | 
						|
; t6 returns the signed 32-bit quotient %a / %b. The IR contains no explicit
; call; the expected output branches to a division routine instead:
; `b ___divsi3` for CHECKV6 and `b __aeabi_idiv(PLT)` for CHECKELF.
define i32 @t6(i32 %a, i32 %b) nounwind readnone {
 | 
						|
entry:
 | 
						|
; CHECKV6-LABEL: t6:
 | 
						|
; CHECKV6: b ___divsi3
 | 
						|
; CHECKELF-LABEL: t6:
 | 
						|
; CHECKELF: b __aeabi_idiv(PLT)
 | 
						|
  %0 = sdiv i32 %a, %b
 | 
						|
  ret i32 %0
 | 
						|
}
 | 
						|
 | 
						|
; Make sure the tail call instruction isn't deleted
 | 
						|
; rdar://8309338
 | 
						|
; External callee tail-called from both successor blocks of @t7.
declare void @foo() nounwind
 | 
						|
 | 
						|
; t7 branches on an undef condition to one of two blocks, each of which
; tail-calls @foo: %bb1.lr.ph ends in `unreachable`, while %bb returns void.
; The CHECKT2D prefix expects `blxeq _foo`, `pop.w` and `b.w _foo` on
; consecutive lines, i.e. the tail call before `ret void` must survive.
define void @t7() nounwind {
 | 
						|
entry:
 | 
						|
; CHECKT2D-LABEL: t7:
 | 
						|
; CHECKT2D: blxeq _foo
 | 
						|
; CHECKT2D-NEXT: pop.w
 | 
						|
; CHECKT2D-NEXT: b.w _foo
 | 
						|
  br i1 undef, label %bb, label %bb1.lr.ph
 | 
						|
 | 
						|
bb1.lr.ph:
 | 
						|
  tail call void @foo() nounwind
 | 
						|
  unreachable
 | 
						|
 | 
						|
bb:
 | 
						|
  tail call void @foo() nounwind
 | 
						|
  ret void
 | 
						|
}
 | 
						|
 | 
						|
; Make sure codegenprep is duplicating ret instructions to enable tail calls.
 | 
						|
; rdar://11140249
 | 
						|
; t8 tests bit 0 and then bit 1 of %x and tail-calls @a, @b or @c accordingly.
; All three call results feed a phi in the shared %return block, which holds
; the only `ret`. The CHECKT2D prefix expects no `push` before the first
; branch, and expects the calls to be emitted as branches: `bne.w _a`,
; `bne.w _b` and finally `b.w _c`.
define i32 @t8(i32 %x) nounwind ssp {
 | 
						|
entry:
 | 
						|
; CHECKT2D-LABEL: t8:
 | 
						|
; CHECKT2D-NOT: push
 | 
						|
  %and = and i32 %x, 1
 | 
						|
  %tobool = icmp eq i32 %and, 0
 | 
						|
  br i1 %tobool, label %if.end, label %if.then
 | 
						|
 | 
						|
if.then:                                          ; preds = %entry
 | 
						|
; CHECKT2D: bne.w _a
 | 
						|
  %call = tail call i32 @a(i32 %x) nounwind
 | 
						|
  br label %return
 | 
						|
 | 
						|
if.end:                                           ; preds = %entry
 | 
						|
  %and1 = and i32 %x, 2
 | 
						|
  %tobool2 = icmp eq i32 %and1, 0
 | 
						|
  br i1 %tobool2, label %if.end5, label %if.then3
 | 
						|
 | 
						|
if.then3:                                         ; preds = %if.end
 | 
						|
; CHECKT2D: bne.w _b
 | 
						|
  %call4 = tail call i32 @b(i32 %x) nounwind
 | 
						|
  br label %return
 | 
						|
 | 
						|
if.end5:                                          ; preds = %if.end
 | 
						|
; CHECKT2D: b.w _c
 | 
						|
  %call6 = tail call i32 @c(i32 %x) nounwind
 | 
						|
  br label %return
 | 
						|
 | 
						|
return:                                           ; preds = %if.end5, %if.then3, %if.then
 | 
						|
  %retval.0 = phi i32 [ %call, %if.then ], [ %call4, %if.then3 ], [ %call6, %if.end5 ]
 | 
						|
  ret i32 %retval.0
 | 
						|
}
 | 
						|
 | 
						|
; External callees for the three tail-call sites in @t8; each takes and
; returns an i32.
declare i32 @a(i32)
 | 
						|
 | 
						|
declare i32 @b(i32)
 | 
						|
 | 
						|
declare i32 @c(i32)
 | 
						|
 | 
						|
; PR12419
 | 
						|
; rdar://11195178
 | 
						|
; Use the correct input chain for the tailcall node or else the call to
 | 
						|
; _ZN9MutexLockD1Ev would be lost.
 | 
						|
; Struct type with a single i8 member; @t9 allocates one on the stack.
%class.MutexLock = type { i8 }
 | 
						|
 | 
						|
; External i32 global that @t9 loads and uses as the divisor.
@x = external global i32, align 4
 | 
						|
 | 
						|
; t9 calls @_ZN9MutexLockC1Ev on a stack-allocated %class.MutexLock, loads @x,
; computes 1000 / x, calls @_ZN9MutexLockD1Ev on the same object and returns
; the quotient. The CHECKT2D prefix expects both `blx` calls to be present,
; followed by a branch `b.w ___divsi3` for the division.
define i32 @t9() nounwind {
 | 
						|
; CHECKT2D-LABEL: t9:
 | 
						|
; CHECKT2D: blx __ZN9MutexLockC1Ev
 | 
						|
; CHECKT2D: blx __ZN9MutexLockD1Ev
 | 
						|
; CHECKT2D: b.w ___divsi3
 | 
						|
  %lock = alloca %class.MutexLock, align 1
 | 
						|
  %1 = call %class.MutexLock* @_ZN9MutexLockC1Ev(%class.MutexLock* %lock)
 | 
						|
  %2 = load i32* @x, align 4
 | 
						|
  %3 = sdiv i32 1000, %2
 | 
						|
  %4 = call %class.MutexLock* @_ZN9MutexLockD1Ev(%class.MutexLock* %lock)
 | 
						|
  ret i32 %3
 | 
						|
}
 | 
						|
 | 
						|
; External routines called by @t9 before and after the division; each takes
; and returns a %class.MutexLock pointer.
declare %class.MutexLock* @_ZN9MutexLockC1Ev(%class.MutexLock*) unnamed_addr nounwind align 2
 | 
						|
 | 
						|
declare %class.MutexLock* @_ZN9MutexLockD1Ev(%class.MutexLock*) unnamed_addr nounwind align 2
 | 
						|
 | 
						|
; rdar://13827621
 | 
						|
; Correctly preserve the input chain for the tailcall node in the bitcast case,
 | 
						|
; otherwise the call to floorf is lost.
 | 
						|
; libcall_tc_test2 loads the float at %a, stores floorf of that value back to
; %a, and then returns the result of a tail call to truncf(%b). The CHECKT2D
; prefix expects a real call `blx _floorf` followed by a branch `b.w _truncf`.
define float @libcall_tc_test2(float* nocapture %a, float %b) {
 | 
						|
; CHECKT2D-LABEL: libcall_tc_test2:
 | 
						|
; CHECKT2D: blx _floorf
 | 
						|
; CHECKT2D: b.w _truncf
 | 
						|
  %1 = load float* %a, align 4
 | 
						|
  %call = tail call float @floorf(float %1)
 | 
						|
  store float %call, float* %a, align 4
 | 
						|
  %call1 = tail call float @truncf(float %b)
 | 
						|
  ret float %call1
 | 
						|
}
 | 
						|
 | 
						|
; External float routines called by @libcall_tc_test2; both are declared
; readnone.
declare float @floorf(float) readnone
 | 
						|
						|
declare float @truncf(float) readnone
 |