mirror of
				https://github.com/c64scene-ar/llvm-6502.git
				synced 2025-10-30 16:17:05 +00:00 
			
		
		
		
	The C and C++ semantics for compare_exchange require it to return a bool
indicating success. This gets mapped to LLVM IR which follows each cmpxchg with
an icmp of the value loaded against the desired value.
When lowered to ldxr/stxr loops, this extra comparison is redundant: its
results are implicit in the control-flow of the function.
This commit makes two changes: it replaces that icmp with appropriate PHI
nodes, and then makes sure earlyCSE is called after expansion to actually make
use of the opportunities revealed.
I've also added -{arm,aarch64}-enable-atomic-tidy options, so that
existing fragile tests aren't perturbed too much by the change. Many
of them either rely on undef/unreachable too pervasively to be
restored to something well-defined (particularly while making sure
they test the same obscure assert from many years ago), or depend on a
particular CFG shape, which is disrupted by SimplifyCFG.
rdar://problem/16227836
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@209883 91177308-0d34-0410-b5e6-96231b3b80d8
		
	
		
			
				
	
	
		
			22 lines
		
	
	
		
			713 B
		
	
	
	
		
			LLVM
		
	
	
	
	
	
			
		
		
	
	
			22 lines
		
	
	
		
			713 B
		
	
	
	
		
			LLVM
		
	
	
	
	
	
| ; Tests for the two-address instruction pass.
 | |
| ; RUN: llc -mtriple=arm-eabi -mcpu=cortex-a9 -arm-atomic-cfg-tidy=0 %s -o - | FileCheck %s
 | |
| 
 | |
| define void @PR13378() nounwind {
 | |
| ; This was originally a crasher trying to schedule the instructions.
 | |
| ; The directives below expect one vld1.32, two vst1.32, two vmov.f32 and a
 | |
| ; final vst1.32 on consecutive lines of the llc output.
 | |
| ; CHECK-LABEL:      PR13378:
 | |
| ; CHECK:        vld1.32
 | |
| ; CHECK-NEXT:   vst1.32
 | |
| ; CHECK-NEXT:   vst1.32
 | |
| ; CHECK-NEXT:   vmov.f32
 | |
| ; CHECK-NEXT:   vmov.f32
 | |
| ; CHECK-NEXT:   vst1.32
 | |
| 
 | |
| ; Load a <4 x float>, store zero and then the loaded value, set lane 3 to
 | |
| ; 1.0 and store the result. Every address is undef and the block ends in
 | |
| ; unreachable.
 | |
| entry:
 | |
|   %0 = load <4 x float>* undef, align 4
 | |
|   store <4 x float> zeroinitializer, <4 x float>* undef, align 4
 | |
|   store <4 x float> %0, <4 x float>* undef, align 4
 | |
|   %1 = insertelement <4 x float> %0, float 1.000000e+00, i32 3
 | |
|   store <4 x float> %1, <4 x float>* undef, align 4
 | |
|   unreachable
 | |
| }
 |