mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2024-12-14 11:32:34 +00:00
d84561bf69
In a previous iteration of the pass, we would try to compensate for writeback by updating later instructions and/or inserting a SUBS to reset the base register if necessary. Since such a SUBS sets the condition flags it's not generally safe to do this. For now, only merge LDR/STRs if there is no writeback to the base register (LDM that loads into the base register) or the base register is killed by one of the merged instructions. These cases are clear wins both in terms of instruction count and performance. Also add three new test cases, and update the existing ones accordingly. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@215729 91177308-0d34-0410-b5e6-96231b3b80d8
78 lines
2.5 KiB
LLVM
78 lines
2.5 KiB
LLVM
; RUN: llc < %s -mtriple=thumb-apple-darwin -disable-cgp-branch-opts -disable-post-ra -verify-machineinstrs | FileCheck %s -check-prefix=CHECK
|
|
; RUN: llc < %s -mtriple=thumb-apple-darwin -disable-cgp-branch-opts -disable-post-ra -regalloc=basic -verify-machineinstrs | FileCheck %s -check-prefix=CHECK
|
|
|
|
%struct.state = type { i32, %struct.info*, float**, i32, i32, i32, i32, i32, i32, i32, i32, i32, i64, i64, i64, i64, i64, i64, i8* }
|
|
%struct.info = type { i32, i32, i32, i32, i32, i32, i32, i8* }
|
|
|
|
define void @t1(%struct.state* %v) {
|
|
; CHECK-LABEL: t1:
|
|
; CHECK: push
|
|
; CHECK: add r7, sp, #12
|
|
; CHECK: lsls r[[R0:[0-9]+]]
|
|
; CHECK: mov r[[R1:[0-9]+]], sp
|
|
; CHECK: subs r[[R2:[0-9]+]], r[[R1]], r[[R0]]
|
|
; CHECK: mov sp, r[[R2]]
|
|
%tmp6 = load i32* null
|
|
%tmp8 = alloca float, i32 %tmp6
|
|
store i32 1, i32* null
|
|
br i1 false, label %bb123.preheader, label %return
|
|
|
|
bb123.preheader:
|
|
br i1 false, label %bb43, label %return
|
|
|
|
bb43:
|
|
call fastcc void @f1( float* %tmp8, float* null, i32 0 )
|
|
%tmp70 = load i32* null
|
|
%tmp85 = getelementptr float* %tmp8, i32 0
|
|
call fastcc void @f2( float* null, float* null, float* %tmp85, i32 %tmp70 )
|
|
ret void
|
|
|
|
return:
|
|
ret void
|
|
}
|
|
|
|
declare fastcc void @f1(float*, float*, i32)
|
|
|
|
declare fastcc void @f2(float*, float*, float*, i32)
|
|
|
|
%struct.comment = type { i8**, i32*, i32, i8* }
|
|
@str215 = external global [2 x i8]
|
|
|
|
define void @t2(%struct.comment* %vc, i8* %tag, i8* %contents) {
|
|
; CHECK-LABEL: t2:
|
|
; CHECK: push
|
|
; CHECK: add r7, sp, #12
|
|
; CHECK: sub sp, #
|
|
; CHECK: mov r[[R0:[0-9]+]], sp
|
|
; CHECK: str r{{[0-9+]}}, [r[[R0]]
|
|
; CHECK: str r{{[0-9+]}}, [r[[R0]]
|
|
; CHECK-NOT: ldr r0, [sp
|
|
; CHECK: mov r[[R1:[0-9]+]], sp
|
|
; CHECK: subs r[[R2:[0-9]+]], r[[R1]], r{{[0-9]+}}
|
|
; CHECK: mov sp, r[[R2]]
|
|
; CHECK-NOT: ldr r0, [sp
|
|
; CHECK: bx
|
|
%tmp1 = call i32 @strlen( i8* %tag )
|
|
%tmp3 = call i32 @strlen( i8* %contents )
|
|
%tmp4 = add i32 %tmp1, 2
|
|
%tmp5 = add i32 %tmp4, %tmp3
|
|
%tmp6 = alloca i8, i32 %tmp5
|
|
%tmp9 = call i8* @strcpy( i8* %tmp6, i8* %tag )
|
|
%tmp6.len = call i32 @strlen( i8* %tmp6 )
|
|
%tmp6.indexed = getelementptr i8* %tmp6, i32 %tmp6.len
|
|
call void @llvm.memcpy.p0i8.p0i8.i32(i8* %tmp6.indexed, i8* getelementptr inbounds ([2 x i8]* @str215, i32 0, i32 0), i32 2, i32 1, i1 false)
|
|
%tmp15 = call i8* @strcat( i8* %tmp6, i8* %contents )
|
|
call fastcc void @comment_add( %struct.comment* %vc, i8* %tmp6 )
|
|
ret void
|
|
}
|
|
|
|
declare i32 @strlen(i8*)
|
|
|
|
declare i8* @strcat(i8*, i8*)
|
|
|
|
declare fastcc void @comment_add(%struct.comment*, i8*)
|
|
|
|
declare void @llvm.memcpy.p0i8.p0i8.i32(i8* nocapture, i8* nocapture, i32, i32, i1) nounwind
|
|
|
|
declare i8* @strcpy(i8*, i8*)
|