mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-01-12 17:32:19 +00:00
4b5324ad2c
optimized x86-64 (and x86) calls so that they work (... at least for my test cases). Should fix the following problems: Problem 1: When i introduced the optimized handling of arguments for tail called functions (using a sequence of copyto/copyfrom virtual registers instead of always lowering to top of the stack) i did not handle byval arguments correctly e.g they did not work at all :). Problem 2: On x86-64 after the arguments of the tail called function are moved to their registers (which include ESI/RSI etc), tail call optimization performs byval lowering which causes xSI,xDI, xCX registers to be overwritten. This is handled in this patch by moving the arguments to virtual registers first and after the byval lowering the arguments are moved from those virtual registers back to RSI/RDI/RCX. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@49584 91177308-0d34-0410-b5e6-96231b3b80d8
20 lines
681 B
LLVM
20 lines
681 B
LLVM
; RUN: llvm-as < %s | llc -march=x86 -tailcallopt | grep TAILCALL
|
|
; check for the 2 byval moves
|
|
; RUN: llvm-as < %s | llc -march=x86 -tailcallopt | grep rep | wc -l | grep 2
|
|
%struct.s = type {i32, i32, i32, i32, i32, i32, i32, i32,
|
|
i32, i32, i32, i32, i32, i32, i32, i32,
|
|
i32, i32, i32, i32, i32, i32, i32, i32 }
|
|
|
|
define fastcc i32 @tailcallee(%struct.s* byval %a) {
|
|
entry:
|
|
%tmp2 = getelementptr %struct.s* %a, i32 0, i32 0
|
|
%tmp3 = load i32* %tmp2
|
|
ret i32 %tmp3
|
|
}
|
|
|
|
define fastcc i32 @tailcaller(%struct.s* byval %a) {
|
|
entry:
|
|
%tmp4 = tail call fastcc i32 @tailcallee(%struct.s* %a byval)
|
|
ret i32 %tmp4
|
|
}
|