mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2024-12-16 11:30:51 +00:00
32b845d223
See r230786 and r230794 for similar changes to gep and load respectively. Call is a bit different because it often doesn't have a single explicit type - usually the type is deduced from the arguments, and just the return type is explicit. In those cases there's no need to change the IR. When that's not the case, the IR usually contains the pointer type of the first operand - but since typed pointers are going away, that representation is insufficient so I'm just stripping the "pointerness" of the explicit type away. This does make the IR a bit weird - it /sort of/ reads like the type of the first operand: "call void () %x(" but %x is actually of type "void ()*" and will eventually be just of type "ptr". But this seems not too bad and I don't think it would benefit from repeating the type ("void (), void () * %x(" and then eventually "void (), ptr %x(") as has been done with gep and load. This also has a side benefit: since the explicit type is no longer a pointer, there's no ambiguity between an explicit type and a function that returns a function pointer. Previously this case needed an explicit type (eg: a function returning a void() function was written as "call void () () * @x(" rather than "call void () * @x(" because of the ambiguity between a function returning a pointer to a void() function and a function returning void). No ambiguity means even function pointer return types can just be written alone, without writing the whole function's type. This leaves /only/ the varargs case where the explicit type is required. Given the special type syntax in call instructions, the regex-fu used for migration was a bit more involved in its own unique way (as every one of these is) so here it is. Use it in conjunction with the apply.sh script and associated find/xargs commands I've provided in rr230786 to migrate your out of tree tests. Do let me know if any of this doesn't cover your cases & we can iterate on a more general script/regexes to help others with out of tree tests. About 9 test cases couldn't be automatically migrated - half of those were functions returning function pointers, where I just had to manually delete the function argument types now that we didn't need an explicit function type there. The other half were typedefs of function types used in calls - just had to manually drop the * from those. import fileinput import sys import re pat = re.compile(r'((?:=|:|^|\s)call\s(?:[^@]*?))(\s*$|\s*(?:(?:\[\[[a-zA-Z0-9_]+\]\]|[@%](?:(")?[\\\?@a-zA-Z0-9_.]*?(?(3)"|)|{{.*}}))(?:\(|$)|undef|inttoptr|bitcast|null|asm).*$)') addrspace_end = re.compile(r"addrspace\(\d+\)\s*\*$") func_end = re.compile("(?:void.*|\)\s*)\*$") def conv(match, line): if not match or re.search(addrspace_end, match.group(1)) or not re.search(func_end, match.group(1)): return line return line[:match.start()] + match.group(1)[:match.group(1).rfind('*')].rstrip() + match.group(2) + line[match.end():] for line in sys.stdin: sys.stdout.write(conv(re.search(pat, line), line)) git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@235145 91177308-0d34-0410-b5e6-96231b3b80d8
315 lines
7.2 KiB
LLVM
315 lines
7.2 KiB
LLVM
; RUN: llc < %s -mattr=-avx -fast-isel -mcpu=core2 -O0 -regalloc=fast -asm-verbose=0 -fast-isel-abort=1 | FileCheck %s
|
|
; RUN: llc < %s -mattr=+avx -fast-isel -mcpu=core2 -O0 -regalloc=fast -asm-verbose=0 -fast-isel-abort=1 | FileCheck %s --check-prefix=AVX
|
|
|
|
target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64"
|
|
target triple = "x86_64-apple-darwin10.0.0"
|
|
|
|
; Make sure that fast-isel folds the immediate into the binop even though it
|
|
; is non-canonical.
|
|
define i32 @test1(i32 %i) nounwind ssp {
|
|
%and = and i32 8, %i
|
|
ret i32 %and
|
|
}
|
|
|
|
; CHECK-LABEL: test1:
|
|
; CHECK: andl $8,
|
|
|
|
|
|
; rdar://9289512 - The load should fold into the compare.
|
|
define void @test2(i64 %x) nounwind ssp {
|
|
entry:
|
|
%x.addr = alloca i64, align 8
|
|
store i64 %x, i64* %x.addr, align 8
|
|
%tmp = load i64, i64* %x.addr, align 8
|
|
%cmp = icmp sgt i64 %tmp, 42
|
|
br i1 %cmp, label %if.then, label %if.end
|
|
|
|
if.then: ; preds = %entry
|
|
br label %if.end
|
|
|
|
if.end: ; preds = %if.then, %entry
|
|
ret void
|
|
; CHECK-LABEL: test2:
|
|
; CHECK: movq %rdi, -8(%rsp)
|
|
; CHECK: cmpq $42, -8(%rsp)
|
|
}
|
|
|
|
|
|
|
|
|
|
@G = external global i32
|
|
define i64 @test3() nounwind {
|
|
%A = ptrtoint i32* @G to i64
|
|
ret i64 %A
|
|
; CHECK-LABEL: test3:
|
|
; CHECK: movq _G@GOTPCREL(%rip), %rax
|
|
; CHECK-NEXT: ret
|
|
}
|
|
|
|
|
|
|
|
; rdar://9289558
|
|
@rtx_length = external global [153 x i8]
|
|
|
|
define i32 @test4(i64 %idxprom9) nounwind {
|
|
%arrayidx10 = getelementptr inbounds [153 x i8], [153 x i8]* @rtx_length, i32 0, i64 %idxprom9
|
|
%tmp11 = load i8, i8* %arrayidx10, align 1
|
|
%conv = zext i8 %tmp11 to i32
|
|
ret i32 %conv
|
|
|
|
; CHECK-LABEL: test4:
|
|
; CHECK: movq _rtx_length@GOTPCREL(%rip), %rax
|
|
; CHECK-NEXT: movzbl (%rax,%rdi), %eax
|
|
; CHECK-NEXT: ret
|
|
}
|
|
|
|
|
|
; PR3242 - Out of range shifts should not be folded by fastisel.
|
|
define void @test5(i32 %x, i32* %p) nounwind {
|
|
%y = ashr i32 %x, 50000
|
|
store i32 %y, i32* %p
|
|
ret void
|
|
|
|
; CHECK-LABEL: test5:
|
|
; CHECK: movl $50000, %ecx
|
|
; CHECK: sarl %cl, %edi
|
|
; CHECK: ret
|
|
}
|
|
|
|
; rdar://9289501 - fast isel should fold trivial multiplies to shifts.
|
|
define i64 @test6(i64 %x) nounwind ssp {
|
|
entry:
|
|
%mul = mul nsw i64 %x, 8
|
|
ret i64 %mul
|
|
|
|
; CHECK-LABEL: test6:
|
|
; CHECK: shlq $3, %rdi
|
|
}
|
|
|
|
define i32 @test7(i32 %x) nounwind ssp {
|
|
entry:
|
|
%mul = mul nsw i32 %x, 8
|
|
ret i32 %mul
|
|
; CHECK-LABEL: test7:
|
|
; CHECK: shll $3, %edi
|
|
}
|
|
|
|
|
|
; rdar://9289507 - folding of immediates into 64-bit operations.
|
|
define i64 @test8(i64 %x) nounwind ssp {
|
|
entry:
|
|
%add = add nsw i64 %x, 7
|
|
ret i64 %add
|
|
|
|
; CHECK-LABEL: test8:
|
|
; CHECK: addq $7, %rdi
|
|
}
|
|
|
|
define i64 @test9(i64 %x) nounwind ssp {
|
|
entry:
|
|
%add = mul nsw i64 %x, 7
|
|
ret i64 %add
|
|
; CHECK-LABEL: test9:
|
|
; CHECK: imulq $7, %rdi, %rax
|
|
}
|
|
|
|
; rdar://9297011 - Don't reject udiv by a power of 2.
|
|
define i32 @test10(i32 %X) nounwind {
|
|
%Y = udiv i32 %X, 8
|
|
ret i32 %Y
|
|
; CHECK-LABEL: test10:
|
|
; CHECK: shrl $3,
|
|
}
|
|
|
|
define i32 @test11(i32 %X) nounwind {
|
|
%Y = sdiv exact i32 %X, 8
|
|
ret i32 %Y
|
|
; CHECK-LABEL: test11:
|
|
; CHECK: sarl $3,
|
|
}
|
|
|
|
|
|
; rdar://9297006 - Trunc to bool.
|
|
define void @test12(i8 %tmp) nounwind ssp noredzone {
|
|
entry:
|
|
%tobool = trunc i8 %tmp to i1
|
|
br i1 %tobool, label %if.then, label %if.end
|
|
|
|
if.then: ; preds = %entry
|
|
call void @test12(i8 0) noredzone
|
|
br label %if.end
|
|
|
|
if.end: ; preds = %if.then, %entry
|
|
ret void
|
|
; CHECK-LABEL: test12:
|
|
; CHECK: testb $1,
|
|
; CHECK-NEXT: je L
|
|
; CHECK-NEXT: xorl %edi, %edi
|
|
; CHECK-NEXT: callq
|
|
}
|
|
|
|
declare void @test13f(i1 %X)
|
|
|
|
define void @test13() nounwind {
|
|
call void @test13f(i1 0)
|
|
ret void
|
|
; CHECK-LABEL: test13:
|
|
; CHECK: xorl %edi, %edi
|
|
; CHECK-NEXT: callq
|
|
}
|
|
|
|
|
|
|
|
; rdar://9297003 - fast isel bails out on all functions taking bools
|
|
define void @test14(i8 %tmp) nounwind ssp noredzone {
|
|
entry:
|
|
%tobool = trunc i8 %tmp to i1
|
|
call void @test13f(i1 zeroext %tobool) noredzone
|
|
ret void
|
|
; CHECK-LABEL: test14:
|
|
; CHECK: andb $1,
|
|
; CHECK: callq
|
|
}
|
|
|
|
declare void @llvm.memcpy.p0i8.p0i8.i64(i8*, i8*, i64, i32, i1)
|
|
|
|
; rdar://9289488 - fast-isel shouldn't bail out on llvm.memcpy
|
|
define void @test15(i8* %a, i8* %b) nounwind {
|
|
call void @llvm.memcpy.p0i8.p0i8.i64(i8* %a, i8* %b, i64 4, i32 4, i1 false)
|
|
ret void
|
|
; CHECK-LABEL: test15:
|
|
; CHECK-NEXT: movl (%rsi), %eax
|
|
; CHECK-NEXT: movl %eax, (%rdi)
|
|
; CHECK-NEXT: ret
|
|
}
|
|
|
|
; Handling for varargs calls
|
|
declare void @test16callee(...) nounwind
|
|
define void @test16() nounwind {
|
|
; CHECK-LABEL: test16:
|
|
; CHECK: movl $1, %edi
|
|
; CHECK: movb $0, %al
|
|
; CHECK: callq _test16callee
|
|
call void (...) @test16callee(i32 1)
|
|
br label %block2
|
|
|
|
block2:
|
|
; CHECK: movsd LCP{{.*}}_{{.*}}(%rip), %xmm0
|
|
; CHECK: movb $1, %al
|
|
; CHECK: callq _test16callee
|
|
|
|
; AVX: vmovsd LCP{{.*}}_{{.*}}(%rip), %xmm0
|
|
; AVX: movb $1, %al
|
|
; AVX: callq _test16callee
|
|
call void (...) @test16callee(double 1.000000e+00)
|
|
ret void
|
|
}
|
|
|
|
|
|
declare void @foo() unnamed_addr ssp align 2
|
|
|
|
; Verify that we don't fold the load into the compare here. That would move it
|
|
; w.r.t. the call.
|
|
define i32 @test17(i32 *%P) ssp nounwind {
|
|
entry:
|
|
%tmp = load i32, i32* %P
|
|
%cmp = icmp ne i32 %tmp, 5
|
|
call void @foo()
|
|
br i1 %cmp, label %if.then, label %if.else
|
|
|
|
if.then: ; preds = %entry
|
|
ret i32 1
|
|
|
|
if.else: ; preds = %entry
|
|
ret i32 2
|
|
; CHECK-LABEL: test17:
|
|
; CHECK: movl (%rdi), %eax
|
|
; CHECK: callq _foo
|
|
; CHECK: cmpl $5, %eax
|
|
; CHECK-NEXT: je
|
|
}
|
|
|
|
; Check that 0.0 is materialized using xorps
|
|
define void @test18(float* %p1) {
|
|
store float 0.0, float* %p1
|
|
ret void
|
|
; CHECK-LABEL: test18:
|
|
; CHECK: xorps
|
|
}
|
|
|
|
; Without any type hints, doubles use the smaller xorps instead of xorpd.
|
|
define void @test19(double* %p1) {
|
|
store double 0.0, double* %p1
|
|
ret void
|
|
; CHECK-LABEL: test19:
|
|
; CHECK: xorps
|
|
}
|
|
|
|
; Check that we fast-isel sret
|
|
%struct.a = type { i64, i64, i64 }
|
|
define void @test20() nounwind ssp {
|
|
entry:
|
|
%tmp = alloca %struct.a, align 8
|
|
call void @test20sret(%struct.a* sret %tmp)
|
|
ret void
|
|
; CHECK-LABEL: test20:
|
|
; CHECK: leaq (%rsp), %rdi
|
|
; CHECK: callq _test20sret
|
|
}
|
|
declare void @test20sret(%struct.a* sret)
|
|
|
|
; Check that -0.0 is not materialized using xor
|
|
define void @test21(double* %p1) {
|
|
store double -0.0, double* %p1
|
|
ret void
|
|
; CHECK-LABEL: test21:
|
|
; CHECK-NOT: xor
|
|
; CHECK: movsd LCPI
|
|
}
|
|
|
|
; Check that immediate arguments to a function
|
|
; do not cause massive spilling and are used
|
|
; as immediates just before the call.
|
|
define void @test22() nounwind {
|
|
entry:
|
|
call void @foo22(i32 0)
|
|
call void @foo22(i32 1)
|
|
call void @foo22(i32 2)
|
|
call void @foo22(i32 3)
|
|
ret void
|
|
; CHECK-LABEL: test22:
|
|
; CHECK: xorl %edi, %edi
|
|
; CHECK: callq _foo22
|
|
; CHECK: movl $1, %edi
|
|
; CHECK: callq _foo22
|
|
; CHECK: movl $2, %edi
|
|
; CHECK: callq _foo22
|
|
; CHECK: movl $3, %edi
|
|
; CHECK: callq _foo22
|
|
}
|
|
|
|
declare void @foo22(i32)
|
|
|
|
; PR13563
|
|
define void @test23(i8* noalias sret %result) {
|
|
%a = alloca i8
|
|
%b = call i8* @foo23()
|
|
ret void
|
|
; CHECK-LABEL: test23:
|
|
; CHECK: call
|
|
; CHECK: movq %rdi, %rax
|
|
; CHECK: ret
|
|
}
|
|
|
|
declare i8* @foo23()
|
|
|
|
declare void @takesi32ptr(i32* %arg)
|
|
|
|
; CHECK-LABEL: allocamaterialize
|
|
define void @allocamaterialize() {
|
|
%a = alloca i32
|
|
; CHECK: leaq {{.*}}, %rdi
|
|
call void @takesi32ptr(i32* %a)
|
|
ret void
|
|
}
|