mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2024-12-27 13:30:05 +00:00
7b837d8c75
This adds a second implementation of the AArch64 architecture to LLVM, accessible in parallel via the "arm64" triple. The plan over the coming weeks and months is to merge the two into a single backend, during which time thorough code review should naturally occur. Everything will be easier with the target in-tree, though, hence this commit.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@205090 91177308-0d34-0410-b5e6-96231b3b80d8
103 lines
4.9 KiB
LLVM
103 lines
4.9 KiB
LLVM
; RUN: llc -mtriple arm64-apple-ios -O3 -o - < %s | FileCheck %s
|
|
; <rdar://problem/14477220>
|
|
|
|
; Two-field aggregates used by the three test functions in this file.
; Pair of 32-bit floats.
%class.Complex = type { float, float }
|
|
; Pair of 32-bit integers.
%class.Complex_int = type { i32, i32 }
|
|
; Pair of 64-bit integers.
%class.Complex_long = type { i64, i64 }
|
|
|
|
; CHECK-LABEL: @test
|
|
; CHECK: add [[BASE:x[0-9]+]], x0, x1, lsl #3
|
|
; CHECK: ldp [[CPLX1_I:s[0-9]+]], [[CPLX1_R:s[0-9]+]], {{\[}}[[BASE]]]
|
|
; CHECK: ldp [[CPLX2_I:s[0-9]+]], [[CPLX2_R:s[0-9]+]], {{\[}}[[BASE]], #64]
|
|
; CHECK: fadd {{s[0-9]+}}, [[CPLX2_I]], [[CPLX1_I]]
|
|
; CHECK: fadd {{s[0-9]+}}, [[CPLX2_R]], [[CPLX1_R]]
|
|
; CHECK: ret
|
|
; Float variant: reads out[out_start] as one 64-bit integer and splits it into
; two floats, reads the two fields of out[out_start + 8] individually, adds the
; corresponding values, and stores the two sums back to out[out_start] as a
; <2 x float>. The FileCheck patterns above expect both reads to become ldp
; instructions off a shared base register.
define void @test(%class.Complex* nocapture %out, i64 %out_start) {
|
|
entry:
|
|
; Address of element out[out_start].
%arrayidx = getelementptr inbounds %class.Complex* %out, i64 %out_start
|
|
; Reinterpret the two-float struct as a single i64 so it is read in one load.
%0 = bitcast %class.Complex* %arrayidx to i64*
|
|
%1 = load i64* %0, align 4
|
|
; Low 32 bits of the combined load, reinterpreted as a float.
%t0.sroa.0.0.extract.trunc = trunc i64 %1 to i32
|
|
%2 = bitcast i32 %t0.sroa.0.0.extract.trunc to float
|
|
; High 32 bits of the combined load, reinterpreted as a float.
%t0.sroa.2.0.extract.shift = lshr i64 %1, 32
|
|
%t0.sroa.2.0.extract.trunc = trunc i64 %t0.sroa.2.0.extract.shift to i32
|
|
%3 = bitcast i32 %t0.sroa.2.0.extract.trunc to float
|
|
; Second operand lives 8 elements further on; the FileCheck patterns above
; expect this to show up as a #64 byte offset from the same base.
%add = add i64 %out_start, 8
|
|
%arrayidx2 = getelementptr inbounds %class.Complex* %out, i64 %add
|
|
; Field 0 of the second element, added to the low half extracted above.
%i.i = getelementptr inbounds %class.Complex* %arrayidx2, i64 0, i32 0
|
|
%4 = load float* %i.i, align 4
|
|
%add.i = fadd float %4, %2
|
|
%retval.sroa.0.0.vec.insert.i = insertelement <2 x float> undef, float %add.i, i32 0
|
|
; Field 1 of the second element, added to the high half extracted above.
%r.i = getelementptr inbounds %class.Complex* %arrayidx2, i64 0, i32 1
|
|
%5 = load float* %r.i, align 4
|
|
%add5.i = fadd float %5, %3
|
|
%retval.sroa.0.4.vec.insert.i = insertelement <2 x float> %retval.sroa.0.0.vec.insert.i, float %add5.i, i32 1
|
|
; Write both sums back over out[out_start] with a single vector store.
%ref.tmp.sroa.0.0.cast = bitcast %class.Complex* %arrayidx to <2 x float>*
|
|
store <2 x float> %retval.sroa.0.4.vec.insert.i, <2 x float>* %ref.tmp.sroa.0.0.cast, align 4
|
|
ret void
|
|
}
|
|
|
|
; CHECK-LABEL: @test_int
|
|
; CHECK: add [[BASE:x[0-9]+]], x0, x1, lsl #3
|
|
; CHECK: ldp [[CPLX1_I:w[0-9]+]], [[CPLX1_R:w[0-9]+]], {{\[}}[[BASE]]]
|
|
; CHECK: ldp [[CPLX2_I:w[0-9]+]], [[CPLX2_R:w[0-9]+]], {{\[}}[[BASE]], #64]
|
|
; CHECK: add {{w[0-9]+}}, [[CPLX2_I]], [[CPLX1_I]]
|
|
; CHECK: add {{w[0-9]+}}, [[CPLX2_R]], [[CPLX1_R]]
|
|
; CHECK: ret
|
|
; i32 variant: reads out[out_start] as one 64-bit integer and splits it into
; two i32 halves, reads the two fields of out[out_start + 8] individually, adds
; the corresponding values, and stores the two sums back to out[out_start] as a
; <2 x i32>. The FileCheck patterns above expect both reads to become ldp
; instructions on w registers off a shared base register.
define void @test_int(%class.Complex_int* nocapture %out, i64 %out_start) {
|
|
entry:
|
|
; Address of element out[out_start].
%arrayidx = getelementptr inbounds %class.Complex_int* %out, i64 %out_start
|
|
; Reinterpret the two-i32 struct as a single i64 so it is read in one load.
%0 = bitcast %class.Complex_int* %arrayidx to i64*
|
|
%1 = load i64* %0, align 4
|
|
; Low 32 bits of the combined load.
%t0.sroa.0.0.extract.trunc = trunc i64 %1 to i32
|
|
; Same-type bitcast (i32 to i32); NOTE(review): presumably kept to mirror the
; float variant's instruction sequence - confirm.
%2 = bitcast i32 %t0.sroa.0.0.extract.trunc to i32
|
|
; High 32 bits of the combined load.
%t0.sroa.2.0.extract.shift = lshr i64 %1, 32
|
|
%t0.sroa.2.0.extract.trunc = trunc i64 %t0.sroa.2.0.extract.shift to i32
|
|
%3 = bitcast i32 %t0.sroa.2.0.extract.trunc to i32
|
|
; Second operand lives 8 elements further on; the FileCheck patterns above
; expect this to show up as a #64 byte offset from the same base.
%add = add i64 %out_start, 8
|
|
%arrayidx2 = getelementptr inbounds %class.Complex_int* %out, i64 %add
|
|
; Field 0 of the second element, added to the low half extracted above.
%i.i = getelementptr inbounds %class.Complex_int* %arrayidx2, i64 0, i32 0
|
|
%4 = load i32* %i.i, align 4
|
|
%add.i = add i32 %4, %2
|
|
%retval.sroa.0.0.vec.insert.i = insertelement <2 x i32> undef, i32 %add.i, i32 0
|
|
; Field 1 of the second element, added to the high half extracted above.
%r.i = getelementptr inbounds %class.Complex_int* %arrayidx2, i64 0, i32 1
|
|
%5 = load i32* %r.i, align 4
|
|
%add5.i = add i32 %5, %3
|
|
%retval.sroa.0.4.vec.insert.i = insertelement <2 x i32> %retval.sroa.0.0.vec.insert.i, i32 %add5.i, i32 1
|
|
; Write both sums back over out[out_start] with a single vector store.
%ref.tmp.sroa.0.0.cast = bitcast %class.Complex_int* %arrayidx to <2 x i32>*
|
|
store <2 x i32> %retval.sroa.0.4.vec.insert.i, <2 x i32>* %ref.tmp.sroa.0.0.cast, align 4
|
|
ret void
|
|
}
|
|
|
|
; CHECK-LABEL: @test_long
|
|
; CHECK: add [[BASE:x[0-9]+]], x0, x1, lsl #4
|
|
; CHECK: ldp [[CPLX1_I:x[0-9]+]], [[CPLX1_R:x[0-9]+]], {{\[}}[[BASE]]]
|
|
; CHECK: ldp [[CPLX2_I:x[0-9]+]], [[CPLX2_R:x[0-9]+]], {{\[}}[[BASE]], #128]
|
|
; CHECK: add {{x[0-9]+}}, [[CPLX2_I]], [[CPLX1_I]]
|
|
; CHECK: add {{x[0-9]+}}, [[CPLX2_R]], [[CPLX1_R]]
|
|
; CHECK: ret
|
|
; i64 variant: reads out[out_start] as one 128-bit integer and splits it into
; two i64 halves, reads the two fields of out[out_start + 8] individually, adds
; the corresponding values, and stores the two sums back to out[out_start] as a
; <2 x i64>. The FileCheck patterns above expect both reads to become ldp
; instructions on x registers, with the index scaled by lsl #4.
define void @test_long(%class.Complex_long* nocapture %out, i64 %out_start) {
|
|
entry:
|
|
; Address of element out[out_start].
%arrayidx = getelementptr inbounds %class.Complex_long* %out, i64 %out_start
|
|
; Reinterpret the two-i64 struct as a single i128 so it is read in one load.
%0 = bitcast %class.Complex_long* %arrayidx to i128*
|
|
%1 = load i128* %0, align 4
|
|
; Low 64 bits of the combined load.
%t0.sroa.0.0.extract.trunc = trunc i128 %1 to i64
|
|
; Same-type bitcast (i64 to i64); NOTE(review): presumably kept to mirror the
; float variant's instruction sequence - confirm.
%2 = bitcast i64 %t0.sroa.0.0.extract.trunc to i64
|
|
; High 64 bits of the combined load.
%t0.sroa.2.0.extract.shift = lshr i128 %1, 64
|
|
%t0.sroa.2.0.extract.trunc = trunc i128 %t0.sroa.2.0.extract.shift to i64
|
|
%3 = bitcast i64 %t0.sroa.2.0.extract.trunc to i64
|
|
; Second operand lives 8 elements further on; the FileCheck patterns above
; expect this to show up as a #128 byte offset from the same base.
%add = add i64 %out_start, 8
|
|
%arrayidx2 = getelementptr inbounds %class.Complex_long* %out, i64 %add
|
|
; Field 0 of the second element, added to the low half extracted above.
; Note the leading index here is i32 0, where the other two tests use i64 0.
%i.i = getelementptr inbounds %class.Complex_long* %arrayidx2, i32 0, i32 0
|
|
%4 = load i64* %i.i, align 4
|
|
%add.i = add i64 %4, %2
|
|
%retval.sroa.0.0.vec.insert.i = insertelement <2 x i64> undef, i64 %add.i, i32 0
|
|
; Field 1 of the second element, added to the high half extracted above.
%r.i = getelementptr inbounds %class.Complex_long* %arrayidx2, i32 0, i32 1
|
|
%5 = load i64* %r.i, align 4
|
|
%add5.i = add i64 %5, %3
|
|
%retval.sroa.0.4.vec.insert.i = insertelement <2 x i64> %retval.sroa.0.0.vec.insert.i, i64 %add5.i, i32 1
|
|
; Write both sums back over out[out_start] with a single vector store.
%ref.tmp.sroa.0.0.cast = bitcast %class.Complex_long* %arrayidx to <2 x i64>*
|
|
store <2 x i64> %retval.sroa.0.4.vec.insert.i, <2 x i64>* %ref.tmp.sroa.0.0.cast, align 4
|
|
ret void
|
|
}
|