mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-01-08 03:30:22 +00:00
7c9c6ed761
Essentially the same as the GEP change in r230786.

A similar migration script can be used to update test cases, though a few more
test case improvements/changes were required this time around: (r229269-r229278)

import fileinput
import sys
import re

pat = re.compile(r"((?:=|:|^)\s*load (?:atomic )?(?:volatile )?(.*?))(| addrspace\(\d+\) *)\*($| *(?:%|@|null|undef|blockaddress|getelementptr|addrspacecast|bitcast|inttoptr|\[\[[a-zA-Z]|\{\{).*$)")

for line in sys.stdin:
  sys.stdout.write(re.sub(pat, r"\1, \2\3*\4", line))

Reviewers: rafael, dexonsmith, grosser

Differential Revision: http://reviews.llvm.org/D7649

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@230794 91177308-0d34-0410-b5e6-96231b3b80d8
152 lines
4.0 KiB
LLVM
152 lines
4.0 KiB
LLVM
; Test 128-bit floating-point loads.
|
|
;
|
|
; RUN: llc < %s -mtriple=s390x-linux-gnu | FileCheck %s
|
|
|
|
; Baseline case: the fp128 is loaded straight from the incoming address, so
; the two doublewords sit at displacements 0 and 8 and both are expected to
; be fetched with LD.
define double @f1(i64 %src) {
; CHECK-LABEL: f1:
; CHECK: ld %f0, 0(%r2)
; CHECK: ld %f2, 8(%r2)
; CHECK: br %r14
  %addr = inttoptr i64 %src to fp128*
  %wide = load fp128, fp128* %addr
  ; Truncating to double gives the function a simple return value.
  %narrow = fptrunc fp128 %wide to double
  ret double %narrow
}
|
|
|
|
; Largest aligned base offset (4080) for which both doublewords, at 4080 and
; 4088, are still expected to be loaded with LD.
define double @f2(i64 %src) {
; CHECK-LABEL: f2:
; CHECK: ld %f0, 4080(%r2)
; CHECK: ld %f2, 4088(%r2)
; CHECK: br %r14
  %biased = add i64 %src, 4080
  %addr = inttoptr i64 %biased to fp128*
  %wide = load fp128, fp128* %addr
  %narrow = fptrunc fp128 %wide to double
  ret double %narrow
}
|
|
|
|
; One doubleword past f2's offset: the first half at 4088 is still expected
; to use LD, while the second half at 4096 is expected to switch to LDY.
define double @f3(i64 %src) {
; CHECK-LABEL: f3:
; CHECK: ld %f0, 4088(%r2)
; CHECK: ldy %f2, 4096(%r2)
; CHECK: br %r14
  %biased = add i64 %src, 4088
  %addr = inttoptr i64 %biased to fp128*
  %wide = load fp128, fp128* %addr
  %narrow = fptrunc fp128 %wide to double
  ret double %narrow
}
|
|
|
|
; One more doubleword up (base offset 4096): both halves, at 4096 and 4104,
; are now expected to be loaded with LDY.
define double @f4(i64 %src) {
; CHECK-LABEL: f4:
; CHECK: ldy %f0, 4096(%r2)
; CHECK: ldy %f2, 4104(%r2)
; CHECK: br %r14
  %biased = add i64 %src, 4096
  %addr = inttoptr i64 %biased to fp128*
  %wide = load fp128, fp128* %addr
  %narrow = fptrunc fp128 %wide to double
  ret double %narrow
}
|
|
|
|
; Largest aligned base offset (524272) for which both doublewords, at 524272
; and 524280, are still expected to be loaded with LDY.
define double @f5(i64 %src) {
; CHECK-LABEL: f5:
; CHECK: ldy %f0, 524272(%r2)
; CHECK: ldy %f2, 524280(%r2)
; CHECK: br %r14
  %biased = add i64 %src, 524272
  %addr = inttoptr i64 %biased to fp128*
  %wide = load fp128, fp128* %addr
  %narrow = fptrunc fp128 %wide to double
  ret double %narrow
}
|
|
|
|
; One doubleword past f5's offset (524280): the address is expected to be
; formed separately (here with LAY into %r1) before loading both halves with
; LD at displacements 0 and 8.
; This exact sequence is not mandatory; other correct sequences would be fine.
define double @f6(i64 %src) {
; CHECK-LABEL: f6:
; CHECK: lay %r1, 524280(%r2)
; CHECK: ld %f0, 0(%r1)
; CHECK: ld %f2, 8(%r1)
; CHECK: br %r14
  %biased = add i64 %src, 524280
  %addr = inttoptr i64 %biased to fp128*
  %wide = load fp128, fp128* %addr
  %narrow = fptrunc fp128 %wide to double
  ret double %narrow
}
|
|
|
|
; Highest aligned negative base offset (-8): the first half at -8 is expected
; to use LDY, while the second half lands at displacement 0 and is expected
; to use LD.
define double @f7(i64 %src) {
; CHECK-LABEL: f7:
; CHECK: ldy %f0, -8(%r2)
; CHECK: ld %f2, 0(%r2)
; CHECK: br %r14
  %biased = add i64 %src, -8
  %addr = inttoptr i64 %biased to fp128*
  %wide = load fp128, fp128* %addr
  %narrow = fptrunc fp128 %wide to double
  ret double %narrow
}
|
|
|
|
; One doubleword further down (base offset -16): both halves, at -16 and -8,
; have negative displacements and are expected to be loaded with LDY.
define double @f8(i64 %src) {
; CHECK-LABEL: f8:
; CHECK: ldy %f0, -16(%r2)
; CHECK: ldy %f2, -8(%r2)
; CHECK: br %r14
  %biased = add i64 %src, -16
  %addr = inttoptr i64 %biased to fp128*
  %wide = load fp128, fp128* %addr
  %narrow = fptrunc fp128 %wide to double
  ret double %narrow
}
|
|
|
|
; Lowest base offset (-524288) for which both doublewords, at -524288 and
; -524280, are still expected to be loaded with LDY.
define double @f9(i64 %src) {
; CHECK-LABEL: f9:
; CHECK: ldy %f0, -524288(%r2)
; CHECK: ldy %f2, -524280(%r2)
; CHECK: br %r14
  %biased = add i64 %src, -524288
  %addr = inttoptr i64 %biased to fp128*
  %wide = load fp128, fp128* %addr
  %narrow = fptrunc fp128 %wide to double
  ret double %narrow
}
|
|
|
|
; One doubleword below f9's offset (-524296): the offset is expected to be
; folded into the base register first (here with AGFI on %r2), after which
; both halves are loaded with LD at displacements 0 and 8.
; This exact sequence is not mandatory; other correct sequences would be fine.
define double @f10(i64 %src) {
; CHECK-LABEL: f10:
; CHECK: agfi %r2, -524296
; CHECK: ld %f0, 0(%r2)
; CHECK: ld %f2, 8(%r2)
; CHECK: br %r14
  %biased = add i64 %src, -524296
  %addr = inttoptr i64 %biased to fp128*
  %wide = load fp128, fp128* %addr
  %narrow = fptrunc fp128 %wide to double
  ret double %narrow
}
|
|
|
|
; Base + index addressing: with %src and %index summed and a further 4088
; added, the loads are expected to keep both registers in the address (in
; either order), using LD for displacement 4088 and LDY for 4096.
define double @f11(i64 %src, i64 %index) {
; CHECK-LABEL: f11:
; CHECK: ld %f0, 4088({{%r2,%r3|%r3,%r2}})
; CHECK: ldy %f2, 4096({{%r2,%r3|%r3,%r2}})
; CHECK: br %r14
  %indexed = add i64 %src, %index
  %biased = add i64 %indexed, 4088
  %addr = inttoptr i64 %biased to fp128*
  %wide = load fp128, fp128* %addr
  %narrow = fptrunc fp128 %wide to double
  ret double %narrow
}
|