mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2024-12-28 04:33:05 +00:00
4de1039403
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@204804 91177308-0d34-0410-b5e6-96231b3b80d8
304 lines
13 KiB
LLVM
304 lines
13 KiB
LLVM
; RUN: llc < %s -mtriple=x86_64-apple-darwin -mcpu=knl | FileCheck %s
|
|
|
|
; Masked floating-point gather/scatter intrinsics on 512-bit-class vectors.
; Gather operands, as used by the call sites in this file: source vector
; (%src), mask, index vector (%ind), base pointer, and a trailing i32
; (presumably the address scale -- confirm against the intrinsic definition).
; Scatter operands: base pointer, mask, index vector, data vector, trailing i32.
; The mask is i16 for the 16-element forms and i8 for the 8-element forms.
; Variants indexed by 32-bit elements (<N x i32> index vectors):
declare <16 x float> @llvm.x86.avx512.gather.dps.mask.512 (<16 x float>, i16, <16 x i32>, i8*, i32)
|
|
declare void @llvm.x86.avx512.scatter.dps.mask.512 (i8*, i16, <16 x i32>, <16 x float>, i32)
|
|
declare <8 x double> @llvm.x86.avx512.gather.dpd.mask.512 (<8 x double>, i8, <8 x i32>, i8*, i32)
|
|
declare void @llvm.x86.avx512.scatter.dpd.mask.512 (i8*, i8, <8 x i32>, <8 x double>, i32)
|
|
|
|
; Variants indexed by 64-bit elements (<8 x i64> index vectors):
declare <8 x float> @llvm.x86.avx512.gather.qps.mask.512 (<8 x float>, i8, <8 x i64>, i8*, i32)
|
|
declare void @llvm.x86.avx512.scatter.qps.mask.512 (i8*, i8, <8 x i64>, <8 x float>, i32)
|
|
declare <8 x double> @llvm.x86.avx512.gather.qpd.mask.512 (<8 x double>, i8, <8 x i64>, i8*, i32)
|
|
declare void @llvm.x86.avx512.scatter.qpd.mask.512 (i8*, i8, <8 x i64>, <8 x double>, i32)
|
|
|
|
;CHECK-LABEL: gather_mask_dps
|
|
;CHECK: kmovw
|
|
;CHECK: vgatherdps
|
|
;CHECK: vpadd
|
|
;CHECK: vscatterdps
|
|
;CHECK: ret
|
|
; Masked round trip for 16 floats with 32-bit indices: gathers from %base
; using %ind under %mask (with %src as the source-vector operand), then
; scatters the gathered vector to %stbuf under the same mask.
; The scatter uses %ind2 = %ind + a constant offset vector, so the test also
; contains a vector integer add between the gather and the scatter.
define void @gather_mask_dps(<16 x i32> %ind, <16 x float> %src, i16 %mask, i8* %base, i8* %stbuf) {
|
|
%x = call <16 x float> @llvm.x86.avx512.gather.dps.mask.512 (<16 x float> %src, i16 %mask, <16 x i32>%ind, i8* %base, i32 4)
|
|
; Offset the indices by the repeating pattern 0,1,2,3 before scattering.
%ind2 = add <16 x i32> %ind, <i32 0, i32 1, i32 2, i32 3, i32 0, i32 1, i32 2, i32 3, i32 0, i32 1, i32 2, i32 3, i32 0, i32 1, i32 2, i32 3>
|
|
call void @llvm.x86.avx512.scatter.dps.mask.512 (i8* %stbuf, i16 %mask, <16 x i32>%ind2, <16 x float> %x, i32 4)
|
|
ret void
|
|
}
|
|
|
|
;CHECK-LABEL: gather_mask_dpd
|
|
;CHECK: kmovw
|
|
;CHECK: vgatherdpd
|
|
;CHECK: vpadd
|
|
;CHECK: vscatterdpd
|
|
;CHECK: ret
|
|
; Masked round trip for 8 doubles with 32-bit indices (<8 x i32>): gathers
; from %base using %ind under the i8 %mask, then scatters the result to
; %stbuf through the offset indices %ind2 under the same mask.
define void @gather_mask_dpd(<8 x i32> %ind, <8 x double> %src, i8 %mask, i8* %base, i8* %stbuf) {
|
|
%x = call <8 x double> @llvm.x86.avx512.gather.dpd.mask.512 (<8 x double> %src, i8 %mask, <8 x i32>%ind, i8* %base, i32 4)
|
|
; Offset the indices by the repeating pattern 0,1,2,3 before scattering.
%ind2 = add <8 x i32> %ind, <i32 0, i32 1, i32 2, i32 3, i32 0, i32 1, i32 2, i32 3>
|
|
call void @llvm.x86.avx512.scatter.dpd.mask.512 (i8* %stbuf, i8 %mask, <8 x i32>%ind2, <8 x double> %x, i32 4)
|
|
ret void
|
|
}
|
|
|
|
;CHECK-LABEL: gather_mask_qps
|
|
;CHECK: kmovw
|
|
;CHECK: vgatherqps
|
|
;CHECK: vpadd
|
|
;CHECK: vscatterqps
|
|
;CHECK: ret
|
|
; Masked round trip for 8 floats with 64-bit indices (<8 x i64>): gathers
; from %base using %ind under the i8 %mask, then scatters the result to
; %stbuf through the offset indices %ind2 under the same mask.
define void @gather_mask_qps(<8 x i64> %ind, <8 x float> %src, i8 %mask, i8* %base, i8* %stbuf) {
|
|
%x = call <8 x float> @llvm.x86.avx512.gather.qps.mask.512 (<8 x float> %src, i8 %mask, <8 x i64>%ind, i8* %base, i32 4)
|
|
; Offset the indices by the repeating pattern 0,1,2,3 before scattering.
%ind2 = add <8 x i64> %ind, <i64 0, i64 1, i64 2, i64 3, i64 0, i64 1, i64 2, i64 3>
|
|
call void @llvm.x86.avx512.scatter.qps.mask.512 (i8* %stbuf, i8 %mask, <8 x i64>%ind2, <8 x float> %x, i32 4)
|
|
ret void
|
|
}
|
|
|
|
;CHECK-LABEL: gather_mask_qpd
|
|
;CHECK: kmovw
|
|
;CHECK: vgatherqpd
|
|
;CHECK: vpadd
|
|
;CHECK: vscatterqpd
|
|
;CHECK: ret
|
|
; Masked round trip for 8 doubles with 64-bit indices (<8 x i64>): gathers
; from %base using %ind under the i8 %mask, then scatters the result to
; %stbuf through the offset indices %ind2 under the same mask.
define void @gather_mask_qpd(<8 x i64> %ind, <8 x double> %src, i8 %mask, i8* %base, i8* %stbuf) {
|
|
%x = call <8 x double> @llvm.x86.avx512.gather.qpd.mask.512 (<8 x double> %src, i8 %mask, <8 x i64>%ind, i8* %base, i32 4)
|
|
; Offset the indices by the repeating pattern 0,1,2,3 before scattering.
%ind2 = add <8 x i64> %ind, <i64 0, i64 1, i64 2, i64 3, i64 0, i64 1, i64 2, i64 3>
|
|
call void @llvm.x86.avx512.scatter.qpd.mask.512 (i8* %stbuf, i8 %mask, <8 x i64>%ind2, <8 x double> %x, i32 4)
|
|
ret void
|
|
}
|
|
;;
|
|
;; Integer Gather/Scatter
|
|
;;
|
|
; Masked integer gather/scatter intrinsics. Operand layout mirrors the call
; sites in this file: gather takes (source vector, mask, index vector, base
; pointer, i32); scatter takes (base pointer, mask, index vector, data vector,
; i32). The trailing i32 is presumably the address scale -- confirm.
; Variants indexed by 32-bit elements:
declare <16 x i32> @llvm.x86.avx512.gather.dpi.mask.512 (<16 x i32>, i16, <16 x i32>, i8*, i32)
|
|
declare void @llvm.x86.avx512.scatter.dpi.mask.512 (i8*, i16, <16 x i32>, <16 x i32>, i32)
|
|
declare <8 x i64> @llvm.x86.avx512.gather.dpq.mask.512 (<8 x i64>, i8, <8 x i32>, i8*, i32)
|
|
declare void @llvm.x86.avx512.scatter.dpq.mask.512 (i8*, i8, <8 x i32>, <8 x i64>, i32)
|
|
|
|
; Variants indexed by 64-bit elements:
declare <8 x i32> @llvm.x86.avx512.gather.qpi.mask.512 (<8 x i32>, i8, <8 x i64>, i8*, i32)
|
|
declare void @llvm.x86.avx512.scatter.qpi.mask.512 (i8*, i8, <8 x i64>, <8 x i32>, i32)
|
|
declare <8 x i64> @llvm.x86.avx512.gather.qpq.mask.512 (<8 x i64>, i8, <8 x i64>, i8*, i32)
|
|
declare void @llvm.x86.avx512.scatter.qpq.mask.512 (i8*, i8, <8 x i64>, <8 x i64>, i32)
|
|
|
|
;CHECK-LABEL: gather_mask_dd
|
|
;CHECK: kmovw
|
|
;CHECK: vpgatherdd
|
|
;CHECK: vpadd
|
|
;CHECK: vpscatterdd
|
|
;CHECK: ret
|
|
; Masked round trip for 16 x i32 data with 32-bit indices: gathers from %base
; using %ind under the i16 %mask via the dpi intrinsic, then scatters the
; result to %stbuf through the offset indices %ind2 under the same mask.
define void @gather_mask_dd(<16 x i32> %ind, <16 x i32> %src, i16 %mask, i8* %base, i8* %stbuf) {
|
|
%x = call <16 x i32> @llvm.x86.avx512.gather.dpi.mask.512 (<16 x i32> %src, i16 %mask, <16 x i32>%ind, i8* %base, i32 4)
|
|
; Offset the indices by the repeating pattern 0,1,2,3 before scattering.
%ind2 = add <16 x i32> %ind, <i32 0, i32 1, i32 2, i32 3, i32 0, i32 1, i32 2, i32 3, i32 0, i32 1, i32 2, i32 3, i32 0, i32 1, i32 2, i32 3>
|
|
call void @llvm.x86.avx512.scatter.dpi.mask.512 (i8* %stbuf, i16 %mask, <16 x i32>%ind2, <16 x i32> %x, i32 4)
|
|
ret void
|
|
}
|
|
|
|
;CHECK-LABEL: gather_mask_qd
|
|
;CHECK: kmovw
|
|
;CHECK: vpgatherqd
|
|
;CHECK: vpadd
|
|
;CHECK: vpscatterqd
|
|
;CHECK: ret
|
|
; Masked round trip for 8 x i32 data with 64-bit indices: gathers from %base
; using %ind under the i8 %mask via the qpi intrinsic, then scatters the
; result to %stbuf through the offset indices %ind2 under the same mask.
define void @gather_mask_qd(<8 x i64> %ind, <8 x i32> %src, i8 %mask, i8* %base, i8* %stbuf) {
|
|
%x = call <8 x i32> @llvm.x86.avx512.gather.qpi.mask.512 (<8 x i32> %src, i8 %mask, <8 x i64>%ind, i8* %base, i32 4)
|
|
; Offset the indices by the repeating pattern 0,1,2,3 before scattering.
%ind2 = add <8 x i64> %ind, <i64 0, i64 1, i64 2, i64 3, i64 0, i64 1, i64 2, i64 3>
|
|
call void @llvm.x86.avx512.scatter.qpi.mask.512 (i8* %stbuf, i8 %mask, <8 x i64>%ind2, <8 x i32> %x, i32 4)
|
|
ret void
|
|
}
|
|
|
|
;CHECK-LABEL: gather_mask_qq
|
|
;CHECK: kmovw
|
|
;CHECK: vpgatherqq
|
|
;CHECK: vpadd
|
|
;CHECK: vpscatterqq
|
|
;CHECK: ret
|
|
; Masked round trip for 8 x i64 data with 64-bit indices: gathers from %base
; using %ind under the i8 %mask via the qpq intrinsic, then scatters the
; result to %stbuf through the offset indices %ind2 under the same mask.
define void @gather_mask_qq(<8 x i64> %ind, <8 x i64> %src, i8 %mask, i8* %base, i8* %stbuf) {
|
|
%x = call <8 x i64> @llvm.x86.avx512.gather.qpq.mask.512 (<8 x i64> %src, i8 %mask, <8 x i64>%ind, i8* %base, i32 4)
|
|
; Offset the indices by the repeating pattern 0,1,2,3 before scattering.
%ind2 = add <8 x i64> %ind, <i64 0, i64 1, i64 2, i64 3, i64 0, i64 1, i64 2, i64 3>
|
|
call void @llvm.x86.avx512.scatter.qpq.mask.512 (i8* %stbuf, i8 %mask, <8 x i64>%ind2, <8 x i64> %x, i32 4)
|
|
ret void
|
|
}
|
|
|
|
;CHECK-LABEL: gather_mask_dq
|
|
;CHECK: kmovw
|
|
;CHECK: vpgatherdq
|
|
;CHECK: vpadd
|
|
;CHECK: vpscatterdq
|
|
;CHECK: ret
|
|
; Masked round trip for 8 x i64 data with 32-bit indices (<8 x i32>): gathers
; from %base using %ind under the i8 %mask via the dpq intrinsic, then
; scatters the result to %stbuf through the offset indices %ind2.
define void @gather_mask_dq(<8 x i32> %ind, <8 x i64> %src, i8 %mask, i8* %base, i8* %stbuf) {
|
|
%x = call <8 x i64> @llvm.x86.avx512.gather.dpq.mask.512 (<8 x i64> %src, i8 %mask, <8 x i32>%ind, i8* %base, i32 4)
|
|
; Offset the indices by the repeating pattern 0,1,2,3 before scattering.
%ind2 = add <8 x i32> %ind, <i32 0, i32 1, i32 2, i32 3, i32 0, i32 1, i32 2, i32 3>
|
|
call void @llvm.x86.avx512.scatter.dpq.mask.512 (i8* %stbuf, i8 %mask, <8 x i32>%ind2, <8 x i64> %x, i32 4)
|
|
ret void
|
|
}
|
|
|
|
;; FP Intrinsics without masks
|
|
|
|
; Unmasked floating-point gather/scatter intrinsics: same shape as the masked
; forms but without the source-vector and mask operands. Gather takes
; (index vector, base pointer, i32); scatter takes (base pointer, index
; vector, data vector, i32). The trailing i32 is presumably the scale -- confirm.
; NOTE(review): no unmasked dpd (32-bit index, double data) pair is declared
; in this part of the file.
declare <16 x float> @llvm.x86.avx512.gather.dps.512 (<16 x i32>, i8*, i32)
|
|
declare void @llvm.x86.avx512.scatter.dps.512 (i8*, <16 x i32>, <16 x float>, i32)
|
|
declare <8 x float> @llvm.x86.avx512.gather.qps.512 (<8 x i64>, i8*, i32)
|
|
declare void @llvm.x86.avx512.scatter.qps.512 (i8*, <8 x i64>, <8 x float>, i32)
|
|
declare <8 x double> @llvm.x86.avx512.gather.qpd.512 (<8 x i64>, i8*, i32)
|
|
declare void @llvm.x86.avx512.scatter.qpd.512 (i8*, <8 x i64>, <8 x double>, i32)
|
|
|
|
;CHECK-LABEL: gather_dps
|
|
;CHECK: kxnorw
|
|
;CHECK: vgatherdps
|
|
;CHECK: vscatterdps
|
|
;CHECK: ret
|
|
; Unmasked round trip for 16 floats with 32-bit indices: gathers from %base
; using %ind, then scatters the result to %stbuf through the offset indices
; %ind2. No mask is passed in the IR; the FileCheck directives above expect a
; kxnorw, presumably to materialize an all-ones mask register -- confirm.
define void @gather_dps(<16 x i32> %ind, i8* %base, i8* %stbuf) {
|
|
%x = call <16 x float> @llvm.x86.avx512.gather.dps.512 (<16 x i32>%ind, i8* %base, i32 4)
|
|
; Offset the indices by the repeating pattern 0,1,2,3 before scattering.
%ind2 = add <16 x i32> %ind, <i32 0, i32 1, i32 2, i32 3, i32 0, i32 1, i32 2, i32 3, i32 0, i32 1, i32 2, i32 3, i32 0, i32 1, i32 2, i32 3>
|
|
call void @llvm.x86.avx512.scatter.dps.512 (i8* %stbuf, <16 x i32>%ind2, <16 x float> %x, i32 4)
|
|
ret void
|
|
}
|
|
|
|
;CHECK-LABEL: gather_qps
|
|
;CHECK: kxnorw
|
|
;CHECK: vgatherqps
|
|
;CHECK: vscatterqps
|
|
;CHECK: ret
|
|
; Unmasked round trip for 8 floats with 64-bit indices: gathers from %base
; using %ind, then scatters the result to %stbuf through the offset indices
; %ind2. No mask operand appears in the IR.
define void @gather_qps(<8 x i64> %ind, i8* %base, i8* %stbuf) {
|
|
%x = call <8 x float> @llvm.x86.avx512.gather.qps.512 (<8 x i64>%ind, i8* %base, i32 4)
|
|
; Offset the indices by the repeating pattern 0,1,2,3 before scattering.
%ind2 = add <8 x i64> %ind, <i64 0, i64 1, i64 2, i64 3, i64 0, i64 1, i64 2, i64 3>
|
|
call void @llvm.x86.avx512.scatter.qps.512 (i8* %stbuf, <8 x i64>%ind2, <8 x float> %x, i32 4)
|
|
ret void
|
|
}
|
|
|
|
;CHECK-LABEL: gather_qpd
|
|
;CHECK: kxnorw
|
|
;CHECK: vgatherqpd
|
|
;CHECK: vpadd
|
|
;CHECK: vscatterqpd
|
|
;CHECK: ret
|
|
; Unmasked round trip for 8 doubles with 64-bit indices: gathers from %base
; using %ind, then scatters the result to %stbuf through the offset indices
; %ind2. No mask operand appears in the IR.
define void @gather_qpd(<8 x i64> %ind, i8* %base, i8* %stbuf) {
|
|
%x = call <8 x double> @llvm.x86.avx512.gather.qpd.512 (<8 x i64>%ind, i8* %base, i32 4)
|
|
; Offset the indices by the repeating pattern 0,1,2,3 before scattering.
%ind2 = add <8 x i64> %ind, <i64 0, i64 1, i64 2, i64 3, i64 0, i64 1, i64 2, i64 3>
|
|
call void @llvm.x86.avx512.scatter.qpd.512 (i8* %stbuf, <8 x i64>%ind2, <8 x double> %x, i32 4)
|
|
ret void
|
|
}
|
|
|
|
;; Integer Intrinsics without masks
|
|
|
|
; Unmasked integer gather/scatter intrinsics. Gather takes (index vector,
; base pointer, i32); scatter takes (base pointer, index vector, data vector,
; i32). The trailing i32 is presumably the address scale -- confirm.
; Variants indexed by 32-bit elements:
declare <16 x i32> @llvm.x86.avx512.gather.dpi.512 (<16 x i32>, i8*, i32)
|
|
declare void @llvm.x86.avx512.scatter.dpi.512 (i8*, <16 x i32>, <16 x i32>, i32)
|
|
declare <8 x i64> @llvm.x86.avx512.gather.dpq.512 (<8 x i32>, i8*, i32)
|
|
declare void @llvm.x86.avx512.scatter.dpq.512 (i8*, <8 x i32>, <8 x i64>, i32)
|
|
|
|
; Variants indexed by 64-bit elements:
declare <8 x i32> @llvm.x86.avx512.gather.qpi.512 (<8 x i64>, i8*, i32)
|
|
declare void @llvm.x86.avx512.scatter.qpi.512 (i8*, <8 x i64>, <8 x i32>, i32)
|
|
declare <8 x i64> @llvm.x86.avx512.gather.qpq.512 (<8 x i64>, i8*, i32)
|
|
declare void @llvm.x86.avx512.scatter.qpq.512 (i8*, <8 x i64>, <8 x i64>, i32)
|
|
|
|
;CHECK-LABEL: gather_dpi
|
|
;CHECK: kxnorw
|
|
;CHECK: vpgatherdd
|
|
;CHECK: vpscatterdd
|
|
;CHECK: ret
|
|
; Unmasked round trip for 16 x i32 data with 32-bit indices: gathers from
; %base using %ind, then scatters the result to %stbuf through the offset
; indices %ind2. No mask operand appears in the IR.
define void @gather_dpi(<16 x i32> %ind, i8* %base, i8* %stbuf) {
|
|
%x = call <16 x i32> @llvm.x86.avx512.gather.dpi.512 (<16 x i32>%ind, i8* %base, i32 4)
|
|
; Offset the indices by the repeating pattern 0,1,2,3 before scattering.
%ind2 = add <16 x i32> %ind, <i32 0, i32 1, i32 2, i32 3, i32 0, i32 1, i32 2, i32 3, i32 0, i32 1, i32 2, i32 3, i32 0, i32 1, i32 2, i32 3>
|
|
call void @llvm.x86.avx512.scatter.dpi.512 (i8* %stbuf, <16 x i32>%ind2, <16 x i32> %x, i32 4)
|
|
ret void
|
|
}
|
|
|
|
;CHECK-LABEL: gather_qpq
|
|
;CHECK: vpxord %zmm
|
|
;CHECK: kxnorw
|
|
;CHECK: vpgatherqq
|
|
;CHECK: vpadd
|
|
;CHECK: vpscatterqq
|
|
;CHECK: ret
|
|
; Unmasked round trip for 8 x i64 data with 64-bit indices: gathers from
; %base using %ind, then scatters the result to %stbuf through the offset
; indices %ind2. The FileCheck directives above additionally expect a zmm
; vpxord before the gather, presumably zeroing the destination -- confirm.
define void @gather_qpq(<8 x i64> %ind, i8* %base, i8* %stbuf) {
|
|
%x = call <8 x i64> @llvm.x86.avx512.gather.qpq.512 (<8 x i64>%ind, i8* %base, i32 4)
|
|
; Offset the indices by the repeating pattern 0,1,2,3 before scattering.
%ind2 = add <8 x i64> %ind, <i64 0, i64 1, i64 2, i64 3, i64 0, i64 1, i64 2, i64 3>
|
|
call void @llvm.x86.avx512.scatter.qpq.512 (i8* %stbuf, <8 x i64>%ind2, <8 x i64> %x, i32 4)
|
|
ret void
|
|
}
|
|
|
|
;CHECK-LABEL: gather_qpi
|
|
;CHECK: vpxor %ymm
|
|
;CHECK: kxnorw
|
|
;CHECK: vpgatherqd
|
|
;CHECK: vpadd
|
|
;CHECK: vpscatterqd
|
|
;CHECK: ret
|
|
; Unmasked round trip for 8 x i32 data with 64-bit indices: gathers from
; %base using %ind, then scatters the result to %stbuf through the offset
; indices %ind2. The FileCheck directives above additionally expect a ymm
; vpxor before the gather, presumably zeroing the destination -- confirm.
define void @gather_qpi(<8 x i64> %ind, i8* %base, i8* %stbuf) {
|
|
%x = call <8 x i32> @llvm.x86.avx512.gather.qpi.512 (<8 x i64>%ind, i8* %base, i32 4)
|
|
; Offset the indices by the repeating pattern 0,1,2,3 before scattering.
%ind2 = add <8 x i64> %ind, <i64 0, i64 1, i64 2, i64 3, i64 0, i64 1, i64 2, i64 3>
|
|
call void @llvm.x86.avx512.scatter.qpi.512 (i8* %stbuf, <8 x i64>%ind2, <8 x i32> %x, i32 4)
|
|
ret void
|
|
}
|
|
|
|
;CHECK-LABEL: gather_mask_dpd_execdomain
|
|
;CHECK: vgatherdpd
|
|
;CHECK: vmovapd
|
|
;CHECK: ret
|
|
; Masked gather of 8 doubles (32-bit indices) whose result is written to
; %stbuf with an ordinary vector store instead of a scatter.
; NOTE(review): going by the name and the vmovapd expected above, this
; presumably verifies that the move around the gather is selected in the
; double-precision FP execution domain -- confirm.
define void @gather_mask_dpd_execdomain(<8 x i32> %ind, <8 x double> %src, i8 %mask, i8* %base, <8 x double>* %stbuf) {
|
|
%x = call <8 x double> @llvm.x86.avx512.gather.dpd.mask.512 (<8 x double> %src, i8 %mask, <8 x i32>%ind, i8* %base, i32 4)
|
|
; Plain store of the gathered vector; no explicit alignment is given.
store <8 x double> %x, <8 x double>* %stbuf
|
|
ret void
|
|
}
|
|
|
|
;CHECK-LABEL: gather_mask_qpd_execdomain
|
|
;CHECK: vgatherqpd
|
|
;CHECK: vmovapd
|
|
;CHECK: ret
|
|
; Masked gather of 8 doubles (64-bit indices) whose result is written to
; %stbuf with an ordinary vector store instead of a scatter.
; NOTE(review): going by the name and the vmovapd expected above, this
; presumably verifies that the move around the gather is selected in the
; double-precision FP execution domain -- confirm.
define void @gather_mask_qpd_execdomain(<8 x i64> %ind, <8 x double> %src, i8 %mask, i8* %base, <8 x double>* %stbuf) {
|
|
%x = call <8 x double> @llvm.x86.avx512.gather.qpd.mask.512 (<8 x double> %src, i8 %mask, <8 x i64>%ind, i8* %base, i32 4)
|
|
; Plain store of the gathered vector; no explicit alignment is given.
store <8 x double> %x, <8 x double>* %stbuf
|
|
ret void
|
|
}
|
|
|
|
;CHECK-LABEL: gather_mask_dps_execdomain
|
|
;CHECK: vgatherdps
|
|
;CHECK: vmovaps
|
|
;CHECK: ret
|
|
; Masked gather of 16 floats (32-bit indices) whose result is returned
; directly rather than stored or scattered.
; NOTE(review): going by the name and the vmovaps expected above, this
; presumably verifies that the register move of the result is selected in the
; single-precision FP execution domain -- confirm.
define <16 x float> @gather_mask_dps_execdomain(<16 x i32> %ind, <16 x float> %src, i16 %mask, i8* %base) {
|
|
%res = call <16 x float> @llvm.x86.avx512.gather.dps.mask.512 (<16 x float> %src, i16 %mask, <16 x i32>%ind, i8* %base, i32 4)
|
|
ret <16 x float> %res;
|
|
}
|
|
|
|
;CHECK-LABEL: gather_mask_qps_execdomain
|
|
;CHECK: vgatherqps
|
|
;CHECK: vmovaps
|
|
;CHECK: ret
|
|
; Masked gather of 8 floats (64-bit indices) whose result is returned
; directly rather than stored or scattered.
; NOTE(review): going by the name and the vmovaps expected above, this
; presumably verifies that the register move of the result is selected in the
; single-precision FP execution domain -- confirm.
define <8 x float> @gather_mask_qps_execdomain(<8 x i64> %ind, <8 x float> %src, i8 %mask, i8* %base) {
|
|
%res = call <8 x float> @llvm.x86.avx512.gather.qps.mask.512 (<8 x float> %src, i8 %mask, <8 x i64>%ind, i8* %base, i32 4)
|
|
ret <8 x float> %res;
|
|
}
|
|
|
|
;CHECK-LABEL: scatter_mask_dpd_execdomain
|
|
;CHECK: vmovapd
|
|
;CHECK: vscatterdpd
|
|
;CHECK: ret
|
|
; Loads 8 doubles from %src with a 64-byte-aligned vector load and scatters
; them to %stbuf using the 32-bit indices %ind under %mask.
; %base is accepted but not used by the body.
; NOTE(review): going by the name and the vmovapd expected above, this
; presumably verifies that the load feeding the scatter is selected in the
; double-precision FP execution domain -- confirm.
define void @scatter_mask_dpd_execdomain(<8 x i32> %ind, <8 x double>* %src, i8 %mask, i8* %base, i8* %stbuf) {
|
|
%x = load <8 x double>* %src, align 64
|
|
call void @llvm.x86.avx512.scatter.dpd.mask.512 (i8* %stbuf, i8 %mask, <8 x i32>%ind, <8 x double> %x, i32 4)
|
|
ret void
|
|
}
|
|
|
|
;CHECK-LABEL: scatter_mask_qpd_execdomain
|
|
;CHECK: vmovapd
|
|
;CHECK: vscatterqpd
|
|
;CHECK: ret
|
|
; Loads 8 doubles from %src with a 64-byte-aligned vector load and scatters
; them to %stbuf using the 64-bit indices %ind under %mask.
; %base is accepted but not used by the body.
; NOTE(review): going by the name and the vmovapd expected above, this
; presumably verifies that the load feeding the scatter is selected in the
; double-precision FP execution domain -- confirm.
define void @scatter_mask_qpd_execdomain(<8 x i64> %ind, <8 x double>* %src, i8 %mask, i8* %base, i8* %stbuf) {
|
|
%x = load <8 x double>* %src, align 64
|
|
call void @llvm.x86.avx512.scatter.qpd.mask.512 (i8* %stbuf, i8 %mask, <8 x i64>%ind, <8 x double> %x, i32 4)
|
|
ret void
|
|
}
|
|
|
|
;CHECK-LABEL: scatter_mask_dps_execdomain
|
|
;CHECK: vmovaps
|
|
;CHECK: vscatterdps
|
|
;CHECK: ret
|
|
; Loads 16 floats from %src with a 64-byte-aligned vector load and scatters
; them to %stbuf using the 32-bit indices %ind under the i16 %mask.
; %base is accepted but not used by the body.
; NOTE(review): going by the name and the vmovaps expected above, this
; presumably verifies that the load feeding the scatter is selected in the
; single-precision FP execution domain -- confirm.
define void @scatter_mask_dps_execdomain(<16 x i32> %ind, <16 x float>* %src, i16 %mask, i8* %base, i8* %stbuf) {
|
|
%x = load <16 x float>* %src, align 64
|
|
call void @llvm.x86.avx512.scatter.dps.mask.512 (i8* %stbuf, i16 %mask, <16 x i32>%ind, <16 x float> %x, i32 4)
|
|
ret void
|
|
}
|
|
|
|
;CHECK-LABEL: scatter_mask_qps_execdomain
|
|
;CHECK: vmovaps
|
|
;CHECK: vscatterqps
|
|
;CHECK: ret
|
|
; Loads 8 floats from %src and scatters them to %stbuf using the 64-bit
; indices %ind under the i8 %mask. %base is accepted but not used by the body.
; NOTE(review): going by the name and the vmovaps expected above, this
; presumably verifies that the load feeding the scatter is selected in the
; single-precision FP execution domain -- confirm.
define void @scatter_mask_qps_execdomain(<8 x i64> %ind, <8 x float>* %src, i8 %mask, i8* %base, i8* %stbuf) {
|
|
; The load is 32-byte aligned here (the data vector is <8 x float>), unlike
; the 64-byte alignment used by the other scatter execdomain tests.
%x = load <8 x float>* %src, align 32
|
|
call void @llvm.x86.avx512.scatter.qps.mask.512 (i8* %stbuf, i8 %mask, <8 x i64>%ind, <8 x float> %x, i32 4)
|
|
ret void
|
|
}
|