mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-08-09 11:25:55 +00:00
Fix AVX2 Gather execution domains.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@204713 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
@@ -8791,12 +8791,18 @@ multiclass avx2_gather<bits<8> opc, string OpcodeStr, RegisterClass RC256,
|
|||||||
let mayLoad = 1, Constraints
|
let mayLoad = 1, Constraints
|
||||||
= "@earlyclobber $dst,@earlyclobber $mask_wb, $src1 = $dst, $mask = $mask_wb"
|
= "@earlyclobber $dst,@earlyclobber $mask_wb, $src1 = $dst, $mask = $mask_wb"
|
||||||
in {
|
in {
|
||||||
defm VGATHERDPD : avx2_gather<0x92, "vgatherdpd", VR256, vx64mem, vx64mem>, VEX_W;
|
|
||||||
defm VGATHERQPD : avx2_gather<0x93, "vgatherqpd", VR256, vx64mem, vy64mem>, VEX_W;
|
|
||||||
defm VGATHERDPS : avx2_gather<0x92, "vgatherdps", VR256, vx32mem, vy32mem>;
|
|
||||||
defm VGATHERQPS : avx2_gather<0x93, "vgatherqps", VR128, vx32mem, vy32mem>;
|
|
||||||
defm VPGATHERDQ : avx2_gather<0x90, "vpgatherdq", VR256, vx64mem, vx64mem>, VEX_W;
|
defm VPGATHERDQ : avx2_gather<0x90, "vpgatherdq", VR256, vx64mem, vx64mem>, VEX_W;
|
||||||
defm VPGATHERQQ : avx2_gather<0x91, "vpgatherqq", VR256, vx64mem, vy64mem>, VEX_W;
|
defm VPGATHERQQ : avx2_gather<0x91, "vpgatherqq", VR256, vx64mem, vy64mem>, VEX_W;
|
||||||
defm VPGATHERDD : avx2_gather<0x90, "vpgatherdd", VR256, vx32mem, vy32mem>;
|
defm VPGATHERDD : avx2_gather<0x90, "vpgatherdd", VR256, vx32mem, vy32mem>;
|
||||||
defm VPGATHERQD : avx2_gather<0x91, "vpgatherqd", VR128, vx32mem, vy32mem>;
|
defm VPGATHERQD : avx2_gather<0x91, "vpgatherqd", VR128, vx32mem, vy32mem>;
|
||||||
|
|
||||||
|
let ExeDomain = SSEPackedDouble in {
|
||||||
|
defm VGATHERDPD : avx2_gather<0x92, "vgatherdpd", VR256, vx64mem, vx64mem>, VEX_W;
|
||||||
|
defm VGATHERQPD : avx2_gather<0x93, "vgatherqpd", VR256, vx64mem, vy64mem>, VEX_W;
|
||||||
|
}
|
||||||
|
|
||||||
|
let ExeDomain = SSEPackedSingle in {
|
||||||
|
defm VGATHERDPS : avx2_gather<0x92, "vgatherdps", VR256, vx32mem, vy32mem>;
|
||||||
|
defm VGATHERQPS : avx2_gather<0x93, "vgatherqps", VR128, vx32mem, vy32mem>;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
@@ -15,4 +15,20 @@ define <4 x float> @test_x86_avx2_gather_d_ps(i8* %a1,
|
|||||||
; CHECK: vgatherdps
|
; CHECK: vgatherdps
|
||||||
; CHECK-NOT: [[DST]]
|
; CHECK-NOT: [[DST]]
|
||||||
; CHECK: [[DST:%xmm[0-9]+]]{{$}}
|
; CHECK: [[DST:%xmm[0-9]+]]{{$}}
|
||||||
|
; CHECK: vmovaps
|
||||||
|
; CHECK: ret
|
||||||
|
|
||||||
|
declare <2 x double> @llvm.x86.avx2.gather.d.pd(<2 x double>, i8*,
|
||||||
|
<4 x i32>, <2 x double>, i8) nounwind readonly
|
||||||
|
|
||||||
|
define <2 x double> @test_x86_avx2_gather_d_pd(i8* %a1,
|
||||||
|
<4 x i32> %idx, <2 x double> %mask) {
|
||||||
|
%res = call <2 x double> @llvm.x86.avx2.gather.d.pd(<2 x double> undef,
|
||||||
|
i8* %a1, <4 x i32> %idx, <2 x double> %mask, i8 2) ;
|
||||||
|
ret <2 x double> %res
|
||||||
|
}
|
||||||
|
|
||||||
|
; CHECK: test_x86_avx2_gather_d_pd
|
||||||
|
; CHECK: vgatherdpd
|
||||||
|
; CHECK: vmovapd
|
||||||
; CHECK: ret
|
; CHECK: ret
|
||||||
|
@@ -1142,7 +1142,7 @@ define <8 x float> @test_gather_mask(<8 x float> %a0, float* %a,
|
|||||||
<8 x i32> %idx, <8 x float> %mask,
|
<8 x i32> %idx, <8 x float> %mask,
|
||||||
float* nocapture %out) {
|
float* nocapture %out) {
|
||||||
; CHECK: test_gather_mask
|
; CHECK: test_gather_mask
|
||||||
; CHECK: vmovdqa %ymm2, [[DEST:%.*]]
|
; CHECK: vmovaps %ymm2, [[DEST:%.*]]
|
||||||
; CHECK: vgatherdps [[DEST]]
|
; CHECK: vgatherdps [[DEST]]
|
||||||
;; gather with mask
|
;; gather with mask
|
||||||
%a_i8 = bitcast float* %a to i8*
|
%a_i8 = bitcast float* %a to i8*
|
||||||
|
Reference in New Issue
Block a user