mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2024-12-14 11:32:34 +00:00
8f32e5f0d6
Summary: Initially, these intrinsics seemed like part of a family of "frame" related intrinsics, but now I think that's more confusing than helpful. Initially, the LangRef specified that this would create a new kind of allocation that would be allocated at a fixed offset from the frame pointer (EBP/RBP). We ended up dropping that design, and leaving the stack frame layout alone. These intrinsics are really about sharing local stack allocations, not frame pointers. I intend to go further and add an `llvm.localaddress()` intrinsic that returns whatever register (EBP, ESI, ESP, RBX) is being used to address locals, which should not be confused with the frame pointer. Naming suggestions at this point are welcome, I'm happy to re-run sed. Reviewers: majnemer, nicholas Subscribers: llvm-commits Differential Revision: http://reviews.llvm.org/D11011 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@241633 91177308-0d34-0410-b5e6-96231b3b80d8
5343 lines
280 KiB
TableGen
5343 lines
280 KiB
TableGen
//===- IntrinsicsX86.td - Defines X86 intrinsics -----------*- tablegen -*-===//
|
|
//
|
|
// The LLVM Compiler Infrastructure
|
|
//
|
|
// This file is distributed under the University of Illinois Open Source
|
|
// License. See LICENSE.TXT for details.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This file defines all of the X86-specific intrinsics.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// Interrupt traps
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_int : Intrinsic<[], [llvm_i8_ty]>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// SEH intrinsics for Windows
|
|
let TargetPrefix = "x86" in {
|
|
def int_x86_seh_lsda : Intrinsic<[llvm_ptr_ty], [llvm_ptr_ty], [IntrNoMem]>;
|
|
|
|
// Restores the frame, base, and stack pointers as necessary after recovering
|
|
// from an exception. Any block resuming control flow in the parent function
|
|
// should call this before accessing any stack memory.
|
|
def int_x86_seh_restoreframe : Intrinsic<[], [], []>;
|
|
|
|
// Given a pointer to the end of an EH registration object, returns the true
|
|
// parent frame address that can be used with llvm.localrecover.
|
|
def int_x86_seh_recoverfp : Intrinsic<[llvm_ptr_ty],
|
|
[llvm_ptr_ty, llvm_ptr_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// Read Time Stamp Counter.
|
|
let TargetPrefix = "x86" in {
|
|
def int_x86_rdtsc : GCCBuiltin<"__builtin_ia32_rdtsc">,
|
|
Intrinsic<[llvm_i64_ty], [], []>;
|
|
def int_x86_rdtscp : GCCBuiltin<"__builtin_ia32_rdtscp">,
|
|
Intrinsic<[llvm_i64_ty], [llvm_ptr_ty], [IntrReadWriteArgMem]>;
|
|
}
|
|
|
|
// Read Performance-Monitoring Counter.
|
|
let TargetPrefix = "x86" in {
|
|
def int_x86_rdpmc : GCCBuiltin<"__builtin_ia32_rdpmc">,
|
|
Intrinsic<[llvm_i64_ty], [llvm_i32_ty], []>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// 3DNow!
|
|
|
|
let TargetPrefix = "x86" in {
|
|
def int_x86_3dnow_pavgusb : GCCBuiltin<"__builtin_ia32_pavgusb">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_3dnow_pf2id : GCCBuiltin<"__builtin_ia32_pf2id">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_3dnow_pfacc : GCCBuiltin<"__builtin_ia32_pfacc">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_3dnow_pfadd : GCCBuiltin<"__builtin_ia32_pfadd">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_3dnow_pfcmpeq : GCCBuiltin<"__builtin_ia32_pfcmpeq">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_3dnow_pfcmpge : GCCBuiltin<"__builtin_ia32_pfcmpge">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_3dnow_pfcmpgt : GCCBuiltin<"__builtin_ia32_pfcmpgt">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_3dnow_pfmax : GCCBuiltin<"__builtin_ia32_pfmax">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_3dnow_pfmin : GCCBuiltin<"__builtin_ia32_pfmin">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_3dnow_pfmul : GCCBuiltin<"__builtin_ia32_pfmul">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_3dnow_pfrcp : GCCBuiltin<"__builtin_ia32_pfrcp">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_3dnow_pfrcpit1 : GCCBuiltin<"__builtin_ia32_pfrcpit1">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_3dnow_pfrcpit2 : GCCBuiltin<"__builtin_ia32_pfrcpit2">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_3dnow_pfrsqrt : GCCBuiltin<"__builtin_ia32_pfrsqrt">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_3dnow_pfrsqit1 : GCCBuiltin<"__builtin_ia32_pfrsqit1">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_3dnow_pfsub : GCCBuiltin<"__builtin_ia32_pfsub">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_3dnow_pfsubr : GCCBuiltin<"__builtin_ia32_pfsubr">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_3dnow_pi2fd : GCCBuiltin<"__builtin_ia32_pi2fd">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_3dnow_pmulhrw : GCCBuiltin<"__builtin_ia32_pmulhrw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// 3DNow! extensions
|
|
|
|
let TargetPrefix = "x86" in {
|
|
def int_x86_3dnowa_pf2iw : GCCBuiltin<"__builtin_ia32_pf2iw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_3dnowa_pfnacc : GCCBuiltin<"__builtin_ia32_pfnacc">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_3dnowa_pfpnacc : GCCBuiltin<"__builtin_ia32_pfpnacc">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_3dnowa_pi2fw : GCCBuiltin<"__builtin_ia32_pi2fw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_3dnowa_pswapd :
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// SSE1
|
|
|
|
// Arithmetic ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse_add_ss : GCCBuiltin<"__builtin_ia32_addss">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_sub_ss : GCCBuiltin<"__builtin_ia32_subss">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_mul_ss : GCCBuiltin<"__builtin_ia32_mulss">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_div_ss : GCCBuiltin<"__builtin_ia32_divss">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_sqrt_ss : GCCBuiltin<"__builtin_ia32_sqrtss">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse_sqrt_ps : GCCBuiltin<"__builtin_ia32_sqrtps">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse_rcp_ss : GCCBuiltin<"__builtin_ia32_rcpss">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse_rcp_ps : GCCBuiltin<"__builtin_ia32_rcpps">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse_rsqrt_ss : GCCBuiltin<"__builtin_ia32_rsqrtss">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse_rsqrt_ps : GCCBuiltin<"__builtin_ia32_rsqrtps">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse_min_ss : GCCBuiltin<"__builtin_ia32_minss">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_min_ps : GCCBuiltin<"__builtin_ia32_minps">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_max_ss : GCCBuiltin<"__builtin_ia32_maxss">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_max_ps : GCCBuiltin<"__builtin_ia32_maxps">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Comparison ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse_cmp_ss : GCCBuiltin<"__builtin_ia32_cmpss">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_sse_cmp_ps : GCCBuiltin<"__builtin_ia32_cmpps">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_sse_comieq_ss : GCCBuiltin<"__builtin_ia32_comieq">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_comilt_ss : GCCBuiltin<"__builtin_ia32_comilt">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_comile_ss : GCCBuiltin<"__builtin_ia32_comile">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_comigt_ss : GCCBuiltin<"__builtin_ia32_comigt">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_comige_ss : GCCBuiltin<"__builtin_ia32_comige">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_comineq_ss : GCCBuiltin<"__builtin_ia32_comineq">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_ucomieq_ss : GCCBuiltin<"__builtin_ia32_ucomieq">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_ucomilt_ss : GCCBuiltin<"__builtin_ia32_ucomilt">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_ucomile_ss : GCCBuiltin<"__builtin_ia32_ucomile">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_ucomigt_ss : GCCBuiltin<"__builtin_ia32_ucomigt">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_ucomige_ss : GCCBuiltin<"__builtin_ia32_ucomige">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_ucomineq_ss : GCCBuiltin<"__builtin_ia32_ucomineq">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
|
|
// Conversion ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse_cvtss2si : GCCBuiltin<"__builtin_ia32_cvtss2si">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_cvtss2si64 : GCCBuiltin<"__builtin_ia32_cvtss2si64">,
|
|
Intrinsic<[llvm_i64_ty], [llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_cvttss2si : GCCBuiltin<"__builtin_ia32_cvttss2si">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_cvttss2si64 : GCCBuiltin<"__builtin_ia32_cvttss2si64">,
|
|
Intrinsic<[llvm_i64_ty], [llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_cvtsi2ss : GCCBuiltin<"__builtin_ia32_cvtsi2ss">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_cvtsi642ss : GCCBuiltin<"__builtin_ia32_cvtsi642ss">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_i64_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_sse_cvtps2pi : GCCBuiltin<"__builtin_ia32_cvtps2pi">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_cvttps2pi: GCCBuiltin<"__builtin_ia32_cvttps2pi">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_cvtpi2ps : GCCBuiltin<"__builtin_ia32_cvtpi2ps">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// SIMD store ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse_storeu_ps : GCCBuiltin<"__builtin_ia32_storeups">,
|
|
Intrinsic<[], [llvm_ptr_ty,
|
|
llvm_v4f32_ty], [IntrReadWriteArgMem]>;
|
|
}
|
|
|
|
// Cacheability support ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse_sfence : GCCBuiltin<"__builtin_ia32_sfence">,
|
|
Intrinsic<[], [], []>;
|
|
}
|
|
|
|
// Control register.
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse_stmxcsr :
|
|
Intrinsic<[], [llvm_ptr_ty], []>;
|
|
def int_x86_sse_ldmxcsr :
|
|
Intrinsic<[], [llvm_ptr_ty], []>;
|
|
}
|
|
|
|
// Misc.
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse_movmsk_ps : GCCBuiltin<"__builtin_ia32_movmskps">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f32_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// SSE2
|
|
|
|
// FP arithmetic ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse2_add_sd : GCCBuiltin<"__builtin_ia32_addsd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_sub_sd : GCCBuiltin<"__builtin_ia32_subsd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_mul_sd : GCCBuiltin<"__builtin_ia32_mulsd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_div_sd : GCCBuiltin<"__builtin_ia32_divsd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_sqrt_sd : GCCBuiltin<"__builtin_ia32_sqrtsd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse2_sqrt_pd : GCCBuiltin<"__builtin_ia32_sqrtpd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse2_min_sd : GCCBuiltin<"__builtin_ia32_minsd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_min_pd : GCCBuiltin<"__builtin_ia32_minpd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_max_sd : GCCBuiltin<"__builtin_ia32_maxsd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_max_pd : GCCBuiltin<"__builtin_ia32_maxpd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// FP comparison ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse2_cmp_sd : GCCBuiltin<"__builtin_ia32_cmpsd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_cmp_pd : GCCBuiltin<"__builtin_ia32_cmppd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_comieq_sd : GCCBuiltin<"__builtin_ia32_comisdeq">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_comilt_sd : GCCBuiltin<"__builtin_ia32_comisdlt">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_comile_sd : GCCBuiltin<"__builtin_ia32_comisdle">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_comigt_sd : GCCBuiltin<"__builtin_ia32_comisdgt">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_comige_sd : GCCBuiltin<"__builtin_ia32_comisdge">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_comineq_sd : GCCBuiltin<"__builtin_ia32_comisdneq">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_ucomieq_sd : GCCBuiltin<"__builtin_ia32_ucomisdeq">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_ucomilt_sd : GCCBuiltin<"__builtin_ia32_ucomisdlt">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_ucomile_sd : GCCBuiltin<"__builtin_ia32_ucomisdle">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_ucomigt_sd : GCCBuiltin<"__builtin_ia32_ucomisdgt">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_ucomige_sd : GCCBuiltin<"__builtin_ia32_ucomisdge">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_ucomineq_sd : GCCBuiltin<"__builtin_ia32_ucomisdneq">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Integer arithmetic ops.
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse2_padds_b : GCCBuiltin<"__builtin_ia32_paddsb128">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty,
|
|
llvm_v16i8_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_sse2_padds_w : GCCBuiltin<"__builtin_ia32_paddsw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_sse2_paddus_b : GCCBuiltin<"__builtin_ia32_paddusb128">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty,
|
|
llvm_v16i8_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_sse2_paddus_w : GCCBuiltin<"__builtin_ia32_paddusw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_sse2_psubs_b : GCCBuiltin<"__builtin_ia32_psubsb128">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty,
|
|
llvm_v16i8_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_psubs_w : GCCBuiltin<"__builtin_ia32_psubsw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_psubus_b : GCCBuiltin<"__builtin_ia32_psubusb128">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty,
|
|
llvm_v16i8_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_psubus_w : GCCBuiltin<"__builtin_ia32_psubusw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_pmulhu_w : GCCBuiltin<"__builtin_ia32_pmulhuw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_sse2_pmulh_w : GCCBuiltin<"__builtin_ia32_pmulhw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_sse2_pmulu_dq : GCCBuiltin<"__builtin_ia32_pmuludq128">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v4i32_ty,
|
|
llvm_v4i32_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_sse2_pmadd_wd : GCCBuiltin<"__builtin_ia32_pmaddwd128">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v8i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_sse2_pavg_b : GCCBuiltin<"__builtin_ia32_pavgb128">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty,
|
|
llvm_v16i8_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_sse2_pavg_w : GCCBuiltin<"__builtin_ia32_pavgw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_sse2_pmaxu_b : GCCBuiltin<"__builtin_ia32_pmaxub128">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty,
|
|
llvm_v16i8_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_sse2_pmaxs_w : GCCBuiltin<"__builtin_ia32_pmaxsw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_sse2_pminu_b : GCCBuiltin<"__builtin_ia32_pminub128">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty,
|
|
llvm_v16i8_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_sse2_pmins_w : GCCBuiltin<"__builtin_ia32_pminsw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_sse2_psad_bw : GCCBuiltin<"__builtin_ia32_psadbw128">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v16i8_ty,
|
|
llvm_v16i8_ty], [IntrNoMem, Commutative]>;
|
|
}
|
|
|
|
// Integer shift ops.
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse2_psll_w : GCCBuiltin<"__builtin_ia32_psllw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_psll_d : GCCBuiltin<"__builtin_ia32_pslld128">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty,
|
|
llvm_v4i32_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_psll_q : GCCBuiltin<"__builtin_ia32_psllq128">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty,
|
|
llvm_v2i64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_psrl_w : GCCBuiltin<"__builtin_ia32_psrlw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_psrl_d : GCCBuiltin<"__builtin_ia32_psrld128">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty,
|
|
llvm_v4i32_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_psrl_q : GCCBuiltin<"__builtin_ia32_psrlq128">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty,
|
|
llvm_v2i64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_psra_w : GCCBuiltin<"__builtin_ia32_psraw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_psra_d : GCCBuiltin<"__builtin_ia32_psrad128">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty,
|
|
llvm_v4i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_sse2_pslli_w : GCCBuiltin<"__builtin_ia32_psllwi128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_pslli_d : GCCBuiltin<"__builtin_ia32_pslldi128">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_pslli_q : GCCBuiltin<"__builtin_ia32_psllqi128">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_psrli_w : GCCBuiltin<"__builtin_ia32_psrlwi128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_psrli_d : GCCBuiltin<"__builtin_ia32_psrldi128">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_psrli_q : GCCBuiltin<"__builtin_ia32_psrlqi128">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_psrai_w : GCCBuiltin<"__builtin_ia32_psrawi128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_psrai_d : GCCBuiltin<"__builtin_ia32_psradi128">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Conversion ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse2_cvtdq2pd : GCCBuiltin<"__builtin_ia32_cvtdq2pd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v4i32_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_cvtdq2ps : GCCBuiltin<"__builtin_ia32_cvtdq2ps">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4i32_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_cvtpd2dq : GCCBuiltin<"__builtin_ia32_cvtpd2dq">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_cvttpd2dq : GCCBuiltin<"__builtin_ia32_cvttpd2dq">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_cvtpd2ps : GCCBuiltin<"__builtin_ia32_cvtpd2ps">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_cvtps2dq : GCCBuiltin<"__builtin_ia32_cvtps2dq">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_cvttps2dq : GCCBuiltin<"__builtin_ia32_cvttps2dq">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_cvtps2pd : GCCBuiltin<"__builtin_ia32_cvtps2pd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_cvtsd2si : GCCBuiltin<"__builtin_ia32_cvtsd2si">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_cvtsd2si64 : GCCBuiltin<"__builtin_ia32_cvtsd2si64">,
|
|
Intrinsic<[llvm_i64_ty], [llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_cvttsd2si : GCCBuiltin<"__builtin_ia32_cvttsd2si">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_cvttsd2si64 : GCCBuiltin<"__builtin_ia32_cvttsd2si64">,
|
|
Intrinsic<[llvm_i64_ty], [llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_cvtsi2sd : GCCBuiltin<"__builtin_ia32_cvtsi2sd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_cvtsi642sd : GCCBuiltin<"__builtin_ia32_cvtsi642sd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty,
|
|
llvm_i64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_cvtsd2ss : GCCBuiltin<"__builtin_ia32_cvtsd2ss">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_cvtss2sd : GCCBuiltin<"__builtin_ia32_cvtss2sd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse_cvtpd2pi : GCCBuiltin<"__builtin_ia32_cvtpd2pi">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse_cvttpd2pi: GCCBuiltin<"__builtin_ia32_cvttpd2pi">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse_cvtpi2pd : GCCBuiltin<"__builtin_ia32_cvtpi2pd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_x86mmx_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// SIMD store ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse2_storeu_pd : GCCBuiltin<"__builtin_ia32_storeupd">,
|
|
Intrinsic<[], [llvm_ptr_ty,
|
|
llvm_v2f64_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_sse2_storeu_dq : GCCBuiltin<"__builtin_ia32_storedqu">,
|
|
Intrinsic<[], [llvm_ptr_ty,
|
|
llvm_v16i8_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_sse2_storel_dq : GCCBuiltin<"__builtin_ia32_storelv4si">,
|
|
Intrinsic<[], [llvm_ptr_ty,
|
|
llvm_v4i32_ty], [IntrReadWriteArgMem]>;
|
|
}
|
|
|
|
// Misc.
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse2_packsswb_128 : GCCBuiltin<"__builtin_ia32_packsswb128">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v8i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_packssdw_128 : GCCBuiltin<"__builtin_ia32_packssdw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v4i32_ty,
|
|
llvm_v4i32_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_packuswb_128 : GCCBuiltin<"__builtin_ia32_packuswb128">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v8i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_movmsk_pd : GCCBuiltin<"__builtin_ia32_movmskpd">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_pmovmskb_128 : GCCBuiltin<"__builtin_ia32_pmovmskb128">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v16i8_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_maskmov_dqu : GCCBuiltin<"__builtin_ia32_maskmovdqu">,
|
|
Intrinsic<[], [llvm_v16i8_ty,
|
|
llvm_v16i8_ty, llvm_ptr_ty], []>;
|
|
def int_x86_sse2_clflush : GCCBuiltin<"__builtin_ia32_clflush">,
|
|
Intrinsic<[], [llvm_ptr_ty], []>;
|
|
def int_x86_sse2_lfence : GCCBuiltin<"__builtin_ia32_lfence">,
|
|
Intrinsic<[], [], []>;
|
|
def int_x86_sse2_mfence : GCCBuiltin<"__builtin_ia32_mfence">,
|
|
Intrinsic<[], [], []>;
|
|
def int_x86_sse2_pause : GCCBuiltin<"__builtin_ia32_pause">,
|
|
Intrinsic<[], [], []>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// SSE3
|
|
|
|
// Addition / subtraction ops.
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse3_addsub_ps : GCCBuiltin<"__builtin_ia32_addsubps">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse3_addsub_pd : GCCBuiltin<"__builtin_ia32_addsubpd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Horizontal ops.
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse3_hadd_ps : GCCBuiltin<"__builtin_ia32_haddps">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse3_hadd_pd : GCCBuiltin<"__builtin_ia32_haddpd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_sse3_hsub_ps : GCCBuiltin<"__builtin_ia32_hsubps">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_sse3_hsub_pd : GCCBuiltin<"__builtin_ia32_hsubpd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Specialized unaligned load.
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse3_ldu_dq : GCCBuiltin<"__builtin_ia32_lddqu">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_ptr_ty], [IntrReadMem]>;
|
|
}
|
|
|
|
// Thread synchronization ops.
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse3_monitor : GCCBuiltin<"__builtin_ia32_monitor">,
|
|
Intrinsic<[], [llvm_ptr_ty,
|
|
llvm_i32_ty, llvm_i32_ty], []>;
|
|
def int_x86_sse3_mwait : GCCBuiltin<"__builtin_ia32_mwait">,
|
|
Intrinsic<[], [llvm_i32_ty,
|
|
llvm_i32_ty], []>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// SSSE3
|
|
|
|
// Horizontal arithmetic ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_ssse3_phadd_w : GCCBuiltin<"__builtin_ia32_phaddw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_ssse3_phadd_w_128 : GCCBuiltin<"__builtin_ia32_phaddw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_ssse3_phadd_d : GCCBuiltin<"__builtin_ia32_phaddd">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_ssse3_phadd_d_128 : GCCBuiltin<"__builtin_ia32_phaddd128">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty,
|
|
llvm_v4i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_ssse3_phadd_sw : GCCBuiltin<"__builtin_ia32_phaddsw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_ssse3_phadd_sw_128 : GCCBuiltin<"__builtin_ia32_phaddsw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_ssse3_phsub_w : GCCBuiltin<"__builtin_ia32_phsubw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_ssse3_phsub_w_128 : GCCBuiltin<"__builtin_ia32_phsubw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_ssse3_phsub_d : GCCBuiltin<"__builtin_ia32_phsubd">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_ssse3_phsub_d_128 : GCCBuiltin<"__builtin_ia32_phsubd128">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty,
|
|
llvm_v4i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_ssse3_phsub_sw : GCCBuiltin<"__builtin_ia32_phsubsw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_ssse3_phsub_sw_128 : GCCBuiltin<"__builtin_ia32_phsubsw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_ssse3_pmadd_ub_sw : GCCBuiltin<"__builtin_ia32_pmaddubsw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_ssse3_pmadd_ub_sw_128 : GCCBuiltin<"__builtin_ia32_pmaddubsw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v16i8_ty,
|
|
llvm_v16i8_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Packed multiply high with round and scale
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_ssse3_pmul_hr_sw : GCCBuiltin<"__builtin_ia32_pmulhrsw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_ssse3_pmul_hr_sw_128 : GCCBuiltin<"__builtin_ia32_pmulhrsw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem, Commutative]>;
|
|
}
|
|
|
|
// Shuffle ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_ssse3_pshuf_b : GCCBuiltin<"__builtin_ia32_pshufb">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_ssse3_pshuf_b_128 : GCCBuiltin<"__builtin_ia32_pshufb128">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty,
|
|
llvm_v16i8_ty], [IntrNoMem]>;
|
|
def int_x86_sse2_pshuf_d : GCCBuiltin<"__builtin_ia32_pshufd">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse2_pshufl_w : GCCBuiltin<"__builtin_ia32_pshuflw">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse2_pshufh_w : GCCBuiltin<"__builtin_ia32_pshufhw">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse_pshuf_w : GCCBuiltin<"__builtin_ia32_pshufw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
|
|
// Sign ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_ssse3_psign_b : GCCBuiltin<"__builtin_ia32_psignb">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_ssse3_psign_b_128 : GCCBuiltin<"__builtin_ia32_psignb128">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty,
|
|
llvm_v16i8_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_ssse3_psign_w : GCCBuiltin<"__builtin_ia32_psignw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_ssse3_psign_w_128 : GCCBuiltin<"__builtin_ia32_psignw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_ssse3_psign_d : GCCBuiltin<"__builtin_ia32_psignd">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_ssse3_psign_d_128 : GCCBuiltin<"__builtin_ia32_psignd128">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty,
|
|
llvm_v4i32_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Absolute value ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_ssse3_pabs_b : GCCBuiltin<"__builtin_ia32_pabsb">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_ssse3_pabs_b_128 : GCCBuiltin<"__builtin_ia32_pabsb128">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_ssse3_pabs_w : GCCBuiltin<"__builtin_ia32_pabsw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_ssse3_pabs_w_128 : GCCBuiltin<"__builtin_ia32_pabsw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_ssse3_pabs_d : GCCBuiltin<"__builtin_ia32_pabsd">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_ssse3_pabs_d_128 : GCCBuiltin<"__builtin_ia32_pabsd128">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// SSE4.1
|
|
|
|
// FP rounding ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse41_round_ss : GCCBuiltin<"__builtin_ia32_roundss">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_sse41_round_ps : GCCBuiltin<"__builtin_ia32_roundps">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_sse41_round_sd : GCCBuiltin<"__builtin_ia32_roundsd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_sse41_round_pd : GCCBuiltin<"__builtin_ia32_roundpd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Vector sign and zero extend
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse41_pmovsxbd : GCCBuiltin<"__builtin_ia32_pmovsxbd128">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v16i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse41_pmovsxbq : GCCBuiltin<"__builtin_ia32_pmovsxbq128">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v16i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse41_pmovsxbw : GCCBuiltin<"__builtin_ia32_pmovsxbw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v16i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse41_pmovsxdq : GCCBuiltin<"__builtin_ia32_pmovsxdq128">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v4i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse41_pmovsxwd : GCCBuiltin<"__builtin_ia32_pmovsxwd128">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v8i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse41_pmovsxwq : GCCBuiltin<"__builtin_ia32_pmovsxwq128">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v8i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse41_pmovzxbd : GCCBuiltin<"__builtin_ia32_pmovzxbd128">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v16i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse41_pmovzxbq : GCCBuiltin<"__builtin_ia32_pmovzxbq128">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v16i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse41_pmovzxbw : GCCBuiltin<"__builtin_ia32_pmovzxbw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v16i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse41_pmovzxdq : GCCBuiltin<"__builtin_ia32_pmovzxdq128">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v4i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse41_pmovzxwd : GCCBuiltin<"__builtin_ia32_pmovzxwd128">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v8i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse41_pmovzxwq : GCCBuiltin<"__builtin_ia32_pmovzxwq128">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v8i16_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
|
|
// Vector min element
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse41_phminposuw : GCCBuiltin<"__builtin_ia32_phminposuw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
|
|
// Vector compare, min, max
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse41_pmaxsb : GCCBuiltin<"__builtin_ia32_pmaxsb128">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty, llvm_v16i8_ty],
|
|
[IntrNoMem, Commutative]>;
|
|
def int_x86_sse41_pmaxsd : GCCBuiltin<"__builtin_ia32_pmaxsd128">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty],
|
|
[IntrNoMem, Commutative]>;
|
|
def int_x86_sse41_pmaxud : GCCBuiltin<"__builtin_ia32_pmaxud128">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty],
|
|
[IntrNoMem, Commutative]>;
|
|
def int_x86_sse41_pmaxuw : GCCBuiltin<"__builtin_ia32_pmaxuw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_v8i16_ty],
|
|
[IntrNoMem, Commutative]>;
|
|
def int_x86_sse41_pminsb : GCCBuiltin<"__builtin_ia32_pminsb128">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty, llvm_v16i8_ty],
|
|
[IntrNoMem, Commutative]>;
|
|
def int_x86_sse41_pminsd : GCCBuiltin<"__builtin_ia32_pminsd128">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty],
|
|
[IntrNoMem, Commutative]>;
|
|
def int_x86_sse41_pminud : GCCBuiltin<"__builtin_ia32_pminud128">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty],
|
|
[IntrNoMem, Commutative]>;
|
|
def int_x86_sse41_pminuw : GCCBuiltin<"__builtin_ia32_pminuw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_v8i16_ty],
|
|
[IntrNoMem, Commutative]>;
|
|
}
|
|
|
|
// Advanced Encryption Standard (AES) Instructions
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_aesni_aesimc : GCCBuiltin<"__builtin_ia32_aesimc128">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_aesni_aesenc : GCCBuiltin<"__builtin_ia32_aesenc128">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_aesni_aesenclast : GCCBuiltin<"__builtin_ia32_aesenclast128">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_aesni_aesdec : GCCBuiltin<"__builtin_ia32_aesdec128">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_aesni_aesdeclast : GCCBuiltin<"__builtin_ia32_aesdeclast128">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_aesni_aeskeygenassist :
|
|
GCCBuiltin<"__builtin_ia32_aeskeygenassist128">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
|
|
// PCLMUL instruction
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_pclmulqdq : GCCBuiltin<"__builtin_ia32_pclmulqdq128">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
|
|
// Vector pack
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse41_packusdw : GCCBuiltin<"__builtin_ia32_packusdw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v4i32_ty, llvm_v4i32_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
|
|
// Vector multiply
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse41_pmuldq : GCCBuiltin<"__builtin_ia32_pmuldq128">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v4i32_ty, llvm_v4i32_ty],
|
|
[IntrNoMem, Commutative]>;
|
|
}
|
|
|
|
// Vector extract
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse41_pextrb :
|
|
Intrinsic<[llvm_i32_ty], [llvm_v16i8_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse41_pextrd :
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4i32_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse41_pextrq :
|
|
Intrinsic<[llvm_i64_ty], [llvm_v2i64_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse41_extractps : GCCBuiltin<"__builtin_ia32_extractps128">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f32_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
|
|
// Vector insert
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse41_insertps : GCCBuiltin<"__builtin_ia32_insertps128">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
|
|
// Vector blend
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse41_pblendvb : GCCBuiltin<"__builtin_ia32_pblendvb128">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty, llvm_v16i8_ty,llvm_v16i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse41_blendvpd : GCCBuiltin<"__builtin_ia32_blendvpd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,llvm_v2f64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse41_blendvps : GCCBuiltin<"__builtin_ia32_blendvps">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,llvm_v4f32_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
|
|
// Vector dot product
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse41_dppd : GCCBuiltin<"__builtin_ia32_dppd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty, llvm_i8_ty],
|
|
[IntrNoMem, Commutative]>;
|
|
def int_x86_sse41_dpps : GCCBuiltin<"__builtin_ia32_dpps">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty, llvm_i8_ty],
|
|
[IntrNoMem, Commutative]>;
|
|
}
|
|
|
|
// Vector sum of absolute differences
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse41_mpsadbw : GCCBuiltin<"__builtin_ia32_mpsadbw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v16i8_ty, llvm_v16i8_ty,llvm_i8_ty],
|
|
[IntrNoMem, Commutative]>;
|
|
}
|
|
|
|
// Cacheability support ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse41_movntdqa : GCCBuiltin<"__builtin_ia32_movntdqa">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_ptr_ty], [IntrReadMem]>;
|
|
}
|
|
|
|
// Test instruction with bitwise comparison.
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse41_ptestz : GCCBuiltin<"__builtin_ia32_ptestz128">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2i64_ty, llvm_v2i64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse41_ptestc : GCCBuiltin<"__builtin_ia32_ptestc128">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2i64_ty, llvm_v2i64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse41_ptestnzc : GCCBuiltin<"__builtin_ia32_ptestnzc128">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2i64_ty, llvm_v2i64_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// SSE4.2
|
|
|
|
// Miscellaneous
|
|
// CRC Instruction
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse42_crc32_32_8 : GCCBuiltin<"__builtin_ia32_crc32qi">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_i32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse42_crc32_32_16 : GCCBuiltin<"__builtin_ia32_crc32hi">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_i32_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse42_crc32_32_32 : GCCBuiltin<"__builtin_ia32_crc32si">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_i32_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse42_crc32_64_64 : GCCBuiltin<"__builtin_ia32_crc32di">,
|
|
Intrinsic<[llvm_i64_ty], [llvm_i64_ty, llvm_i64_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
|
|
// String/text processing ops.
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse42_pcmpistrm128 : GCCBuiltin<"__builtin_ia32_pcmpistrm128">,
|
|
Intrinsic<[llvm_v16i8_ty],
|
|
[llvm_v16i8_ty, llvm_v16i8_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse42_pcmpistri128 : GCCBuiltin<"__builtin_ia32_pcmpistri128">,
|
|
Intrinsic<[llvm_i32_ty],
|
|
[llvm_v16i8_ty, llvm_v16i8_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse42_pcmpistria128 : GCCBuiltin<"__builtin_ia32_pcmpistria128">,
|
|
Intrinsic<[llvm_i32_ty],
|
|
[llvm_v16i8_ty, llvm_v16i8_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse42_pcmpistric128 : GCCBuiltin<"__builtin_ia32_pcmpistric128">,
|
|
Intrinsic<[llvm_i32_ty],
|
|
[llvm_v16i8_ty, llvm_v16i8_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse42_pcmpistrio128 : GCCBuiltin<"__builtin_ia32_pcmpistrio128">,
|
|
Intrinsic<[llvm_i32_ty],
|
|
[llvm_v16i8_ty, llvm_v16i8_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse42_pcmpistris128 : GCCBuiltin<"__builtin_ia32_pcmpistris128">,
|
|
Intrinsic<[llvm_i32_ty],
|
|
[llvm_v16i8_ty, llvm_v16i8_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse42_pcmpistriz128 : GCCBuiltin<"__builtin_ia32_pcmpistriz128">,
|
|
Intrinsic<[llvm_i32_ty],
|
|
[llvm_v16i8_ty, llvm_v16i8_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse42_pcmpestrm128 : GCCBuiltin<"__builtin_ia32_pcmpestrm128">,
|
|
Intrinsic<[llvm_v16i8_ty],
|
|
[llvm_v16i8_ty, llvm_i32_ty, llvm_v16i8_ty, llvm_i32_ty,
|
|
llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse42_pcmpestri128 : GCCBuiltin<"__builtin_ia32_pcmpestri128">,
|
|
Intrinsic<[llvm_i32_ty],
|
|
[llvm_v16i8_ty, llvm_i32_ty, llvm_v16i8_ty, llvm_i32_ty,
|
|
llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse42_pcmpestria128 : GCCBuiltin<"__builtin_ia32_pcmpestria128">,
|
|
Intrinsic<[llvm_i32_ty],
|
|
[llvm_v16i8_ty, llvm_i32_ty, llvm_v16i8_ty, llvm_i32_ty,
|
|
llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse42_pcmpestric128 : GCCBuiltin<"__builtin_ia32_pcmpestric128">,
|
|
Intrinsic<[llvm_i32_ty],
|
|
[llvm_v16i8_ty, llvm_i32_ty, llvm_v16i8_ty, llvm_i32_ty,
|
|
llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse42_pcmpestrio128 : GCCBuiltin<"__builtin_ia32_pcmpestrio128">,
|
|
Intrinsic<[llvm_i32_ty],
|
|
[llvm_v16i8_ty, llvm_i32_ty, llvm_v16i8_ty, llvm_i32_ty,
|
|
llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse42_pcmpestris128 : GCCBuiltin<"__builtin_ia32_pcmpestris128">,
|
|
Intrinsic<[llvm_i32_ty],
|
|
[llvm_v16i8_ty, llvm_i32_ty, llvm_v16i8_ty, llvm_i32_ty,
|
|
llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse42_pcmpestriz128 : GCCBuiltin<"__builtin_ia32_pcmpestriz128">,
|
|
Intrinsic<[llvm_i32_ty],
|
|
[llvm_v16i8_ty, llvm_i32_ty, llvm_v16i8_ty, llvm_i32_ty,
|
|
llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// SSE4A
|
|
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_sse4a_extrqi : GCCBuiltin<"__builtin_ia32_extrqi">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_i8_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sse4a_extrq : GCCBuiltin<"__builtin_ia32_extrq">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v16i8_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_sse4a_insertqi : GCCBuiltin<"__builtin_ia32_insertqi">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty,
|
|
llvm_i8_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_sse4a_insertq : GCCBuiltin<"__builtin_ia32_insertq">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_sse4a_movnt_ss : GCCBuiltin<"__builtin_ia32_movntss">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v4f32_ty], []>;
|
|
def int_x86_sse4a_movnt_sd : GCCBuiltin<"__builtin_ia32_movntsd">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v2f64_ty], []>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// AVX
|
|
|
|
// Arithmetic ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx_addsub_pd_256 : GCCBuiltin<"__builtin_ia32_addsubpd256">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty,
|
|
llvm_v4f64_ty], [IntrNoMem]>;
|
|
def int_x86_avx_addsub_ps_256 : GCCBuiltin<"__builtin_ia32_addsubps256">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty,
|
|
llvm_v8f32_ty], [IntrNoMem]>;
|
|
def int_x86_avx_max_pd_256 : GCCBuiltin<"__builtin_ia32_maxpd256">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty,
|
|
llvm_v4f64_ty], [IntrNoMem]>;
|
|
def int_x86_avx_max_ps_256 : GCCBuiltin<"__builtin_ia32_maxps256">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty,
|
|
llvm_v8f32_ty], [IntrNoMem]>;
|
|
def int_x86_avx_min_pd_256 : GCCBuiltin<"__builtin_ia32_minpd256">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty,
|
|
llvm_v4f64_ty], [IntrNoMem]>;
|
|
def int_x86_avx_min_ps_256 : GCCBuiltin<"__builtin_ia32_minps256">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty,
|
|
llvm_v8f32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx_sqrt_pd_256 : GCCBuiltin<"__builtin_ia32_sqrtpd256">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty], [IntrNoMem]>;
|
|
def int_x86_avx_sqrt_ps_256 : GCCBuiltin<"__builtin_ia32_sqrtps256">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx_rsqrt_ps_256 : GCCBuiltin<"__builtin_ia32_rsqrtps256">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx_rcp_ps_256 : GCCBuiltin<"__builtin_ia32_rcpps256">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx_round_pd_256 : GCCBuiltin<"__builtin_ia32_roundpd256">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx_round_ps_256 : GCCBuiltin<"__builtin_ia32_roundps256">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Horizontal ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx_hadd_pd_256 : GCCBuiltin<"__builtin_ia32_haddpd256">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty,
|
|
llvm_v4f64_ty], [IntrNoMem]>;
|
|
def int_x86_avx_hsub_ps_256 : GCCBuiltin<"__builtin_ia32_hsubps256">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty,
|
|
llvm_v8f32_ty], [IntrNoMem]>;
|
|
def int_x86_avx_hsub_pd_256 : GCCBuiltin<"__builtin_ia32_hsubpd256">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty,
|
|
llvm_v4f64_ty], [IntrNoMem]>;
|
|
def int_x86_avx_hadd_ps_256 : GCCBuiltin<"__builtin_ia32_haddps256">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty,
|
|
llvm_v8f32_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Vector permutation
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx_vpermilvar_pd : GCCBuiltin<"__builtin_ia32_vpermilvarpd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty,
|
|
llvm_v2i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx_vpermilvar_ps : GCCBuiltin<"__builtin_ia32_vpermilvarps">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_v4i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx_vpermilvar_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_vpermilvarpd256">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty, llvm_v4i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx_vpermilvar_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_vpermilvarps256">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty, llvm_v8i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx_vperm2f128_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_vperm2f128_pd256">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty,
|
|
llvm_v4f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx_vperm2f128_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_vperm2f128_ps256">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty,
|
|
llvm_v8f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx_vperm2f128_si_256 :
|
|
GCCBuiltin<"__builtin_ia32_vperm2f128_si256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty,
|
|
llvm_v8i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermi2var_d_128 :
|
|
GCCBuiltin<"__builtin_ia32_vpermi2vard128_mask">,
|
|
Intrinsic<[llvm_v4i32_ty],
|
|
[llvm_v4i32_ty, llvm_v4i32_ty, llvm_v4i32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermi2var_d_256 :
|
|
GCCBuiltin<"__builtin_ia32_vpermi2vard256_mask">,
|
|
Intrinsic<[llvm_v8i32_ty],
|
|
[llvm_v8i32_ty, llvm_v8i32_ty, llvm_v8i32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermi2var_d_512 :
|
|
GCCBuiltin<"__builtin_ia32_vpermi2vard512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty],
|
|
[llvm_v16i32_ty, llvm_v16i32_ty, llvm_v16i32_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermi2var_hi_128 :
|
|
GCCBuiltin<"__builtin_ia32_vpermi2varhi128_mask">,
|
|
Intrinsic<[llvm_v8i16_ty],
|
|
[llvm_v8i16_ty, llvm_v8i16_ty, llvm_v8i16_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermi2var_hi_256 :
|
|
GCCBuiltin<"__builtin_ia32_vpermi2varhi256_mask">,
|
|
Intrinsic<[llvm_v16i16_ty],
|
|
[llvm_v16i16_ty, llvm_v16i16_ty, llvm_v16i16_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermi2var_hi_512 :
|
|
GCCBuiltin<"__builtin_ia32_vpermi2varhi512_mask">,
|
|
Intrinsic<[llvm_v32i16_ty],
|
|
[llvm_v32i16_ty, llvm_v32i16_ty, llvm_v32i16_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermi2var_pd_128 :
|
|
GCCBuiltin<"__builtin_ia32_vpermi2varpd128_mask">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2i64_ty, llvm_v2f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermi2var_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_vpermi2varpd256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_v4i64_ty, llvm_v4f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermi2var_pd_512 :
|
|
GCCBuiltin<"__builtin_ia32_vpermi2varpd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty],
|
|
[llvm_v8f64_ty, llvm_v8i64_ty, llvm_v8f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermi2var_ps_128 :
|
|
GCCBuiltin<"__builtin_ia32_vpermi2varps128_mask">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4i32_ty, llvm_v4f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermi2var_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_vpermi2varps256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8f32_ty, llvm_v8i32_ty, llvm_v8f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermi2var_ps_512 :
|
|
GCCBuiltin<"__builtin_ia32_vpermi2varps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty],
|
|
[llvm_v16f32_ty, llvm_v16i32_ty, llvm_v16f32_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermi2var_q_128 :
|
|
GCCBuiltin<"__builtin_ia32_vpermi2varq128_mask">,
|
|
Intrinsic<[llvm_v2i64_ty],
|
|
[llvm_v2i64_ty, llvm_v2i64_ty, llvm_v2i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermi2var_q_256 :
|
|
GCCBuiltin<"__builtin_ia32_vpermi2varq256_mask">,
|
|
Intrinsic<[llvm_v4i64_ty],
|
|
[llvm_v4i64_ty, llvm_v4i64_ty, llvm_v4i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermi2var_q_512 :
|
|
GCCBuiltin<"__builtin_ia32_vpermi2varq512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty],
|
|
[llvm_v8i64_ty, llvm_v8i64_ty, llvm_v8i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermt2var_d_512:
|
|
GCCBuiltin<"__builtin_ia32_vpermt2vard512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty,
|
|
llvm_v16i32_ty, llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermt2var_q_512:
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varq512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty,
|
|
llvm_v8i64_ty, llvm_v8i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermt2var_ps_512:
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16i32_ty,
|
|
llvm_v16f32_ty, llvm_v16f32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermt2var_pd_512:
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varpd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8i64_ty,
|
|
llvm_v8f64_ty, llvm_v8f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermt2var_d_128 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2vard128_mask">,
|
|
Intrinsic<[llvm_v4i32_ty],
|
|
[llvm_v4i32_ty, llvm_v4i32_ty, llvm_v4i32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vpermt2var_d_128 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2vard128_maskz">,
|
|
Intrinsic<[llvm_v4i32_ty],
|
|
[llvm_v4i32_ty, llvm_v4i32_ty, llvm_v4i32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermt2var_d_256 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2vard256_mask">,
|
|
Intrinsic<[llvm_v8i32_ty],
|
|
[llvm_v8i32_ty, llvm_v8i32_ty, llvm_v8i32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vpermt2var_d_256 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2vard256_maskz">,
|
|
Intrinsic<[llvm_v8i32_ty],
|
|
[llvm_v8i32_ty, llvm_v8i32_ty, llvm_v8i32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vpermt2var_d_512 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2vard512_maskz">,
|
|
Intrinsic<[llvm_v16i32_ty],
|
|
[llvm_v16i32_ty, llvm_v16i32_ty, llvm_v16i32_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermt2var_hi_128 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varhi128_mask">,
|
|
Intrinsic<[llvm_v8i16_ty],
|
|
[llvm_v8i16_ty, llvm_v8i16_ty, llvm_v8i16_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vpermt2var_hi_128 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varhi128_maskz">,
|
|
Intrinsic<[llvm_v8i16_ty],
|
|
[llvm_v8i16_ty, llvm_v8i16_ty, llvm_v8i16_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermt2var_hi_256 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varhi256_mask">,
|
|
Intrinsic<[llvm_v16i16_ty],
|
|
[llvm_v16i16_ty, llvm_v16i16_ty, llvm_v16i16_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vpermt2var_hi_256 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varhi256_maskz">,
|
|
Intrinsic<[llvm_v16i16_ty],
|
|
[llvm_v16i16_ty, llvm_v16i16_ty, llvm_v16i16_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermt2var_hi_512 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varhi512_mask">,
|
|
Intrinsic<[llvm_v32i16_ty],
|
|
[llvm_v32i16_ty, llvm_v32i16_ty, llvm_v32i16_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vpermt2var_hi_512 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varhi512_maskz">,
|
|
Intrinsic<[llvm_v32i16_ty],
|
|
[llvm_v32i16_ty, llvm_v32i16_ty, llvm_v32i16_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermt2var_pd_128 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varpd128_mask">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2i64_ty, llvm_v2f64_ty, llvm_v2f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vpermt2var_pd_128 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varpd128_maskz">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2i64_ty, llvm_v2f64_ty, llvm_v2f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermt2var_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varpd256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4i64_ty, llvm_v4f64_ty, llvm_v4f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vpermt2var_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varpd256_maskz">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4i64_ty, llvm_v4f64_ty, llvm_v4f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vpermt2var_pd_512 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varpd512_maskz">,
|
|
Intrinsic<[llvm_v8f64_ty],
|
|
[llvm_v8i64_ty, llvm_v8f64_ty, llvm_v8f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermt2var_ps_128 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varps128_mask">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4i32_ty, llvm_v4f32_ty, llvm_v4f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vpermt2var_ps_128 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varps128_maskz">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4i32_ty, llvm_v4f32_ty, llvm_v4f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermt2var_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varps256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8i32_ty, llvm_v8f32_ty, llvm_v8f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vpermt2var_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varps256_maskz">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8i32_ty, llvm_v8f32_ty, llvm_v8f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vpermt2var_ps_512 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varps512_maskz">,
|
|
Intrinsic<[llvm_v16f32_ty],
|
|
[llvm_v16i32_ty, llvm_v16f32_ty, llvm_v16f32_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermt2var_q_128 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varq128_mask">,
|
|
Intrinsic<[llvm_v2i64_ty],
|
|
[llvm_v2i64_ty, llvm_v2i64_ty, llvm_v2i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vpermt2var_q_128 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varq128_maskz">,
|
|
Intrinsic<[llvm_v2i64_ty],
|
|
[llvm_v2i64_ty, llvm_v2i64_ty, llvm_v2i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vpermt2var_q_256 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varq256_mask">,
|
|
Intrinsic<[llvm_v4i64_ty],
|
|
[llvm_v4i64_ty, llvm_v4i64_ty, llvm_v4i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vpermt2var_q_256 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varq256_maskz">,
|
|
Intrinsic<[llvm_v4i64_ty],
|
|
[llvm_v4i64_ty, llvm_v4i64_ty, llvm_v4i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vpermt2var_q_512 :
|
|
GCCBuiltin<"__builtin_ia32_vpermt2varq512_maskz">,
|
|
Intrinsic<[llvm_v8i64_ty],
|
|
[llvm_v8i64_ty, llvm_v8i64_ty, llvm_v8i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_pshuf_b_128 :
|
|
GCCBuiltin<"__builtin_ia32_pshufb128_mask">,
|
|
Intrinsic<[llvm_v16i8_ty],
|
|
[llvm_v16i8_ty, llvm_v16i8_ty, llvm_v16i8_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_pshuf_b_256 :
|
|
GCCBuiltin<"__builtin_ia32_pshufb256_mask">,
|
|
Intrinsic<[llvm_v32i8_ty],
|
|
[llvm_v32i8_ty, llvm_v32i8_ty, llvm_v32i8_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_pshuf_b_512 :
|
|
GCCBuiltin<"__builtin_ia32_pshufb512_mask">,
|
|
Intrinsic<[llvm_v64i8_ty],
|
|
[llvm_v64i8_ty, llvm_v64i8_ty, llvm_v64i8_ty, llvm_i64_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
|
|
|
|
// Vector blend
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx_blendv_pd_256 : GCCBuiltin<"__builtin_ia32_blendvpd256">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty,
|
|
llvm_v4f64_ty, llvm_v4f64_ty], [IntrNoMem]>;
|
|
def int_x86_avx_blendv_ps_256 : GCCBuiltin<"__builtin_ia32_blendvps256">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty,
|
|
llvm_v8f32_ty, llvm_v8f32_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Vector dot product
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx_dp_ps_256 : GCCBuiltin<"__builtin_ia32_dpps256">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty,
|
|
llvm_v8f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Vector compare
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx_cmp_pd_256 : GCCBuiltin<"__builtin_ia32_cmppd256">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty,
|
|
llvm_v4f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx_cmp_ps_256 : GCCBuiltin<"__builtin_ia32_cmpps256">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty,
|
|
llvm_v8f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Vector convert
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx_cvtdq2_pd_256 : GCCBuiltin<"__builtin_ia32_cvtdq2pd256">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx_cvtdq2_ps_256 : GCCBuiltin<"__builtin_ia32_cvtdq2ps256">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx_cvt_pd2_ps_256 : GCCBuiltin<"__builtin_ia32_cvtpd2ps256">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f64_ty], [IntrNoMem]>;
|
|
def int_x86_avx_cvt_ps2dq_256 : GCCBuiltin<"__builtin_ia32_cvtps2dq256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8f32_ty], [IntrNoMem]>;
|
|
def int_x86_avx_cvt_ps2_pd_256 : GCCBuiltin<"__builtin_ia32_cvtps2pd256">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_avx_cvtt_pd2dq_256 : GCCBuiltin<"__builtin_ia32_cvttpd2dq256">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4f64_ty], [IntrNoMem]>;
|
|
def int_x86_avx_cvt_pd2dq_256 : GCCBuiltin<"__builtin_ia32_cvtpd2dq256">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4f64_ty], [IntrNoMem]>;
|
|
def int_x86_avx_cvtt_ps2dq_256 : GCCBuiltin<"__builtin_ia32_cvttps2dq256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8f32_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Vector bit test
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx_vtestz_pd : GCCBuiltin<"__builtin_ia32_vtestzpd">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_avx_vtestc_pd : GCCBuiltin<"__builtin_ia32_vtestcpd">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_avx_vtestnzc_pd : GCCBuiltin<"__builtin_ia32_vtestnzcpd">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2f64_ty,
|
|
llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_avx_vtestz_ps : GCCBuiltin<"__builtin_ia32_vtestzps">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_avx_vtestc_ps : GCCBuiltin<"__builtin_ia32_vtestcps">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_avx_vtestnzc_ps : GCCBuiltin<"__builtin_ia32_vtestnzcps">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f32_ty,
|
|
llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_avx_vtestz_pd_256 : GCCBuiltin<"__builtin_ia32_vtestzpd256">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f64_ty,
|
|
llvm_v4f64_ty], [IntrNoMem]>;
|
|
def int_x86_avx_vtestc_pd_256 : GCCBuiltin<"__builtin_ia32_vtestcpd256">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f64_ty,
|
|
llvm_v4f64_ty], [IntrNoMem]>;
|
|
def int_x86_avx_vtestnzc_pd_256 : GCCBuiltin<"__builtin_ia32_vtestnzcpd256">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f64_ty,
|
|
llvm_v4f64_ty], [IntrNoMem]>;
|
|
def int_x86_avx_vtestz_ps_256 : GCCBuiltin<"__builtin_ia32_vtestzps256">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v8f32_ty,
|
|
llvm_v8f32_ty], [IntrNoMem]>;
|
|
def int_x86_avx_vtestc_ps_256 : GCCBuiltin<"__builtin_ia32_vtestcps256">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v8f32_ty,
|
|
llvm_v8f32_ty], [IntrNoMem]>;
|
|
def int_x86_avx_vtestnzc_ps_256 : GCCBuiltin<"__builtin_ia32_vtestnzcps256">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v8f32_ty,
|
|
llvm_v8f32_ty], [IntrNoMem]>;
|
|
def int_x86_avx_ptestz_256 : GCCBuiltin<"__builtin_ia32_ptestz256">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4i64_ty,
|
|
llvm_v4i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx_ptestc_256 : GCCBuiltin<"__builtin_ia32_ptestc256">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4i64_ty,
|
|
llvm_v4i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx_ptestnzc_256 : GCCBuiltin<"__builtin_ia32_ptestnzc256">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4i64_ty,
|
|
llvm_v4i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_ptestm_d_512 : GCCBuiltin<"__builtin_ia32_ptestmd512">,
|
|
Intrinsic<[llvm_i16_ty], [llvm_v16i32_ty, llvm_v16i32_ty,
|
|
llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_ptestm_q_512 : GCCBuiltin<"__builtin_ia32_ptestmq512">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v8i64_ty, llvm_v8i64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Vector extract sign mask
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx_movmsk_pd_256 : GCCBuiltin<"__builtin_ia32_movmskpd256">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f64_ty], [IntrNoMem]>;
|
|
def int_x86_avx_movmsk_ps_256 : GCCBuiltin<"__builtin_ia32_movmskps256">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v8f32_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Vector zero
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx_vzeroall : GCCBuiltin<"__builtin_ia32_vzeroall">,
|
|
Intrinsic<[], [], []>;
|
|
def int_x86_avx_vzeroupper : GCCBuiltin<"__builtin_ia32_vzeroupper">,
|
|
Intrinsic<[], [], []>;
|
|
}
|
|
|
|
// Vector load with broadcast
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx_vbroadcastf128_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_vbroadcastf128_pd256">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_ptr_ty], [IntrReadArgMem]>;
|
|
def int_x86_avx_vbroadcastf128_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_vbroadcastf128_ps256">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_ptr_ty], [IntrReadArgMem]>;
|
|
}
|
|
|
|
// SIMD load ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx_ldu_dq_256 : GCCBuiltin<"__builtin_ia32_lddqu256">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_ptr_ty], [IntrReadMem]>;
|
|
}
|
|
|
|
// SIMD store ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx_storeu_pd_256 : GCCBuiltin<"__builtin_ia32_storeupd256">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v4f64_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_avx_storeu_ps_256 : GCCBuiltin<"__builtin_ia32_storeups256">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v8f32_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_avx_storeu_dq_256 : GCCBuiltin<"__builtin_ia32_storedqu256">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v32i8_ty], [IntrReadWriteArgMem]>;
|
|
}
|
|
|
|
// Conditional load ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx_maskload_pd : GCCBuiltin<"__builtin_ia32_maskloadpd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_ptr_ty, llvm_v2f64_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx_maskload_ps : GCCBuiltin<"__builtin_ia32_maskloadps">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_ptr_ty, llvm_v4f32_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx_maskload_pd_256 : GCCBuiltin<"__builtin_ia32_maskloadpd256">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_ptr_ty, llvm_v4f64_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx_maskload_ps_256 : GCCBuiltin<"__builtin_ia32_maskloadps256">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_ptr_ty, llvm_v8f32_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx512_mask_loadu_ps_512 : GCCBuiltin<"__builtin_ia32_loadups512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_ptr_ty, llvm_v16f32_ty, llvm_i16_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx512_mask_loadu_pd_512 : GCCBuiltin<"__builtin_ia32_loadupd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_ptr_ty, llvm_v8f64_ty, llvm_i8_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx512_mask_load_ps_512 : GCCBuiltin<"__builtin_ia32_loadaps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_ptr_ty, llvm_v16f32_ty, llvm_i16_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx512_mask_load_pd_512 : GCCBuiltin<"__builtin_ia32_loadapd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_ptr_ty, llvm_v8f64_ty, llvm_i8_ty],
|
|
[IntrReadArgMem]>;
|
|
}
|
|
|
|
// Conditional store ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx_maskstore_pd : GCCBuiltin<"__builtin_ia32_maskstorepd">,
|
|
Intrinsic<[], [llvm_ptr_ty,
|
|
llvm_v2f64_ty, llvm_v2f64_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_avx_maskstore_ps : GCCBuiltin<"__builtin_ia32_maskstoreps">,
|
|
Intrinsic<[], [llvm_ptr_ty,
|
|
llvm_v4f32_ty, llvm_v4f32_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_avx_maskstore_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_maskstorepd256">,
|
|
Intrinsic<[], [llvm_ptr_ty,
|
|
llvm_v4f64_ty, llvm_v4f64_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_avx_maskstore_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_maskstoreps256">,
|
|
Intrinsic<[], [llvm_ptr_ty,
|
|
llvm_v8f32_ty, llvm_v8f32_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_mask_storeu_ps_512 :
|
|
GCCBuiltin<"__builtin_ia32_storeups512_mask">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v16f32_ty, llvm_i16_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_mask_storeu_pd_512 :
|
|
GCCBuiltin<"__builtin_ia32_storeupd512_mask">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v8f64_ty, llvm_i8_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_mask_store_ps_512 :
|
|
GCCBuiltin<"__builtin_ia32_storeaps512_mask">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v16f32_ty, llvm_i16_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_mask_store_pd_512 :
|
|
GCCBuiltin<"__builtin_ia32_storeapd512_mask">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v8f64_ty, llvm_i8_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_mask_store_ss :
|
|
GCCBuiltin<"__builtin_ia32_storess_mask">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v4f32_ty, llvm_i8_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// AVX2
|
|
|
|
// Integer arithmetic ops.
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx2_padds_b : GCCBuiltin<"__builtin_ia32_paddsb256">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty,
|
|
llvm_v32i8_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_padds_w : GCCBuiltin<"__builtin_ia32_paddsw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_v16i16_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_paddus_b : GCCBuiltin<"__builtin_ia32_paddusb256">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty,
|
|
llvm_v32i8_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_paddus_w : GCCBuiltin<"__builtin_ia32_paddusw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_v16i16_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_psubs_b : GCCBuiltin<"__builtin_ia32_psubsb256">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty,
|
|
llvm_v32i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_psubs_w : GCCBuiltin<"__builtin_ia32_psubsw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_v16i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_psubus_b : GCCBuiltin<"__builtin_ia32_psubusb256">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty,
|
|
llvm_v32i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_psubus_w : GCCBuiltin<"__builtin_ia32_psubusw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_v16i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_pmulhu_w : GCCBuiltin<"__builtin_ia32_pmulhuw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_v16i16_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_pmulh_w : GCCBuiltin<"__builtin_ia32_pmulhw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_v16i16_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_pmulu_dq : GCCBuiltin<"__builtin_ia32_pmuludq256">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v8i32_ty,
|
|
llvm_v8i32_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_pmul_dq : GCCBuiltin<"__builtin_ia32_pmuldq256">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v8i32_ty,
|
|
llvm_v8i32_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_pmadd_wd : GCCBuiltin<"__builtin_ia32_pmaddwd256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v16i16_ty,
|
|
llvm_v16i16_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_pavg_b : GCCBuiltin<"__builtin_ia32_pavgb256">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty,
|
|
llvm_v32i8_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_pavg_w : GCCBuiltin<"__builtin_ia32_pavgw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_v16i16_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_psad_bw : GCCBuiltin<"__builtin_ia32_psadbw256">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v32i8_ty,
|
|
llvm_v32i8_ty], [IntrNoMem, Commutative]>;
|
|
}
|
|
|
|
// Vector min, max
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx2_pmaxu_b : GCCBuiltin<"__builtin_ia32_pmaxub256">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty,
|
|
llvm_v32i8_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_pmaxu_w : GCCBuiltin<"__builtin_ia32_pmaxuw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_v16i16_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_pmaxu_d : GCCBuiltin<"__builtin_ia32_pmaxud256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty,
|
|
llvm_v8i32_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_pmaxs_b : GCCBuiltin<"__builtin_ia32_pmaxsb256">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty,
|
|
llvm_v32i8_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_pmaxs_w : GCCBuiltin<"__builtin_ia32_pmaxsw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_v16i16_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_pmaxs_d : GCCBuiltin<"__builtin_ia32_pmaxsd256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty,
|
|
llvm_v8i32_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_pminu_b : GCCBuiltin<"__builtin_ia32_pminub256">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty,
|
|
llvm_v32i8_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_pminu_w : GCCBuiltin<"__builtin_ia32_pminuw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_v16i16_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_pminu_d : GCCBuiltin<"__builtin_ia32_pminud256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty,
|
|
llvm_v8i32_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_pmins_b : GCCBuiltin<"__builtin_ia32_pminsb256">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty,
|
|
llvm_v32i8_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_pmins_w : GCCBuiltin<"__builtin_ia32_pminsw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_v16i16_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_pmins_d : GCCBuiltin<"__builtin_ia32_pminsd256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty,
|
|
llvm_v8i32_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx512_mask_pmaxs_b_128 : GCCBuiltin<"__builtin_ia32_pmaxsb128_mask">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty, llvm_v16i8_ty,
|
|
llvm_v16i8_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxs_b_256 : GCCBuiltin<"__builtin_ia32_pmaxsb256_mask">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty, llvm_v32i8_ty,
|
|
llvm_v32i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxs_b_512 : GCCBuiltin<"__builtin_ia32_pmaxsb512_mask">,
|
|
Intrinsic<[llvm_v64i8_ty], [llvm_v64i8_ty, llvm_v64i8_ty,
|
|
llvm_v64i8_ty, llvm_i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxu_b_128 : GCCBuiltin<"__builtin_ia32_pmaxub128_mask">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty, llvm_v16i8_ty,
|
|
llvm_v16i8_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxu_b_256 : GCCBuiltin<"__builtin_ia32_pmaxub256_mask">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty, llvm_v32i8_ty,
|
|
llvm_v32i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxu_b_512 : GCCBuiltin<"__builtin_ia32_pmaxub512_mask">,
|
|
Intrinsic<[llvm_v64i8_ty], [llvm_v64i8_ty, llvm_v64i8_ty,
|
|
llvm_v64i8_ty, llvm_i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxs_w_128 : GCCBuiltin<"__builtin_ia32_pmaxsw128_mask">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_v8i16_ty,
|
|
llvm_v8i16_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxs_w_256 : GCCBuiltin<"__builtin_ia32_pmaxsw256_mask">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty, llvm_v16i16_ty,
|
|
llvm_v16i16_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxs_w_512 : GCCBuiltin<"__builtin_ia32_pmaxsw512_mask">,
|
|
Intrinsic<[llvm_v32i16_ty], [llvm_v32i16_ty, llvm_v32i16_ty,
|
|
llvm_v32i16_ty, llvm_i32_ty],[IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxu_w_128 : GCCBuiltin<"__builtin_ia32_pmaxuw128_mask">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_v8i16_ty,
|
|
llvm_v8i16_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxu_w_256 : GCCBuiltin<"__builtin_ia32_pmaxuw256_mask">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty, llvm_v16i16_ty,
|
|
llvm_v16i16_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxu_w_512 : GCCBuiltin<"__builtin_ia32_pmaxuw512_mask">,
|
|
Intrinsic<[llvm_v32i16_ty], [llvm_v32i16_ty, llvm_v32i16_ty,
|
|
llvm_v32i16_ty, llvm_i32_ty],[IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmins_b_128 : GCCBuiltin<"__builtin_ia32_pminsb128_mask">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty, llvm_v16i8_ty,
|
|
llvm_v16i8_ty,llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmins_b_256 : GCCBuiltin<"__builtin_ia32_pminsb256_mask">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty, llvm_v32i8_ty,
|
|
llvm_v32i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmins_b_512 : GCCBuiltin<"__builtin_ia32_pminsb512_mask">,
|
|
Intrinsic<[llvm_v64i8_ty], [llvm_v64i8_ty, llvm_v64i8_ty,
|
|
llvm_v64i8_ty, llvm_i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pminu_b_128 : GCCBuiltin<"__builtin_ia32_pminub128_mask">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty, llvm_v16i8_ty,
|
|
llvm_v16i8_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pminu_b_256 : GCCBuiltin<"__builtin_ia32_pminub256_mask">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty, llvm_v32i8_ty,
|
|
llvm_v32i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pminu_b_512 : GCCBuiltin<"__builtin_ia32_pminub512_mask">,
|
|
Intrinsic<[llvm_v64i8_ty], [llvm_v64i8_ty, llvm_v64i8_ty,
|
|
llvm_v64i8_ty, llvm_i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmins_w_128 : GCCBuiltin<"__builtin_ia32_pminsw128_mask">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_v8i16_ty,
|
|
llvm_v8i16_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmins_w_256 : GCCBuiltin<"__builtin_ia32_pminsw256_mask">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty, llvm_v16i16_ty,
|
|
llvm_v16i16_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmins_w_512 : GCCBuiltin<"__builtin_ia32_pminsw512_mask">,
|
|
Intrinsic<[llvm_v32i16_ty], [llvm_v32i16_ty, llvm_v32i16_ty,
|
|
llvm_v32i16_ty, llvm_i32_ty],[IntrNoMem]>;
|
|
def int_x86_avx512_mask_pminu_w_128 : GCCBuiltin<"__builtin_ia32_pminuw128_mask">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_v8i16_ty,
|
|
llvm_v8i16_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pminu_w_256 : GCCBuiltin<"__builtin_ia32_pminuw256_mask">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty, llvm_v16i16_ty,
|
|
llvm_v16i16_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pminu_w_512 : GCCBuiltin<"__builtin_ia32_pminuw512_mask">,
|
|
Intrinsic<[llvm_v32i16_ty], [llvm_v32i16_ty, llvm_v32i16_ty,
|
|
llvm_v32i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxu_d_512 : GCCBuiltin<"__builtin_ia32_pmaxud512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty,
|
|
llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxu_d_256 : GCCBuiltin<"__builtin_ia32_pmaxud256_mask">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty,
|
|
llvm_v8i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxu_d_128 : GCCBuiltin<"__builtin_ia32_pmaxud128_mask">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty,
|
|
llvm_v4i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxs_d_512 : GCCBuiltin<"__builtin_ia32_pmaxsd512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty,
|
|
llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxs_d_256 : GCCBuiltin<"__builtin_ia32_pmaxsd256_mask">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty,
|
|
llvm_v8i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxs_d_128 : GCCBuiltin<"__builtin_ia32_pmaxsd128_mask">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty,
|
|
llvm_v4i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxu_q_512 : GCCBuiltin<"__builtin_ia32_pmaxuq512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty, llvm_v8i64_ty,
|
|
llvm_v8i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxu_q_256 : GCCBuiltin<"__builtin_ia32_pmaxuq256_mask">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v4i64_ty, llvm_v4i64_ty,
|
|
llvm_v4i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxu_q_128 : GCCBuiltin<"__builtin_ia32_pmaxuq128_mask">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty,
|
|
llvm_v2i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxs_q_512 : GCCBuiltin<"__builtin_ia32_pmaxsq512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty, llvm_v8i64_ty,
|
|
llvm_v8i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxs_q_256 : GCCBuiltin<"__builtin_ia32_pmaxsq256_mask">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v4i64_ty, llvm_v4i64_ty,
|
|
llvm_v4i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmaxs_q_128 : GCCBuiltin<"__builtin_ia32_pmaxsq128_mask">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty,
|
|
llvm_v2i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pminu_d_512 : GCCBuiltin<"__builtin_ia32_pminud512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty,
|
|
llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pminu_d_256 : GCCBuiltin<"__builtin_ia32_pminud256_mask">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty,
|
|
llvm_v8i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pminu_d_128 : GCCBuiltin<"__builtin_ia32_pminud128_mask">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty,
|
|
llvm_v4i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmins_d_512 : GCCBuiltin<"__builtin_ia32_pminsd512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty,
|
|
llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmins_d_256 : GCCBuiltin<"__builtin_ia32_pminsd256_mask">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty,
|
|
llvm_v8i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmins_d_128 : GCCBuiltin<"__builtin_ia32_pminsd128_mask">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty,
|
|
llvm_v4i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pminu_q_512 : GCCBuiltin<"__builtin_ia32_pminuq512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty, llvm_v8i64_ty,
|
|
llvm_v8i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pminu_q_256 : GCCBuiltin<"__builtin_ia32_pminuq256_mask">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v4i64_ty, llvm_v4i64_ty,
|
|
llvm_v4i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pminu_q_128 : GCCBuiltin<"__builtin_ia32_pminuq128_mask">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty,
|
|
llvm_v2i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmins_q_512 : GCCBuiltin<"__builtin_ia32_pminsq512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty, llvm_v8i64_ty,
|
|
llvm_v8i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmins_q_256 : GCCBuiltin<"__builtin_ia32_pminsq256_mask">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v4i64_ty, llvm_v4i64_ty,
|
|
llvm_v4i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmins_q_128 : GCCBuiltin<"__builtin_ia32_pminsq128_mask">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty,
|
|
llvm_v2i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Integer shift ops.
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx2_psll_w : GCCBuiltin<"__builtin_ia32_psllw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_psll_d : GCCBuiltin<"__builtin_ia32_pslld256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty,
|
|
llvm_v4i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_psll_q : GCCBuiltin<"__builtin_ia32_psllq256">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v4i64_ty,
|
|
llvm_v2i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_psrl_w : GCCBuiltin<"__builtin_ia32_psrlw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_psrl_d : GCCBuiltin<"__builtin_ia32_psrld256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty,
|
|
llvm_v4i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_psrl_q : GCCBuiltin<"__builtin_ia32_psrlq256">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v4i64_ty,
|
|
llvm_v2i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_psra_w : GCCBuiltin<"__builtin_ia32_psraw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_v8i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_psra_d : GCCBuiltin<"__builtin_ia32_psrad256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty,
|
|
llvm_v4i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx2_pslli_w : GCCBuiltin<"__builtin_ia32_psllwi256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_pslli_d : GCCBuiltin<"__builtin_ia32_pslldi256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_pslli_q : GCCBuiltin<"__builtin_ia32_psllqi256">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v4i64_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_psrli_w : GCCBuiltin<"__builtin_ia32_psrlwi256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_psrli_d : GCCBuiltin<"__builtin_ia32_psrldi256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_psrli_q : GCCBuiltin<"__builtin_ia32_psrlqi256">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v4i64_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_psrai_w : GCCBuiltin<"__builtin_ia32_psrawi256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_psrai_d : GCCBuiltin<"__builtin_ia32_psradi256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_pslli_d : GCCBuiltin<"__builtin_ia32_pslldi512">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty,
|
|
llvm_i32_ty, llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pslli_q : GCCBuiltin<"__builtin_ia32_psllqi512">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty,
|
|
llvm_i32_ty, llvm_v8i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psrli_d : GCCBuiltin<"__builtin_ia32_psrldi512">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty,
|
|
llvm_i32_ty, llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psrli_q : GCCBuiltin<"__builtin_ia32_psrlqi512">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty,
|
|
llvm_i32_ty, llvm_v8i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psrai_d : GCCBuiltin<"__builtin_ia32_psradi512">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty,
|
|
llvm_i32_ty, llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psrai_q : GCCBuiltin<"__builtin_ia32_psraqi512">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty,
|
|
llvm_i32_ty, llvm_v8i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_psll_d : GCCBuiltin<"__builtin_ia32_pslld512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty,
|
|
llvm_v4i32_ty, llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psll_q : GCCBuiltin<"__builtin_ia32_psllq512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty,
|
|
llvm_v2i64_ty, llvm_v8i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psrl_d : GCCBuiltin<"__builtin_ia32_psrld512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty,
|
|
llvm_v4i32_ty, llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psrl_q : GCCBuiltin<"__builtin_ia32_psrlq512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty,
|
|
llvm_v2i64_ty, llvm_v8i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psra_d : GCCBuiltin<"__builtin_ia32_psrad512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty,
|
|
llvm_v4i32_ty, llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psra_q : GCCBuiltin<"__builtin_ia32_psraq512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty,
|
|
llvm_v2i64_ty, llvm_v8i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Pack ops.
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx2_packsswb : GCCBuiltin<"__builtin_ia32_packsswb256">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v16i16_ty,
|
|
llvm_v16i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_packssdw : GCCBuiltin<"__builtin_ia32_packssdw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v8i32_ty,
|
|
llvm_v8i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_packuswb : GCCBuiltin<"__builtin_ia32_packuswb256">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v16i16_ty,
|
|
llvm_v16i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_packusdw : GCCBuiltin<"__builtin_ia32_packusdw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v8i32_ty,
|
|
llvm_v8i32_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Absolute value ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx2_pabs_b : GCCBuiltin<"__builtin_ia32_pabsb256">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_pabs_w : GCCBuiltin<"__builtin_ia32_pabsw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_pabs_d : GCCBuiltin<"__builtin_ia32_pabsd256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_pabs_b_128 :
|
|
GCCBuiltin<"__builtin_ia32_pabsb128_mask">,
|
|
Intrinsic<[llvm_v16i8_ty],
|
|
[llvm_v16i8_ty, llvm_v16i8_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_pabs_b_256 :
|
|
GCCBuiltin<"__builtin_ia32_pabsb256_mask">,
|
|
Intrinsic<[llvm_v32i8_ty],
|
|
[llvm_v32i8_ty, llvm_v32i8_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_pabs_b_512 :
|
|
GCCBuiltin<"__builtin_ia32_pabsb512_mask">,
|
|
Intrinsic<[llvm_v64i8_ty],
|
|
[llvm_v64i8_ty, llvm_v64i8_ty, llvm_i64_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_pabs_d_128 :
|
|
GCCBuiltin<"__builtin_ia32_pabsd128_mask">,
|
|
Intrinsic<[llvm_v4i32_ty],
|
|
[llvm_v4i32_ty, llvm_v4i32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_pabs_d_256 :
|
|
GCCBuiltin<"__builtin_ia32_pabsd256_mask">,
|
|
Intrinsic<[llvm_v8i32_ty],
|
|
[llvm_v8i32_ty, llvm_v8i32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_pabs_d_512 :
|
|
GCCBuiltin<"__builtin_ia32_pabsd512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty],
|
|
[llvm_v16i32_ty, llvm_v16i32_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_pabs_q_128 :
|
|
GCCBuiltin<"__builtin_ia32_pabsq128_mask">,
|
|
Intrinsic<[llvm_v2i64_ty],
|
|
[llvm_v2i64_ty, llvm_v2i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_pabs_q_256 :
|
|
GCCBuiltin<"__builtin_ia32_pabsq256_mask">,
|
|
Intrinsic<[llvm_v4i64_ty],
|
|
[llvm_v4i64_ty, llvm_v4i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_pabs_q_512 :
|
|
GCCBuiltin<"__builtin_ia32_pabsq512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty],
|
|
[llvm_v8i64_ty, llvm_v8i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_pabs_w_128 :
|
|
GCCBuiltin<"__builtin_ia32_pabsw128_mask">,
|
|
Intrinsic<[llvm_v8i16_ty],
|
|
[llvm_v8i16_ty, llvm_v8i16_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_pabs_w_256 :
|
|
GCCBuiltin<"__builtin_ia32_pabsw256_mask">,
|
|
Intrinsic<[llvm_v16i16_ty],
|
|
[llvm_v16i16_ty, llvm_v16i16_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_pabs_w_512 :
|
|
GCCBuiltin<"__builtin_ia32_pabsw512_mask">,
|
|
Intrinsic<[llvm_v32i16_ty],
|
|
[llvm_v32i16_ty, llvm_v32i16_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
|
|
// Horizontal arithmetic ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx2_phadd_w : GCCBuiltin<"__builtin_ia32_phaddw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_v16i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_phadd_d : GCCBuiltin<"__builtin_ia32_phaddd256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty,
|
|
llvm_v8i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_phadd_sw : GCCBuiltin<"__builtin_ia32_phaddsw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_v16i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_phsub_w : GCCBuiltin<"__builtin_ia32_phsubw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_v16i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_phsub_d : GCCBuiltin<"__builtin_ia32_phsubd256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty,
|
|
llvm_v8i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_phsub_sw : GCCBuiltin<"__builtin_ia32_phsubsw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_v16i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_pmadd_ub_sw : GCCBuiltin<"__builtin_ia32_pmaddubsw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v32i8_ty,
|
|
llvm_v32i8_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Sign ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx2_psign_b : GCCBuiltin<"__builtin_ia32_psignb256">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty,
|
|
llvm_v32i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_psign_w : GCCBuiltin<"__builtin_ia32_psignw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_v16i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_psign_d : GCCBuiltin<"__builtin_ia32_psignd256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty,
|
|
llvm_v8i32_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Packed multiply high with round and scale
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx2_pmul_hr_sw : GCCBuiltin<"__builtin_ia32_pmulhrsw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty,
|
|
llvm_v16i16_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx512_mask_pmul_hr_sw_128 : GCCBuiltin<"__builtin_ia32_pmulhrsw128_mask">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_v8i16_ty,
|
|
llvm_v8i16_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmul_hr_sw_256 : GCCBuiltin<"__builtin_ia32_pmulhrsw256_mask">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty, llvm_v16i16_ty,
|
|
llvm_v16i16_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmul_hr_sw_512 : GCCBuiltin<"__builtin_ia32_pmulhrsw512_mask">,
|
|
Intrinsic<[llvm_v32i16_ty], [llvm_v32i16_ty, llvm_v32i16_ty,
|
|
llvm_v32i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Vector sign and zero extend
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx2_pmovsxbd : GCCBuiltin<"__builtin_ia32_pmovsxbd256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v16i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx2_pmovsxbq : GCCBuiltin<"__builtin_ia32_pmovsxbq256">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v16i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx2_pmovsxbw : GCCBuiltin<"__builtin_ia32_pmovsxbw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx2_pmovsxdq : GCCBuiltin<"__builtin_ia32_pmovsxdq256">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v4i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx2_pmovsxwd : GCCBuiltin<"__builtin_ia32_pmovsxwd256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx2_pmovsxwq : GCCBuiltin<"__builtin_ia32_pmovsxwq256">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v8i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx2_pmovzxbd : GCCBuiltin<"__builtin_ia32_pmovzxbd256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v16i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx2_pmovzxbq : GCCBuiltin<"__builtin_ia32_pmovzxbq256">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v16i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx2_pmovzxbw : GCCBuiltin<"__builtin_ia32_pmovzxbw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx2_pmovzxdq : GCCBuiltin<"__builtin_ia32_pmovzxdq256">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v4i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx2_pmovzxwd : GCCBuiltin<"__builtin_ia32_pmovzxwd256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx2_pmovzxwq : GCCBuiltin<"__builtin_ia32_pmovzxwq256">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v8i16_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
|
|
// Vector blend
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx2_pblendvb : GCCBuiltin<"__builtin_ia32_pblendvb256">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty, llvm_v32i8_ty,
|
|
llvm_v32i8_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Vector load with broadcast
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx2_vbroadcast_ss_ps :
|
|
GCCBuiltin<"__builtin_ia32_vbroadcastss_ps">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_vbroadcast_sd_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_vbroadcastsd_pd256">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_vbroadcast_ss_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_vbroadcastss_ps256">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_pbroadcastb_128 :
|
|
GCCBuiltin<"__builtin_ia32_pbroadcastb128">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_pbroadcastb_256 :
|
|
GCCBuiltin<"__builtin_ia32_pbroadcastb256">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v16i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_pbroadcastw_128 :
|
|
GCCBuiltin<"__builtin_ia32_pbroadcastw128">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_pbroadcastw_256 :
|
|
GCCBuiltin<"__builtin_ia32_pbroadcastw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v8i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_pbroadcastd_128 :
|
|
GCCBuiltin<"__builtin_ia32_pbroadcastd128">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_pbroadcastd_256 :
|
|
GCCBuiltin<"__builtin_ia32_pbroadcastd256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v4i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_pbroadcastq_128 :
|
|
GCCBuiltin<"__builtin_ia32_pbroadcastq128">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_pbroadcastq_256 :
|
|
GCCBuiltin<"__builtin_ia32_pbroadcastq256">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v2i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pbroadcast_d_gpr_512 :
|
|
GCCBuiltin<"__builtin_ia32_pbroadcastd512_gpr_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_i32_ty, llvm_v16i32_ty,
|
|
llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pbroadcast_q_gpr_512 :
|
|
GCCBuiltin<"__builtin_ia32_pbroadcastq512_gpr_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_i64_ty, llvm_v8i64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pbroadcast_q_mem_512 :
|
|
GCCBuiltin<"__builtin_ia32_pbroadcastq512_mem_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_i64_ty, llvm_v8i64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Vector permutation
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx2_permd : GCCBuiltin<"__builtin_ia32_permvarsi256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx2_permps : GCCBuiltin<"__builtin_ia32_permvarsf256">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty, llvm_v8f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx2_vperm2i128 : GCCBuiltin<"__builtin_ia32_permti256">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v4i64_ty,
|
|
llvm_v4i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Vector extract and insert
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx512_mask_vextractf32x4_512 :
|
|
GCCBuiltin<"__builtin_ia32_extractf32x4_mask">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v16f32_ty, llvm_i8_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_vextracti32x4_512 :
|
|
GCCBuiltin<"__builtin_ia32_extracti32x4_mask">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v16i32_ty, llvm_i8_ty,
|
|
llvm_v4i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_vextractf64x4_512 :
|
|
GCCBuiltin<"__builtin_ia32_extractf64x4_mask">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v8f64_ty, llvm_i8_ty,
|
|
llvm_v4f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_vextracti64x4_512 :
|
|
GCCBuiltin<"__builtin_ia32_extracti64x4_mask">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v8i64_ty, llvm_i8_ty,
|
|
llvm_v4i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Conditional load ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx2_maskload_d : GCCBuiltin<"__builtin_ia32_maskloadd">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_ptr_ty, llvm_v4i32_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx2_maskload_q : GCCBuiltin<"__builtin_ia32_maskloadq">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_ptr_ty, llvm_v2i64_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx2_maskload_d_256 : GCCBuiltin<"__builtin_ia32_maskloadd256">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_ptr_ty, llvm_v8i32_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx2_maskload_q_256 : GCCBuiltin<"__builtin_ia32_maskloadq256">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_ptr_ty, llvm_v4i64_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx512_mask_loadu_d_512 : GCCBuiltin<"__builtin_ia32_loaddqusi512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_ptr_ty, llvm_v16i32_ty, llvm_i16_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx512_mask_loadu_q_512 : GCCBuiltin<"__builtin_ia32_loaddqudi512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_ptr_ty, llvm_v8i64_ty, llvm_i8_ty],
|
|
[IntrReadArgMem]>;
|
|
}
|
|
|
|
// Conditional store ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx2_maskstore_d : GCCBuiltin<"__builtin_ia32_maskstored">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v4i32_ty, llvm_v4i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
def int_x86_avx2_maskstore_q : GCCBuiltin<"__builtin_ia32_maskstoreq">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v2i64_ty, llvm_v2i64_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
def int_x86_avx2_maskstore_d_256 :
|
|
GCCBuiltin<"__builtin_ia32_maskstored256">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v8i32_ty, llvm_v8i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
def int_x86_avx2_maskstore_q_256 :
|
|
GCCBuiltin<"__builtin_ia32_maskstoreq256">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v4i64_ty, llvm_v4i64_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_mask_storeu_d_512 :
|
|
GCCBuiltin<"__builtin_ia32_storedqusi512_mask">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v16i32_ty, llvm_i16_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_mask_storeu_q_512 :
|
|
GCCBuiltin<"__builtin_ia32_storedqudi512_mask">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v8i64_ty, llvm_i8_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
}
|
|
|
|
// Variable bit shift ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx2_psllv_d : GCCBuiltin<"__builtin_ia32_psllv4si">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx2_psllv_d_256 : GCCBuiltin<"__builtin_ia32_psllv8si">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx2_psllv_q : GCCBuiltin<"__builtin_ia32_psllv2di">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx2_psllv_q_256 : GCCBuiltin<"__builtin_ia32_psllv4di">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v4i64_ty, llvm_v4i64_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx2_psrlv_d : GCCBuiltin<"__builtin_ia32_psrlv4si">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx2_psrlv_d_256 : GCCBuiltin<"__builtin_ia32_psrlv8si">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx2_psrlv_q : GCCBuiltin<"__builtin_ia32_psrlv2di">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx2_psrlv_q_256 : GCCBuiltin<"__builtin_ia32_psrlv4di">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v4i64_ty, llvm_v4i64_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx2_psrav_d : GCCBuiltin<"__builtin_ia32_psrav4si">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx2_psrav_d_256 : GCCBuiltin<"__builtin_ia32_psrav8si">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_psllv_d : GCCBuiltin<"__builtin_ia32_psllv16si_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty,
|
|
llvm_v16i32_ty, llvm_v16i32_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_psllv_q : GCCBuiltin<"__builtin_ia32_psllv8di_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty,
|
|
llvm_v8i64_ty, llvm_v8i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_psrav_d : GCCBuiltin<"__builtin_ia32_psrav16si_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty,
|
|
llvm_v16i32_ty, llvm_v16i32_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_psrav_q : GCCBuiltin<"__builtin_ia32_psrav8di_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty,
|
|
llvm_v8i64_ty, llvm_v8i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_psrlv_d : GCCBuiltin<"__builtin_ia32_psrlv16si_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty,
|
|
llvm_v16i32_ty, llvm_v16i32_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_psrlv_q : GCCBuiltin<"__builtin_ia32_psrlv8di_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty,
|
|
llvm_v8i64_ty, llvm_v8i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
|
|
// Gather ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx2_gather_d_pd : GCCBuiltin<"__builtin_ia32_gatherd_pd">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_ptr_ty, llvm_v4i32_ty, llvm_v2f64_ty, llvm_i8_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx2_gather_d_pd_256 : GCCBuiltin<"__builtin_ia32_gatherd_pd256">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_ptr_ty, llvm_v4i32_ty, llvm_v4f64_ty, llvm_i8_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx2_gather_q_pd : GCCBuiltin<"__builtin_ia32_gatherq_pd">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_ptr_ty, llvm_v2i64_ty, llvm_v2f64_ty, llvm_i8_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx2_gather_q_pd_256 : GCCBuiltin<"__builtin_ia32_gatherq_pd256">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_ptr_ty, llvm_v4i64_ty, llvm_v4f64_ty, llvm_i8_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx2_gather_d_ps : GCCBuiltin<"__builtin_ia32_gatherd_ps">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_ptr_ty, llvm_v4i32_ty, llvm_v4f32_ty, llvm_i8_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx2_gather_d_ps_256 : GCCBuiltin<"__builtin_ia32_gatherd_ps256">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8f32_ty, llvm_ptr_ty, llvm_v8i32_ty, llvm_v8f32_ty, llvm_i8_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx2_gather_q_ps : GCCBuiltin<"__builtin_ia32_gatherq_ps">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_ptr_ty, llvm_v2i64_ty, llvm_v4f32_ty, llvm_i8_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx2_gather_q_ps_256 : GCCBuiltin<"__builtin_ia32_gatherq_ps256">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_ptr_ty, llvm_v4i64_ty, llvm_v4f32_ty, llvm_i8_ty],
|
|
[IntrReadArgMem]>;
|
|
|
|
def int_x86_avx2_gather_d_q : GCCBuiltin<"__builtin_ia32_gatherd_q">,
|
|
Intrinsic<[llvm_v2i64_ty],
|
|
[llvm_v2i64_ty, llvm_ptr_ty, llvm_v4i32_ty, llvm_v2i64_ty, llvm_i8_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx2_gather_d_q_256 : GCCBuiltin<"__builtin_ia32_gatherd_q256">,
|
|
Intrinsic<[llvm_v4i64_ty],
|
|
[llvm_v4i64_ty, llvm_ptr_ty, llvm_v4i32_ty, llvm_v4i64_ty, llvm_i8_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx2_gather_q_q : GCCBuiltin<"__builtin_ia32_gatherq_q">,
|
|
Intrinsic<[llvm_v2i64_ty],
|
|
[llvm_v2i64_ty, llvm_ptr_ty, llvm_v2i64_ty, llvm_v2i64_ty, llvm_i8_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx2_gather_q_q_256 : GCCBuiltin<"__builtin_ia32_gatherq_q256">,
|
|
Intrinsic<[llvm_v4i64_ty],
|
|
[llvm_v4i64_ty, llvm_ptr_ty, llvm_v4i64_ty, llvm_v4i64_ty, llvm_i8_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx2_gather_d_d : GCCBuiltin<"__builtin_ia32_gatherd_d">,
|
|
Intrinsic<[llvm_v4i32_ty],
|
|
[llvm_v4i32_ty, llvm_ptr_ty, llvm_v4i32_ty, llvm_v4i32_ty, llvm_i8_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx2_gather_d_d_256 : GCCBuiltin<"__builtin_ia32_gatherd_d256">,
|
|
Intrinsic<[llvm_v8i32_ty],
|
|
[llvm_v8i32_ty, llvm_ptr_ty, llvm_v8i32_ty, llvm_v8i32_ty, llvm_i8_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx2_gather_q_d : GCCBuiltin<"__builtin_ia32_gatherq_d">,
|
|
Intrinsic<[llvm_v4i32_ty],
|
|
[llvm_v4i32_ty, llvm_ptr_ty, llvm_v2i64_ty, llvm_v4i32_ty, llvm_i8_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx2_gather_q_d_256 : GCCBuiltin<"__builtin_ia32_gatherq_d256">,
|
|
Intrinsic<[llvm_v4i32_ty],
|
|
[llvm_v4i32_ty, llvm_ptr_ty, llvm_v4i64_ty, llvm_v4i32_ty, llvm_i8_ty],
|
|
[IntrReadArgMem]>;
|
|
}
|
|
|
|
// Misc.
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx2_pmovmskb : GCCBuiltin<"__builtin_ia32_pmovmskb256">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v32i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_pshuf_b : GCCBuiltin<"__builtin_ia32_pshufb256">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty,
|
|
llvm_v32i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx2_mpsadbw : GCCBuiltin<"__builtin_ia32_mpsadbw256">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v32i8_ty, llvm_v32i8_ty,
|
|
llvm_i8_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_avx2_movntdqa : GCCBuiltin<"__builtin_ia32_movntdqa256">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_ptr_ty], [IntrReadMem]>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// FMA3 and FMA4
|
|
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_fma_vfmadd_ss : GCCBuiltin<"__builtin_ia32_vfmaddss">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfmadd_sd : GCCBuiltin<"__builtin_ia32_vfmaddsd">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfmadd_ps : GCCBuiltin<"__builtin_ia32_vfmaddps">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfmadd_pd : GCCBuiltin<"__builtin_ia32_vfmaddpd">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfmadd_ps_256 : GCCBuiltin<"__builtin_ia32_vfmaddps256">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8f32_ty, llvm_v8f32_ty, llvm_v8f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfmadd_pd_256 : GCCBuiltin<"__builtin_ia32_vfmaddpd256">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_v4f64_ty, llvm_v4f64_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_fma_vfmsub_ss : GCCBuiltin<"__builtin_ia32_vfmsubss">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfmsub_sd : GCCBuiltin<"__builtin_ia32_vfmsubsd">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfmsub_ps : GCCBuiltin<"__builtin_ia32_vfmsubps">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfmsub_pd : GCCBuiltin<"__builtin_ia32_vfmsubpd">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfmsub_ps_256 : GCCBuiltin<"__builtin_ia32_vfmsubps256">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8f32_ty, llvm_v8f32_ty, llvm_v8f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfmsub_pd_256 : GCCBuiltin<"__builtin_ia32_vfmsubpd256">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_v4f64_ty, llvm_v4f64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfnmadd_ss : GCCBuiltin<"__builtin_ia32_vfnmaddss">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfnmadd_sd : GCCBuiltin<"__builtin_ia32_vfnmaddsd">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfnmadd_ps : GCCBuiltin<"__builtin_ia32_vfnmaddps">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfnmadd_pd : GCCBuiltin<"__builtin_ia32_vfnmaddpd">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfnmadd_ps_256 : GCCBuiltin<"__builtin_ia32_vfnmaddps256">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8f32_ty, llvm_v8f32_ty, llvm_v8f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfnmadd_pd_256 : GCCBuiltin<"__builtin_ia32_vfnmaddpd256">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_v4f64_ty, llvm_v4f64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfnmsub_ss : GCCBuiltin<"__builtin_ia32_vfnmsubss">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfnmsub_sd : GCCBuiltin<"__builtin_ia32_vfnmsubsd">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfnmsub_ps : GCCBuiltin<"__builtin_ia32_vfnmsubps">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfnmsub_pd : GCCBuiltin<"__builtin_ia32_vfnmsubpd">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfnmsub_ps_256 : GCCBuiltin<"__builtin_ia32_vfnmsubps256">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8f32_ty, llvm_v8f32_ty, llvm_v8f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfnmsub_pd_256 : GCCBuiltin<"__builtin_ia32_vfnmsubpd256">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_v4f64_ty, llvm_v4f64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfmaddsub_ps : GCCBuiltin<"__builtin_ia32_vfmaddsubps">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfmaddsub_pd : GCCBuiltin<"__builtin_ia32_vfmaddsubpd">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfmaddsub_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddsubps256">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8f32_ty, llvm_v8f32_ty, llvm_v8f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfmaddsub_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddsubpd256">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_v4f64_ty, llvm_v4f64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfmsubadd_ps : GCCBuiltin<"__builtin_ia32_vfmsubaddps">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfmsubadd_pd : GCCBuiltin<"__builtin_ia32_vfmsubaddpd">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfmsubadd_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfmsubaddps256">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8f32_ty, llvm_v8f32_ty, llvm_v8f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_fma_vfmsubadd_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfmsubaddpd256">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_v4f64_ty, llvm_v4f64_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfmadd_pd_128 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddpd128_mask">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmadd_pd_128 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddpd128_mask3">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vfmadd_pd_128 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddpd128_maskz">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfmadd_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddpd256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_v4f64_ty, llvm_v4f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmadd_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddpd256_mask3">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_v4f64_ty, llvm_v4f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vfmadd_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddpd256_maskz">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_v4f64_ty, llvm_v4f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfmadd_pd_512 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddpd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty],
|
|
[llvm_v8f64_ty, llvm_v8f64_ty, llvm_v8f64_ty, llvm_i8_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmadd_pd_512 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddpd512_mask3">,
|
|
Intrinsic<[llvm_v8f64_ty],
|
|
[llvm_v8f64_ty, llvm_v8f64_ty, llvm_v8f64_ty, llvm_i8_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vfmadd_pd_512 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddpd512_maskz">,
|
|
Intrinsic<[llvm_v8f64_ty],
|
|
[llvm_v8f64_ty, llvm_v8f64_ty, llvm_v8f64_ty, llvm_i8_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfmadd_ps_128 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddps128_mask">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmadd_ps_128 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddps128_mask3">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vfmadd_ps_128 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddps128_maskz">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfmadd_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddps256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8f32_ty, llvm_v8f32_ty, llvm_v8f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmadd_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddps256_mask3">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8f32_ty, llvm_v8f32_ty, llvm_v8f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vfmadd_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddps256_maskz">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8f32_ty, llvm_v8f32_ty, llvm_v8f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfmadd_ps_512 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty],
|
|
[llvm_v16f32_ty, llvm_v16f32_ty, llvm_v16f32_ty, llvm_i16_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmadd_ps_512 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddps512_mask3">,
|
|
Intrinsic<[llvm_v16f32_ty],
|
|
[llvm_v16f32_ty, llvm_v16f32_ty, llvm_v16f32_ty, llvm_i16_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vfmadd_ps_512 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddps512_maskz">,
|
|
Intrinsic<[llvm_v16f32_ty],
|
|
[llvm_v16f32_ty, llvm_v16f32_ty, llvm_v16f32_ty, llvm_i16_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfmaddsub_pd_128 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddsubpd128_mask">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmaddsub_pd_128 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddsubpd128_mask3">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vfmaddsub_pd_128 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddsubpd128_maskz">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfmaddsub_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddsubpd256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_v4f64_ty, llvm_v4f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmaddsub_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddsubpd256_mask3">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_v4f64_ty, llvm_v4f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vfmaddsub_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddsubpd256_maskz">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_v4f64_ty, llvm_v4f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfmaddsub_pd_512 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddsubpd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty],
|
|
[llvm_v8f64_ty, llvm_v8f64_ty, llvm_v8f64_ty, llvm_i8_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmaddsub_pd_512 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddsubpd512_mask3">,
|
|
Intrinsic<[llvm_v8f64_ty],
|
|
[llvm_v8f64_ty, llvm_v8f64_ty, llvm_v8f64_ty, llvm_i8_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vfmaddsub_pd_512 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddsubpd512_maskz">,
|
|
Intrinsic<[llvm_v8f64_ty],
|
|
[llvm_v8f64_ty, llvm_v8f64_ty, llvm_v8f64_ty, llvm_i8_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfmaddsub_ps_128 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddsubps128_mask">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmaddsub_ps_128 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddsubps128_mask3">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vfmaddsub_ps_128 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddsubps128_maskz">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfmaddsub_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddsubps256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8f32_ty, llvm_v8f32_ty, llvm_v8f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmaddsub_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddsubps256_mask3">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8f32_ty, llvm_v8f32_ty, llvm_v8f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vfmaddsub_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddsubps256_maskz">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8f32_ty, llvm_v8f32_ty, llvm_v8f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfmaddsub_ps_512 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddsubps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty],
|
|
[llvm_v16f32_ty, llvm_v16f32_ty, llvm_v16f32_ty, llvm_i16_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmaddsub_ps_512 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddsubps512_mask3">,
|
|
Intrinsic<[llvm_v16f32_ty],
|
|
[llvm_v16f32_ty, llvm_v16f32_ty, llvm_v16f32_ty, llvm_i16_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_maskz_vfmaddsub_ps_512 :
|
|
GCCBuiltin<"__builtin_ia32_vfmaddsubps512_maskz">,
|
|
Intrinsic<[llvm_v16f32_ty],
|
|
[llvm_v16f32_ty, llvm_v16f32_ty, llvm_v16f32_ty, llvm_i16_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmsub_pd_128 :
|
|
GCCBuiltin<"__builtin_ia32_vfmsubpd128_mask3">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmsub_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfmsubpd256_mask3">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_v4f64_ty, llvm_v4f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmsub_pd_512 :
|
|
GCCBuiltin<"__builtin_ia32_vfmsubpd512_mask3">,
|
|
Intrinsic<[llvm_v8f64_ty],
|
|
[llvm_v8f64_ty, llvm_v8f64_ty, llvm_v8f64_ty, llvm_i8_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmsub_ps_128 :
|
|
GCCBuiltin<"__builtin_ia32_vfmsubps128_mask3">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmsub_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfmsubps256_mask3">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8f32_ty, llvm_v8f32_ty, llvm_v8f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmsub_ps_512 :
|
|
GCCBuiltin<"__builtin_ia32_vfmsubps512_mask3">,
|
|
Intrinsic<[llvm_v16f32_ty],
|
|
[llvm_v16f32_ty, llvm_v16f32_ty, llvm_v16f32_ty, llvm_i16_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmsubadd_pd_128 :
|
|
GCCBuiltin<"__builtin_ia32_vfmsubaddpd128_mask3">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmsubadd_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfmsubaddpd256_mask3">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_v4f64_ty, llvm_v4f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmsubadd_pd_512 :
|
|
GCCBuiltin<"__builtin_ia32_vfmsubaddpd512_mask3">,
|
|
Intrinsic<[llvm_v8f64_ty],
|
|
[llvm_v8f64_ty, llvm_v8f64_ty, llvm_v8f64_ty, llvm_i8_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmsubadd_ps_128 :
|
|
GCCBuiltin<"__builtin_ia32_vfmsubaddps128_mask3">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmsubadd_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfmsubaddps256_mask3">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8f32_ty, llvm_v8f32_ty, llvm_v8f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfmsubadd_ps_512 :
|
|
GCCBuiltin<"__builtin_ia32_vfmsubaddps512_mask3">,
|
|
Intrinsic<[llvm_v16f32_ty],
|
|
[llvm_v16f32_ty, llvm_v16f32_ty, llvm_v16f32_ty, llvm_i16_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfnmadd_pd_128 :
|
|
GCCBuiltin<"__builtin_ia32_vfnmaddpd128_mask">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfnmadd_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfnmaddpd256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_v4f64_ty, llvm_v4f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfnmadd_pd_512 :
|
|
GCCBuiltin<"__builtin_ia32_vfnmaddpd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty],
|
|
[llvm_v8f64_ty, llvm_v8f64_ty, llvm_v8f64_ty, llvm_i8_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfnmadd_ps_128 :
|
|
GCCBuiltin<"__builtin_ia32_vfnmaddps128_mask">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfnmadd_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfnmaddps256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8f32_ty, llvm_v8f32_ty, llvm_v8f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfnmadd_ps_512 :
|
|
GCCBuiltin<"__builtin_ia32_vfnmaddps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty],
|
|
[llvm_v16f32_ty, llvm_v16f32_ty, llvm_v16f32_ty, llvm_i16_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfnmsub_pd_128 :
|
|
GCCBuiltin<"__builtin_ia32_vfnmsubpd128_mask">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfnmsub_pd_128 :
|
|
GCCBuiltin<"__builtin_ia32_vfnmsubpd128_mask3">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfnmsub_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfnmsubpd256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_v4f64_ty, llvm_v4f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfnmsub_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfnmsubpd256_mask3">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_v4f64_ty, llvm_v4f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfnmsub_pd_512 :
|
|
GCCBuiltin<"__builtin_ia32_vfnmsubpd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty],
|
|
[llvm_v8f64_ty, llvm_v8f64_ty, llvm_v8f64_ty, llvm_i8_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfnmsub_pd_512 :
|
|
GCCBuiltin<"__builtin_ia32_vfnmsubpd512_mask3">,
|
|
Intrinsic<[llvm_v8f64_ty],
|
|
[llvm_v8f64_ty, llvm_v8f64_ty, llvm_v8f64_ty, llvm_i8_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfnmsub_ps_128 :
|
|
GCCBuiltin<"__builtin_ia32_vfnmsubps128_mask">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfnmsub_ps_128 :
|
|
GCCBuiltin<"__builtin_ia32_vfnmsubps128_mask3">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfnmsub_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfnmsubps256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8f32_ty, llvm_v8f32_ty, llvm_v8f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfnmsub_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_vfnmsubps256_mask3">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8f32_ty, llvm_v8f32_ty, llvm_v8f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_vfnmsub_ps_512 :
|
|
GCCBuiltin<"__builtin_ia32_vfnmsubps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty],
|
|
[llvm_v16f32_ty, llvm_v16f32_ty, llvm_v16f32_ty, llvm_i16_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask3_vfnmsub_ps_512 :
|
|
GCCBuiltin<"__builtin_ia32_vfnmsubps512_mask3">,
|
|
Intrinsic<[llvm_v16f32_ty],
|
|
[llvm_v16f32_ty, llvm_v16f32_ty, llvm_v16f32_ty, llvm_i16_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// XOP
|
|
|
|
def int_x86_xop_vpermil2pd : GCCBuiltin<"__builtin_ia32_vpermil2pd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_v2f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_xop_vpermil2pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_vpermil2pd256">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty, llvm_v4f64_ty,
|
|
llvm_v4f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_xop_vpermil2ps : GCCBuiltin<"__builtin_ia32_vpermil2ps">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vpermil2ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_vpermil2ps256">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty, llvm_v8f32_ty,
|
|
llvm_v8f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_xop_vfrcz_pd : GCCBuiltin<"__builtin_ia32_vfrczpd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vfrcz_ps : GCCBuiltin<"__builtin_ia32_vfrczps">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vfrcz_sd : GCCBuiltin<"__builtin_ia32_vfrczsd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vfrcz_ss : GCCBuiltin<"__builtin_ia32_vfrczss">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vfrcz_pd_256 : GCCBuiltin<"__builtin_ia32_vfrczpd256">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vfrcz_ps_256 : GCCBuiltin<"__builtin_ia32_vfrczps256">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_xop_vpcmov :
|
|
GCCBuiltin<"__builtin_ia32_vpcmov">,
|
|
Intrinsic<[llvm_v2i64_ty],
|
|
[llvm_v2i64_ty, llvm_v2i64_ty, llvm_v2i64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vpcmov_256 :
|
|
GCCBuiltin<"__builtin_ia32_vpcmov_256">,
|
|
Intrinsic<[llvm_v4i64_ty],
|
|
[llvm_v4i64_ty, llvm_v4i64_ty, llvm_v4i64_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_xop_vpcomb : GCCBuiltin<"__builtin_ia32_vpcomb">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty, llvm_v16i8_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vpcomw : GCCBuiltin<"__builtin_ia32_vpcomw">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_v8i16_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vpcomd : GCCBuiltin<"__builtin_ia32_vpcomd">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vpcomq : GCCBuiltin<"__builtin_ia32_vpcomq">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vpcomub : GCCBuiltin<"__builtin_ia32_vpcomub">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty, llvm_v16i8_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vpcomuw : GCCBuiltin<"__builtin_ia32_vpcomuw">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_v8i16_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vpcomud : GCCBuiltin<"__builtin_ia32_vpcomud">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vpcomuq : GCCBuiltin<"__builtin_ia32_vpcomuq">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_xop_vphaddbd :
|
|
GCCBuiltin<"__builtin_ia32_vphaddbd">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v16i8_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vphaddbq :
|
|
GCCBuiltin<"__builtin_ia32_vphaddbq">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v16i8_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vphaddbw :
|
|
GCCBuiltin<"__builtin_ia32_vphaddbw">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v16i8_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vphadddq :
|
|
GCCBuiltin<"__builtin_ia32_vphadddq">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v4i32_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vphaddubd :
|
|
GCCBuiltin<"__builtin_ia32_vphaddubd">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v16i8_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vphaddubq :
|
|
GCCBuiltin<"__builtin_ia32_vphaddubq">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v16i8_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vphaddubw :
|
|
GCCBuiltin<"__builtin_ia32_vphaddubw">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v16i8_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vphaddudq :
|
|
GCCBuiltin<"__builtin_ia32_vphaddudq">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v4i32_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vphadduwd :
|
|
GCCBuiltin<"__builtin_ia32_vphadduwd">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v8i16_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vphadduwq :
|
|
GCCBuiltin<"__builtin_ia32_vphadduwq">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v8i16_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vphaddwd :
|
|
GCCBuiltin<"__builtin_ia32_vphaddwd">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v8i16_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vphaddwq :
|
|
GCCBuiltin<"__builtin_ia32_vphaddwq">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v8i16_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vphsubbw :
|
|
GCCBuiltin<"__builtin_ia32_vphsubbw">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v16i8_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vphsubdq :
|
|
GCCBuiltin<"__builtin_ia32_vphsubdq">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v4i32_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vphsubwd :
|
|
GCCBuiltin<"__builtin_ia32_vphsubwd">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v8i16_ty], [IntrNoMem]>;
|
|
def int_x86_xop_vpmacsdd :
|
|
GCCBuiltin<"__builtin_ia32_vpmacsdd">,
|
|
Intrinsic<[llvm_v4i32_ty],
|
|
[llvm_v4i32_ty, llvm_v4i32_ty, llvm_v4i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vpmacsdqh :
|
|
GCCBuiltin<"__builtin_ia32_vpmacsdqh">,
|
|
Intrinsic<[llvm_v2i64_ty],
|
|
[llvm_v4i32_ty, llvm_v4i32_ty, llvm_v2i64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vpmacsdql :
|
|
GCCBuiltin<"__builtin_ia32_vpmacsdql">,
|
|
Intrinsic<[llvm_v2i64_ty],
|
|
[llvm_v4i32_ty, llvm_v4i32_ty, llvm_v2i64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vpmacssdd :
|
|
GCCBuiltin<"__builtin_ia32_vpmacssdd">,
|
|
Intrinsic<[llvm_v4i32_ty],
|
|
[llvm_v4i32_ty, llvm_v4i32_ty, llvm_v4i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vpmacssdqh :
|
|
GCCBuiltin<"__builtin_ia32_vpmacssdqh">,
|
|
Intrinsic<[llvm_v2i64_ty],
|
|
[llvm_v4i32_ty, llvm_v4i32_ty, llvm_v2i64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vpmacssdql :
|
|
GCCBuiltin<"__builtin_ia32_vpmacssdql">,
|
|
Intrinsic<[llvm_v2i64_ty],
|
|
[llvm_v4i32_ty, llvm_v4i32_ty, llvm_v2i64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vpmacsswd :
|
|
GCCBuiltin<"__builtin_ia32_vpmacsswd">,
|
|
Intrinsic<[llvm_v4i32_ty],
|
|
[llvm_v8i16_ty, llvm_v8i16_ty, llvm_v4i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vpmacssww :
|
|
GCCBuiltin<"__builtin_ia32_vpmacssww">,
|
|
Intrinsic<[llvm_v8i16_ty],
|
|
[llvm_v8i16_ty, llvm_v8i16_ty, llvm_v8i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vpmacswd :
|
|
GCCBuiltin<"__builtin_ia32_vpmacswd">,
|
|
Intrinsic<[llvm_v4i32_ty],
|
|
[llvm_v8i16_ty, llvm_v8i16_ty, llvm_v4i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vpmacsww :
|
|
GCCBuiltin<"__builtin_ia32_vpmacsww">,
|
|
Intrinsic<[llvm_v8i16_ty],
|
|
[llvm_v8i16_ty, llvm_v8i16_ty, llvm_v8i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vpmadcsswd :
|
|
GCCBuiltin<"__builtin_ia32_vpmadcsswd">,
|
|
Intrinsic<[llvm_v4i32_ty],
|
|
[llvm_v8i16_ty, llvm_v8i16_ty, llvm_v4i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vpmadcswd :
|
|
GCCBuiltin<"__builtin_ia32_vpmadcswd">,
|
|
Intrinsic<[llvm_v4i32_ty],
|
|
[llvm_v8i16_ty, llvm_v8i16_ty, llvm_v4i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vpperm :
|
|
GCCBuiltin<"__builtin_ia32_vpperm">,
|
|
Intrinsic<[llvm_v16i8_ty],
|
|
[llvm_v16i8_ty, llvm_v16i8_ty, llvm_v16i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_xop_vprotb : GCCBuiltin<"__builtin_ia32_vprotb">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty, llvm_v16i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vprotd : GCCBuiltin<"__builtin_ia32_vprotd">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vprotq : GCCBuiltin<"__builtin_ia32_vprotq">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vprotw : GCCBuiltin<"__builtin_ia32_vprotw">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_v8i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vprotbi : GCCBuiltin<"__builtin_ia32_vprotbi">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vprotdi : GCCBuiltin<"__builtin_ia32_vprotdi">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vprotqi : GCCBuiltin<"__builtin_ia32_vprotqi">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vprotwi : GCCBuiltin<"__builtin_ia32_vprotwi">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_xop_vpshab :
|
|
GCCBuiltin<"__builtin_ia32_vpshab">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty, llvm_v16i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vpshad :
|
|
GCCBuiltin<"__builtin_ia32_vpshad">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vpshaq :
|
|
GCCBuiltin<"__builtin_ia32_vpshaq">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vpshaw :
|
|
GCCBuiltin<"__builtin_ia32_vpshaw">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_v8i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vpshlb :
|
|
GCCBuiltin<"__builtin_ia32_vpshlb">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty, llvm_v16i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vpshld :
|
|
GCCBuiltin<"__builtin_ia32_vpshld">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vpshlq :
|
|
GCCBuiltin<"__builtin_ia32_vpshlq">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_xop_vpshlw :
|
|
GCCBuiltin<"__builtin_ia32_vpshlw">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_v8i16_ty],
|
|
[IntrNoMem]>;
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// MMX
|
|
|
|
// Empty MMX state op.
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_mmx_emms : GCCBuiltin<"__builtin_ia32_emms">,
|
|
Intrinsic<[], [], []>;
|
|
def int_x86_mmx_femms : GCCBuiltin<"__builtin_ia32_femms">,
|
|
Intrinsic<[], [], []>;
|
|
}
|
|
|
|
// Integer arithmetic ops.
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
// Addition
|
|
def int_x86_mmx_padd_b : GCCBuiltin<"__builtin_ia32_paddb">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_mmx_padd_w : GCCBuiltin<"__builtin_ia32_paddw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_mmx_padd_d : GCCBuiltin<"__builtin_ia32_paddd">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_mmx_padd_q : GCCBuiltin<"__builtin_ia32_paddq">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_mmx_padds_b : GCCBuiltin<"__builtin_ia32_paddsb">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_mmx_padds_w : GCCBuiltin<"__builtin_ia32_paddsw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem, Commutative]>;
|
|
|
|
def int_x86_mmx_paddus_b : GCCBuiltin<"__builtin_ia32_paddusb">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_mmx_paddus_w : GCCBuiltin<"__builtin_ia32_paddusw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem, Commutative]>;
|
|
|
|
// Subtraction
|
|
def int_x86_mmx_psub_b : GCCBuiltin<"__builtin_ia32_psubb">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_mmx_psub_w : GCCBuiltin<"__builtin_ia32_psubw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_mmx_psub_d : GCCBuiltin<"__builtin_ia32_psubd">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_mmx_psub_q : GCCBuiltin<"__builtin_ia32_psubq">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_mmx_psubs_b : GCCBuiltin<"__builtin_ia32_psubsb">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_mmx_psubs_w : GCCBuiltin<"__builtin_ia32_psubsw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_mmx_psubus_b : GCCBuiltin<"__builtin_ia32_psubusb">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_mmx_psubus_w : GCCBuiltin<"__builtin_ia32_psubusw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
|
|
// Multiplication
|
|
def int_x86_mmx_pmulh_w : GCCBuiltin<"__builtin_ia32_pmulhw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_mmx_pmull_w : GCCBuiltin<"__builtin_ia32_pmullw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_mmx_pmulhu_w : GCCBuiltin<"__builtin_ia32_pmulhuw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_mmx_pmulu_dq : GCCBuiltin<"__builtin_ia32_pmuludq">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_mmx_pmadd_wd : GCCBuiltin<"__builtin_ia32_pmaddwd">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem, Commutative]>;
|
|
|
|
// Bitwise operations
|
|
def int_x86_mmx_pand : GCCBuiltin<"__builtin_ia32_pand">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_mmx_pandn : GCCBuiltin<"__builtin_ia32_pandn">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_mmx_por : GCCBuiltin<"__builtin_ia32_por">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_mmx_pxor : GCCBuiltin<"__builtin_ia32_pxor">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
|
|
// Averages
|
|
def int_x86_mmx_pavg_b : GCCBuiltin<"__builtin_ia32_pavgb">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_mmx_pavg_w : GCCBuiltin<"__builtin_ia32_pavgw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem, Commutative]>;
|
|
|
|
// Maximum
|
|
def int_x86_mmx_pmaxu_b : GCCBuiltin<"__builtin_ia32_pmaxub">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_mmx_pmaxs_w : GCCBuiltin<"__builtin_ia32_pmaxsw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem, Commutative]>;
|
|
|
|
// Minimum
|
|
def int_x86_mmx_pminu_b : GCCBuiltin<"__builtin_ia32_pminub">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_mmx_pmins_w : GCCBuiltin<"__builtin_ia32_pminsw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem, Commutative]>;
|
|
|
|
// Packed sum of absolute differences
|
|
def int_x86_mmx_psad_bw : GCCBuiltin<"__builtin_ia32_psadbw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem, Commutative]>;
|
|
}
|
|
|
|
// Integer shift ops.
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
// Shift left logical
|
|
def int_x86_mmx_psll_w : GCCBuiltin<"__builtin_ia32_psllw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_mmx_psll_d : GCCBuiltin<"__builtin_ia32_pslld">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_mmx_psll_q : GCCBuiltin<"__builtin_ia32_psllq">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_mmx_psrl_w : GCCBuiltin<"__builtin_ia32_psrlw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_mmx_psrl_d : GCCBuiltin<"__builtin_ia32_psrld">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_mmx_psrl_q : GCCBuiltin<"__builtin_ia32_psrlq">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_mmx_psra_w : GCCBuiltin<"__builtin_ia32_psraw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_mmx_psra_d : GCCBuiltin<"__builtin_ia32_psrad">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_mmx_pslli_w : GCCBuiltin<"__builtin_ia32_psllwi">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_mmx_pslli_d : GCCBuiltin<"__builtin_ia32_pslldi">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_mmx_pslli_q : GCCBuiltin<"__builtin_ia32_psllqi">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_mmx_psrli_w : GCCBuiltin<"__builtin_ia32_psrlwi">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_mmx_psrli_d : GCCBuiltin<"__builtin_ia32_psrldi">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_mmx_psrli_q : GCCBuiltin<"__builtin_ia32_psrlqi">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_mmx_psrai_w : GCCBuiltin<"__builtin_ia32_psrawi">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_mmx_psrai_d : GCCBuiltin<"__builtin_ia32_psradi">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Pack ops.
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_mmx_packsswb : GCCBuiltin<"__builtin_ia32_packsswb">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_mmx_packssdw : GCCBuiltin<"__builtin_ia32_packssdw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_mmx_packuswb : GCCBuiltin<"__builtin_ia32_packuswb">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Unpacking ops.
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_mmx_punpckhbw : GCCBuiltin<"__builtin_ia32_punpckhbw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_mmx_punpckhwd : GCCBuiltin<"__builtin_ia32_punpckhwd">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_mmx_punpckhdq : GCCBuiltin<"__builtin_ia32_punpckhdq">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_mmx_punpcklbw : GCCBuiltin<"__builtin_ia32_punpcklbw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_mmx_punpcklwd : GCCBuiltin<"__builtin_ia32_punpcklwd">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_mmx_punpckldq : GCCBuiltin<"__builtin_ia32_punpckldq">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty, llvm_x86mmx_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
|
|
// Integer comparison ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_mmx_pcmpeq_b : GCCBuiltin<"__builtin_ia32_pcmpeqb">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_mmx_pcmpeq_w : GCCBuiltin<"__builtin_ia32_pcmpeqw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem, Commutative]>;
|
|
def int_x86_mmx_pcmpeq_d : GCCBuiltin<"__builtin_ia32_pcmpeqd">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem, Commutative]>;
|
|
|
|
def int_x86_mmx_pcmpgt_b : GCCBuiltin<"__builtin_ia32_pcmpgtb">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_mmx_pcmpgt_w : GCCBuiltin<"__builtin_ia32_pcmpgtw">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
def int_x86_mmx_pcmpgt_d : GCCBuiltin<"__builtin_ia32_pcmpgtd">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Misc.
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_mmx_maskmovq : GCCBuiltin<"__builtin_ia32_maskmovq">,
|
|
Intrinsic<[], [llvm_x86mmx_ty, llvm_x86mmx_ty, llvm_ptr_ty], []>;
|
|
|
|
def int_x86_mmx_pmovmskb : GCCBuiltin<"__builtin_ia32_pmovmskb">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_x86mmx_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_mmx_movnt_dq : GCCBuiltin<"__builtin_ia32_movntq">,
|
|
Intrinsic<[], [llvm_ptrx86mmx_ty, llvm_x86mmx_ty], []>;
|
|
|
|
def int_x86_mmx_palignr_b : GCCBuiltin<"__builtin_ia32_palignr">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_x86mmx_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_mmx_pextr_w : GCCBuiltin<"__builtin_ia32_vec_ext_v4hi">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_x86mmx_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_mmx_pinsr_w : GCCBuiltin<"__builtin_ia32_vec_set_v4hi">,
|
|
Intrinsic<[llvm_x86mmx_ty], [llvm_x86mmx_ty,
|
|
llvm_i32_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// BMI
|
|
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_bmi_bextr_32 : GCCBuiltin<"__builtin_ia32_bextr_u32">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_i32_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_bmi_bextr_64 : GCCBuiltin<"__builtin_ia32_bextr_u64">,
|
|
Intrinsic<[llvm_i64_ty], [llvm_i64_ty, llvm_i64_ty], [IntrNoMem]>;
|
|
def int_x86_bmi_bzhi_32 : GCCBuiltin<"__builtin_ia32_bzhi_si">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_i32_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_bmi_bzhi_64 : GCCBuiltin<"__builtin_ia32_bzhi_di">,
|
|
Intrinsic<[llvm_i64_ty], [llvm_i64_ty, llvm_i64_ty], [IntrNoMem]>;
|
|
def int_x86_bmi_pdep_32 : GCCBuiltin<"__builtin_ia32_pdep_si">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_i32_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_bmi_pdep_64 : GCCBuiltin<"__builtin_ia32_pdep_di">,
|
|
Intrinsic<[llvm_i64_ty], [llvm_i64_ty, llvm_i64_ty], [IntrNoMem]>;
|
|
def int_x86_bmi_pext_32 : GCCBuiltin<"__builtin_ia32_pext_si">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_i32_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_bmi_pext_64 : GCCBuiltin<"__builtin_ia32_pext_di">,
|
|
Intrinsic<[llvm_i64_ty], [llvm_i64_ty, llvm_i64_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// FS/GS Base
|
|
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_rdfsbase_32 : GCCBuiltin<"__builtin_ia32_rdfsbase32">,
|
|
Intrinsic<[llvm_i32_ty], []>;
|
|
def int_x86_rdgsbase_32 : GCCBuiltin<"__builtin_ia32_rdgsbase32">,
|
|
Intrinsic<[llvm_i32_ty], []>;
|
|
def int_x86_rdfsbase_64 : GCCBuiltin<"__builtin_ia32_rdfsbase64">,
|
|
Intrinsic<[llvm_i64_ty], []>;
|
|
def int_x86_rdgsbase_64 : GCCBuiltin<"__builtin_ia32_rdgsbase64">,
|
|
Intrinsic<[llvm_i64_ty], []>;
|
|
def int_x86_wrfsbase_32 : GCCBuiltin<"__builtin_ia32_wrfsbase32">,
|
|
Intrinsic<[], [llvm_i32_ty]>;
|
|
def int_x86_wrgsbase_32 : GCCBuiltin<"__builtin_ia32_wrgsbase32">,
|
|
Intrinsic<[], [llvm_i32_ty]>;
|
|
def int_x86_wrfsbase_64 : GCCBuiltin<"__builtin_ia32_wrfsbase64">,
|
|
Intrinsic<[], [llvm_i64_ty]>;
|
|
def int_x86_wrgsbase_64 : GCCBuiltin<"__builtin_ia32_wrgsbase64">,
|
|
Intrinsic<[], [llvm_i64_ty]>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// FXSR
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_fxrstor : GCCBuiltin<"__builtin_ia32_fxrstor">,
|
|
Intrinsic<[], [llvm_ptr_ty], []>;
|
|
def int_x86_fxrstor64 : GCCBuiltin<"__builtin_ia32_fxrstor64">,
|
|
Intrinsic<[], [llvm_ptr_ty], []>;
|
|
def int_x86_fxsave : GCCBuiltin<"__builtin_ia32_fxsave">,
|
|
Intrinsic<[], [llvm_ptr_ty], []>;
|
|
def int_x86_fxsave64 : GCCBuiltin<"__builtin_ia32_fxsave64">,
|
|
Intrinsic<[], [llvm_ptr_ty], []>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// Half float conversion
|
|
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_vcvtph2ps_128 : GCCBuiltin<"__builtin_ia32_vcvtph2ps">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v8i16_ty], [IntrNoMem]>;
|
|
def int_x86_vcvtph2ps_256 : GCCBuiltin<"__builtin_ia32_vcvtph2ps256">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8i16_ty], [IntrNoMem]>;
|
|
def int_x86_vcvtps2ph_128 : GCCBuiltin<"__builtin_ia32_vcvtps2ph">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v4f32_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_vcvtps2ph_256 : GCCBuiltin<"__builtin_ia32_vcvtps2ph256">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8f32_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_vcvtph2ps_512 : GCCBuiltin<"__builtin_ia32_vcvtph2ps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16i16_ty, llvm_v16f32_ty,
|
|
llvm_i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_vcvtps2ph_512 : GCCBuiltin<"__builtin_ia32_vcvtps2ph512_mask">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16f32_ty, llvm_i32_ty,
|
|
llvm_v16i16_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// TBM
|
|
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_tbm_bextri_u32 : GCCBuiltin<"__builtin_ia32_bextri_u32">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_i32_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_tbm_bextri_u64 : GCCBuiltin<"__builtin_ia32_bextri_u64">,
|
|
Intrinsic<[llvm_i64_ty], [llvm_i64_ty, llvm_i64_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// RDRAND intrinsics - Return a random value and whether it is valid.
|
|
// RDSEED intrinsics - Return a NIST SP800-90B & C compliant random value and
|
|
// whether it is valid.
|
|
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
// These are declared side-effecting so they don't get eliminated by CSE or
|
|
// LICM.
|
|
def int_x86_rdrand_16 : Intrinsic<[llvm_i16_ty, llvm_i32_ty], [], []>;
|
|
def int_x86_rdrand_32 : Intrinsic<[llvm_i32_ty, llvm_i32_ty], [], []>;
|
|
def int_x86_rdrand_64 : Intrinsic<[llvm_i64_ty, llvm_i32_ty], [], []>;
|
|
def int_x86_rdseed_16 : Intrinsic<[llvm_i16_ty, llvm_i32_ty], [], []>;
|
|
def int_x86_rdseed_32 : Intrinsic<[llvm_i32_ty, llvm_i32_ty], [], []>;
|
|
def int_x86_rdseed_64 : Intrinsic<[llvm_i64_ty, llvm_i32_ty], [], []>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// ADX
|
|
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_addcarryx_u32: GCCBuiltin<"__builtin_ia32_addcarryx_u32">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_i8_ty, llvm_i32_ty, llvm_i32_ty,
|
|
llvm_ptr_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_addcarryx_u64: GCCBuiltin<"__builtin_ia32_addcarryx_u64">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_i8_ty, llvm_i64_ty, llvm_i64_ty,
|
|
llvm_ptr_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_addcarry_u32: GCCBuiltin<"__builtin_ia32_addcarry_u32">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_i8_ty, llvm_i32_ty, llvm_i32_ty,
|
|
llvm_ptr_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_addcarry_u64: GCCBuiltin<"__builtin_ia32_addcarry_u64">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_i8_ty, llvm_i64_ty, llvm_i64_ty,
|
|
llvm_ptr_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_subborrow_u32: GCCBuiltin<"__builtin_ia32_subborrow_u32">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_i8_ty, llvm_i32_ty, llvm_i32_ty,
|
|
llvm_ptr_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_subborrow_u64: GCCBuiltin<"__builtin_ia32_subborrow_u64">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_i8_ty, llvm_i64_ty, llvm_i64_ty,
|
|
llvm_ptr_ty], [IntrReadWriteArgMem]>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// RTM intrinsics. Transactional Memory support.
|
|
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_xbegin : GCCBuiltin<"__builtin_ia32_xbegin">,
|
|
Intrinsic<[llvm_i32_ty], [], []>;
|
|
def int_x86_xend : GCCBuiltin<"__builtin_ia32_xend">,
|
|
Intrinsic<[], [], []>;
|
|
def int_x86_xabort : GCCBuiltin<"__builtin_ia32_xabort">,
|
|
Intrinsic<[], [llvm_i8_ty], [IntrNoReturn]>;
|
|
def int_x86_xtest : GCCBuiltin<"__builtin_ia32_xtest">,
|
|
Intrinsic<[llvm_i32_ty], [], []>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// AVX512
|
|
|
|
// Mask ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
// Mask instructions
|
|
// 16-bit mask
|
|
def int_x86_avx512_kand_w : GCCBuiltin<"__builtin_ia32_kandhi">,
|
|
Intrinsic<[llvm_i16_ty], [llvm_i16_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_kandn_w : GCCBuiltin<"__builtin_ia32_kandnhi">,
|
|
Intrinsic<[llvm_i16_ty], [llvm_i16_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_knot_w : GCCBuiltin<"__builtin_ia32_knothi">,
|
|
Intrinsic<[llvm_i16_ty], [llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_kor_w : GCCBuiltin<"__builtin_ia32_korhi">,
|
|
Intrinsic<[llvm_i16_ty], [llvm_i16_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_kxor_w : GCCBuiltin<"__builtin_ia32_kxorhi">,
|
|
Intrinsic<[llvm_i16_ty], [llvm_i16_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_kxnor_w : GCCBuiltin<"__builtin_ia32_kxnorhi">,
|
|
Intrinsic<[llvm_i16_ty], [llvm_i16_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_kunpck_bw : GCCBuiltin<"__builtin_ia32_kunpckhi">,
|
|
Intrinsic<[llvm_i16_ty], [llvm_i16_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_kortestz_w : GCCBuiltin<"__builtin_ia32_kortestzhi">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_i16_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_kortestc_w : GCCBuiltin<"__builtin_ia32_kortestchi">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_i16_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
|
|
// Conversion ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx512_cvtss2usi : GCCBuiltin<"__builtin_ia32_cvtss2usi">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_cvtss2usi64 : GCCBuiltin<"__builtin_ia32_cvtss2usi64">,
|
|
Intrinsic<[llvm_i64_ty], [llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_cvttss2usi : GCCBuiltin<"__builtin_ia32_cvttss2usi">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_cvttss2usi64 : GCCBuiltin<"__builtin_ia32_cvttss2usi64">,
|
|
Intrinsic<[llvm_i64_ty], [llvm_v4f32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_cvtusi2ss : GCCBuiltin<"__builtin_ia32_cvtusi2ss32">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_i32_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_cvtusi642ss : GCCBuiltin<"__builtin_ia32_cvtusi2ss64">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_i64_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_cvtsd2usi : GCCBuiltin<"__builtin_ia32_cvtsd2usi">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_cvtsd2usi64 : GCCBuiltin<"__builtin_ia32_cvtsd2usi64">,
|
|
Intrinsic<[llvm_i64_ty], [llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_cvttsd2usi : GCCBuiltin<"__builtin_ia32_cvttsd2usi">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_cvttsd2usi64 : GCCBuiltin<"__builtin_ia32_cvttsd2usi64">,
|
|
Intrinsic<[llvm_i64_ty], [llvm_v2f64_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_cvtusi2sd : GCCBuiltin<"__builtin_ia32_cvtusi2sd32">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_cvtusi642sd : GCCBuiltin<"__builtin_ia32_cvtusi2sd64">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty,
|
|
llvm_i64_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_cvtsi2ss32 : GCCBuiltin<"__builtin_ia32_cvtsi2ss32">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_i32_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_cvtsi2ss64 : GCCBuiltin<"__builtin_ia32_cvtsi2ss64">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty,
|
|
llvm_i64_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_cvtsi2sd32 : GCCBuiltin<"__builtin_ia32_cvtsi2sd32">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty,
|
|
llvm_i32_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_cvtsi2sd64 : GCCBuiltin<"__builtin_ia32_cvtsi2sd64">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty,
|
|
llvm_i64_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Pack ops.
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx512_mask_packsswb_128 : GCCBuiltin<"__builtin_ia32_packsswb128_mask">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v8i16_ty, llvm_v8i16_ty,
|
|
llvm_v16i8_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_packsswb_256 : GCCBuiltin<"__builtin_ia32_packsswb256_mask">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v16i16_ty,llvm_v16i16_ty,
|
|
llvm_v32i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_packsswb_512 : GCCBuiltin<"__builtin_ia32_packsswb512_mask">,
|
|
Intrinsic<[llvm_v64i8_ty], [llvm_v32i16_ty,llvm_v32i16_ty,
|
|
llvm_v64i8_ty, llvm_i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_packssdw_128 : GCCBuiltin<"__builtin_ia32_packssdw128_mask">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v4i32_ty, llvm_v4i32_ty,
|
|
llvm_v8i16_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_packssdw_256 : GCCBuiltin<"__builtin_ia32_packssdw256_mask">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v8i32_ty, llvm_v8i32_ty,
|
|
llvm_v16i16_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_packssdw_512 : GCCBuiltin<"__builtin_ia32_packssdw512_mask">,
|
|
Intrinsic<[llvm_v32i16_ty], [llvm_v16i32_ty, llvm_v16i32_ty,
|
|
llvm_v32i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_packuswb_128 : GCCBuiltin<"__builtin_ia32_packuswb128_mask">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v8i16_ty, llvm_v8i16_ty,
|
|
llvm_v16i8_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_packuswb_256 : GCCBuiltin<"__builtin_ia32_packuswb256_mask">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v16i16_ty,llvm_v16i16_ty,
|
|
llvm_v32i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_packuswb_512 : GCCBuiltin<"__builtin_ia32_packuswb512_mask">,
|
|
Intrinsic<[llvm_v64i8_ty], [llvm_v32i16_ty,llvm_v32i16_ty,
|
|
llvm_v64i8_ty, llvm_i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_packusdw_128 : GCCBuiltin<"__builtin_ia32_packusdw128_mask">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v4i32_ty, llvm_v4i32_ty,
|
|
llvm_v8i16_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_packusdw_256 : GCCBuiltin<"__builtin_ia32_packusdw256_mask">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v8i32_ty, llvm_v8i32_ty,
|
|
llvm_v16i16_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_packusdw_512 : GCCBuiltin<"__builtin_ia32_packusdw512_mask">,
|
|
Intrinsic<[llvm_v32i16_ty], [llvm_v16i32_ty, llvm_v16i32_ty,
|
|
llvm_v32i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Vector convert
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx512_mask_cvttps2dq_512: GCCBuiltin<"__builtin_ia32_cvttps2dq512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16f32_ty, llvm_v16i32_ty,
|
|
llvm_i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cvttps2udq_512: GCCBuiltin<"__builtin_ia32_cvttps2udq512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16f32_ty, llvm_v16i32_ty,
|
|
llvm_i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cvttpd2dq_512: GCCBuiltin<"__builtin_ia32_cvttpd2dq512_mask">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8f64_ty, llvm_v8i32_ty,
|
|
llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cvttpd2udq_512: GCCBuiltin<"__builtin_ia32_cvttpd2udq512_mask">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8f64_ty, llvm_v8i32_ty,
|
|
llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_rndscale_ps_512: GCCBuiltin<"__builtin_ia32_rndscaleps_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_i32_ty, llvm_v16f32_ty,
|
|
llvm_i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_rndscale_pd_512: GCCBuiltin<"__builtin_ia32_rndscalepd_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_i32_ty, llvm_v8f64_ty,
|
|
llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cvtps2dq_512: GCCBuiltin<"__builtin_ia32_cvtps2dq512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16f32_ty, llvm_v16i32_ty,
|
|
llvm_i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cvtpd2dq_512: GCCBuiltin<"__builtin_ia32_cvtpd2dq512_mask">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8f64_ty, llvm_v8i32_ty,
|
|
llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cvtps2udq_512: GCCBuiltin<"__builtin_ia32_cvtps2udq512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16f32_ty, llvm_v16i32_ty,
|
|
llvm_i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cvtpd2udq_512: GCCBuiltin<"__builtin_ia32_cvtpd2udq512_mask">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8f64_ty, llvm_v8i32_ty,
|
|
llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cvtdq2ps_512 : GCCBuiltin<"__builtin_ia32_cvtdq2ps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16i32_ty, llvm_v16f32_ty,
|
|
llvm_i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cvtdq2pd_512 : GCCBuiltin<"__builtin_ia32_cvtdq2pd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8i32_ty, llvm_v8f64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cvtudq2ps_512 : GCCBuiltin<"__builtin_ia32_cvtudq2ps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16i32_ty, llvm_v16f32_ty,
|
|
llvm_i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cvtudq2pd_512 : GCCBuiltin<"__builtin_ia32_cvtudq2pd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8i32_ty, llvm_v8f64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cvtpd2ps_512 : GCCBuiltin<"__builtin_ia32_cvtpd2ps512_mask">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f64_ty, llvm_v8f32_ty,
|
|
llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Vector load with broadcast
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx512_vbroadcast_ss_512 :
|
|
GCCBuiltin<"__builtin_ia32_vbroadcastss512">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_ptr_ty], [IntrReadArgMem]>;
|
|
def int_x86_avx512_vbroadcast_ss_ps_512 :
|
|
GCCBuiltin<"__builtin_ia32_vbroadcastss_ps512">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v4f32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_vbroadcast_sd_512 :
|
|
GCCBuiltin<"__builtin_ia32_vbroadcastsd512">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_ptr_ty], [IntrReadArgMem]>;
|
|
def int_x86_avx512_vbroadcast_sd_pd_512 :
|
|
GCCBuiltin<"__builtin_ia32_vbroadcastsd_pd512">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v2f64_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_pbroadcastd_512 :
|
|
GCCBuiltin<"__builtin_ia32_pbroadcastd512">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v4i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_pbroadcastd_i32_512 :
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_pbroadcastq_512 :
|
|
GCCBuiltin<"__builtin_ia32_pbroadcastq512">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v2i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_pbroadcastq_i64_512 :
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_i64_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Vector sign and zero extend
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx512_pmovzxbq : GCCBuiltin<"__builtin_ia32_pmovzxbq512">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v16i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_pmovzxwd : GCCBuiltin<"__builtin_ia32_pmovzxwd512">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_pmovzxbd : GCCBuiltin<"__builtin_ia32_pmovzxbd512">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_pmovzxwq : GCCBuiltin<"__builtin_ia32_pmovzxwq512">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_pmovzxdq : GCCBuiltin<"__builtin_ia32_pmovzxdq512">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i32_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
//Bitwise Ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx512_mask_pand_d_128 : GCCBuiltin<"__builtin_ia32_pandd128_mask">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty,
|
|
llvm_v4i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pand_d_256 : GCCBuiltin<"__builtin_ia32_pandd256_mask">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty,
|
|
llvm_v8i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pand_d_512 : GCCBuiltin<"__builtin_ia32_pandd512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty,
|
|
llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pand_q_128 : GCCBuiltin<"__builtin_ia32_pandq128_mask">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty,
|
|
llvm_v2i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pand_q_256 : GCCBuiltin<"__builtin_ia32_pandq256_mask">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v4i64_ty, llvm_v4i64_ty,
|
|
llvm_v4i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pand_q_512 : GCCBuiltin<"__builtin_ia32_pandq512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty, llvm_v8i64_ty,
|
|
llvm_v8i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pandn_d_128 : GCCBuiltin<"__builtin_ia32_pandnd128_mask">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty,
|
|
llvm_v4i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pandn_d_256 : GCCBuiltin<"__builtin_ia32_pandnd256_mask">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty,
|
|
llvm_v8i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pandn_d_512 : GCCBuiltin<"__builtin_ia32_pandnd512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty,
|
|
llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pandn_q_128 : GCCBuiltin<"__builtin_ia32_pandnq128_mask">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty,
|
|
llvm_v2i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pandn_q_256 : GCCBuiltin<"__builtin_ia32_pandnq256_mask">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v4i64_ty, llvm_v4i64_ty,
|
|
llvm_v4i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pandn_q_512 : GCCBuiltin<"__builtin_ia32_pandnq512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty, llvm_v8i64_ty,
|
|
llvm_v8i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_por_d_128 : GCCBuiltin<"__builtin_ia32_pord128_mask">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty,
|
|
llvm_v4i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_por_d_256 : GCCBuiltin<"__builtin_ia32_pord256_mask">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty,
|
|
llvm_v8i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_por_d_512 : GCCBuiltin<"__builtin_ia32_pord512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty,
|
|
llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_por_q_128 : GCCBuiltin<"__builtin_ia32_porq128_mask">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty,
|
|
llvm_v2i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_por_q_256 : GCCBuiltin<"__builtin_ia32_porq256_mask">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v4i64_ty, llvm_v4i64_ty,
|
|
llvm_v4i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_por_q_512 : GCCBuiltin<"__builtin_ia32_porq512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty, llvm_v8i64_ty,
|
|
llvm_v8i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pxor_d_128 : GCCBuiltin<"__builtin_ia32_pxord128_mask">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty,
|
|
llvm_v4i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pxor_d_256 : GCCBuiltin<"__builtin_ia32_pxord256_mask">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty,
|
|
llvm_v8i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pxor_d_512 : GCCBuiltin<"__builtin_ia32_pxord512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty,
|
|
llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pxor_q_128 : GCCBuiltin<"__builtin_ia32_pxorq128_mask">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty,
|
|
llvm_v2i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pxor_q_256 : GCCBuiltin<"__builtin_ia32_pxorq256_mask">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v4i64_ty, llvm_v4i64_ty,
|
|
llvm_v4i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pxor_q_512 : GCCBuiltin<"__builtin_ia32_pxorq512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty, llvm_v8i64_ty,
|
|
llvm_v8i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
}
|
|
// Arithmetic ops
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
|
|
def int_x86_avx512_mask_add_ps_128 : GCCBuiltin<"__builtin_ia32_addps128_mask">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_add_ps_256 : GCCBuiltin<"__builtin_ia32_addps256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty, llvm_v8f32_ty,
|
|
llvm_v8f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_add_ps_512 : GCCBuiltin<"__builtin_ia32_addps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_v16f32_ty,
|
|
llvm_v16f32_ty, llvm_i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_add_pd_128 : GCCBuiltin<"__builtin_ia32_addpd128_mask">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_v2f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_add_pd_256 : GCCBuiltin<"__builtin_ia32_addpd256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty, llvm_v4f64_ty,
|
|
llvm_v4f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_add_pd_512 : GCCBuiltin<"__builtin_ia32_addpd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_v8f64_ty,
|
|
llvm_v8f64_ty, llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_sub_ps_128 : GCCBuiltin<"__builtin_ia32_subps128_mask">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_sub_ps_256 : GCCBuiltin<"__builtin_ia32_subps256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty, llvm_v8f32_ty,
|
|
llvm_v8f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_sub_ps_512 : GCCBuiltin<"__builtin_ia32_subps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_v16f32_ty,
|
|
llvm_v16f32_ty, llvm_i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_sub_pd_128 : GCCBuiltin<"__builtin_ia32_subpd128_mask">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_v2f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_sub_pd_256 : GCCBuiltin<"__builtin_ia32_subpd256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty, llvm_v4f64_ty,
|
|
llvm_v4f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_sub_pd_512 : GCCBuiltin<"__builtin_ia32_subpd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_v8f64_ty,
|
|
llvm_v8f64_ty, llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_mul_ps_128 : GCCBuiltin<"__builtin_ia32_mulps_mask">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_mul_ps_256 : GCCBuiltin<"__builtin_ia32_mulps256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty, llvm_v8f32_ty,
|
|
llvm_v8f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_mul_ps_512 : GCCBuiltin<"__builtin_ia32_mulps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_v16f32_ty,
|
|
llvm_v16f32_ty, llvm_i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_mul_pd_128 : GCCBuiltin<"__builtin_ia32_mulpd_mask">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_v2f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_mul_pd_256 : GCCBuiltin<"__builtin_ia32_mulpd256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty, llvm_v4f64_ty,
|
|
llvm_v4f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_mul_pd_512 : GCCBuiltin<"__builtin_ia32_mulpd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_v8f64_ty,
|
|
llvm_v8f64_ty, llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_div_ps_128 : GCCBuiltin<"__builtin_ia32_divps_mask">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_div_ps_256 : GCCBuiltin<"__builtin_ia32_divps256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty, llvm_v8f32_ty,
|
|
llvm_v8f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_div_ps_512 : GCCBuiltin<"__builtin_ia32_divps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_v16f32_ty,
|
|
llvm_v16f32_ty, llvm_i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_div_pd_128 : GCCBuiltin<"__builtin_ia32_divpd_mask">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_v2f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_div_pd_256 : GCCBuiltin<"__builtin_ia32_divpd256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty, llvm_v4f64_ty,
|
|
llvm_v4f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_div_pd_512 : GCCBuiltin<"__builtin_ia32_divpd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_v8f64_ty,
|
|
llvm_v8f64_ty, llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_max_ps_128 : GCCBuiltin<"__builtin_ia32_maxps_mask">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_max_ps_256 : GCCBuiltin<"__builtin_ia32_maxps256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty, llvm_v8f32_ty,
|
|
llvm_v8f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_max_ps_512 : GCCBuiltin<"__builtin_ia32_maxps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_v16f32_ty,
|
|
llvm_v16f32_ty, llvm_i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_max_pd_128 : GCCBuiltin<"__builtin_ia32_maxpd_mask">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_v2f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_max_pd_256 : GCCBuiltin<"__builtin_ia32_maxpd256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty, llvm_v4f64_ty,
|
|
llvm_v4f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_max_pd_512 : GCCBuiltin<"__builtin_ia32_maxpd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_v8f64_ty,
|
|
llvm_v8f64_ty, llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_min_ps_128 : GCCBuiltin<"__builtin_ia32_minps_mask">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_min_ps_256 : GCCBuiltin<"__builtin_ia32_minps256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty, llvm_v8f32_ty,
|
|
llvm_v8f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_min_ps_512 : GCCBuiltin<"__builtin_ia32_minps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_v16f32_ty,
|
|
llvm_v16f32_ty, llvm_i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_min_pd_128 : GCCBuiltin<"__builtin_ia32_minpd_mask">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_v2f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_min_pd_256 : GCCBuiltin<"__builtin_ia32_minpd256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty, llvm_v4f64_ty,
|
|
llvm_v4f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_min_pd_512 : GCCBuiltin<"__builtin_ia32_minpd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_v8f64_ty,
|
|
llvm_v8f64_ty, llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_add_ss_round : GCCBuiltin<"__builtin_ia32_addss_round">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_div_ss_round : GCCBuiltin<"__builtin_ia32_divss_round">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_mul_ss_round : GCCBuiltin<"__builtin_ia32_mulss_round">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_sub_ss_round : GCCBuiltin<"__builtin_ia32_subss_round">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_max_ss_round : GCCBuiltin<"__builtin_ia32_maxss_round">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_min_ss_round : GCCBuiltin<"__builtin_ia32_minss_round">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_add_sd_round : GCCBuiltin<"__builtin_ia32_addsd_round">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_v2f64_ty, llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_div_sd_round : GCCBuiltin<"__builtin_ia32_divsd_round">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_v2f64_ty, llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_mul_sd_round : GCCBuiltin<"__builtin_ia32_mulsd_round">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_v2f64_ty, llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_sub_sd_round : GCCBuiltin<"__builtin_ia32_subsd_round">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_v2f64_ty, llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_max_sd_round : GCCBuiltin<"__builtin_ia32_maxsd_round">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_v2f64_ty, llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_min_sd_round : GCCBuiltin<"__builtin_ia32_minsd_round">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_v2f64_ty, llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_rndscale_ss : GCCBuiltin<"__builtin_ia32_rndscaless_mask">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_i8_ty, llvm_i32_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_rndscale_sd : GCCBuiltin<"__builtin_ia32_rndscalesd_mask">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_i8_ty, llvm_i32_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_scalef_pd_128 : GCCBuiltin<"__builtin_ia32_scalefpd128_mask">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_v2f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_scalef_pd_256 : GCCBuiltin<"__builtin_ia32_scalefpd256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty, llvm_v4f64_ty,
|
|
llvm_v4f64_ty, llvm_i8_ty],[IntrNoMem]>;
|
|
def int_x86_avx512_mask_scalef_pd_512 : GCCBuiltin<"__builtin_ia32_scalefpd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_v8f64_ty,
|
|
llvm_v8f64_ty, llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_scalef_ps_128 : GCCBuiltin<"__builtin_ia32_scalefps128_mask">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_scalef_ps_256 : GCCBuiltin<"__builtin_ia32_scalefps256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty, llvm_v8f32_ty,
|
|
llvm_v8f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_scalef_ps_512 : GCCBuiltin<"__builtin_ia32_scalefps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_v16f32_ty,
|
|
llvm_v16f32_ty, llvm_i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_sqrt_ss : GCCBuiltin<"__builtin_ia32_sqrtrndss">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_sqrt_sd : GCCBuiltin<"__builtin_ia32_sqrtrndsd">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_sqrt_pd_128 : GCCBuiltin<"__builtin_ia32_sqrtpd128_mask">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_sqrt_pd_256 : GCCBuiltin<"__builtin_ia32_sqrtpd256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty, llvm_v4f64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_sqrt_pd_512 : GCCBuiltin<"__builtin_ia32_sqrtpd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_v8f64_ty,
|
|
llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_sqrt_ps_128 : GCCBuiltin<"__builtin_ia32_sqrtps128_mask">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_sqrt_ps_256 : GCCBuiltin<"__builtin_ia32_sqrtps256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty, llvm_v8f32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_sqrt_ps_512 : GCCBuiltin<"__builtin_ia32_sqrtps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_v16f32_ty,
|
|
llvm_i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_getexp_pd_128 : GCCBuiltin<"__builtin_ia32_getexppd128_mask">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_getexp_pd_256 : GCCBuiltin<"__builtin_ia32_getexppd256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty, llvm_v4f64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_getexp_pd_512 : GCCBuiltin<"__builtin_ia32_getexppd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_v8f64_ty,
|
|
llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_getexp_ps_128 : GCCBuiltin<"__builtin_ia32_getexpps128_mask">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_getexp_ps_256 : GCCBuiltin<"__builtin_ia32_getexpps256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty, llvm_v8f32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_getexp_ps_512 : GCCBuiltin<"__builtin_ia32_getexpps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_v16f32_ty,
|
|
llvm_i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_rsqrt14_ss : GCCBuiltin<"__builtin_ia32_rsqrt14ss_mask">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_rsqrt14_sd : GCCBuiltin<"__builtin_ia32_rsqrt14sd_mask">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_rsqrt14_pd_512 : GCCBuiltin<"__builtin_ia32_rsqrt14pd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_v8f64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_rsqrt14_ps_512 : GCCBuiltin<"__builtin_ia32_rsqrt14ps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_v16f32_ty,
|
|
llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_rcp14_ss : GCCBuiltin<"__builtin_ia32_rcp14ss_mask">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_rcp14_sd : GCCBuiltin<"__builtin_ia32_rcp14sd_mask">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_rcp14_pd_512 : GCCBuiltin<"__builtin_ia32_rcp14pd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_v8f64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_rcp14_ps_512 : GCCBuiltin<"__builtin_ia32_rcp14ps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_v16f32_ty,
|
|
llvm_i16_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_rcp28_ps : GCCBuiltin<"__builtin_ia32_rcp28ps_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_v16f32_ty,
|
|
llvm_i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_rcp28_pd : GCCBuiltin<"__builtin_ia32_rcp28pd_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_v8f64_ty,
|
|
llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_exp2_ps : GCCBuiltin<"__builtin_ia32_exp2ps_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_v16f32_ty,
|
|
llvm_i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_exp2_pd : GCCBuiltin<"__builtin_ia32_exp2pd_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_v8f64_ty,
|
|
llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_rcp28_ss : GCCBuiltin<"__builtin_ia32_rcp28ss_mask">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_rcp28_sd : GCCBuiltin<"__builtin_ia32_rcp28sd_mask">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_v2f64_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_rsqrt28_ps : GCCBuiltin<"__builtin_ia32_rsqrt28ps_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_v16f32_ty,
|
|
llvm_i16_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_rsqrt28_pd : GCCBuiltin<"__builtin_ia32_rsqrt28pd_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_v8f64_ty,
|
|
llvm_i8_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_rsqrt28_ss : GCCBuiltin<"__builtin_ia32_rsqrt28ss_mask">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_rsqrt28_sd : GCCBuiltin<"__builtin_ia32_rsqrt28sd_mask">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_v2f64_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
// FP logical ops
|
|
let TargetPrefix = "x86" in {
|
|
def int_x86_avx512_mask_and_pd_128 : GCCBuiltin<"__builtin_ia32_andpd128_mask">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_v2f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_and_pd_256 : GCCBuiltin<"__builtin_ia32_andpd256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty, llvm_v4f64_ty,
|
|
llvm_v4f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_and_pd_512 : GCCBuiltin<"__builtin_ia32_andpd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_v8f64_ty,
|
|
llvm_v8f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_and_ps_128 : GCCBuiltin<"__builtin_ia32_andps128_mask">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_and_ps_256 : GCCBuiltin<"__builtin_ia32_andps256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty, llvm_v8f32_ty,
|
|
llvm_v8f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_and_ps_512 : GCCBuiltin<"__builtin_ia32_andps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_v16f32_ty,
|
|
llvm_v16f32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_andn_pd_128 : GCCBuiltin<"__builtin_ia32_andnpd128_mask">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_v2f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_andn_pd_256 : GCCBuiltin<"__builtin_ia32_andnpd256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty, llvm_v4f64_ty,
|
|
llvm_v4f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_andn_pd_512 : GCCBuiltin<"__builtin_ia32_andnpd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_v8f64_ty,
|
|
llvm_v8f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_andn_ps_128 : GCCBuiltin<"__builtin_ia32_andnps128_mask">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_andn_ps_256 : GCCBuiltin<"__builtin_ia32_andnps256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty, llvm_v8f32_ty,
|
|
llvm_v8f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_andn_ps_512 : GCCBuiltin<"__builtin_ia32_andnps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_v16f32_ty,
|
|
llvm_v16f32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_or_pd_128 : GCCBuiltin<"__builtin_ia32_orpd128_mask">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_v2f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_or_pd_256 : GCCBuiltin<"__builtin_ia32_orpd256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty, llvm_v4f64_ty,
|
|
llvm_v4f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_or_pd_512 : GCCBuiltin<"__builtin_ia32_orpd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_v8f64_ty,
|
|
llvm_v8f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_or_ps_128 : GCCBuiltin<"__builtin_ia32_orps128_mask">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_or_ps_256 : GCCBuiltin<"__builtin_ia32_orps256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty, llvm_v8f32_ty,
|
|
llvm_v8f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_or_ps_512 : GCCBuiltin<"__builtin_ia32_orps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_v16f32_ty,
|
|
llvm_v16f32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_xor_pd_128 : GCCBuiltin<"__builtin_ia32_xorpd128_mask">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_v2f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_xor_pd_256 : GCCBuiltin<"__builtin_ia32_xorpd256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty, llvm_v4f64_ty,
|
|
llvm_v4f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_xor_pd_512 : GCCBuiltin<"__builtin_ia32_xorpd512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_v8f64_ty,
|
|
llvm_v8f64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_xor_ps_128 : GCCBuiltin<"__builtin_ia32_xorps128_mask">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_v4f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_xor_ps_256 : GCCBuiltin<"__builtin_ia32_xorps256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty, llvm_v8f32_ty,
|
|
llvm_v8f32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_xor_ps_512 : GCCBuiltin<"__builtin_ia32_xorps512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_v16f32_ty,
|
|
llvm_v16f32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
}
|
|
// Integer arithmetic ops
|
|
let TargetPrefix = "x86" in {
|
|
def int_x86_avx512_mask_padd_b_128 : GCCBuiltin<"__builtin_ia32_paddb128_mask">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty, llvm_v16i8_ty,
|
|
llvm_v16i8_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_padd_b_256 : GCCBuiltin<"__builtin_ia32_paddb256_mask">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty, llvm_v32i8_ty,
|
|
llvm_v32i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_padd_b_512 : GCCBuiltin<"__builtin_ia32_paddb512_mask">,
|
|
Intrinsic<[llvm_v64i8_ty], [llvm_v64i8_ty, llvm_v64i8_ty,
|
|
llvm_v64i8_ty, llvm_i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_padd_w_128 : GCCBuiltin<"__builtin_ia32_paddw128_mask">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_v8i16_ty,
|
|
llvm_v8i16_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_padd_w_256 : GCCBuiltin<"__builtin_ia32_paddw256_mask">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty, llvm_v16i16_ty,
|
|
llvm_v16i16_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_padd_w_512 : GCCBuiltin<"__builtin_ia32_paddw512_mask">,
|
|
Intrinsic<[llvm_v32i16_ty], [llvm_v32i16_ty, llvm_v32i16_ty,
|
|
llvm_v32i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_padds_b_128 : GCCBuiltin<"__builtin_ia32_paddsb128_mask">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty, llvm_v16i8_ty,
|
|
llvm_v16i8_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_padds_b_256 : GCCBuiltin<"__builtin_ia32_paddsb256_mask">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty, llvm_v32i8_ty,
|
|
llvm_v32i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_padds_b_512 : GCCBuiltin<"__builtin_ia32_paddsb512_mask">,
|
|
Intrinsic<[llvm_v64i8_ty], [llvm_v64i8_ty, llvm_v64i8_ty,
|
|
llvm_v64i8_ty, llvm_i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_padds_w_128 : GCCBuiltin<"__builtin_ia32_paddsw128_mask">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_v8i16_ty,
|
|
llvm_v8i16_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_padds_w_256 : GCCBuiltin<"__builtin_ia32_paddsw256_mask">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty, llvm_v16i16_ty,
|
|
llvm_v16i16_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_padds_w_512 : GCCBuiltin<"__builtin_ia32_paddsw512_mask">,
|
|
Intrinsic<[llvm_v32i16_ty], [llvm_v32i16_ty, llvm_v32i16_ty,
|
|
llvm_v32i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_paddus_b_128 : GCCBuiltin<"__builtin_ia32_paddusb128_mask">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty, llvm_v16i8_ty,
|
|
llvm_v16i8_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_paddus_b_256 : GCCBuiltin<"__builtin_ia32_paddusb256_mask">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty, llvm_v32i8_ty,
|
|
llvm_v32i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_paddus_b_512 : GCCBuiltin<"__builtin_ia32_paddusb512_mask">,
|
|
Intrinsic<[llvm_v64i8_ty], [llvm_v64i8_ty, llvm_v64i8_ty,
|
|
llvm_v64i8_ty, llvm_i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_paddus_w_128 : GCCBuiltin<"__builtin_ia32_paddusw128_mask">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_v8i16_ty,
|
|
llvm_v8i16_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_paddus_w_256 : GCCBuiltin<"__builtin_ia32_paddusw256_mask">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty, llvm_v16i16_ty,
|
|
llvm_v16i16_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_paddus_w_512 : GCCBuiltin<"__builtin_ia32_paddusw512_mask">,
|
|
Intrinsic<[llvm_v32i16_ty], [llvm_v32i16_ty, llvm_v32i16_ty,
|
|
llvm_v32i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_padd_d_128 : GCCBuiltin<"__builtin_ia32_paddd128_mask">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty,
|
|
llvm_v4i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_padd_d_256 : GCCBuiltin<"__builtin_ia32_paddd256_mask">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty,
|
|
llvm_v8i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_padd_d_512 : GCCBuiltin<"__builtin_ia32_paddd512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty,
|
|
llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_padd_q_128 : GCCBuiltin<"__builtin_ia32_paddq128_mask">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty,
|
|
llvm_v2i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_padd_q_256 : GCCBuiltin<"__builtin_ia32_paddq256_mask">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v4i64_ty, llvm_v4i64_ty,
|
|
llvm_v4i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_padd_q_512 : GCCBuiltin<"__builtin_ia32_paddq512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty, llvm_v8i64_ty,
|
|
llvm_v8i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psub_b_128 : GCCBuiltin<"__builtin_ia32_psubb128_mask">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty, llvm_v16i8_ty,
|
|
llvm_v16i8_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psub_b_256 : GCCBuiltin<"__builtin_ia32_psubb256_mask">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty, llvm_v32i8_ty,
|
|
llvm_v32i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psub_b_512 : GCCBuiltin<"__builtin_ia32_psubb512_mask">,
|
|
Intrinsic<[llvm_v64i8_ty], [llvm_v64i8_ty, llvm_v64i8_ty,
|
|
llvm_v64i8_ty, llvm_i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psub_w_128 : GCCBuiltin<"__builtin_ia32_psubw128_mask">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_v8i16_ty,
|
|
llvm_v8i16_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psub_w_256 : GCCBuiltin<"__builtin_ia32_psubw256_mask">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty, llvm_v16i16_ty,
|
|
llvm_v16i16_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psub_w_512 : GCCBuiltin<"__builtin_ia32_psubw512_mask">,
|
|
Intrinsic<[llvm_v32i16_ty], [llvm_v32i16_ty, llvm_v32i16_ty,
|
|
llvm_v32i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psubs_b_128 : GCCBuiltin<"__builtin_ia32_psubsb128_mask">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty, llvm_v16i8_ty,
|
|
llvm_v16i8_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psubs_b_256 : GCCBuiltin<"__builtin_ia32_psubsb256_mask">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty, llvm_v32i8_ty,
|
|
llvm_v32i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psubs_b_512 : GCCBuiltin<"__builtin_ia32_psubsb512_mask">,
|
|
Intrinsic<[llvm_v64i8_ty], [llvm_v64i8_ty, llvm_v64i8_ty,
|
|
llvm_v64i8_ty, llvm_i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psubs_w_128 : GCCBuiltin<"__builtin_ia32_psubsw128_mask">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_v8i16_ty,
|
|
llvm_v8i16_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psubs_w_256 : GCCBuiltin<"__builtin_ia32_psubsw256_mask">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty, llvm_v16i16_ty,
|
|
llvm_v16i16_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psubs_w_512 : GCCBuiltin<"__builtin_ia32_psubsw512_mask">,
|
|
Intrinsic<[llvm_v32i16_ty], [llvm_v32i16_ty, llvm_v32i16_ty,
|
|
llvm_v32i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psubus_b_128 : GCCBuiltin<"__builtin_ia32_psubusb128_mask">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty, llvm_v16i8_ty,
|
|
llvm_v16i8_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psubus_b_256 : GCCBuiltin<"__builtin_ia32_psubusb256_mask">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty, llvm_v32i8_ty,
|
|
llvm_v32i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psubus_b_512 : GCCBuiltin<"__builtin_ia32_psubusb512_mask">,
|
|
Intrinsic<[llvm_v64i8_ty], [llvm_v64i8_ty, llvm_v64i8_ty,
|
|
llvm_v64i8_ty, llvm_i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psubus_w_128 : GCCBuiltin<"__builtin_ia32_psubusw128_mask">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_v8i16_ty,
|
|
llvm_v8i16_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psubus_w_256 : GCCBuiltin<"__builtin_ia32_psubusw256_mask">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty, llvm_v16i16_ty,
|
|
llvm_v16i16_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psubus_w_512 : GCCBuiltin<"__builtin_ia32_psubusw512_mask">,
|
|
Intrinsic<[llvm_v32i16_ty], [llvm_v32i16_ty, llvm_v32i16_ty,
|
|
llvm_v32i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psub_d_128 : GCCBuiltin<"__builtin_ia32_psubd128_mask">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty,
|
|
llvm_v4i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psub_d_256 : GCCBuiltin<"__builtin_ia32_psubd256_mask">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty,
|
|
llvm_v8i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psub_d_512 : GCCBuiltin<"__builtin_ia32_psubd512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty,
|
|
llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psub_q_128 : GCCBuiltin<"__builtin_ia32_psubq128_mask">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty,
|
|
llvm_v2i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psub_q_256 : GCCBuiltin<"__builtin_ia32_psubq256_mask">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v4i64_ty, llvm_v4i64_ty,
|
|
llvm_v4i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_psub_q_512 : GCCBuiltin<"__builtin_ia32_psubq512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty, llvm_v8i64_ty,
|
|
llvm_v8i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmulu_dq_128 : GCCBuiltin<"__builtin_ia32_pmuludq128_mask">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v4i32_ty, llvm_v4i32_ty,
|
|
llvm_v2i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmul_dq_128 : GCCBuiltin<"__builtin_ia32_pmuldq128_mask">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v4i32_ty, llvm_v4i32_ty,
|
|
llvm_v2i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmulu_dq_256 : GCCBuiltin<"__builtin_ia32_pmuludq256_mask">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v8i32_ty, llvm_v8i32_ty,
|
|
llvm_v4i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmul_dq_256 : GCCBuiltin<"__builtin_ia32_pmuldq256_mask">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v8i32_ty, llvm_v8i32_ty,
|
|
llvm_v4i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmulu_dq_512 : GCCBuiltin<"__builtin_ia32_pmuludq512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v16i32_ty, llvm_v16i32_ty,
|
|
llvm_v8i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmul_dq_512 : GCCBuiltin<"__builtin_ia32_pmuldq512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v16i32_ty, llvm_v16i32_ty,
|
|
llvm_v8i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmull_w_128 : GCCBuiltin<"__builtin_ia32_pmullw128_mask">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_v8i16_ty,
|
|
llvm_v8i16_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmull_w_256 : GCCBuiltin<"__builtin_ia32_pmullw256_mask">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty, llvm_v16i16_ty,
|
|
llvm_v16i16_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmull_w_512 : GCCBuiltin<"__builtin_ia32_pmullw512_mask">,
|
|
Intrinsic<[llvm_v32i16_ty], [llvm_v32i16_ty, llvm_v32i16_ty,
|
|
llvm_v32i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmull_d_128 : GCCBuiltin<"__builtin_ia32_pmulld128_mask">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty,
|
|
llvm_v4i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmull_d_256 : GCCBuiltin<"__builtin_ia32_pmulld256_mask">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty,
|
|
llvm_v8i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmull_d_512 : GCCBuiltin<"__builtin_ia32_pmulld512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty,
|
|
llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmull_q_128 : GCCBuiltin<"__builtin_ia32_pmullq128_mask">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty,
|
|
llvm_v2i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmull_q_256 : GCCBuiltin<"__builtin_ia32_pmullq256_mask">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v4i64_ty, llvm_v4i64_ty,
|
|
llvm_v4i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmull_q_512 : GCCBuiltin<"__builtin_ia32_pmullq512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty, llvm_v8i64_ty,
|
|
llvm_v8i64_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmulhu_w_512 : GCCBuiltin<"__builtin_ia32_pmulhuw512_mask">,
|
|
Intrinsic<[llvm_v32i16_ty], [llvm_v32i16_ty, llvm_v32i16_ty,
|
|
llvm_v32i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmulh_w_512 : GCCBuiltin<"__builtin_ia32_pmulhw512_mask">,
|
|
Intrinsic<[llvm_v32i16_ty], [llvm_v32i16_ty, llvm_v32i16_ty,
|
|
llvm_v32i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmulhu_w_128 : GCCBuiltin<"__builtin_ia32_pmulhuw128_mask">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_v8i16_ty,
|
|
llvm_v8i16_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmulhu_w_256 : GCCBuiltin<"__builtin_ia32_pmulhuw256_mask">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty, llvm_v16i16_ty,
|
|
llvm_v16i16_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmulh_w_128 : GCCBuiltin<"__builtin_ia32_pmulhw128_mask">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_v8i16_ty,
|
|
llvm_v8i16_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pmulh_w_256 : GCCBuiltin<"__builtin_ia32_pmulhw256_mask">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty, llvm_v16i16_ty,
|
|
llvm_v16i16_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pavg_b_512 : GCCBuiltin<"__builtin_ia32_pavgb512_mask">,
|
|
Intrinsic<[llvm_v64i8_ty], [llvm_v64i8_ty, llvm_v64i8_ty,
|
|
llvm_v64i8_ty, llvm_i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pavg_w_512 : GCCBuiltin<"__builtin_ia32_pavgw512_mask">,
|
|
Intrinsic<[llvm_v32i16_ty], [llvm_v32i16_ty, llvm_v32i16_ty,
|
|
llvm_v32i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pavg_b_128 : GCCBuiltin<"__builtin_ia32_pavgb128_mask">,
|
|
Intrinsic<[llvm_v16i8_ty], [llvm_v16i8_ty, llvm_v16i8_ty,
|
|
llvm_v16i8_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pavg_b_256 : GCCBuiltin<"__builtin_ia32_pavgb256_mask">,
|
|
Intrinsic<[llvm_v32i8_ty], [llvm_v32i8_ty, llvm_v32i8_ty,
|
|
llvm_v32i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pavg_w_128 : GCCBuiltin<"__builtin_ia32_pavgw128_mask">,
|
|
Intrinsic<[llvm_v8i16_ty], [llvm_v8i16_ty, llvm_v8i16_ty,
|
|
llvm_v8i16_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_pavg_w_256 : GCCBuiltin<"__builtin_ia32_pavgw256_mask">,
|
|
Intrinsic<[llvm_v16i16_ty], [llvm_v16i16_ty, llvm_v16i16_ty,
|
|
llvm_v16i16_ty, llvm_i16_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Gather and Scatter ops
|
|
let TargetPrefix = "x86" in {
|
|
def int_x86_avx512_gather_dpd_512 : GCCBuiltin<"__builtin_ia32_gathersiv8df">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_ptr_ty,
|
|
llvm_v8i32_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx512_gather_dps_512 : GCCBuiltin<"__builtin_ia32_gathersiv16sf">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_ptr_ty,
|
|
llvm_v16i32_ty, llvm_i16_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx512_gather_qpd_512 : GCCBuiltin<"__builtin_ia32_gatherdiv8df">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_ptr_ty,
|
|
llvm_v8i64_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx512_gather_qps_512 : GCCBuiltin<"__builtin_ia32_gatherdiv16sf">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty, llvm_ptr_ty,
|
|
llvm_v8i64_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
|
|
|
|
def int_x86_avx512_gather_dpq_512 : GCCBuiltin<"__builtin_ia32_gathersiv8di">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty, llvm_ptr_ty,
|
|
llvm_v8i32_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx512_gather_dpi_512 : GCCBuiltin<"__builtin_ia32_gathersiv16si">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_ptr_ty,
|
|
llvm_v16i32_ty, llvm_i16_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx512_gather_qpq_512 : GCCBuiltin<"__builtin_ia32_gatherdiv8di">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty, llvm_ptr_ty,
|
|
llvm_v8i64_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
def int_x86_avx512_gather_qpi_512 : GCCBuiltin<"__builtin_ia32_gatherdiv16si">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_ptr_ty,
|
|
llvm_v8i64_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
|
|
def int_x86_avx512_gather3div2_df :
|
|
GCCBuiltin<"__builtin_ia32_gather3div2df">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_ptr_ty, llvm_v2i64_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
|
|
def int_x86_avx512_gather3div2_di :
|
|
GCCBuiltin<"__builtin_ia32_gather3div2di">,
|
|
Intrinsic<[llvm_v4i32_ty],
|
|
[llvm_v2i64_ty, llvm_ptr_ty, llvm_v2i64_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
|
|
def int_x86_avx512_gather3div4_df :
|
|
GCCBuiltin<"__builtin_ia32_gather3div4df">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_ptr_ty, llvm_v4i64_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
|
|
def int_x86_avx512_gather3div4_di :
|
|
GCCBuiltin<"__builtin_ia32_gather3div4di">,
|
|
Intrinsic<[llvm_v8i32_ty],
|
|
[llvm_v4i64_ty, llvm_ptr_ty, llvm_v4i64_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
|
|
def int_x86_avx512_gather3div4_sf :
|
|
GCCBuiltin<"__builtin_ia32_gather3div4sf">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_ptr_ty, llvm_v2i64_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
|
|
def int_x86_avx512_gather3div4_si :
|
|
GCCBuiltin<"__builtin_ia32_gather3div4si">,
|
|
Intrinsic<[llvm_v4i32_ty],
|
|
[llvm_v4i32_ty, llvm_ptr_ty, llvm_v2i64_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
|
|
def int_x86_avx512_gather3div8_sf :
|
|
GCCBuiltin<"__builtin_ia32_gather3div8sf">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_ptr_ty, llvm_v4i64_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
|
|
def int_x86_avx512_gather3div8_si :
|
|
GCCBuiltin<"__builtin_ia32_gather3div8si">,
|
|
Intrinsic<[llvm_v4i32_ty],
|
|
[llvm_v4i32_ty, llvm_ptr_ty, llvm_v4i64_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
|
|
def int_x86_avx512_gather3siv2_df :
|
|
GCCBuiltin<"__builtin_ia32_gather3siv2df">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_ptr_ty, llvm_v4i32_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
|
|
def int_x86_avx512_gather3siv2_di :
|
|
GCCBuiltin<"__builtin_ia32_gather3siv2di">,
|
|
Intrinsic<[llvm_v4i32_ty],
|
|
[llvm_v2i64_ty, llvm_ptr_ty, llvm_v4i32_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
|
|
def int_x86_avx512_gather3siv4_df :
|
|
GCCBuiltin<"__builtin_ia32_gather3siv4df">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_ptr_ty, llvm_v4i32_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
|
|
def int_x86_avx512_gather3siv4_di :
|
|
GCCBuiltin<"__builtin_ia32_gather3siv4di">,
|
|
Intrinsic<[llvm_v8i32_ty],
|
|
[llvm_v4i64_ty, llvm_ptr_ty, llvm_v4i32_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
|
|
def int_x86_avx512_gather3siv4_sf :
|
|
GCCBuiltin<"__builtin_ia32_gather3siv4sf">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_ptr_ty, llvm_v4i32_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
|
|
def int_x86_avx512_gather3siv4_si :
|
|
GCCBuiltin<"__builtin_ia32_gather3siv4si">,
|
|
Intrinsic<[llvm_v4i32_ty],
|
|
[llvm_v4i32_ty, llvm_ptr_ty, llvm_v4i32_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
|
|
def int_x86_avx512_gather3siv8_sf :
|
|
GCCBuiltin<"__builtin_ia32_gather3siv8sf">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8f32_ty, llvm_ptr_ty, llvm_v8i32_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
|
|
def int_x86_avx512_gather3siv8_si :
|
|
GCCBuiltin<"__builtin_ia32_gather3siv8si">,
|
|
Intrinsic<[llvm_v8i32_ty],
|
|
[llvm_v8i32_ty, llvm_ptr_ty, llvm_v8i32_ty, llvm_i8_ty, llvm_i32_ty],
|
|
[IntrReadArgMem]>;
|
|
|
|
// scatter
|
|
def int_x86_avx512_scatter_dpd_512 : GCCBuiltin<"__builtin_ia32_scattersiv8df">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_i8_ty,
|
|
llvm_v8i32_ty, llvm_v8f64_ty, llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_scatter_dps_512 : GCCBuiltin<"__builtin_ia32_scattersiv16sf">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_i16_ty,
|
|
llvm_v16i32_ty, llvm_v16f32_ty, llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_scatter_qpd_512 : GCCBuiltin<"__builtin_ia32_scatterdiv8df">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_i8_ty,
|
|
llvm_v8i64_ty, llvm_v8f64_ty, llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_scatter_qps_512 : GCCBuiltin<"__builtin_ia32_scatterdiv16sf">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_i8_ty,
|
|
llvm_v8i64_ty, llvm_v8f32_ty, llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
|
|
|
|
def int_x86_avx512_scatter_dpq_512 : GCCBuiltin<"__builtin_ia32_scattersiv8di">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_i8_ty,
|
|
llvm_v8i32_ty, llvm_v8i64_ty, llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_scatter_dpi_512 : GCCBuiltin<"__builtin_ia32_scattersiv16si">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_i16_ty,
|
|
llvm_v16i32_ty, llvm_v16i32_ty, llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_scatter_qpq_512 : GCCBuiltin<"__builtin_ia32_scatterdiv8di">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_i8_ty,llvm_v8i64_ty, llvm_v8i64_ty,
|
|
llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_scatter_qpi_512 : GCCBuiltin<"__builtin_ia32_scatterdiv16si">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_i8_ty, llvm_v8i64_ty, llvm_v8i32_ty,
|
|
llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
|
|
def int_x86_avx512_scatterdiv2_df :
|
|
GCCBuiltin<"__builtin_ia32_scatterdiv2df">,
|
|
Intrinsic<[],
|
|
[llvm_ptr_ty, llvm_i8_ty, llvm_v2i64_ty, llvm_v2f64_ty, llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
|
|
def int_x86_avx512_scatterdiv2_di :
|
|
GCCBuiltin<"__builtin_ia32_scatterdiv2di">,
|
|
Intrinsic<[],
|
|
[llvm_ptr_ty, llvm_i8_ty, llvm_v2i64_ty, llvm_v2i64_ty, llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
|
|
def int_x86_avx512_scatterdiv4_df :
|
|
GCCBuiltin<"__builtin_ia32_scatterdiv4df">,
|
|
Intrinsic<[],
|
|
[llvm_ptr_ty, llvm_i8_ty, llvm_v4i64_ty, llvm_v4f64_ty, llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
|
|
def int_x86_avx512_scatterdiv4_di :
|
|
GCCBuiltin<"__builtin_ia32_scatterdiv4di">,
|
|
Intrinsic<[],
|
|
[llvm_ptr_ty, llvm_i8_ty, llvm_v4i64_ty, llvm_v4i64_ty, llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
|
|
def int_x86_avx512_scatterdiv4_sf :
|
|
GCCBuiltin<"__builtin_ia32_scatterdiv4sf">,
|
|
Intrinsic<[],
|
|
[llvm_ptr_ty, llvm_i8_ty, llvm_v2i64_ty, llvm_v4f32_ty, llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
|
|
def int_x86_avx512_scatterdiv4_si :
|
|
GCCBuiltin<"__builtin_ia32_scatterdiv4si">,
|
|
Intrinsic<[],
|
|
[llvm_ptr_ty, llvm_i8_ty, llvm_v2i64_ty, llvm_v4i32_ty, llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
|
|
def int_x86_avx512_scatterdiv8_sf :
|
|
GCCBuiltin<"__builtin_ia32_scatterdiv8sf">,
|
|
Intrinsic<[],
|
|
[llvm_ptr_ty, llvm_i8_ty, llvm_v4i64_ty, llvm_v4f32_ty, llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
|
|
def int_x86_avx512_scatterdiv8_si :
|
|
GCCBuiltin<"__builtin_ia32_scatterdiv8si">,
|
|
Intrinsic<[],
|
|
[llvm_ptr_ty, llvm_i8_ty, llvm_v4i64_ty, llvm_v4i32_ty, llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
|
|
def int_x86_avx512_scattersiv2_df :
|
|
GCCBuiltin<"__builtin_ia32_scattersiv2df">,
|
|
Intrinsic<[],
|
|
[llvm_ptr_ty, llvm_i8_ty, llvm_v4i32_ty, llvm_v2f64_ty, llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
|
|
def int_x86_avx512_scattersiv2_di :
|
|
GCCBuiltin<"__builtin_ia32_scattersiv2di">,
|
|
Intrinsic<[],
|
|
[llvm_ptr_ty, llvm_i8_ty, llvm_v4i32_ty, llvm_v2i64_ty, llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
|
|
def int_x86_avx512_scattersiv4_df :
|
|
GCCBuiltin<"__builtin_ia32_scattersiv4df">,
|
|
Intrinsic<[],
|
|
[llvm_ptr_ty, llvm_i8_ty, llvm_v4i32_ty, llvm_v4f64_ty, llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
|
|
def int_x86_avx512_scattersiv4_di :
|
|
GCCBuiltin<"__builtin_ia32_scattersiv4di">,
|
|
Intrinsic<[],
|
|
[llvm_ptr_ty, llvm_i8_ty, llvm_v4i32_ty, llvm_v4i64_ty, llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
|
|
def int_x86_avx512_scattersiv4_sf :
|
|
GCCBuiltin<"__builtin_ia32_scattersiv4sf">,
|
|
Intrinsic<[],
|
|
[llvm_ptr_ty, llvm_i8_ty, llvm_v4i32_ty, llvm_v4f32_ty, llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
|
|
def int_x86_avx512_scattersiv4_si :
|
|
GCCBuiltin<"__builtin_ia32_scattersiv4si">,
|
|
Intrinsic<[],
|
|
[llvm_ptr_ty, llvm_i8_ty, llvm_v4i32_ty, llvm_v4i32_ty, llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
|
|
def int_x86_avx512_scattersiv8_sf :
|
|
GCCBuiltin<"__builtin_ia32_scattersiv8sf">,
|
|
Intrinsic<[],
|
|
[llvm_ptr_ty, llvm_i8_ty, llvm_v8i32_ty, llvm_v8f32_ty, llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
|
|
def int_x86_avx512_scattersiv8_si :
|
|
GCCBuiltin<"__builtin_ia32_scattersiv8si">,
|
|
Intrinsic<[],
|
|
[llvm_ptr_ty, llvm_i8_ty, llvm_v8i32_ty, llvm_v8i32_ty, llvm_i32_ty],
|
|
[IntrReadWriteArgMem]>;
|
|
|
|
// gather prefetch
|
|
def int_x86_avx512_gatherpf_dpd_512 : GCCBuiltin<"__builtin_ia32_gatherpfdpd">,
|
|
Intrinsic<[], [llvm_i8_ty, llvm_v8i32_ty, llvm_ptr_ty,
|
|
llvm_i32_ty, llvm_i32_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_gatherpf_dps_512 : GCCBuiltin<"__builtin_ia32_gatherpfdps">,
|
|
Intrinsic<[], [llvm_i16_ty, llvm_v16i32_ty, llvm_ptr_ty,
|
|
llvm_i32_ty, llvm_i32_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_gatherpf_qpd_512 : GCCBuiltin<"__builtin_ia32_gatherpfqpd">,
|
|
Intrinsic<[], [llvm_i8_ty, llvm_v8i64_ty, llvm_ptr_ty,
|
|
llvm_i32_ty, llvm_i32_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_gatherpf_qps_512 : GCCBuiltin<"__builtin_ia32_gatherpfqps">,
|
|
Intrinsic<[], [llvm_i8_ty, llvm_v8i64_ty, llvm_ptr_ty,
|
|
llvm_i32_ty, llvm_i32_ty], [IntrReadWriteArgMem]>;
|
|
|
|
// scatter prefetch
|
|
def int_x86_avx512_scatterpf_dpd_512 : GCCBuiltin<"__builtin_ia32_scatterpfdpd">,
|
|
Intrinsic<[], [llvm_i8_ty, llvm_v8i32_ty, llvm_ptr_ty,
|
|
llvm_i32_ty, llvm_i32_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_scatterpf_dps_512 : GCCBuiltin<"__builtin_ia32_scatterpfdps">,
|
|
Intrinsic<[], [llvm_i16_ty, llvm_v16i32_ty, llvm_ptr_ty,
|
|
llvm_i32_ty, llvm_i32_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_scatterpf_qpd_512 : GCCBuiltin<"__builtin_ia32_scatterpfqpd">,
|
|
Intrinsic<[], [llvm_i8_ty, llvm_v8i64_ty, llvm_ptr_ty,
|
|
llvm_i32_ty, llvm_i32_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_scatterpf_qps_512 : GCCBuiltin<"__builtin_ia32_scatterpfqps">,
|
|
Intrinsic<[], [llvm_i8_ty, llvm_v8i64_ty, llvm_ptr_ty,
|
|
llvm_i32_ty, llvm_i32_ty], [IntrReadWriteArgMem]>;
|
|
}
|
|
|
|
// AVX-512 conflict detection
|
|
let TargetPrefix = "x86" in {
|
|
def int_x86_avx512_mask_conflict_d_512 :
|
|
GCCBuiltin<"__builtin_ia32_vpconflictsi_512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty,
|
|
llvm_v16i32_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_conflict_q_512 :
|
|
GCCBuiltin<"__builtin_ia32_vpconflictdi_512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty,
|
|
llvm_v8i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_lzcnt_d_512 :
|
|
GCCBuiltin<"__builtin_ia32_vplzcntd_512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty,
|
|
llvm_v16i32_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_lzcnt_q_512 :
|
|
GCCBuiltin<"__builtin_ia32_vplzcntq_512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty,
|
|
llvm_v8i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
|
|
// Vector blend
|
|
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
|
|
def int_x86_avx512_mask_blend_ps_512 : GCCBuiltin<"__builtin_ia32_blendmps_512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty],
|
|
[llvm_v16f32_ty, llvm_v16f32_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_blend_ps_256 : GCCBuiltin<"__builtin_ia32_blendmps_256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty],
|
|
[llvm_v8f32_ty, llvm_v8f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_blend_ps_128 : GCCBuiltin<"__builtin_ia32_blendmps_128_mask">,
|
|
Intrinsic<[llvm_v4f32_ty],
|
|
[llvm_v4f32_ty, llvm_v4f32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_blend_pd_512 : GCCBuiltin<"__builtin_ia32_blendmpd_512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty],
|
|
[llvm_v8f64_ty, llvm_v8f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_blend_pd_256 : GCCBuiltin<"__builtin_ia32_blendmpd_256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty],
|
|
[llvm_v4f64_ty, llvm_v4f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_blend_pd_128 : GCCBuiltin<"__builtin_ia32_blendmpd_128_mask">,
|
|
Intrinsic<[llvm_v2f64_ty],
|
|
[llvm_v2f64_ty, llvm_v2f64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_blend_d_512 : GCCBuiltin<"__builtin_ia32_blendmd_512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty],
|
|
[llvm_v16i32_ty, llvm_v16i32_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_blend_q_512 : GCCBuiltin<"__builtin_ia32_blendmq_512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty],
|
|
[llvm_v8i64_ty, llvm_v8i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_blend_d_256 : GCCBuiltin<"__builtin_ia32_blendmd_256_mask">,
|
|
Intrinsic<[llvm_v8i32_ty],
|
|
[llvm_v8i32_ty, llvm_v8i32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_blend_q_256 : GCCBuiltin<"__builtin_ia32_blendmq_256_mask">,
|
|
Intrinsic<[llvm_v4i64_ty],
|
|
[llvm_v4i64_ty, llvm_v4i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_blend_d_128 : GCCBuiltin<"__builtin_ia32_blendmd_128_mask">,
|
|
Intrinsic<[llvm_v4i32_ty],
|
|
[llvm_v4i32_ty, llvm_v4i32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_blend_q_128 : GCCBuiltin<"__builtin_ia32_blendmq_128_mask">,
|
|
Intrinsic<[llvm_v2i64_ty],
|
|
[llvm_v2i64_ty, llvm_v2i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_blend_w_512 : GCCBuiltin<"__builtin_ia32_blendmw_512_mask">,
|
|
Intrinsic<[llvm_v32i16_ty],
|
|
[llvm_v32i16_ty, llvm_v32i16_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_blend_w_256 : GCCBuiltin<"__builtin_ia32_blendmw_256_mask">,
|
|
Intrinsic<[llvm_v16i16_ty],
|
|
[llvm_v16i16_ty, llvm_v16i16_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_blend_w_128 : GCCBuiltin<"__builtin_ia32_blendmw_128_mask">,
|
|
Intrinsic<[llvm_v8i16_ty],
|
|
[llvm_v8i16_ty, llvm_v8i16_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_blend_b_512 : GCCBuiltin<"__builtin_ia32_blendmb_512_mask">,
|
|
Intrinsic<[llvm_v64i8_ty],
|
|
[llvm_v64i8_ty, llvm_v64i8_ty, llvm_i64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_blend_b_256 : GCCBuiltin<"__builtin_ia32_blendmb_256_mask">,
|
|
Intrinsic<[llvm_v32i8_ty],
|
|
[llvm_v32i8_ty, llvm_v32i8_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_blend_b_128 : GCCBuiltin<"__builtin_ia32_blendmb_128_mask">,
|
|
Intrinsic<[llvm_v16i8_ty],
|
|
[llvm_v16i8_ty, llvm_v16i8_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
|
|
}
|
|
|
|
let TargetPrefix = "x86" in {
|
|
def int_x86_avx512_mask_valign_q_512 : GCCBuiltin<"__builtin_ia32_alignq512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty],
|
|
[llvm_v8i64_ty, llvm_v8i64_ty, llvm_i8_ty, llvm_v8i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_valign_d_512 : GCCBuiltin<"__builtin_ia32_alignd512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty],
|
|
[llvm_v16i32_ty, llvm_v16i32_ty, llvm_i8_ty, llvm_v16i32_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
}
|
|
|
|
// Compares
|
|
let TargetPrefix = "x86" in {
|
|
// 512-bit
|
|
def int_x86_avx512_mask_pcmpeq_b_512 : GCCBuiltin<"__builtin_ia32_pcmpeqb512_mask">,
|
|
Intrinsic<[llvm_i64_ty], [llvm_v64i8_ty, llvm_v64i8_ty, llvm_i64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_pcmpeq_w_512 : GCCBuiltin<"__builtin_ia32_pcmpeqw512_mask">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v32i16_ty, llvm_v32i16_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_pcmpeq_d_512 : GCCBuiltin<"__builtin_ia32_pcmpeqd512_mask">,
|
|
Intrinsic<[llvm_i16_ty], [llvm_v16i32_ty, llvm_v16i32_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_pcmpeq_q_512 : GCCBuiltin<"__builtin_ia32_pcmpeqq512_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v8i64_ty, llvm_v8i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_pcmpgt_b_512: GCCBuiltin<"__builtin_ia32_pcmpgtb512_mask">,
|
|
Intrinsic<[llvm_i64_ty], [llvm_v64i8_ty, llvm_v64i8_ty, llvm_i64_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_pcmpgt_w_512: GCCBuiltin<"__builtin_ia32_pcmpgtw512_mask">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v32i16_ty, llvm_v32i16_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_pcmpgt_d_512: GCCBuiltin<"__builtin_ia32_pcmpgtd512_mask">,
|
|
Intrinsic<[llvm_i16_ty], [llvm_v16i32_ty, llvm_v16i32_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_pcmpgt_q_512: GCCBuiltin<"__builtin_ia32_pcmpgtq512_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v8i64_ty, llvm_v8i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_cmp_b_512: GCCBuiltin<"__builtin_ia32_cmpb512_mask">,
|
|
Intrinsic<[llvm_i64_ty], [llvm_v64i8_ty, llvm_v64i8_ty, llvm_i32_ty,
|
|
llvm_i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cmp_w_512: GCCBuiltin<"__builtin_ia32_cmpw512_mask">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v32i16_ty, llvm_v32i16_ty, llvm_i32_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cmp_d_512: GCCBuiltin<"__builtin_ia32_cmpd512_mask">,
|
|
Intrinsic<[llvm_i16_ty], [llvm_v16i32_ty, llvm_v16i32_ty, llvm_i32_ty,
|
|
llvm_i16_ty], [IntrNoMem ]>;
|
|
def int_x86_avx512_mask_cmp_q_512: GCCBuiltin<"__builtin_ia32_cmpq512_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v8i64_ty, llvm_v8i64_ty, llvm_i32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_ucmp_b_512: GCCBuiltin<"__builtin_ia32_ucmpb512_mask">,
|
|
Intrinsic<[llvm_i64_ty], [llvm_v64i8_ty, llvm_v64i8_ty, llvm_i32_ty,
|
|
llvm_i64_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_ucmp_w_512: GCCBuiltin<"__builtin_ia32_ucmpw512_mask">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v32i16_ty, llvm_v32i16_ty, llvm_i32_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_ucmp_d_512: GCCBuiltin<"__builtin_ia32_ucmpd512_mask">,
|
|
Intrinsic<[llvm_i16_ty], [llvm_v16i32_ty, llvm_v16i32_ty, llvm_i32_ty,
|
|
llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_ucmp_q_512: GCCBuiltin<"__builtin_ia32_ucmpq512_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v8i64_ty, llvm_v8i64_ty, llvm_i32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
|
|
// 256-bit
|
|
def int_x86_avx512_mask_pcmpeq_b_256 : GCCBuiltin<"__builtin_ia32_pcmpeqb256_mask">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v32i8_ty, llvm_v32i8_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_pcmpeq_w_256 : GCCBuiltin<"__builtin_ia32_pcmpeqw256_mask">,
|
|
Intrinsic<[llvm_i16_ty], [llvm_v16i16_ty, llvm_v16i16_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_pcmpeq_d_256 : GCCBuiltin<"__builtin_ia32_pcmpeqd256_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v8i32_ty, llvm_v8i32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_pcmpeq_q_256 : GCCBuiltin<"__builtin_ia32_pcmpeqq256_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v4i64_ty, llvm_v4i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_pcmpgt_b_256: GCCBuiltin<"__builtin_ia32_pcmpgtb256_mask">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v32i8_ty, llvm_v32i8_ty, llvm_i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_pcmpgt_w_256: GCCBuiltin<"__builtin_ia32_pcmpgtw256_mask">,
|
|
Intrinsic<[llvm_i16_ty], [llvm_v16i16_ty, llvm_v16i16_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_pcmpgt_d_256: GCCBuiltin<"__builtin_ia32_pcmpgtd256_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v8i32_ty, llvm_v8i32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_pcmpgt_q_256: GCCBuiltin<"__builtin_ia32_pcmpgtq256_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v4i64_ty, llvm_v4i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_cmp_b_256: GCCBuiltin<"__builtin_ia32_cmpb256_mask">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v32i8_ty, llvm_v32i8_ty, llvm_i32_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cmp_w_256: GCCBuiltin<"__builtin_ia32_cmpw256_mask">,
|
|
Intrinsic<[llvm_i16_ty], [llvm_v16i16_ty, llvm_v16i16_ty, llvm_i32_ty,
|
|
llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cmp_d_256: GCCBuiltin<"__builtin_ia32_cmpd256_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v8i32_ty, llvm_v8i32_ty, llvm_i32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cmp_q_256: GCCBuiltin<"__builtin_ia32_cmpq256_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v4i64_ty, llvm_v4i64_ty, llvm_i32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_ucmp_b_256: GCCBuiltin<"__builtin_ia32_ucmpb256_mask">,
|
|
Intrinsic<[llvm_i32_ty], [llvm_v32i8_ty, llvm_v32i8_ty, llvm_i32_ty,
|
|
llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_ucmp_w_256: GCCBuiltin<"__builtin_ia32_ucmpw256_mask">,
|
|
Intrinsic<[llvm_i16_ty], [llvm_v16i16_ty, llvm_v16i16_ty, llvm_i32_ty,
|
|
llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_ucmp_d_256: GCCBuiltin<"__builtin_ia32_ucmpd256_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v8i32_ty, llvm_v8i32_ty, llvm_i32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_ucmp_q_256: GCCBuiltin<"__builtin_ia32_ucmpq256_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v4i64_ty, llvm_v4i64_ty, llvm_i32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
|
|
// 128-bit
|
|
def int_x86_avx512_mask_pcmpeq_b_128 : GCCBuiltin<"__builtin_ia32_pcmpeqb128_mask">,
|
|
Intrinsic<[llvm_i16_ty], [llvm_v16i8_ty, llvm_v16i8_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_pcmpeq_w_128 : GCCBuiltin<"__builtin_ia32_pcmpeqw128_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v8i16_ty, llvm_v8i16_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_pcmpeq_d_128 : GCCBuiltin<"__builtin_ia32_pcmpeqd128_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v4i32_ty, llvm_v4i32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_pcmpeq_q_128 : GCCBuiltin<"__builtin_ia32_pcmpeqq128_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v2i64_ty, llvm_v2i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_pcmpgt_b_128: GCCBuiltin<"__builtin_ia32_pcmpgtb128_mask">,
|
|
Intrinsic<[llvm_i16_ty], [llvm_v16i8_ty, llvm_v16i8_ty, llvm_i16_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_pcmpgt_w_128: GCCBuiltin<"__builtin_ia32_pcmpgtw128_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v8i16_ty, llvm_v8i16_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_pcmpgt_d_128: GCCBuiltin<"__builtin_ia32_pcmpgtd128_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v4i32_ty, llvm_v4i32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_avx512_mask_pcmpgt_q_128: GCCBuiltin<"__builtin_ia32_pcmpgtq128_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v2i64_ty, llvm_v2i64_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_cmp_b_128: GCCBuiltin<"__builtin_ia32_cmpb128_mask">,
|
|
Intrinsic<[llvm_i16_ty], [llvm_v16i8_ty, llvm_v16i8_ty, llvm_i32_ty,
|
|
llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cmp_w_128: GCCBuiltin<"__builtin_ia32_cmpw128_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v8i16_ty, llvm_v8i16_ty, llvm_i32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cmp_d_128: GCCBuiltin<"__builtin_ia32_cmpd128_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v4i32_ty, llvm_v4i32_ty, llvm_i32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cmp_q_128: GCCBuiltin<"__builtin_ia32_cmpq128_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v2i64_ty, llvm_v2i64_ty, llvm_i32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_ucmp_b_128: GCCBuiltin<"__builtin_ia32_ucmpb128_mask">,
|
|
Intrinsic<[llvm_i16_ty], [llvm_v16i8_ty, llvm_v16i8_ty, llvm_i32_ty,
|
|
llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_ucmp_w_128: GCCBuiltin<"__builtin_ia32_ucmpw128_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v8i16_ty, llvm_v8i16_ty, llvm_i32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_ucmp_d_128: GCCBuiltin<"__builtin_ia32_ucmpd128_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v4i32_ty, llvm_v4i32_ty, llvm_i32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_ucmp_q_128: GCCBuiltin<"__builtin_ia32_ucmpq128_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v2i64_ty, llvm_v2i64_ty, llvm_i32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
}
|
|
|
|
// Compress, Expand
|
|
let TargetPrefix = "x86" in {
|
|
def int_x86_avx512_mask_compress_ps_512 :
|
|
GCCBuiltin<"__builtin_ia32_compresssf512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_v16f32_ty,
|
|
llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_compress_pd_512 :
|
|
GCCBuiltin<"__builtin_ia32_compressdf512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_v8f64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_compress_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_compresssf256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty, llvm_v8f32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_compress_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_compressdf256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty, llvm_v4f64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_compress_ps_128 :
|
|
GCCBuiltin<"__builtin_ia32_compresssf128_mask">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_compress_pd_128 :
|
|
GCCBuiltin<"__builtin_ia32_compressdf128_mask">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_compress_store_ps_512 :
|
|
GCCBuiltin<"__builtin_ia32_compressstoresf512_mask">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v16f32_ty,
|
|
llvm_i16_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_mask_compress_store_pd_512 :
|
|
GCCBuiltin<"__builtin_ia32_compressstoredf512_mask">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v8f64_ty,
|
|
llvm_i8_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_mask_compress_store_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_compressstoresf256_mask">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v8f32_ty,
|
|
llvm_i8_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_mask_compress_store_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_compressstoredf256_mask">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v4f64_ty,
|
|
llvm_i8_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_mask_compress_store_ps_128 :
|
|
GCCBuiltin<"__builtin_ia32_compressstoresf128_mask">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v4f32_ty,
|
|
llvm_i8_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_mask_compress_store_pd_128 :
|
|
GCCBuiltin<"__builtin_ia32_compressstoredf128_mask">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v2f64_ty,
|
|
llvm_i8_ty], [IntrReadWriteArgMem]>;
|
|
|
|
def int_x86_avx512_mask_compress_d_512 :
|
|
GCCBuiltin<"__builtin_ia32_compresssi512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty,
|
|
llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_compress_q_512 :
|
|
GCCBuiltin<"__builtin_ia32_compressdi512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty, llvm_v8i64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_compress_d_256 :
|
|
GCCBuiltin<"__builtin_ia32_compresssi256_mask">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_compress_q_256 :
|
|
GCCBuiltin<"__builtin_ia32_compressdi256_mask">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v4i64_ty, llvm_v4i64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_compress_d_128 :
|
|
GCCBuiltin<"__builtin_ia32_compresssi128_mask">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_compress_q_128 :
|
|
GCCBuiltin<"__builtin_ia32_compressdi128_mask">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_compress_store_d_512 :
|
|
GCCBuiltin<"__builtin_ia32_compressstoresi512_mask">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v16i32_ty,
|
|
llvm_i16_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_mask_compress_store_q_512 :
|
|
GCCBuiltin<"__builtin_ia32_compressstoredi512_mask">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v8i64_ty,
|
|
llvm_i8_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_mask_compress_store_d_256 :
|
|
GCCBuiltin<"__builtin_ia32_compressstoresi256_mask">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v8i32_ty,
|
|
llvm_i8_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_mask_compress_store_q_256 :
|
|
GCCBuiltin<"__builtin_ia32_compressstoredi256_mask">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v4i64_ty,
|
|
llvm_i8_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_mask_compress_store_d_128 :
|
|
GCCBuiltin<"__builtin_ia32_compressstoresi128_mask">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v4i32_ty,
|
|
llvm_i8_ty], [IntrReadWriteArgMem]>;
|
|
def int_x86_avx512_mask_compress_store_q_128 :
|
|
GCCBuiltin<"__builtin_ia32_compressstoredi128_mask">,
|
|
Intrinsic<[], [llvm_ptr_ty, llvm_v2i64_ty,
|
|
llvm_i8_ty], [IntrReadWriteArgMem]>;
|
|
|
|
// expand
|
|
def int_x86_avx512_mask_expand_ps_512 :
|
|
GCCBuiltin<"__builtin_ia32_expandsf512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_v16f32_ty,
|
|
llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_expand_pd_512 :
|
|
GCCBuiltin<"__builtin_ia32_expanddf512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_v8f64_ty, llvm_v8f64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_expand_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_expandsf256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_v8f32_ty, llvm_v8f32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_expand_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_expanddf256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty, llvm_v4f64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_expand_ps_128 :
|
|
GCCBuiltin<"__builtin_ia32_expandsf128_mask">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_expand_pd_128 :
|
|
GCCBuiltin<"__builtin_ia32_expanddf128_mask">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_expand_load_ps_512 :
|
|
GCCBuiltin<"__builtin_ia32_expandloadsf512_mask">,
|
|
Intrinsic<[llvm_v16f32_ty], [llvm_ptr_ty, llvm_v16f32_ty,
|
|
llvm_i16_ty], [IntrReadArgMem]>;
|
|
def int_x86_avx512_mask_expand_load_pd_512 :
|
|
GCCBuiltin<"__builtin_ia32_expandloaddf512_mask">,
|
|
Intrinsic<[llvm_v8f64_ty], [llvm_ptr_ty, llvm_v8f64_ty,
|
|
llvm_i8_ty], [IntrReadArgMem]>;
|
|
def int_x86_avx512_mask_expand_load_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_expandloadsf256_mask">,
|
|
Intrinsic<[llvm_v8f32_ty], [llvm_ptr_ty, llvm_v8f32_ty,
|
|
llvm_i8_ty], [IntrReadArgMem]>;
|
|
def int_x86_avx512_mask_expand_load_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_expandloaddf256_mask">,
|
|
Intrinsic<[llvm_v4f64_ty], [llvm_ptr_ty, llvm_v4f64_ty,
|
|
llvm_i8_ty], [IntrReadArgMem]>;
|
|
def int_x86_avx512_mask_expand_load_ps_128 :
|
|
GCCBuiltin<"__builtin_ia32_expandloadsf128_mask">,
|
|
Intrinsic<[llvm_v4f32_ty], [llvm_ptr_ty, llvm_v4f32_ty,
|
|
llvm_i8_ty], [IntrReadArgMem]>;
|
|
def int_x86_avx512_mask_expand_load_pd_128 :
|
|
GCCBuiltin<"__builtin_ia32_expandloaddf128_mask">,
|
|
Intrinsic<[llvm_v2f64_ty], [llvm_ptr_ty, llvm_v2f64_ty,
|
|
llvm_i8_ty], [IntrReadArgMem]>;
|
|
|
|
def int_x86_avx512_mask_expand_d_512 :
|
|
GCCBuiltin<"__builtin_ia32_expandsi512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty,
|
|
llvm_i16_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_expand_q_512 :
|
|
GCCBuiltin<"__builtin_ia32_expanddi512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_v8i64_ty, llvm_v8i64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_expand_d_256 :
|
|
GCCBuiltin<"__builtin_ia32_expandsi256_mask">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_expand_q_256 :
|
|
GCCBuiltin<"__builtin_ia32_expanddi256_mask">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_v4i64_ty, llvm_v4i64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_expand_d_128 :
|
|
GCCBuiltin<"__builtin_ia32_expandsi128_mask">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_expand_q_128 :
|
|
GCCBuiltin<"__builtin_ia32_expanddi128_mask">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_v2i64_ty, llvm_v2i64_ty,
|
|
llvm_i8_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_mask_expand_load_d_512 :
|
|
GCCBuiltin<"__builtin_ia32_expandloadsi512_mask">,
|
|
Intrinsic<[llvm_v16i32_ty], [llvm_ptr_ty, llvm_v16i32_ty,
|
|
llvm_i16_ty], [IntrReadArgMem]>;
|
|
def int_x86_avx512_mask_expand_load_q_512 :
|
|
GCCBuiltin<"__builtin_ia32_expandloaddi512_mask">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_ptr_ty, llvm_v8i64_ty,
|
|
llvm_i8_ty], [IntrReadArgMem]>;
|
|
def int_x86_avx512_mask_expand_load_d_256 :
|
|
GCCBuiltin<"__builtin_ia32_expandloadsi256_mask">,
|
|
Intrinsic<[llvm_v8i32_ty], [llvm_ptr_ty, llvm_v8i32_ty,
|
|
llvm_i8_ty], [IntrReadArgMem]>;
|
|
def int_x86_avx512_mask_expand_load_q_256 :
|
|
GCCBuiltin<"__builtin_ia32_expandloaddi256_mask">,
|
|
Intrinsic<[llvm_v4i64_ty], [llvm_ptr_ty, llvm_v4i64_ty,
|
|
llvm_i8_ty], [IntrReadArgMem]>;
|
|
def int_x86_avx512_mask_expand_load_d_128 :
|
|
GCCBuiltin<"__builtin_ia32_expandloadsi128_mask">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_ptr_ty, llvm_v4i32_ty,
|
|
llvm_i8_ty], [IntrReadArgMem]>;
|
|
def int_x86_avx512_mask_expand_load_q_128 :
|
|
GCCBuiltin<"__builtin_ia32_expandloaddi128_mask">,
|
|
Intrinsic<[llvm_v2i64_ty], [llvm_ptr_ty, llvm_v2i64_ty,
|
|
llvm_i8_ty], [IntrReadArgMem]>;
|
|
|
|
}
|
|
// Misc.
|
|
let TargetPrefix = "x86" in {
|
|
def int_x86_avx512_mask_cmp_ps_512 :
|
|
GCCBuiltin<"__builtin_ia32_cmpps512_mask">,
|
|
Intrinsic<[llvm_i16_ty], [llvm_v16f32_ty, llvm_v16f32_ty,
|
|
llvm_i32_ty, llvm_i16_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cmp_pd_512 :
|
|
GCCBuiltin<"__builtin_ia32_cmppd512_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v8f64_ty, llvm_v8f64_ty,
|
|
llvm_i32_ty, llvm_i8_ty, llvm_i32_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cmp_ps_256 :
|
|
GCCBuiltin<"__builtin_ia32_cmpps256_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v8f32_ty, llvm_v8f32_ty,
|
|
llvm_i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cmp_pd_256 :
|
|
GCCBuiltin<"__builtin_ia32_cmppd256_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v4f64_ty, llvm_v4f64_ty,
|
|
llvm_i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cmp_ps_128 :
|
|
GCCBuiltin<"__builtin_ia32_cmpps128_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v4f32_ty, llvm_v4f32_ty,
|
|
llvm_i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
def int_x86_avx512_mask_cmp_pd_128 :
|
|
GCCBuiltin<"__builtin_ia32_cmppd128_mask">,
|
|
Intrinsic<[llvm_i8_ty], [llvm_v2f64_ty, llvm_v2f64_ty,
|
|
llvm_i32_ty, llvm_i8_ty], [IntrNoMem]>;
|
|
|
|
def int_x86_avx512_movntdqa :
|
|
GCCBuiltin<"__builtin_ia32_movntdqa512">,
|
|
Intrinsic<[llvm_v8i64_ty], [llvm_ptr_ty], [IntrReadMem]>;
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// SHA intrinsics
|
|
let TargetPrefix = "x86" in {
|
|
def int_x86_sha1rnds4 : GCCBuiltin<"__builtin_ia32_sha1rnds4">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty, llvm_i8_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sha1nexte : GCCBuiltin<"__builtin_ia32_sha1nexte">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty], [IntrNoMem]>;
|
|
def int_x86_sha1msg1 : GCCBuiltin<"__builtin_ia32_sha1msg1">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty], [IntrNoMem]>;
|
|
def int_x86_sha1msg2 : GCCBuiltin<"__builtin_ia32_sha1msg2">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty], [IntrNoMem]>;
|
|
def int_x86_sha256rnds2 : GCCBuiltin<"__builtin_ia32_sha256rnds2">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty, llvm_v4i32_ty],
|
|
[IntrNoMem]>;
|
|
def int_x86_sha256msg1 : GCCBuiltin<"__builtin_ia32_sha256msg1">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty], [IntrNoMem]>;
|
|
def int_x86_sha256msg2 : GCCBuiltin<"__builtin_ia32_sha256msg2">,
|
|
Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty], [IntrNoMem]>;
|
|
}
|