diff options
author | Craig Topper <craig.topper@intel.com> | 2018-05-30 05:25:59 +0000 |
---|---|---|
committer | Craig Topper <craig.topper@intel.com> | 2018-05-30 05:25:59 +0000 |
commit | cc0741e59f854777144eca819c04d92a3bbf7ecb (patch) | |
tree | 4092275afe335520ce741588cd43c36889b20c13 | |
parent | 5096d06c102241cbe654d500a881571f4fcd22ca (diff) | |
download | bcm5719-llvm-cc0741e59f854777144eca819c04d92a3bbf7ecb.tar.gz bcm5719-llvm-cc0741e59f854777144eca819c04d92a3bbf7ecb.zip |
[X86] Add unmasked AVX512VNNI intrinsics. Use a select in IR for masking instead.
A future patch will remove the old masked intrinsics.
llvm-svn: 333508
-rw-r--r-- | llvm/include/llvm/IR/IntrinsicsX86.td | 125 | ||||
-rw-r--r-- | llvm/lib/Target/X86/X86IntrinsicsInfo.h | 14 |
2 files changed, 91 insertions, 48 deletions
diff --git a/llvm/include/llvm/IR/IntrinsicsX86.td b/llvm/include/llvm/IR/IntrinsicsX86.td index 6482f05b938..eabdacf3e51 100644 --- a/llvm/include/llvm/IR/IntrinsicsX86.td +++ b/llvm/include/llvm/IR/IntrinsicsX86.td @@ -2459,105 +2459,134 @@ let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.". // VNNI let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.". - def int_x86_avx512_mask_vpdpbusd_128 : - GCCBuiltin<"__builtin_ia32_vpdpbusd128_mask">, + def int_x86_avx512_mask_vpdpbusd_128 : // FIXME: Remove Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty, llvm_v4i32_ty, llvm_i8_ty], [IntrNoMem]>; - def int_x86_avx512_maskz_vpdpbusd_128 : - GCCBuiltin<"__builtin_ia32_vpdpbusd128_maskz">, + def int_x86_avx512_maskz_vpdpbusd_128 : // FIXME: Remove Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty, llvm_v4i32_ty, llvm_i8_ty], [IntrNoMem]>; - def int_x86_avx512_mask_vpdpbusd_256 : - GCCBuiltin<"__builtin_ia32_vpdpbusd256_mask">, + def int_x86_avx512_mask_vpdpbusd_256 : // FIXME: Remove Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty, llvm_v8i32_ty, llvm_i8_ty], [IntrNoMem]>; - def int_x86_avx512_maskz_vpdpbusd_256 : - GCCBuiltin<"__builtin_ia32_vpdpbusd256_maskz">, + def int_x86_avx512_maskz_vpdpbusd_256 : // FIXME: Remove Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty, llvm_v8i32_ty, llvm_i8_ty], [IntrNoMem]>; - def int_x86_avx512_mask_vpdpbusd_512 : - GCCBuiltin<"__builtin_ia32_vpdpbusd512_mask">, + def int_x86_avx512_mask_vpdpbusd_512 : // FIXME: Remove Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty, llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>; - def int_x86_avx512_maskz_vpdpbusd_512 : - GCCBuiltin<"__builtin_ia32_vpdpbusd512_maskz">, + def int_x86_avx512_maskz_vpdpbusd_512 : // FIXME: Remove Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty, llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>; - def int_x86_avx512_mask_vpdpbusds_128 : - GCCBuiltin<"__builtin_ia32_vpdpbusds128_mask">, + def 
int_x86_avx512_mask_vpdpbusds_128 : // FIXME: Remove Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty, llvm_v4i32_ty, llvm_i8_ty], [IntrNoMem]>; - def int_x86_avx512_maskz_vpdpbusds_128 : - GCCBuiltin<"__builtin_ia32_vpdpbusds128_maskz">, + def int_x86_avx512_maskz_vpdpbusds_128 : // FIXME: Remove Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty, llvm_v4i32_ty, llvm_i8_ty], [IntrNoMem]>; - def int_x86_avx512_mask_vpdpbusds_256 : - GCCBuiltin<"__builtin_ia32_vpdpbusds256_mask">, + def int_x86_avx512_mask_vpdpbusds_256 : // FIXME: Remove Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty, llvm_v8i32_ty, llvm_i8_ty], [IntrNoMem]>; - def int_x86_avx512_maskz_vpdpbusds_256 : - GCCBuiltin<"__builtin_ia32_vpdpbusds256_maskz">, + def int_x86_avx512_maskz_vpdpbusds_256 : // FIXME: Remove Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty, llvm_v8i32_ty, llvm_i8_ty], [IntrNoMem]>; - def int_x86_avx512_mask_vpdpbusds_512 : - GCCBuiltin<"__builtin_ia32_vpdpbusds512_mask">, + def int_x86_avx512_mask_vpdpbusds_512 : // FIXME: Remove Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty, llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>; - def int_x86_avx512_maskz_vpdpbusds_512 : - GCCBuiltin<"__builtin_ia32_vpdpbusds512_maskz">, + def int_x86_avx512_maskz_vpdpbusds_512 : // FIXME: Remove Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty, llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>; - def int_x86_avx512_mask_vpdpwssd_128 : - GCCBuiltin<"__builtin_ia32_vpdpwssd128_mask">, + def int_x86_avx512_mask_vpdpwssd_128 : // FIXME: Remove Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty, llvm_v4i32_ty, llvm_i8_ty], [IntrNoMem]>; - def int_x86_avx512_maskz_vpdpwssd_128 : - GCCBuiltin<"__builtin_ia32_vpdpwssd128_maskz">, + def int_x86_avx512_maskz_vpdpwssd_128 : // FIXME: Remove Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty, llvm_v4i32_ty, llvm_i8_ty], [IntrNoMem]>; - def int_x86_avx512_mask_vpdpwssd_256 : - 
GCCBuiltin<"__builtin_ia32_vpdpwssd256_mask">, + def int_x86_avx512_mask_vpdpwssd_256 : // FIXME: Remove Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty, llvm_v8i32_ty, llvm_i8_ty], [IntrNoMem]>; - def int_x86_avx512_maskz_vpdpwssd_256 : - GCCBuiltin<"__builtin_ia32_vpdpwssd256_maskz">, + def int_x86_avx512_maskz_vpdpwssd_256 : // FIXME: Remove Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty, llvm_v8i32_ty, llvm_i8_ty], [IntrNoMem]>; - def int_x86_avx512_mask_vpdpwssd_512 : - GCCBuiltin<"__builtin_ia32_vpdpwssd512_mask">, + def int_x86_avx512_mask_vpdpwssd_512 : // FIXME: Remove Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty, llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>; - def int_x86_avx512_maskz_vpdpwssd_512 : - GCCBuiltin<"__builtin_ia32_vpdpwssd512_maskz">, + def int_x86_avx512_maskz_vpdpwssd_512 : // FIXME: Remove Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty, llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>; - def int_x86_avx512_mask_vpdpwssds_128 : - GCCBuiltin<"__builtin_ia32_vpdpwssds128_mask">, + def int_x86_avx512_mask_vpdpwssds_128 : // FIXME: Remove Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty, llvm_v4i32_ty, llvm_i8_ty], [IntrNoMem]>; - def int_x86_avx512_maskz_vpdpwssds_128 : - GCCBuiltin<"__builtin_ia32_vpdpwssds128_maskz">, + def int_x86_avx512_maskz_vpdpwssds_128 : // FIXME: Remove Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty, llvm_v4i32_ty, llvm_i8_ty], [IntrNoMem]>; - def int_x86_avx512_mask_vpdpwssds_256 : - GCCBuiltin<"__builtin_ia32_vpdpwssds256_mask">, + def int_x86_avx512_mask_vpdpwssds_256 : // FIXME: Remove Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty, llvm_v8i32_ty, llvm_i8_ty], [IntrNoMem]>; - def int_x86_avx512_maskz_vpdpwssds_256 : - GCCBuiltin<"__builtin_ia32_vpdpwssds256_maskz">, + def int_x86_avx512_maskz_vpdpwssds_256 : // FIXME: Remove Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty, llvm_v8i32_ty, llvm_i8_ty], [IntrNoMem]>; - def 
int_x86_avx512_mask_vpdpwssds_512 : - GCCBuiltin<"__builtin_ia32_vpdpwssds512_mask">, + def int_x86_avx512_mask_vpdpwssds_512 : // FIXME: Remove Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty, llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>; - def int_x86_avx512_maskz_vpdpwssds_512 : - GCCBuiltin<"__builtin_ia32_vpdpwssds512_maskz">, + def int_x86_avx512_maskz_vpdpwssds_512 : // FIXME: Remove Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty, llvm_v16i32_ty, llvm_i16_ty], [IntrNoMem]>; + + + def int_x86_avx512_vpdpbusd_128 : + GCCBuiltin<"__builtin_ia32_vpdpbusd128">, + Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty, + llvm_v4i32_ty], [IntrNoMem]>; + def int_x86_avx512_vpdpbusd_256 : + GCCBuiltin<"__builtin_ia32_vpdpbusd256">, + Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty, + llvm_v8i32_ty], [IntrNoMem]>; + def int_x86_avx512_vpdpbusd_512 : + GCCBuiltin<"__builtin_ia32_vpdpbusd512">, + Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty, + llvm_v16i32_ty], [IntrNoMem]>; + + def int_x86_avx512_vpdpbusds_128 : + GCCBuiltin<"__builtin_ia32_vpdpbusds128">, + Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty, + llvm_v4i32_ty], [IntrNoMem]>; + def int_x86_avx512_vpdpbusds_256 : + GCCBuiltin<"__builtin_ia32_vpdpbusds256">, + Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty, + llvm_v8i32_ty], [IntrNoMem]>; + def int_x86_avx512_vpdpbusds_512 : + GCCBuiltin<"__builtin_ia32_vpdpbusds512">, + Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty, + llvm_v16i32_ty], [IntrNoMem]>; + + def int_x86_avx512_vpdpwssd_128 : + GCCBuiltin<"__builtin_ia32_vpdpwssd128">, + Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty, + llvm_v4i32_ty], [IntrNoMem]>; + def int_x86_avx512_vpdpwssd_256 : + GCCBuiltin<"__builtin_ia32_vpdpwssd256">, + Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty, + llvm_v8i32_ty], [IntrNoMem]>; + def int_x86_avx512_vpdpwssd_512 : + GCCBuiltin<"__builtin_ia32_vpdpwssd512">, + 
Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty, + llvm_v16i32_ty], [IntrNoMem]>; + + def int_x86_avx512_vpdpwssds_128 : + GCCBuiltin<"__builtin_ia32_vpdpwssds128">, + Intrinsic<[llvm_v4i32_ty], [llvm_v4i32_ty, llvm_v4i32_ty, + llvm_v4i32_ty], [IntrNoMem]>; + def int_x86_avx512_vpdpwssds_256 : + GCCBuiltin<"__builtin_ia32_vpdpwssds256">, + Intrinsic<[llvm_v8i32_ty], [llvm_v8i32_ty, llvm_v8i32_ty, + llvm_v8i32_ty], [IntrNoMem]>; + def int_x86_avx512_vpdpwssds_512 : + GCCBuiltin<"__builtin_ia32_vpdpwssds512">, + Intrinsic<[llvm_v16i32_ty], [llvm_v16i32_ty, llvm_v16i32_ty, + llvm_v16i32_ty], [IntrNoMem]>; } //===----------------------------------------------------------------------===// diff --git a/llvm/lib/Target/X86/X86IntrinsicsInfo.h b/llvm/lib/Target/X86/X86IntrinsicsInfo.h index 7b5df0fd325..7a9e9c28329 100644 --- a/llvm/lib/Target/X86/X86IntrinsicsInfo.h +++ b/llvm/lib/Target/X86/X86IntrinsicsInfo.h @@ -1324,6 +1324,20 @@ static const IntrinsicData IntrinsicsWithoutChain[] = { X86_INTRINSIC_DATA(avx512_vcvtss2si64, INTR_TYPE_2OP, X86ISD::CVTS2SI_RND, 0), X86_INTRINSIC_DATA(avx512_vcvtss2usi32, INTR_TYPE_2OP, X86ISD::CVTS2UI_RND, 0), X86_INTRINSIC_DATA(avx512_vcvtss2usi64, INTR_TYPE_2OP, X86ISD::CVTS2UI_RND, 0), + + X86_INTRINSIC_DATA(avx512_vpdpbusd_128, INTR_TYPE_3OP, X86ISD::VPDPBUSD, 0), + X86_INTRINSIC_DATA(avx512_vpdpbusd_256, INTR_TYPE_3OP, X86ISD::VPDPBUSD, 0), + X86_INTRINSIC_DATA(avx512_vpdpbusd_512, INTR_TYPE_3OP, X86ISD::VPDPBUSD, 0), + X86_INTRINSIC_DATA(avx512_vpdpbusds_128, INTR_TYPE_3OP, X86ISD::VPDPBUSDS, 0), + X86_INTRINSIC_DATA(avx512_vpdpbusds_256, INTR_TYPE_3OP, X86ISD::VPDPBUSDS, 0), + X86_INTRINSIC_DATA(avx512_vpdpbusds_512, INTR_TYPE_3OP, X86ISD::VPDPBUSDS, 0), + X86_INTRINSIC_DATA(avx512_vpdpwssd_128, INTR_TYPE_3OP, X86ISD::VPDPWSSD, 0), + X86_INTRINSIC_DATA(avx512_vpdpwssd_256, INTR_TYPE_3OP, X86ISD::VPDPWSSD, 0), + X86_INTRINSIC_DATA(avx512_vpdpwssd_512, INTR_TYPE_3OP, X86ISD::VPDPWSSD, 0), + 
X86_INTRINSIC_DATA(avx512_vpdpwssds_128, INTR_TYPE_3OP, X86ISD::VPDPWSSDS, 0), + X86_INTRINSIC_DATA(avx512_vpdpwssds_256, INTR_TYPE_3OP, X86ISD::VPDPWSSDS, 0), + X86_INTRINSIC_DATA(avx512_vpdpwssds_512, INTR_TYPE_3OP, X86ISD::VPDPWSSDS, 0), + X86_INTRINSIC_DATA(avx512_vpermi2var_d_128, INTR_TYPE_3OP, X86ISD::VPERMV3, 0), X86_INTRINSIC_DATA(avx512_vpermi2var_d_256, INTR_TYPE_3OP, X86ISD::VPERMV3, 0), X86_INTRINSIC_DATA(avx512_vpermi2var_d_512, INTR_TYPE_3OP, X86ISD::VPERMV3, 0), |