@@ -814,7 +814,7 @@ defm : vextract_for_size_lowering<"VEXTRACTF64x4Z", v32f16_info, v16f16x_info,
814
814
815
815
// A 128-bit extract from bits [255:128] of a 512-bit vector should use a
816
816
// smaller extract to enable EVEX->VEX.
817
- let Predicates = [NoVLX] in {
817
+ let Predicates = [NoVLX, HasEVEX512 ] in {
818
818
def : Pat<(v2i64 (extract_subvector (v8i64 VR512:$src), (iPTR 2))),
819
819
(v2i64 (VEXTRACTI128rr
820
820
(v4i64 (EXTRACT_SUBREG (v8i64 VR512:$src), sub_ymm)),
@@ -3068,7 +3068,7 @@ def : Pat<(Narrow.KVT (and Narrow.KRC:$mask,
3068
3068
addr:$src2, (X86cmpm_imm_commute timm:$cc)), Narrow.KRC)>;
3069
3069
}
3070
3070
3071
- let Predicates = [HasAVX512, NoVLX] in {
3071
+ let Predicates = [HasAVX512, NoVLX, HasEVEX512 ] in {
3072
3072
defm : axv512_icmp_packed_cc_no_vlx_lowering<X86pcmpm, X86pcmpm_su, "VPCMPD", v8i32x_info, v16i32_info>;
3073
3073
defm : axv512_icmp_packed_cc_no_vlx_lowering<X86pcmpum, X86pcmpum_su, "VPCMPUD", v8i32x_info, v16i32_info>;
3074
3074
@@ -3099,7 +3099,7 @@ let Predicates = [HasAVX512, NoVLX] in {
3099
3099
defm : axv512_cmp_packed_cc_no_vlx_lowering<"VCMPPD", v2f64x_info, v8f64_info>;
3100
3100
}
3101
3101
3102
- let Predicates = [HasBWI, NoVLX] in {
3102
+ let Predicates = [HasBWI, NoVLX, HasEVEX512 ] in {
3103
3103
defm : axv512_icmp_packed_cc_no_vlx_lowering<X86pcmpm, X86pcmpm_su, "VPCMPB", v32i8x_info, v64i8_info>;
3104
3104
defm : axv512_icmp_packed_cc_no_vlx_lowering<X86pcmpum, X86pcmpum_su, "VPCMPUB", v32i8x_info, v64i8_info>;
3105
3105
@@ -3493,7 +3493,7 @@ multiclass mask_move_lowering<string InstrStr, X86VectorVTInfo Narrow,
3493
3493
3494
3494
// Patterns for handling v8i1 selects of 256-bit vectors when VLX isn't
3495
3495
// available. Use a 512-bit operation and extract.
3496
- let Predicates = [HasAVX512, NoVLX] in {
3496
+ let Predicates = [HasAVX512, NoVLX, HasEVEX512 ] in {
3497
3497
defm : mask_move_lowering<"VMOVAPSZ", v4f32x_info, v16f32_info>;
3498
3498
defm : mask_move_lowering<"VMOVDQA32Z", v4i32x_info, v16i32_info>;
3499
3499
defm : mask_move_lowering<"VMOVAPSZ", v8f32x_info, v16f32_info>;
@@ -3505,7 +3505,7 @@ let Predicates = [HasAVX512, NoVLX] in {
3505
3505
defm : mask_move_lowering<"VMOVDQA64Z", v4i64x_info, v8i64_info>;
3506
3506
}
3507
3507
3508
- let Predicates = [HasBWI, NoVLX] in {
3508
+ let Predicates = [HasBWI, NoVLX, HasEVEX512 ] in {
3509
3509
defm : mask_move_lowering<"VMOVDQU8Z", v16i8x_info, v64i8_info>;
3510
3510
defm : mask_move_lowering<"VMOVDQU8Z", v32i8x_info, v64i8_info>;
3511
3511
@@ -4998,8 +4998,8 @@ defm VPMINUD : avx512_binop_rm_vl_d<0x3B, "vpminud", umin,
4998
4998
defm VPMINUQ : avx512_binop_rm_vl_q<0x3B, "vpminuq", umin,
4999
4999
SchedWriteVecALU, HasAVX512, 1>, T8;
5000
5000
5001
- // PMULLQ: Use 512bit version to implement 128/256 bit in case NoVLX.
5002
- let Predicates = [HasDQI, NoVLX] in {
5001
+ // PMULLQ: Use 512bit version to implement 128/256 bit in case NoVLX, HasEVEX512 .
5002
+ let Predicates = [HasDQI, NoVLX, HasEVEX512 ] in {
5003
5003
def : Pat<(v4i64 (mul (v4i64 VR256X:$src1), (v4i64 VR256X:$src2))),
5004
5004
(EXTRACT_SUBREG
5005
5005
(VPMULLQZrr
@@ -5055,7 +5055,7 @@ multiclass avx512_min_max_lowering<string Instr, SDNode OpNode> {
5055
5055
sub_xmm)>;
5056
5056
}
5057
5057
5058
- let Predicates = [HasAVX512, NoVLX] in {
5058
+ let Predicates = [HasAVX512, NoVLX, HasEVEX512 ] in {
5059
5059
defm : avx512_min_max_lowering<"VPMAXUQZ", umax>;
5060
5060
defm : avx512_min_max_lowering<"VPMINUQZ", umin>;
5061
5061
defm : avx512_min_max_lowering<"VPMAXSQZ", smax>;
@@ -6032,7 +6032,7 @@ defm VPSRL : avx512_shift_types<0xD2, 0xD3, 0xD1, "vpsrl", X86vsrl,
6032
6032
SchedWriteVecShift>;
6033
6033
6034
6034
// Use 512bit VPSRA/VPSRAI version to implement v2i64/v4i64 in case NoVLX.
6035
- let Predicates = [HasAVX512, NoVLX] in {
6035
+ let Predicates = [HasAVX512, NoVLX, HasEVEX512 ] in {
6036
6036
def : Pat<(v4i64 (X86vsra (v4i64 VR256X:$src1), (v2i64 VR128X:$src2))),
6037
6037
(EXTRACT_SUBREG (v8i64
6038
6038
(VPSRAQZrr
@@ -6161,14 +6161,14 @@ defm VPSRLV : avx512_var_shift_types<0x45, "vpsrlv", X86vsrlv, SchedWriteVarVecS
6161
6161
defm VPRORV : avx512_var_shift_types<0x14, "vprorv", rotr, SchedWriteVarVecShift>;
6162
6162
defm VPROLV : avx512_var_shift_types<0x15, "vprolv", rotl, SchedWriteVarVecShift>;
6163
6163
6164
- defm : avx512_var_shift_lowering<avx512vl_i64_info, "VPSRAVQ", X86vsrav, [HasAVX512, NoVLX]>;
6165
- defm : avx512_var_shift_lowering<avx512vl_i16_info, "VPSLLVW", X86vshlv, [HasBWI, NoVLX]>;
6166
- defm : avx512_var_shift_lowering<avx512vl_i16_info, "VPSRAVW", X86vsrav, [HasBWI, NoVLX]>;
6167
- defm : avx512_var_shift_lowering<avx512vl_i16_info, "VPSRLVW", X86vsrlv, [HasBWI, NoVLX]>;
6164
+ defm : avx512_var_shift_lowering<avx512vl_i64_info, "VPSRAVQ", X86vsrav, [HasAVX512, NoVLX, HasEVEX512 ]>;
6165
+ defm : avx512_var_shift_lowering<avx512vl_i16_info, "VPSLLVW", X86vshlv, [HasBWI, NoVLX, HasEVEX512 ]>;
6166
+ defm : avx512_var_shift_lowering<avx512vl_i16_info, "VPSRAVW", X86vsrav, [HasBWI, NoVLX, HasEVEX512 ]>;
6167
+ defm : avx512_var_shift_lowering<avx512vl_i16_info, "VPSRLVW", X86vsrlv, [HasBWI, NoVLX, HasEVEX512 ]>;
6168
6168
6169
6169
6170
6170
// Use 512bit VPROL/VPROLI version to implement v2i64/v4i64 + v4i32/v8i32 in case NoVLX.
6171
- let Predicates = [HasAVX512, NoVLX] in {
6171
+ let Predicates = [HasAVX512, NoVLX, HasEVEX512 ] in {
6172
6172
def : Pat<(v2i64 (rotl (v2i64 VR128X:$src1), (v2i64 VR128X:$src2))),
6173
6173
(EXTRACT_SUBREG (v8i64
6174
6174
(VPROLVQZrr
@@ -6219,7 +6219,7 @@ let Predicates = [HasAVX512, NoVLX] in {
6219
6219
}
6220
6220
6221
6221
// Use 512bit VPROR/VPRORI version to implement v2i64/v4i64 + v4i32/v8i32 in case NoVLX.
6222
- let Predicates = [HasAVX512, NoVLX] in {
6222
+ let Predicates = [HasAVX512, NoVLX, HasEVEX512 ] in {
6223
6223
def : Pat<(v2i64 (rotr (v2i64 VR128X:$src1), (v2i64 VR128X:$src2))),
6224
6224
(EXTRACT_SUBREG (v8i64
6225
6225
(VPRORVQZrr
@@ -9816,7 +9816,7 @@ defm VPMOVUSWB : avx512_trunc_wb<0x10, "vpmovuswb", X86vtruncus,
9816
9816
truncstore_us_vi8, masked_truncstore_us_vi8,
9817
9817
X86vtruncus, X86vmtruncus>;
9818
9818
9819
- let Predicates = [HasAVX512, NoVLX] in {
9819
+ let Predicates = [HasAVX512, NoVLX, HasEVEX512 ] in {
9820
9820
def: Pat<(v8i16 (trunc (v8i32 VR256X:$src))),
9821
9821
(v8i16 (EXTRACT_SUBREG
9822
9822
(v16i16 (VPMOVDWZrr (v16i32 (INSERT_SUBREG (IMPLICIT_DEF),
@@ -9827,7 +9827,7 @@ def: Pat<(v4i32 (trunc (v4i64 VR256X:$src))),
9827
9827
VR256X:$src, sub_ymm)))), sub_xmm))>;
9828
9828
}
9829
9829
9830
- let Predicates = [HasBWI, NoVLX] in {
9830
+ let Predicates = [HasBWI, NoVLX, HasEVEX512 ] in {
9831
9831
def: Pat<(v16i8 (trunc (v16i16 VR256X:$src))),
9832
9832
(v16i8 (EXTRACT_SUBREG (VPMOVWBZrr (v32i16 (INSERT_SUBREG (IMPLICIT_DEF),
9833
9833
VR256X:$src, sub_ymm))), sub_xmm))>;
@@ -10370,7 +10370,7 @@ multiclass avx512_convert_vector_to_mask<bits<8> opc, string OpcodeStr,
10370
10370
defm Z128 : convert_vector_to_mask_common<opc, VTInfo.info128, OpcodeStr>,
10371
10371
EVEX_V128;
10372
10372
}
10373
- let Predicates = [prd, NoVLX] in {
10373
+ let Predicates = [prd, NoVLX, HasEVEX512 ] in {
10374
10374
defm Z256_Alt : convert_vector_to_mask_lowering<VTInfo.info512, VTInfo.info256, NAME>;
10375
10375
defm Z128_Alt : convert_vector_to_mask_lowering<VTInfo.info512, VTInfo.info128, NAME>;
10376
10376
}
@@ -11157,7 +11157,7 @@ defm VPABS : avx512_unary_rm_vl_all<0x1C, 0x1D, 0x1E, 0x1F, "vpabs", abs,
11157
11157
SchedWriteVecALU>;
11158
11158
11159
11159
// VPABS: Use 512bit version to implement 128/256 bit in case NoVLX.
11160
- let Predicates = [HasAVX512, NoVLX] in {
11160
+ let Predicates = [HasAVX512, NoVLX, HasEVEX512 ] in {
11161
11161
def : Pat<(v4i64 (abs VR256X:$src)),
11162
11162
(EXTRACT_SUBREG
11163
11163
(VPABSQZrr
@@ -11173,7 +11173,7 @@ let Predicates = [HasAVX512, NoVLX] in {
11173
11173
// Use 512bit version to implement 128/256 bit.
11174
11174
multiclass avx512_unary_lowering<string InstrStr, SDNode OpNode,
11175
11175
AVX512VLVectorVTInfo _, Predicate prd> {
11176
- let Predicates = [prd, NoVLX] in {
11176
+ let Predicates = [prd, NoVLX, HasEVEX512 ] in {
11177
11177
def : Pat<(_.info256.VT (OpNode (_.info256.VT _.info256.RC:$src1))),
11178
11178
(EXTRACT_SUBREG
11179
11179
(!cast<Instruction>(InstrStr # "Zrr")
@@ -11792,7 +11792,7 @@ let Predicates = [HasAVX512] in {
11792
11792
(VPTERNLOGQZrri VR512:$src, VR512:$src, VR512:$src, (i8 15))>;
11793
11793
}
11794
11794
11795
- let Predicates = [HasAVX512, NoVLX] in {
11795
+ let Predicates = [HasAVX512, NoVLX, HasEVEX512 ] in {
11796
11796
def : Pat<(v16i8 (vnot VR128X:$src)),
11797
11797
(EXTRACT_SUBREG
11798
11798
(VPTERNLOGQZrri
0 commit comments