diff --git a/src/jit/codegencommon.cpp b/src/jit/codegencommon.cpp index 0843dffef0c7..3ff5b6fe68df 100644 --- a/src/jit/codegencommon.cpp +++ b/src/jit/codegencommon.cpp @@ -11049,7 +11049,7 @@ void CodeGen::genVzeroupperIfNeeded(bool check256bitOnly /* = true*/) if (emitVzeroUpper) { - assert(compiler->getSIMDInstructionSet() == InstructionSet_AVX); + assert(compiler->getSIMDInstructionSet() == InstructionSet_AVX2); instGen(INS_vzeroupper); } #endif diff --git a/src/jit/codegenxarch.cpp b/src/jit/codegenxarch.cpp index 3f8eef286fc7..22914493b1f7 100644 --- a/src/jit/codegenxarch.cpp +++ b/src/jit/codegenxarch.cpp @@ -5316,7 +5316,7 @@ void CodeGen::genCallInstruction(GenTreeCall* call) // when there's preceding 256-bit AVX to legacy SSE transition penalty. if (call->IsPInvoke() && (call->gtCallType == CT_USER_FUNC) && getEmitter()->Contains256bitAVX()) { - assert(compiler->getSIMDInstructionSet() == InstructionSet_AVX); + assert(compiler->getSIMDInstructionSet() == InstructionSet_AVX2); instGen(INS_vzeroupper); } #endif diff --git a/src/jit/compiler.h b/src/jit/compiler.h index 50e26a6d7b1c..18fab9b3df16 100644 --- a/src/jit/compiler.h +++ b/src/jit/compiler.h @@ -7251,7 +7251,7 @@ XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX #if defined(_TARGET_XARCH_) && !defined(LEGACY_BACKEND) if (canUseAVX()) { - return InstructionSet_AVX; + return InstructionSet_AVX2; } if (CanUseSSE3_4()) diff --git a/src/jit/instr.h b/src/jit/instr.h index 309a2f5dfeac..41ed560ef288 100644 --- a/src/jit/instr.h +++ b/src/jit/instr.h @@ -282,8 +282,7 @@ enum InstructionSet #ifdef _TARGET_XARCH_ InstructionSet_SSE2, // SSE2 Instruction set InstructionSet_SSE3_4, // SSE3, SSSE3, SSE4.1 and SSE4.2 instruction set - InstructionSet_AVX, // AVX2 instruction set - // TODO-Cleaup - This should be named as InstructionSet_AVX2 + InstructionSet_AVX2, // AVX2 instruction set #elif defined(_TARGET_ARM_) InstructionSet_NEON, #endif diff --git a/src/jit/lowerxarch.cpp b/src/jit/lowerxarch.cpp index d568e52b2396..9fab7ef0f1e8 100644 --- a/src/jit/lowerxarch.cpp +++ b/src/jit/lowerxarch.cpp @@ -2241,7 +2241,7 @@ void Lowering::ContainCheckSIMD(GenTreeSIMD* simdNode) { MakeSrcContained(simdNode, op1); } - else if ((comp->getSIMDInstructionSet() == InstructionSet_AVX) && + else if ((comp->getSIMDInstructionSet() == InstructionSet_AVX2) && ((simdNode->gtSIMDSize == 16) || (simdNode->gtSIMDSize == 32))) { // Either op1 is a float or dbl constant or an addr diff --git a/src/jit/lsraxarch.cpp b/src/jit/lsraxarch.cpp index 4945db32b4cf..18825768cd5e 100644 --- a/src/jit/lsraxarch.cpp +++ b/src/jit/lsraxarch.cpp @@ -2261,7 +2261,7 @@ void LinearScan::TreeNodeInfoInitSIMD(GenTreeSIMD* simdTree) { bool needFloatTemp; if (varTypeIsSmallInt(simdTree->gtSIMDBaseType) && - (compiler->getSIMDInstructionSet() == InstructionSet_AVX)) + (compiler->getSIMDInstructionSet() == InstructionSet_AVX2)) { int byteShiftCnt = (int)op2->AsIntCon()->gtIconVal * genTypeSize(simdTree->gtSIMDBaseType); needFloatTemp = (byteShiftCnt >= 16); @@ -2335,7 +2335,7 @@ void LinearScan::TreeNodeInfoInitSIMD(GenTreeSIMD* simdTree) info->isInternalRegDelayFree = true; info->srcCount = 1; info->internalIntCount = 1; - if (compiler->getSIMDInstructionSet() == InstructionSet_AVX) + if (compiler->getSIMDInstructionSet() == InstructionSet_AVX2) { info->internalFloatCount = 2; } @@ -2358,7 +2358,7 @@ void LinearScan::TreeNodeInfoInitSIMD(GenTreeSIMD* simdTree) } else #endif - if ((compiler->getSIMDInstructionSet() == InstructionSet_AVX) || + if ((compiler->getSIMDInstructionSet() == InstructionSet_AVX2) || (simdTree->gtSIMDBaseType == TYP_ULONG)) { info->internalFloatCount = 2; @@ -2374,7 +2374,7 @@ void LinearScan::TreeNodeInfoInitSIMD(GenTreeSIMD* simdTree) // We need an internal register different from targetReg. info->isInternalRegDelayFree = true; info->srcCount = 2; - if ((compiler->getSIMDInstructionSet() == InstructionSet_AVX) && (simdTree->gtSIMDBaseType != TYP_DOUBLE)) + if ((compiler->getSIMDInstructionSet() == InstructionSet_AVX2) && (simdTree->gtSIMDBaseType != TYP_DOUBLE)) { info->internalFloatCount = 2; } @@ -2783,11 +2783,11 @@ void LinearScan::SetContainsAVXFlags(bool isFloatingPointType /* = true */, unsi #ifdef FEATURE_AVX_SUPPORT if (isFloatingPointType) { - if (compiler->getFloatingPointInstructionSet() == InstructionSet_AVX) + if (compiler->getFloatingPointInstructionSet() == InstructionSet_AVX2) { compiler->getEmitter()->SetContainsAVX(true); } - if (sizeOfSIMDVector == 32 && compiler->getSIMDInstructionSet() == InstructionSet_AVX) + if (sizeOfSIMDVector == 32 && compiler->getSIMDInstructionSet() == InstructionSet_AVX2) { compiler->getEmitter()->SetContains256bitAVX(true); } diff --git a/src/jit/simdcodegenxarch.cpp b/src/jit/simdcodegenxarch.cpp index ef50aaecc0c5..72c484e9fa40 100644 --- a/src/jit/simdcodegenxarch.cpp +++ b/src/jit/simdcodegenxarch.cpp @@ -672,7 +672,7 @@ void CodeGen::genSIMDScalarMove( { assert(varTypeIsFloating(baseType)); #ifdef FEATURE_AVX_SUPPORT - if (compiler->getSIMDInstructionSet() == InstructionSet_AVX) + if (compiler->getSIMDInstructionSet() == InstructionSet_AVX2) { switch (moveType) { @@ -874,7 +874,7 @@ void CodeGen::genSIMDIntrinsicInit(GenTreeSIMD* simdNode) #ifdef FEATURE_AVX_SUPPORT else { - assert(iset == InstructionSet_AVX); + assert(iset == InstructionSet_AVX2); ins = getOpForSIMDIntrinsic(SIMDIntrinsicInit, baseType); if (op1->IsCnsFltOrDbl()) { @@ -893,7 +893,7 @@ void CodeGen::genSIMDIntrinsicInit(GenTreeSIMD* simdNode) } #endif // FEATURE_AVX_SUPPORT } - else if (iset == InstructionSet_AVX && ((size == 32) || (size == 16))) + else if (iset == InstructionSet_AVX2 && ((size == 32) || (size == 16))) { regNumber srcReg = genConsumeReg(op1); if (baseType == TYP_INT || baseType == TYP_UINT || baseType == TYP_LONG || baseType == TYP_ULONG) @@ -1145,7 +1145,7 @@ void CodeGen::genSIMDIntrinsic32BitConvert(GenTreeSIMD* simdNode) getEmitter()->emitIns_R_I(INS_mov, EA_8BYTE, tmpIntReg, (ssize_t)0X5300000053000000); inst_RV_RV(INS_mov_i2xmm, tmpReg, tmpIntReg, TYP_ULONG); #else - if (compiler->getSIMDInstructionSet() == InstructionSet_AVX) + if (compiler->getSIMDInstructionSet() == InstructionSet_AVX2) { getEmitter()->emitIns_R_I(INS_mov, EA_4BYTE, tmpIntReg, (ssize_t)0X53000000); inst_RV_RV(INS_mov_i2xmm, tmpReg, tmpIntReg, TYP_UINT); @@ -1158,7 +1158,7 @@ void CodeGen::genSIMDIntrinsic32BitConvert(GenTreeSIMD* simdNode) getEmitter()->emitIns_R_R_I(INS_pinsrw, emitTypeSize(TYP_INT), tmpReg, tmpIntReg, 3); } #endif - if (compiler->getSIMDInstructionSet() == InstructionSet_AVX) + if (compiler->getSIMDInstructionSet() == InstructionSet_AVX2) { inst_RV_RV(INS_vpbroadcastd, tmpReg, tmpReg, targetType, emitActualTypeSize(targetType)); } @@ -1257,7 +1257,7 @@ void CodeGen::genSIMDIntrinsic64BitConvert(GenTreeSIMD* simdNode) } else #endif - if (iset == InstructionSet_AVX || (baseType == TYP_ULONG)) + if (iset == InstructionSet_AVX2 || (baseType == TYP_ULONG)) { tmpReg = simdNode->ExtractTempReg(RBM_ALLFLOAT); tmpReg2 = simdNode->GetSingleTempReg(RBM_ALLFLOAT); @@ -1313,7 +1313,7 @@ void CodeGen::genSIMDIntrinsic64BitConvert(GenTreeSIMD* simdNode) inst_RV_RV(INS_mov_i2xmm, tmpReg, tmpIntReg, TYP_UINT); getEmitter()->emitIns_R_I(INS_pslldq, EA_16BYTE, tmpReg, 4); #endif - if (iset == InstructionSet_AVX) + if (iset == InstructionSet_AVX2) { inst_RV_RV(INS_vpbroadcastq, tmpReg, tmpReg, simdType, emitActualTypeSize(simdType)); } @@ -1335,7 +1335,7 @@ void CodeGen::genSIMDIntrinsic64BitConvert(GenTreeSIMD* simdNode) inst_RV_RV(INS_mov_i2xmm, tmpReg, tmpIntReg, TYP_UINT); getEmitter()->emitIns_R_I(INS_pslldq, EA_16BYTE, tmpReg, 4); #endif - if (iset == InstructionSet_AVX) + if (iset == InstructionSet_AVX2) { inst_RV_RV(INS_vpbroadcastq, tmpReg, tmpReg, simdType, emitActualTypeSize(simdType)); } @@ -1357,7 +1357,7 @@ void CodeGen::genSIMDIntrinsic64BitConvert(GenTreeSIMD* simdNode) instruction rightShiftIns = getOpForSIMDIntrinsic(SIMDIntrinsicShiftRightInternal, TYP_SIMD16); instruction leftShiftIns = getOpForSIMDIntrinsic(SIMDIntrinsicShiftLeftInternal, TYP_SIMD16); - if (iset == InstructionSet_AVX) + if (iset == InstructionSet_AVX2) { // Extract the high 16-bits getEmitter()->emitIns_R_R_I(INS_vextracti128, EA_32BYTE, tmpReg, op1Reg, 0x01); @@ -1395,7 +1395,7 @@ void CodeGen::genSIMDIntrinsic64BitConvert(GenTreeSIMD* simdNode) inst_RV_RV(INS_movaps, targetReg, tmpReg, simdType, emitActualTypeSize(simdType)); } - if (iset == InstructionSet_AVX) + if (iset == InstructionSet_AVX2) { getEmitter()->emitIns_R_R_I(INS_vinsertf128, EA_32BYTE, targetReg, tmpReg2, 0x01); } @@ -1425,7 +1425,7 @@ void CodeGen::genSIMDIntrinsic64BitConvert(GenTreeSIMD* simdNode) inst_RV_RV(INS_mov_i2xmm, tmpReg, tmpIntReg, TYP_UINT); getEmitter()->emitIns_R_I(INS_pslldq, EA_16BYTE, tmpReg, 4); - if (iset == InstructionSet_AVX) + if (iset == InstructionSet_AVX2) { inst_RV_RV(INS_vpbroadcastq, tmpReg, tmpReg, simdType, emitActualTypeSize(simdType)); } @@ -1443,7 +1443,7 @@ void CodeGen::genSIMDIntrinsic64BitConvert(GenTreeSIMD* simdNode) inst_RV_RV(INS_mov_i2xmm, tmpReg, tmpIntReg, TYP_UINT); getEmitter()->emitIns_R_I(INS_pslldq, EA_16BYTE, tmpReg, 4); - if (iset == InstructionSet_AVX) + if (iset == InstructionSet_AVX2) { inst_RV_RV(INS_vpbroadcastq, tmpReg, tmpReg, simdType, emitActualTypeSize(simdType)); } @@ -1468,7 +1468,7 @@ void CodeGen::genSIMDIntrinsic64BitConvert(GenTreeSIMD* simdNode) instruction rightShiftIns = getOpForSIMDIntrinsic(SIMDIntrinsicShiftRightInternal, TYP_SIMD16); instruction leftShiftIns = getOpForSIMDIntrinsic(SIMDIntrinsicShiftLeftInternal, TYP_SIMD16); - if (iset == InstructionSet_AVX) + if (iset == InstructionSet_AVX2) { // Extract the high 16-bits getEmitter()->emitIns_R_R_I(INS_vextractf128, EA_32BYTE, tmpReg, op1Reg, 0x01); @@ -1504,7 +1504,7 @@ void CodeGen::genSIMDIntrinsic64BitConvert(GenTreeSIMD* simdNode) // Merge or copy the results (only at this point are we done with op1Reg). assert(tmpReg != targetReg); inst_RV_RV(INS_por, targetReg, tmpReg, simdType, emitActualTypeSize(simdType)); - if (iset == InstructionSet_AVX) + if (iset == InstructionSet_AVX2) { getEmitter()->emitIns_R_R_I(INS_vinserti128, EA_32BYTE, targetReg, tmpReg2, 0x01); } @@ -1526,7 +1526,7 @@ void CodeGen::genSIMDExtractUpperHalf(GenTreeSIMD* simdNode, regNumber srcReg, r { var_types simdType = simdNode->TypeGet(); emitAttr emitSize = emitActualTypeSize(simdType); - if (compiler->getSIMDInstructionSet() == InstructionSet_AVX) + if (compiler->getSIMDInstructionSet() == InstructionSet_AVX2) { instruction extractIns = varTypeIsFloating(simdNode->gtSIMDBaseType) ? INS_vextractf128 : INS_vextracti128; getEmitter()->emitIns_R_R_I(extractIns, EA_32BYTE, tgtReg, srcReg, 0x01); @@ -1588,7 +1588,7 @@ void CodeGen::genSIMDIntrinsicWiden(GenTreeSIMD* simdNode) regNumber tmpReg = simdNode->GetSingleTempReg(RBM_ALLFLOAT); assert(tmpReg != op1Reg); - if (iset == InstructionSet_AVX) + if (iset == InstructionSet_AVX2) { // permute op1Reg and put it into targetReg unsigned ival = 0xd4; @@ -1658,7 +1658,7 @@ void CodeGen::genSIMDIntrinsicNarrow(GenTreeSIMD* simdNode) } else if (varTypeIsLong(baseType)) { - if (iset == InstructionSet_AVX) + if (iset == InstructionSet_AVX2) { // We have 8 long elements, 0-3 in op1Reg, 4-7 in op2Reg. // We will generate the following: @@ -1720,7 +1720,7 @@ void CodeGen::genSIMDIntrinsicNarrow(GenTreeSIMD* simdNode) instruction shiftLeftIns = getOpForSIMDIntrinsic(SIMDIntrinsicShiftLeftInternal, baseType); instruction shiftRightIns = getOpForSIMDIntrinsic(SIMDIntrinsicShiftRightInternal, baseType); - if (iset == InstructionSet_AVX) + if (iset == InstructionSet_AVX2) { regNumber tmpReg = simdNode->ExtractTempReg(RBM_ALLFLOAT); regNumber tmpReg2 = simdNode->GetSingleTempReg(RBM_ALLFLOAT); @@ -2414,7 +2414,7 @@ void CodeGen::genSIMDIntrinsicDotProduct(GenTreeSIMD* simdNode) #endif // tmpReg1 = op1 * op2 - if (iset == InstructionSet_AVX) + if (iset == InstructionSet_AVX2) { // On AVX take advantage 3 operand form of pmulld inst_RV_RV_RV(INS_pmulld, tmpReg1, op1Reg, op2Reg, emitTypeSize(simdEvalType)); @@ -2611,7 +2611,7 @@ void CodeGen::genSIMDIntrinsicGetItem(GenTreeSIMD* simdNode) if (byteShiftCnt >= 16) { - assert(compiler->getSIMDInstructionSet() == InstructionSet_AVX); + assert(compiler->getSIMDInstructionSet() == InstructionSet_AVX2); byteShiftCnt -= 16; regNumber newSrcReg; if (varTypeIsFloating(baseType)) @@ -2671,7 +2671,7 @@ void CodeGen::genSIMDIntrinsicGetItem(GenTreeSIMD* simdNode) // low 3 bits of index, but it's better to use the right value. if (index > 8) { - assert(compiler->getSIMDInstructionSet() == InstructionSet_AVX); + assert(compiler->getSIMDInstructionSet() == InstructionSet_AVX2); index -= 8; }