Skip to content
This repository has been archived by the owner on Jan 23, 2023. It is now read-only.

Add optimized UTF-8 validation and transcoding apis, hook them up to UTF8Encoding #21948

Merged
Merged
Show file tree
Hide file tree
Changes from 22 commits
Commits
Show all changes
32 commits
Select commit Hold shift + click to select a range
abd7add
Add optimized UTF-8 validation and transcoding logic
GrabYourPitchforks Mar 26, 2019
21721c2
Merge remote-tracking branch 'origin/master' into utf8_validation_apis
GrabYourPitchforks Mar 27, 2019
7198253
Merge commit 'aab338efb65808acc1ff9b7f95bd3dd5f0a6a3be' into utf8_val…
GrabYourPitchforks Apr 3, 2019
effeb6e
Hook up new UTF-8 logic through UTF8Encoding
GrabYourPitchforks Apr 3, 2019
4caf96a
Improve perf of "is ASCII?" inner loop in UTF-8 validation.
GrabYourPitchforks Apr 3, 2019
3f939ee
Remove SSE41.X64 optimization from AsciiUtility
GrabYourPitchforks Apr 3, 2019
2be465e
Merge remote-tracking branch 'origin/master' into utf8_validation_apis_3
GrabYourPitchforks Apr 4, 2019
fbb7246
Merge remote-tracking branch 'origin/master' into utf8_validation_apis_3
GrabYourPitchforks Apr 5, 2019
15a361a
Merge remote-tracking branch 'origin/master' into utf8_validation_apis_3
GrabYourPitchforks Apr 8, 2019
5995f81
Clarify that vector read is unaligned
GrabYourPitchforks Apr 8, 2019
c4e94df
Simplify vectorized logic; remove unnecessary adjustment
GrabYourPitchforks Apr 8, 2019
5db40d7
Merge remote-tracking branch 'origin/master' into utf8_validation_apis_3
GrabYourPitchforks Apr 9, 2019
f4519f5
PR feedback: GetElement(0) -> Sse2.StoreLow
GrabYourPitchforks Apr 9, 2019
9baf5be
PR feedback
GrabYourPitchforks Apr 9, 2019
2a3fe36
PR feedback: Enable SSE2 in Utf16Utility code
GrabYourPitchforks Apr 10, 2019
2d47f1b
Expand masks in Utf8Utility, fix const in fallback path
GrabYourPitchforks Apr 10, 2019
356ae17
Temporarily disable failing CoreFX tests
GrabYourPitchforks Apr 10, 2019
5257614
Fix incorrect Debug.Assert statements
GrabYourPitchforks Apr 10, 2019
6cc74a9
Add comments tracking JIT workarounds.
GrabYourPitchforks Apr 10, 2019
60b8c4f
Rename DWORD -> UInt32 throughout API surface
GrabYourPitchforks Apr 10, 2019
bae40fa
Re-flow Utf8Utility.Helpers
GrabYourPitchforks Apr 10, 2019
eda0c04
Merge remote-tracking branch 'origin/master' into utf8_validation_apis_3
GrabYourPitchforks Apr 11, 2019
3e09d17
PR feedback: Fix typos
GrabYourPitchforks Apr 11, 2019
56fa69d
PR feedback: CountNumberOfLeadingAsciiBytesFrom24BitInteger
GrabYourPitchforks Apr 11, 2019
8f2860d
PR feedback: Remove redundant endianess checks
GrabYourPitchforks Apr 11, 2019
ce13100
PR feedback: Validate nint definitions
GrabYourPitchforks Apr 11, 2019
c3aa431
PR feedback: Clarify charIsNonAscii vector usage
GrabYourPitchforks Apr 11, 2019
d8e2589
PR feedback: document tempUtf8CodeUnitCountAdjustment usage
GrabYourPitchforks Apr 11, 2019
7558272
Fix compilation failure in Utf16Utility
GrabYourPitchforks Apr 11, 2019
affc24a
PR feedback: Clarify 3-byte sequence processing
GrabYourPitchforks Apr 11, 2019
0adca8b
Add missing check to 3-byte processing logic
GrabYourPitchforks Apr 11, 2019
e307d14
Clarify comment in 3-byte processing
GrabYourPitchforks Apr 11, 2019
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
Expand Up @@ -768,6 +768,7 @@
<Compile Include="$(MSBuildThisFileDirectory)System\SystemException.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\Text\ASCIIEncoding.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\Text\ASCIIUtility.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\Text\ASCIIUtility.Helpers.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\Text\StringBuilderCache.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\Text\CodePageDataItem.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\Text\Decoder.cs" />
Expand Down Expand Up @@ -799,13 +800,17 @@
<Compile Include="$(MSBuildThisFileDirectory)System\Text\UnicodeDebug.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\Text\UnicodeEncoding.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\Text\UnicodeUtility.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\Text\Utf16Utility.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\Text\UTF32Encoding.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\Text\UTF7Encoding.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\Text\UTF8Encoding.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\Text\ValueStringBuilder.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\Text\Unicode\Utf16Utility.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\Text\Unicode\Utf16Utility.Validation.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\Text\Unicode\Utf8.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\Text\Unicode\Utf8Utility.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\Text\Unicode\Utf8Utility.Helpers.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\Text\Unicode\Utf8Utility.Transcoding.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\Text\Unicode\Utf8Utility.Validation.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\TimeSpan.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\ThreadAttributes.cs" />
<Compile Include="$(MSBuildThisFileDirectory)System\Threading\AbandonedMutexException.cs" />
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -8,7 +8,7 @@
using System.Runtime.CompilerServices;
using System.Runtime.InteropServices;
using System.Runtime.Serialization;
using System.Text;
using System.Text.Unicode;
using Internal.Runtime.CompilerServices;

namespace System.Globalization
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,7 @@
using System.Runtime.InteropServices;
using System.Runtime.Serialization;
using System.Text;
using System.Text.Unicode;
using Internal.Runtime.CompilerServices;

#if BIT64
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,7 @@
using System.Buffers;
using System.Diagnostics;
using System.Runtime.InteropServices;
using System.Text;
using System.Text.Unicode;
using Internal.Runtime.CompilerServices;

#if BIT64
Expand Down
Original file line number Diff line number Diff line change
@@ -0,0 +1,77 @@
// Licensed to the .NET Foundation under one or more agreements.
// The .NET Foundation licenses this file to you under the MIT license.
// See the LICENSE file in the project root for more information.

using System.Diagnostics;
using System.Numerics;
using System.Runtime.CompilerServices;

namespace System.Text
{
internal static partial class ASCIIUtility
{
/// <summary>
/// A mask which selects only the high bit of each byte of the given <see cref="uint"/>.
/// </summary>
private const uint UInt32HighBitsOnlyMask = 0x80808080u;

/// <summary>
/// A mask which selects only the high bit of each byte of the given <see cref="ulong"/>.
/// </summary>
private const ulong UInt64HighBitsOnlyMask = 0x80808080_80808080ul;

/// <summary>
/// Returns <see langword="true"/> iff all bytes in <paramref name="value"/> are ASCII.
/// </summary>
[MethodImpl(MethodImplOptions.AggressiveInlining)]
internal static bool AllBytesInUInt32AreAscii(uint value)
{
// If the high bit of any byte is set, that byte is non-ASCII.

return (value & UInt32HighBitsOnlyMask) == 0;
}


/// <summary>
/// Given a 24-bit integer which represents a three-byte buffer read in machine endianness,
/// counts the number of consecutive ASCII bytes starting from the beginning of the buffer.
/// Returns a value 0 - 3, inclusive. (The caller is responsible for ensuring that an all-
/// ASCII value does not make its way to this method.)
/// </summary>
[MethodImpl(MethodImplOptions.AggressiveInlining)]
internal static uint CountNumberOfLeadingAsciiBytesFrom24BitInteger(uint value)
{
Debug.Assert(!AllBytesInUInt32AreAscii(value), "Caller shouldn't provide an all-ASCII value.");
GrabYourPitchforks marked this conversation as resolved.
Show resolved Hide resolved

if (BitConverter.IsLittleEndian)
{
return (uint)BitOperations.TrailingZeroCount(value & UInt32HighBitsOnlyMask) >> 3;
}
else
{
// The 'allBytesUpToNowAreAscii' DWORD uses bit twiddling to hold a 1 or a 0 depending
// on whether all processed bytes were ASCII. Then we accumulate all of the
// results to calculate how many consecutive ASCII bytes are present.

value = ~value;

// Read first byte
value = BitOperations.RotateLeft(value, 1);
uint allBytesUpToNowAreAscii = value & 1;
uint numAsciiBytes = allBytesUpToNowAreAscii;

// Read second byte
value = BitOperations.RotateLeft(value, 8);
allBytesUpToNowAreAscii &= value;
numAsciiBytes += allBytesUpToNowAreAscii;

// Read third byte
value = BitOperations.RotateLeft(value, 8);
allBytesUpToNowAreAscii &= value;
numAsciiBytes += allBytesUpToNowAreAscii;

return numAsciiBytes;
GrabYourPitchforks marked this conversation as resolved.
Show resolved Hide resolved
}
}
}
}
104 changes: 7 additions & 97 deletions src/System.Private.CoreLib/shared/System/Text/ASCIIUtility.cs
Original file line number Diff line number Diff line change
Expand Up @@ -21,19 +21,12 @@ namespace System.Text
{
internal static partial class ASCIIUtility
{
/// <summary>
/// Returns <see langword="true"/> iff all bytes in <paramref name="value"/> are ASCII.
/// </summary>
[MethodImpl(MethodImplOptions.AggressiveInlining)]
private static bool AllBytesInUInt32AreAscii(uint value)
{
return ((value & 0x80808080u) == 0);
}

[MethodImpl(MethodImplOptions.AggressiveInlining)]
private static bool AllBytesInUInt64AreAscii(ulong value)
{
return ((value & 0x80808080_80808080ul) == 0);
// If the high bit of any byte is set, that byte is non-ASCII.

return ((value & UInt64HighBitsOnlyMask) == 0);
}

/// <summary>
Expand All @@ -54,56 +47,6 @@ private static bool AllCharsInUInt64AreAscii(ulong value)
return ((value & ~0x007F007F_007F007Ful) == 0);
}

/// <summary>
/// Given a 24-bit integer which represents a three-byte buffer read in machine endianness,
/// counts the number of consecutive ASCII bytes starting from the beginning of the buffer.
/// Returns a value 0 - 3, inclusive.
/// </summary>
[MethodImpl(MethodImplOptions.AggressiveInlining)]
private static uint CountNumberOfLeadingAsciiBytesFrom24BitInteger(uint value)
{
// This implementation seems to have better performance than tzcnt.

// The 'allBytesUpToNowAreAscii' DWORD uses bit twiddling to hold a 1 or a 0 depending
// on whether all processed bytes were ASCII. Then we accumulate all of the
// results to calculate how many consecutive ASCII bytes are present.

value = ~value;

if (BitConverter.IsLittleEndian)
{
// Read first byte
uint allBytesUpToNowAreAscii = (value >>= 7) & 1;
uint numAsciiBytes = allBytesUpToNowAreAscii;

// Read second byte
allBytesUpToNowAreAscii &= (value >>= 8);
numAsciiBytes += allBytesUpToNowAreAscii;

// Read third byte
allBytesUpToNowAreAscii &= (value >>= 8);
numAsciiBytes += allBytesUpToNowAreAscii;

return numAsciiBytes;
}
else
{
// Read first byte
uint allBytesUpToNowAreAscii = (value = ROL32(value, 1)) & 1;
uint numAsciiBytes = allBytesUpToNowAreAscii;

// Read second byte
allBytesUpToNowAreAscii &= (value = ROL32(value, 8));
numAsciiBytes += allBytesUpToNowAreAscii;

// Read third byte
allBytesUpToNowAreAscii &= (value = ROL32(value, 8));
numAsciiBytes += allBytesUpToNowAreAscii;

return numAsciiBytes;
}
}

/// <summary>
/// Given a DWORD which represents two packed chars in machine-endian order,
/// <see langword="true"/> iff the first char (in machine-endian order) is ASCII.
Expand Down Expand Up @@ -461,7 +404,7 @@ private static unsafe nuint GetIndexOfFirstNonAsciiByte_Sse2(byte* pBuffer, nuin
// Clear everything but the high bit of each byte, then tzcnt.
// Remember the / 8 at the end to convert bit count to byte count.

candidateUInt64 &= 0x80808080_80808080ul;
candidateUInt64 &= UInt64HighBitsOnlyMask;
pBuffer += (nuint)(Bmi1.X64.TrailingZeroCount(candidateUInt64) / 8);
goto Finish;
}
Expand Down Expand Up @@ -1395,17 +1338,7 @@ private static unsafe nuint NarrowUtf16ToAscii_Sse2(char* pUtf16Buffer, byte* pA
// Turn the 8 ASCII chars we just read into 8 ASCII bytes, then copy it to the destination.

Vector128<byte> asciiVector = Sse2.PackUnsignedSaturate(utf16VectorFirst, utf16VectorFirst);

if (Sse41.X64.IsSupported)
{
// Use PEXTRQ instruction if available, since it can extract from the vector directly to the destination address.
Unsafe.WriteUnaligned<ulong>(pAsciiBuffer, Sse41.X64.Extract(asciiVector.AsUInt64(), 0));
}
else
{
// Bounce this through a temporary register (with potential stack spillage) before writing to memory.
Unsafe.WriteUnaligned<ulong>(pAsciiBuffer, asciiVector.AsUInt64().GetElement(0));
}
Sse2.StoreLow((ulong*)pAsciiBuffer, asciiVector.AsUInt64()); // ulong* calculated here is UNALIGNED

nuint currentOffsetInElements = SizeOfVector128 / 2; // we processed 8 elements so far

Expand Down Expand Up @@ -1444,16 +1377,7 @@ private static unsafe nuint NarrowUtf16ToAscii_Sse2(char* pUtf16Buffer, byte* pA

// Turn the 8 ASCII chars we just read into 8 ASCII bytes, then copy it to the destination.
asciiVector = Sse2.PackUnsignedSaturate(utf16VectorFirst, utf16VectorFirst);

// See comments earlier in this method for information about how this works.
if (Sse41.X64.IsSupported)
{
Unsafe.WriteUnaligned<ulong>(pAsciiBuffer + currentOffsetInElements, Sse41.X64.Extract(asciiVector.AsUInt64(), 0));
}
else
{
Unsafe.WriteUnaligned<ulong>(pAsciiBuffer + currentOffsetInElements, asciiVector.AsUInt64().GetElement(0));
}
Sse2.StoreLow((ulong*)(pAsciiBuffer + currentOffsetInElements), asciiVector.AsUInt64()); // ulong* calculated here is UNALIGNED
}

// Calculate how many elements we wrote in order to get pAsciiBuffer to its next alignment
Expand Down Expand Up @@ -1529,26 +1453,12 @@ private static unsafe nuint NarrowUtf16ToAscii_Sse2(char* pUtf16Buffer, byte* pA

Debug.Assert(((nuint)pAsciiBuffer + currentOffsetInElements) % sizeof(ulong) == 0, "Destination should be ulong-aligned.");

// See comments earlier in this method for information about how this works.
if (Sse41.X64.IsSupported)
{
*(ulong*)(pAsciiBuffer + currentOffsetInElements) = Sse41.X64.Extract(asciiVector.AsUInt64(), 0);
}
else
{
*(ulong*)(pAsciiBuffer + currentOffsetInElements) = asciiVector.AsUInt64().GetElement(0);
}
Sse2.StoreLow((ulong*)(pAsciiBuffer + currentOffsetInElements), asciiVector.AsUInt64()); // ulong* calculated here is aligned
currentOffsetInElements += SizeOfVector128 / 2;

goto Finish;
}

/// <summary>
/// Rotates a <see cref="uint"/> left. The JIT is smart enough to turn this into a ROL / ROR instruction.
/// </summary>
[MethodImpl(MethodImplOptions.AggressiveInlining)]
private static uint ROL32(uint value, int shift) => (value << shift) | (value >> (32 - shift));

/// <summary>
/// Copies as many ASCII bytes (00..7F) as possible from <paramref name="pAsciiBuffer"/>
/// to <paramref name="pUtf16Buffer"/>, stopping when the first non-ASCII byte is encountered
Expand Down
11 changes: 10 additions & 1 deletion src/System.Private.CoreLib/shared/System/Text/DecoderNLS.cs
Original file line number Diff line number Diff line change
Expand Up @@ -266,6 +266,7 @@ internal int DrainLeftoverDataForGetCharCount(ReadOnlySpan<byte> bytes, out int
// to be in progress. Unlike EncoderNLS, this is simply a Debug.Assert. No exception is thrown.

Debug.Assert(_fallbackBuffer is null || _fallbackBuffer.Remaining == 0, "Should have no data remaining in the fallback buffer.");
Debug.Assert(HasLeftoverData, "Caller shouldn't invoke this routine unless there's leftover data in the decoder.");

// Copy the existing leftover data plus as many bytes as possible of the new incoming data
// into a temporary concated buffer, then get its char count by decoding it.
Expand Down Expand Up @@ -319,6 +320,7 @@ internal int DrainLeftoverDataForGetChars(ReadOnlySpan<byte> bytes, Span<char> c
// to be in progress. Unlike EncoderNLS, this is simply a Debug.Assert. No exception is thrown.

Debug.Assert(_fallbackBuffer is null || _fallbackBuffer.Remaining == 0, "Should have no data remaining in the fallback buffer.");
Debug.Assert(HasLeftoverData, "Caller shouldn't invoke this routine unless there's leftover data in the decoder.");

// Copy the existing leftover data plus as many bytes as possible of the new incoming data
// into a temporary concated buffer, then transcode it from bytes to chars.
Expand Down Expand Up @@ -370,6 +372,14 @@ internal int DrainLeftoverDataForGetChars(ReadOnlySpan<byte> bytes, Span<char> c

Finish:

// Report back the number of bytes (from the new incoming span) we consumed just now.
// This calculation is simple: it's the difference between the original leftover byte
// count and the number of bytes from the combined buffer we needed to decode the first
// scalar value. We need to report this before the call to SetLeftoverData /
// ClearLeftoverData because those methods will overwrite the _leftoverByteCount field.

bytesConsumed = combinedBufferBytesConsumed - _leftoverByteCount;

if (persistNewCombinedBuffer)
{
Debug.Assert(combinedBufferBytesConsumed == combinedBuffer.Length, "We should be asked to persist the entire combined buffer.");
Expand All @@ -380,7 +390,6 @@ internal int DrainLeftoverDataForGetChars(ReadOnlySpan<byte> bytes, Span<char> c
ClearLeftoverData(); // the buffer contains no partial data; we'll go down the normal paths
}

bytesConsumed = combinedBufferBytesConsumed - _leftoverByteCount; // amount of 'bytes' buffer consumed just now
return charsWritten;

DestinationTooSmall:
Expand Down
21 changes: 16 additions & 5 deletions src/System.Private.CoreLib/shared/System/Text/Encoding.Internal.cs
Original file line number Diff line number Diff line change
Expand Up @@ -850,8 +850,14 @@ private unsafe int GetCharCountWithFallback(byte* pOriginalBytes, int originalBy

ReadOnlySpan<byte> bytes = new ReadOnlySpan<byte>(pOriginalBytes, originalByteCount).Slice(bytesConsumedSoFar);

int totalCharCount = decoder.DrainLeftoverDataForGetCharCount(bytes, out int bytesConsumedJustNow);
bytes = bytes.Slice(bytesConsumedJustNow);
int bytesConsumedJustNow = 0;
int totalCharCount = 0;

if (decoder.HasLeftoverData)
{
totalCharCount = decoder.DrainLeftoverDataForGetCharCount(bytes, out bytesConsumedJustNow);
bytes = bytes.Slice(bytesConsumedJustNow);
}

// Now try invoking the "fast path" (no fallback) implementation.
// We can use Unsafe.AsPointer here since these spans are created from pinned data (raw pointers).
Expand Down Expand Up @@ -1120,10 +1126,15 @@ private protected unsafe int GetCharsWithFallback(byte* pOriginalBytes, int orig
ReadOnlySpan<byte> bytes = new ReadOnlySpan<byte>(pOriginalBytes, originalByteCount).Slice(bytesConsumedSoFar);
Span<char> chars = new Span<char>(pOriginalChars, originalCharCount).Slice(charsWrittenSoFar);

int charsWrittenJustNow = decoder.DrainLeftoverDataForGetChars(bytes, chars, out int bytesConsumedJustNow);
int bytesConsumedJustNow = 0;
int charsWrittenJustNow = 0;

bytes = bytes.Slice(bytesConsumedJustNow);
chars = chars.Slice(charsWrittenJustNow);
if (decoder.HasLeftoverData)
{
charsWrittenJustNow = decoder.DrainLeftoverDataForGetChars(bytes, chars, out bytesConsumedJustNow);
bytes = bytes.Slice(bytesConsumedJustNow);
chars = chars.Slice(charsWrittenJustNow);
}

Debug.Assert(!decoder.InternalHasFallbackBuffer || decoder.FallbackBuffer.Remaining == 0, "Should be no remaining fallback data at this point.");

Expand Down
1 change: 1 addition & 0 deletions src/System.Private.CoreLib/shared/System/Text/Rune.cs
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,7 @@
using System.Diagnostics;
using System.Globalization;
using System.Runtime.CompilerServices;
using System.Text.Unicode;

namespace System.Text
{
Expand Down
Loading