dotnet · tannergooding · Apr 7, 2021 · Jun 17, 2020 · Jun 17, 2020 · Jun 17, 2020
diff --git a/src/libraries/System.Private.CoreLib/src/System/String.Manipulation.cs b/src/libraries/System.Private.CoreLib/src/System/String.Manipulation.cs
@@ -6,6 +6,9 @@
 using System.Diagnostics;
 using System.Globalization;
 using System.Numerics;
+using System.Runtime.InteropServices;
+using System.Runtime.Intrinsics;
+using System.Runtime.Intrinsics.X86;
 using System.Text;
 using Internal.Runtime.CompilerServices;
 
@@ -1573,6 +1576,13 @@ private void MakeSeparatorList(ReadOnlySpan<char> separators, ref ValueListBuild
                 // Special-case the common cases of 1, 2, and 3 separators, with manual comparisons against each separator.
                 case 1:
                     sep0 = separators[0];
+
+                    if (Avx2.IsSupported && 16 <= Length)
+                    {
+                        MakeSeparatorListVectorized(ref sepListBuilder, sep0);
+                        return;
+                    }
+
                     for (int i = 0; i < Length; i++)
                     {
                         if (this[i] == sep0)
@@ -1584,6 +1594,13 @@ private void MakeSeparatorList(ReadOnlySpan<char> separators, ref ValueListBuild
                 case 2:
                     sep0 = separators[0];
                     sep1 = separators[1];
+
+                    if (Avx2.IsSupported && 16 <= Length)
+                    {
+                        MakeSeparatorListVectorized(ref sepListBuilder, sep0, sep1);
+                        return;
+                    }
+
                     for (int i = 0; i < Length; i++)
                     {
                         char c = this[i];
@@ -1597,6 +1614,13 @@ private void MakeSeparatorList(ReadOnlySpan<char> separators, ref ValueListBuild
                     sep0 = separators[0];
                     sep1 = separators[1];
                     sep2 = separators[2];
+
+                    if (Avx2.IsSupported && 16 <= Length)
+                    {
+                        MakeSeparatorListVectorized(ref sepListBuilder, sep0, sep1, sep2);
+                        return;
+                    }
+
                     for (int i = 0; i < Length; i++)
                     {
                         char c = this[i];
@@ -1630,6 +1654,72 @@ private void MakeSeparatorList(ReadOnlySpan<char> separators, ref ValueListBuild
             }
         }
 
+        /// <summary>
+        /// Scans this string 16 characters at a time with AVX2 and appends to <paramref name="sepListBuilder"/>
+        /// the index of every character that equals one of the given separators.
+        /// </summary>
+        /// <param name="sepListBuilder">Builder that receives the matching indices, in ascending order.</param>
+        /// <param name="c">First separator.</param>
+        /// <param name="c2">Optional second separator; ignored when <c>null</c>.</param>
+        /// <param name="c3">Optional third separator; ignored when <c>null</c>.</param>
+        /// <remarks>
+        /// The vector loop requires both <see cref="Avx2"/> and <see cref="Bmi2.X64"/>. When either is unavailable
+        /// (for example in a 32-bit process) the whole string is handled by the scalar loop instead.
+        /// </remarks>
+        private void MakeSeparatorListVectorized(ref ValueListBuilder<int> sepListBuilder, char c, char? c2 = null, char? c3 = null)
+        {
+            // Nibble k of this constant holds the value k, i.e. the position of the k-th char inside a 16-char block.
+            const ulong indicesConstant = 0xFEDCBA9876543210;
+
+            // Per 128-bit lane this selects bytes 2, 6, 10 and 14 and zeroes every other byte (index 0xFF).
+            // The lower lane writes its four bytes to positions 0-3 and the upper lane to positions 4-7, so that
+            // OR-ing both lanes yields one 64-bit value.
+            ReadOnlySpan<byte> shuffleConstantData = new byte[] {
+                0x02, 0x06, 0x0A, 0x0E, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
+                0xFF, 0xFF, 0xFF, 0xFF, 0x02, 0x06, 0x0A, 0x0E, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF
+            };
+            Vector256<byte> shuffleConstant = Unsafe.ReadUnaligned<Vector256<byte>>(ref MemoryMarshal.GetReference(shuffleConstantData));
+
+            // A missing separator is replaced by the first one: comparing against a duplicate cannot add matches,
+            // and it keeps the loops free of per-iteration null checks.
+            char sep2 = c2 ?? c;
+            char sep3 = c3 ?? c;
+
+            Vector256<ushort> v1 = Vector256.Create(c);
+            Vector256<ushort> v2 = Vector256.Create(sep2);
+            Vector256<ushort> v3 = Vector256.Create(sep3);
+
+            ref char c0 = ref MemoryMarshal.GetReference(this.AsSpan());
+
+            // Bmi2.X64.ParallelBitExtract and Sse2.X64.ConvertToUInt64 exist only in 64-bit processes, which
+            // Avx2.IsSupported alone does not guarantee. Without them the vector loop is skipped entirely.
+            int cond = Avx2.IsSupported && Bmi2.X64.IsSupported
+                ? Length - (Length % Vector256<ushort>.Count)
+                : 0;
+            int i = 0;
+
+            for (; i < cond; i += Vector256<ushort>.Count)
+            {
+                Vector256<ushort> charVector = ReadVector(ref c0, i);
+
+                // Each 16-bit element becomes 0xFFFF where the char equals any separator, 0 otherwise.
+                Vector256<ushort> cmp = Avx2.Or(
+                    Avx2.Or(Avx2.CompareEqual(charVector, v1), Avx2.CompareEqual(charVector, v2)),
+                    Avx2.CompareEqual(charVector, v3));
+
+                if (Avx.TestZ(cmp, cmp)) { continue; }
+
+                // Shifting every 64-bit element left by 4 bits makes each odd-numbered byte carry two results:
+                // its low nibble comes from the preceding char and its high nibble from its own char.
+                // The shuffle then gathers those bytes so that 'res' holds one nibble per char.
+                Vector256<byte> mask = Avx2.ShiftLeftLogical(cmp.AsUInt64(), 4).AsByte();
+                mask = Avx2.Shuffle(mask, shuffleConstant);
+
+                Vector128<byte> res = Sse2.Or(mask.GetLower(), mask.GetUpper());
+
+                // pext packs the index nibbles of the matching chars, lowest index first, into the low bits.
+                ulong extractedBits = Bmi2.X64.ParallelBitExtract(indicesConstant, Sse2.X64.ConvertToUInt64(res.AsUInt64()));
+
+                // At least one match exists here. Only the first packed nibble can be 0 (index 0), so the loop
+                // must append before testing for zero.
+                do
+                {
+                    sepListBuilder.Append(((byte)(extractedBits & 0xF)) + i);
+                    extractedBits >>= 4;
+                }
+                while (extractedBits != 0);
+            }
+
+            // Scalar loop for the remaining chars (or for all of them when the vector loop was skipped).
+            for (; i < Length; i++)
+            {
+                char curr = this[i];
+                if (curr == c || curr == sep2 || curr == sep3)
+                {
+                    sepListBuilder.Append(i);
+                }
+            }
+
+            // Reads 16 chars starting at c0 + offset without requiring any alignment.
+            static Vector256<ushort> ReadVector(ref char c0, int offset)
+            {
+                ref char ci = ref Unsafe.Add(ref c0, offset);
+                ref byte b = ref Unsafe.As<char, byte>(ref ci);
+                return Unsafe.ReadUnaligned<Vector256<ushort>>(ref b);
+            }
+        }
+
         /// <summary>
         /// Uses ValueListBuilder to create list that holds indexes of separators in string.
         /// </summary>