Tweak scalar paths

dotnet · MihaZupan · Nov 21, 2022 · Nov 19, 2022 · Nov 19, 2022 · Nov 19, 2022
commit 5b648d1185a00b52a9156bb4c904a0ecf375e30b
diff --git a/src/libraries/System.Private.CoreLib/src/System.Private.CoreLib.Shared.projitems b/src/libraries/System.Private.CoreLib/src/System.Private.CoreLib.Shared.projitems
@@ -431,8 +431,8 @@
     <Compile Include="$(MSBuildThisFileDirectory)System\IndexOfAnyValues\IndexOfAnyValues.cs" />
     <Compile Include="$(MSBuildThisFileDirectory)System\IndexOfAnyValues\IndexOfAnyValues.T.cs" />
     <Compile Include="$(MSBuildThisFileDirectory)System\IndexOfAnyValues\IndexOfAnyValuesDebugView.cs" />
-    <Compile Include="$(MSBuildThisFileDirectory)System\IndexOfAnyValues\IndexOfEmptyValues.cs" />
     <Compile Include="$(MSBuildThisFileDirectory)System\IndexOfAnyValues\IndexOfAnyValuesInRange.cs" />
+    <Compile Include="$(MSBuildThisFileDirectory)System\IndexOfAnyValues\IndexOfEmptyValues.cs" />
     <Compile Include="$(MSBuildThisFileDirectory)System\IndexOfAnyValues\ProbabilisticMap.cs" />
     <Compile Include="$(MSBuildThisFileDirectory)System\IndexOutOfRangeException.cs" />
     <Compile Include="$(MSBuildThisFileDirectory)System\InsufficientExecutionStackException.cs" />

diff --git a/src/libraries/System.Private.CoreLib/src/System/IndexOfAnyValues/BitVector256.cs b/src/libraries/System.Private.CoreLib/src/System/IndexOfAnyValues/BitVector256.cs
@@ -21,15 +21,20 @@ public void Set(int c)
 
         [MethodImpl(MethodImplOptions.AggressiveInlining)]
         public readonly bool Contains128(char c) =>
-            c < 128 && Contains((byte)c);
+            c < 128 && ContainsUnchecked(c);
 
         [MethodImpl(MethodImplOptions.AggressiveInlining)]
         public readonly bool Contains256(char c) =>
-            c < 256 && Contains((byte)c);
+            c < 256 && ContainsUnchecked(c);
 
         [MethodImpl(MethodImplOptions.AggressiveInlining)]
-        public readonly bool Contains(byte b)
+        public readonly bool Contains(byte b) =>
+            ContainsUnchecked(b);
+
+        [MethodImpl(MethodImplOptions.AggressiveInlining)]
+        private readonly bool ContainsUnchecked(int b)
         {
+            Debug.Assert(b < 256);
             uint offset = (uint)(b >> 5);
             uint significantBit = 1u << (b & 31);
             return (_values[offset] & significantBit) != 0;
@@ -40,7 +45,7 @@ public readonly char[] GetCharValues()
             var chars = new List<char>();
             for (int i = 0; i < 256; i++)
             {
-                if (Contains((byte)i))
+                if (ContainsUnchecked(i))
                 {
                     chars.Add((char)i);
                 }
@@ -53,7 +58,7 @@ public readonly byte[] GetByteValues()
             var bytes = new List<byte>();
             for (int i = 0; i < 256; i++)
             {
-                if (Contains((byte)i))
+                if (ContainsUnchecked(i))
                 {
                     bytes.Add((byte)i);
                 }

diff --git a/src/libraries/System.Private.CoreLib/src/System/IndexOfAnyValues/IndexOfAnyAsciiByteValues.cs b/src/libraries/System.Private.CoreLib/src/System/IndexOfAnyValues/IndexOfAnyAsciiByteValues.cs
@@ -58,12 +58,18 @@ private int LastIndexOfAny<TNegator>(ref byte searchSpace, int searchSpaceLength
         private int IndexOfAnyScalar<TNegator>(ref byte searchSpace, int searchSpaceLength)
             where TNegator : struct, IndexOfAnyAsciiSearcher.INegator
         {
-            for (int i = 0; i < searchSpaceLength; i++)
+            ref byte searchSpaceEnd = ref Unsafe.Add(ref searchSpace, searchSpaceLength);
+            ref byte cur = ref searchSpace;
+
+            while (!Unsafe.AreSame(ref cur, ref searchSpaceEnd))
             {
-                if (TNegator.NegateIfNeeded(_lookup.Contains(Unsafe.Add(ref searchSpace, i))))
+                byte b = cur;
+                if (TNegator.NegateIfNeeded(_lookup.Contains(b)))
                 {
-                    return i;
+                    return (int)Unsafe.ByteOffset(ref searchSpace, ref cur);
                 }
+
+                cur = ref Unsafe.Add(ref cur, 1);
             }
 
             return -1;
@@ -74,7 +80,8 @@ private int LastIndexOfAnyScalar<TNegator>(ref byte searchSpace, int searchSpace
         {
             for (int i = searchSpaceLength - 1; i >= 0; i--)
             {
-                if (TNegator.NegateIfNeeded(_lookup.Contains(Unsafe.Add(ref searchSpace, i))))
+                byte b = Unsafe.Add(ref searchSpace, i);
+                if (TNegator.NegateIfNeeded(_lookup.Contains(b)))
                 {
                     return i;
                 }

diff --git a/src/libraries/System.Private.CoreLib/src/System/IndexOfAnyValues/IndexOfAnyAsciiCharValues.cs b/src/libraries/System.Private.CoreLib/src/System/IndexOfAnyValues/IndexOfAnyAsciiCharValues.cs
@@ -58,12 +58,18 @@ private int LastIndexOfAny<TNegator>(ref char searchSpace, int searchSpaceLength
         private int IndexOfAnyScalar<TNegator>(ref char searchSpace, int searchSpaceLength)
             where TNegator : struct, IndexOfAnyAsciiSearcher.INegator
         {
-            for (int i = 0; i < searchSpaceLength; i++)
+            ref char searchSpaceEnd = ref Unsafe.Add(ref searchSpace, searchSpaceLength);
+            ref char cur = ref searchSpace;
+
+            while (!Unsafe.AreSame(ref cur, ref searchSpaceEnd))
             {
-                if (TNegator.NegateIfNeeded(_lookup.Contains128(Unsafe.Add(ref searchSpace, i))))
+                char c = cur;
+                if (TNegator.NegateIfNeeded(_lookup.Contains128(c)))
                 {
-                    return i;
+                    return (int)(Unsafe.ByteOffset(ref searchSpace, ref cur) / sizeof(char));
                 }
+
+                cur = ref Unsafe.Add(ref cur, 1);
             }
 
             return -1;
@@ -74,7 +80,8 @@ private int LastIndexOfAnyScalar<TNegator>(ref char searchSpace, int searchSpace
         {
             for (int i = searchSpaceLength - 1; i >= 0; i--)
             {
-                if (TNegator.NegateIfNeeded(_lookup.Contains128(Unsafe.Add(ref searchSpace, i))))
+                char c = Unsafe.Add(ref searchSpace, i);
+                if (TNegator.NegateIfNeeded(_lookup.Contains128(c)))
                 {
                     return i;
                 }

diff --git a/src/libraries/System.Private.CoreLib/src/System/IndexOfAnyValues/IndexOfAnyByteValues.cs b/src/libraries/System.Private.CoreLib/src/System/IndexOfAnyValues/IndexOfAnyByteValues.cs
@@ -55,12 +55,18 @@ private int LastIndexOfAny<TNegator>(ref byte searchSpace, int searchSpaceLength
         private int IndexOfAnyScalar<TNegator>(ref byte searchSpace, int searchSpaceLength)
             where TNegator : struct, IndexOfAnyAsciiSearcher.INegator
         {
-            for (int i = 0; i < searchSpaceLength; i++)
+            ref byte searchSpaceEnd = ref Unsafe.Add(ref searchSpace, searchSpaceLength);
+            ref byte cur = ref searchSpace;
+
+            while (!Unsafe.AreSame(ref cur, ref searchSpaceEnd))
             {
-                if (TNegator.NegateIfNeeded(_lookup.Contains(Unsafe.Add(ref searchSpace, i))))
+                byte b = cur;
+                if (TNegator.NegateIfNeeded(_lookup.Contains(b)))
                 {
-                    return i;
+                    return (int)(Unsafe.ByteOffset(ref searchSpace, ref cur));
                 }
+
+                cur = ref Unsafe.Add(ref cur, 1);
             }
 
             return -1;
@@ -71,7 +77,8 @@ private int LastIndexOfAnyScalar<TNegator>(ref byte searchSpace, int searchSpace
         {
             for (int i = searchSpaceLength - 1; i >= 0; i--)
             {
-                if (TNegator.NegateIfNeeded(_lookup.Contains(Unsafe.Add(ref searchSpace, i))))
+                byte b = Unsafe.Add(ref searchSpace, i);
+                if (TNegator.NegateIfNeeded(_lookup.Contains(b)))
                 {
                     return i;
                 }

diff --git a/src/libraries/System.Private.CoreLib/src/System/IndexOfAnyValues/IndexOfAnyCharValuesProbabilistic.cs b/src/libraries/System.Private.CoreLib/src/System/IndexOfAnyValues/IndexOfAnyCharValuesProbabilistic.cs
@@ -6,19 +6,15 @@
 
 namespace System.Buffers
 {
-    internal sealed class IndexOfAnyCharValuesProbabilistic<TContains> : IndexOfAnyValues<char>
-        where TContains : struct, IndexOfAnyValues.IStringContains
+    internal sealed class IndexOfAnyCharValuesProbabilistic : IndexOfAnyValues<char>
     {
-        private readonly ProbabilisticMap _map;
+        private ProbabilisticMap _map;
         private readonly string _values;
 
         public unsafe IndexOfAnyCharValuesProbabilistic(ReadOnlySpan<char> values)
         {
             _values = new string(values);
-
-            ProbabilisticMap map = default;
-            ProbabilisticMap.Initialize((uint*)&map, _values);
-            _map = map;
+            _map = new ProbabilisticMap(_values);
         }
 
         internal override char[] GetValues() => _values.ToCharArray();
@@ -39,44 +35,14 @@ internal override int LastIndexOfAny(ReadOnlySpan<char> span) =>
         internal override int LastIndexOfAnyExcept(ReadOnlySpan<char> span) =>
             LastIndexOfAny<IndexOfAnyAsciiSearcher.Negate>(ref MemoryMarshal.GetReference(span), span.Length);
 
+        [MethodImpl(MethodImplOptions.NoInlining)]
         private int IndexOfAny<TNegator>(ref char searchSpace, int searchSpaceLength)
-            where TNegator : struct, IndexOfAnyAsciiSearcher.INegator
-        {
-            string values = _values;
-
-            for (int i = 0; i < searchSpaceLength; i++)
-            {
-                int ch = Unsafe.Add(ref searchSpace, i);
-                if (TNegator.NegateIfNeeded(
-                        _map.IsCharBitSet((byte)ch) &&
-                        _map.IsCharBitSet((byte)(ch >> 8)) &&
-                        TContains.Contains(values, (char)ch)))
-                {
-                    return i;
-                }
-            }
-
-            return -1;
-        }
+            where TNegator : struct, IndexOfAnyAsciiSearcher.INegator =>
+            ProbabilisticMap.IndexOfAny<TNegator>(ref Unsafe.As<ProbabilisticMap, uint>(ref _map), ref searchSpace, searchSpaceLength, _values);
 
+        [MethodImpl(MethodImplOptions.NoInlining)]
         private int LastIndexOfAny<TNegator>(ref char searchSpace, int searchSpaceLength)
-            where TNegator : struct, IndexOfAnyAsciiSearcher.INegator
-        {
-            string values = _values;
-
-            for (int i = searchSpaceLength - 1; i >= 0; i--)
-            {
-                int ch = Unsafe.Add(ref searchSpace, i);
-                if (TNegator.NegateIfNeeded(
-                        _map.IsCharBitSet((byte)ch) &&
-                        _map.IsCharBitSet((byte)(ch >> 8)) &&
-                        TContains.Contains(values, (char)ch)))
-                {
-                    return i;
-                }
-            }
-
-            return -1;
-        }
+            where TNegator : struct, IndexOfAnyAsciiSearcher.INegator =>
+            ProbabilisticMap.LastIndexOfAny<TNegator>(ref Unsafe.As<ProbabilisticMap, uint>(ref _map), ref searchSpace, searchSpaceLength, _values);
     }
 }
diff --git a/src/libraries/System.Private.CoreLib/src/System/IndexOfAnyValues/IndexOfAnyLatin1CharValues.cs b/src/libraries/System.Private.CoreLib/src/System/IndexOfAnyValues/IndexOfAnyLatin1CharValues.cs
@@ -45,12 +45,18 @@ internal override int LastIndexOfAnyExcept(ReadOnlySpan<char> span) =>
         private int IndexOfAny<TNegator>(ref char searchSpace, int searchSpaceLength)
             where TNegator : struct, IndexOfAnyAsciiSearcher.INegator
         {
-            for (int i = 0; i < searchSpaceLength; i++)
+            ref char searchSpaceEnd = ref Unsafe.Add(ref searchSpace, searchSpaceLength);
+            ref char cur = ref searchSpace;
+
+            while (!Unsafe.AreSame(ref cur, ref searchSpaceEnd))
             {
-                if (TNegator.NegateIfNeeded(_lookup.Contains256(Unsafe.Add(ref searchSpace, i))))
+                char c = cur;
+                if (TNegator.NegateIfNeeded(_lookup.Contains256(c)))
                 {
-                    return i;
+                    return (int)(Unsafe.ByteOffset(ref searchSpace, ref cur) / sizeof(char));
                 }
+
+                cur = ref Unsafe.Add(ref cur, 1);
             }
 
             return -1;
@@ -61,7 +67,8 @@ private int LastIndexOfAny<TNegator>(ref char searchSpace, int searchSpaceLength
         {
             for (int i = searchSpaceLength - 1; i >= 0; i--)
             {
-                if (TNegator.NegateIfNeeded(_lookup.Contains256(Unsafe.Add(ref searchSpace, i))))
+                char c = Unsafe.Add(ref searchSpace, i);
+                if (TNegator.NegateIfNeeded(_lookup.Contains256(c)))
                 {
                     return i;
                 }

diff --git a/src/libraries/System.Private.CoreLib/src/System/IndexOfAnyValues/IndexOfAnyValues.cs b/src/libraries/System.Private.CoreLib/src/System/IndexOfAnyValues/IndexOfAnyValues.cs
@@ -127,9 +127,7 @@ ref Unsafe.As<char, short>(ref MemoryMarshal.GetReference(values)),
                 return new IndexOfAnyLatin1CharValues(values);
             }
 
-            return values.Length < Vector128<short>.Count
-                ? new IndexOfAnyCharValuesProbabilistic<ShortLoopContains>(values)
-                : new IndexOfAnyCharValuesProbabilistic<StringContains>(values);
+            return new IndexOfAnyCharValuesProbabilistic(values);
         }
 
         private static IndexOfAnyValues<T>? TryGetSingleRange<T>(ReadOnlySpan<T> values, out T maxInclusive)
@@ -169,32 +167,5 @@ ref Unsafe.As<char, short>(ref MemoryMarshal.GetReference(values)),
 
             return (IndexOfAnyValues<T>)(object)new IndexOfAnyValuesInRange<T>(min, max);
         }
-
-        internal interface IStringContains
-        {
-            public static abstract bool Contains(string s, char value);
-        }
-
-        private readonly struct StringContains : IStringContains
-        {
-            public static bool Contains(string s, char value) => s.Contains(value);
-        }
-
-        private readonly struct ShortLoopContains : IStringContains
-        {
-            [MethodImpl(MethodImplOptions.AggressiveInlining)]
-            public static bool Contains(string s, char value)
-            {
-                foreach (char c in s)
-                {
-                    if (value == c)
-                    {
-                        return true;
-                    }
-                }
-
-                return false;
-            }
-        }
     }
 }