[RegexDiff X64] [stephentoub] Avoid extra boundary checks when preceded/suc ...

[Job](https://mihubot.xyz/runtime-utils/E2rNflNA) completed in 18 minutes 16 seconds (remote runner delay: 1 minute 14 seconds).
https://github.com/dotnet/runtime/pull/118105
Using arguments: ````regexdiff````


3865 out of 18857 patterns have generated source code changes.

<details>
<summary>Examples of GeneratedRegex source diffs</summary>

<details>
<summary>&quot;{\\s*(?&lt;P&gt;\\D\\w*)\\s*\\:\\s*var\\(\\s*(?&lt;B&gt; ...&quot; (9881 uses)</summary>

```c#
[GeneratedRegex("{\\s*(?<P>\\D\\w*)\\s*\\:\\s*var\\(\\s*(?<B>\\D\\w*)\\s*\\)\\s*(;\\s*(?<P>\\D\\w*)\\s*\\:\\s*var\\(\\s*(?<B>\\D\\w*)\\s*\\)\\s*\\s*)*}")]
```

```diff
         [MethodImpl(MethodImplOptions.AggressiveInlining)]
         internal static bool IsWordChar(char ch)
         {
-            // Mask of Unicode categories that combine to form [\w]
-            const int WordCategoriesMask =
-                1 << (int)UnicodeCategory.UppercaseLetter |
-                1 << (int)UnicodeCategory.LowercaseLetter |
-                1 << (int)UnicodeCategory.TitlecaseLetter |
-                1 << (int)UnicodeCategory.ModifierLetter |
-                1 << (int)UnicodeCategory.OtherLetter |
-                1 << (int)UnicodeCategory.NonSpacingMark |
-                1 << (int)UnicodeCategory.DecimalDigitNumber |
-                1 << (int)UnicodeCategory.ConnectorPunctuation;
-        
-            // Bitmap for whether each character 0 through 127 is in [\w]
-            ReadOnlySpan<byte> ascii = new byte[]
-            {
-                0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xFF, 0x03,
-                0xFE, 0xFF, 0xFF, 0x87, 0xFE, 0xFF, 0xFF, 0x07
-            };
-        
             // If the char is ASCII, look it up in the bitmap. Otherwise, query its Unicode category.
+            ReadOnlySpan<byte> ascii = WordCharBitmap;
             int chDiv8 = ch >> 3;
             return (uint)chDiv8 < (uint)ascii.Length ?
                 (ascii[chDiv8] & (1 << (ch & 0x7))) != 0 :
                 StackPush(ref stack, ref pos, arg0, arg1, arg2);
             }
         }
+        
+        /// <summary>Provides a mask of Unicode categories that combine to form [\w].</summary>
+        private const int WordCategoriesMask =
+            1 << (int)UnicodeCategory.UppercaseLetter |
+            1 << (int)UnicodeCategory.LowercaseLetter |
+            1 << (int)UnicodeCategory.TitlecaseLetter |
+            1 << (int)UnicodeCategory.ModifierLetter |
+            1 << (int)UnicodeCategory.OtherLetter |
+            1 << (int)UnicodeCategory.NonSpacingMark |
+            1 << (int)UnicodeCategory.DecimalDigitNumber |
+            1 << (int)UnicodeCategory.ConnectorPunctuation;
+        
+        /// <summary>Gets a bitmap for whether each character 0 through 127 is in [\w]</summary>
+        private static ReadOnlySpan<byte> WordCharBitmap => new byte[]
+            {
+                0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xFF, 0x03,
+                0xFE, 0xFF, 0xFF, 0x87, 0xFE, 0xFF, 0xFF, 0x07
+            };
+        
     }
 }
```

</details>
<details>
<summary>&quot;[A-z-[dDfFiIoOqQuUwWzZ]]\\d[A-z-[dDfFiIoOqQu ...&quot; (5703 uses)</summary>

```c#
[GeneratedRegex("[A-z-[dDfFiIoOqQuUwWzZ]]\\d[A-z-[dDfFiIoOqQuU]] *\\d[A-z-[dDfFiIoOqQuU]]\\d\\b", RegexOptions.IgnoreCase | RegexOptions.Singleline | RegexOptions.CultureInvariant)]
```

```diff
              }
              
              // Match if at a word boundary.
-               if (!Utilities.IsBoundary(inputSpan, pos + 6))
+               if (!Utilities.IsPostWordCharBoundary(inputSpan, pos + 6))
              {
                  return false; // The input didn't match.
              }
  /// <summary>Whether <see cref="s_defaultTimeout"/> is non-infinite.</summary>
  internal static readonly bool s_hasTimeout = s_defaultTimeout != Regex.InfiniteMatchTimeout;
  
-   /// <summary>Determines whether the specified index is a boundary.</summary>
+   /// <summary>Determines whether the specified index is a boundary word character.</summary>
+   /// <remarks>This is the same as \w plus U+200C ZERO WIDTH NON-JOINER and U+200D ZERO WIDTH JOINER.</remarks>
  [MethodImpl(MethodImplOptions.AggressiveInlining)]
-   internal static bool IsBoundary(ReadOnlySpan<char> inputSpan, int index)
+   internal static bool IsBoundaryWordChar(char ch)
  {
-       int indexMinus1 = index - 1;
-       return ((uint)indexMinus1 < (uint)inputSpan.Length && IsBoundaryWordChar(inputSpan[indexMinus1])) !=
-              ((uint)index < (uint)inputSpan.Length && IsBoundaryWordChar(inputSpan[index]));
-   
-       static bool IsBoundaryWordChar(char ch) => IsWordChar(ch) || (ch == '\u200C' | ch == '\u200D');
+       ReadOnlySpan<byte> ascii = WordCharBitmap;
+       int chDiv8 = ch >> 3;
+       return (uint)chDiv8 < (uint)ascii.Length ?
+           (ascii[chDiv8] & (1 << (ch & 0x7))) != 0 :
+           ((WordCategoriesMask & (1 << (int)CharUnicodeInfo.GetUnicodeCategory(ch))) != 0) || (ch is '‌' or '‍');
  }
  
-   /// <summary>Determines whether the character is part of the [\w] set.</summary>
+   /// <summary>Determines whether the specified index is a boundary.</summary>
+   /// <remarks>This variant is only employed when the previous character has already been validated as a word character.</remarks>
  [MethodImpl(MethodImplOptions.AggressiveInlining)]
-   internal static bool IsWordChar(char ch)
-   {
-       // Mask of Unicode categories that combine to form [\w]
-       const int WordCategoriesMask =
-           1 << (int)UnicodeCategory.UppercaseLetter |
-           1 << (int)UnicodeCategory.LowercaseLetter |
-           1 << (int)UnicodeCategory.TitlecaseLetter |
-           1 << (int)UnicodeCategory.ModifierLetter |
-           1 << (int)UnicodeCategory.OtherLetter |
-           1 << (int)UnicodeCategory.NonSpacingMark |
-           1 << (int)UnicodeCategory.DecimalDigitNumber |
-           1 << (int)UnicodeCategory.ConnectorPunctuation;
+   internal static bool IsPostWordCharBoundary(ReadOnlySpan<char> inputSpan, int index) =>
+       ((uint)index >= (uint)inputSpan.Length || !IsBoundaryWordChar(inputSpan[index]));
  
-       // Bitmap for whether each character 0 through 127 is in [\w]
-       ReadOnlySpan<byte> ascii = new byte[]
+   /// <summary>Provides a mask of Unicode categories that combine to form [\w].</summary>
+   private const int WordCategoriesMask =
+       1 << (int)UnicodeCategory.UppercaseLetter |
+       1 << (int)UnicodeCategory.LowercaseLetter |
+       1 << (int)UnicodeCategory.TitlecaseLetter |
+       1 << (int)UnicodeCategory.ModifierLetter |
+       1 << (int)UnicodeCategory.OtherLetter |
+       1 << (int)UnicodeCategory.NonSpacingMark |
+       1 << (int)UnicodeCategory.DecimalDigitNumber |
+       1 << (int)UnicodeCategory.ConnectorPunctuation;
+   
+   /// <summary>Gets a bitmap for whether each character 0 through 127 is in [\w]</summary>
+   private static ReadOnlySpan<byte> WordCharBitmap => new byte[]
      {
          0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xFF, 0x03,
          0xFE, 0xFF, 0xFF, 0x87, 0xFE, 0xFF, 0xFF, 0x07
      };
  
-       // If the char is ASCII, look it up in the bitmap. Otherwise, query its Unicode category.
-       int chDiv8 = ch >> 3;
-       return (uint)chDiv8 < (uint)ascii.Length ?
-           (ascii[chDiv8] & (1 << (ch & 0x7))) != 0 :
-           (WordCategoriesMask & (1 << (int)CharUnicodeInfo.GetUnicodeCategory(ch))) != 0;
-   }
  
  /// <summary>Supports searching for characters in or not in "ABCEGHJKLMNPRSTVXY[\\]^_`abceghjklmnprstvxyK".</summary>
  internal static readonly SearchValues<char> s_nonAscii_0DD9414ACADF36B5FCB9FD5EDD16B6170F356585861BFF97C0F99F5B6EB09472 = SearchValues.Create("ABCEGHJKLMNPRSTVXY[\\]^_`abceghjklmnprstvxyK");
```

</details>
<details>
<summary>&quot;^\\w+([_.-]\\w+)*$&quot; (5006 uses)</summary>

```c#
[GeneratedRegex("^\\w+([_.-]\\w+)*$", RegexOptions.IgnoreCase | RegexOptions.ExplicitCapture)]
```

```diff
         [MethodImpl(MethodImplOptions.AggressiveInlining)]
         internal static bool IsWordChar(char ch)
         {
-            // Mask of Unicode categories that combine to form [\w]
-            const int WordCategoriesMask =
-                1 << (int)UnicodeCategory.UppercaseLetter |
-                1 << (int)UnicodeCategory.LowercaseLetter |
-                1 << (int)UnicodeCategory.TitlecaseLetter |
-                1 << (int)UnicodeCategory.ModifierLetter |
-                1 << (int)UnicodeCategory.OtherLetter |
-                1 << (int)UnicodeCategory.NonSpacingMark |
-                1 << (int)UnicodeCategory.DecimalDigitNumber |
-                1 << (int)UnicodeCategory.ConnectorPunctuation;
-        
-            // Bitmap for whether each character 0 through 127 is in [\w]
-            ReadOnlySpan<byte> ascii = new byte[]
-            {
-                0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xFF, 0x03,
-                0xFE, 0xFF, 0xFF, 0x87, 0xFE, 0xFF, 0xFF, 0x07
-            };
-        
             // If the char is ASCII, look it up in the bitmap. Otherwise, query its Unicode category.
+            ReadOnlySpan<byte> ascii = WordCharBitmap;
             int chDiv8 = ch >> 3;
             return (uint)chDiv8 < (uint)ascii.Length ?
                 (ascii[chDiv8] & (1 << (ch & 0x7))) != 0 :
                 StackPush(ref stack, ref pos, arg0, arg1);
             }
         }
+        
+        /// <summary>Provides a mask of Unicode categories that combine to form [\w].</summary>
+        private const int WordCategoriesMask =
+            1 << (int)UnicodeCategory.UppercaseLetter |
+            1 << (int)UnicodeCategory.LowercaseLetter |
+            1 << (int)UnicodeCategory.TitlecaseLetter |
+            1 << (int)UnicodeCategory.ModifierLetter |
+            1 << (int)UnicodeCategory.OtherLetter |
+            1 << (int)UnicodeCategory.NonSpacingMark |
+            1 << (int)UnicodeCategory.DecimalDigitNumber |
+            1 << (int)UnicodeCategory.ConnectorPunctuation;
+        
+        /// <summary>Gets a bitmap for whether each character 0 through 127 is in [\w]</summary>
+        private static ReadOnlySpan<byte> WordCharBitmap => new byte[]
+            {
+                0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xFF, 0x03,
+                0xFE, 0xFF, 0xFF, 0x87, 0xFE, 0xFF, 0xFF, 0x07
+            };
+        
     }
 }
```

</details>
<details>
<summary>&quot;^(\\w*)=(.*?)&quot; (3778 uses)</summary>

```c#
[GeneratedRegex("^(\\w*)=(.*?)")]
```

```diff
         [MethodImpl(MethodImplOptions.AggressiveInlining)]
         internal static bool IsWordChar(char ch)
         {
-            // Mask of Unicode categories that combine to form [\w]
-            const int WordCategoriesMask =
-                1 << (int)UnicodeCategory.UppercaseLetter |
-                1 << (int)UnicodeCategory.LowercaseLetter |
-                1 << (int)UnicodeCategory.TitlecaseLetter |
-                1 << (int)UnicodeCategory.ModifierLetter |
-                1 << (int)UnicodeCategory.OtherLetter |
-                1 << (int)UnicodeCategory.NonSpacingMark |
-                1 << (int)UnicodeCategory.DecimalDigitNumber |
-                1 << (int)UnicodeCategory.ConnectorPunctuation;
-        
-            // Bitmap for whether each character 0 through 127 is in [\w]
-            ReadOnlySpan<byte> ascii = new byte[]
-            {
-                0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xFF, 0x03,
-                0xFE, 0xFF, 0xFF, 0x87, 0xFE, 0xFF, 0xFF, 0x07
-            };
-        
             // If the char is ASCII, look it up in the bitmap. Otherwise, query its Unicode category.
+            ReadOnlySpan<byte> ascii = WordCharBitmap;
             int chDiv8 = ch >> 3;
             return (uint)chDiv8 < (uint)ascii.Length ?
                 (ascii[chDiv8] & (1 << (ch & 0x7))) != 0 :
                 (WordCategoriesMask & (1 << (int)CharUnicodeInfo.GetUnicodeCategory(ch))) != 0;
         }
+        
+        /// <summary>Provides a mask of Unicode categories that combine to form [\w].</summary>
+        private const int WordCategoriesMask =
+            1 << (int)UnicodeCategory.UppercaseLetter |
+            1 << (int)UnicodeCategory.LowercaseLetter |
+            1 << (int)UnicodeCategory.TitlecaseLetter |
+            1 << (int)UnicodeCategory.ModifierLetter |
+            1 << (int)UnicodeCategory.OtherLetter |
+            1 << (int)UnicodeCategory.NonSpacingMark |
+            1 << (int)UnicodeCategory.DecimalDigitNumber |
+            1 << (int)UnicodeCategory.ConnectorPunctuation;
+        
+        /// <summary>Gets a bitmap for whether each character 0 through 127 is in [\w]</summary>
+        private static ReadOnlySpan<byte> WordCharBitmap => new byte[]
+            {
+                0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xFF, 0x03,
+                0xFE, 0xFF, 0xFF, 0x87, 0xFE, 0xFF, 0xFF, 0x07
+            };
+        
     }
 }
```

</details>
<details>
<summary>&quot;^(\\w+\\.)+\\w+$&quot; (2468 uses)</summary>

```c#
[GeneratedRegex("^(\\w+\\.)+\\w+$")]
```

```diff
         [MethodImpl(MethodImplOptions.AggressiveInlining)]
         internal static bool IsWordChar(char ch)
         {
-            // Mask of Unicode categories that combine to form [\w]
-            const int WordCategoriesMask =
-                1 << (int)UnicodeCategory.UppercaseLetter |
-                1 << (int)UnicodeCategory.LowercaseLetter |
-                1 << (int)UnicodeCategory.TitlecaseLetter |
-                1 << (int)UnicodeCategory.ModifierLetter |
-                1 << (int)UnicodeCategory.OtherLetter |
-                1 << (int)UnicodeCategory.NonSpacingMark |
-                1 << (int)UnicodeCategory.DecimalDigitNumber |
-                1 << (int)UnicodeCategory.ConnectorPunctuation;
-        
-            // Bitmap for whether each character 0 through 127 is in [\w]
-            ReadOnlySpan<byte> ascii = new byte[]
-            {
-                0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xFF, 0x03,
-                0xFE, 0xFF, 0xFF, 0x87, 0xFE, 0xFF, 0xFF, 0x07
-            };
-        
             // If the char is ASCII, look it up in the bitmap. Otherwise, query its Unicode category.
+            ReadOnlySpan<byte> ascii = WordCharBitmap;
             int chDiv8 = ch >> 3;
             return (uint)chDiv8 < (uint)ascii.Length ?
                 (ascii[chDiv8] & (1 << (ch & 0x7))) != 0 :
                 StackPush(ref stack, ref pos, arg0, arg1);
             }
         }
+        
+        /// <summary>Provides a mask of Unicode categories that combine to form [\w].</summary>
+        private const int WordCategoriesMask =
+            1 << (int)UnicodeCategory.UppercaseLetter |
+            1 << (int)UnicodeCategory.LowercaseLetter |
+            1 << (int)UnicodeCategory.TitlecaseLetter |
+            1 << (int)UnicodeCategory.ModifierLetter |
+            1 << (int)UnicodeCategory.OtherLetter |
+            1 << (int)UnicodeCategory.NonSpacingMark |
+            1 << (int)UnicodeCategory.DecimalDigitNumber |
+            1 << (int)UnicodeCategory.ConnectorPunctuation;
+        
+        /// <summary>Gets a bitmap for whether each character 0 through 127 is in [\w]</summary>
+        private static ReadOnlySpan<byte> WordCharBitmap => new byte[]
+            {
+                0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xFF, 0x03,
+                0xFE, 0xFF, 0xFF, 0x87, 0xFE, 0xFF, 0xFF, 0x07
+            };
+        
     }
 }
```

</details>
<details>
<summary>&quot;{(?&lt;env&gt;env:)??\\w+(\\s+(\\?\\?)??\\s+\\w+)??}&quot; (2282 uses)</summary>

```c#
[GeneratedRegex("{(?<env>env:)??\\w+(\\s+(\\?\\?)??\\s+\\w+)??}")]
```

```diff
         [MethodImpl(MethodImplOptions.AggressiveInlining)]
         internal static bool IsWordChar(char ch)
         {
-            // Mask of Unicode categories that combine to form [\w]
-            const int WordCategoriesMask =
-                1 << (int)UnicodeCategory.UppercaseLetter |
-                1 << (int)UnicodeCategory.LowercaseLetter |
-                1 << (int)UnicodeCategory.TitlecaseLetter |
-                1 << (int)UnicodeCategory.ModifierLetter |
-                1 << (int)UnicodeCategory.OtherLetter |
-                1 << (int)UnicodeCategory.NonSpacingMark |
-                1 << (int)UnicodeCategory.DecimalDigitNumber |
-                1 << (int)UnicodeCategory.ConnectorPunctuation;
-        
-            // Bitmap for whether each character 0 through 127 is in [\w]
-            ReadOnlySpan<byte> ascii = new byte[]
-            {
-                0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xFF, 0x03,
-                0xFE, 0xFF, 0xFF, 0x87, 0xFE, 0xFF, 0xFF, 0x07
-            };
-        
             // If the char is ASCII, look it up in the bitmap. Otherwise, query its Unicode category.
+            ReadOnlySpan<byte> ascii = WordCharBitmap;
             int chDiv8 = ch >> 3;
             return (uint)chDiv8 < (uint)ascii.Length ?
                 (ascii[chDiv8] & (1 << (ch & 0x7))) != 0 :
                 StackPush(ref stack, ref pos, arg0, arg1, arg2);
             }
         }
+        
+        /// <summary>Provides a mask of Unicode categories that combine to form [\w].</summary>
+        private const int WordCategoriesMask =
+            1 << (int)UnicodeCategory.UppercaseLetter |
+            1 << (int)UnicodeCategory.LowercaseLetter |
+            1 << (int)UnicodeCategory.TitlecaseLetter |
+            1 << (int)UnicodeCategory.ModifierLetter |
+            1 << (int)UnicodeCategory.OtherLetter |
+            1 << (int)UnicodeCategory.NonSpacingMark |
+            1 << (int)UnicodeCategory.DecimalDigitNumber |
+            1 << (int)UnicodeCategory.ConnectorPunctuation;
+        
+        /// <summary>Gets a bitmap for whether each character 0 through 127 is in [\w]</summary>
+        private static ReadOnlySpan<byte> WordCharBitmap => new byte[]
+            {
+                0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xFF, 0x03,
+                0xFE, 0xFF, 0xFF, 0x87, 0xFE, 0xFF, 0xFF, 0x07
+            };
+        
     }
 }
```

</details>
<details>
<summary>&quot;, Version=\\d+.\\d+.\\d+.\\d+, Culture=\\w+, ...&quot; (2239 uses)</summary>

```c#
[GeneratedRegex(", Version=\\d+.\\d+.\\d+.\\d+, Culture=\\w+, PublicKeyToken=\\w+")]
```

```diff
      [MethodImpl(MethodImplOptions.AggressiveInlining)]
      internal static bool IsWordChar(char ch)
      {
-           // Mask of Unicode categories that combine to form [\w]
-           const int WordCategoriesMask =
-               1 << (int)UnicodeCategory.UppercaseLetter |
-               1 << (int)UnicodeCategory.LowercaseLetter |
-               1 << (int)UnicodeCategory.TitlecaseLetter |
-               1 << (int)UnicodeCategory.ModifierLetter |
-               1 << (int)UnicodeCategory.OtherLetter |
-               1 << (int)UnicodeCategory.NonSpacingMark |
-               1 << (int)UnicodeCategory.DecimalDigitNumber |
-               1 << (int)UnicodeCategory.ConnectorPunctuation;
-       
-           // Bitmap for whether each character 0 through 127 is in [\w]
-           ReadOnlySpan<byte> ascii = new byte[]
-           {
-               0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xFF, 0x03,
-               0xFE, 0xFF, 0xFF, 0x87, 0xFE, 0xFF, 0xFF, 0x07
-           };
-       
          // If the char is ASCII, look it up in the bitmap. Otherwise, query its Unicode category.
+           ReadOnlySpan<byte> ascii = WordCharBitmap;
          int chDiv8 = ch >> 3;
          return (uint)chDiv8 < (uint)ascii.Length ?
              (ascii[chDiv8] & (1 << (ch & 0x7))) != 0 :
              (WordCategoriesMask & (1 << (int)CharUnicodeInfo.GetUnicodeCategory(ch))) != 0;
      }
      
+       /// <summary>Provides a mask of Unicode categories that combine to form [\w].</summary>
+       private const int WordCategoriesMask =
+           1 << (int)UnicodeCategory.UppercaseLetter |
+           1 << (int)UnicodeCategory.LowercaseLetter |
+           1 << (int)UnicodeCategory.TitlecaseLetter |
+           1 << (int)UnicodeCategory.ModifierLetter |
+           1 << (int)UnicodeCategory.OtherLetter |
+           1 << (int)UnicodeCategory.NonSpacingMark |
+           1 << (int)UnicodeCategory.DecimalDigitNumber |
+           1 << (int)UnicodeCategory.ConnectorPunctuation;
+       
+       /// <summary>Gets a bitmap for whether each character 0 through 127 is in [\w]</summary>
+       private static ReadOnlySpan<byte> WordCharBitmap => new byte[]
+           {
+               0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xFF, 0x03,
+               0xFE, 0xFF, 0xFF, 0x87, 0xFE, 0xFF, 0xFF, 0x07
+           };
+       
+       
      /// <summary>Supports searching for the string ", Version=".</summary>
      internal static readonly SearchValues<string> s_indexOfString_F484FBA9DDF61CC32D17E4ED223128BF4D7C62347668A9B369CE2C1E6BBB3513 = SearchValues.Create([", Version="], StringComparison.Ordinal);
  }
```

</details>
<details>
<summary>&quot;^-+ *BEGIN (?&lt;keyName&gt;\\w+( \\w+)*) PRIVATE  ...&quot; (1964 uses)</summary>

```c#
[GeneratedRegex("^-+ *BEGIN (?<keyName>\\w+( \\w+)*) PRIVATE KEY *-+\\r?\\n(Proc-Type: 4,ENCRYPTED\\r?\\nDEK-Info: (?<cipherName>[A-Z0-9-]+),(?<salt>[A-F0-9]+)\\r?\\n\\r?\\n)?(?<data>([a-zA-Z0-9/+=]{1,80}\\r?\\n)+)-+ *END \\k<keyName> PRIVATE KEY *-+", RegexOptions.Multiline)]
```

```diff
  [MethodImpl(MethodImplOptions.AggressiveInlining)]
  internal static bool IsWordChar(char ch)
  {
-       // Mask of Unicode categories that combine to form [\w]
-       const int WordCategoriesMask =
-           1 << (int)UnicodeCategory.UppercaseLetter |
-           1 << (int)UnicodeCategory.LowercaseLetter |
-           1 << (int)UnicodeCategory.TitlecaseLetter |
-           1 << (int)UnicodeCategory.ModifierLetter |
-           1 << (int)UnicodeCategory.OtherLetter |
-           1 << (int)UnicodeCategory.NonSpacingMark |
-           1 << (int)UnicodeCategory.DecimalDigitNumber |
-           1 << (int)UnicodeCategory.ConnectorPunctuation;
-   
-       // Bitmap for whether each character 0 through 127 is in [\w]
-       ReadOnlySpan<byte> ascii = new byte[]
-       {
-           0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xFF, 0x03,
-           0xFE, 0xFF, 0xFF, 0x87, 0xFE, 0xFF, 0xFF, 0x07
-       };
-   
      // If the char is ASCII, look it up in the bitmap. Otherwise, query its Unicode category.
+       ReadOnlySpan<byte> ascii = WordCharBitmap;
      int chDiv8 = ch >> 3;
      return (uint)chDiv8 < (uint)ascii.Length ?
          (ascii[chDiv8] & (1 << (ch & 0x7))) != 0 :
      }
  }
  
+   /// <summary>Provides a mask of Unicode categories that combine to form [\w].</summary>
+   private const int WordCategoriesMask =
+       1 << (int)UnicodeCategory.UppercaseLetter |
+       1 << (int)UnicodeCategory.LowercaseLetter |
+       1 << (int)UnicodeCategory.TitlecaseLetter |
+       1 << (int)UnicodeCategory.ModifierLetter |
+       1 << (int)UnicodeCategory.OtherLetter |
+       1 << (int)UnicodeCategory.NonSpacingMark |
+       1 << (int)UnicodeCategory.DecimalDigitNumber |
+       1 << (int)UnicodeCategory.ConnectorPunctuation;
+   
+   /// <summary>Gets a bitmap for whether each character 0 through 127 is in [\w]</summary>
+   private static ReadOnlySpan<byte> WordCharBitmap => new byte[]
+       {
+           0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xFF, 0x03,
+           0xFE, 0xFF, 0xFF, 0x87, 0xFE, 0xFF, 0xFF, 0x07
+       };
+   
+   
  /// <summary>Supports searching for characters in or not in "0123456789ABCDEF".</summary>
  internal static readonly SearchValues<char> s_asciiHexDigitsUpper = SearchValues.Create("0123456789ABCDEF");
```

</details>
<details>
<summary>&quot;&amp;(?!#?\\w+;)&quot; (1880 uses)</summary>

```c#
[GeneratedRegex("&(?!#?\\w+;)")]
```

```diff
         [MethodImpl(MethodImplOptions.AggressiveInlining)]
         internal static bool IsWordChar(char ch)
         {
-            // Mask of Unicode categories that combine to form [\w]
-            const int WordCategoriesMask =
-                1 << (int)UnicodeCategory.UppercaseLetter |
-                1 << (int)UnicodeCategory.LowercaseLetter |
-                1 << (int)UnicodeCategory.TitlecaseLetter |
-                1 << (int)UnicodeCategory.ModifierLetter |
-                1 << (int)UnicodeCategory.OtherLetter |
-                1 << (int)UnicodeCategory.NonSpacingMark |
-                1 << (int)UnicodeCategory.DecimalDigitNumber |
-                1 << (int)UnicodeCategory.ConnectorPunctuation;
-        
-            // Bitmap for whether each character 0 through 127 is in [\w]
-            ReadOnlySpan<byte> ascii = new byte[]
-            {
-                0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xFF, 0x03,
-                0xFE, 0xFF, 0xFF, 0x87, 0xFE, 0xFF, 0xFF, 0x07
-            };
-        
             // If the char is ASCII, look it up in the bitmap. Otherwise, query its Unicode category.
+            ReadOnlySpan<byte> ascii = WordCharBitmap;
             int chDiv8 = ch >> 3;
             return (uint)chDiv8 < (uint)ascii.Length ?
                 (ascii[chDiv8] & (1 << (ch & 0x7))) != 0 :
                 (WordCategoriesMask & (1 << (int)CharUnicodeInfo.GetUnicodeCategory(ch))) != 0;
         }
+        
+        /// <summary>Provides a mask of Unicode categories that combine to form [\w].</summary>
+        private const int WordCategoriesMask =
+            1 << (int)UnicodeCategory.UppercaseLetter |
+            1 << (int)UnicodeCategory.LowercaseLetter |
+            1 << (int)UnicodeCategory.TitlecaseLetter |
+            1 << (int)UnicodeCategory.ModifierLetter |
+            1 << (int)UnicodeCategory.OtherLetter |
+            1 << (int)UnicodeCategory.NonSpacingMark |
+            1 << (int)UnicodeCategory.DecimalDigitNumber |
+            1 << (int)UnicodeCategory.ConnectorPunctuation;
+        
+        /// <summary>Gets a bitmap for whether each character 0 through 127 is in [\w]</summary>
+        private static ReadOnlySpan<byte> WordCharBitmap => new byte[]
+            {
+                0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xFF, 0x03,
+                0xFE, 0xFF, 0xFF, 0x87, 0xFE, 0xFF, 0xFF, 0x07
+            };
+        
     }
 }
```

</details>
<details>
<summary>&quot;\\A\\s*(?&lt;name&gt;\\w+)(\\s*\\((?&lt;arguments&gt;.*) ...&quot; (1751 uses)</summary>

```c#
[GeneratedRegex("\\A\\s*(?<name>\\w+)(\\s*\\((?<arguments>.*)\\))?\\s*\\Z", RegexOptions.Singleline)]
```

```diff
         [MethodImpl(MethodImplOptions.AggressiveInlining)]
         internal static bool IsWordChar(char ch)
         {
-            // Mask of Unicode categories that combine to form [\w]
-            const int WordCategoriesMask =
-                1 << (int)UnicodeCategory.UppercaseLetter |
-                1 << (int)UnicodeCategory.LowercaseLetter |
-                1 << (int)UnicodeCategory.TitlecaseLetter |
-                1 << (int)UnicodeCategory.ModifierLetter |
-                1 << (int)UnicodeCategory.OtherLetter |
-                1 << (int)UnicodeCategory.NonSpacingMark |
-                1 << (int)UnicodeCategory.DecimalDigitNumber |
-                1 << (int)UnicodeCategory.ConnectorPunctuation;
-        
-            // Bitmap for whether each character 0 through 127 is in [\w]
-            ReadOnlySpan<byte> ascii = new byte[]
-            {
-                0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xFF, 0x03,
-                0xFE, 0xFF, 0xFF, 0x87, 0xFE, 0xFF, 0xFF, 0x07
-            };
-        
             // If the char is ASCII, look it up in the bitmap. Otherwise, query its Unicode category.
+            ReadOnlySpan<byte> ascii = WordCharBitmap;
             int chDiv8 = ch >> 3;
             return (uint)chDiv8 < (uint)ascii.Length ?
                 (ascii[chDiv8] & (1 << (ch & 0x7))) != 0 :
                 StackPush(ref stack, ref pos, arg0, arg1, arg2);
             }
         }
+        
+        /// <summary>Provides a mask of Unicode categories that combine to form [\w].</summary>
+        private const int WordCategoriesMask =
+            1 << (int)UnicodeCategory.UppercaseLetter |
+            1 << (int)UnicodeCategory.LowercaseLetter |
+            1 << (int)UnicodeCategory.TitlecaseLetter |
+            1 << (int)UnicodeCategory.ModifierLetter |
+            1 << (int)UnicodeCategory.OtherLetter |
+            1 << (int)UnicodeCategory.NonSpacingMark |
+            1 << (int)UnicodeCategory.DecimalDigitNumber |
+            1 << (int)UnicodeCategory.ConnectorPunctuation;
+        
+        /// <summary>Gets a bitmap for whether each character 0 through 127 is in [\w]</summary>
+        private static ReadOnlySpan<byte> WordCharBitmap => new byte[]
+            {
+                0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xFF, 0x03,
+                0xFE, 0xFF, 0xFF, 0x87, 0xFE, 0xFF, 0xFF, 0x07
+            };
+        
     }
 }
```

</details>


For more diff examples, see https://gist.github.com/MihuBot/3dc0c347ab5ededb4c479718266d90f0

</details>


<details>
<summary>JIT assembly changes</summary>


```
Total bytes of base: 54138884
Total bytes of diff: 53799262
Total bytes of delta: -339622 (-0.63 % of base)
Total relative delta: -96.31
    diff is an improvement.
    relative diff is an improvement.
```
For a list of JIT diff regressions, see [Regressions.md](https://gist.github.com/MihuBot/4d78140c75221c91c45c0fbc81f79e03)
For a list of JIT diff improvements, see [Improvements.md](https://gist.github.com/MihuBot/f474837ab3ebef7b52e31332b3aaa0d4)

</details>


<details>
<summary>Sample source code for further analysis</summary>

```c#
// Local cache file for the extracted results; reused on later runs.
const string JsonPath = "RegexResults-1303.json";

// Download and unpack the results archive only when the cached JSON is missing.
if (!File.Exists(JsonPath))
{
    // Own the client with a using declaration so its handler and connections are
    // released once the download finishes instead of lingering until finalization.
    using var httpClient = new HttpClient();
    await using var archiveStream = await httpClient.GetStreamAsync("https://mihubot.xyz/r/E2rQ5ESA");
    using var archive = new ZipArchive(archiveStream, ZipArchiveMode.Read);

    // First() throws if the archive has no "Results.json" entry.
    archive.Entries.First(e => e.Name == "Results.json").ExtractToFile(JsonPath);
}

using FileStream jsonFileStream = File.OpenRead(JsonPath);

// IncludeFields makes the serializer bind public fields as well as properties;
// RegexEntry has tuple-typed members, and value tuples expose their elements as fields.
RegexEntry[] entries = JsonSerializer.Deserialize<RegexEntry[]>(jsonFileStream, new JsonSerializerOptions { IncludeFields = true })!;
Console.WriteLine($"Working with {entries.Length} patterns");



/// <summary>Identifies one regex from the results file: its pattern text, its options, and a count.</summary>
/// <param name="Pattern">The regular expression pattern string.</param>
/// <param name="Options">The <see cref="RegexOptions"/> associated with the pattern.</param>
/// <param name="Count">A count for the pattern; presumably the number of known uses (TODO confirm against the data).</param>
record KnownPattern(string Pattern, RegexOptions Options, int Count);

/// <summary>
/// One element of the deserialized results array: a pattern together with its
/// source text and diffs. Member names must match the JSON being read.
/// </summary>
sealed class RegexEntry
{
    /// <summary>The pattern, options, and count this entry describes.</summary>
    public required KnownPattern Regex { get; set; }

    /// <summary>Source text for the pattern; presumably generated from the main branch (TODO confirm).</summary>
    public required string MainSource { get; set; }

    /// <summary>Source text for the pattern; presumably generated from the PR branch (TODO confirm).</summary>
    public required string PrSource { get; set; }

    /// <summary>Full diff text, or <c>null</c> when none is present.</summary>
    public string? FullDiff { get; set; }

    /// <summary>Shortened diff text, or <c>null</c> when none is present.</summary>
    public string? ShortDiff { get; set; }

    /// <summary>Name/values pairs for character search sets, or <c>null</c> when none is present.</summary>
    public (string Name, string Values)[]? SearchValuesOfChar { get; set; }

    /// <summary>String search sets paired with their comparison type, or <c>null</c> when none is present.</summary>
    public (string[] Values, StringComparison ComparisonType)[]? SearchValuesOfString { get; set; }
}
```

</details>


Artifacts:
- [ShortExampleDiffs.md](https://mihubot.xyz/r/E2rQ2WDA) (27 KB)
- [LongExampleDiffs.md](https://mihubot.xyz/r/E2rQ2WtA) (900 KB)
- [Results.zip](https://mihubot.xyz/r/E2rQ5ESA) (55 MB)
- [jit-diffs.zip](https://mihubot.xyz/r/E2rRmixA) (390 MB)
- [JitAnalyzeSummary.txt](https://mihubot.xyz/r/E2rRobg) (70 KB)
- [JitDiffRegressions.md](https://mihubot.xyz/r/E2rRpwSA) (865 KB)
- [LongJitDiffRegressions.md](https://mihubot.xyz/r/E2rRp8M) (85 MB)
- [JitDiffImprovements.md](https://mihubot.xyz/r/E2rRqQDA) (873 KB)
- [LongJitDiffImprovements.md](https://mihubot.xyz/r/E2rRqSHA) (23 MB)



Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Uh oh!

[RegexDiff X64] [stephentoub] Avoid extra boundary checks when preceded/suc ... #1303

Metadata

Assignees

Labels

Projects

Milestone

Relationships

Development

Uh oh!

[RegexDiff X64] [stephentoub] Avoid extra boundary checks when preceded/suc ... #1303

Description

Metadata

Metadata

Assignees

Labels

Projects

Milestone

Relationships

Development

Issue actions