From 9554e7cc7b796f64a80baa272ed3e49ad03466a3 Mon Sep 17 00:00:00 2001
From: Joseph Liu
Date: Fri, 17 Jan 2025 21:43:36 -0500
Subject: [PATCH] fix(preset/english): add word boundary to 'shit' pattern

The pattern `shit` was matching on names such as "harshit". Fix this
issue by adding a word boundary assertion at the start.

Thanks to @kaushal-aubie for the report.

Closes #93
---
 src/preset/english.ts | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/src/preset/english.ts b/src/preset/english.ts
index 11250e8..066bcac 100644
--- a/src/preset/english.ts
+++ b/src/preset/english.ts
@@ -364,12 +364,11 @@ export const englishDataset = new DataSet<{ originalWord: EnglishProfaneWord }>(
 	.addPhrase((phrase) =>
 		phrase
 			.setMetadata({ originalWord: 'shit' })
-			.addPattern(pattern`shit`)
+			.addPattern(pattern`|shit`)
 			.addWhitelistedTerm('s hit')
 			.addWhitelistedTerm('sh it')
 			.addWhitelistedTerm('shi t')
-			.addWhitelistedTerm('shitake')
-			.addWhitelistedTerm('mishit'),
+			.addWhitelistedTerm('shitake'),
 	)
 	.addPhrase((phrase) => phrase.setMetadata({ originalWord: 'slut' }).addPattern(pattern`s[s]lut`))
 	.addPhrase((phrase) => phrase.setMetadata({ originalWord: 'spastic' }).addPattern(pattern`|spastic`))