Merge pull request #1 from aplazo/feature/improve-rfc-generation

Aleph06 · web-flow · commit efe85acc3130 · 2024-05-22T09:51:15.000-06:00
feat: enhance RFC code generation to support special characters
diff --git a/build.gradle b/build.gradle
@@ -1,16 +1,17 @@
 apply plugin: 'java'
 apply plugin: 'me.tatarka.retrolambda'
+apply plugin: 'maven-publish'
 
 sourceCompatibility = 1.8
-version = '2.0.3-SNAPSHOT'
+version = '2.1.0'
 
 buildscript {
     repositories {
         mavenCentral()
     }
 
     dependencies {
-        classpath 'me.tatarka:gradle-retrolambda:3.2.4'
+        classpath 'me.tatarka:gradle-retrolambda:3.7.1'
     }
 }
 
@@ -23,11 +24,46 @@ dependencies {
     compile 'org.apache.commons:commons-lang3:3.0'
     compile 'net.sourceforge.streamsupport:streamsupport:1.4.1'
 
-    testCompile 'junit:junit:4.12'
+    testCompile 'junit:junit:4.13.1'
     testCompile 'org.hamcrest:hamcrest-core:1.3'
     testCompile 'org.hamcrest:hamcrest-library:1.3'
 }
 
+publishing {
+    publications {
+        maven(MavenPublication) {
+            groupId = 'com.josketres'
+            artifactId = 'rfcfacil'
+            version = project.version // reuse the top-level `version` instead of repeating the literal
+            from components.java
+
+            pom {
+                name = 'rfcfacil'
+                description = 'Libreria para calcular el Registro Federal de Contribuyentes en México (RFC) en Java.'
+            }
+        }
+    }
+    repositories {
+        maven {
+            credentials { // never commit credentials: pass -PnexusUsername/-PnexusPassword or export NEXUS_USERNAME/NEXUS_PASSWORD
+                username = findProperty('nexusUsername') ?: System.getenv('NEXUS_USERNAME')
+                password = findProperty('nexusPassword') ?: System.getenv('NEXUS_PASSWORD')
+            }
+            url = "https://nexus.aplazo.dev/repository/maven-releases"
+        }
+    }
+}
+
+tasks.register('sourcesJar', Jar) {
+    dependsOn classes
+    classifier = 'sources'
+    from sourceSets.main.allSource
+}
+
+artifacts {
+    archives sourcesJar
+}
+
 // http://zserge.com/blog/gradle-maven-publish.html
 //  export JAVA6_HOME=/System/Library/Frameworks/JavaVM.framework/Versions/1.6/Home/
 // ./gradlew uploadArchives
diff --git a/src/main/java/com/josketres/rfcfacil/HomoclaveCalculator.java b/src/main/java/com/josketres/rfcfacil/HomoclaveCalculator.java
@@ -5,13 +5,15 @@
 import java.util.HashMap;
 import java.util.Map;
 
+import static java.lang.String.valueOf;
+
 /**
  * Calculates a two-digits code known as "homoclave".
  */
 class HomoclaveCalculator {
 
     private static final String HOMOCLAVE_DIGITS = "123456789ABCDEFGHIJKLMNPQRSTUVWXYZ";
-    private static final Map<String, String> FULL_NAME_MAPPING = new HashMap<String, String>();
+    private static final Map<String, String> FULL_NAME_MAPPING = new HashMap<>();
 
     static {
         FULL_NAME_MAPPING.put(" ", "00");
@@ -68,26 +70,22 @@ public HomoclaveCalculator(HomoclavePerson person) {
     }
 
     public String calculate() {
-
         normalizeFullName();
         mapFullNameToDigitsCode();
         sumPairsOfDigits();
         buildHomoclave();
-
         return homoclave;
     }
 
     private void buildHomoclave() {
-
         int lastThreeDigits = pairsOfDigitsSum % 1000;
         int quo = lastThreeDigits / 34;
         int reminder = lastThreeDigits % 34;
         homoclave = String.valueOf(HOMOCLAVE_DIGITS.charAt(quo))
-                + String.valueOf(HOMOCLAVE_DIGITS.charAt(reminder));
+                + HOMOCLAVE_DIGITS.charAt(reminder);
     }
 
     private void sumPairsOfDigits() {
-
         pairsOfDigitsSum = 0;
         for (int i = 0; i < mappedFullName.length() - 1; i++) {
             int intNum1 = Integer.parseInt(mappedFullName.substring(i, i + 2));
@@ -97,15 +95,14 @@ private void sumPairsOfDigits() {
     }
 
     private void mapFullNameToDigitsCode() {
-
-        mappedFullName = "0";
+        StringBuilder mappedFullNameBuilder = new StringBuilder("0");
         for (int i = 0; i < fullName.length(); i++) {
-            mappedFullName += mapCharacterToTwoDigitCode(String.valueOf(fullName.charAt(i)));
+            mappedFullNameBuilder.append(mapCharacterToTwoDigitCode(valueOf(fullName.charAt(i))));
         }
+        mappedFullName = mappedFullNameBuilder.toString();
     }
 
     private String mapCharacterToTwoDigitCode(String c) {
-
         if (!FULL_NAME_MAPPING.containsKey(c)) {
             throw new IllegalArgumentException("No two-digit-code mapping for char: " + c);
         } else {
@@ -114,27 +111,18 @@ private String mapCharacterToTwoDigitCode(String c) {
     }
 
     private void normalizeFullName() {
-
         String rawFullName = person.getFullNameForHomoclave().toUpperCase();
-
-        fullName = StringUtils.stripAccents(rawFullName);
-        fullName = fullName.replaceAll("[\\-\\.',]", ""); // remove .'-,
-        fullName = addMissingCharToFullName(rawFullName, 'Ñ');
-
+        fullName = stripAccentsExcludingNTilde(rawFullName);
+        fullName = fullName.replaceAll("[^A-Z0-9&Ñ ]", "");
     }
 
-    private String addMissingCharToFullName(String rawFullName, char missingChar) {
+    private String stripAccentsExcludingNTilde(String input) {
+        if (StringUtils.isEmpty(input)) // null or "" is returned untouched
+            return input;
 
-        int index = rawFullName.indexOf(missingChar);
-        if (index == -1) {
-            return fullName;
-        }
-
-        StringBuilder newFullName = new StringBuilder(fullName);
-        while (index >= 0) {
-            newFullName.setCharAt(index, missingChar);
-            index = rawFullName.indexOf(missingChar, index + 1);
-        }
-        return newFullName.toString();
+        input = input.toUpperCase().replace("$", ""); // drop any literal '$' first: it is used as the Ñ placeholder below
+        input = input.replace("Ñ", "$"); // shield Ñ so that stripAccents does not flatten it to N
+        input = StringUtils.stripAccents(input);
+        return input.replace("$", "Ñ"); // restore the shielded Ñ
     }
 }
diff --git a/src/main/java/com/josketres/rfcfacil/NaturalPersonTenDigitsCodeCalculator.java b/src/main/java/com/josketres/rfcfacil/NaturalPersonTenDigitsCodeCalculator.java
@@ -16,23 +16,21 @@ class NaturalPersonTenDigitsCodeCalculator {
     private final NaturalPerson person;
 
     private static final String[] SPECIAL_PARTICLES =
-            {"DE", "LA", "LAS", "MC", "VON", "DEL", "LOS", "Y", "MAC", "VAN", "MI"};
-
-    private static final String[] FORBIDDEN_WORDS = { "BUEI", "BUEY", "CACA", "CACO", "CAGA", "CAGO", "CAKA", "CAKO", "COGE", "COJA", "COJE", "COJI", "COJO", "CULO", "FETO", "GUEY", "JOTO", "KACA", "KACO", "KAGA", "KAGO", "KOGE", "KOJO", "KAKA", "KULO", "MAME", "MAMO", "MEAR", "MEAS", "MEON", "MION", "MOCO", "MULA", "PEDA", "PEDO", "PENE", "PUTA", "PUTO", "QULO", "RATA", "RUIN" };
+            {"DAS", "DA", "DEL", "DER", "DE", "DIE", "DI", "DD", "EL", "LES", "LA", "LOS", "LAS", "LE", "MAC", "MC", "VAN", "VON", "Y"}; // each entry listed once
 
+    private static final String[] FORBIDDEN_WORDS = {"BACA", "BAKA", "BUEI", "BUEY", "CACA", "CACO", "CAGA", "CAGO", "CAKA", "CAKO", "COGE", "COGI", "COJA", "COJE", "COJI", "COJO", "COLA", "CULO", "FALO", "FETO", "GETA", "GUEI", "GUEY", "JETA", "JOTO", "KACA", "KACO", "KAGA", "KAGO", "KAKA", "KAKO", "KOGE", "KOGI", "KOJA", "KOJE", "KOJI", "KOJO", "KOLA", "KULO", "LILO", "LOCA", "LOCO", "LOKA", "LOKO", "MAME", "MAMO", "MEAR", "MEAS", "MEON", "MIAR", "MION", "MOCO", "MOKO", "MULA", "MULO", "NACA", "NACO", "PEDA", "PEDO", "PENE", "PIPI", "PITO", "POPO", "PUTA", "PUTO", "QULO", "RATA", "ROBA", "ROBE", "ROBO", "RUIN", "SENO", "TETA", "VACA", "VAGA", "VAGO", "VAKA", "VUEI", "VUEY", "WUEI", "WUEY"};
 
     NaturalPersonTenDigitsCodeCalculator(NaturalPerson person) {
-
         this.person = person;
     }
 
     public String calculate() {
-
-        return obfuscateForbiddenWords(nameCode()) + birthdayCode();
+        String rawNameCode = nameCode(); // four-character name part, may still contain Ñ
+        String accentFreeNameCode = StringUtils.stripAccents(rawNameCode); // strip remaining diacritics before the forbidden-word check
+        return obfuscateForbiddenWords(accentFreeNameCode) + birthdayCode();
     }
 
     private String obfuscateForbiddenWords(String nameCode) {
-
         for (String forbidden : FORBIDDEN_WORDS) {
             if (forbidden.equals(nameCode)) {
                 return nameCode.substring(0, 3) + "X";
@@ -42,7 +40,6 @@ private String obfuscateForbiddenWords(String nameCode) {
     }
 
     private String nameCode() {
-
         if (isFirstLastNameEmpty()) {
             return firstLastNameEmptyForm();
         } else if (isSecondLastNameEmpty()) {
@@ -55,114 +52,108 @@ private String nameCode() {
     }
 
     private String secondLastNameEmptyForm() {
-
         return firstTwoLettersOf(person.firstLastName)
                 + firstTwoLettersOf(filterName(person.name));
     }
 
     private String birthdayCode() {
-
         return lastTwoDigitsOf(person.year)
                 + formattedInTwoDigits(person.month)
                 + formattedInTwoDigits(person.day);
     }
 
     private boolean isSecondLastNameEmpty() {
-
         return StringUtils.isEmpty(normalize(person.secondLastName));
     }
 
     private String firstLastNameEmptyForm() {
-
         return firstTwoLettersOf(person.secondLastName)
                 + firstTwoLettersOf(filterName(person.name));
     }
 
     private boolean isFirstLastNameEmpty() {
-
         return StringUtils.isEmpty(normalize(person.firstLastName));
     }
 
     private String firstLastNameTooShortForm() {
-
         return firstLetterOf(person.firstLastName)
                 + firstLetterOf(person.secondLastName)
                 + firstTwoLettersOf(filterName(person.name));
     }
 
     private String firstTwoLettersOf(String word) {
-
-        String normalizedWord = normalize(word);
-        return normalizedWord.substring(0, 2);
+        String normalizedWord = normalize(word).replace(" ", "");
+        return normalizedWord.length() > 1 ? normalizedWord.substring(0, 2) : normalizedWord.concat("X");
     }
 
     private boolean isFirstLastNameIsTooShort() {
-
         return normalize(person.firstLastName).length() <= 2;
     }
 
     private String normalForm() {
-
         return firstLetterOf(person.firstLastName)
                 + firstVowelExcludingFirstCharacterOf(person.firstLastName)
                 + firstLetterOf(person.secondLastName)
                 + firstLetterOf(filterName(person.name));
     }
 
     private String filterName(String name) {
-
-        return normalize(name)
-                .trim()
-                .replaceFirst("^(MA|MA.|MARIA|JOSE)\\s+", "");
+        return normalize(name).trim()
+                .replaceFirst("^(MARIA|MA\\.|MA|M\\.|M|JOSE|J|J\\.|DA|DAS|DE|DEL|DER|DI|DIE|DD|EL|LA|LAS|LOS|LE|LES|MAC|MC|VAN|VON|Y)\\s+", "");
     }
 
     private String formattedInTwoDigits(int number) {
-
         return String.format(Locale.getDefault(), "%02d", number);
     }
 
     private String lastTwoDigitsOf(int number) {
-
         return formattedInTwoDigits(number % 100);
     }
 
     private String firstLetterOf(String word) {
-
         String normalizedWord = normalize(word);
         return String.valueOf(normalizedWord.charAt(0));
     }
 
     private String normalize(String word) {
-
-        if (StringUtils.isEmpty(word)) {
+        if (StringUtils.isEmpty(word))
             return word;
-        } else {
-            String normalizedWord = StringUtils.stripAccents(word).toUpperCase();
-            return removeSpecialParticles(normalizedWord, SPECIAL_PARTICLES);
+
+        String cleanedWord = word.replaceAll("[\\-.',´`’\\\\/]", "");
+        if (StringUtils.isEmpty(cleanedWord)) {
+            return cleanedWord;
         }
-    }
 
-    private String removeSpecialParticles(String word, String[] specialParticles) {
+        String normalizedWord = stripAccentsExcludingNTilde(cleanedWord);
 
-        StringBuilder newWord = new StringBuilder(word);
-        for (String particle : specialParticles) {
-            String[] particlePositions = {particle + " ", " " + particle};
-            for (String p : particlePositions)
-                while (newWord.toString().contains(p)) {
-                    int i = newWord.toString().indexOf(p);
-                    newWord.delete(i, i + p.length());
-                }
-        }
-        return newWord.toString();
+        return removeSpecialParticles(normalizedWord);
     }
 
-    private String firstVowelExcludingFirstCharacterOf(String word) {
+    private String removeSpecialParticles(String word) {
+        String particlesRegex = String.join("|", SPECIAL_PARTICLES);  // convert the array to a regex OR sequence
+        int flags = Pattern.CASE_INSENSITIVE | Pattern.UNICODE_CHARACTER_CLASS; // Unicode-aware \b: Ñ must count as a word character (on JDK 19+ \b is ASCII-only by default, which would strip "LE" from "LEÑERO")
+        Matcher matcher = Pattern.compile("\\b(" + particlesRegex + ")\\b", flags).matcher(word); // match the particles only if they are whole words
+        String result = matcher.replaceAll(" "); // replace all special particles with space
+        return result.trim();  // remove any leading and trailing spaces
+    }
 
+    private String firstVowelExcludingFirstCharacterOf(String word) {
         String normalizedWord = normalize(word).substring(1);
         Matcher m = VOWEL_PATTERN.matcher(normalizedWord);
         if (!m.find()) {
             return "X";
         }
         return String.valueOf(normalizedWord.charAt(m.start()));
     }
+
+    private String stripAccentsExcludingNTilde(String input) {
+        if (StringUtils.isEmpty(input)) // null or "" is returned untouched
+            return input;
+
+        input = input.toUpperCase().replace("$", ""); // drop any literal '$' first: it is used as the Ñ placeholder below
+        input = input.replace("Ñ", "$"); // shield Ñ so that stripAccents does not flatten it to N
+        input = StringUtils.stripAccents(input);
+        input = input.replace("$", "Ñ"); // restore the shielded Ñ
+        return input.replaceAll("[^A-Z0-9&Ñ ]", ""); // keep only letters, digits, '&', Ñ and spaces
+    }
 }
diff --git a/src/test/java/com/josketres/rfcfacil/NaturalPersonTenDigitsCodeCalculatorTest.java b/src/test/java/com/josketres/rfcfacil/NaturalPersonTenDigitsCodeCalculatorTest.java
@@ -77,7 +77,7 @@ public void should_use_second_name_if_person_has_multiple_names_and_first_name_i
     @Test
     public void should_use_second_name_if_person_has_multiple_names_and_first_name_is_maria() {
 
-        assertThat(tenDigitsCode("María Luisa", "Ramírez", "Sánchez", 13, 12, 1970), equalTo("RASL701213"));
+        assertThat(tenDigitsCode("María del Luisa", "Ramírez", "Sánchez", 13, 12, 1970), equalTo("RASL701213"));
     }
 
     @Test
@@ -117,6 +117,11 @@ public void should_use_ma_when_first_name_is_not_Maria() {
         assertThat(tenDigitsCode("Marco Antonio", "Cano", "Barraza", 13, 12, 1970), equalTo("CABM701213"));
     }
 
+    @Test
+    public void should_not_fail_for_names_with_special_characters(){
+        assertThat(tenDigitsCode("Jesus Antonio","López", "Ventura", 17,8,2004),equalTo("LOVJ040817"));
+    }
+
     private String tenDigitsCode(String name,
                                  String firstLastName,
                                  String secondLastName,
diff --git a/src/test/java/com/josketres/rfcfacil/RfcReworkTest.java b/src/test/java/com/josketres/rfcfacil/RfcReworkTest.java