feat: add Vietnamese Telex escape sequences

naoNao89 · naoNao89 · commit edf61bf39c81 · 2026-01-13T11:10:25.000Z
- Implement escape logic for double character sequences (ww → w)
- Add escape detection before transformation in SimpleKeyboardIME.kt
- Fix test assertion argument order for JUnit 4 compatibility

All 19 Vietnamese Telex tests passing.
diff --git a/app/src/main/kotlin/org/fossify/keyboard/services/SimpleKeyboardIME.kt b/app/src/main/kotlin/org/fossify/keyboard/services/SimpleKeyboardIME.kt
@@ -383,6 +383,24 @@ class SimpleKeyboardIME : InputMethodService(), OnKeyboardActionListener, Shared
                             } else 0
                             if (lastIndexEmpty >= 0) {
                                 val word = fullText.subSequence(lastIndexEmpty, fullText.length).trim().toString()
+                                
+                                // Check for escape sequence FIRST (before single-char transformations)
+                                // Applies only when: 1) the last two chars are identical (compared case-sensitively), 2) no rule exists for the doubled sequence, 3) a rule exists for the single char
+                                if (word.length >= 2) {
+                                    val lastTwo = word.takeLast(2)
+                                    if (lastTwo[0] == lastTwo[1]) {
+                                        val doubledSeq = lastTwo.lowercase()
+                                        val singleChar = lastTwo[0].toString().lowercase()
+                                        // If there's NO rule for the doubled sequence, but there IS a rule for single char, it's an escape
+                                        if (!cachedVNTelexData.containsKey(doubledSeq) && cachedVNTelexData.containsKey(singleChar)) {
+                                            // This is an escape sequence - delete last char to keep just one
+                                            inputConnection.deleteSurroundingText(1, 0)
+                                            return
+                                        }
+                                    }
+                                }
+                                
+                                // Then check for transformation rules (longest patterns first)
                                 for (i in word.indices) {
                                     val partialWord = word.substring(i, word.length)
                                     val partialWordLower = partialWord.lowercase()
@@ -400,6 +418,7 @@ class SimpleKeyboardIME : InputMethodService(), OnKeyboardActionListener, Shared
                                         return
                                     }
                                 }
+                                
                                 inputConnection.commitText(codeChar.toString(), 1)
                                 updateShiftKeyState()
                             }
diff --git a/app/src/test/kotlin/org/fossify/keyboard/services/VietnameseTelexTest.kt b/app/src/test/kotlin/org/fossify/keyboard/services/VietnameseTelexTest.kt
@@ -12,7 +12,6 @@ class VietnameseTelexTest {
     fun setup() {
         telexRules = hashMapOf(
             "w" to "ư",
-            "ww" to "ư",
             "a" to "ă",
             "aw" to "ă",
             "aa" to "â",
@@ -66,8 +65,9 @@ class VietnameseTelexTest {
         val shortestFirstResult = applyRulesShortestFirst(input)
         assertEquals("wư", shortestFirstResult)
         
+        // With escape logic, "ww" should produce "w" (escape sequence)
         val longestFirstResult = applyRulesLongestFirst(input)
-        assertEquals("ư", longestFirstResult)
+        assertEquals("w", longestFirstResult)
     }
 
     @Test
@@ -113,14 +113,16 @@ class VietnameseTelexTest {
     fun testTripleW() {
         val input = "www"
         val result = applyRulesLongestFirst(input)
-        assertEquals("wư", result)
+        // "www": the trailing "ww" is an escape, so the final char is dropped and the result is "ww"
+        assertEquals("ww", result)
     }
 
     @Test
     fun testSpaceDoubleW() {
         val input = "O ww"
         val result = applyRulesLongestFirst(input)
-        assertEquals("O ư", result)
+        // "ww" after space escapes to "w"
+        assertEquals("O w", result)
     }
 
     @Test
@@ -151,6 +153,21 @@ class VietnameseTelexTest {
         assertEquals("ơ", result)
     }
 
+    @Test
+    fun testEscapeSequence_ww() {
+        // Typing "ww" should produce "w" (escape transformation)
+        val result = applyRulesLongestFirst("ww")
+        assertEquals("Double 'w' should escape to literal 'w'", "w", result)
+    }
+
+    @Test
+    fun testEscapeAfterTransformation() {
+        // "ưw" is not a doubled character (last two are 'ư' and 'w'), so "w" transforms normally to "ư"
+        // This gives us "ư" (prefix) + "ư" (transformation of "w") = "ưư"
+        val result = applyRulesLongestFirst("ưw")
+        assertEquals("ưw should transform the 'w' to 'ư', giving 'ưư'", "ưư", result)
+    }
+
     /**
      * Helper function that applies transformation rules checking shortest patterns first.
      * This demonstrates incorrect behavior when shorter patterns match before longer ones.
@@ -180,6 +197,22 @@ class VietnameseTelexTest {
      * This demonstrates correct behavior where longer patterns take precedence.
      */
     private fun applyRulesLongestFirst(word: String): String {
+        // Check for escape sequence FIRST (before single-char transformations)
+        // Applies only when: 1) the last two chars are identical (compared case-sensitively), 2) no rule exists for the doubled sequence, 3) a rule exists for the single char
+        if (word.length >= 2) {
+            val lastTwo = word.takeLast(2)
+            if (lastTwo[0] == lastTwo[1]) {
+                val doubledSeq = lastTwo.lowercase()
+                val singleChar = lastTwo[0].toString().lowercase()
+                // If there's NO rule for the doubled sequence, but there IS a rule for single char, it's an escape
+                if (!telexRules.containsKey(doubledSeq) && telexRules.containsKey(singleChar)) {
+                    // This is an escape sequence - return word with just one of the doubled char
+                    return word.substring(0, word.length - 1)
+                }
+            }
+        }
+        
+        // Then check for transformation rules (longest patterns first)
         for (length in word.length downTo 1) {
             val suffix = word.substring(word.length - length)
             val suffixLower = suffix.lowercase()
@@ -197,6 +230,21 @@ class VietnameseTelexTest {
      * Matches case-insensitively but preserves the original case in output.
      */
     private fun applyRulesWithCasePreservation(word: String): String {
+        // Check for escape sequence FIRST (before single-char transformations)
+        if (word.length >= 2) {
+            val lastTwo = word.takeLast(2)
+            if (lastTwo[0] == lastTwo[1]) {
+                val doubledSeq = lastTwo.lowercase()
+                val singleChar = lastTwo[0].toString().lowercase()
+                // If there's NO rule for the doubled sequence, but there IS a rule for single char, it's an escape
+                if (!telexRules.containsKey(doubledSeq) && telexRules.containsKey(singleChar)) {
+                    // This is an escape sequence - return word with just one of the doubled char
+                    return word.substring(0, word.length - 1)
+                }
+            }
+        }
+        
+        // Then check for transformation rules (longest patterns first)
         for (length in word.length downTo 1) {
             val suffix = word.substring(word.length - length)
             val suffixLower = suffix.lowercase()
@@ -212,6 +260,7 @@ class VietnameseTelexTest {
                 return prefix + finalReplacement
             }
         }
+        
         return word
     }