|
| 1 | +package tribixbite.cleverkeys |
| 2 | + |
| 3 | +import com.google.common.truth.Truth.assertThat |
| 4 | +import org.junit.Test |
| 5 | + |
| 6 | +/** |
| 7 | + * Tests for French contraction frequency scoring (v1.2.9 fix). |
| 8 | + * |
| 9 | + * The v1.2.9 fix ensures that French contractions like "qu'est" can rank |
| 10 | + * higher than their base words like "quest" when the contraction has |
| 11 | + * higher frequency in the dictionary. |
| 12 | + * |
| 13 | + * This is achieved by looking up actual contraction frequencies and using |
| 14 | + * VocabularyUtils.calculateCombinedScore for fair comparison. |
| 15 | + */ |
| 16 | +class ContractionFrequencyTest { |
| 17 | + |
| 18 | + // ========================================================================= |
| 19 | + // calculateCombinedScore for contraction ranking |
| 20 | + // ========================================================================= |
| 21 | + |
| 22 | + @Test |
| 23 | + fun `high frequency contraction scores higher than low frequency base word`() { |
| 24 | + // Simulate "qu'est" (high frequency French contraction) vs "quest" (lower frequency) |
| 25 | + val contractionFrequency = 0.9f // Very common French word |
| 26 | + val baseWordFrequency = 0.3f // Less common English word |
| 27 | + |
| 28 | + val commonBoost = 1.15f |
| 29 | + val confidenceWeight = 0.6f |
| 30 | + val frequencyWeight = 0.4f |
| 31 | + |
| 32 | + // Both have same NN confidence (user swiped the same pattern) |
| 33 | + val nnConfidence = 0.85f |
| 34 | + |
| 35 | + val contractionScore = VocabularyUtils.calculateCombinedScore( |
| 36 | + nnConfidence, contractionFrequency, commonBoost, confidenceWeight, frequencyWeight |
| 37 | + ) |
| 38 | + |
| 39 | + val baseWordScore = VocabularyUtils.calculateCombinedScore( |
| 40 | + nnConfidence, baseWordFrequency, 1.0f, confidenceWeight, frequencyWeight |
| 41 | + ) |
| 42 | + |
| 43 | + // Contraction should score higher due to higher frequency + common boost |
| 44 | + assertThat(contractionScore).isGreaterThan(baseWordScore) |
| 45 | + } |
| 46 | + |
| 47 | + @Test |
| 48 | + fun `low frequency contraction scores lower than high frequency base word`() { |
| 49 | + // When base word is more common, it should rank higher |
| 50 | + val contractionFrequency = 0.2f // Rare contraction |
| 51 | + val baseWordFrequency = 0.95f // Very common word |
| 52 | + |
| 53 | + val top5000Boost = 1.08f |
| 54 | + val commonBoost = 1.15f |
| 55 | + val confidenceWeight = 0.6f |
| 56 | + val frequencyWeight = 0.4f |
| 57 | + |
| 58 | + val nnConfidence = 0.85f |
| 59 | + |
| 60 | + val contractionScore = VocabularyUtils.calculateCombinedScore( |
| 61 | + nnConfidence, contractionFrequency, top5000Boost, confidenceWeight, frequencyWeight |
| 62 | + ) |
| 63 | + |
| 64 | + val baseWordScore = VocabularyUtils.calculateCombinedScore( |
| 65 | + nnConfidence, baseWordFrequency, commonBoost, confidenceWeight, frequencyWeight |
| 66 | + ) |
| 67 | + |
| 68 | + // Base word should score higher |
| 69 | + assertThat(baseWordScore).isGreaterThan(contractionScore) |
| 70 | + } |
| 71 | + |
| 72 | + @Test |
| 73 | + fun `frequency ranking is fair with equal boosts`() { |
| 74 | + // With same boosts, higher frequency should always win |
| 75 | + val boost = 1.0f |
| 76 | + val confidenceWeight = 0.6f |
| 77 | + val frequencyWeight = 0.4f |
| 78 | + val nnConfidence = 0.80f |
| 79 | + |
| 80 | + val highFreqScore = VocabularyUtils.calculateCombinedScore( |
| 81 | + nnConfidence, 0.9f, boost, confidenceWeight, frequencyWeight |
| 82 | + ) |
| 83 | + |
| 84 | + val lowFreqScore = VocabularyUtils.calculateCombinedScore( |
| 85 | + nnConfidence, 0.3f, boost, confidenceWeight, frequencyWeight |
| 86 | + ) |
| 87 | + |
| 88 | + assertThat(highFreqScore).isGreaterThan(lowFreqScore) |
| 89 | + } |
| 90 | + |
| 91 | + // ========================================================================= |
| 92 | + // Frequency conversion from rank |
| 93 | + // ========================================================================= |
| 94 | + |
| 95 | + @Test |
| 96 | + fun `frequency rank 0 converts to frequency 1_0`() { |
| 97 | + // Rank 0 = most common word, should have frequency 1.0 |
| 98 | + val rank = 0 |
| 99 | + val frequency = 1.0f - (rank / 255.0f) |
| 100 | + assertThat(frequency).isWithin(0.001f).of(1.0f) |
| 101 | + } |
| 102 | + |
| 103 | + @Test |
| 104 | + fun `frequency rank 255 converts to near zero frequency`() { |
| 105 | + // Rank 255 = rarest tracked word |
| 106 | + val rank = 255 |
| 107 | + val frequency = 1.0f - (rank / 255.0f) |
| 108 | + assertThat(frequency).isWithin(0.001f).of(0.0f) |
| 109 | + } |
| 110 | + |
| 111 | + @Test |
| 112 | + fun `frequency rank 127 converts to mid frequency`() { |
| 113 | + // Rank 127 = middle of the range |
| 114 | + val rank = 127 |
| 115 | + val frequency = 1.0f - (rank / 255.0f) |
| 116 | + assertThat(frequency).isWithin(0.01f).of(0.5f) |
| 117 | + } |
| 118 | + |
| 119 | + // ========================================================================= |
| 120 | + // Realistic French contraction scenarios |
| 121 | + // ========================================================================= |
| 122 | + |
| 123 | + @Test |
| 124 | + fun `quest_vs_quest_scenario`() { |
| 125 | + // In French, "qu'est" (what is) is more common than English "quest" |
| 126 | + // Simulated dictionary ranks: |
| 127 | + // - "qu'est" rank ~20 (very common in French) |
| 128 | + // - "quest" rank ~150 (moderately common in English) |
| 129 | + |
| 130 | + val questRank = 150 |
| 131 | + val questFreq = 1.0f - (questRank / 255.0f) // ~0.41 |
| 132 | + |
| 133 | + val questApostropheRank = 20 |
| 134 | + val questApostropheFreq = 1.0f - (questApostropheRank / 255.0f) // ~0.92 |
| 135 | + |
| 136 | + val commonBoost = 1.15f |
| 137 | + val top5000Boost = 1.08f |
| 138 | + val confidenceWeight = 0.6f |
| 139 | + val frequencyWeight = 0.4f |
| 140 | + val nnConfidence = 0.82f |
| 141 | + |
| 142 | + val questScore = VocabularyUtils.calculateCombinedScore( |
| 143 | + nnConfidence, questFreq, top5000Boost, confidenceWeight, frequencyWeight |
| 144 | + ) |
| 145 | + |
| 146 | + val questApostropheScore = VocabularyUtils.calculateCombinedScore( |
| 147 | + nnConfidence, questApostropheFreq, commonBoost, confidenceWeight, frequencyWeight |
| 148 | + ) |
| 149 | + |
| 150 | + // "qu'est" should rank higher due to its much higher frequency |
| 151 | + assertThat(questApostropheScore).isGreaterThan(questScore) |
| 152 | + } |
| 153 | + |
| 154 | + @Test |
| 155 | + fun `jai_vs_jail_scenario`() { |
| 156 | + // French "j'ai" (I have) vs English "jail" |
| 157 | + // "j'ai" is extremely common in French |
| 158 | + // "jail" is moderately common in English |
| 159 | + |
| 160 | + val jailRank = 180 |
| 161 | + val jailFreq = 1.0f - (jailRank / 255.0f) // ~0.29 |
| 162 | + |
| 163 | + val jaiRank = 5 |
| 164 | + val jaiFreq = 1.0f - (jaiRank / 255.0f) // ~0.98 |
| 165 | + |
| 166 | + val commonBoost = 1.15f |
| 167 | + val top5000Boost = 1.08f |
| 168 | + val confidenceWeight = 0.6f |
| 169 | + val frequencyWeight = 0.4f |
| 170 | + val nnConfidence = 0.78f |
| 171 | + |
| 172 | + val jailScore = VocabularyUtils.calculateCombinedScore( |
| 173 | + nnConfidence, jailFreq, top5000Boost, confidenceWeight, frequencyWeight |
| 174 | + ) |
| 175 | + |
| 176 | + val jaiScore = VocabularyUtils.calculateCombinedScore( |
| 177 | + nnConfidence, jaiFreq, commonBoost, confidenceWeight, frequencyWeight |
| 178 | + ) |
| 179 | + |
| 180 | + // "j'ai" should rank higher |
| 181 | + assertThat(jaiScore).isGreaterThan(jailScore) |
| 182 | + } |
| 183 | + |
| 184 | + // ========================================================================= |
| 185 | + // Edge cases |
| 186 | + // ========================================================================= |
| 187 | + |
| 188 | + @Test |
| 189 | + fun `zero frequency contraction still gets valid score`() { |
| 190 | + val score = VocabularyUtils.calculateCombinedScore( |
| 191 | + confidence = 0.8f, |
| 192 | + frequency = 0.0f, |
| 193 | + boost = 1.0f, |
| 194 | + confidenceWeight = 0.6f, |
| 195 | + frequencyWeight = 0.4f |
| 196 | + ) |
| 197 | + // Should still produce a positive score from confidence alone |
| 198 | + assertThat(score).isGreaterThan(0f) |
| 199 | + assertThat(score).isWithin(0.001f).of(0.48f) // 0.6 * 0.8 + 0.4 * 0 |
| 200 | + } |
| 201 | + |
| 202 | + @Test |
| 203 | + fun `default contraction frequency 0_6 is reasonable fallback`() { |
| 204 | + // When contraction isn't in dictionary, default to 0.6 |
| 205 | + val defaultFreq = 0.6f |
| 206 | + |
| 207 | + val score = VocabularyUtils.calculateCombinedScore( |
| 208 | + confidence = 0.8f, |
| 209 | + frequency = defaultFreq, |
| 210 | + boost = 1.08f, |
| 211 | + confidenceWeight = 0.6f, |
| 212 | + frequencyWeight = 0.4f |
| 213 | + ) |
| 214 | + |
| 215 | + // Score should be reasonable (not too high, not too low) |
| 216 | + assertThat(score).isGreaterThan(0.5f) |
| 217 | + assertThat(score).isLessThan(1.0f) |
| 218 | + } |
| 219 | +} |
0 commit comments