@@ -64,9 +64,9 @@ public void testEdgeCases() throws EncoderException {
64
64
{"i" , "0" },
65
65
{"o" , "0" },
66
66
{"u" , "0" },
67
- {"\u00E4 " , "0" },
68
- {"\u00F6 " , "0" },
69
- {"\u00FC " , "0" },
67
+ {"\u00E4 " , "0" }, // a-umlaut
68
+ {"\u00F6 " , "0" }, // o-umlaut
69
+ {"\u00FC " , "0" }, // u-umlaut
70
70
{"aa" , "0" },
71
71
{"ha" , "0" },
72
72
{"h" , "" },
@@ -94,20 +94,20 @@ public void testEdgeCases() throws EncoderException {
94
94
@ Test
95
95
public void testExamples () throws EncoderException {
96
96
String [][] data = {
97
- {"m\u00DC ller" , "657" },
97
+ {"m\u00DC ller" , "657" }, // mÜller - why upper case U-umlaut?
98
98
{"schmidt" , "862" },
99
99
{"schneider" , "8627" },
100
100
{"fischer" , "387" },
101
101
{"weber" , "317" },
102
102
{"wagner" , "3467" },
103
103
{"becker" , "147" },
104
104
{"hoffmann" , "0366" },
105
- {"sch\u00C4 fer" , "837" },
105
+ {"sch\u00C4 fer" , "837" }, // schÄfer - why upper case A-umlaut?
106
106
{"Breschnew" , "17863" },
107
107
{"Wikipedia" , "3412" },
108
108
{"peter" , "127" },
109
109
{"pharma" , "376" },
110
- {"mönchengladbach " , "664645214" },
110
+ {"m \u00f6 nchengladbach " , "664645214" }, // mönchengladbach
111
111
{"deutsch" , "28" },
112
112
{"deutz" , "28" },
113
113
{"hamburg" , "06174" },
@@ -127,20 +127,21 @@ public void testExamples() throws EncoderException {
127
127
128
128
// Diff view of testHyphen. Bare numbers are old/new gutter line numbers from
// the diff rendering; a leading "-" marks the removed line, "+" the added lines.
// The test builds a two-row table of string pairs (the first element of each
// row contains a hyphen) and passes the table to checkEncodings.
// NOTE(review): each row is presumably {input, expected encoding}; checkEncodings
// is not visible in this view - confirm against its definition.
@ Test
129
129
public void testHyphen () throws EncoderException {
130
// Removed version: whole table on one line, second row spelled with literal
// u-umlaut characters (depends on the source file encoding being read correctly).
- String [][] data = {{"bergisch-gladbach" , "174845214" }, {"Müller-Lüdenscheidt" , "65752682" }};
130
// Added version: table split over two lines; the second row spells the u-umlaut
// with Unicode escapes and keeps the readable spelling in a trailing comment.
+ String [][] data = {{"bergisch-gladbach" , "174845214" },
131
// NOTE(review): the spaces inside this literal look like extraction artifacts of
// the diff rendering, not part of the intended test input - confirm in the real file.
+ {"M\u00fc ller-L\u00fc denscheidt" , "65752682" }}; // Müller-Lüdenscheidt
131
132
this .checkEncodings (data );
132
133
}
133
134
134
135
@ Test
135
136
public void testIsEncodeEquals () {
136
137
String [][] data = {
137
- {"Meyer" , "Müller " },
138
+ {"Meyer" , "M \u00fc ller " }, // Müller
138
139
{"Meyer" , "Mayr" },
139
140
{"house" , "house" },
140
141
{"House" , "house" },
141
142
{"Haus" , "house" },
142
143
{"ganz" , "Gans" },
143
- {"ganz" , "Gänse " },
144
+ {"ganz" , "G \u00e4 nse " }, // Gänse
144
145
{"Miyagi" , "Miyako" }};
145
146
for (String [] element : data ) {
146
147
((ColognePhonetic ) this .getStringEncoder ()).isEncodeEqual (element [1 ], element [0 ]);
0 commit comments