Completed
Push — master ( 7e413a...470d5e )
by Chris
11:47
created

BeiderMorseTestCases.test_bmpm_uscensus2000_cc()   A

Complexity

Conditions 5

Size

Total Lines 21
Code Lines 18

Duplication

Lines 21
Ratio 100 %

Importance

Changes 0
Metric Value
cc 5
eloc 18
nop 1
dl 21
loc 21
rs 9.0333
c 0
b 0
f 0
1
# -*- coding: utf-8 -*-
2
3
# Copyright 2014-2018 by Christopher C. Little.
4
# This file is part of Abydos.
5
#
6
# Abydos is free software: you can redistribute it and/or modify
7
# it under the terms of the GNU General Public License as published by
8
# the Free Software Foundation, either version 3 of the License, or
9
# (at your option) any later version.
10
#
11
# Abydos is distributed in the hope that it will be useful,
12
# but WITHOUT ANY WARRANTY; without even the implied warranty of
13
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14
# GNU General Public License for more details.
15
#
16
# You should have received a copy of the GNU General Public License
17
# along with Abydos. If not, see <http://www.gnu.org/licenses/>.
18
19
"""abydos.tests.test_phonetic.
20
21
This module contains unit tests for abydos.phonetic
22
"""
23
24
from __future__ import unicode_literals
25
26
import codecs
27
import math
28
import os
29
import unittest
30
from random import random
31
32
from abydos._bm import _bm_apply_rule_if_compat, _bm_expand_alternates, \
33
    _bm_language, _bm_normalize_lang_attrs, _bm_phonetic_number, \
34
    _bm_remove_dupes
35
from abydos._bmdata import L_ANY, L_CYRILLIC, L_CZECH, L_DUTCH, L_ENGLISH, \
36
    L_FRENCH, L_GERMAN, L_GREEK, L_GREEKLATIN, L_HEBREW, L_HUNGARIAN, \
37
    L_ITALIAN, L_LATVIAN, L_POLISH, L_PORTUGUESE, L_ROMANIAN, L_SPANISH, \
38
    L_TURKISH
39
from abydos.phonetic import alpha_sis, bmpm, caverphone, davidson, \
40
    dm_soundex, dolby, double_metaphone, eudex, fonem, fuzzy_soundex, \
41
    haase_phonetik, henry_early, koelner_phonetik, koelner_phonetik_alpha, \
42
    koelner_phonetik_num_to_alpha, lein, metaphone, metasoundex, mra, \
43
    norphone, nrl, nysiis, onca, parmar_kumbharana, phonem, phonet, \
44
    phonetic_spanish, phonex, phonix, pshp_soundex_first, pshp_soundex_last, \
45
    refined_soundex, reth_schek_phonetik, roger_root, russell_index, \
46
    russell_index_alpha, russell_index_num_to_alpha, sfinxbis, sound_d, \
47
    soundex, soundex_br, spanish_metaphone, spfc, statistics_canada
48
49
from six import text_type
50
51
TESTDIR = os.path.dirname(__file__)
52
53
EXTREME_TEST = False  # Set to True to test EVERY single case (NB: takes hours)
54
ALLOW_RANDOM = True  # Set to False to skip all random tests
55
56
if not EXTREME_TEST and os.path.isfile(TESTDIR + '/EXTREME_TEST'):
57
    # EXTREME_TEST file detected -- switching to EXTREME_TEST mode...
58
    EXTREME_TEST = True
59
60
61
def one_in(inverse_probability):
62
    """Return whether to run a test.
63
64
    Return True if:
65
        EXTREME_TEST is True
66
        OR
67
        (ALLOW_RANDOM is False
68
        AND
69
        random.random() * inverse_probability < 1
70
    Otherwise return False
71
    """
72
    if EXTREME_TEST:
73
        return True
74
    elif ALLOW_RANDOM and random() * inverse_probability < 1:  # noqa: S311
75
        return True
76
    else:
77
        return False
78
79
80
class RussellIndexTestCases(unittest.TestCase):
81
    """Test Russel Index functions.
82
83
    test cases for abydos.phonetic.russell_index,
84
    .russell_index_num_to_alpha, & .russell_index_alpha
85
    """
86
87
    def test_russel_index(self):
88
        """Test abydos.phonetic.russell_index."""
89
        self.assertTrue(math.isnan(russell_index('')))
90
        self.assertTrue(math.isnan(russell_index('H')))
91
        self.assertEqual(russell_index('Hoppa'), 12)
92
        self.assertEqual(russell_index('Hopley'), 125)
93
        self.assertEqual(russell_index('Highfield'), 1254)
94
        self.assertEqual(russell_index('Wright'), 814)
95
        self.assertEqual(russell_index('Carter'), 31848)
96
        self.assertEqual(russell_index('Hopf'), 12)
97
        self.assertEqual(russell_index('Hay'), 1)
98
        self.assertEqual(russell_index('Haas'), 1)
99
        self.assertEqual(russell_index('Meyers'), 618)
100
        self.assertEqual(russell_index('Myers'), 618)
101
        self.assertEqual(russell_index('Meyer'), 618)
102
        self.assertEqual(russell_index('Myer'), 618)
103
        self.assertEqual(russell_index('Mack'), 613)
104
        self.assertEqual(russell_index('Knack'), 3713)
105
106
    def test_russel_index_n2a(self):
107
        """Test abydos.phonetic.russell_index_num_to_alpha."""
108
        self.assertEqual(russell_index_num_to_alpha(0), '')
109
        self.assertEqual(russell_index_num_to_alpha(''), '')
110
        self.assertEqual(russell_index_num_to_alpha(float('NaN')), '')
111
        self.assertEqual(russell_index_num_to_alpha(123456789), 'ABCDLMNR')
112
        self.assertEqual(russell_index_num_to_alpha('0123456789'), 'ABCDLMNR')
113
114
    def test_russel_index_alpha(self):
115
        """Test abydos.phonetic.russell_index_alpha."""
116
        self.assertEqual(russell_index_alpha(''), '')
117
        self.assertEqual(russell_index_alpha('H'), '')
118
        self.assertEqual(russell_index_alpha('Hoppa'), 'AB')
119
        self.assertEqual(russell_index_alpha('Hopley'), 'ABL')
120
        self.assertEqual(russell_index_alpha('Highfield'), 'ABLD')
121
        self.assertEqual(russell_index_alpha('Wright'), 'RAD')
122
        self.assertEqual(russell_index_alpha('Carter'), 'CARDR')
123
        self.assertEqual(russell_index_alpha('Hopf'), 'AB')
124
        self.assertEqual(russell_index_alpha('Hay'), 'A')
125
        self.assertEqual(russell_index_alpha('Haas'), 'A')
126
        self.assertEqual(russell_index_alpha('Meyers'), 'MAR')
127
        self.assertEqual(russell_index_alpha('Myers'), 'MAR')
128
        self.assertEqual(russell_index_alpha('Meyer'), 'MAR')
129
        self.assertEqual(russell_index_alpha('Myer'), 'MAR')
130
        self.assertEqual(russell_index_alpha('Mack'), 'MAC')
131
        self.assertEqual(russell_index_alpha('Knack'), 'CNAC')
132
133
134
class SoundexTestCases(unittest.TestCase):
135
    """Test Soundex functions.
136
137
    test cases for abydos.phonetic.soundex, .refined_soundex,
138
    & .dm_soundex
139
    """
140
141
    def test_soundex(self):
142
        """Test abydos.phonetic.soundex."""
143
        self.assertEqual(soundex(''), '0000')
144
145
        # https://archive.org/stream/accessingindivid00moor#page/14/mode/2up
146
        self.assertEqual(soundex('Euler'), 'E460')
147
        self.assertEqual(soundex('Gauss'), 'G200')
148
        self.assertEqual(soundex('Hilbert'), 'H416')
149
        self.assertEqual(soundex('Knuth'), 'K530')
150
        self.assertEqual(soundex('Lloyd'), 'L300')
151
        self.assertEqual(soundex('Lukasieicz'), 'L222')
152
        self.assertEqual(soundex('Ellery'), 'E460')
153
        self.assertEqual(soundex('Ghosh'), 'G200')
154
        self.assertEqual(soundex('Heilbronn'), 'H416')
155
        self.assertEqual(soundex('Kant'), 'K530')
156
        self.assertEqual(soundex('Ladd'), 'L300')
157
        self.assertEqual(soundex('Lissajous'), 'L222')
158
        self.assertEqual(soundex('Rogers'), 'R262')
159
        self.assertEqual(soundex('Rodgers'), 'R326')
160
        self.assertNotEquals(soundex('Rogers'), soundex('Rodgers'))
161
        self.assertNotEquals(soundex('Sinclair'), soundex('St. Clair'))
162
        self.assertNotEquals(soundex('Tchebysheff'), soundex('Chebyshev'))
163
164
        # http://creativyst.com/Doc/Articles/SoundEx1/SoundEx1.htm#Related
165
        self.assertEqual(soundex('Htacky'), 'H320')
166
        self.assertEqual(soundex('Atacky'), 'A320')
167
        self.assertEqual(soundex('Schmit'), 'S530')
168
        self.assertEqual(soundex('Schneider'), 'S536')
169
        self.assertEqual(soundex('Pfister'), 'P236')
170
        self.assertEqual(soundex('Ashcroft'), 'A261')
171
        self.assertEqual(soundex('Asicroft'), 'A226')
172
173
        # https://en.wikipedia.org/wiki/Soundex
174
        self.assertEqual(soundex('Robert'), 'R163')
175
        self.assertEqual(soundex('Rupert'), 'R163')
176
        self.assertEqual(soundex('Rubin'), 'R150')
177
        self.assertEqual(soundex('Tymczak'), 'T522')
178
179
        # https://en.wikipedia.org/wiki/Daitch%E2%80%93Mokotoff_Soundex
180
        self.assertEqual(soundex('Peters'), 'P362')
181
        self.assertEqual(soundex('Peterson'), 'P362')
182
        self.assertEqual(soundex('Moskowitz'), 'M232')
183
        self.assertEqual(soundex('Moskovitz'), 'M213')
184
        self.assertEqual(soundex('Auerbach'), 'A612')
185
        self.assertEqual(soundex('Uhrbach'), 'U612')
186
        self.assertEqual(soundex('Jackson'), 'J250')
187
        self.assertEqual(soundex('Jackson-Jackson'), 'J252')
188
189
        # maxlength tests
190
        self.assertEqual(soundex('Lincoln', 10), 'L524500000')
191
        self.assertEqual(soundex('Lincoln', 5), 'L5245')
192
        self.assertEqual(soundex('Christopher', 6), 'C62316')
193
194
        # maxlength bounds tests
195
        self.assertEqual(soundex('Niall', maxlength=float('inf')),
196
                         'N4000000000000000000000000000000000000000000000000' +
197
                         '00000000000000')
198
        self.assertEqual(soundex('Niall', maxlength=None),
199
                         'N4000000000000000000000000000000000000000000000000' +
200
                         '00000000000000')
201
        self.assertEqual(soundex('Niall', maxlength=0), 'N400')
202
203
        # reverse tests
204
        self.assertEqual(soundex('Rubin', reverse=True), 'N160')
205
        self.assertEqual(soundex('Llyod', reverse=True), 'D400')
206
        self.assertEqual(soundex('Lincoln', reverse=True), 'N425')
207
        self.assertEqual(soundex('Knuth', reverse=True), 'H352')
208
209
        # zero_pad tests
210
        self.assertEqual(soundex('Niall', maxlength=float('inf'),
211
                                 zero_pad=False), 'N4')
212
        self.assertEqual(soundex('Niall', maxlength=None,
213
                                 zero_pad=False), 'N4')
214
        self.assertEqual(soundex('Niall', maxlength=0, zero_pad=False), 'N4')
215
        self.assertEqual(soundex('Niall', maxlength=0, zero_pad=True), 'N400')
216
        self.assertEqual(soundex('', maxlength=4, zero_pad=False), '0')
217
        self.assertEqual(soundex('', maxlength=4, zero_pad=True), '0000')
218
219
    def test_soundex_special(self):
220
        """Test abydos.phonetic.soundex (special 1880-1910 variant method)."""
221
        self.assertEqual(soundex('Ashcroft', var='special'), 'A226')
222
        self.assertEqual(soundex('Asicroft', var='special'), 'A226')
223
        self.assertEqual(soundex('AsWcroft', var='special'), 'A226')
224
        self.assertEqual(soundex('Rupert', var='special'), 'R163')
225
        self.assertEqual(soundex('Rubin', var='special'), 'R150')
226
227
    def test_soundex_census(self):
228
        """Test abydos.phonetic.soundex (Census variant method)."""
229
        self.assertEqual(soundex('Vandeusen', var='Census'), ('V532', 'D250'))
230
        self.assertEqual(soundex('van Deusen', var='Census'), ('V532', 'D250'))
231
        self.assertEqual(soundex('McDonald', var='Census'), 'M235')
232
        self.assertEqual(soundex('la Cruz', var='Census'), ('L262', 'C620'))
233
        self.assertEqual(soundex('vanDamme', var='Census'), ('V535', 'D500'))
234
235
    def test_refined_soundex(self):
236
        """Test abydos.phonetic.refined_soundex."""
237
        # http://ntz-develop.blogspot.com/2011/03/phonetic-algorithms.html
238
        self.assertEqual(refined_soundex('Braz'), 'B195')
239
        self.assertEqual(refined_soundex('Broz'), 'B195')
240
        self.assertEqual(refined_soundex('Caren'), 'C398')
241
        self.assertEqual(refined_soundex('Caron'), 'C398')
242
        self.assertEqual(refined_soundex('Carren'), 'C398')
243
        self.assertEqual(refined_soundex('Charon'), 'C398')
244
        self.assertEqual(refined_soundex('Corain'), 'C398')
245
        self.assertEqual(refined_soundex('Coram'), 'C398')
246
        self.assertEqual(refined_soundex('Corran'), 'C398')
247
        self.assertEqual(refined_soundex('Corrin'), 'C398')
248
        self.assertEqual(refined_soundex('Corwin'), 'C398')
249
        self.assertEqual(refined_soundex('Curran'), 'C398')
250
        self.assertEqual(refined_soundex('Curreen'), 'C398')
251
        self.assertEqual(refined_soundex('Currin'), 'C398')
252
        self.assertEqual(refined_soundex('Currom'), 'C398')
253
        self.assertEqual(refined_soundex('Currum'), 'C398')
254
        self.assertEqual(refined_soundex('Curwen'), 'C398')
255
        self.assertEqual(refined_soundex('Caren'), 'C398')
256
        self.assertEqual(refined_soundex('Caren'), 'C398')
257
        self.assertEqual(refined_soundex('Caren'), 'C398')
258
        self.assertEqual(refined_soundex('Caren'), 'C398')
259
        self.assertEqual(refined_soundex('Caren'), 'C398')
260
        self.assertEqual(refined_soundex('Caren'), 'C398')
261
        self.assertEqual(refined_soundex('Caren'), 'C398')
262
        self.assertEqual(refined_soundex('Hairs'), 'H93')
263
        self.assertEqual(refined_soundex('Hark'), 'H93')
264
        self.assertEqual(refined_soundex('Hars'), 'H93')
265
        self.assertEqual(refined_soundex('Hayers'), 'H93')
266
        self.assertEqual(refined_soundex('Heers'), 'H93')
267
        self.assertEqual(refined_soundex('Hiers'), 'H93')
268
        self.assertEqual(refined_soundex('Lambard'), 'L78196')
269
        self.assertEqual(refined_soundex('Lambart'), 'L78196')
270
        self.assertEqual(refined_soundex('Lambert'), 'L78196')
271
        self.assertEqual(refined_soundex('Lambird'), 'L78196')
272
        self.assertEqual(refined_soundex('Lampaert'), 'L78196')
273
        self.assertEqual(refined_soundex('Lampard'), 'L78196')
274
        self.assertEqual(refined_soundex('Lampart'), 'L78196')
275
        self.assertEqual(refined_soundex('Lamperd'), 'L78196')
276
        self.assertEqual(refined_soundex('Lampert'), 'L78196')
277
        self.assertEqual(refined_soundex('Lamport'), 'L78196')
278
        self.assertEqual(refined_soundex('Limbert'), 'L78196')
279
        self.assertEqual(refined_soundex('Lombard'), 'L78196')
280
        self.assertEqual(refined_soundex('Nolton'), 'N8768')
281
        self.assertEqual(refined_soundex('Noulton'), 'N8768')
282
283
        # http://trimc-nlp.blogspot.com/2015/03/the-soundex-algorithm.html
284
        self.assertEqual(refined_soundex('Craig'), 'C394')
285
        self.assertEqual(refined_soundex('Crag'), 'C394')
286
        self.assertEqual(refined_soundex('Crejg'), 'C394')
287
        self.assertEqual(refined_soundex('Creig'), 'C394')
288
        self.assertEqual(refined_soundex('Craigg'), 'C394')
289
        self.assertEqual(refined_soundex('Craug'), 'C394')
290
        self.assertEqual(refined_soundex('Craiggg'), 'C394')
291
        self.assertEqual(refined_soundex('Creg'), 'C394')
292
        self.assertEqual(refined_soundex('Cregg'), 'C394')
293
        self.assertEqual(refined_soundex('Creag'), 'C394')
294
        self.assertEqual(refined_soundex('Greg'), 'G494')
295
        self.assertEqual(refined_soundex('Gregg'), 'G494')
296
        self.assertEqual(refined_soundex('Graig'), 'G494')
297
        self.assertEqual(refined_soundex('Greig'), 'G494')
298
        self.assertEqual(refined_soundex('Greggg'), 'G494')
299
        self.assertEqual(refined_soundex('Groeg'), 'G494')
300
        self.assertEqual(refined_soundex('Graj'), 'G494')
301
        self.assertEqual(refined_soundex('Grej'), 'G494')
302
        self.assertEqual(refined_soundex('Grreg'), 'G494')
303
        self.assertEqual(refined_soundex('Greag'), 'G494')
304
        self.assertEqual(refined_soundex('Grig'), 'G494')
305
        self.assertEqual(refined_soundex('Kregg'), 'K394')
306
        self.assertEqual(refined_soundex('Kraig'), 'K394')
307
        self.assertEqual(refined_soundex('Krag'), 'K394')
308
        self.assertEqual(refined_soundex('Kreig'), 'K394')
309
        self.assertEqual(refined_soundex('Krug'), 'K394')
310
        self.assertEqual(refined_soundex('Kreg'), 'K394')
311
        self.assertEqual(refined_soundex('Krieg'), 'K394')
312
        self.assertEqual(refined_soundex('Krijg'), 'K394')
313
314
        # Apache Commons test cases
315
        # http://svn.apache.org/viewvc/commons/proper/codec/trunk/src/test/java/org/apache/commons/codec/language/RefinedSoundexTest.java?view=markup
316
        self.assertEqual(refined_soundex('testing'), 'T63684')
317
        self.assertEqual(refined_soundex('TESTING'), 'T63684')
318
        self.assertEqual(refined_soundex('The'), 'T6')
319
        self.assertEqual(refined_soundex('quick'), 'Q53')
320
        self.assertEqual(refined_soundex('brown'), 'B198')
321
        self.assertEqual(refined_soundex('fox'), 'F25')
322
        self.assertEqual(refined_soundex('jumped'), 'J4816')
323
        self.assertEqual(refined_soundex('over'), 'O29')
324
        self.assertEqual(refined_soundex('the'), 'T6')
325
        self.assertEqual(refined_soundex('lazy'), 'L75')
326
        self.assertEqual(refined_soundex('dogs'), 'D643')
327
328
        # Test with retain_vowels=True
329
        # http://ntz-develop.blogspot.com/2011/03/phonetic-algorithms.html
330
        self.assertEqual(refined_soundex('Braz', retain_vowels=True), 'B1905')
331
        self.assertEqual(refined_soundex('Broz', retain_vowels=True), 'B1905')
332
        self.assertEqual(refined_soundex('Caren', retain_vowels=True),
333
                         'C30908')
334
        self.assertEqual(refined_soundex('Caron', retain_vowels=True),
335
                         'C30908')
336
        self.assertEqual(refined_soundex('Carren', retain_vowels=True),
337
                         'C30908')
338
        self.assertEqual(refined_soundex('Charon', retain_vowels=True),
339
                         'C30908')
340
        self.assertEqual(refined_soundex('Corain', retain_vowels=True),
341
                         'C30908')
342
        self.assertEqual(refined_soundex('Coram', retain_vowels=True),
343
                         'C30908')
344
        self.assertEqual(refined_soundex('Corran', retain_vowels=True),
345
                         'C30908')
346
        self.assertEqual(refined_soundex('Corrin', retain_vowels=True),
347
                         'C30908')
348
        self.assertEqual(refined_soundex('Corwin', retain_vowels=True),
349
                         'C30908')
350
        self.assertEqual(refined_soundex('Curran', retain_vowels=True),
351
                         'C30908')
352
        self.assertEqual(refined_soundex('Curreen', retain_vowels=True),
353
                         'C30908')
354
        self.assertEqual(refined_soundex('Currin', retain_vowels=True),
355
                         'C30908')
356
        self.assertEqual(refined_soundex('Currom', retain_vowels=True),
357
                         'C30908')
358
        self.assertEqual(refined_soundex('Currum', retain_vowels=True),
359
                         'C30908')
360
        self.assertEqual(refined_soundex('Curwen', retain_vowels=True),
361
                         'C30908')
362
        self.assertEqual(refined_soundex('Caren', retain_vowels=True),
363
                         'C30908')
364
        self.assertEqual(refined_soundex('Caren', retain_vowels=True),
365
                         'C30908')
366
        self.assertEqual(refined_soundex('Caren', retain_vowels=True),
367
                         'C30908')
368
        self.assertEqual(refined_soundex('Caren', retain_vowels=True),
369
                         'C30908')
370
        self.assertEqual(refined_soundex('Caren', retain_vowels=True),
371
                         'C30908')
372
        self.assertEqual(refined_soundex('Caren', retain_vowels=True),
373
                         'C30908')
374
        self.assertEqual(refined_soundex('Caren', retain_vowels=True),
375
                         'C30908')
376
        self.assertEqual(refined_soundex('Hairs', retain_vowels=True), 'H093')
377
        self.assertEqual(refined_soundex('Hark', retain_vowels=True), 'H093')
378
        self.assertEqual(refined_soundex('Hars', retain_vowels=True), 'H093')
379
        self.assertEqual(refined_soundex('Hayers', retain_vowels=True), 'H093')
380
        self.assertEqual(refined_soundex('Heers', retain_vowels=True), 'H093')
381
        self.assertEqual(refined_soundex('Hiers', retain_vowels=True), 'H093')
382
        self.assertEqual(refined_soundex('Lambard', retain_vowels=True),
383
                         'L7081096')
384
        self.assertEqual(refined_soundex('Lambart', retain_vowels=True),
385
                         'L7081096')
386
        self.assertEqual(refined_soundex('Lambert', retain_vowels=True),
387
                         'L7081096')
388
        self.assertEqual(refined_soundex('Lambird', retain_vowels=True),
389
                         'L7081096')
390
        self.assertEqual(refined_soundex('Lampaert', retain_vowels=True),
391
                         'L7081096')
392
        self.assertEqual(refined_soundex('Lampard', retain_vowels=True),
393
                         'L7081096')
394
        self.assertEqual(refined_soundex('Lampart', retain_vowels=True),
395
                         'L7081096')
396
        self.assertEqual(refined_soundex('Lamperd', retain_vowels=True),
397
                         'L7081096')
398
        self.assertEqual(refined_soundex('Lampert', retain_vowels=True),
399
                         'L7081096')
400
        self.assertEqual(refined_soundex('Lamport', retain_vowels=True),
401
                         'L7081096')
402
        self.assertEqual(refined_soundex('Limbert', retain_vowels=True),
403
                         'L7081096')
404
        self.assertEqual(refined_soundex('Lombard', retain_vowels=True),
405
                         'L7081096')
406
        self.assertEqual(refined_soundex('Nolton', retain_vowels=True),
407
                         'N807608')
408
        self.assertEqual(refined_soundex('Noulton', retain_vowels=True),
409
                         'N807608')
410
411
        # http://trimc-nlp.blogspot.com/2015/03/the-soundex-algorithm.html
412
        self.assertEqual(refined_soundex('Craig', retain_vowels=True), 'C3904')
413
        self.assertEqual(refined_soundex('Crag', retain_vowels=True), 'C3904')
414
        self.assertEqual(refined_soundex('Crejg', retain_vowels=True), 'C3904')
415
        self.assertEqual(refined_soundex('Creig', retain_vowels=True), 'C3904')
416
        self.assertEqual(refined_soundex('Craigg', retain_vowels=True),
417
                         'C3904')
418
        self.assertEqual(refined_soundex('Craug', retain_vowels=True), 'C3904')
419
        self.assertEqual(refined_soundex('Craiggg', retain_vowels=True),
420
                         'C3904')
421
        self.assertEqual(refined_soundex('Creg', retain_vowels=True), 'C3904')
422
        self.assertEqual(refined_soundex('Cregg', retain_vowels=True), 'C3904')
423
        self.assertEqual(refined_soundex('Creag', retain_vowels=True), 'C3904')
424
        self.assertEqual(refined_soundex('Greg', retain_vowels=True), 'G4904')
425
        self.assertEqual(refined_soundex('Gregg', retain_vowels=True), 'G4904')
426
        self.assertEqual(refined_soundex('Graig', retain_vowels=True), 'G4904')
427
        self.assertEqual(refined_soundex('Greig', retain_vowels=True), 'G4904')
428
        self.assertEqual(refined_soundex('Greggg', retain_vowels=True),
429
                         'G4904')
430
        self.assertEqual(refined_soundex('Groeg', retain_vowels=True), 'G4904')
431
        self.assertEqual(refined_soundex('Graj', retain_vowels=True), 'G4904')
432
        self.assertEqual(refined_soundex('Grej', retain_vowels=True), 'G4904')
433
        self.assertEqual(refined_soundex('Grreg', retain_vowels=True), 'G4904')
434
        self.assertEqual(refined_soundex('Greag', retain_vowels=True), 'G4904')
435
        self.assertEqual(refined_soundex('Grig', retain_vowels=True), 'G4904')
436
        self.assertEqual(refined_soundex('Kregg', retain_vowels=True), 'K3904')
437
        self.assertEqual(refined_soundex('Kraig', retain_vowels=True), 'K3904')
438
        self.assertEqual(refined_soundex('Krag', retain_vowels=True), 'K3904')
439
        self.assertEqual(refined_soundex('Kreig', retain_vowels=True), 'K3904')
440
        self.assertEqual(refined_soundex('Krug', retain_vowels=True), 'K3904')
441
        self.assertEqual(refined_soundex('Kreg', retain_vowels=True), 'K3904')
442
        self.assertEqual(refined_soundex('Krieg', retain_vowels=True), 'K3904')
443
        self.assertEqual(refined_soundex('Krijg', retain_vowels=True), 'K3904')
444
445
        # Apache Commons test cases
446
        # http://svn.apache.org/viewvc/commons/proper/codec/trunk/src/test/java/org/apache/commons/codec/language/RefinedSoundexTest.java?view=markup
447
        self.assertEqual(refined_soundex('testing', retain_vowels=True),
448
                         'T6036084')
449
        self.assertEqual(refined_soundex('TESTING', retain_vowels=True),
450
                         'T6036084')
451
        self.assertEqual(refined_soundex('The', retain_vowels=True), 'T60')
452
        self.assertEqual(refined_soundex('quick', retain_vowels=True), 'Q503')
453
        self.assertEqual(refined_soundex('brown', retain_vowels=True), 'B1908')
454
        self.assertEqual(refined_soundex('fox', retain_vowels=True), 'F205')
455
        self.assertEqual(refined_soundex('jumped', retain_vowels=True),
456
                         'J408106')
457
        self.assertEqual(refined_soundex('over', retain_vowels=True), 'O0209')
458
        self.assertEqual(refined_soundex('the', retain_vowels=True), 'T60')
459
        self.assertEqual(refined_soundex('lazy', retain_vowels=True), 'L7050')
460
        self.assertEqual(refined_soundex('dogs', retain_vowels=True), 'D6043')
461
462
        # length tests
463
        self.assertEqual(refined_soundex('testing', maxlength=4,
464
                                         zero_pad=True), 'T636')
465
        self.assertEqual(refined_soundex('TESTING', maxlength=4,
466
                                         zero_pad=True), 'T636')
467
        self.assertEqual(refined_soundex('The', maxlength=4, zero_pad=True),
468
                         'T600')
469
        self.assertEqual(refined_soundex('quick', maxlength=4, zero_pad=True),
470
                         'Q530')
471
        self.assertEqual(refined_soundex('brown', maxlength=4, zero_pad=True),
472
                         'B198')
473
        self.assertEqual(refined_soundex('fox', maxlength=4, zero_pad=True),
474
                         'F250')
475
        self.assertEqual(refined_soundex('jumped', maxlength=4, zero_pad=True),
476
                         'J481')
477
        self.assertEqual(refined_soundex('over', maxlength=4, zero_pad=True),
478
                         'O290')
479
        self.assertEqual(refined_soundex('the', maxlength=4, zero_pad=True),
480
                         'T600')
481
        self.assertEqual(refined_soundex('lazy', maxlength=4, zero_pad=True),
482
                         'L750')
483
        self.assertEqual(refined_soundex('dogs', maxlength=4, zero_pad=True),
484
                         'D643')
485
        self.assertEqual(refined_soundex('The', maxlength=4),
486
                         'T6')
487
        self.assertEqual(refined_soundex('quick', maxlength=4),
488
                         'Q53')
489
        self.assertEqual(refined_soundex('brown', maxlength=4),
490
                         'B198')
491
        self.assertEqual(refined_soundex('fox', maxlength=4),
492
                         'F25')
493
        self.assertEqual(refined_soundex('jumped', maxlength=4),
494
                         'J481')
495
        self.assertEqual(refined_soundex('over', maxlength=4),
496
                         'O29')
497
        self.assertEqual(refined_soundex('the', maxlength=4),
498
                         'T6')
499
        self.assertEqual(refined_soundex('lazy', maxlength=4),
500
                         'L75')
501
        self.assertEqual(refined_soundex('dogs', maxlength=4),
502
                         'D643')
503
504
    def test_dm_soundex(self):
505
        """Test abydos.phonetic.dm_soundex (Daitch-Mokotoff Soundex)."""
506
        # D-M tests
507
        self.assertEqual(dm_soundex(''), {'000000'})
508
509
        # http://www.avotaynu.com/soundex.htm
510
        self.assertEqual(dm_soundex('Augsburg'), {'054795'})
511
        self.assertEqual(dm_soundex('Breuer'), {'791900'})
512
        self.assertEqual(dm_soundex('Halberstadt'), {'587943', '587433'})
513
        self.assertEqual(dm_soundex('Mannheim'), {'665600'})
514
        self.assertEqual(dm_soundex('Chernowitz'), {'496740', '596740'})
515
        self.assertEqual(dm_soundex('Cherkassy'), {'495400', '595400'})
516
        self.assertEqual(dm_soundex('Kleinman'), {'586660'})
517
        self.assertEqual(dm_soundex('Berlin'), {'798600'})
518
519
        self.assertEqual(dm_soundex('Ceniow'), {'467000', '567000'})
520
        self.assertEqual(dm_soundex('Tsenyuv'), {'467000'})
521
        self.assertEqual(dm_soundex('Holubica'), {'587400', '587500'})
522
        self.assertEqual(dm_soundex('Golubitsa'), {'587400'})
523
        self.assertEqual(dm_soundex('Przemysl'), {'746480', '794648'})
524
        self.assertEqual(dm_soundex('Pshemeshil'), {'746480'})
525
        self.assertEqual(dm_soundex('Rosochowaciec'),
526
                         {'944744', '945744', '944755', '944754', '944745',
527
                          '945745', '945754', '945755'})
528
        self.assertEqual(dm_soundex('Rosokhovatsets'), {'945744'})
529
530
        # https://en.wikipedia.org/wiki/Daitch%E2%80%93Mokotoff_Soundex
531
        self.assertEqual(dm_soundex('Peters'), {'739400', '734000'})
532
        self.assertEqual(dm_soundex('Peterson'), {'739460', '734600'})
533
        self.assertEqual(dm_soundex('Moskowitz'), {'645740'})
534
        self.assertEqual(dm_soundex('Moskovitz'), {'645740'})
535
        self.assertEqual(dm_soundex('Auerbach'), {'097500', '097400'})
536
        self.assertEqual(dm_soundex('Uhrbach'), {'097500', '097400'})
537
        self.assertEqual(dm_soundex('Jackson'),
538
                         {'154600', '454600', '145460', '445460'})
539
        self.assertEqual(dm_soundex('Jackson-Jackson'),
540
                         {'154654', '454654', '145465', '445465',
541
                          '154645', '454645', '145464', '445464',
542
                          '154644', '454644'})
543
544
        # http://www.jewishgen.org/infofiles/soundex.html
545
        self.assertEqual(dm_soundex('OHRBACH'), {'097500', '097400'})
546
        self.assertEqual(dm_soundex('LIPSHITZ'), {'874400'})
547
        self.assertEqual(dm_soundex('LIPPSZYC'), {'874400', '874500'})
548
        self.assertEqual(dm_soundex('LEWINSKY'), {'876450'})
549
        self.assertEqual(dm_soundex('LEVINSKI'), {'876450'})
550
        self.assertEqual(dm_soundex('SZLAMAWICZ'), {'486740'})
551
        self.assertEqual(dm_soundex('SHLAMOVITZ'), {'486740'})
552
553
        # http://community.actian.com/wiki/OME_soundex_dm()
554
        self.assertEqual(dm_soundex('Schwarzenegger'),
555
                         {'479465', '474659'})
556
        self.assertEqual(dm_soundex('Shwarzenegger'),
557
                         {'479465', '474659'})
558
        self.assertEqual(dm_soundex('Schwartsenegger'), {'479465'})
559
560
        # maxlength bounds tests
561
        self.assertEqual(dm_soundex('Niall', maxlength=float('inf')),
562
                         {'68'+'0'*62})
563
        self.assertEqual(dm_soundex('Niall', maxlength=None),
564
                         {'68'+'0'*62})
565
        self.assertEqual(dm_soundex('Niall', maxlength=0), {'680000'})
566
567
        # zero_pad tests
568
        self.assertEqual(dm_soundex('Niall', maxlength=float('inf'),
569
                                    zero_pad=False), {'68'})
570
        self.assertEqual(dm_soundex('Niall', maxlength=None, zero_pad=False),
571
                         {'68'})
572
        self.assertEqual(dm_soundex('Niall', maxlength=0, zero_pad=False),
573
                         {'68'})
574
        self.assertEqual(dm_soundex('Niall', maxlength=0, zero_pad=True),
575
                         {'680000'})
576
        self.assertEqual(dm_soundex('', maxlength=6, zero_pad=False),
577
                         {'0'})
578
        self.assertEqual(dm_soundex('', maxlength=6, zero_pad=True),
579
                         {'000000'})
580
581
582
class KoelnerPhonetikTestCases(unittest.TestCase):
583
    """Test Koelner Phonetic functions.
584
585
    test cases for abydos.phonetic.koelner_phonetik,
586
    .koelner_phonetik_num_to_alpha, & .koelner_phonetik_alpha
587
    """
588
589
    def test_koelner_phonetik(self):
590
        """Test abydos.phonetic.koelner_phonetik."""
591
        self.assertEqual(koelner_phonetik(''), '')
592
593
        # https://de.wikipedia.org/wiki/K%C3%B6lner_Phonetik
594
        self.assertEqual(koelner_phonetik('Müller-Lüdenscheidt'), '65752682')
595
        self.assertEqual(koelner_phonetik('Wikipedia'), '3412')
596
        self.assertEqual(koelner_phonetik('Breschnew'), '17863')
597
598
        # http://search.cpan.org/~maros/Text-Phonetic/lib/Text/Phonetic/Koeln.pm
599
        self.assertEqual(koelner_phonetik('Müller'), '657')
600
        self.assertEqual(koelner_phonetik('schmidt'), '862')
601
        self.assertEqual(koelner_phonetik('schneider'), '8627')
602
        self.assertEqual(koelner_phonetik('fischer'), '387')
603
        self.assertEqual(koelner_phonetik('weber'), '317')
604
        self.assertEqual(koelner_phonetik('meyer'), '67')
605
        self.assertEqual(koelner_phonetik('wagner'), '3467')
606
        self.assertEqual(koelner_phonetik('schulz'), '858')
607
        self.assertEqual(koelner_phonetik('becker'), '147')
608
        self.assertEqual(koelner_phonetik('hoffmann'), '0366')
609
        self.assertEqual(koelner_phonetik('schäfer'), '837')
610
        self.assertEqual(koelner_phonetik('cater'), '427')
611
        self.assertEqual(koelner_phonetik('axel'), '0485')
612
613
        # etc. (for code coverage)
614
        self.assertEqual(koelner_phonetik('Akxel'), '0485')
615
        self.assertEqual(koelner_phonetik('Adz'), '08')
616
        self.assertEqual(koelner_phonetik('Alpharades'), '053728')
617
        self.assertEqual(koelner_phonetik('Cent'), '862')
618
        self.assertEqual(koelner_phonetik('Acre'), '087')
619
        self.assertEqual(koelner_phonetik('H'), '')
620
621
    def test_koelner_phonetik_n2a(self):
622
        """Test abydos.phonetic.koelner_phonetik_num_to_alpha."""
623
        self.assertEqual(koelner_phonetik_num_to_alpha('0123456789'),
624
                         'APTFKLNRS')
625
626
    def test_koelner_phonetik_alpha(self):
627
        """Test abydos.phonetic.koelner_phonetik_alpha."""
628
        self.assertEqual(koelner_phonetik_alpha('Müller-Lüdenscheidt'),
629
                         'NLRLTNST')
630
        self.assertEqual(koelner_phonetik_alpha('Wikipedia'), 'FKPT')
631
        self.assertEqual(koelner_phonetik_alpha('Breschnew'), 'PRSNF')
632
        self.assertEqual(koelner_phonetik_alpha('Müller'), 'NLR')
633
        self.assertEqual(koelner_phonetik_alpha('schmidt'), 'SNT')
634
        self.assertEqual(koelner_phonetik_alpha('schneider'), 'SNTR')
635
        self.assertEqual(koelner_phonetik_alpha('fischer'), 'FSR')
636
        self.assertEqual(koelner_phonetik_alpha('weber'), 'FPR')
637
        self.assertEqual(koelner_phonetik_alpha('meyer'), 'NR')
638
        self.assertEqual(koelner_phonetik_alpha('wagner'), 'FKNR')
639
        self.assertEqual(koelner_phonetik_alpha('schulz'), 'SLS')
640
        self.assertEqual(koelner_phonetik_alpha('becker'), 'PKR')
641
        self.assertEqual(koelner_phonetik_alpha('hoffmann'), 'AFNN')
642
        self.assertEqual(koelner_phonetik_alpha('schäfer'), 'SFR')
643
        self.assertEqual(koelner_phonetik_alpha('cater'), 'KTR')
644
        self.assertEqual(koelner_phonetik_alpha('axel'), 'AKSL')
645
646
647
class NysiisTestCases(unittest.TestCase):
648
    """Test NYSIIS functions.
649
650
    test cases for abydos.phonetic.nysiis
651
    """
652
653
    def test_nysiis(self):
654
        """Test abydos.phonetic.nysiis."""
655
        self.assertEqual(nysiis(''), '')
656
657
        # http://coryodaniel.com/index.php/2009/12/30/ruby-nysiis-implementation/
658
        self.assertEqual(nysiis('O\'Daniel'), 'ODANAL')
659
        self.assertEqual(nysiis('O\'Donnel'), 'ODANAL')
660
        self.assertEqual(nysiis('Cory'), 'CARY')
661
        self.assertEqual(nysiis('Corey'), 'CARY')
662
        self.assertEqual(nysiis('Kory'), 'CARY')
663
664
        # http://ntz-develop.blogspot.com/2011/03/phonetic-algorithms.html
665
        self.assertEqual(nysiis('Diggell'), 'DAGAL')
666
        self.assertEqual(nysiis('Dougal'), 'DAGAL')
667
        self.assertEqual(nysiis('Doughill'), 'DAGAL')
668
        self.assertEqual(nysiis('Dougill'), 'DAGAL')
669
        self.assertEqual(nysiis('Dowgill'), 'DAGAL')
670
        self.assertEqual(nysiis('Dugall'), 'DAGAL')
671
        self.assertEqual(nysiis('Dugall'), 'DAGAL')
672
        self.assertEqual(nysiis('Glinde'), 'GLAND')
673
        self.assertEqual(nysiis('Plumridge', maxlength=20), 'PLANRADG')
674
        self.assertEqual(nysiis('Chinnick'), 'CANAC')
675
        self.assertEqual(nysiis('Chinnock'), 'CANAC')
676
        self.assertEqual(nysiis('Chinnock'), 'CANAC')
677
        self.assertEqual(nysiis('Chomicki'), 'CANAC')
678
        self.assertEqual(nysiis('Chomicz'), 'CANAC')
679
        self.assertEqual(nysiis('Schimek'), 'SANAC')
680
        self.assertEqual(nysiis('Shimuk'), 'SANAC')
681
        self.assertEqual(nysiis('Simak'), 'SANAC')
682
        self.assertEqual(nysiis('Simek'), 'SANAC')
683
        self.assertEqual(nysiis('Simic'), 'SANAC')
684
        self.assertEqual(nysiis('Sinnock'), 'SANAC')
685
        self.assertEqual(nysiis('Sinnocke'), 'SANAC')
686
        self.assertEqual(nysiis('Sunnex'), 'SANAX')
687
        self.assertEqual(nysiis('Sunnucks'), 'SANAC')
688
        self.assertEqual(nysiis('Sunock'), 'SANAC')
689
        self.assertEqual(nysiis('Webberley', maxlength=20), 'WABARLY')
690
        self.assertEqual(nysiis('Wibberley', maxlength=20), 'WABARLY')
691
692
        # etc. (for code coverage)
693
        self.assertEqual(nysiis('Alpharades'), 'ALFARA')
694
        self.assertEqual(nysiis('Aschenputtel'), 'ASANPA')
695
        self.assertEqual(nysiis('Beverly'), 'BAFARL')
696
        self.assertEqual(nysiis('Hardt'), 'HARD')
697
        self.assertEqual(nysiis('acknowledge'), 'ACNALA')
698
        self.assertEqual(nysiis('MacNeill'), 'MCNAL')
699
        self.assertEqual(nysiis('MacNeill'), nysiis('McNeill'))
700
        self.assertEqual(nysiis('Knight'), 'NAGT')
701
        self.assertEqual(nysiis('Knight'), nysiis('Night'))
702
        self.assertEqual(nysiis('Pfarr'), 'FAR')
703
        self.assertEqual(nysiis('Phair'), 'FAR')
704
        self.assertEqual(nysiis('Phair'), nysiis('Pfarr'))
705
        self.assertEqual(nysiis('Cherokee'), 'CARACY')
706
        self.assertEqual(nysiis('Iraq'), 'IRAG')
707
708
        # maxlength bounds tests
709
        self.assertEqual(nysiis('Niall', maxlength=float('inf')), 'NAL')
710
        self.assertEqual(nysiis('Niall', maxlength=None), 'NAL')
711
        self.assertEqual(nysiis('Niall', maxlength=0), 'NAL')
712
713
    def test_modified_nysiis(self):
714
        """Test abydos.phonetic.nysiis (modified version)."""
715
        self.assertEqual(nysiis('', maxlength=float('inf'), modified=True), '')
716
717
        # https://naldc.nal.usda.gov/download/27833/PDF
718
        # Some of these were... wrong... and have been corrected
719
        self.assertEqual(nysiis('Daves', maxlength=8, modified=True), 'DAV')
720
        self.assertEqual(nysiis('Davies', maxlength=8, modified=True), 'DAVY')
721
        self.assertEqual(nysiis('Devies', maxlength=8, modified=True), 'DAFY')
722
        self.assertEqual(nysiis('Divish', maxlength=8, modified=True), 'DAVAS')
723
        self.assertEqual(nysiis('Dove', maxlength=8, modified=True), 'DAV')
724
        self.assertEqual(nysiis('Devese', maxlength=8, modified=True), 'DAFAS')
725
        self.assertEqual(nysiis('Devies', maxlength=8, modified=True), 'DAFY')
726
        self.assertEqual(nysiis('Devos', maxlength=8, modified=True), 'DAF')
727
728
        self.assertEqual(nysiis('Schmit', maxlength=8, modified=True), 'SNAT')
729
        self.assertEqual(nysiis('Schmitt', maxlength=8, modified=True), 'SNAT')
730
        self.assertEqual(nysiis('Schmitz', maxlength=8, modified=True), 'SNAT')
731
        self.assertEqual(nysiis('Schmoutz', maxlength=8, modified=True),
732
                         'SNAT')
733
        self.assertEqual(nysiis('Schnitt', maxlength=8, modified=True), 'SNAT')
734
        self.assertEqual(nysiis('Smit', maxlength=8, modified=True), 'SNAT')
735
        self.assertEqual(nysiis('Smite', maxlength=8, modified=True), 'SNAT')
736
        self.assertEqual(nysiis('Smits', maxlength=8, modified=True), 'SNAT')
737
        self.assertEqual(nysiis('Smoot', maxlength=8, modified=True), 'SNAT')
738
        self.assertEqual(nysiis('Smuts', maxlength=8, modified=True), 'SNAT')
739
        self.assertEqual(nysiis('Sneath', maxlength=8, modified=True), 'SNAT')
740
        self.assertEqual(nysiis('Smyth', maxlength=8, modified=True), 'SNAT')
741
        self.assertEqual(nysiis('Smithy', maxlength=8, modified=True), 'SNATY')
742
        self.assertEqual(nysiis('Smithey', maxlength=8, modified=True),
743
                         'SNATY')
744
745
        # http://www.dropby.com/NYSIISTextStrings.html
746
        # Some of these have been altered since the above uses a different set
747
        # of modifications.
748
        self.assertEqual(nysiis('Edwards', maxlength=8, modified=True),
749
                         'EDWAD')
750
        self.assertEqual(nysiis('Perez', maxlength=8, modified=True), 'PAR')
751
        self.assertEqual(nysiis('Macintosh', maxlength=8, modified=True),
752
                         'MCANTAS')
753
        self.assertEqual(nysiis('Phillipson', maxlength=8, modified=True),
754
                         'FALAPSAN')
755
        self.assertEqual(nysiis('Haddix', maxlength=8, modified=True), 'HADAC')
756
        self.assertEqual(nysiis('Essex', maxlength=8, modified=True), 'ESAC')
757
        self.assertEqual(nysiis('Moye', maxlength=8, modified=True), 'MY')
758
        self.assertEqual(nysiis('McKee', maxlength=8, modified=True), 'MCY')
759
        self.assertEqual(nysiis('Mackie', maxlength=8, modified=True), 'MCY')
760
        self.assertEqual(nysiis('Heitschmidt', maxlength=8, modified=True),
761
                         'HATSNAD')
762
        self.assertEqual(nysiis('Bart', maxlength=8, modified=True), 'BAD')
763
        self.assertEqual(nysiis('Hurd', maxlength=8, modified=True), 'HAD')
764
        self.assertEqual(nysiis('Hunt', maxlength=8, modified=True), 'HAN')
765
        self.assertEqual(nysiis('Westerlund', maxlength=8, modified=True),
766
                         'WASTARLA')
767
        self.assertEqual(nysiis('Evers', maxlength=8, modified=True), 'EVAR')
768
        self.assertEqual(nysiis('Devito', maxlength=8, modified=True), 'DAFAT')
769
        self.assertEqual(nysiis('Rawson', maxlength=8, modified=True), 'RASAN')
770
        self.assertEqual(nysiis('Shoulders', maxlength=8, modified=True),
771
                         'SALDAR')
772
        self.assertEqual(nysiis('Leighton', maxlength=8, modified=True),
773
                         'LATAN')
774
        self.assertEqual(nysiis('Wooldridge', maxlength=8, modified=True),
775
                         'WALDRAG')
776
        self.assertEqual(nysiis('Oliphant', maxlength=8, modified=True),
777
                         'OLAFAN')
778
        self.assertEqual(nysiis('Hatchett', maxlength=8, modified=True),
779
                         'HATCAT')
780
        self.assertEqual(nysiis('McKnight', maxlength=8, modified=True),
781
                         'MCNAT')
782
        self.assertEqual(nysiis('Rickert', maxlength=8, modified=True),
783
                         'RACAD')
784
        self.assertEqual(nysiis('Bowman', maxlength=8, modified=True), 'BANAN')
785
        self.assertEqual(nysiis('Vasquez', maxlength=8, modified=True), 'VASG')
786
        self.assertEqual(nysiis('Bashaw', maxlength=8, modified=True), 'BAS')
787
        self.assertEqual(nysiis('Schoenhoeft', maxlength=8, modified=True),
788
                         'SANAFT')
789
        self.assertEqual(nysiis('Heywood', maxlength=8, modified=True), 'HAD')
790
        self.assertEqual(nysiis('Hayman', maxlength=8, modified=True), 'HANAN')
791
        self.assertEqual(nysiis('Seawright', maxlength=8, modified=True),
792
                         'SARAT')
793
        self.assertEqual(nysiis('Kratzer', maxlength=8, modified=True),
794
                         'CRATSAR')
795
        self.assertEqual(nysiis('Canaday', maxlength=8, modified=True),
796
                         'CANADY')
797
        self.assertEqual(nysiis('Crepeau', maxlength=8, modified=True), 'CRAP')
798
799
        # Additional tests from @Yomguithereal's talisman
800
        # https://github.com/Yomguithereal/talisman/blob/master/test/phonetics/nysiis.js
801
        self.assertEqual(nysiis('Andrew', maxlength=8, modified=True), 'ANDR')
802
        self.assertEqual(nysiis('Robertson', maxlength=8, modified=True),
803
                         'RABARTSA')
804
        self.assertEqual(nysiis('Nolan', maxlength=8, modified=True), 'NALAN')
805
        self.assertEqual(nysiis('Louis XVI', maxlength=8, modified=True),
806
                         'LASXV')
807
        self.assertEqual(nysiis('Case', maxlength=8, modified=True), 'CAS')
808
        self.assertEqual(nysiis('Mclaughlin', maxlength=8, modified=True),
809
                         'MCLAGLAN')
810
        self.assertEqual(nysiis('Awale', maxlength=8, modified=True), 'AL')
811
        self.assertEqual(nysiis('Aegir', maxlength=8, modified=True), 'AGAR')
812
        self.assertEqual(nysiis('Lundgren', maxlength=8, modified=True),
813
                         'LANGRAN')
814
        self.assertEqual(nysiis('Philbert', maxlength=8, modified=True),
815
                         'FALBAD')
816
        self.assertEqual(nysiis('Harry', maxlength=8, modified=True), 'HARY')
817
        self.assertEqual(nysiis('Mackenzie', maxlength=8, modified=True),
818
                         'MCANSY')
819
820
        # maxlength bounds tests
821
        self.assertEqual(nysiis('Niall', maxlength=float('inf'),
822
                                modified=True), 'NAL')
823
        self.assertEqual(nysiis('Niall', maxlength=None, modified=True), 'NAL')
824
        self.assertEqual(nysiis('Niall', maxlength=0, modified=True), 'NAL')
825
826
        # coverage
827
        self.assertEqual(nysiis('Sam Jr.', modified=True), 'ERROR')
828
        self.assertEqual(nysiis('John Sr.', modified=True), 'ERROR')
829
        self.assertEqual(nysiis('Wright', modified=True), 'RAT')
830
        self.assertEqual(nysiis('Rhodes', modified=True), 'RAD')
831
        self.assertEqual(nysiis('Dgagoda', modified=True), 'GAGAD')
832
        self.assertEqual(nysiis('Bosch', modified=True), 'BAS')
833
        self.assertEqual(nysiis('Schrader', modified=True), 'SRADAR')
834
835
836
class MraTestCases(unittest.TestCase):
837
    """Test MRA functions.
838
839
    test cases for abydos.phonetic.mra
840
    """
841
842
    def test_mra(self):
843
        """Test abydos.phonetic.mra."""
844
        self.assertEqual(mra(''), '')
845
846
        # https://en.wikipedia.org/wiki/Match_rating_approach
847
        self.assertEqual(mra('Byrne'), 'BYRN')
848
        self.assertEqual(mra('Boern'), 'BRN')
849
        self.assertEqual(mra('Smith'), 'SMTH')
850
        self.assertEqual(mra('Smyth'), 'SMYTH')
851
        self.assertEqual(mra('Catherine'), 'CTHRN')
852
        self.assertEqual(mra('Kathryn'), 'KTHRYN')
853
854
        # length checks
855
        self.assertEqual(mra('Christopher'), 'CHRPHR')
856
        self.assertEqual(mra('Dickensianistic'), 'DCKSTC')
857
        self.assertEqual(mra('Acetylcholinesterase'), 'ACTTRS')
858
859
860
class MetaphoneTestCases(unittest.TestCase):
861
    """Test Metaphone functions.
862
863
    test cases for abydos.phonetic.metaphone
864
    """
865
866
    def test_metaphone(self):
867
        """Test abydos.phonetic.metaphone."""
868
        self.assertEqual(metaphone(''), '')
869
        self.assertEqual(metaphone('...'), '')
870
871
        # http://ntz-develop.blogspot.com/2011/03/phonetic-algorithms.html
872
        self.assertEqual(metaphone('Fishpool', 4), 'FXPL')
873
        self.assertEqual(metaphone('Fishpoole', 4), 'FXPL')
874
        self.assertEqual(metaphone('Gellately', 4), 'JLTL')
875
        self.assertEqual(metaphone('Gelletly', 4), 'JLTL')
876
        self.assertEqual(metaphone('Lowers', 4), 'LWRS')
877
        self.assertEqual(metaphone('Lowerson', 4), 'LWRS')
878
        self.assertEqual(metaphone('Mallabar', 4), 'MLBR')
879
        self.assertEqual(metaphone('Melbert', 4), 'MLBR')
880
        self.assertEqual(metaphone('Melbourn', 4), 'MLBR')
881
        self.assertEqual(metaphone('Melbourne', 4), 'MLBR')
882
        self.assertEqual(metaphone('Melburg', 4), 'MLBR')
883
        self.assertEqual(metaphone('Melbury', 4), 'MLBR')
884
        self.assertEqual(metaphone('Milberry', 4), 'MLBR')
885
        self.assertEqual(metaphone('Milborn', 4), 'MLBR')
886
        self.assertEqual(metaphone('Milbourn', 4), 'MLBR')
887
        self.assertEqual(metaphone('Milbourne', 4), 'MLBR')
888
        self.assertEqual(metaphone('Milburn', 4), 'MLBR')
889
        self.assertEqual(metaphone('Milburne', 4), 'MLBR')
890
        self.assertEqual(metaphone('Millberg', 4), 'MLBR')
891
        self.assertEqual(metaphone('Mulberry', 4), 'MLBR')
892
        self.assertEqual(metaphone('Mulbery', 4), 'MLBR')
893
        self.assertEqual(metaphone('Mulbry', 4), 'MLBR')
894
        self.assertEqual(metaphone('Saipy', 4), 'SP')
895
        self.assertEqual(metaphone('Sapey', 4), 'SP')
896
        self.assertEqual(metaphone('Sapp', 4), 'SP')
897
        self.assertEqual(metaphone('Sappy', 4), 'SP')
898
        self.assertEqual(metaphone('Sepey', 4), 'SP')
899
        self.assertEqual(metaphone('Seppey', 4), 'SP')
900
        self.assertEqual(metaphone('Sopp', 4), 'SP')
901
        self.assertEqual(metaphone('Zoppie', 4), 'SP')
902
        self.assertEqual(metaphone('Zoppo', 4), 'SP')
903
        self.assertEqual(metaphone('Zupa', 4), 'SP')
904
        self.assertEqual(metaphone('Zupo', 4), 'SP')
905
        self.assertEqual(metaphone('Zuppa', 4), 'SP')
906
907
        # assorted tests to complete code coverage
908
        self.assertEqual(metaphone('Xavier'), 'SFR')
909
        self.assertEqual(metaphone('Acacia'), 'AKX')
910
        self.assertEqual(metaphone('Schuler'), 'SKLR')
911
        self.assertEqual(metaphone('Sign'), 'SN')
912
        self.assertEqual(metaphone('Signed'), 'SNT')
913
        self.assertEqual(metaphone('Horatio'), 'HRX')
914
        self.assertEqual(metaphone('Ignatio'), 'IKNX')
915
        self.assertEqual(metaphone('Lucretia'), 'LKRX')
916
917
        # assorted tests to complete branch coverage
918
        self.assertEqual(metaphone('Lamb'), 'LM')
919
        self.assertEqual(metaphone('science'), 'SNS')
920
921
        # maxlength bounds tests
922
        self.assertEqual(metaphone('Niall', maxlength=float('inf')), 'NL')
923
        self.assertEqual(metaphone('Niall', maxlength=None), 'NL')
924
        self.assertEqual(metaphone('Niall', maxlength=0), 'NL')
925
926
927
class DoubleMetaphoneTestCases(unittest.TestCase):
928
    """Test Double Metaphone functions.
929
930
    test cases for abydos.phonetic.double_metaphone
931
932
    These test cases are copied from two sources:
933
    https://github.com/oubiwann/metaphone/blob/master/metaphone/tests/test_metaphone.py
934
    and
935
    http://swoodbridge.com/DoubleMetaPhone/surnames.txt
936
937
    Most test cases other than those in test_surnames and test_surnames4 come
938
    from the former and are under the following license:
939
940
        Copyright (c) 2007 Andrew Collins, Chris Leong
941
        Copyright (c) 2009 Matthew Somerville
942
        Copyright (c) 2010 Maximillian Dornseif, Richard Barran
943
        Copyright (c) 2012 Duncan McGreggor
944
        All rights reserved.
945
946
         * Redistribution and use in source and binary forms, with or without
947
            modification, are permitted provided that the following conditions
948
            are met:
949
950
         * Redistributions of source code must retain the above copyright
951
             notice, this list of conditions and the following disclaimer.
952
953
         * Redistributions in binary form must reproduce the above copyright
954
            notice, this list of conditions and the following disclaimer in
955
            the documentation and/or other materials provided with the
956
            distribution.
957
958
        Neither the name "Metaphone" nor the names of its contributors may be
959
        used to endorse or promote products derived from this software without
960
        specific prior written permission.
961
962
        THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
963
        "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
964
        LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
965
        A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
966
        HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
967
        SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
968
        LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
969
        DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
970
        THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
971
        (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
972
        OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
973
974
    test_surname and test_surname4 come from a set of tests for a PHP port
975
    of Double Metaphone that is Copyright 2001, Stephen Woodbridge and
976
    identified as 'freely distributable'
977
    """
978
979
    def test_double_metaphone(self):
980
        """Test abydos.phonetic.double_metaphone."""
981
        # base case
982
        self.assertEqual(double_metaphone(''), ('', ''))
983
984
        # single result
985
        self.assertEqual(double_metaphone('aubrey'), ('APR', ''))
986
987
        # double result
988
        self.assertEqual(double_metaphone('richard'), ('RXRT', 'RKRT'))
989
990
        # general word list
991
        self.assertEqual(double_metaphone('Jose'), ('HS', ''))
992
        self.assertEqual(double_metaphone('cambrillo'), ('KMPRL', 'KMPR'))
993
        self.assertEqual(double_metaphone('otto'), ('AT', ''))
994
        self.assertEqual(double_metaphone('aubrey'), ('APR', ''))
995
        self.assertEqual(double_metaphone('maurice'), ('MRS', ''))
996
        self.assertEqual(double_metaphone('auto'), ('AT', ''))
997
        self.assertEqual(double_metaphone('maisey'), ('MS', ''))
998
        self.assertEqual(double_metaphone('catherine'), ('K0RN', 'KTRN'))
999
        self.assertEqual(double_metaphone('geoff'), ('JF', 'KF'))
1000
        self.assertEqual(double_metaphone('Chile'), ('XL', ''))
1001
        self.assertEqual(double_metaphone('katherine'), ('K0RN', 'KTRN'))
1002
        self.assertEqual(double_metaphone('steven'), ('STFN', ''))
1003
        self.assertEqual(double_metaphone('zhang'), ('JNK', ''))
1004
        self.assertEqual(double_metaphone('bob'), ('PP', ''))
1005
        self.assertEqual(double_metaphone('ray'), ('R', ''))
1006
        self.assertEqual(double_metaphone('Tux'), ('TKS', ''))
1007
        self.assertEqual(double_metaphone('bryan'), ('PRN', ''))
1008
        self.assertEqual(double_metaphone('bryce'), ('PRS', ''))
1009
        self.assertEqual(double_metaphone('Rapelje'), ('RPL', ''))
1010
        self.assertEqual(double_metaphone('richard'), ('RXRT', 'RKRT'))
1011
        self.assertEqual(double_metaphone('solilijs'), ('SLLS', ''))
1012
        self.assertEqual(double_metaphone('Dallas'), ('TLS', ''))
1013
        self.assertEqual(double_metaphone('Schwein'), ('XN', 'XFN'))
1014
        self.assertEqual(double_metaphone('dave'), ('TF', ''))
1015
        self.assertEqual(double_metaphone('eric'), ('ARK', ''))
1016
        self.assertEqual(double_metaphone('Parachute'), ('PRKT', ''))
1017
        self.assertEqual(double_metaphone('brian'), ('PRN', ''))
1018
        self.assertEqual(double_metaphone('randy'), ('RNT', ''))
1019
        self.assertEqual(double_metaphone('Through'), ('0R', 'TR'))
1020
        self.assertEqual(double_metaphone('Nowhere'), ('NR', ''))
1021
        self.assertEqual(double_metaphone('heidi'), ('HT', ''))
1022
        self.assertEqual(double_metaphone('Arnow'), ('ARN', 'ARNF'))
1023
        self.assertEqual(double_metaphone('Thumbail'), ('0MPL', 'TMPL'))
1024
1025
        # homophones
1026
        self.assertEqual(double_metaphone('tolled'), double_metaphone('told'))
1027
        self.assertEqual(double_metaphone('katherine'),
1028
                         double_metaphone('catherine'))
1029
        self.assertEqual(double_metaphone('brian'), double_metaphone('bryan'))
1030
1031
        # similar names
1032
        self.assertEqual(double_metaphone('Bartoš'), ('PRT', ''))
1033
        self.assertEqual(double_metaphone('Bartosz'), ('PRTS', 'PRTX'))
1034
        self.assertEqual(double_metaphone('Bartosch'), ('PRTX', ''))
1035
        self.assertEqual(double_metaphone('Bartos'), ('PRTS', ''))
1036
        self.assertEqual(list(set(double_metaphone('Jablonski'))
1037
                              .intersection(double_metaphone('Yablonsky'))),
1038
                         ['APLNSK'])
1039
        self.assertEqual(list(set(double_metaphone('Smith'))
1040
                              .intersection(double_metaphone('Schmidt'))),
1041
                         ['XMT'])
1042
1043
        # non-English Unicode
1044
        self.assertEqual(double_metaphone('andestādītu'), ('ANTSTTT', ''))
1045
1046
        # c-cedilla
1047
        self.assertEqual(double_metaphone('français'), ('FRNS', 'FRNSS'))
1048
        self.assertEqual(double_metaphone('garçon'), ('KRSN', ''))
1049
        self.assertEqual(double_metaphone('leçon'), ('LSN', ''))
1050
1051
        # German words
1052
        self.assertEqual(double_metaphone('ach'), ('AK', ''))
1053
        self.assertEqual(double_metaphone('bacher'), ('PKR', ''))
1054
        self.assertEqual(double_metaphone('macher'), ('MKR', ''))
1055
1056
        # Italian words
1057
        self.assertEqual(double_metaphone('bacci'), ('PX', ''))
1058
        self.assertEqual(double_metaphone('bertucci'), ('PRTX', ''))
1059
        self.assertEqual(double_metaphone('bellocchio'), ('PLX', ''))
1060
        self.assertEqual(double_metaphone('bacchus'), ('PKS', ''))
1061
        self.assertEqual(double_metaphone('focaccia'), ('FKX', ''))
1062
        self.assertEqual(double_metaphone('chianti'), ('KNT', ''))
1063
        self.assertEqual(double_metaphone('tagliaro'), ('TKLR', 'TLR'))
1064
        self.assertEqual(double_metaphone('biaggi'), ('PJ', 'PK'))
1065
1066
        # Spanish words
1067
        self.assertEqual(double_metaphone('bajador'), ('PJTR', 'PHTR'))
1068
        self.assertEqual(double_metaphone('cabrillo'), ('KPRL', 'KPR'))
1069
        self.assertEqual(double_metaphone('gallegos'), ('KLKS', 'KKS'))
1070
        self.assertEqual(double_metaphone('San Jacinto'), ('SNHSNT', ''))
1071
1072
        # French words
1073
        self.assertEqual(double_metaphone('rogier'), ('RJ', 'RJR'))
1074
        self.assertEqual(double_metaphone('breaux'), ('PR', ''))
1075
1076
        # Slavic words
1077
        self.assertEqual(double_metaphone('Wewski'), ('ASK', 'FFSK'))
1078
1079
        # Chinese words
1080
        self.assertEqual(double_metaphone('zhao'), ('J', ''))
1081
1082
        # Dutch-origin words
1083
        self.assertEqual(double_metaphone('school'), ('SKL', ''))
1084
        self.assertEqual(double_metaphone('schooner'), ('SKNR', ''))
1085
        self.assertEqual(double_metaphone('schermerhorn'),
1086
                         ('XRMRRN', 'SKRMRRN'))
1087
        self.assertEqual(double_metaphone('schenker'), ('XNKR', 'SKNKR'))
1088
1089
        # <ch> words
1090
        self.assertEqual(double_metaphone('Charac'), ('KRK', ''))
1091
        self.assertEqual(double_metaphone('Charis'), ('KRS', ''))
1092
        self.assertEqual(double_metaphone('chord'), ('KRT', ''))
1093
        self.assertEqual(double_metaphone('Chym'), ('KM', ''))
1094
        self.assertEqual(double_metaphone('Chia'), ('K', ''))
1095
        self.assertEqual(double_metaphone('chem'), ('KM', ''))
1096
        self.assertEqual(double_metaphone('chore'), ('XR', ''))
1097
        self.assertEqual(double_metaphone('orchestra'), ('ARKSTR', ''))
1098
        self.assertEqual(double_metaphone('architect'), ('ARKTKT', ''))
1099
        self.assertEqual(double_metaphone('orchid'), ('ARKT', ''))
1100
1101
        # <cc> words
1102
        self.assertEqual(double_metaphone('accident'), ('AKSTNT', ''))
1103
        self.assertEqual(double_metaphone('accede'), ('AKST', ''))
1104
        self.assertEqual(double_metaphone('succeed'), ('SKST', ''))
1105
1106
        # <mc> words
1107
        self.assertEqual(double_metaphone('mac caffrey'), ('MKFR', ''))
1108
        self.assertEqual(double_metaphone('mac gregor'), ('MKRKR', ''))
1109
        self.assertEqual(double_metaphone('mc crae'), ('MKR', ''))
1110
        self.assertEqual(double_metaphone('mcclain'), ('MKLN', ''))
1111
1112
        # <gh> words
1113
        self.assertEqual(double_metaphone('laugh'), ('LF', ''))
1114
        self.assertEqual(double_metaphone('cough'), ('KF', ''))
1115
        self.assertEqual(double_metaphone('rough'), ('RF', ''))
1116
1117
        # <g__> words
1118
        self.assertEqual(double_metaphone('gya'), ('K', 'J'))
1119
        self.assertEqual(double_metaphone('ges'), ('KS', 'JS'))
1120
        self.assertEqual(double_metaphone('gep'), ('KP', 'JP'))
1121
        self.assertEqual(double_metaphone('geb'), ('KP', 'JP'))
1122
        self.assertEqual(double_metaphone('gel'), ('KL', 'JL'))
1123
        self.assertEqual(double_metaphone('gey'), ('K', 'J'))
1124
        self.assertEqual(double_metaphone('gib'), ('KP', 'JP'))
1125
        self.assertEqual(double_metaphone('gil'), ('KL', 'JL'))
1126
        self.assertEqual(double_metaphone('gin'), ('KN', 'JN'))
1127
        self.assertEqual(double_metaphone('gie'), ('K', 'J'))
1128
        self.assertEqual(double_metaphone('gei'), ('K', 'J'))
1129
        self.assertEqual(double_metaphone('ger'), ('KR', 'JR'))
1130
        self.assertEqual(double_metaphone('danger'), ('TNJR', 'TNKR'))
1131
        self.assertEqual(double_metaphone('manager'), ('MNKR', 'MNJR'))
1132
        self.assertEqual(double_metaphone('dowager'), ('TKR', 'TJR'))
1133
1134
        # <pb> words
1135
        self.assertEqual(double_metaphone('Campbell'), ('KMPL', ''))
1136
        self.assertEqual(double_metaphone('raspberry'), ('RSPR', ''))
1137
1138
        # <th> words
1139
        self.assertEqual(double_metaphone('Thomas'), ('TMS', ''))
1140
        self.assertEqual(double_metaphone('Thames'), ('TMS', ''))
1141
1142
        # etc. (for code coverage)
1143
        self.assertEqual(double_metaphone('Xavier'), ('SF', 'SFR'))
1144
        self.assertEqual(double_metaphone('Michael'), ('MKL', 'MXL'))
1145
        self.assertEqual(double_metaphone('Ignacio'), ('AKNS', 'ANX'))
1146
        self.assertEqual(double_metaphone('Ajjam'), ('AJM', ''))
1147
        self.assertEqual(double_metaphone('Akkad'), ('AKT', ''))
1148
        self.assertEqual(double_metaphone('Año'), ('AN', ''))
1149
        self.assertEqual(double_metaphone('Año'), double_metaphone('Anno'))
1150
        self.assertEqual(double_metaphone('Caucasian'), ('KKSN', 'KKXN'))
1151
        self.assertEqual(double_metaphone('Kaukasian'), ('KKSN', ''))
1152
        self.assertEqual(double_metaphone('Zaqqum'), ('SKM', ''))
1153
        self.assertEqual(double_metaphone('stevven'), ('STFN', ''))
1154
        self.assertEqual(double_metaphone('Tuxx'), ('TKS', ''))
1155
        self.assertEqual(double_metaphone('Ghiradelli'), ('JRTL', ''))
1156
        self.assertEqual(double_metaphone('ghoul'), ('KL', ''))
1157
        self.assertEqual(double_metaphone('hej'), ('HJ', 'H'))
1158
1159
        # maxlength bounds tests
1160
        self.assertEqual(double_metaphone('Niall', maxlength=float('inf')),
1161
                         ('NL', ''))
1162
        self.assertEqual(double_metaphone('Niall', maxlength=None), ('NL', ''))
1163
        self.assertEqual(double_metaphone('Niall', maxlength=0), ('NL', ''))
1164
1165
    def test_double_metaphone_surnames(self):
1166
        """Test abydos.phonetic.double_metaphone (surname data)."""
1167
        self.assertEqual(double_metaphone(''), ('', ''))
1168
        self.assertEqual(double_metaphone('ALLERTON'), ('ALRTN', ''))
1169
        self.assertEqual(double_metaphone('Acton'), ('AKTN', ''))
1170
        self.assertEqual(double_metaphone('Adams'), ('ATMS', ''))
1171
        self.assertEqual(double_metaphone('Aggar'), ('AKR', ''))
1172
        self.assertEqual(double_metaphone('Ahl'), ('AL', ''))
1173
        self.assertEqual(double_metaphone('Aiken'), ('AKN', ''))
1174
        self.assertEqual(double_metaphone('Alan'), ('ALN', ''))
1175
        self.assertEqual(double_metaphone('Alcock'), ('ALKK', ''))
1176
        self.assertEqual(double_metaphone('Alden'), ('ALTN', ''))
1177
        self.assertEqual(double_metaphone('Aldham'), ('ALTM', ''))
1178
        self.assertEqual(double_metaphone('Allen'), ('ALN', ''))
1179
        self.assertEqual(double_metaphone('Allerton'), ('ALRTN', ''))
1180
        self.assertEqual(double_metaphone('Alsop'), ('ALSP', ''))
1181
        self.assertEqual(double_metaphone('Alwein'), ('ALN', ''))
1182
        self.assertEqual(double_metaphone('Ambler'), ('AMPLR', ''))
1183
        self.assertEqual(double_metaphone('Andevill'), ('ANTFL', ''))
1184
        self.assertEqual(double_metaphone('Andrews'), ('ANTRS', ''))
1185
        self.assertEqual(double_metaphone('Andreyco'), ('ANTRK', ''))
1186
        self.assertEqual(double_metaphone('Andriesse'), ('ANTRS', ''))
1187
        self.assertEqual(double_metaphone('Angier'), ('ANJ', 'ANJR'))
1188
        self.assertEqual(double_metaphone('Annabel'), ('ANPL', ''))
1189
        self.assertEqual(double_metaphone('Anne'), ('AN', ''))
1190
        self.assertEqual(double_metaphone('Anstye'), ('ANST', ''))
1191
        self.assertEqual(double_metaphone('Appling'), ('APLNK', ''))
1192
        self.assertEqual(double_metaphone('Apuke'), ('APK', ''))
1193
        self.assertEqual(double_metaphone('Arnold'), ('ARNLT', ''))
1194
        self.assertEqual(double_metaphone('Ashby'), ('AXP', ''))
1195
        self.assertEqual(double_metaphone('Astwood'), ('ASTT', ''))
1196
        self.assertEqual(double_metaphone('Atkinson'), ('ATKNSN', ''))
1197
        self.assertEqual(double_metaphone('Audley'), ('ATL', ''))
1198
        self.assertEqual(double_metaphone('Austin'), ('ASTN', ''))
1199
        self.assertEqual(double_metaphone('Avenal'), ('AFNL', ''))
1200
        self.assertEqual(double_metaphone('Ayer'), ('AR', ''))
1201
        self.assertEqual(double_metaphone('Ayot'), ('AT', ''))
1202
        self.assertEqual(double_metaphone('Babbitt'), ('PPT', ''))
1203
        self.assertEqual(double_metaphone('Bachelor'), ('PXLR', 'PKLR'))
1204
        self.assertEqual(double_metaphone('Bachelour'), ('PXLR', 'PKLR'))
1205
        self.assertEqual(double_metaphone('Bailey'), ('PL', ''))
1206
        self.assertEqual(double_metaphone('Baivel'), ('PFL', ''))
1207
        self.assertEqual(double_metaphone('Baker'), ('PKR', ''))
1208
        self.assertEqual(double_metaphone('Baldwin'), ('PLTN', ''))
1209
        self.assertEqual(double_metaphone('Balsley'), ('PLSL', ''))
1210
        self.assertEqual(double_metaphone('Barber'), ('PRPR', ''))
1211
        self.assertEqual(double_metaphone('Barker'), ('PRKR', ''))
1212
        self.assertEqual(double_metaphone('Barlow'), ('PRL', 'PRLF'))
1213
        self.assertEqual(double_metaphone('Barnard'), ('PRNRT', ''))
1214
        self.assertEqual(double_metaphone('Barnes'), ('PRNS', ''))
1215
        self.assertEqual(double_metaphone('Barnsley'), ('PRNSL', ''))
1216
        self.assertEqual(double_metaphone('Barouxis'), ('PRKSS', ''))
1217
        self.assertEqual(double_metaphone('Bartlet'), ('PRTLT', ''))
1218
        self.assertEqual(double_metaphone('Basley'), ('PSL', ''))
1219
        self.assertEqual(double_metaphone('Basset'), ('PST', ''))
1220
        self.assertEqual(double_metaphone('Bassett'), ('PST', ''))
1221
        self.assertEqual(double_metaphone('Batchlor'), ('PXLR', ''))
1222
        self.assertEqual(double_metaphone('Bates'), ('PTS', ''))
1223
        self.assertEqual(double_metaphone('Batson'), ('PTSN', ''))
1224
        self.assertEqual(double_metaphone('Bayes'), ('PS', ''))
1225
        self.assertEqual(double_metaphone('Bayley'), ('PL', ''))
1226
        self.assertEqual(double_metaphone('Beale'), ('PL', ''))
1227
        self.assertEqual(double_metaphone('Beauchamp'), ('PXMP', 'PKMP'))
1228
        self.assertEqual(double_metaphone('Beauclerc'), ('PKLRK', ''))
1229
        self.assertEqual(double_metaphone('Beech'), ('PK', ''))
1230
        self.assertEqual(double_metaphone('Beers'), ('PRS', ''))
1231
        self.assertEqual(double_metaphone('Beke'), ('PK', ''))
1232
        self.assertEqual(double_metaphone('Belcher'), ('PLXR', 'PLKR'))
1233
        self.assertEqual(double_metaphone('Benjamin'), ('PNJMN', ''))
1234
        self.assertEqual(double_metaphone('Benningham'), ('PNNKM', ''))
1235
        self.assertEqual(double_metaphone('Bereford'), ('PRFRT', ''))
1236
        self.assertEqual(double_metaphone('Bergen'), ('PRJN', 'PRKN'))
1237
        self.assertEqual(double_metaphone('Berkeley'), ('PRKL', ''))
1238
        self.assertEqual(double_metaphone('Berry'), ('PR', ''))
1239
        self.assertEqual(double_metaphone('Besse'), ('PS', ''))
1240
        self.assertEqual(double_metaphone('Bessey'), ('PS', ''))
1241
        self.assertEqual(double_metaphone('Bessiles'), ('PSLS', ''))
1242
        self.assertEqual(double_metaphone('Bigelow'), ('PJL', 'PKLF'))
1243
        self.assertEqual(double_metaphone('Bigg'), ('PK', ''))
1244
        self.assertEqual(double_metaphone('Bigod'), ('PKT', ''))
1245
        self.assertEqual(double_metaphone('Billings'), ('PLNKS', ''))
1246
        self.assertEqual(double_metaphone('Bimper'), ('PMPR', ''))
1247
        self.assertEqual(double_metaphone('Binker'), ('PNKR', ''))
1248
        self.assertEqual(double_metaphone('Birdsill'), ('PRTSL', ''))
1249
        self.assertEqual(double_metaphone('Bishop'), ('PXP', ''))
1250
        self.assertEqual(double_metaphone('Black'), ('PLK', ''))
1251
        self.assertEqual(double_metaphone('Blagge'), ('PLK', ''))
1252
        self.assertEqual(double_metaphone('Blake'), ('PLK', ''))
1253
        self.assertEqual(double_metaphone('Blanck'), ('PLNK', ''))
1254
        self.assertEqual(double_metaphone('Bledsoe'), ('PLTS', ''))
1255
        self.assertEqual(double_metaphone('Blennerhasset'), ('PLNRST', ''))
1256
        self.assertEqual(double_metaphone('Blessing'), ('PLSNK', ''))
1257
        self.assertEqual(double_metaphone('Blewett'), ('PLT', ''))
1258
        self.assertEqual(double_metaphone('Bloctgoed'), ('PLKTKT', ''))
1259
        self.assertEqual(double_metaphone('Bloetgoet'), ('PLTKT', ''))
1260
        self.assertEqual(double_metaphone('Bloodgood'), ('PLTKT', ''))
1261
        self.assertEqual(double_metaphone('Blossom'), ('PLSM', ''))
1262
        self.assertEqual(double_metaphone('Blount'), ('PLNT', ''))
1263
        self.assertEqual(double_metaphone('Bodine'), ('PTN', ''))
1264
        self.assertEqual(double_metaphone('Bodman'), ('PTMN', ''))
1265
        self.assertEqual(double_metaphone('BonCoeur'), ('PNKR', ''))
1266
        self.assertEqual(double_metaphone('Bond'), ('PNT', ''))
1267
        self.assertEqual(double_metaphone('Boscawen'), ('PSKN', ''))
1268
        self.assertEqual(double_metaphone('Bosworth'), ('PSR0', 'PSRT'))
1269
        self.assertEqual(double_metaphone('Bouchier'), ('PX', 'PKR'))
1270
        self.assertEqual(double_metaphone('Bowne'), ('PN', ''))
1271
        self.assertEqual(double_metaphone('Bradbury'), ('PRTPR', ''))
1272
        self.assertEqual(double_metaphone('Bradder'), ('PRTR', ''))
1273
        self.assertEqual(double_metaphone('Bradford'), ('PRTFRT', ''))
1274
        self.assertEqual(double_metaphone('Bradstreet'), ('PRTSTRT', ''))
1275
        self.assertEqual(double_metaphone('Braham'), ('PRHM', ''))
1276
        self.assertEqual(double_metaphone('Brailsford'), ('PRLSFRT', ''))
1277
        self.assertEqual(double_metaphone('Brainard'), ('PRNRT', ''))
1278
        self.assertEqual(double_metaphone('Brandish'), ('PRNTX', ''))
1279
        self.assertEqual(double_metaphone('Braun'), ('PRN', ''))
1280
        self.assertEqual(double_metaphone('Brecc'), ('PRK', ''))
1281
        self.assertEqual(double_metaphone('Brent'), ('PRNT', ''))
1282
        self.assertEqual(double_metaphone('Brenton'), ('PRNTN', ''))
1283
        self.assertEqual(double_metaphone('Briggs'), ('PRKS', ''))
1284
        self.assertEqual(double_metaphone('Brigham'), ('PRM', ''))
1285
        self.assertEqual(double_metaphone('Brobst'), ('PRPST', ''))
1286
        self.assertEqual(double_metaphone('Brome'), ('PRM', ''))
1287
        self.assertEqual(double_metaphone('Bronson'), ('PRNSN', ''))
1288
        self.assertEqual(double_metaphone('Brooks'), ('PRKS', ''))
1289
        self.assertEqual(double_metaphone('Brouillard'), ('PRLRT', ''))
1290
        self.assertEqual(double_metaphone('Brown'), ('PRN', ''))
1291
        self.assertEqual(double_metaphone('Browne'), ('PRN', ''))
1292
        self.assertEqual(double_metaphone('Brownell'), ('PRNL', ''))
1293
        self.assertEqual(double_metaphone('Bruley'), ('PRL', ''))
1294
        self.assertEqual(double_metaphone('Bryant'), ('PRNT', ''))
1295
        self.assertEqual(double_metaphone('Brzozowski'),
1296
                         ('PRSSSK', 'PRTSTSFSK'))
1297
        self.assertEqual(double_metaphone('Buide'), ('PT', ''))
1298
        self.assertEqual(double_metaphone('Bulmer'), ('PLMR', ''))
1299
        self.assertEqual(double_metaphone('Bunker'), ('PNKR', ''))
1300
        self.assertEqual(double_metaphone('Burden'), ('PRTN', ''))
1301
        self.assertEqual(double_metaphone('Burge'), ('PRJ', 'PRK'))
1302
        self.assertEqual(double_metaphone('Burgoyne'), ('PRKN', ''))
1303
        self.assertEqual(double_metaphone('Burke'), ('PRK', ''))
1304
        self.assertEqual(double_metaphone('Burnett'), ('PRNT', ''))
1305
        self.assertEqual(double_metaphone('Burpee'), ('PRP', ''))
1306
        self.assertEqual(double_metaphone('Bursley'), ('PRSL', ''))
1307
        self.assertEqual(double_metaphone('Burton'), ('PRTN', ''))
1308
        self.assertEqual(double_metaphone('Bushnell'), ('PXNL', ''))
1309
        self.assertEqual(double_metaphone('Buss'), ('PS', ''))
1310
        self.assertEqual(double_metaphone('Buswell'), ('PSL', ''))
1311
        self.assertEqual(double_metaphone('Butler'), ('PTLR', ''))
1312
        self.assertEqual(double_metaphone('Calkin'), ('KLKN', ''))
1313
        self.assertEqual(double_metaphone('Canada'), ('KNT', ''))
1314
        self.assertEqual(double_metaphone('Canmore'), ('KNMR', ''))
1315
        self.assertEqual(double_metaphone('Canney'), ('KN', ''))
1316
        self.assertEqual(double_metaphone('Capet'), ('KPT', ''))
1317
        self.assertEqual(double_metaphone('Card'), ('KRT', ''))
1318
        self.assertEqual(double_metaphone('Carman'), ('KRMN', ''))
1319
        self.assertEqual(double_metaphone('Carpenter'), ('KRPNTR', ''))
1320
        self.assertEqual(double_metaphone('Cartwright'), ('KRTRT', ''))
1321
        self.assertEqual(double_metaphone('Casey'), ('KS', ''))
1322
        self.assertEqual(double_metaphone('Catterfield'), ('KTRFLT', ''))
1323
        self.assertEqual(double_metaphone('Ceeley'), ('SL', ''))
1324
        self.assertEqual(double_metaphone('Chambers'), ('XMPRS', ''))
1325
        self.assertEqual(double_metaphone('Champion'), ('XMPN', ''))
1326
        self.assertEqual(double_metaphone('Chapman'), ('XPMN', ''))
1327
        self.assertEqual(double_metaphone('Chase'), ('XS', ''))
1328
        self.assertEqual(double_metaphone('Cheney'), ('XN', ''))
1329
        self.assertEqual(double_metaphone('Chetwynd'), ('XTNT', ''))
1330
        self.assertEqual(double_metaphone('Chevalier'), ('XFL', 'XFLR'))
1331
        self.assertEqual(double_metaphone('Chillingsworth'),
1332
                         ('XLNKSR0', 'XLNKSRT'))
1333
        self.assertEqual(double_metaphone('Christie'), ('KRST', ''))
1334
        self.assertEqual(double_metaphone('Chubbuck'), ('XPK', ''))
1335
        self.assertEqual(double_metaphone('Church'), ('XRX', 'XRK'))
1336
        self.assertEqual(double_metaphone('Clark'), ('KLRK', ''))
1337
        self.assertEqual(double_metaphone('Clarke'), ('KLRK', ''))
1338
        self.assertEqual(double_metaphone('Cleare'), ('KLR', ''))
1339
        self.assertEqual(double_metaphone('Clement'), ('KLMNT', ''))
1340
        self.assertEqual(double_metaphone('Clerke'), ('KLRK', ''))
1341
        self.assertEqual(double_metaphone('Clibben'), ('KLPN', ''))
1342
        self.assertEqual(double_metaphone('Clifford'), ('KLFRT', ''))
1343
        self.assertEqual(double_metaphone('Clivedon'), ('KLFTN', ''))
1344
        self.assertEqual(double_metaphone('Close'), ('KLS', ''))
1345
        self.assertEqual(double_metaphone('Clothilde'), ('KL0LT', 'KLTLT'))
1346
        self.assertEqual(double_metaphone('Cobb'), ('KP', ''))
1347
        self.assertEqual(double_metaphone('Coburn'), ('KPRN', ''))
1348
        self.assertEqual(double_metaphone('Coburne'), ('KPRN', ''))
1349
        self.assertEqual(double_metaphone('Cocke'), ('KK', ''))
1350
        self.assertEqual(double_metaphone('Coffin'), ('KFN', ''))
1351
        self.assertEqual(double_metaphone('Coffyn'), ('KFN', ''))
1352
        self.assertEqual(double_metaphone('Colborne'), ('KLPRN', ''))
1353
        self.assertEqual(double_metaphone('Colby'), ('KLP', ''))
1354
        self.assertEqual(double_metaphone('Cole'), ('KL', ''))
1355
        self.assertEqual(double_metaphone('Coleman'), ('KLMN', ''))
1356
        self.assertEqual(double_metaphone('Collier'), ('KL', 'KLR'))
1357
        self.assertEqual(double_metaphone('Compton'), ('KMPTN', ''))
1358
        self.assertEqual(double_metaphone('Cone'), ('KN', ''))
1359
        self.assertEqual(double_metaphone('Cook'), ('KK', ''))
1360
        self.assertEqual(double_metaphone('Cooke'), ('KK', ''))
1361
        self.assertEqual(double_metaphone('Cooper'), ('KPR', ''))
1362
        self.assertEqual(double_metaphone('Copperthwaite'), ('KPR0T', 'KPRTT'))
1363
        self.assertEqual(double_metaphone('Corbet'), ('KRPT', ''))
1364
        self.assertEqual(double_metaphone('Corell'), ('KRL', ''))
1365
        self.assertEqual(double_metaphone('Corey'), ('KR', ''))
1366
        self.assertEqual(double_metaphone('Corlies'), ('KRLS', ''))
1367
        self.assertEqual(double_metaphone('Corneliszen'), ('KRNLSN', 'KRNLXN'))
1368
        self.assertEqual(double_metaphone('Cornelius'), ('KRNLS', ''))
1369
        self.assertEqual(double_metaphone('Cornwallis'), ('KRNLS', ''))
1370
        self.assertEqual(double_metaphone('Cosgrove'), ('KSKRF', ''))
1371
        self.assertEqual(double_metaphone('Count of Brionne'), ('KNTFPRN', ''))
1372
        self.assertEqual(double_metaphone('Covill'), ('KFL', ''))
1373
        self.assertEqual(double_metaphone('Cowperthwaite'), ('KPR0T', 'KPRTT'))
1374
        self.assertEqual(double_metaphone('Cowperwaite'), ('KPRT', ''))
1375
        self.assertEqual(double_metaphone('Crane'), ('KRN', ''))
1376
        self.assertEqual(double_metaphone('Creagmile'), ('KRKML', ''))
1377
        self.assertEqual(double_metaphone('Crew'), ('KR', 'KRF'))
1378
        self.assertEqual(double_metaphone('Crispin'), ('KRSPN', ''))
1379
        self.assertEqual(double_metaphone('Crocker'), ('KRKR', ''))
1380
        self.assertEqual(double_metaphone('Crockett'), ('KRKT', ''))
1381
        self.assertEqual(double_metaphone('Crosby'), ('KRSP', ''))
1382
        self.assertEqual(double_metaphone('Crump'), ('KRMP', ''))
1383
        self.assertEqual(double_metaphone('Cunningham'), ('KNNKM', ''))
1384
        self.assertEqual(double_metaphone('Curtis'), ('KRTS', ''))
1385
        self.assertEqual(double_metaphone('Cutha'), ('K0', 'KT'))
1386
        self.assertEqual(double_metaphone('Cutter'), ('KTR', ''))
1387
        self.assertEqual(double_metaphone('D\'Aubigny'), ('TPN', 'TPKN'))
1388
        self.assertEqual(double_metaphone('DAVIS'), ('TFS', ''))
1389
        self.assertEqual(double_metaphone('Dabinott'), ('TPNT', ''))
1390
        self.assertEqual(double_metaphone('Dacre'), ('TKR', ''))
1391
        self.assertEqual(double_metaphone('Daggett'), ('TKT', ''))
1392
        self.assertEqual(double_metaphone('Danvers'), ('TNFRS', ''))
1393
        self.assertEqual(double_metaphone('Darcy'), ('TRS', ''))
1394
        self.assertEqual(double_metaphone('Davis'), ('TFS', ''))
1395
        self.assertEqual(double_metaphone('Dawn'), ('TN', ''))
1396
        self.assertEqual(double_metaphone('Dawson'), ('TSN', ''))
1397
        self.assertEqual(double_metaphone('Day'), ('T', ''))
1398
        self.assertEqual(double_metaphone('Daye'), ('T', ''))
1399
        self.assertEqual(double_metaphone('DeGrenier'), ('TKRN', 'TKRNR'))
1400
        self.assertEqual(double_metaphone('Dean'), ('TN', ''))
1401
        self.assertEqual(double_metaphone('Deekindaugh'), ('TKNT', ''))
1402
        self.assertEqual(double_metaphone('Dennis'), ('TNS', ''))
1403
        self.assertEqual(double_metaphone('Denny'), ('TN', ''))
1404
        self.assertEqual(double_metaphone('Denton'), ('TNTN', ''))
1405
        self.assertEqual(double_metaphone('Desborough'), ('TSPRF', ''))
1406
        self.assertEqual(double_metaphone('Despenser'), ('TSPNSR', ''))
1407
        self.assertEqual(double_metaphone('Deverill'), ('TFRL', ''))
1408
        self.assertEqual(double_metaphone('Devine'), ('TFN', ''))
1409
        self.assertEqual(double_metaphone('Dexter'), ('TKSTR', ''))
1410
        self.assertEqual(double_metaphone('Dillaway'), ('TL', ''))
1411
        self.assertEqual(double_metaphone('Dimmick'), ('TMK', ''))
1412
        self.assertEqual(double_metaphone('Dinan'), ('TNN', ''))
1413
        self.assertEqual(double_metaphone('Dix'), ('TKS', ''))
1414
        self.assertEqual(double_metaphone('Doggett'), ('TKT', ''))
1415
        self.assertEqual(double_metaphone('Donahue'), ('TNH', ''))
1416
        self.assertEqual(double_metaphone('Dorfman'), ('TRFMN', ''))
1417
        self.assertEqual(double_metaphone('Dorris'), ('TRS', ''))
1418
        self.assertEqual(double_metaphone('Dow'), ('T', 'TF'))
1419
        self.assertEqual(double_metaphone('Downey'), ('TN', ''))
1420
        self.assertEqual(double_metaphone('Downing'), ('TNNK', ''))
1421
        self.assertEqual(double_metaphone('Dowsett'), ('TST', ''))
1422
        self.assertEqual(double_metaphone('Duck?'), ('TK', ''))
1423
        self.assertEqual(double_metaphone('Dudley'), ('TTL', ''))
1424
        self.assertEqual(double_metaphone('Duffy'), ('TF', ''))
1425
        self.assertEqual(double_metaphone('Dunn'), ('TN', ''))
1426
        self.assertEqual(double_metaphone('Dunsterville'), ('TNSTRFL', ''))
1427
        self.assertEqual(double_metaphone('Durrant'), ('TRNT', ''))
1428
        self.assertEqual(double_metaphone('Durrin'), ('TRN', ''))
1429
        self.assertEqual(double_metaphone('Dustin'), ('TSTN', ''))
1430
        self.assertEqual(double_metaphone('Duston'), ('TSTN', ''))
1431
        self.assertEqual(double_metaphone('Eames'), ('AMS', ''))
1432
        self.assertEqual(double_metaphone('Early'), ('ARL', ''))
1433
        self.assertEqual(double_metaphone('Easty'), ('AST', ''))
1434
        self.assertEqual(double_metaphone('Ebbett'), ('APT', ''))
1435
        self.assertEqual(double_metaphone('Eberbach'), ('APRPK', ''))
1436
        self.assertEqual(double_metaphone('Eberhard'), ('APRRT', ''))
1437
        self.assertEqual(double_metaphone('Eddy'), ('AT', ''))
1438
        self.assertEqual(double_metaphone('Edenden'), ('ATNTN', ''))
1439
        self.assertEqual(double_metaphone('Edwards'), ('ATRTS', ''))
1440
        self.assertEqual(double_metaphone('Eglinton'), ('AKLNTN', 'ALNTN'))
1441
        self.assertEqual(double_metaphone('Eliot'), ('ALT', ''))
1442
        self.assertEqual(double_metaphone('Elizabeth'), ('ALSP0', 'ALSPT'))
1443
        self.assertEqual(double_metaphone('Ellis'), ('ALS', ''))
1444
        self.assertEqual(double_metaphone('Ellison'), ('ALSN', ''))
1445
        self.assertEqual(double_metaphone('Ellot'), ('ALT', ''))
1446
        self.assertEqual(double_metaphone('Elny'), ('ALN', ''))
1447
        self.assertEqual(double_metaphone('Elsner'), ('ALSNR', ''))
1448
        self.assertEqual(double_metaphone('Emerson'), ('AMRSN', ''))
1449
        self.assertEqual(double_metaphone('Empson'), ('AMPSN', ''))
1450
        self.assertEqual(double_metaphone('Est'), ('AST', ''))
1451
        self.assertEqual(double_metaphone('Estabrook'), ('ASTPRK', ''))
1452
        self.assertEqual(double_metaphone('Estes'), ('ASTS', ''))
1453
        self.assertEqual(double_metaphone('Estey'), ('AST', ''))
1454
        self.assertEqual(double_metaphone('Evans'), ('AFNS', ''))
1455
        self.assertEqual(double_metaphone('Fallowell'), ('FLL', ''))
1456
        self.assertEqual(double_metaphone('Farnsworth'), ('FRNSR0', 'FRNSRT'))
1457
        self.assertEqual(double_metaphone('Feake'), ('FK', ''))
1458
        self.assertEqual(double_metaphone('Feke'), ('FK', ''))
1459
        self.assertEqual(double_metaphone('Fellows'), ('FLS', ''))
1460
        self.assertEqual(double_metaphone('Fettiplace'), ('FTPLS', ''))
1461
        self.assertEqual(double_metaphone('Finney'), ('FN', ''))
1462
        self.assertEqual(double_metaphone('Fischer'), ('FXR', 'FSKR'))
1463
        self.assertEqual(double_metaphone('Fisher'), ('FXR', ''))
1464
        self.assertEqual(double_metaphone('Fisk'), ('FSK', ''))
1465
        self.assertEqual(double_metaphone('Fiske'), ('FSK', ''))
1466
        self.assertEqual(double_metaphone('Fletcher'), ('FLXR', ''))
1467
        self.assertEqual(double_metaphone('Folger'), ('FLKR', 'FLJR'))
1468
        self.assertEqual(double_metaphone('Foliot'), ('FLT', ''))
1469
        self.assertEqual(double_metaphone('Folyot'), ('FLT', ''))
1470
        self.assertEqual(double_metaphone('Fones'), ('FNS', ''))
1471
        self.assertEqual(double_metaphone('Fordham'), ('FRTM', ''))
1472
        self.assertEqual(double_metaphone('Forstner'), ('FRSTNR', ''))
1473
        self.assertEqual(double_metaphone('Fosten'), ('FSTN', ''))
1474
        self.assertEqual(double_metaphone('Foster'), ('FSTR', ''))
1475
        self.assertEqual(double_metaphone('Foulke'), ('FLK', ''))
1476
        self.assertEqual(double_metaphone('Fowler'), ('FLR', ''))
1477
        self.assertEqual(double_metaphone('Foxwell'), ('FKSL', ''))
1478
        self.assertEqual(double_metaphone('Fraley'), ('FRL', ''))
1479
        self.assertEqual(double_metaphone('Franceys'), ('FRNSS', ''))
1480
        self.assertEqual(double_metaphone('Franke'), ('FRNK', ''))
1481
        self.assertEqual(double_metaphone('Frascella'), ('FRSL', ''))
1482
        self.assertEqual(double_metaphone('Frazer'), ('FRSR', ''))
1483
        self.assertEqual(double_metaphone('Fredd'), ('FRT', ''))
1484
        self.assertEqual(double_metaphone('Freeman'), ('FRMN', ''))
1485
        self.assertEqual(double_metaphone('French'), ('FRNX', 'FRNK'))
1486
        self.assertEqual(double_metaphone('Freville'), ('FRFL', ''))
1487
        self.assertEqual(double_metaphone('Frey'), ('FR', ''))
1488
        self.assertEqual(double_metaphone('Frick'), ('FRK', ''))
1489
        self.assertEqual(double_metaphone('Frier'), ('FR', 'FRR'))
1490
        self.assertEqual(double_metaphone('Froe'), ('FR', ''))
1491
        self.assertEqual(double_metaphone('Frorer'), ('FRRR', ''))
1492
        self.assertEqual(double_metaphone('Frost'), ('FRST', ''))
1493
        self.assertEqual(double_metaphone('Frothingham'), ('FR0NKM', 'FRTNKM'))
1494
        self.assertEqual(double_metaphone('Fry'), ('FR', ''))
1495
        self.assertEqual(double_metaphone('Gaffney'), ('KFN', ''))
1496
        self.assertEqual(double_metaphone('Gage'), ('KJ', 'KK'))
1497
        self.assertEqual(double_metaphone('Gallion'), ('KLN', ''))
1498
        self.assertEqual(double_metaphone('Gallishan'), ('KLXN', ''))
1499
        self.assertEqual(double_metaphone('Gamble'), ('KMPL', ''))
1500
        self.assertEqual(double_metaphone('Garbrand'), ('KRPRNT', ''))
1501
        self.assertEqual(double_metaphone('Gardner'), ('KRTNR', ''))
1502
        self.assertEqual(double_metaphone('Garrett'), ('KRT', ''))
1503
        self.assertEqual(double_metaphone('Gassner'), ('KSNR', ''))
1504
        self.assertEqual(double_metaphone('Gater'), ('KTR', ''))
1505
        self.assertEqual(double_metaphone('Gaunt'), ('KNT', ''))
1506
        self.assertEqual(double_metaphone('Gayer'), ('KR', ''))
1507
        self.assertEqual(double_metaphone('Gerken'), ('KRKN', 'JRKN'))
1508
        self.assertEqual(double_metaphone('Gerritsen'), ('KRTSN', 'JRTSN'))
1509
        self.assertEqual(double_metaphone('Gibbs'), ('KPS', 'JPS'))
1510
        self.assertEqual(double_metaphone('Giffard'), ('JFRT', 'KFRT'))
1511
        self.assertEqual(double_metaphone('Gilbert'), ('KLPRT', 'JLPRT'))
1512
        self.assertEqual(double_metaphone('Gill'), ('KL', 'JL'))
1513
        self.assertEqual(double_metaphone('Gilman'), ('KLMN', 'JLMN'))
1514
        self.assertEqual(double_metaphone('Glass'), ('KLS', ''))
1515
        self.assertEqual(double_metaphone('GoddardGifford'), ('KTRJFRT', ''))
1516
        self.assertEqual(double_metaphone('Godfrey'), ('KTFR', ''))
1517
        self.assertEqual(double_metaphone('Godwin'), ('KTN', ''))
1518
        self.assertEqual(double_metaphone('Goodale'), ('KTL', ''))
1519
        self.assertEqual(double_metaphone('Goodnow'), ('KTN', 'KTNF'))
1520
        self.assertEqual(double_metaphone('Gorham'), ('KRM', ''))
1521
        self.assertEqual(double_metaphone('Goseline'), ('KSLN', ''))
1522
        self.assertEqual(double_metaphone('Gott'), ('KT', ''))
1523
        self.assertEqual(double_metaphone('Gould'), ('KLT', ''))
1524
        self.assertEqual(double_metaphone('Grafton'), ('KRFTN', ''))
1525
        self.assertEqual(double_metaphone('Grant'), ('KRNT', ''))
1526
        self.assertEqual(double_metaphone('Gray'), ('KR', ''))
1527
        self.assertEqual(double_metaphone('Green'), ('KRN', ''))
1528
        self.assertEqual(double_metaphone('Griffin'), ('KRFN', ''))
1529
        self.assertEqual(double_metaphone('Grill'), ('KRL', ''))
1530
        self.assertEqual(double_metaphone('Grim'), ('KRM', ''))
1531
        self.assertEqual(double_metaphone('Grisgonelle'), ('KRSKNL', ''))
1532
        self.assertEqual(double_metaphone('Gross'), ('KRS', ''))
1533
        self.assertEqual(double_metaphone('Guba'), ('KP', ''))
1534
        self.assertEqual(double_metaphone('Gybbes'), ('KPS', 'JPS'))
1535
        self.assertEqual(double_metaphone('Haburne'), ('HPRN', ''))
1536
        self.assertEqual(double_metaphone('Hackburne'), ('HKPRN', ''))
1537
        self.assertEqual(double_metaphone('Haddon?'), ('HTN', ''))
1538
        self.assertEqual(double_metaphone('Haines'), ('HNS', ''))
1539
        self.assertEqual(double_metaphone('Hale'), ('HL', ''))
1540
        self.assertEqual(double_metaphone('Hall'), ('HL', ''))
1541
        self.assertEqual(double_metaphone('Hallet'), ('HLT', ''))
1542
        self.assertEqual(double_metaphone('Hallock'), ('HLK', ''))
1543
        self.assertEqual(double_metaphone('Halstead'), ('HLSTT', ''))
1544
        self.assertEqual(double_metaphone('Hammond'), ('HMNT', ''))
1545
        self.assertEqual(double_metaphone('Hance'), ('HNS', ''))
1546
        self.assertEqual(double_metaphone('Handy'), ('HNT', ''))
1547
        self.assertEqual(double_metaphone('Hanson'), ('HNSN', ''))
1548
        self.assertEqual(double_metaphone('Harasek'), ('HRSK', ''))
1549
        self.assertEqual(double_metaphone('Harcourt'), ('HRKRT', ''))
1550
        self.assertEqual(double_metaphone('Hardy'), ('HRT', ''))
1551
        self.assertEqual(double_metaphone('Harlock'), ('HRLK', ''))
1552
        self.assertEqual(double_metaphone('Harris'), ('HRS', ''))
1553
        self.assertEqual(double_metaphone('Hartley'), ('HRTL', ''))
1554
        self.assertEqual(double_metaphone('Harvey'), ('HRF', ''))
1555
        self.assertEqual(double_metaphone('Harvie'), ('HRF', ''))
1556
        self.assertEqual(double_metaphone('Harwood'), ('HRT', ''))
1557
        self.assertEqual(double_metaphone('Hathaway'), ('H0', 'HT'))
1558
        self.assertEqual(double_metaphone('Haukeness'), ('HKNS', ''))
1559
        self.assertEqual(double_metaphone('Hawkes'), ('HKS', ''))
1560
        self.assertEqual(double_metaphone('Hawkhurst'), ('HKRST', ''))
1561
        self.assertEqual(double_metaphone('Hawkins'), ('HKNS', ''))
1562
        self.assertEqual(double_metaphone('Hawley'), ('HL', ''))
1563
        self.assertEqual(double_metaphone('Heald'), ('HLT', ''))
1564
        self.assertEqual(double_metaphone('Helsdon'), ('HLSTN', ''))
1565
        self.assertEqual(double_metaphone('Hemenway'), ('HMN', ''))
1566
        self.assertEqual(double_metaphone('Hemmenway'), ('HMN', ''))
1567
        self.assertEqual(double_metaphone('Henck'), ('HNK', ''))
1568
        self.assertEqual(double_metaphone('Henderson'), ('HNTRSN', ''))
1569
        self.assertEqual(double_metaphone('Hendricks'), ('HNTRKS', ''))
1570
        self.assertEqual(double_metaphone('Hersey'), ('HRS', ''))
1571
        self.assertEqual(double_metaphone('Hewes'), ('HS', ''))
1572
        self.assertEqual(double_metaphone('Heyman'), ('HMN', ''))
1573
        self.assertEqual(double_metaphone('Hicks'), ('HKS', ''))
1574
        self.assertEqual(double_metaphone('Hidden'), ('HTN', ''))
1575
        self.assertEqual(double_metaphone('Higgs'), ('HKS', ''))
1576
        self.assertEqual(double_metaphone('Hill'), ('HL', ''))
1577
        self.assertEqual(double_metaphone('Hills'), ('HLS', ''))
1578
        self.assertEqual(double_metaphone('Hinckley'), ('HNKL', ''))
1579
        self.assertEqual(double_metaphone('Hipwell'), ('HPL', ''))
1580
        self.assertEqual(double_metaphone('Hobart'), ('HPRT', ''))
1581
        self.assertEqual(double_metaphone('Hoben'), ('HPN', ''))
1582
        self.assertEqual(double_metaphone('Hoffmann'), ('HFMN', ''))
1583
        self.assertEqual(double_metaphone('Hogan'), ('HKN', ''))
1584
        self.assertEqual(double_metaphone('Holmes'), ('HLMS', ''))
1585
        self.assertEqual(double_metaphone('Hoo'), ('H', ''))
1586
        self.assertEqual(double_metaphone('Hooker'), ('HKR', ''))
1587
        self.assertEqual(double_metaphone('Hopcott'), ('HPKT', ''))
1588
        self.assertEqual(double_metaphone('Hopkins'), ('HPKNS', ''))
1589
        self.assertEqual(double_metaphone('Hopkinson'), ('HPKNSN', ''))
1590
        self.assertEqual(double_metaphone('Hornsey'), ('HRNS', ''))
1591
        self.assertEqual(double_metaphone('Houckgeest'), ('HKJST', 'HKKST'))
1592
        self.assertEqual(double_metaphone('Hough'), ('H', ''))
1593
        self.assertEqual(double_metaphone('Houstin'), ('HSTN', ''))
1594
        self.assertEqual(double_metaphone('How'), ('H', 'HF'))
1595
        self.assertEqual(double_metaphone('Howe'), ('H', ''))
1596
        self.assertEqual(double_metaphone('Howland'), ('HLNT', ''))
1597
        self.assertEqual(double_metaphone('Hubner'), ('HPNR', ''))
1598
        self.assertEqual(double_metaphone('Hudnut'), ('HTNT', ''))
1599
        self.assertEqual(double_metaphone('Hughes'), ('HS', ''))
1600
        self.assertEqual(double_metaphone('Hull'), ('HL', ''))
1601
        self.assertEqual(double_metaphone('Hulme'), ('HLM', ''))
1602
        self.assertEqual(double_metaphone('Hume'), ('HM', ''))
1603
        self.assertEqual(double_metaphone('Hundertumark'), ('HNTRTMRK', ''))
1604
        self.assertEqual(double_metaphone('Hundley'), ('HNTL', ''))
1605
        self.assertEqual(double_metaphone('Hungerford'),
1606
                         ('HNKRFRT', 'HNJRFRT'))
1607
        self.assertEqual(double_metaphone('Hunt'), ('HNT', ''))
1608
        self.assertEqual(double_metaphone('Hurst'), ('HRST', ''))
1609
        self.assertEqual(double_metaphone('Husbands'), ('HSPNTS', ''))
1610
        self.assertEqual(double_metaphone('Hussey'), ('HS', ''))
1611
        self.assertEqual(double_metaphone('Husted'), ('HSTT', ''))
1612
        self.assertEqual(double_metaphone('Hutchins'), ('HXNS', ''))
1613
        self.assertEqual(double_metaphone('Hutchinson'), ('HXNSN', ''))
1614
        self.assertEqual(double_metaphone('Huttinger'), ('HTNKR', 'HTNJR'))
1615
        self.assertEqual(double_metaphone('Huybertsen'), ('HPRTSN', ''))
1616
        self.assertEqual(double_metaphone('Iddenden'), ('ATNTN', ''))
1617
        self.assertEqual(double_metaphone('Ingraham'), ('ANKRHM', ''))
1618
        self.assertEqual(double_metaphone('Ives'), ('AFS', ''))
1619
        self.assertEqual(double_metaphone('Jackson'), ('JKSN', 'AKSN'))
1620
        self.assertEqual(double_metaphone('Jacob'), ('JKP', 'AKP'))
1621
        self.assertEqual(double_metaphone('Jans'), ('JNS', 'ANS'))
1622
        self.assertEqual(double_metaphone('Jenkins'), ('JNKNS', 'ANKNS'))
1623
        self.assertEqual(double_metaphone('Jewett'), ('JT', 'AT'))
1624
        self.assertEqual(double_metaphone('Jewitt'), ('JT', 'AT'))
1625
        self.assertEqual(double_metaphone('Johnson'), ('JNSN', 'ANSN'))
1626
        self.assertEqual(double_metaphone('Jones'), ('JNS', 'ANS'))
1627
        self.assertEqual(double_metaphone('Josephine'), ('JSFN', 'HSFN'))
1628
        self.assertEqual(double_metaphone('Judd'), ('JT', 'AT'))
1629
        self.assertEqual(double_metaphone('June'), ('JN', 'AN'))
1630
        self.assertEqual(double_metaphone('Kamarowska'), ('KMRSK', ''))
1631
        self.assertEqual(double_metaphone('Kay'), ('K', ''))
1632
        self.assertEqual(double_metaphone('Kelley'), ('KL', ''))
1633
        self.assertEqual(double_metaphone('Kelly'), ('KL', ''))
1634
        self.assertEqual(double_metaphone('Keymber'), ('KMPR', ''))
1635
        self.assertEqual(double_metaphone('Keynes'), ('KNS', ''))
1636
        self.assertEqual(double_metaphone('Kilham'), ('KLM', ''))
1637
        self.assertEqual(double_metaphone('Kim'), ('KM', ''))
1638
        self.assertEqual(double_metaphone('Kimball'), ('KMPL', ''))
1639
        self.assertEqual(double_metaphone('King'), ('KNK', ''))
1640
        self.assertEqual(double_metaphone('Kinsey'), ('KNS', ''))
1641
        self.assertEqual(double_metaphone('Kirk'), ('KRK', ''))
1642
        self.assertEqual(double_metaphone('Kirton'), ('KRTN', ''))
1643
        self.assertEqual(double_metaphone('Kistler'), ('KSTLR', ''))
1644
        self.assertEqual(double_metaphone('Kitchen'), ('KXN', ''))
1645
        self.assertEqual(double_metaphone('Kitson'), ('KTSN', ''))
1646
        self.assertEqual(double_metaphone('Klett'), ('KLT', ''))
1647
        self.assertEqual(double_metaphone('Kline'), ('KLN', ''))
1648
        self.assertEqual(double_metaphone('Knapp'), ('NP', ''))
1649
        self.assertEqual(double_metaphone('Knight'), ('NT', ''))
1650
        self.assertEqual(double_metaphone('Knote'), ('NT', ''))
1651
        self.assertEqual(double_metaphone('Knott'), ('NT', ''))
1652
        self.assertEqual(double_metaphone('Knox'), ('NKS', ''))
1653
        self.assertEqual(double_metaphone('Koeller'), ('KLR', ''))
1654
        self.assertEqual(double_metaphone('La Pointe'), ('LPNT', ''))
1655
        self.assertEqual(double_metaphone('LaPlante'), ('LPLNT', ''))
1656
        self.assertEqual(double_metaphone('Laimbeer'), ('LMPR', ''))
1657
        self.assertEqual(double_metaphone('Lamb'), ('LMP', ''))
1658
        self.assertEqual(double_metaphone('Lambertson'), ('LMPRTSN', ''))
1659
        self.assertEqual(double_metaphone('Lancto'), ('LNKT', ''))
1660
        self.assertEqual(double_metaphone('Landry'), ('LNTR', ''))
1661
        self.assertEqual(double_metaphone('Lane'), ('LN', ''))
1662
        self.assertEqual(double_metaphone('Langendyck'), ('LNJNTK', 'LNKNTK'))
1663
        self.assertEqual(double_metaphone('Langer'), ('LNKR', 'LNJR'))
1664
        self.assertEqual(double_metaphone('Langford'), ('LNKFRT', ''))
1665
        self.assertEqual(double_metaphone('Lantersee'), ('LNTRS', ''))
1666
        self.assertEqual(double_metaphone('Laquer'), ('LKR', ''))
1667
        self.assertEqual(double_metaphone('Larkin'), ('LRKN', ''))
1668
        self.assertEqual(double_metaphone('Latham'), ('LTM', ''))
1669
        self.assertEqual(double_metaphone('Lathrop'), ('L0RP', 'LTRP'))
1670
        self.assertEqual(double_metaphone('Lauter'), ('LTR', ''))
1671
        self.assertEqual(double_metaphone('Lawrence'), ('LRNS', ''))
1672
        self.assertEqual(double_metaphone('Leach'), ('LK', ''))
1673
        self.assertEqual(double_metaphone('Leager'), ('LKR', 'LJR'))
1674
        self.assertEqual(double_metaphone('Learned'), ('LRNT', ''))
1675
        self.assertEqual(double_metaphone('Leavitt'), ('LFT', ''))
1676
        self.assertEqual(double_metaphone('Lee'), ('L', ''))
1677
        self.assertEqual(double_metaphone('Leete'), ('LT', ''))
1678
        self.assertEqual(double_metaphone('Leggett'), ('LKT', ''))
1679
        self.assertEqual(double_metaphone('Leland'), ('LLNT', ''))
1680
        self.assertEqual(double_metaphone('Leonard'), ('LNRT', ''))
1681
        self.assertEqual(double_metaphone('Lester'), ('LSTR', ''))
1682
        self.assertEqual(double_metaphone('Lestrange'), ('LSTRNJ', 'LSTRNK'))
1683
        self.assertEqual(double_metaphone('Lethem'), ('L0M', 'LTM'))
1684
        self.assertEqual(double_metaphone('Levine'), ('LFN', ''))
1685
        self.assertEqual(double_metaphone('Lewes'), ('LS', ''))
1686
        self.assertEqual(double_metaphone('Lewis'), ('LS', ''))
1687
        self.assertEqual(double_metaphone('Lincoln'), ('LNKLN', ''))
1688
        self.assertEqual(double_metaphone('Lindsey'), ('LNTS', ''))
1689
        self.assertEqual(double_metaphone('Linher'), ('LNR', ''))
1690
        self.assertEqual(double_metaphone('Lippet'), ('LPT', ''))
1691
        self.assertEqual(double_metaphone('Lippincott'), ('LPNKT', ''))
1692
        self.assertEqual(double_metaphone('Lockwood'), ('LKT', ''))
1693
        self.assertEqual(double_metaphone('Loines'), ('LNS', ''))
1694
        self.assertEqual(double_metaphone('Lombard'), ('LMPRT', ''))
1695
        self.assertEqual(double_metaphone('Long'), ('LNK', ''))
1696
        self.assertEqual(double_metaphone('Longespee'), ('LNJSP', 'LNKSP'))
1697
        self.assertEqual(double_metaphone('Look'), ('LK', ''))
1698
        self.assertEqual(double_metaphone('Lounsberry'), ('LNSPR', ''))
1699
        self.assertEqual(double_metaphone('Lounsbury'), ('LNSPR', ''))
1700
        self.assertEqual(double_metaphone('Louthe'), ('L0', 'LT'))
1701
        self.assertEqual(double_metaphone('Loveyne'), ('LFN', ''))
1702
        self.assertEqual(double_metaphone('Lowe'), ('L', ''))
1703
        self.assertEqual(double_metaphone('Ludlam'), ('LTLM', ''))
1704
        self.assertEqual(double_metaphone('Lumbard'), ('LMPRT', ''))
1705
        self.assertEqual(double_metaphone('Lund'), ('LNT', ''))
1706
        self.assertEqual(double_metaphone('Luno'), ('LN', ''))
1707
        self.assertEqual(double_metaphone('Lutz'), ('LTS', ''))
1708
        self.assertEqual(double_metaphone('Lydia'), ('LT', ''))
1709
        self.assertEqual(double_metaphone('Lynne'), ('LN', ''))
1710
        self.assertEqual(double_metaphone('Lyon'), ('LN', ''))
1711
        self.assertEqual(double_metaphone('MacAlpin'), ('MKLPN', ''))
1712
        self.assertEqual(double_metaphone('MacBricc'), ('MKPRK', ''))
1713
        self.assertEqual(double_metaphone('MacCrinan'), ('MKRNN', ''))
1714
        self.assertEqual(double_metaphone('MacKenneth'), ('MKN0', 'MKNT'))
1715
        self.assertEqual(double_metaphone('MacMael nam Bo'), ('MKMLNMP', ''))
1716
        self.assertEqual(double_metaphone('MacMurchada'), ('MKMRXT', 'MKMRKT'))
1717
        self.assertEqual(double_metaphone('Macomber'), ('MKMPR', ''))
1718
        self.assertEqual(double_metaphone('Macy'), ('MS', ''))
1719
        self.assertEqual(double_metaphone('Magnus'), ('MNS', 'MKNS'))
1720
        self.assertEqual(double_metaphone('Mahien'), ('MHN', ''))
1721
        self.assertEqual(double_metaphone('Malmains'), ('MLMNS', ''))
1722
        self.assertEqual(double_metaphone('Malory'), ('MLR', ''))
1723
        self.assertEqual(double_metaphone('Mancinelli'), ('MNSNL', ''))
1724
        self.assertEqual(double_metaphone('Mancini'), ('MNSN', ''))
1725
        self.assertEqual(double_metaphone('Mann'), ('MN', ''))
1726
        self.assertEqual(double_metaphone('Manning'), ('MNNK', ''))
1727
        self.assertEqual(double_metaphone('Manter'), ('MNTR', ''))
1728
        self.assertEqual(double_metaphone('Marion'), ('MRN', ''))
1729
        self.assertEqual(double_metaphone('Marley'), ('MRL', ''))
1730
        self.assertEqual(double_metaphone('Marmion'), ('MRMN', ''))
1731
        self.assertEqual(double_metaphone('Marquart'), ('MRKRT', ''))
1732
        self.assertEqual(double_metaphone('Marsh'), ('MRX', ''))
1733
        self.assertEqual(double_metaphone('Marshal'), ('MRXL', ''))
1734
        self.assertEqual(double_metaphone('Marshall'), ('MRXL', ''))
1735
        self.assertEqual(double_metaphone('Martel'), ('MRTL', ''))
1736
        self.assertEqual(double_metaphone('Martha'), ('MR0', 'MRT'))
1737
        self.assertEqual(double_metaphone('Martin'), ('MRTN', ''))
1738
        self.assertEqual(double_metaphone('Marturano'), ('MRTRN', ''))
1739
        self.assertEqual(double_metaphone('Marvin'), ('MRFN', ''))
1740
        self.assertEqual(double_metaphone('Mary'), ('MR', ''))
1741
        self.assertEqual(double_metaphone('Mason'), ('MSN', ''))
1742
        self.assertEqual(double_metaphone('Maxwell'), ('MKSL', ''))
1743
        self.assertEqual(double_metaphone('Mayhew'), ('MH', 'MHF'))
1744
        self.assertEqual(double_metaphone('McAllaster'), ('MKLSTR', ''))
1745
        self.assertEqual(double_metaphone('McAllister'), ('MKLSTR', ''))
1746
        self.assertEqual(double_metaphone('McConnell'), ('MKNL', ''))
1747
        self.assertEqual(double_metaphone('McFarland'), ('MKFRLNT', ''))
1748
        self.assertEqual(double_metaphone('McIlroy'), ('MSLR', ''))
1749
        self.assertEqual(double_metaphone('McNair'), ('MKNR', ''))
1750
        self.assertEqual(double_metaphone('McNair-Landry'), ('MKNRLNTR', ''))
1751
        self.assertEqual(double_metaphone('McRaven'), ('MKRFN', ''))
1752
        self.assertEqual(double_metaphone('Mead'), ('MT', ''))
1753
        self.assertEqual(double_metaphone('Meade'), ('MT', ''))
1754
        self.assertEqual(double_metaphone('Meck'), ('MK', ''))
1755
        self.assertEqual(double_metaphone('Melton'), ('MLTN', ''))
1756
        self.assertEqual(double_metaphone('Mendenhall'), ('MNTNL', ''))
1757
        self.assertEqual(double_metaphone('Mering'), ('MRNK', ''))
1758
        self.assertEqual(double_metaphone('Merrick'), ('MRK', ''))
1759
        self.assertEqual(double_metaphone('Merry'), ('MR', ''))
1760
        self.assertEqual(double_metaphone('Mighill'), ('ML', ''))
1761
        self.assertEqual(double_metaphone('Miller'), ('MLR', ''))
1762
        self.assertEqual(double_metaphone('Milton'), ('MLTN', ''))
1763
        self.assertEqual(double_metaphone('Mohun'), ('MHN', ''))
1764
        self.assertEqual(double_metaphone('Montague'), ('MNTK', ''))
1765
        self.assertEqual(double_metaphone('Montboucher'), ('MNTPXR', 'MNTPKR'))
1766
        self.assertEqual(double_metaphone('Moore'), ('MR', ''))
1767
        self.assertEqual(double_metaphone('Morrel'), ('MRL', ''))
1768
        self.assertEqual(double_metaphone('Morrill'), ('MRL', ''))
1769
        self.assertEqual(double_metaphone('Morris'), ('MRS', ''))
1770
        self.assertEqual(double_metaphone('Morton'), ('MRTN', ''))
1771
        self.assertEqual(double_metaphone('Moton'), ('MTN', ''))
1772
        self.assertEqual(double_metaphone('Muir'), ('MR', ''))
1773
        self.assertEqual(double_metaphone('Mulferd'), ('MLFRT', ''))
1774
        self.assertEqual(double_metaphone('Mullins'), ('MLNS', ''))
1775
        self.assertEqual(double_metaphone('Mulso'), ('MLS', ''))
1776
        self.assertEqual(double_metaphone('Munger'), ('MNKR', 'MNJR'))
1777
        self.assertEqual(double_metaphone('Munt'), ('MNT', ''))
1778
        self.assertEqual(double_metaphone('Murchad'), ('MRXT', 'MRKT'))
1779
        self.assertEqual(double_metaphone('Murdock'), ('MRTK', ''))
1780
        self.assertEqual(double_metaphone('Murray'), ('MR', ''))
1781
        self.assertEqual(double_metaphone('Muskett'), ('MSKT', ''))
1782
        self.assertEqual(double_metaphone('Myers'), ('MRS', ''))
1783
        self.assertEqual(double_metaphone('Myrick'), ('MRK', ''))
1784
        self.assertEqual(double_metaphone('NORRIS'), ('NRS', ''))
1785
        self.assertEqual(double_metaphone('Nayle'), ('NL', ''))
1786
        self.assertEqual(double_metaphone('Newcomb'), ('NKMP', ''))
1787
        self.assertEqual(double_metaphone('Newcomb(e)'), ('NKMP', ''))
1788
        self.assertEqual(double_metaphone('Newkirk'), ('NKRK', ''))
1789
        self.assertEqual(double_metaphone('Newton'), ('NTN', ''))
1790
        self.assertEqual(double_metaphone('Niles'), ('NLS', ''))
1791
        self.assertEqual(double_metaphone('Noble'), ('NPL', ''))
1792
        self.assertEqual(double_metaphone('Noel'), ('NL', ''))
1793
        self.assertEqual(double_metaphone('Northend'), ('NR0NT', 'NRTNT'))
1794
        self.assertEqual(double_metaphone('Norton'), ('NRTN', ''))
1795
        self.assertEqual(double_metaphone('Nutter'), ('NTR', ''))
1796
        self.assertEqual(double_metaphone('Odding'), ('ATNK', ''))
1797
        self.assertEqual(double_metaphone('Odenbaugh'), ('ATNP', ''))
1798
        self.assertEqual(double_metaphone('Ogborn'), ('AKPRN', ''))
1799
        self.assertEqual(double_metaphone('Oppenheimer'), ('APNMR', ''))
1800
        self.assertEqual(double_metaphone('Otis'), ('ATS', ''))
1801
        self.assertEqual(double_metaphone('Oviatt'), ('AFT', ''))
1802
        self.assertEqual(double_metaphone('PRUST?'), ('PRST', ''))
1803
        self.assertEqual(double_metaphone('Paddock'), ('PTK', ''))
1804
        self.assertEqual(double_metaphone('Page'), ('PJ', 'PK'))
1805
        self.assertEqual(double_metaphone('Paine'), ('PN', ''))
1806
        self.assertEqual(double_metaphone('Paist'), ('PST', ''))
1807
        self.assertEqual(double_metaphone('Palmer'), ('PLMR', ''))
1808
        self.assertEqual(double_metaphone('Park'), ('PRK', ''))
1809
        self.assertEqual(double_metaphone('Parker'), ('PRKR', ''))
1810
        self.assertEqual(double_metaphone('Parkhurst'), ('PRKRST', ''))
1811
        self.assertEqual(double_metaphone('Parrat'), ('PRT', ''))
1812
        self.assertEqual(double_metaphone('Parsons'), ('PRSNS', ''))
1813
        self.assertEqual(double_metaphone('Partridge'), ('PRTRJ', ''))
1814
        self.assertEqual(double_metaphone('Pashley'), ('PXL', ''))
1815
        self.assertEqual(double_metaphone('Pasley'), ('PSL', ''))
1816
        self.assertEqual(double_metaphone('Patrick'), ('PTRK', ''))
1817
        self.assertEqual(double_metaphone('Pattee'), ('PT', ''))
1818
        self.assertEqual(double_metaphone('Patten'), ('PTN', ''))
1819
        self.assertEqual(double_metaphone('Pawley'), ('PL', ''))
1820
        self.assertEqual(double_metaphone('Payne'), ('PN', ''))
1821
        self.assertEqual(double_metaphone('Peabody'), ('PPT', ''))
1822
        self.assertEqual(double_metaphone('Peake'), ('PK', ''))
1823
        self.assertEqual(double_metaphone('Pearson'), ('PRSN', ''))
1824
        self.assertEqual(double_metaphone('Peat'), ('PT', ''))
1825
        self.assertEqual(double_metaphone('Pedersen'), ('PTRSN', ''))
1826
        self.assertEqual(double_metaphone('Percy'), ('PRS', ''))
1827
        self.assertEqual(double_metaphone('Perkins'), ('PRKNS', ''))
1828
        self.assertEqual(double_metaphone('Perrine'), ('PRN', ''))
1829
        self.assertEqual(double_metaphone('Perry'), ('PR', ''))
1830
        self.assertEqual(double_metaphone('Peson'), ('PSN', ''))
1831
        self.assertEqual(double_metaphone('Peterson'), ('PTRSN', ''))
1832
        self.assertEqual(double_metaphone('Peyton'), ('PTN', ''))
1833
        self.assertEqual(double_metaphone('Phinney'), ('FN', ''))
1834
        self.assertEqual(double_metaphone('Pickard'), ('PKRT', ''))
1835
        self.assertEqual(double_metaphone('Pierce'), ('PRS', ''))
1836
        self.assertEqual(double_metaphone('Pierrepont'), ('PRPNT', ''))
1837
        self.assertEqual(double_metaphone('Pike'), ('PK', ''))
1838
        self.assertEqual(double_metaphone('Pinkham'), ('PNKM', ''))
1839
        self.assertEqual(double_metaphone('Pitman'), ('PTMN', ''))
1840
        self.assertEqual(double_metaphone('Pitt'), ('PT', ''))
1841
        self.assertEqual(double_metaphone('Pitts'), ('PTS', ''))
1842
        self.assertEqual(double_metaphone('Plantagenet'),
1843
                         ('PLNTJNT', 'PLNTKNT'))
1844
        self.assertEqual(double_metaphone('Platt'), ('PLT', ''))
1845
        self.assertEqual(double_metaphone('Platts'), ('PLTS', ''))
1846
        self.assertEqual(double_metaphone('Pleis'), ('PLS', ''))
1847
        self.assertEqual(double_metaphone('Pleiss'), ('PLS', ''))
1848
        self.assertEqual(double_metaphone('Plisko'), ('PLSK', ''))
1849
        self.assertEqual(double_metaphone('Pliskovitch'), ('PLSKFX', ''))
1850
        self.assertEqual(double_metaphone('Plum'), ('PLM', ''))
1851
        self.assertEqual(double_metaphone('Plume'), ('PLM', ''))
1852
        self.assertEqual(double_metaphone('Poitou'), ('PT', ''))
1853
        self.assertEqual(double_metaphone('Pomeroy'), ('PMR', ''))
1854
        self.assertEqual(double_metaphone('Poretiers'), ('PRTRS', ''))
1855
        self.assertEqual(double_metaphone('Pote'), ('PT', ''))
1856
        self.assertEqual(double_metaphone('Potter'), ('PTR', ''))
1857
        self.assertEqual(double_metaphone('Potts'), ('PTS', ''))
1858
        self.assertEqual(double_metaphone('Powell'), ('PL', ''))
1859
        self.assertEqual(double_metaphone('Pratt'), ('PRT', ''))
1860
        self.assertEqual(double_metaphone('Presbury'), ('PRSPR', ''))
1861
        self.assertEqual(double_metaphone('Priest'), ('PRST', ''))
1862
        self.assertEqual(double_metaphone('Prindle'), ('PRNTL', ''))
1863
        self.assertEqual(double_metaphone('Prior'), ('PRR', ''))
1864
        self.assertEqual(double_metaphone('Profumo'), ('PRFM', ''))
1865
        self.assertEqual(double_metaphone('Purdy'), ('PRT', ''))
1866
        self.assertEqual(double_metaphone('Purefoy'), ('PRF', ''))
1867
        self.assertEqual(double_metaphone('Pury'), ('PR', ''))
1868
        self.assertEqual(double_metaphone('Quinter'), ('KNTR', ''))
1869
        self.assertEqual(double_metaphone('Rachel'), ('RXL', 'RKL'))
1870
        self.assertEqual(double_metaphone('Rand'), ('RNT', ''))
1871
        self.assertEqual(double_metaphone('Rankin'), ('RNKN', ''))
1872
        self.assertEqual(double_metaphone('Ravenscroft'), ('RFNSKFT', ''))
1873
        self.assertEqual(double_metaphone('Raynsford'), ('RNSFRT', ''))
1874
        self.assertEqual(double_metaphone('Reakirt'), ('RKRT', ''))
1875
        self.assertEqual(double_metaphone('Reaves'), ('RFS', ''))
1876
        self.assertEqual(double_metaphone('Reeves'), ('RFS', ''))
1877
        self.assertEqual(double_metaphone('Reichert'), ('RXRT', 'RKRT'))
1878
        self.assertEqual(double_metaphone('Remmele'), ('RML', ''))
1879
        self.assertEqual(double_metaphone('Reynolds'), ('RNLTS', ''))
1880
        self.assertEqual(double_metaphone('Rhodes'), ('RTS', ''))
1881
        self.assertEqual(double_metaphone('Richards'), ('RXRTS', 'RKRTS'))
1882
        self.assertEqual(double_metaphone('Richardson'), ('RXRTSN', 'RKRTSN'))
1883
        self.assertEqual(double_metaphone('Ring'), ('RNK', ''))
1884
        self.assertEqual(double_metaphone('Roberts'), ('RPRTS', ''))
1885
        self.assertEqual(double_metaphone('Robertson'), ('RPRTSN', ''))
1886
        self.assertEqual(double_metaphone('Robson'), ('RPSN', ''))
1887
        self.assertEqual(double_metaphone('Rodie'), ('RT', ''))
1888
        self.assertEqual(double_metaphone('Rody'), ('RT', ''))
1889
        self.assertEqual(double_metaphone('Rogers'), ('RKRS', 'RJRS'))
1890
        self.assertEqual(double_metaphone('Ross'), ('RS', ''))
1891
        self.assertEqual(double_metaphone('Rosslevin'), ('RSLFN', ''))
1892
        self.assertEqual(double_metaphone('Rowland'), ('RLNT', ''))
1893
        self.assertEqual(double_metaphone('Ruehl'), ('RL', ''))
1894
        self.assertEqual(double_metaphone('Russell'), ('RSL', ''))
1895
        self.assertEqual(double_metaphone('Ruth'), ('R0', 'RT'))
1896
        self.assertEqual(double_metaphone('Ryan'), ('RN', ''))
1897
        self.assertEqual(double_metaphone('Rysse'), ('RS', ''))
1898
        self.assertEqual(double_metaphone('Sadler'), ('STLR', ''))
1899
        self.assertEqual(double_metaphone('Salmon'), ('SLMN', ''))
1900
        self.assertEqual(double_metaphone('Salter'), ('SLTR', ''))
1901
        self.assertEqual(double_metaphone('Salvatore'), ('SLFTR', ''))
1902
        self.assertEqual(double_metaphone('Sanders'), ('SNTRS', ''))
1903
        self.assertEqual(double_metaphone('Sands'), ('SNTS', ''))
1904
        self.assertEqual(double_metaphone('Sanford'), ('SNFRT', ''))
1905
        self.assertEqual(double_metaphone('Sanger'), ('SNKR', 'SNJR'))
1906
        self.assertEqual(double_metaphone('Sargent'), ('SRJNT', 'SRKNT'))
1907
        self.assertEqual(double_metaphone('Saunders'), ('SNTRS', ''))
1908
        self.assertEqual(double_metaphone('Schilling'), ('XLNK', ''))
1909
        self.assertEqual(double_metaphone('Schlegel'), ('XLKL', 'SLKL'))
1910
        self.assertEqual(double_metaphone('Scott'), ('SKT', ''))
1911
        self.assertEqual(double_metaphone('Sears'), ('SRS', ''))
1912
        self.assertEqual(double_metaphone('Segersall'), ('SJRSL', 'SKRSL'))
1913
        self.assertEqual(double_metaphone('Senecal'), ('SNKL', ''))
1914
        self.assertEqual(double_metaphone('Sergeaux'), ('SRJ', 'SRK'))
1915
        self.assertEqual(double_metaphone('Severance'), ('SFRNS', ''))
1916
        self.assertEqual(double_metaphone('Sharp'), ('XRP', ''))
1917
        self.assertEqual(double_metaphone('Sharpe'), ('XRP', ''))
1918
        self.assertEqual(double_metaphone('Sharply'), ('XRPL', ''))
1919
        self.assertEqual(double_metaphone('Shatswell'), ('XTSL', ''))
1920
        self.assertEqual(double_metaphone('Shattack'), ('XTK', ''))
1921
        self.assertEqual(double_metaphone('Shattock'), ('XTK', ''))
1922
        self.assertEqual(double_metaphone('Shattuck'), ('XTK', ''))
1923
        self.assertEqual(double_metaphone('Shaw'), ('X', 'XF'))
1924
        self.assertEqual(double_metaphone('Sheldon'), ('XLTN', ''))
1925
        self.assertEqual(double_metaphone('Sherman'), ('XRMN', ''))
1926
        self.assertEqual(double_metaphone('Shinn'), ('XN', ''))
1927
        self.assertEqual(double_metaphone('Shirford'), ('XRFRT', ''))
1928
        self.assertEqual(double_metaphone('Shirley'), ('XRL', ''))
1929
        self.assertEqual(double_metaphone('Shively'), ('XFL', ''))
1930
        self.assertEqual(double_metaphone('Shoemaker'), ('XMKR', ''))
1931
        self.assertEqual(double_metaphone('Short'), ('XRT', ''))
1932
        self.assertEqual(double_metaphone('Shotwell'), ('XTL', ''))
1933
        self.assertEqual(double_metaphone('Shute'), ('XT', ''))
1934
        self.assertEqual(double_metaphone('Sibley'), ('SPL', ''))
1935
        self.assertEqual(double_metaphone('Silver'), ('SLFR', ''))
1936
        self.assertEqual(double_metaphone('Simes'), ('SMS', ''))
1937
        self.assertEqual(double_metaphone('Sinken'), ('SNKN', ''))
1938
        self.assertEqual(double_metaphone('Sinn'), ('SN', ''))
1939
        self.assertEqual(double_metaphone('Skelton'), ('SKLTN', ''))
1940
        self.assertEqual(double_metaphone('Skiffe'), ('SKF', ''))
1941
        self.assertEqual(double_metaphone('Skotkonung'), ('SKTKNNK', ''))
1942
        self.assertEqual(double_metaphone('Slade'), ('SLT', 'XLT'))
1943
        self.assertEqual(double_metaphone('Slye'), ('SL', 'XL'))
1944
        self.assertEqual(double_metaphone('Smedley'), ('SMTL', 'XMTL'))
1945
        self.assertEqual(double_metaphone('Smith'), ('SM0', 'XMT'))
1946
        self.assertEqual(double_metaphone('Snow'), ('SN', 'XNF'))
1947
        self.assertEqual(double_metaphone('Soole'), ('SL', ''))
1948
        self.assertEqual(double_metaphone('Soule'), ('SL', ''))
1949
        self.assertEqual(double_metaphone('Southworth'), ('S0R0', 'STRT'))
1950
        self.assertEqual(double_metaphone('Sowles'), ('SLS', ''))
1951
        self.assertEqual(double_metaphone('Spalding'), ('SPLTNK', ''))
1952
        self.assertEqual(double_metaphone('Spark'), ('SPRK', ''))
1953
        self.assertEqual(double_metaphone('Spencer'), ('SPNSR', ''))
1954
        self.assertEqual(double_metaphone('Sperry'), ('SPR', ''))
1955
        self.assertEqual(double_metaphone('Spofford'), ('SPFRT', ''))
1956
        self.assertEqual(double_metaphone('Spooner'), ('SPNR', ''))
1957
        self.assertEqual(double_metaphone('Sprague'), ('SPRK', ''))
1958
        self.assertEqual(double_metaphone('Springer'), ('SPRNKR', 'SPRNJR'))
1959
        self.assertEqual(double_metaphone('St. Clair'), ('STKLR', ''))
1960
        self.assertEqual(double_metaphone('St. Claire'), ('STKLR', ''))
1961
        self.assertEqual(double_metaphone('St. Leger'), ('STLJR', 'STLKR'))
1962
        self.assertEqual(double_metaphone('St. Omer'), ('STMR', ''))
1963
        self.assertEqual(double_metaphone('Stafferton'), ('STFRTN', ''))
1964
        self.assertEqual(double_metaphone('Stafford'), ('STFRT', ''))
1965
        self.assertEqual(double_metaphone('Stalham'), ('STLM', ''))
1966
        self.assertEqual(double_metaphone('Stanford'), ('STNFRT', ''))
1967
        self.assertEqual(double_metaphone('Stanton'), ('STNTN', ''))
1968
        self.assertEqual(double_metaphone('Star'), ('STR', ''))
1969
        self.assertEqual(double_metaphone('Starbuck'), ('STRPK', ''))
1970
        self.assertEqual(double_metaphone('Starkey'), ('STRK', ''))
1971
        self.assertEqual(double_metaphone('Starkweather'),
1972
                         ('STRK0R', 'STRKTR'))
1973
        self.assertEqual(double_metaphone('Stearns'), ('STRNS', ''))
1974
        self.assertEqual(double_metaphone('Stebbins'), ('STPNS', ''))
1975
        self.assertEqual(double_metaphone('Steele'), ('STL', ''))
1976
        self.assertEqual(double_metaphone('Stephenson'), ('STFNSN', ''))
1977
        self.assertEqual(double_metaphone('Stevens'), ('STFNS', ''))
1978
        self.assertEqual(double_metaphone('Stoddard'), ('STTRT', ''))
1979
        self.assertEqual(double_metaphone('Stodder'), ('STTR', ''))
1980
        self.assertEqual(double_metaphone('Stone'), ('STN', ''))
1981
        self.assertEqual(double_metaphone('Storey'), ('STR', ''))
1982
        self.assertEqual(double_metaphone('Storrada'), ('STRT', ''))
1983
        self.assertEqual(double_metaphone('Story'), ('STR', ''))
1984
        self.assertEqual(double_metaphone('Stoughton'), ('STFTN', ''))
1985
        self.assertEqual(double_metaphone('Stout'), ('STT', ''))
1986
        self.assertEqual(double_metaphone('Stow'), ('ST', 'STF'))
1987
        self.assertEqual(double_metaphone('Strong'), ('STRNK', ''))
1988
        self.assertEqual(double_metaphone('Strutt'), ('STRT', ''))
1989
        self.assertEqual(double_metaphone('Stryker'), ('STRKR', ''))
1990
        self.assertEqual(double_metaphone('Stuckeley'), ('STKL', ''))
1991
        self.assertEqual(double_metaphone('Sturges'), ('STRJS', 'STRKS'))
1992
        self.assertEqual(double_metaphone('Sturgess'), ('STRJS', 'STRKS'))
1993
        self.assertEqual(double_metaphone('Sturgis'), ('STRJS', 'STRKS'))
1994
        self.assertEqual(double_metaphone('Suevain'), ('SFN', ''))
1995
        self.assertEqual(double_metaphone('Sulyard'), ('SLRT', ''))
1996
        self.assertEqual(double_metaphone('Sutton'), ('STN', ''))
1997
        self.assertEqual(double_metaphone('Swain'), ('SN', 'XN'))
1998
        self.assertEqual(double_metaphone('Swayne'), ('SN', 'XN'))
1999
        self.assertEqual(double_metaphone('Swayze'), ('SS', 'XTS'))
2000
        self.assertEqual(double_metaphone('Swift'), ('SFT', 'XFT'))
2001
        self.assertEqual(double_metaphone('Taber'), ('TPR', ''))
2002
        self.assertEqual(double_metaphone('Talcott'), ('TLKT', ''))
2003
        self.assertEqual(double_metaphone('Tarne'), ('TRN', ''))
2004
        self.assertEqual(double_metaphone('Tatum'), ('TTM', ''))
2005
        self.assertEqual(double_metaphone('Taverner'), ('TFRNR', ''))
2006
        self.assertEqual(double_metaphone('Taylor'), ('TLR', ''))
2007
        self.assertEqual(double_metaphone('Tenney'), ('TN', ''))
2008
        self.assertEqual(double_metaphone('Thayer'), ('0R', 'TR'))
2009
        self.assertEqual(double_metaphone('Thember'), ('0MPR', 'TMPR'))
2010
        self.assertEqual(double_metaphone('Thomas'), ('TMS', ''))
2011
        self.assertEqual(double_metaphone('Thompson'), ('TMPSN', ''))
2012
        self.assertEqual(double_metaphone('Thorne'), ('0RN', 'TRN'))
2013
        self.assertEqual(double_metaphone('Thornycraft'),
2014
                         ('0RNKRFT', 'TRNKRFT'))
2015
        self.assertEqual(double_metaphone('Threlkeld'), ('0RLKLT', 'TRLKLT'))
2016
        self.assertEqual(double_metaphone('Throckmorton'),
2017
                         ('0RKMRTN', 'TRKMRTN'))
2018
        self.assertEqual(double_metaphone('Thwaits'), ('0TS', 'TTS'))
2019
        self.assertEqual(double_metaphone('Tibbetts'), ('TPTS', ''))
2020
        self.assertEqual(double_metaphone('Tidd'), ('TT', ''))
2021
        self.assertEqual(double_metaphone('Tierney'), ('TRN', ''))
2022
        self.assertEqual(double_metaphone('Tilley'), ('TL', ''))
2023
        self.assertEqual(double_metaphone('Tillieres'), ('TLRS', ''))
2024
        self.assertEqual(double_metaphone('Tilly'), ('TL', ''))
2025
        self.assertEqual(double_metaphone('Tisdale'), ('TSTL', ''))
2026
        self.assertEqual(double_metaphone('Titus'), ('TTS', ''))
2027
        self.assertEqual(double_metaphone('Tobey'), ('TP', ''))
2028
        self.assertEqual(double_metaphone('Tooker'), ('TKR', ''))
2029
        self.assertEqual(double_metaphone('Towle'), ('TL', ''))
2030
        self.assertEqual(double_metaphone('Towne'), ('TN', ''))
2031
        self.assertEqual(double_metaphone('Townsend'), ('TNSNT', ''))
2032
        self.assertEqual(double_metaphone('Treadway'), ('TRT', ''))
2033
        self.assertEqual(double_metaphone('Trelawney'), ('TRLN', ''))
2034
        self.assertEqual(double_metaphone('Trinder'), ('TRNTR', ''))
2035
        self.assertEqual(double_metaphone('Tripp'), ('TRP', ''))
2036
        self.assertEqual(double_metaphone('Trippe'), ('TRP', ''))
2037
        self.assertEqual(double_metaphone('Trott'), ('TRT', ''))
2038
        self.assertEqual(double_metaphone('True'), ('TR', ''))
2039
        self.assertEqual(double_metaphone('Trussebut'), ('TRSPT', ''))
2040
        self.assertEqual(double_metaphone('Tucker'), ('TKR', ''))
2041
        self.assertEqual(double_metaphone('Turgeon'), ('TRJN', 'TRKN'))
2042
        self.assertEqual(double_metaphone('Turner'), ('TRNR', ''))
2043
        self.assertEqual(double_metaphone('Tuttle'), ('TTL', ''))
2044
        self.assertEqual(double_metaphone('Tyler'), ('TLR', ''))
2045
        self.assertEqual(double_metaphone('Tylle'), ('TL', ''))
2046
        self.assertEqual(double_metaphone('Tyrrel'), ('TRL', ''))
2047
        self.assertEqual(double_metaphone('Ua Tuathail'), ('AT0L', 'ATTL'))
2048
        self.assertEqual(double_metaphone('Ulrich'), ('ALRX', 'ALRK'))
2049
        self.assertEqual(double_metaphone('Underhill'), ('ANTRL', ''))
2050
        self.assertEqual(double_metaphone('Underwood'), ('ANTRT', ''))
2051
        self.assertEqual(double_metaphone('Unknown'), ('ANKNN', ''))
2052
        self.assertEqual(double_metaphone('Valentine'), ('FLNTN', ''))
2053
        self.assertEqual(double_metaphone('Van Egmond'), ('FNKMNT', ''))
2054
        self.assertEqual(double_metaphone('Van der Beek'), ('FNTRPK', ''))
2055
        self.assertEqual(double_metaphone('Vaughan'), ('FKN', ''))
2056
        self.assertEqual(double_metaphone('Vermenlen'), ('FRMNLN', ''))
2057
        self.assertEqual(double_metaphone('Vincent'), ('FNSNT', ''))
2058
        self.assertEqual(double_metaphone('Volentine'), ('FLNTN', ''))
2059
        self.assertEqual(double_metaphone('Wagner'), ('AKNR', 'FKNR'))
2060
        self.assertEqual(double_metaphone('Waite'), ('AT', 'FT'))
2061
        self.assertEqual(double_metaphone('Walker'), ('ALKR', 'FLKR'))
2062
        self.assertEqual(double_metaphone('Walter'), ('ALTR', 'FLTR'))
2063
        self.assertEqual(double_metaphone('Wandell'), ('ANTL', 'FNTL'))
2064
        self.assertEqual(double_metaphone('Wandesford'),
2065
                         ('ANTSFRT', 'FNTSFRT'))
2066
        self.assertEqual(double_metaphone('Warbleton'), ('ARPLTN', 'FRPLTN'))
2067
        self.assertEqual(double_metaphone('Ward'), ('ART', 'FRT'))
2068
        self.assertEqual(double_metaphone('Warde'), ('ART', 'FRT'))
2069
        self.assertEqual(double_metaphone('Ware'), ('AR', 'FR'))
2070
        self.assertEqual(double_metaphone('Wareham'), ('ARHM', 'FRHM'))
2071
        self.assertEqual(double_metaphone('Warner'), ('ARNR', 'FRNR'))
2072
        self.assertEqual(double_metaphone('Warren'), ('ARN', 'FRN'))
2073
        self.assertEqual(double_metaphone('Washburne'), ('AXPRN', 'FXPRN'))
2074
        self.assertEqual(double_metaphone('Waterbury'), ('ATRPR', 'FTRPR'))
2075
        self.assertEqual(double_metaphone('Watson'), ('ATSN', 'FTSN'))
2076
        self.assertEqual(double_metaphone('WatsonEllithorpe'),
2077
                         ('ATSNL0RP', 'FTSNLTRP'))
2078
        self.assertEqual(double_metaphone('Watts'), ('ATS', 'FTS'))
2079
        self.assertEqual(double_metaphone('Wayne'), ('AN', 'FN'))
2080
        self.assertEqual(double_metaphone('Webb'), ('AP', 'FP'))
2081
        self.assertEqual(double_metaphone('Weber'), ('APR', 'FPR'))
2082
        self.assertEqual(double_metaphone('Webster'), ('APSTR', 'FPSTR'))
2083
        self.assertEqual(double_metaphone('Weed'), ('AT', 'FT'))
2084
        self.assertEqual(double_metaphone('Weeks'), ('AKS', 'FKS'))
2085
        self.assertEqual(double_metaphone('Wells'), ('ALS', 'FLS'))
2086
        self.assertEqual(double_metaphone('Wenzell'), ('ANSL', 'FNTSL'))
2087
        self.assertEqual(double_metaphone('West'), ('AST', 'FST'))
2088
        self.assertEqual(double_metaphone('Westbury'), ('ASTPR', 'FSTPR'))
2089
        self.assertEqual(double_metaphone('Whatlocke'), ('ATLK', ''))
2090
        self.assertEqual(double_metaphone('Wheeler'), ('ALR', ''))
2091
        self.assertEqual(double_metaphone('Whiston'), ('ASTN', ''))
2092
        self.assertEqual(double_metaphone('White'), ('AT', ''))
2093
        self.assertEqual(double_metaphone('Whitman'), ('ATMN', ''))
2094
        self.assertEqual(double_metaphone('Whiton'), ('ATN', ''))
2095
        self.assertEqual(double_metaphone('Whitson'), ('ATSN', ''))
2096
        self.assertEqual(double_metaphone('Wickes'), ('AKS', 'FKS'))
2097
        self.assertEqual(double_metaphone('Wilbur'), ('ALPR', 'FLPR'))
2098
        self.assertEqual(double_metaphone('Wilcotes'), ('ALKTS', 'FLKTS'))
2099
        self.assertEqual(double_metaphone('Wilkinson'), ('ALKNSN', 'FLKNSN'))
2100
        self.assertEqual(double_metaphone('Willets'), ('ALTS', 'FLTS'))
2101
        self.assertEqual(double_metaphone('Willett'), ('ALT', 'FLT'))
2102
        self.assertEqual(double_metaphone('Willey'), ('AL', 'FL'))
2103
        self.assertEqual(double_metaphone('Williams'), ('ALMS', 'FLMS'))
2104
        self.assertEqual(double_metaphone('Williston'), ('ALSTN', 'FLSTN'))
2105
        self.assertEqual(double_metaphone('Wilson'), ('ALSN', 'FLSN'))
2106
        self.assertEqual(double_metaphone('Wimes'), ('AMS', 'FMS'))
2107
        self.assertEqual(double_metaphone('Winch'), ('ANX', 'FNK'))
2108
        self.assertEqual(double_metaphone('Winegar'), ('ANKR', 'FNKR'))
2109
        self.assertEqual(double_metaphone('Wing'), ('ANK', 'FNK'))
2110
        self.assertEqual(double_metaphone('Winsley'), ('ANSL', 'FNSL'))
2111
        self.assertEqual(double_metaphone('Winslow'), ('ANSL', 'FNSLF'))
2112
        self.assertEqual(double_metaphone('Winthrop'), ('AN0RP', 'FNTRP'))
2113
        self.assertEqual(double_metaphone('Wise'), ('AS', 'FS'))
2114
        self.assertEqual(double_metaphone('Wood'), ('AT', 'FT'))
2115
        self.assertEqual(double_metaphone('Woodbridge'), ('ATPRJ', 'FTPRJ'))
2116
        self.assertEqual(double_metaphone('Woodward'), ('ATRT', 'FTRT'))
2117
        self.assertEqual(double_metaphone('Wooley'), ('AL', 'FL'))
2118
        self.assertEqual(double_metaphone('Woolley'), ('AL', 'FL'))
2119
        self.assertEqual(double_metaphone('Worth'), ('AR0', 'FRT'))
2120
        self.assertEqual(double_metaphone('Worthen'), ('AR0N', 'FRTN'))
2121
        self.assertEqual(double_metaphone('Worthley'), ('AR0L', 'FRTL'))
2122
        self.assertEqual(double_metaphone('Wright'), ('RT', ''))
2123
        self.assertEqual(double_metaphone('Wyer'), ('AR', 'FR'))
2124
        self.assertEqual(double_metaphone('Wyere'), ('AR', 'FR'))
2125
        self.assertEqual(double_metaphone('Wynkoop'), ('ANKP', 'FNKP'))
2126
        self.assertEqual(double_metaphone('Yarnall'), ('ARNL', ''))
2127
        self.assertEqual(double_metaphone('Yeoman'), ('AMN', ''))
2128
        self.assertEqual(double_metaphone('Yorke'), ('ARK', ''))
2129
        self.assertEqual(double_metaphone('Young'), ('ANK', ''))
2130
        self.assertEqual(double_metaphone('ab Wennonwen'), ('APNNN', ''))
2131
        self.assertEqual(double_metaphone('ap Llewellyn'), ('APLLN', ''))
2132
        self.assertEqual(double_metaphone('ap Lorwerth'), ('APLRR0', 'APLRRT'))
2133
        self.assertEqual(double_metaphone('d\'Angouleme'), ('TNKLM', ''))
2134
        self.assertEqual(double_metaphone('de Audeham'), ('TTHM', ''))
2135
        self.assertEqual(double_metaphone('de Bavant'), ('TPFNT', ''))
2136
        self.assertEqual(double_metaphone('de Beauchamp'), ('TPXMP', 'TPKMP'))
2137
        self.assertEqual(double_metaphone('de Beaumont'), ('TPMNT', ''))
2138
        self.assertEqual(double_metaphone('de Bolbec'), ('TPLPK', ''))
2139
        self.assertEqual(double_metaphone('de Braiose'), ('TPRS', ''))
2140
        self.assertEqual(double_metaphone('de Braose'), ('TPRS', ''))
2141
        self.assertEqual(double_metaphone('de Briwere'), ('TPRR', ''))
2142
        self.assertEqual(double_metaphone('de Cantelou'), ('TKNTL', ''))
2143
        self.assertEqual(double_metaphone('de Cherelton'),
2144
                         ('TXRLTN', 'TKRLTN'))
2145
        self.assertEqual(double_metaphone('de Cherleton'),
2146
                         ('TXRLTN', 'TKRLTN'))
2147
        self.assertEqual(double_metaphone('de Clare'), ('TKLR', ''))
2148
        self.assertEqual(double_metaphone('de Claremont'), ('TKLRMNT', ''))
2149
        self.assertEqual(double_metaphone('de Clifford'), ('TKLFRT', ''))
2150
        self.assertEqual(double_metaphone('de Colville'), ('TKLFL', ''))
2151
        self.assertEqual(double_metaphone('de Courtenay'), ('TKRTN', ''))
2152
        self.assertEqual(double_metaphone('de Fauconberg'), ('TFKNPRK', ''))
2153
        self.assertEqual(double_metaphone('de Forest'), ('TFRST', ''))
2154
        self.assertEqual(double_metaphone('de Gai'), ('TK', ''))
2155
        self.assertEqual(double_metaphone('de Grey'), ('TKR', ''))
2156
        self.assertEqual(double_metaphone('de Guernons'), ('TKRNNS', ''))
2157
        self.assertEqual(double_metaphone('de Haia'), ('T', ''))
2158
        self.assertEqual(double_metaphone('de Harcourt'), ('TRKRT', ''))
2159
        self.assertEqual(double_metaphone('de Hastings'), ('TSTNKS', ''))
2160
        self.assertEqual(double_metaphone('de Hoke'), ('TK', ''))
2161
        self.assertEqual(double_metaphone('de Hooch'), ('TK', ''))
2162
        self.assertEqual(double_metaphone('de Hugelville'), ('TJLFL', 'TKLFL'))
2163
        self.assertEqual(double_metaphone('de Huntingdon'), ('TNTNKTN', ''))
2164
        self.assertEqual(double_metaphone('de Insula'), ('TNSL', ''))
2165
        self.assertEqual(double_metaphone('de Keynes'), ('TKNS', ''))
2166
        self.assertEqual(double_metaphone('de Lacy'), ('TLS', ''))
2167
        self.assertEqual(double_metaphone('de Lexington'), ('TLKSNKTN', ''))
2168
        self.assertEqual(double_metaphone('de Lusignan'), ('TLSNN', 'TLSKNN'))
2169
        self.assertEqual(double_metaphone('de Manvers'), ('TMNFRS', ''))
2170
        self.assertEqual(double_metaphone('de Montagu'), ('TMNTK', ''))
2171
        self.assertEqual(double_metaphone('de Montault'), ('TMNTLT', ''))
2172
        self.assertEqual(double_metaphone('de Montfort'), ('TMNTFRT', ''))
2173
        self.assertEqual(double_metaphone('de Mortimer'), ('TMRTMR', ''))
2174
        self.assertEqual(double_metaphone('de Morville'), ('TMRFL', ''))
2175
        self.assertEqual(double_metaphone('de Morvois'), ('TMRF', 'TMRFS'))
2176
        self.assertEqual(double_metaphone('de Neufmarche'),
2177
                         ('TNFMRX', 'TNFMRK'))
2178
        self.assertEqual(double_metaphone('de Odingsells'), ('TTNKSLS', ''))
2179
        self.assertEqual(double_metaphone('de Odyngsells'), ('TTNKSLS', ''))
2180
        self.assertEqual(double_metaphone('de Percy'), ('TPRS', ''))
2181
        self.assertEqual(double_metaphone('de Pierrepont'), ('TPRPNT', ''))
2182
        self.assertEqual(double_metaphone('de Plessetis'), ('TPLSTS', ''))
2183
        self.assertEqual(double_metaphone('de Porhoet'), ('TPRT', ''))
2184
        self.assertEqual(double_metaphone('de Prouz'), ('TPRS', ''))
2185
        self.assertEqual(double_metaphone('de Quincy'), ('TKNS', ''))
2186
        self.assertEqual(double_metaphone('de Ripellis'), ('TRPLS', ''))
2187
        self.assertEqual(double_metaphone('de Ros'), ('TRS', ''))
2188
        self.assertEqual(double_metaphone('de Salisbury'), ('TSLSPR', ''))
2189
        self.assertEqual(double_metaphone('de Sanford'), ('TSNFRT', ''))
2190
        self.assertEqual(double_metaphone('de Somery'), ('TSMR', ''))
2191
        self.assertEqual(double_metaphone('de St. Hilary'), ('TSTLR', ''))
2192
        self.assertEqual(double_metaphone('de St. Liz'), ('TSTLS', ''))
2193
        self.assertEqual(double_metaphone('de Sutton'), ('TSTN', ''))
2194
        self.assertEqual(double_metaphone('de Toeni'), ('TTN', ''))
2195
        self.assertEqual(double_metaphone('de Tony'), ('TTN', ''))
2196
        self.assertEqual(double_metaphone('de Umfreville'), ('TMFRFL', ''))
2197
        self.assertEqual(double_metaphone('de Valognes'), ('TFLNS', 'TFLKNS'))
2198
        self.assertEqual(double_metaphone('de Vaux'), ('TF', ''))
2199
        self.assertEqual(double_metaphone('de Vere'), ('TFR', ''))
2200
        self.assertEqual(double_metaphone('de Vermandois'),
2201
                         ('TFRMNT', 'TFRMNTS'))
2202
        self.assertEqual(double_metaphone('de Vernon'), ('TFRNN', ''))
2203
        self.assertEqual(double_metaphone('de Vexin'), ('TFKSN', ''))
2204
        self.assertEqual(double_metaphone('de Vitre'), ('TFTR', ''))
2205
        self.assertEqual(double_metaphone('de Wandesford'), ('TNTSFRT', ''))
2206
        self.assertEqual(double_metaphone('de Warenne'), ('TRN', ''))
2207
        self.assertEqual(double_metaphone('de Westbury'), ('TSTPR', ''))
2208
        self.assertEqual(double_metaphone('di Saluzzo'), ('TSLS', 'TSLTS'))
2209
        self.assertEqual(double_metaphone('fitz Alan'), ('FTSLN', ''))
2210
        self.assertEqual(double_metaphone('fitz Geoffrey'),
2211
                         ('FTSJFR', 'FTSKFR'))
2212
        self.assertEqual(double_metaphone('fitz Herbert'), ('FTSRPRT', ''))
2213
        self.assertEqual(double_metaphone('fitz John'), ('FTSJN', ''))
2214
        self.assertEqual(double_metaphone('fitz Patrick'), ('FTSPTRK', ''))
2215
        self.assertEqual(double_metaphone('fitz Payn'), ('FTSPN', ''))
2216
        self.assertEqual(double_metaphone('fitz Piers'), ('FTSPRS', ''))
2217
        self.assertEqual(double_metaphone('fitz Randolph'), ('FTSRNTLF', ''))
2218
        self.assertEqual(double_metaphone('fitz Richard'),
2219
                         ('FTSRXRT', 'FTSRKRT'))
2220
        self.assertEqual(double_metaphone('fitz Robert'), ('FTSRPRT', ''))
2221
        self.assertEqual(double_metaphone('fitz Roy'), ('FTSR', ''))
2222
        self.assertEqual(double_metaphone('fitz Scrob'), ('FTSSKP', ''))
2223
        self.assertEqual(double_metaphone('fitz Walter'), ('FTSLTR', ''))
2224
        self.assertEqual(double_metaphone('fitz Warin'), ('FTSRN', ''))
2225
        self.assertEqual(double_metaphone('fitz Williams'), ('FTSLMS', ''))
2226
        self.assertEqual(double_metaphone('la Zouche'), ('LSX', 'LSK'))
2227
        self.assertEqual(double_metaphone('le Botiller'), ('LPTLR', ''))
2228
        self.assertEqual(double_metaphone('le Despenser'), ('LTSPNSR', ''))
2229
        self.assertEqual(double_metaphone('le deSpencer'), ('LTSPNSR', ''))
2230
        self.assertEqual(double_metaphone('of Allendale'), ('AFLNTL', ''))
2231
        self.assertEqual(double_metaphone('of Angouleme'), ('AFNKLM', ''))
2232
        self.assertEqual(double_metaphone('of Anjou'), ('AFNJ', ''))
2233
        self.assertEqual(double_metaphone('of Aquitaine'), ('AFKTN', ''))
2234
        self.assertEqual(double_metaphone('of Aumale'), ('AFML', ''))
2235
        self.assertEqual(double_metaphone('of Bavaria'), ('AFPFR', ''))
2236
        self.assertEqual(double_metaphone('of Boulogne'), ('AFPLN', 'AFPLKN'))
2237
        self.assertEqual(double_metaphone('of Brittany'), ('AFPRTN', ''))
2238
        self.assertEqual(double_metaphone('of Brittary'), ('AFPRTR', ''))
2239
        self.assertEqual(double_metaphone('of Castile'), ('AFKSTL', ''))
2240
        self.assertEqual(double_metaphone('of Chester'), ('AFXSTR', 'AFKSTR'))
2241
        self.assertEqual(double_metaphone('of Clermont'), ('AFKLRMNT', ''))
2242
        self.assertEqual(double_metaphone('of Cologne'), ('AFKLN', 'AFKLKN'))
2243
        self.assertEqual(double_metaphone('of Dinan'), ('AFTNN', ''))
2244
        self.assertEqual(double_metaphone('of Dunbar'), ('AFTNPR', ''))
2245
        self.assertEqual(double_metaphone('of England'), ('AFNKLNT', ''))
2246
        self.assertEqual(double_metaphone('of Essex'), ('AFSKS', ''))
2247
        self.assertEqual(double_metaphone('of Falaise'), ('AFFLS', ''))
2248
        self.assertEqual(double_metaphone('of Flanders'), ('AFFLNTRS', ''))
2249
        self.assertEqual(double_metaphone('of Galloway'), ('AFKL', ''))
2250
        self.assertEqual(double_metaphone('of Germany'), ('AFKRMN', 'AFJRMN'))
2251
        self.assertEqual(double_metaphone('of Gloucester'), ('AFKLSSTR', ''))
2252
        self.assertEqual(double_metaphone('of Heristal'), ('AFRSTL', ''))
2253
        self.assertEqual(double_metaphone('of Hungary'), ('AFNKR', ''))
2254
        self.assertEqual(double_metaphone('of Huntington'), ('AFNTNKTN', ''))
2255
        self.assertEqual(double_metaphone('of Kiev'), ('AFKF', ''))
2256
        self.assertEqual(double_metaphone('of Kuno'), ('AFKN', ''))
2257
        self.assertEqual(double_metaphone('of Landen'), ('AFLNTN', ''))
2258
        self.assertEqual(double_metaphone('of Laon'), ('AFLN', ''))
2259
        self.assertEqual(double_metaphone('of Leinster'), ('AFLNSTR', ''))
2260
        self.assertEqual(double_metaphone('of Lens'), ('AFLNS', ''))
2261
        self.assertEqual(double_metaphone('of Lorraine'), ('AFLRN', ''))
2262
        self.assertEqual(double_metaphone('of Louvain'), ('AFLFN', ''))
2263
        self.assertEqual(double_metaphone('of Mercia'), ('AFMRS', 'AFMRX'))
2264
        self.assertEqual(double_metaphone('of Metz'), ('AFMTS', ''))
2265
        self.assertEqual(double_metaphone('of Meulan'), ('AFMLN', ''))
2266
        self.assertEqual(double_metaphone('of Nass'), ('AFNS', ''))
2267
        self.assertEqual(double_metaphone('of Normandy'), ('AFNRMNT', ''))
2268
        self.assertEqual(double_metaphone('of Ohningen'), ('AFNNJN', 'AFNNKN'))
2269
        self.assertEqual(double_metaphone('of Orleans'), ('AFRLNS', ''))
2270
        self.assertEqual(double_metaphone('of Poitou'), ('AFPT', ''))
2271
        self.assertEqual(double_metaphone('of Polotzk'), ('AFPLTSK', ''))
2272
        self.assertEqual(double_metaphone('of Provence'), ('AFPRFNS', ''))
2273
        self.assertEqual(double_metaphone('of Ringelheim'),
2274
                         ('AFRNJLM', 'AFRNKLM'))
2275
        self.assertEqual(double_metaphone('of Salisbury'), ('AFSLSPR', ''))
2276
        self.assertEqual(double_metaphone('of Saxony'), ('AFSKSN', ''))
2277
        self.assertEqual(double_metaphone('of Scotland'), ('AFSKTLNT', ''))
2278
        self.assertEqual(double_metaphone('of Senlis'), ('AFSNLS', ''))
2279
        self.assertEqual(double_metaphone('of Stafford'), ('AFSTFRT', ''))
2280
        self.assertEqual(double_metaphone('of Swabia'), ('AFSP', ''))
2281
        self.assertEqual(double_metaphone('of Tongres'), ('AFTNKRS', ''))
2282
        self.assertEqual(double_metaphone('of the Tributes'),
2283
                         ('AF0TRPTS', 'AFTTRPTS'))
2284
        self.assertEqual(double_metaphone('unknown'), ('ANKNN', ''))
2285
        self.assertEqual(double_metaphone('van der Gouda'), ('FNTRKT', ''))
2286
        self.assertEqual(double_metaphone('von Adenbaugh'), ('FNTNP', ''))
2287
        self.assertEqual(double_metaphone('ARCHITure'), ('ARKTR', ''))
2288
        self.assertEqual(double_metaphone('Arnoff'), ('ARNF', ''))
2289
        self.assertEqual(double_metaphone('Arnow'), ('ARN', 'ARNF'))
2290
        self.assertEqual(double_metaphone('DANGER'), ('TNJR', 'TNKR'))
2291
        self.assertEqual(double_metaphone('Jankelowicz'), ('JNKLTS', 'ANKLFX'))
2292
        self.assertEqual(double_metaphone('MANGER'), ('MNJR', 'MNKR'))
2293
        self.assertEqual(double_metaphone('McClellan'), ('MKLLN', ''))
2294
        self.assertEqual(double_metaphone('McHugh'), ('MK', ''))
2295
        self.assertEqual(double_metaphone('McLaughlin'), ('MKLFLN', ''))
2296
        self.assertEqual(double_metaphone('ORCHEStra'), ('ARKSTR', ''))
2297
        self.assertEqual(double_metaphone('ORCHID'), ('ARKT', ''))
2298
        self.assertEqual(double_metaphone('Pierce'), ('PRS', ''))
2299
        self.assertEqual(double_metaphone('RANGER'), ('RNJR', 'RNKR'))
2300
        self.assertEqual(double_metaphone('Schlesinger'), ('XLSNKR', 'SLSNJR'))
2301
        self.assertEqual(double_metaphone('Uomo'), ('AM', ''))
2302
        self.assertEqual(double_metaphone('Vasserman'), ('FSRMN', ''))
2303
        self.assertEqual(double_metaphone('Wasserman'), ('ASRMN', 'FSRMN'))
2304
        self.assertEqual(double_metaphone('Womo'), ('AM', 'FM'))
2305
        self.assertEqual(double_metaphone('Yankelovich'), ('ANKLFX', 'ANKLFK'))
2306
        self.assertEqual(double_metaphone('accede'), ('AKST', ''))
2307
        self.assertEqual(double_metaphone('accident'), ('AKSTNT', ''))
2308
        self.assertEqual(double_metaphone('adelsheim'), ('ATLSM', ''))
2309
        self.assertEqual(double_metaphone('aged'), ('AJT', 'AKT'))
2310
        self.assertEqual(double_metaphone('ageless'), ('AJLS', 'AKLS'))
2311
        self.assertEqual(double_metaphone('agency'), ('AJNS', 'AKNS'))
2312
        self.assertEqual(double_metaphone('aghast'), ('AKST', ''))
2313
        self.assertEqual(double_metaphone('agio'), ('AJ', 'AK'))
2314
        self.assertEqual(double_metaphone('agrimony'), ('AKRMN', ''))
2315
        self.assertEqual(double_metaphone('album'), ('ALPM', ''))
2316
        self.assertEqual(double_metaphone('alcmene'), ('ALKMN', ''))
2317
        self.assertEqual(double_metaphone('alehouse'), ('ALHS', ''))
2318
        self.assertEqual(double_metaphone('antique'), ('ANTK', ''))
2319
        self.assertEqual(double_metaphone('artois'), ('ART', 'ARTS'))
2320
        self.assertEqual(double_metaphone('automation'), ('ATMXN', ''))
2321
        self.assertEqual(double_metaphone('bacchus'), ('PKS', ''))
2322
        self.assertEqual(double_metaphone('bacci'), ('PX', ''))
2323
        self.assertEqual(double_metaphone('bajador'), ('PJTR', 'PHTR'))
2324
        self.assertEqual(double_metaphone('bellocchio'), ('PLX', ''))
2325
        self.assertEqual(double_metaphone('bertucci'), ('PRTX', ''))
2326
        self.assertEqual(double_metaphone('biaggi'), ('PJ', 'PK'))
2327
        self.assertEqual(double_metaphone('bough'), ('P', ''))
2328
        self.assertEqual(double_metaphone('breaux'), ('PR', ''))
2329
        self.assertEqual(double_metaphone('broughton'), ('PRTN', ''))
2330
        self.assertEqual(double_metaphone('cabrillo'), ('KPRL', 'KPR'))
2331
        self.assertEqual(double_metaphone('caesar'), ('SSR', ''))
2332
        self.assertEqual(double_metaphone('cagney'), ('KKN', ''))
2333
        self.assertEqual(double_metaphone('campbell'), ('KMPL', ''))
2334
        self.assertEqual(double_metaphone('carlisle'), ('KRLL', ''))
2335
        self.assertEqual(double_metaphone('carlysle'), ('KRLL', ''))
2336
        self.assertEqual(double_metaphone('chemistry'), ('KMSTR', ''))
2337
        self.assertEqual(double_metaphone('chianti'), ('KNT', ''))
2338
        self.assertEqual(double_metaphone('chorus'), ('KRS', ''))
2339
        self.assertEqual(double_metaphone('cough'), ('KF', ''))
2340
        self.assertEqual(double_metaphone('czerny'), ('SRN', 'XRN'))
2341
        self.assertEqual(double_metaphone('deffenbacher'), ('TFNPKR', ''))
2342
        self.assertEqual(double_metaphone('dumb'), ('TM', ''))
2343
        self.assertEqual(double_metaphone('edgar'), ('ATKR', ''))
2344
        self.assertEqual(double_metaphone('edge'), ('AJ', ''))
2345
        self.assertEqual(double_metaphone('filipowicz'), ('FLPTS', 'FLPFX'))
2346
        self.assertEqual(double_metaphone('focaccia'), ('FKX', ''))
2347
        self.assertEqual(double_metaphone('gallegos'), ('KLKS', 'KKS'))
2348
        self.assertEqual(double_metaphone('gambrelli'), ('KMPRL', ''))
2349
        self.assertEqual(double_metaphone('geithain'), ('K0N', 'JTN'))
2350
        self.assertEqual(double_metaphone('ghiradelli'), ('JRTL', ''))
2351
        self.assertEqual(double_metaphone('ghislane'), ('JLN', ''))
2352
        self.assertEqual(double_metaphone('gough'), ('KF', ''))
2353
        self.assertEqual(double_metaphone('hartheim'), ('HR0M', 'HRTM'))
2354
        self.assertEqual(double_metaphone('heimsheim'), ('HMSM', ''))
2355
        self.assertEqual(double_metaphone('hochmeier'), ('HKMR', ''))
2356
        self.assertEqual(double_metaphone('hugh'), ('H', ''))
2357
        self.assertEqual(double_metaphone('hunger'), ('HNKR', 'HNJR'))
2358
        self.assertEqual(double_metaphone('hungry'), ('HNKR', ''))
2359
        self.assertEqual(double_metaphone('island'), ('ALNT', ''))
2360
        self.assertEqual(double_metaphone('isle'), ('AL', ''))
2361
        self.assertEqual(double_metaphone('jose'), ('HS', ''))
2362
        self.assertEqual(double_metaphone('laugh'), ('LF', ''))
2363
        self.assertEqual(double_metaphone('mac caffrey'), ('MKFR', ''))
2364
        self.assertEqual(double_metaphone('mac gregor'), ('MKRKR', ''))
2365
        self.assertEqual(double_metaphone('pegnitz'), ('PNTS', 'PKNTS'))
2366
        self.assertEqual(double_metaphone('piskowitz'), ('PSKTS', 'PSKFX'))
2367
        self.assertEqual(double_metaphone('queen'), ('KN', ''))
2368
        self.assertEqual(double_metaphone('raspberry'), ('RSPR', ''))
2369
        self.assertEqual(double_metaphone('resnais'), ('RSN', 'RSNS'))
2370
        self.assertEqual(double_metaphone('rogier'), ('RJ', 'RJR'))
2371
        self.assertEqual(double_metaphone('rough'), ('RF', ''))
2372
        self.assertEqual(double_metaphone('san jacinto'), ('SNHSNT', ''))
2373
        self.assertEqual(double_metaphone('schenker'), ('XNKR', 'SKNKR'))
2374
        self.assertEqual(double_metaphone('schermerhorn'),
2375
                         ('XRMRRN', 'SKRMRRN'))
2376
        self.assertEqual(double_metaphone('schmidt'), ('XMT', 'SMT'))
2377
        self.assertEqual(double_metaphone('schneider'), ('XNTR', 'SNTR'))
2378
        self.assertEqual(double_metaphone('school'), ('SKL', ''))
2379
        self.assertEqual(double_metaphone('schooner'), ('SKNR', ''))
2380
        self.assertEqual(double_metaphone('schrozberg'), ('XRSPRK', 'SRSPRK'))
2381
        self.assertEqual(double_metaphone('schulman'), ('XLMN', ''))
2382
        self.assertEqual(double_metaphone('schwabach'), ('XPK', 'XFPK'))
2383
        self.assertEqual(double_metaphone('schwarzach'), ('XRSK', 'XFRTSK'))
2384
        self.assertEqual(double_metaphone('smith'), ('SM0', 'XMT'))
2385
        self.assertEqual(double_metaphone('snider'), ('SNTR', 'XNTR'))
2386
        self.assertEqual(double_metaphone('succeed'), ('SKST', ''))
2387
        self.assertEqual(double_metaphone('sugarcane'), ('XKRKN', 'SKRKN'))
2388
        self.assertEqual(double_metaphone('svobodka'), ('SFPTK', ''))
2389
        self.assertEqual(double_metaphone('tagliaro'), ('TKLR', 'TLR'))
2390
        self.assertEqual(double_metaphone('thames'), ('TMS', ''))
2391
        self.assertEqual(double_metaphone('theilheim'), ('0LM', 'TLM'))
2392
        self.assertEqual(double_metaphone('thomas'), ('TMS', ''))
2393
        self.assertEqual(double_metaphone('thumb'), ('0M', 'TM'))
2394
        self.assertEqual(double_metaphone('tichner'), ('TXNR', 'TKNR'))
2395
        self.assertEqual(double_metaphone('tough'), ('TF', ''))
2396
        self.assertEqual(double_metaphone('umbrella'), ('AMPRL', ''))
2397
        self.assertEqual(double_metaphone('vilshofen'), ('FLXFN', ''))
2398
        self.assertEqual(double_metaphone('von schuller'), ('FNXLR', ''))
2399
        self.assertEqual(double_metaphone('wachtler'), ('AKTLR', 'FKTLR'))
2400
        self.assertEqual(double_metaphone('wechsler'), ('AKSLR', 'FKSLR'))
2401
        self.assertEqual(double_metaphone('weikersheim'), ('AKRSM', 'FKRSM'))
2402
        self.assertEqual(double_metaphone('zhao'), ('J', ''))
2403
2404
    def test_double_metaphone_surnames4(self):
2405
        """Test abydos.phonetic.double_metaphone (surname data, 4-letter)."""
2406
        self.assertEqual(double_metaphone('', 4), ('', ''))
2407
        self.assertEqual(double_metaphone('ALLERTON', 4), ('ALRT', ''))
2408
        self.assertEqual(double_metaphone('Acton', 4), ('AKTN', ''))
2409
        self.assertEqual(double_metaphone('Adams', 4), ('ATMS', ''))
2410
        self.assertEqual(double_metaphone('Aggar', 4), ('AKR', ''))
2411
        self.assertEqual(double_metaphone('Ahl', 4), ('AL', ''))
2412
        self.assertEqual(double_metaphone('Aiken', 4), ('AKN', ''))
2413
        self.assertEqual(double_metaphone('Alan', 4), ('ALN', ''))
2414
        self.assertEqual(double_metaphone('Alcock', 4), ('ALKK', ''))
2415
        self.assertEqual(double_metaphone('Alden', 4), ('ALTN', ''))
2416
        self.assertEqual(double_metaphone('Aldham', 4), ('ALTM', ''))
2417
        self.assertEqual(double_metaphone('Allen', 4), ('ALN', ''))
2418
        self.assertEqual(double_metaphone('Allerton', 4), ('ALRT', ''))
2419
        self.assertEqual(double_metaphone('Alsop', 4), ('ALSP', ''))
2420
        self.assertEqual(double_metaphone('Alwein', 4), ('ALN', ''))
2421
        self.assertEqual(double_metaphone('Ambler', 4), ('AMPL', ''))
2422
        self.assertEqual(double_metaphone('Andevill', 4), ('ANTF', ''))
2423
        self.assertEqual(double_metaphone('Andrews', 4), ('ANTR', ''))
2424
        self.assertEqual(double_metaphone('Andreyco', 4), ('ANTR', ''))
2425
        self.assertEqual(double_metaphone('Andriesse', 4), ('ANTR', ''))
2426
        self.assertEqual(double_metaphone('Angier', 4), ('ANJ', 'ANJR'))
2427
        self.assertEqual(double_metaphone('Annabel', 4), ('ANPL', ''))
2428
        self.assertEqual(double_metaphone('Anne', 4), ('AN', ''))
2429
        self.assertEqual(double_metaphone('Anstye', 4), ('ANST', ''))
2430
        self.assertEqual(double_metaphone('Appling', 4), ('APLN', ''))
2431
        self.assertEqual(double_metaphone('Apuke', 4), ('APK', ''))
2432
        self.assertEqual(double_metaphone('Arnold', 4), ('ARNL', ''))
2433
        self.assertEqual(double_metaphone('Ashby', 4), ('AXP', ''))
2434
        self.assertEqual(double_metaphone('Astwood', 4), ('ASTT', ''))
2435
        self.assertEqual(double_metaphone('Atkinson', 4), ('ATKN', ''))
2436
        self.assertEqual(double_metaphone('Audley', 4), ('ATL', ''))
2437
        self.assertEqual(double_metaphone('Austin', 4), ('ASTN', ''))
2438
        self.assertEqual(double_metaphone('Avenal', 4), ('AFNL', ''))
2439
        self.assertEqual(double_metaphone('Ayer', 4), ('AR', ''))
2440
        self.assertEqual(double_metaphone('Ayot', 4), ('AT', ''))
2441
        self.assertEqual(double_metaphone('Babbitt', 4), ('PPT', ''))
2442
        self.assertEqual(double_metaphone('Bachelor', 4), ('PXLR', 'PKLR'))
2443
        self.assertEqual(double_metaphone('Bachelour', 4), ('PXLR', 'PKLR'))
2444
        self.assertEqual(double_metaphone('Bailey', 4), ('PL', ''))
2445
        self.assertEqual(double_metaphone('Baivel', 4), ('PFL', ''))
2446
        self.assertEqual(double_metaphone('Baker', 4), ('PKR', ''))
2447
        self.assertEqual(double_metaphone('Baldwin', 4), ('PLTN', ''))
2448
        self.assertEqual(double_metaphone('Balsley', 4), ('PLSL', ''))
2449
        self.assertEqual(double_metaphone('Barber', 4), ('PRPR', ''))
2450
        self.assertEqual(double_metaphone('Barker', 4), ('PRKR', ''))
2451
        self.assertEqual(double_metaphone('Barlow', 4), ('PRL', 'PRLF'))
2452
        self.assertEqual(double_metaphone('Barnard', 4), ('PRNR', ''))
2453
        self.assertEqual(double_metaphone('Barnes', 4), ('PRNS', ''))
2454
        self.assertEqual(double_metaphone('Barnsley', 4), ('PRNS', ''))
2455
        self.assertEqual(double_metaphone('Barouxis', 4), ('PRKS', ''))
2456
        self.assertEqual(double_metaphone('Bartlet', 4), ('PRTL', ''))
2457
        self.assertEqual(double_metaphone('Basley', 4), ('PSL', ''))
2458
        self.assertEqual(double_metaphone('Basset', 4), ('PST', ''))
2459
        self.assertEqual(double_metaphone('Bassett', 4), ('PST', ''))
2460
        self.assertEqual(double_metaphone('Batchlor', 4), ('PXLR', ''))
2461
        self.assertEqual(double_metaphone('Bates', 4), ('PTS', ''))
2462
        self.assertEqual(double_metaphone('Batson', 4), ('PTSN', ''))
2463
        self.assertEqual(double_metaphone('Bayes', 4), ('PS', ''))
2464
        self.assertEqual(double_metaphone('Bayley', 4), ('PL', ''))
2465
        self.assertEqual(double_metaphone('Beale', 4), ('PL', ''))
2466
        self.assertEqual(double_metaphone('Beauchamp', 4), ('PXMP', 'PKMP'))
2467
        self.assertEqual(double_metaphone('Beauclerc', 4), ('PKLR', ''))
2468
        self.assertEqual(double_metaphone('Beech', 4), ('PK', ''))
2469
        self.assertEqual(double_metaphone('Beers', 4), ('PRS', ''))
2470
        self.assertEqual(double_metaphone('Beke', 4), ('PK', ''))
2471
        self.assertEqual(double_metaphone('Belcher', 4), ('PLXR', 'PLKR'))
2472
        self.assertEqual(double_metaphone('Benjamin', 4), ('PNJM', ''))
2473
        self.assertEqual(double_metaphone('Benningham', 4), ('PNNK', ''))
2474
        self.assertEqual(double_metaphone('Bereford', 4), ('PRFR', ''))
2475
        self.assertEqual(double_metaphone('Bergen', 4), ('PRJN', 'PRKN'))
2476
        self.assertEqual(double_metaphone('Berkeley', 4), ('PRKL', ''))
2477
        self.assertEqual(double_metaphone('Berry', 4), ('PR', ''))
2478
        self.assertEqual(double_metaphone('Besse', 4), ('PS', ''))
2479
        self.assertEqual(double_metaphone('Bessey', 4), ('PS', ''))
2480
        self.assertEqual(double_metaphone('Bessiles', 4), ('PSLS', ''))
2481
        self.assertEqual(double_metaphone('Bigelow', 4), ('PJL', 'PKLF'))
2482
        self.assertEqual(double_metaphone('Bigg', 4), ('PK', ''))
2483
        self.assertEqual(double_metaphone('Bigod', 4), ('PKT', ''))
2484
        self.assertEqual(double_metaphone('Billings', 4), ('PLNK', ''))
2485
        self.assertEqual(double_metaphone('Bimper', 4), ('PMPR', ''))
2486
        self.assertEqual(double_metaphone('Binker', 4), ('PNKR', ''))
2487
        self.assertEqual(double_metaphone('Birdsill', 4), ('PRTS', ''))
2488
        self.assertEqual(double_metaphone('Bishop', 4), ('PXP', ''))
2489
        self.assertEqual(double_metaphone('Black', 4), ('PLK', ''))
2490
        self.assertEqual(double_metaphone('Blagge', 4), ('PLK', ''))
2491
        self.assertEqual(double_metaphone('Blake', 4), ('PLK', ''))
2492
        self.assertEqual(double_metaphone('Blanck', 4), ('PLNK', ''))
2493
        self.assertEqual(double_metaphone('Bledsoe', 4), ('PLTS', ''))
2494
        self.assertEqual(double_metaphone('Blennerhasset', 4), ('PLNR', ''))
2495
        self.assertEqual(double_metaphone('Blessing', 4), ('PLSN', ''))
2496
        self.assertEqual(double_metaphone('Blewett', 4), ('PLT', ''))
2497
        self.assertEqual(double_metaphone('Bloctgoed', 4), ('PLKT', ''))
2498
        self.assertEqual(double_metaphone('Bloetgoet', 4), ('PLTK', ''))
2499
        self.assertEqual(double_metaphone('Bloodgood', 4), ('PLTK', ''))
2500
        self.assertEqual(double_metaphone('Blossom', 4), ('PLSM', ''))
2501
        self.assertEqual(double_metaphone('Blount', 4), ('PLNT', ''))
2502
        self.assertEqual(double_metaphone('Bodine', 4), ('PTN', ''))
2503
        self.assertEqual(double_metaphone('Bodman', 4), ('PTMN', ''))
2504
        self.assertEqual(double_metaphone('BonCoeur', 4), ('PNKR', ''))
2505
        self.assertEqual(double_metaphone('Bond', 4), ('PNT', ''))
2506
        self.assertEqual(double_metaphone('Boscawen', 4), ('PSKN', ''))
2507
        self.assertEqual(double_metaphone('Bosworth', 4), ('PSR0', 'PSRT'))
2508
        self.assertEqual(double_metaphone('Bouchier', 4), ('PX', 'PKR'))
2509
        self.assertEqual(double_metaphone('Bowne', 4), ('PN', ''))
2510
        self.assertEqual(double_metaphone('Bradbury', 4), ('PRTP', ''))
2511
        self.assertEqual(double_metaphone('Bradder', 4), ('PRTR', ''))
2512
        self.assertEqual(double_metaphone('Bradford', 4), ('PRTF', ''))
2513
        self.assertEqual(double_metaphone('Bradstreet', 4), ('PRTS', ''))
2514
        self.assertEqual(double_metaphone('Braham', 4), ('PRHM', ''))
2515
        self.assertEqual(double_metaphone('Brailsford', 4), ('PRLS', ''))
2516
        self.assertEqual(double_metaphone('Brainard', 4), ('PRNR', ''))
2517
        self.assertEqual(double_metaphone('Brandish', 4), ('PRNT', ''))
2518
        self.assertEqual(double_metaphone('Braun', 4), ('PRN', ''))
2519
        self.assertEqual(double_metaphone('Brecc', 4), ('PRK', ''))
2520
        self.assertEqual(double_metaphone('Brent', 4), ('PRNT', ''))
2521
        self.assertEqual(double_metaphone('Brenton', 4), ('PRNT', ''))
2522
        self.assertEqual(double_metaphone('Briggs', 4), ('PRKS', ''))
2523
        self.assertEqual(double_metaphone('Brigham', 4), ('PRM', ''))
2524
        self.assertEqual(double_metaphone('Brobst', 4), ('PRPS', ''))
2525
        self.assertEqual(double_metaphone('Brome', 4), ('PRM', ''))
2526
        self.assertEqual(double_metaphone('Bronson', 4), ('PRNS', ''))
2527
        self.assertEqual(double_metaphone('Brooks', 4), ('PRKS', ''))
2528
        self.assertEqual(double_metaphone('Brouillard', 4), ('PRLR', ''))
2529
        self.assertEqual(double_metaphone('Brown', 4), ('PRN', ''))
2530
        self.assertEqual(double_metaphone('Browne', 4), ('PRN', ''))
2531
        self.assertEqual(double_metaphone('Brownell', 4), ('PRNL', ''))
2532
        self.assertEqual(double_metaphone('Bruley', 4), ('PRL', ''))
2533
        self.assertEqual(double_metaphone('Bryant', 4), ('PRNT', ''))
2534
        self.assertEqual(double_metaphone('Brzozowski', 4), ('PRSS', 'PRTS'))
2535
        self.assertEqual(double_metaphone('Buide', 4), ('PT', ''))
2536
        self.assertEqual(double_metaphone('Bulmer', 4), ('PLMR', ''))
2537
        self.assertEqual(double_metaphone('Bunker', 4), ('PNKR', ''))
2538
        self.assertEqual(double_metaphone('Burden', 4), ('PRTN', ''))
2539
        self.assertEqual(double_metaphone('Burge', 4), ('PRJ', 'PRK'))
2540
        self.assertEqual(double_metaphone('Burgoyne', 4), ('PRKN', ''))
2541
        self.assertEqual(double_metaphone('Burke', 4), ('PRK', ''))
2542
        self.assertEqual(double_metaphone('Burnett', 4), ('PRNT', ''))
2543
        self.assertEqual(double_metaphone('Burpee', 4), ('PRP', ''))
2544
        self.assertEqual(double_metaphone('Bursley', 4), ('PRSL', ''))
2545
        self.assertEqual(double_metaphone('Burton', 4), ('PRTN', ''))
2546
        self.assertEqual(double_metaphone('Bushnell', 4), ('PXNL', ''))
2547
        self.assertEqual(double_metaphone('Buss', 4), ('PS', ''))
2548
        self.assertEqual(double_metaphone('Buswell', 4), ('PSL', ''))
2549
        self.assertEqual(double_metaphone('Butler', 4), ('PTLR', ''))
2550
        self.assertEqual(double_metaphone('Calkin', 4), ('KLKN', ''))
2551
        self.assertEqual(double_metaphone('Canada', 4), ('KNT', ''))
2552
        self.assertEqual(double_metaphone('Canmore', 4), ('KNMR', ''))
2553
        self.assertEqual(double_metaphone('Canney', 4), ('KN', ''))
2554
        self.assertEqual(double_metaphone('Capet', 4), ('KPT', ''))
2555
        self.assertEqual(double_metaphone('Card', 4), ('KRT', ''))
2556
        self.assertEqual(double_metaphone('Carman', 4), ('KRMN', ''))
2557
        self.assertEqual(double_metaphone('Carpenter', 4), ('KRPN', ''))
2558
        self.assertEqual(double_metaphone('Cartwright', 4), ('KRTR', ''))
2559
        self.assertEqual(double_metaphone('Casey', 4), ('KS', ''))
2560
        self.assertEqual(double_metaphone('Catterfield', 4), ('KTRF', ''))
2561
        self.assertEqual(double_metaphone('Ceeley', 4), ('SL', ''))
2562
        self.assertEqual(double_metaphone('Chambers', 4), ('XMPR', ''))
2563
        self.assertEqual(double_metaphone('Champion', 4), ('XMPN', ''))
2564
        self.assertEqual(double_metaphone('Chapman', 4), ('XPMN', ''))
2565
        self.assertEqual(double_metaphone('Chase', 4), ('XS', ''))
2566
        self.assertEqual(double_metaphone('Cheney', 4), ('XN', ''))
2567
        self.assertEqual(double_metaphone('Chetwynd', 4), ('XTNT', ''))
2568
        self.assertEqual(double_metaphone('Chevalier', 4), ('XFL', 'XFLR'))
2569
        self.assertEqual(double_metaphone('Chillingsworth', 4), ('XLNK', ''))
2570
        self.assertEqual(double_metaphone('Christie', 4), ('KRST', ''))
2571
        self.assertEqual(double_metaphone('Chubbuck', 4), ('XPK', ''))
2572
        self.assertEqual(double_metaphone('Church', 4), ('XRX', 'XRK'))
2573
        self.assertEqual(double_metaphone('Clark', 4), ('KLRK', ''))
2574
        self.assertEqual(double_metaphone('Clarke', 4), ('KLRK', ''))
2575
        self.assertEqual(double_metaphone('Cleare', 4), ('KLR', ''))
2576
        self.assertEqual(double_metaphone('Clement', 4), ('KLMN', ''))
2577
        self.assertEqual(double_metaphone('Clerke', 4), ('KLRK', ''))
2578
        self.assertEqual(double_metaphone('Clibben', 4), ('KLPN', ''))
2579
        self.assertEqual(double_metaphone('Clifford', 4), ('KLFR', ''))
2580
        self.assertEqual(double_metaphone('Clivedon', 4), ('KLFT', ''))
2581
        self.assertEqual(double_metaphone('Close', 4), ('KLS', ''))
2582
        self.assertEqual(double_metaphone('Clothilde', 4), ('KL0L', 'KLTL'))
2583
        self.assertEqual(double_metaphone('Cobb', 4), ('KP', ''))
2584
        self.assertEqual(double_metaphone('Coburn', 4), ('KPRN', ''))
2585
        self.assertEqual(double_metaphone('Coburne', 4), ('KPRN', ''))
2586
        self.assertEqual(double_metaphone('Cocke', 4), ('KK', ''))
2587
        self.assertEqual(double_metaphone('Coffin', 4), ('KFN', ''))
2588
        self.assertEqual(double_metaphone('Coffyn', 4), ('KFN', ''))
2589
        self.assertEqual(double_metaphone('Colborne', 4), ('KLPR', ''))
2590
        self.assertEqual(double_metaphone('Colby', 4), ('KLP', ''))
2591
        self.assertEqual(double_metaphone('Cole', 4), ('KL', ''))
2592
        self.assertEqual(double_metaphone('Coleman', 4), ('KLMN', ''))
2593
        self.assertEqual(double_metaphone('Collier', 4), ('KL', 'KLR'))
2594
        self.assertEqual(double_metaphone('Compton', 4), ('KMPT', ''))
2595
        self.assertEqual(double_metaphone('Cone', 4), ('KN', ''))
2596
        self.assertEqual(double_metaphone('Cook', 4), ('KK', ''))
2597
        self.assertEqual(double_metaphone('Cooke', 4), ('KK', ''))
2598
        self.assertEqual(double_metaphone('Cooper', 4), ('KPR', ''))
2599
        self.assertEqual(double_metaphone('Copperthwaite', 4),
2600
                         ('KPR0', 'KPRT'))
2601
        self.assertEqual(double_metaphone('Corbet', 4), ('KRPT', ''))
2602
        self.assertEqual(double_metaphone('Corell', 4), ('KRL', ''))
2603
        self.assertEqual(double_metaphone('Corey', 4), ('KR', ''))
2604
        self.assertEqual(double_metaphone('Corlies', 4), ('KRLS', ''))
2605
        self.assertEqual(double_metaphone('Corneliszen', 4), ('KRNL', ''))
2606
        self.assertEqual(double_metaphone('Cornelius', 4), ('KRNL', ''))
2607
        self.assertEqual(double_metaphone('Cornwallis', 4), ('KRNL', ''))
2608
        self.assertEqual(double_metaphone('Cosgrove', 4), ('KSKR', ''))
2609
        self.assertEqual(double_metaphone('Count of Brionne', 4), ('KNTF', ''))
2610
        self.assertEqual(double_metaphone('Covill', 4), ('KFL', ''))
2611
        self.assertEqual(double_metaphone('Cowperthwaite', 4),
2612
                         ('KPR0', 'KPRT'))
2613
        self.assertEqual(double_metaphone('Cowperwaite', 4), ('KPRT', ''))
2614
        self.assertEqual(double_metaphone('Crane', 4), ('KRN', ''))
2615
        self.assertEqual(double_metaphone('Creagmile', 4), ('KRKM', ''))
2616
        self.assertEqual(double_metaphone('Crew', 4), ('KR', 'KRF'))
2617
        self.assertEqual(double_metaphone('Crispin', 4), ('KRSP', ''))
2618
        self.assertEqual(double_metaphone('Crocker', 4), ('KRKR', ''))
2619
        self.assertEqual(double_metaphone('Crockett', 4), ('KRKT', ''))
2620
        self.assertEqual(double_metaphone('Crosby', 4), ('KRSP', ''))
2621
        self.assertEqual(double_metaphone('Crump', 4), ('KRMP', ''))
2622
        self.assertEqual(double_metaphone('Cunningham', 4), ('KNNK', ''))
2623
        self.assertEqual(double_metaphone('Curtis', 4), ('KRTS', ''))
2624
        self.assertEqual(double_metaphone('Cutha', 4), ('K0', 'KT'))
2625
        self.assertEqual(double_metaphone('Cutter', 4), ('KTR', ''))
2626
        self.assertEqual(double_metaphone('D\'Aubigny', 4), ('TPN', 'TPKN'))
2627
        self.assertEqual(double_metaphone('DAVIS', 4), ('TFS', ''))
2628
        self.assertEqual(double_metaphone('Dabinott', 4), ('TPNT', ''))
2629
        self.assertEqual(double_metaphone('Dacre', 4), ('TKR', ''))
2630
        self.assertEqual(double_metaphone('Daggett', 4), ('TKT', ''))
2631
        self.assertEqual(double_metaphone('Danvers', 4), ('TNFR', ''))
2632
        self.assertEqual(double_metaphone('Darcy', 4), ('TRS', ''))
2633
        self.assertEqual(double_metaphone('Davis', 4), ('TFS', ''))
2634
        self.assertEqual(double_metaphone('Dawn', 4), ('TN', ''))
2635
        self.assertEqual(double_metaphone('Dawson', 4), ('TSN', ''))
2636
        self.assertEqual(double_metaphone('Day', 4), ('T', ''))
2637
        self.assertEqual(double_metaphone('Daye', 4), ('T', ''))
2638
        self.assertEqual(double_metaphone('DeGrenier', 4), ('TKRN', ''))
2639
        self.assertEqual(double_metaphone('Dean', 4), ('TN', ''))
2640
        self.assertEqual(double_metaphone('Deekindaugh', 4), ('TKNT', ''))
2641
        self.assertEqual(double_metaphone('Dennis', 4), ('TNS', ''))
2642
        self.assertEqual(double_metaphone('Denny', 4), ('TN', ''))
2643
        self.assertEqual(double_metaphone('Denton', 4), ('TNTN', ''))
2644
        self.assertEqual(double_metaphone('Desborough', 4), ('TSPR', ''))
2645
        self.assertEqual(double_metaphone('Despenser', 4), ('TSPN', ''))
2646
        self.assertEqual(double_metaphone('Deverill', 4), ('TFRL', ''))
2647
        self.assertEqual(double_metaphone('Devine', 4), ('TFN', ''))
2648
        self.assertEqual(double_metaphone('Dexter', 4), ('TKST', ''))
2649
        self.assertEqual(double_metaphone('Dillaway', 4), ('TL', ''))
2650
        self.assertEqual(double_metaphone('Dimmick', 4), ('TMK', ''))
2651
        self.assertEqual(double_metaphone('Dinan', 4), ('TNN', ''))
2652
        self.assertEqual(double_metaphone('Dix', 4), ('TKS', ''))
2653
        self.assertEqual(double_metaphone('Doggett', 4), ('TKT', ''))
2654
        self.assertEqual(double_metaphone('Donahue', 4), ('TNH', ''))
2655
        self.assertEqual(double_metaphone('Dorfman', 4), ('TRFM', ''))
2656
        self.assertEqual(double_metaphone('Dorris', 4), ('TRS', ''))
2657
        self.assertEqual(double_metaphone('Dow', 4), ('T', 'TF'))
2658
        self.assertEqual(double_metaphone('Downey', 4), ('TN', ''))
2659
        self.assertEqual(double_metaphone('Downing', 4), ('TNNK', ''))
2660
        self.assertEqual(double_metaphone('Dowsett', 4), ('TST', ''))
2661
        self.assertEqual(double_metaphone('Duck?', 4), ('TK', ''))
2662
        self.assertEqual(double_metaphone('Dudley', 4), ('TTL', ''))
2663
        self.assertEqual(double_metaphone('Duffy', 4), ('TF', ''))
2664
        self.assertEqual(double_metaphone('Dunn', 4), ('TN', ''))
2665
        self.assertEqual(double_metaphone('Dunsterville', 4), ('TNST', ''))
2666
        self.assertEqual(double_metaphone('Durrant', 4), ('TRNT', ''))
2667
        self.assertEqual(double_metaphone('Durrin', 4), ('TRN', ''))
2668
        self.assertEqual(double_metaphone('Dustin', 4), ('TSTN', ''))
2669
        self.assertEqual(double_metaphone('Duston', 4), ('TSTN', ''))
2670
        self.assertEqual(double_metaphone('Eames', 4), ('AMS', ''))
2671
        self.assertEqual(double_metaphone('Early', 4), ('ARL', ''))
2672
        self.assertEqual(double_metaphone('Easty', 4), ('AST', ''))
2673
        self.assertEqual(double_metaphone('Ebbett', 4), ('APT', ''))
2674
        self.assertEqual(double_metaphone('Eberbach', 4), ('APRP', ''))
2675
        self.assertEqual(double_metaphone('Eberhard', 4), ('APRR', ''))
2676
        self.assertEqual(double_metaphone('Eddy', 4), ('AT', ''))
2677
        self.assertEqual(double_metaphone('Edenden', 4), ('ATNT', ''))
2678
        self.assertEqual(double_metaphone('Edwards', 4), ('ATRT', ''))
2679
        self.assertEqual(double_metaphone('Eglinton', 4), ('AKLN', 'ALNT'))
2680
        self.assertEqual(double_metaphone('Eliot', 4), ('ALT', ''))
2681
        self.assertEqual(double_metaphone('Elizabeth', 4), ('ALSP', ''))
2682
        self.assertEqual(double_metaphone('Ellis', 4), ('ALS', ''))
2683
        self.assertEqual(double_metaphone('Ellison', 4), ('ALSN', ''))
2684
        self.assertEqual(double_metaphone('Ellot', 4), ('ALT', ''))
2685
        self.assertEqual(double_metaphone('Elny', 4), ('ALN', ''))
2686
        self.assertEqual(double_metaphone('Elsner', 4), ('ALSN', ''))
2687
        self.assertEqual(double_metaphone('Emerson', 4), ('AMRS', ''))
2688
        self.assertEqual(double_metaphone('Empson', 4), ('AMPS', ''))
2689
        self.assertEqual(double_metaphone('Est', 4), ('AST', ''))
2690
        self.assertEqual(double_metaphone('Estabrook', 4), ('ASTP', ''))
2691
        self.assertEqual(double_metaphone('Estes', 4), ('ASTS', ''))
2692
        self.assertEqual(double_metaphone('Estey', 4), ('AST', ''))
2693
        self.assertEqual(double_metaphone('Evans', 4), ('AFNS', ''))
2694
        self.assertEqual(double_metaphone('Fallowell', 4), ('FLL', ''))
2695
        self.assertEqual(double_metaphone('Farnsworth', 4), ('FRNS', ''))
2696
        self.assertEqual(double_metaphone('Feake', 4), ('FK', ''))
2697
        self.assertEqual(double_metaphone('Feke', 4), ('FK', ''))
2698
        self.assertEqual(double_metaphone('Fellows', 4), ('FLS', ''))
2699
        self.assertEqual(double_metaphone('Fettiplace', 4), ('FTPL', ''))
2700
        self.assertEqual(double_metaphone('Finney', 4), ('FN', ''))
2701
        self.assertEqual(double_metaphone('Fischer', 4), ('FXR', 'FSKR'))
2702
        self.assertEqual(double_metaphone('Fisher', 4), ('FXR', ''))
2703
        self.assertEqual(double_metaphone('Fisk', 4), ('FSK', ''))
2704
        self.assertEqual(double_metaphone('Fiske', 4), ('FSK', ''))
2705
        self.assertEqual(double_metaphone('Fletcher', 4), ('FLXR', ''))
2706
        self.assertEqual(double_metaphone('Folger', 4), ('FLKR', 'FLJR'))
2707
        self.assertEqual(double_metaphone('Foliot', 4), ('FLT', ''))
2708
        self.assertEqual(double_metaphone('Folyot', 4), ('FLT', ''))
2709
        self.assertEqual(double_metaphone('Fones', 4), ('FNS', ''))
2710
        self.assertEqual(double_metaphone('Fordham', 4), ('FRTM', ''))
2711
        self.assertEqual(double_metaphone('Forstner', 4), ('FRST', ''))
2712
        self.assertEqual(double_metaphone('Fosten', 4), ('FSTN', ''))
2713
        self.assertEqual(double_metaphone('Foster', 4), ('FSTR', ''))
2714
        self.assertEqual(double_metaphone('Foulke', 4), ('FLK', ''))
2715
        self.assertEqual(double_metaphone('Fowler', 4), ('FLR', ''))
2716
        self.assertEqual(double_metaphone('Foxwell', 4), ('FKSL', ''))
2717
        self.assertEqual(double_metaphone('Fraley', 4), ('FRL', ''))
2718
        self.assertEqual(double_metaphone('Franceys', 4), ('FRNS', ''))
2719
        self.assertEqual(double_metaphone('Franke', 4), ('FRNK', ''))
2720
        self.assertEqual(double_metaphone('Frascella', 4), ('FRSL', ''))
2721
        self.assertEqual(double_metaphone('Frazer', 4), ('FRSR', ''))
2722
        self.assertEqual(double_metaphone('Fredd', 4), ('FRT', ''))
2723
        self.assertEqual(double_metaphone('Freeman', 4), ('FRMN', ''))
2724
        self.assertEqual(double_metaphone('French', 4), ('FRNX', 'FRNK'))
2725
        self.assertEqual(double_metaphone('Freville', 4), ('FRFL', ''))
2726
        self.assertEqual(double_metaphone('Frey', 4), ('FR', ''))
2727
        self.assertEqual(double_metaphone('Frick', 4), ('FRK', ''))
2728
        self.assertEqual(double_metaphone('Frier', 4), ('FR', 'FRR'))
2729
        self.assertEqual(double_metaphone('Froe', 4), ('FR', ''))
2730
        self.assertEqual(double_metaphone('Frorer', 4), ('FRRR', ''))
2731
        self.assertEqual(double_metaphone('Frost', 4), ('FRST', ''))
2732
        self.assertEqual(double_metaphone('Frothingham', 4), ('FR0N', 'FRTN'))
2733
        self.assertEqual(double_metaphone('Fry', 4), ('FR', ''))
2734
        self.assertEqual(double_metaphone('Gaffney', 4), ('KFN', ''))
2735
        self.assertEqual(double_metaphone('Gage', 4), ('KJ', 'KK'))
2736
        self.assertEqual(double_metaphone('Gallion', 4), ('KLN', ''))
2737
        self.assertEqual(double_metaphone('Gallishan', 4), ('KLXN', ''))
2738
        self.assertEqual(double_metaphone('Gamble', 4), ('KMPL', ''))
2739
        self.assertEqual(double_metaphone('Garbrand', 4), ('KRPR', ''))
2740
        self.assertEqual(double_metaphone('Gardner', 4), ('KRTN', ''))
2741
        self.assertEqual(double_metaphone('Garrett', 4), ('KRT', ''))
2742
        self.assertEqual(double_metaphone('Gassner', 4), ('KSNR', ''))
2743
        self.assertEqual(double_metaphone('Gater', 4), ('KTR', ''))
2744
        self.assertEqual(double_metaphone('Gaunt', 4), ('KNT', ''))
2745
        self.assertEqual(double_metaphone('Gayer', 4), ('KR', ''))
2746
        self.assertEqual(double_metaphone('Gerken', 4), ('KRKN', 'JRKN'))
2747
        self.assertEqual(double_metaphone('Gerritsen', 4), ('KRTS', 'JRTS'))
2748
        self.assertEqual(double_metaphone('Gibbs', 4), ('KPS', 'JPS'))
2749
        self.assertEqual(double_metaphone('Giffard', 4), ('JFRT', 'KFRT'))
2750
        self.assertEqual(double_metaphone('Gilbert', 4), ('KLPR', 'JLPR'))
2751
        self.assertEqual(double_metaphone('Gill', 4), ('KL', 'JL'))
2752
        self.assertEqual(double_metaphone('Gilman', 4), ('KLMN', 'JLMN'))
2753
        self.assertEqual(double_metaphone('Glass', 4), ('KLS', ''))
2754
        self.assertEqual(double_metaphone('GoddardGifford', 4), ('KTRJ', ''))
2755
        self.assertEqual(double_metaphone('Godfrey', 4), ('KTFR', ''))
2756
        self.assertEqual(double_metaphone('Godwin', 4), ('KTN', ''))
2757
        self.assertEqual(double_metaphone('Goodale', 4), ('KTL', ''))
2758
        self.assertEqual(double_metaphone('Goodnow', 4), ('KTN', 'KTNF'))
2759
        self.assertEqual(double_metaphone('Gorham', 4), ('KRM', ''))
2760
        self.assertEqual(double_metaphone('Goseline', 4), ('KSLN', ''))
2761
        self.assertEqual(double_metaphone('Gott', 4), ('KT', ''))
2762
        self.assertEqual(double_metaphone('Gould', 4), ('KLT', ''))
2763
        self.assertEqual(double_metaphone('Grafton', 4), ('KRFT', ''))
2764
        self.assertEqual(double_metaphone('Grant', 4), ('KRNT', ''))
2765
        self.assertEqual(double_metaphone('Gray', 4), ('KR', ''))
2766
        self.assertEqual(double_metaphone('Green', 4), ('KRN', ''))
2767
        self.assertEqual(double_metaphone('Griffin', 4), ('KRFN', ''))
2768
        self.assertEqual(double_metaphone('Grill', 4), ('KRL', ''))
2769
        self.assertEqual(double_metaphone('Grim', 4), ('KRM', ''))
2770
        self.assertEqual(double_metaphone('Grisgonelle', 4), ('KRSK', ''))
2771
        self.assertEqual(double_metaphone('Gross', 4), ('KRS', ''))
2772
        self.assertEqual(double_metaphone('Guba', 4), ('KP', ''))
2773
        self.assertEqual(double_metaphone('Gybbes', 4), ('KPS', 'JPS'))
2774
        self.assertEqual(double_metaphone('Haburne', 4), ('HPRN', ''))
2775
        self.assertEqual(double_metaphone('Hackburne', 4), ('HKPR', ''))
2776
        self.assertEqual(double_metaphone('Haddon?', 4), ('HTN', ''))
2777
        self.assertEqual(double_metaphone('Haines', 4), ('HNS', ''))
2778
        self.assertEqual(double_metaphone('Hale', 4), ('HL', ''))
2779
        self.assertEqual(double_metaphone('Hall', 4), ('HL', ''))
2780
        self.assertEqual(double_metaphone('Hallet', 4), ('HLT', ''))
2781
        self.assertEqual(double_metaphone('Hallock', 4), ('HLK', ''))
2782
        self.assertEqual(double_metaphone('Halstead', 4), ('HLST', ''))
2783
        self.assertEqual(double_metaphone('Hammond', 4), ('HMNT', ''))
2784
        self.assertEqual(double_metaphone('Hance', 4), ('HNS', ''))
2785
        self.assertEqual(double_metaphone('Handy', 4), ('HNT', ''))
2786
        self.assertEqual(double_metaphone('Hanson', 4), ('HNSN', ''))
2787
        self.assertEqual(double_metaphone('Harasek', 4), ('HRSK', ''))
2788
        self.assertEqual(double_metaphone('Harcourt', 4), ('HRKR', ''))
2789
        self.assertEqual(double_metaphone('Hardy', 4), ('HRT', ''))
2790
        self.assertEqual(double_metaphone('Harlock', 4), ('HRLK', ''))
2791
        self.assertEqual(double_metaphone('Harris', 4), ('HRS', ''))
2792
        self.assertEqual(double_metaphone('Hartley', 4), ('HRTL', ''))
2793
        self.assertEqual(double_metaphone('Harvey', 4), ('HRF', ''))
2794
        self.assertEqual(double_metaphone('Harvie', 4), ('HRF', ''))
2795
        self.assertEqual(double_metaphone('Harwood', 4), ('HRT', ''))
2796
        self.assertEqual(double_metaphone('Hathaway', 4), ('H0', 'HT'))
2797
        self.assertEqual(double_metaphone('Haukeness', 4), ('HKNS', ''))
2798
        self.assertEqual(double_metaphone('Hawkes', 4), ('HKS', ''))
2799
        self.assertEqual(double_metaphone('Hawkhurst', 4), ('HKRS', ''))
2800
        self.assertEqual(double_metaphone('Hawkins', 4), ('HKNS', ''))
2801
        self.assertEqual(double_metaphone('Hawley', 4), ('HL', ''))
2802
        self.assertEqual(double_metaphone('Heald', 4), ('HLT', ''))
2803
        self.assertEqual(double_metaphone('Helsdon', 4), ('HLST', ''))
2804
        self.assertEqual(double_metaphone('Hemenway', 4), ('HMN', ''))
2805
        self.assertEqual(double_metaphone('Hemmenway', 4), ('HMN', ''))
2806
        self.assertEqual(double_metaphone('Henck', 4), ('HNK', ''))
2807
        self.assertEqual(double_metaphone('Henderson', 4), ('HNTR', ''))
2808
        self.assertEqual(double_metaphone('Hendricks', 4), ('HNTR', ''))
2809
        self.assertEqual(double_metaphone('Hersey', 4), ('HRS', ''))
2810
        self.assertEqual(double_metaphone('Hewes', 4), ('HS', ''))
2811
        self.assertEqual(double_metaphone('Heyman', 4), ('HMN', ''))
2812
        self.assertEqual(double_metaphone('Hicks', 4), ('HKS', ''))
2813
        self.assertEqual(double_metaphone('Hidden', 4), ('HTN', ''))
2814
        self.assertEqual(double_metaphone('Higgs', 4), ('HKS', ''))
2815
        self.assertEqual(double_metaphone('Hill', 4), ('HL', ''))
2816
        self.assertEqual(double_metaphone('Hills', 4), ('HLS', ''))
2817
        self.assertEqual(double_metaphone('Hinckley', 4), ('HNKL', ''))
2818
        self.assertEqual(double_metaphone('Hipwell', 4), ('HPL', ''))
2819
        self.assertEqual(double_metaphone('Hobart', 4), ('HPRT', ''))
2820
        self.assertEqual(double_metaphone('Hoben', 4), ('HPN', ''))
2821
        self.assertEqual(double_metaphone('Hoffmann', 4), ('HFMN', ''))
2822
        self.assertEqual(double_metaphone('Hogan', 4), ('HKN', ''))
2823
        self.assertEqual(double_metaphone('Holmes', 4), ('HLMS', ''))
2824
        self.assertEqual(double_metaphone('Hoo', 4), ('H', ''))
2825
        self.assertEqual(double_metaphone('Hooker', 4), ('HKR', ''))
2826
        self.assertEqual(double_metaphone('Hopcott', 4), ('HPKT', ''))
2827
        self.assertEqual(double_metaphone('Hopkins', 4), ('HPKN', ''))
2828
        self.assertEqual(double_metaphone('Hopkinson', 4), ('HPKN', ''))
2829
        self.assertEqual(double_metaphone('Hornsey', 4), ('HRNS', ''))
2830
        self.assertEqual(double_metaphone('Houckgeest', 4), ('HKJS', 'HKKS'))
2831
        self.assertEqual(double_metaphone('Hough', 4), ('H', ''))
2832
        self.assertEqual(double_metaphone('Houstin', 4), ('HSTN', ''))
2833
        self.assertEqual(double_metaphone('How', 4), ('H', 'HF'))
2834
        self.assertEqual(double_metaphone('Howe', 4), ('H', ''))
2835
        self.assertEqual(double_metaphone('Howland', 4), ('HLNT', ''))
2836
        self.assertEqual(double_metaphone('Hubner', 4), ('HPNR', ''))
2837
        self.assertEqual(double_metaphone('Hudnut', 4), ('HTNT', ''))
2838
        self.assertEqual(double_metaphone('Hughes', 4), ('HS', ''))
2839
        self.assertEqual(double_metaphone('Hull', 4), ('HL', ''))
2840
        self.assertEqual(double_metaphone('Hulme', 4), ('HLM', ''))
2841
        self.assertEqual(double_metaphone('Hume', 4), ('HM', ''))
2842
        self.assertEqual(double_metaphone('Hundertumark', 4), ('HNTR', ''))
2843
        self.assertEqual(double_metaphone('Hundley', 4), ('HNTL', ''))
2844
        self.assertEqual(double_metaphone('Hungerford', 4), ('HNKR', 'HNJR'))
2845
        self.assertEqual(double_metaphone('Hunt', 4), ('HNT', ''))
2846
        self.assertEqual(double_metaphone('Hurst', 4), ('HRST', ''))
2847
        self.assertEqual(double_metaphone('Husbands', 4), ('HSPN', ''))
2848
        self.assertEqual(double_metaphone('Hussey', 4), ('HS', ''))
2849
        self.assertEqual(double_metaphone('Husted', 4), ('HSTT', ''))
2850
        self.assertEqual(double_metaphone('Hutchins', 4), ('HXNS', ''))
2851
        self.assertEqual(double_metaphone('Hutchinson', 4), ('HXNS', ''))
2852
        self.assertEqual(double_metaphone('Huttinger', 4), ('HTNK', 'HTNJ'))
2853
        self.assertEqual(double_metaphone('Huybertsen', 4), ('HPRT', ''))
2854
        self.assertEqual(double_metaphone('Iddenden', 4), ('ATNT', ''))
2855
        self.assertEqual(double_metaphone('Ingraham', 4), ('ANKR', ''))
2856
        self.assertEqual(double_metaphone('Ives', 4), ('AFS', ''))
2857
        self.assertEqual(double_metaphone('Jackson', 4), ('JKSN', 'AKSN'))
2858
        self.assertEqual(double_metaphone('Jacob', 4), ('JKP', 'AKP'))
2859
        self.assertEqual(double_metaphone('Jans', 4), ('JNS', 'ANS'))
2860
        self.assertEqual(double_metaphone('Jenkins', 4), ('JNKN', 'ANKN'))
2861
        self.assertEqual(double_metaphone('Jewett', 4), ('JT', 'AT'))
2862
        self.assertEqual(double_metaphone('Jewitt', 4), ('JT', 'AT'))
2863
        self.assertEqual(double_metaphone('Johnson', 4), ('JNSN', 'ANSN'))
2864
        self.assertEqual(double_metaphone('Jones', 4), ('JNS', 'ANS'))
2865
        self.assertEqual(double_metaphone('Josephine', 4), ('JSFN', 'HSFN'))
2866
        self.assertEqual(double_metaphone('Judd', 4), ('JT', 'AT'))
2867
        self.assertEqual(double_metaphone('June', 4), ('JN', 'AN'))
2868
        self.assertEqual(double_metaphone('Kamarowska', 4), ('KMRS', ''))
2869
        self.assertEqual(double_metaphone('Kay', 4), ('K', ''))
2870
        self.assertEqual(double_metaphone('Kelley', 4), ('KL', ''))
2871
        self.assertEqual(double_metaphone('Kelly', 4), ('KL', ''))
2872
        self.assertEqual(double_metaphone('Keymber', 4), ('KMPR', ''))
2873
        self.assertEqual(double_metaphone('Keynes', 4), ('KNS', ''))
2874
        self.assertEqual(double_metaphone('Kilham', 4), ('KLM', ''))
2875
        self.assertEqual(double_metaphone('Kim', 4), ('KM', ''))
2876
        self.assertEqual(double_metaphone('Kimball', 4), ('KMPL', ''))
2877
        self.assertEqual(double_metaphone('King', 4), ('KNK', ''))
2878
        self.assertEqual(double_metaphone('Kinsey', 4), ('KNS', ''))
2879
        self.assertEqual(double_metaphone('Kirk', 4), ('KRK', ''))
2880
        self.assertEqual(double_metaphone('Kirton', 4), ('KRTN', ''))
2881
        self.assertEqual(double_metaphone('Kistler', 4), ('KSTL', ''))
2882
        self.assertEqual(double_metaphone('Kitchen', 4), ('KXN', ''))
2883
        self.assertEqual(double_metaphone('Kitson', 4), ('KTSN', ''))
2884
        self.assertEqual(double_metaphone('Klett', 4), ('KLT', ''))
2885
        self.assertEqual(double_metaphone('Kline', 4), ('KLN', ''))
2886
        self.assertEqual(double_metaphone('Knapp', 4), ('NP', ''))
2887
        self.assertEqual(double_metaphone('Knight', 4), ('NT', ''))
2888
        self.assertEqual(double_metaphone('Knote', 4), ('NT', ''))
2889
        self.assertEqual(double_metaphone('Knott', 4), ('NT', ''))
2890
        self.assertEqual(double_metaphone('Knox', 4), ('NKS', ''))
2891
        self.assertEqual(double_metaphone('Koeller', 4), ('KLR', ''))
2892
        self.assertEqual(double_metaphone('La Pointe', 4), ('LPNT', ''))
2893
        self.assertEqual(double_metaphone('LaPlante', 4), ('LPLN', ''))
2894
        self.assertEqual(double_metaphone('Laimbeer', 4), ('LMPR', ''))
2895
        self.assertEqual(double_metaphone('Lamb', 4), ('LMP', ''))
2896
        self.assertEqual(double_metaphone('Lambertson', 4), ('LMPR', ''))
2897
        self.assertEqual(double_metaphone('Lancto', 4), ('LNKT', ''))
2898
        self.assertEqual(double_metaphone('Landry', 4), ('LNTR', ''))
2899
        self.assertEqual(double_metaphone('Lane', 4), ('LN', ''))
2900
        self.assertEqual(double_metaphone('Langendyck', 4), ('LNJN', 'LNKN'))
2901
        self.assertEqual(double_metaphone('Langer', 4), ('LNKR', 'LNJR'))
2902
        self.assertEqual(double_metaphone('Langford', 4), ('LNKF', ''))
2903
        self.assertEqual(double_metaphone('Lantersee', 4), ('LNTR', ''))
2904
        self.assertEqual(double_metaphone('Laquer', 4), ('LKR', ''))
2905
        self.assertEqual(double_metaphone('Larkin', 4), ('LRKN', ''))
2906
        self.assertEqual(double_metaphone('Latham', 4), ('LTM', ''))
2907
        self.assertEqual(double_metaphone('Lathrop', 4), ('L0RP', 'LTRP'))
2908
        self.assertEqual(double_metaphone('Lauter', 4), ('LTR', ''))
2909
        self.assertEqual(double_metaphone('Lawrence', 4), ('LRNS', ''))
2910
        self.assertEqual(double_metaphone('Leach', 4), ('LK', ''))
2911
        self.assertEqual(double_metaphone('Leager', 4), ('LKR', 'LJR'))
2912
        self.assertEqual(double_metaphone('Learned', 4), ('LRNT', ''))
2913
        self.assertEqual(double_metaphone('Leavitt', 4), ('LFT', ''))
2914
        self.assertEqual(double_metaphone('Lee', 4), ('L', ''))
2915
        self.assertEqual(double_metaphone('Leete', 4), ('LT', ''))
2916
        self.assertEqual(double_metaphone('Leggett', 4), ('LKT', ''))
2917
        self.assertEqual(double_metaphone('Leland', 4), ('LLNT', ''))
2918
        self.assertEqual(double_metaphone('Leonard', 4), ('LNRT', ''))
2919
        self.assertEqual(double_metaphone('Lester', 4), ('LSTR', ''))
2920
        self.assertEqual(double_metaphone('Lestrange', 4), ('LSTR', ''))
2921
        self.assertEqual(double_metaphone('Lethem', 4), ('L0M', 'LTM'))
2922
        self.assertEqual(double_metaphone('Levine', 4), ('LFN', ''))
2923
        self.assertEqual(double_metaphone('Lewes', 4), ('LS', ''))
2924
        self.assertEqual(double_metaphone('Lewis', 4), ('LS', ''))
2925
        self.assertEqual(double_metaphone('Lincoln', 4), ('LNKL', ''))
2926
        self.assertEqual(double_metaphone('Lindsey', 4), ('LNTS', ''))
2927
        self.assertEqual(double_metaphone('Linher', 4), ('LNR', ''))
2928
        self.assertEqual(double_metaphone('Lippet', 4), ('LPT', ''))
2929
        self.assertEqual(double_metaphone('Lippincott', 4), ('LPNK', ''))
2930
        self.assertEqual(double_metaphone('Lockwood', 4), ('LKT', ''))
2931
        self.assertEqual(double_metaphone('Loines', 4), ('LNS', ''))
2932
        self.assertEqual(double_metaphone('Lombard', 4), ('LMPR', ''))
2933
        self.assertEqual(double_metaphone('Long', 4), ('LNK', ''))
2934
        self.assertEqual(double_metaphone('Longespee', 4), ('LNJS', 'LNKS'))
2935
        self.assertEqual(double_metaphone('Look', 4), ('LK', ''))
2936
        self.assertEqual(double_metaphone('Lounsberry', 4), ('LNSP', ''))
2937
        self.assertEqual(double_metaphone('Lounsbury', 4), ('LNSP', ''))
2938
        self.assertEqual(double_metaphone('Louthe', 4), ('L0', 'LT'))
2939
        self.assertEqual(double_metaphone('Loveyne', 4), ('LFN', ''))
2940
        self.assertEqual(double_metaphone('Lowe', 4), ('L', ''))
2941
        self.assertEqual(double_metaphone('Ludlam', 4), ('LTLM', ''))
2942
        self.assertEqual(double_metaphone('Lumbard', 4), ('LMPR', ''))
2943
        self.assertEqual(double_metaphone('Lund', 4), ('LNT', ''))
2944
        self.assertEqual(double_metaphone('Luno', 4), ('LN', ''))
2945
        self.assertEqual(double_metaphone('Lutz', 4), ('LTS', ''))
2946
        self.assertEqual(double_metaphone('Lydia', 4), ('LT', ''))
2947
        self.assertEqual(double_metaphone('Lynne', 4), ('LN', ''))
2948
        self.assertEqual(double_metaphone('Lyon', 4), ('LN', ''))
2949
        self.assertEqual(double_metaphone('MacAlpin', 4), ('MKLP', ''))
2950
        self.assertEqual(double_metaphone('MacBricc', 4), ('MKPR', ''))
2951
        self.assertEqual(double_metaphone('MacCrinan', 4), ('MKRN', ''))
2952
        self.assertEqual(double_metaphone('MacKenneth', 4), ('MKN0', 'MKNT'))
2953
        self.assertEqual(double_metaphone('MacMael nam Bo', 4), ('MKML', ''))
2954
        self.assertEqual(double_metaphone('MacMurchada', 4), ('MKMR', ''))
2955
        self.assertEqual(double_metaphone('Macomber', 4), ('MKMP', ''))
2956
        self.assertEqual(double_metaphone('Macy', 4), ('MS', ''))
2957
        self.assertEqual(double_metaphone('Magnus', 4), ('MNS', 'MKNS'))
2958
        self.assertEqual(double_metaphone('Mahien', 4), ('MHN', ''))
2959
        self.assertEqual(double_metaphone('Malmains', 4), ('MLMN', ''))
2960
        self.assertEqual(double_metaphone('Malory', 4), ('MLR', ''))
2961
        self.assertEqual(double_metaphone('Mancinelli', 4), ('MNSN', ''))
2962
        self.assertEqual(double_metaphone('Mancini', 4), ('MNSN', ''))
2963
        self.assertEqual(double_metaphone('Mann', 4), ('MN', ''))
2964
        self.assertEqual(double_metaphone('Manning', 4), ('MNNK', ''))
2965
        self.assertEqual(double_metaphone('Manter', 4), ('MNTR', ''))
2966
        self.assertEqual(double_metaphone('Marion', 4), ('MRN', ''))
2967
        self.assertEqual(double_metaphone('Marley', 4), ('MRL', ''))
2968
        self.assertEqual(double_metaphone('Marmion', 4), ('MRMN', ''))
2969
        self.assertEqual(double_metaphone('Marquart', 4), ('MRKR', ''))
2970
        self.assertEqual(double_metaphone('Marsh', 4), ('MRX', ''))
2971
        self.assertEqual(double_metaphone('Marshal', 4), ('MRXL', ''))
2972
        self.assertEqual(double_metaphone('Marshall', 4), ('MRXL', ''))
2973
        self.assertEqual(double_metaphone('Martel', 4), ('MRTL', ''))
2974
        self.assertEqual(double_metaphone('Martha', 4), ('MR0', 'MRT'))
2975
        self.assertEqual(double_metaphone('Martin', 4), ('MRTN', ''))
2976
        self.assertEqual(double_metaphone('Marturano', 4), ('MRTR', ''))
2977
        self.assertEqual(double_metaphone('Marvin', 4), ('MRFN', ''))
2978
        self.assertEqual(double_metaphone('Mary', 4), ('MR', ''))
2979
        self.assertEqual(double_metaphone('Mason', 4), ('MSN', ''))
2980
        self.assertEqual(double_metaphone('Maxwell', 4), ('MKSL', ''))
2981
        self.assertEqual(double_metaphone('Mayhew', 4), ('MH', 'MHF'))
2982
        self.assertEqual(double_metaphone('McAllaster', 4), ('MKLS', ''))
2983
        self.assertEqual(double_metaphone('McAllister', 4), ('MKLS', ''))
2984
        self.assertEqual(double_metaphone('McConnell', 4), ('MKNL', ''))
2985
        self.assertEqual(double_metaphone('McFarland', 4), ('MKFR', ''))
2986
        self.assertEqual(double_metaphone('McIlroy', 4), ('MSLR', ''))
2987
        self.assertEqual(double_metaphone('McNair', 4), ('MKNR', ''))
2988
        self.assertEqual(double_metaphone('McNair-Landry', 4), ('MKNR', ''))
2989
        self.assertEqual(double_metaphone('McRaven', 4), ('MKRF', ''))
2990
        self.assertEqual(double_metaphone('Mead', 4), ('MT', ''))
2991
        self.assertEqual(double_metaphone('Meade', 4), ('MT', ''))
2992
        self.assertEqual(double_metaphone('Meck', 4), ('MK', ''))
2993
        self.assertEqual(double_metaphone('Melton', 4), ('MLTN', ''))
2994
        self.assertEqual(double_metaphone('Mendenhall', 4), ('MNTN', ''))
2995
        self.assertEqual(double_metaphone('Mering', 4), ('MRNK', ''))
2996
        self.assertEqual(double_metaphone('Merrick', 4), ('MRK', ''))
2997
        self.assertEqual(double_metaphone('Merry', 4), ('MR', ''))
2998
        self.assertEqual(double_metaphone('Mighill', 4), ('ML', ''))
2999
        self.assertEqual(double_metaphone('Miller', 4), ('MLR', ''))
3000
        self.assertEqual(double_metaphone('Milton', 4), ('MLTN', ''))
3001
        self.assertEqual(double_metaphone('Mohun', 4), ('MHN', ''))
3002
        self.assertEqual(double_metaphone('Montague', 4), ('MNTK', ''))
3003
        self.assertEqual(double_metaphone('Montboucher', 4), ('MNTP', ''))
3004
        self.assertEqual(double_metaphone('Moore', 4), ('MR', ''))
3005
        self.assertEqual(double_metaphone('Morrel', 4), ('MRL', ''))
3006
        self.assertEqual(double_metaphone('Morrill', 4), ('MRL', ''))
3007
        self.assertEqual(double_metaphone('Morris', 4), ('MRS', ''))
3008
        self.assertEqual(double_metaphone('Morton', 4), ('MRTN', ''))
3009
        self.assertEqual(double_metaphone('Moton', 4), ('MTN', ''))
3010
        self.assertEqual(double_metaphone('Muir', 4), ('MR', ''))
3011
        self.assertEqual(double_metaphone('Mulferd', 4), ('MLFR', ''))
3012
        self.assertEqual(double_metaphone('Mullins', 4), ('MLNS', ''))
3013
        self.assertEqual(double_metaphone('Mulso', 4), ('MLS', ''))
3014
        self.assertEqual(double_metaphone('Munger', 4), ('MNKR', 'MNJR'))
3015
        self.assertEqual(double_metaphone('Munt', 4), ('MNT', ''))
3016
        self.assertEqual(double_metaphone('Murchad', 4), ('MRXT', 'MRKT'))
3017
        self.assertEqual(double_metaphone('Murdock', 4), ('MRTK', ''))
3018
        self.assertEqual(double_metaphone('Murray', 4), ('MR', ''))
3019
        self.assertEqual(double_metaphone('Muskett', 4), ('MSKT', ''))
3020
        self.assertEqual(double_metaphone('Myers', 4), ('MRS', ''))
3021
        self.assertEqual(double_metaphone('Myrick', 4), ('MRK', ''))
3022
        self.assertEqual(double_metaphone('NORRIS', 4), ('NRS', ''))
3023
        self.assertEqual(double_metaphone('Nayle', 4), ('NL', ''))
3024
        self.assertEqual(double_metaphone('Newcomb', 4), ('NKMP', ''))
3025
        self.assertEqual(double_metaphone('Newcomb(e)', 4), ('NKMP', ''))
3026
        self.assertEqual(double_metaphone('Newkirk', 4), ('NKRK', ''))
3027
        self.assertEqual(double_metaphone('Newton', 4), ('NTN', ''))
3028
        self.assertEqual(double_metaphone('Niles', 4), ('NLS', ''))
3029
        self.assertEqual(double_metaphone('Noble', 4), ('NPL', ''))
3030
        self.assertEqual(double_metaphone('Noel', 4), ('NL', ''))
3031
        self.assertEqual(double_metaphone('Northend', 4), ('NR0N', 'NRTN'))
3032
        self.assertEqual(double_metaphone('Norton', 4), ('NRTN', ''))
3033
        self.assertEqual(double_metaphone('Nutter', 4), ('NTR', ''))
3034
        self.assertEqual(double_metaphone('Odding', 4), ('ATNK', ''))
3035
        self.assertEqual(double_metaphone('Odenbaugh', 4), ('ATNP', ''))
3036
        self.assertEqual(double_metaphone('Ogborn', 4), ('AKPR', ''))
3037
        self.assertEqual(double_metaphone('Oppenheimer', 4), ('APNM', ''))
3038
        self.assertEqual(double_metaphone('Otis', 4), ('ATS', ''))
3039
        self.assertEqual(double_metaphone('Oviatt', 4), ('AFT', ''))
3040
        self.assertEqual(double_metaphone('PRUST?', 4), ('PRST', ''))
3041
        self.assertEqual(double_metaphone('Paddock', 4), ('PTK', ''))
3042
        self.assertEqual(double_metaphone('Page', 4), ('PJ', 'PK'))
3043
        self.assertEqual(double_metaphone('Paine', 4), ('PN', ''))
3044
        self.assertEqual(double_metaphone('Paist', 4), ('PST', ''))
3045
        self.assertEqual(double_metaphone('Palmer', 4), ('PLMR', ''))
3046
        self.assertEqual(double_metaphone('Park', 4), ('PRK', ''))
3047
        self.assertEqual(double_metaphone('Parker', 4), ('PRKR', ''))
3048
        self.assertEqual(double_metaphone('Parkhurst', 4), ('PRKR', ''))
3049
        self.assertEqual(double_metaphone('Parrat', 4), ('PRT', ''))
3050
        self.assertEqual(double_metaphone('Parsons', 4), ('PRSN', ''))
3051
        self.assertEqual(double_metaphone('Partridge', 4), ('PRTR', ''))
3052
        self.assertEqual(double_metaphone('Pashley', 4), ('PXL', ''))
3053
        self.assertEqual(double_metaphone('Pasley', 4), ('PSL', ''))
3054
        self.assertEqual(double_metaphone('Patrick', 4), ('PTRK', ''))
3055
        self.assertEqual(double_metaphone('Pattee', 4), ('PT', ''))
3056
        self.assertEqual(double_metaphone('Patten', 4), ('PTN', ''))
3057
        self.assertEqual(double_metaphone('Pawley', 4), ('PL', ''))
3058
        self.assertEqual(double_metaphone('Payne', 4), ('PN', ''))
3059
        self.assertEqual(double_metaphone('Peabody', 4), ('PPT', ''))
3060
        self.assertEqual(double_metaphone('Peake', 4), ('PK', ''))
3061
        self.assertEqual(double_metaphone('Pearson', 4), ('PRSN', ''))
3062
        self.assertEqual(double_metaphone('Peat', 4), ('PT', ''))
3063
        self.assertEqual(double_metaphone('Pedersen', 4), ('PTRS', ''))
3064
        self.assertEqual(double_metaphone('Percy', 4), ('PRS', ''))
3065
        self.assertEqual(double_metaphone('Perkins', 4), ('PRKN', ''))
3066
        self.assertEqual(double_metaphone('Perrine', 4), ('PRN', ''))
3067
        self.assertEqual(double_metaphone('Perry', 4), ('PR', ''))
3068
        self.assertEqual(double_metaphone('Peson', 4), ('PSN', ''))
3069
        self.assertEqual(double_metaphone('Peterson', 4), ('PTRS', ''))
3070
        self.assertEqual(double_metaphone('Peyton', 4), ('PTN', ''))
3071
        self.assertEqual(double_metaphone('Phinney', 4), ('FN', ''))
3072
        self.assertEqual(double_metaphone('Pickard', 4), ('PKRT', ''))
3073
        self.assertEqual(double_metaphone('Pierce', 4), ('PRS', ''))
3074
        self.assertEqual(double_metaphone('Pierrepont', 4), ('PRPN', ''))
3075
        self.assertEqual(double_metaphone('Pike', 4), ('PK', ''))
3076
        self.assertEqual(double_metaphone('Pinkham', 4), ('PNKM', ''))
3077
        self.assertEqual(double_metaphone('Pitman', 4), ('PTMN', ''))
3078
        self.assertEqual(double_metaphone('Pitt', 4), ('PT', ''))
3079
        self.assertEqual(double_metaphone('Pitts', 4), ('PTS', ''))
3080
        self.assertEqual(double_metaphone('Plantagenet', 4), ('PLNT', ''))
3081
        self.assertEqual(double_metaphone('Platt', 4), ('PLT', ''))
3082
        self.assertEqual(double_metaphone('Platts', 4), ('PLTS', ''))
3083
        self.assertEqual(double_metaphone('Pleis', 4), ('PLS', ''))
3084
        self.assertEqual(double_metaphone('Pleiss', 4), ('PLS', ''))
3085
        self.assertEqual(double_metaphone('Plisko', 4), ('PLSK', ''))
3086
        self.assertEqual(double_metaphone('Pliskovitch', 4), ('PLSK', ''))
3087
        self.assertEqual(double_metaphone('Plum', 4), ('PLM', ''))
3088
        self.assertEqual(double_metaphone('Plume', 4), ('PLM', ''))
3089
        self.assertEqual(double_metaphone('Poitou', 4), ('PT', ''))
3090
        self.assertEqual(double_metaphone('Pomeroy', 4), ('PMR', ''))
3091
        self.assertEqual(double_metaphone('Poretiers', 4), ('PRTR', ''))
3092
        self.assertEqual(double_metaphone('Pote', 4), ('PT', ''))
3093
        self.assertEqual(double_metaphone('Potter', 4), ('PTR', ''))
3094
        self.assertEqual(double_metaphone('Potts', 4), ('PTS', ''))
3095
        self.assertEqual(double_metaphone('Powell', 4), ('PL', ''))
3096
        self.assertEqual(double_metaphone('Pratt', 4), ('PRT', ''))
3097
        self.assertEqual(double_metaphone('Presbury', 4), ('PRSP', ''))
3098
        self.assertEqual(double_metaphone('Priest', 4), ('PRST', ''))
3099
        self.assertEqual(double_metaphone('Prindle', 4), ('PRNT', ''))
3100
        self.assertEqual(double_metaphone('Prior', 4), ('PRR', ''))
3101
        self.assertEqual(double_metaphone('Profumo', 4), ('PRFM', ''))
3102
        self.assertEqual(double_metaphone('Purdy', 4), ('PRT', ''))
3103
        self.assertEqual(double_metaphone('Purefoy', 4), ('PRF', ''))
3104
        self.assertEqual(double_metaphone('Pury', 4), ('PR', ''))
3105
        self.assertEqual(double_metaphone('Quinter', 4), ('KNTR', ''))
3106
        self.assertEqual(double_metaphone('Rachel', 4), ('RXL', 'RKL'))
3107
        self.assertEqual(double_metaphone('Rand', 4), ('RNT', ''))
3108
        self.assertEqual(double_metaphone('Rankin', 4), ('RNKN', ''))
3109
        self.assertEqual(double_metaphone('Ravenscroft', 4), ('RFNS', ''))
3110
        self.assertEqual(double_metaphone('Raynsford', 4), ('RNSF', ''))
3111
        self.assertEqual(double_metaphone('Reakirt', 4), ('RKRT', ''))
3112
        self.assertEqual(double_metaphone('Reaves', 4), ('RFS', ''))
3113
        self.assertEqual(double_metaphone('Reeves', 4), ('RFS', ''))
3114
        self.assertEqual(double_metaphone('Reichert', 4), ('RXRT', 'RKRT'))
3115
        self.assertEqual(double_metaphone('Remmele', 4), ('RML', ''))
3116
        self.assertEqual(double_metaphone('Reynolds', 4), ('RNLT', ''))
3117
        self.assertEqual(double_metaphone('Rhodes', 4), ('RTS', ''))
3118
        self.assertEqual(double_metaphone('Richards', 4), ('RXRT', 'RKRT'))
3119
        self.assertEqual(double_metaphone('Richardson', 4), ('RXRT', 'RKRT'))
3120
        self.assertEqual(double_metaphone('Ring', 4), ('RNK', ''))
3121
        self.assertEqual(double_metaphone('Roberts', 4), ('RPRT', ''))
3122
        self.assertEqual(double_metaphone('Robertson', 4), ('RPRT', ''))
3123
        self.assertEqual(double_metaphone('Robson', 4), ('RPSN', ''))
3124
        self.assertEqual(double_metaphone('Rodie', 4), ('RT', ''))
3125
        self.assertEqual(double_metaphone('Rody', 4), ('RT', ''))
3126
        self.assertEqual(double_metaphone('Rogers', 4), ('RKRS', 'RJRS'))
3127
        self.assertEqual(double_metaphone('Ross', 4), ('RS', ''))
3128
        self.assertEqual(double_metaphone('Rosslevin', 4), ('RSLF', ''))
3129
        self.assertEqual(double_metaphone('Rowland', 4), ('RLNT', ''))
3130
        self.assertEqual(double_metaphone('Ruehl', 4), ('RL', ''))
3131
        self.assertEqual(double_metaphone('Russell', 4), ('RSL', ''))
3132
        self.assertEqual(double_metaphone('Ruth', 4), ('R0', 'RT'))
3133
        self.assertEqual(double_metaphone('Ryan', 4), ('RN', ''))
3134
        self.assertEqual(double_metaphone('Rysse', 4), ('RS', ''))
3135
        self.assertEqual(double_metaphone('Sadler', 4), ('STLR', ''))
3136
        self.assertEqual(double_metaphone('Salmon', 4), ('SLMN', ''))
3137
        self.assertEqual(double_metaphone('Salter', 4), ('SLTR', ''))
3138
        self.assertEqual(double_metaphone('Salvatore', 4), ('SLFT', ''))
3139
        self.assertEqual(double_metaphone('Sanders', 4), ('SNTR', ''))
3140
        self.assertEqual(double_metaphone('Sands', 4), ('SNTS', ''))
3141
        self.assertEqual(double_metaphone('Sanford', 4), ('SNFR', ''))
3142
        self.assertEqual(double_metaphone('Sanger', 4), ('SNKR', 'SNJR'))
3143
        self.assertEqual(double_metaphone('Sargent', 4), ('SRJN', 'SRKN'))
3144
        self.assertEqual(double_metaphone('Saunders', 4), ('SNTR', ''))
3145
        self.assertEqual(double_metaphone('Schilling', 4), ('XLNK', ''))
3146
        self.assertEqual(double_metaphone('Schlegel', 4), ('XLKL', 'SLKL'))
3147
        self.assertEqual(double_metaphone('Scott', 4), ('SKT', ''))
3148
        self.assertEqual(double_metaphone('Sears', 4), ('SRS', ''))
3149
        self.assertEqual(double_metaphone('Segersall', 4), ('SJRS', 'SKRS'))
3150
        self.assertEqual(double_metaphone('Senecal', 4), ('SNKL', ''))
3151
        self.assertEqual(double_metaphone('Sergeaux', 4), ('SRJ', 'SRK'))
3152
        self.assertEqual(double_metaphone('Severance', 4), ('SFRN', ''))
3153
        self.assertEqual(double_metaphone('Sharp', 4), ('XRP', ''))
3154
        self.assertEqual(double_metaphone('Sharpe', 4), ('XRP', ''))
3155
        self.assertEqual(double_metaphone('Sharply', 4), ('XRPL', ''))
3156
        self.assertEqual(double_metaphone('Shatswell', 4), ('XTSL', ''))
3157
        self.assertEqual(double_metaphone('Shattack', 4), ('XTK', ''))
3158
        self.assertEqual(double_metaphone('Shattock', 4), ('XTK', ''))
3159
        self.assertEqual(double_metaphone('Shattuck', 4), ('XTK', ''))
3160
        self.assertEqual(double_metaphone('Shaw', 4), ('X', 'XF'))
3161
        self.assertEqual(double_metaphone('Sheldon', 4), ('XLTN', ''))
3162
        self.assertEqual(double_metaphone('Sherman', 4), ('XRMN', ''))
3163
        self.assertEqual(double_metaphone('Shinn', 4), ('XN', ''))
3164
        self.assertEqual(double_metaphone('Shirford', 4), ('XRFR', ''))
3165
        self.assertEqual(double_metaphone('Shirley', 4), ('XRL', ''))
3166
        self.assertEqual(double_metaphone('Shively', 4), ('XFL', ''))
3167
        self.assertEqual(double_metaphone('Shoemaker', 4), ('XMKR', ''))
3168
        self.assertEqual(double_metaphone('Short', 4), ('XRT', ''))
3169
        self.assertEqual(double_metaphone('Shotwell', 4), ('XTL', ''))
3170
        self.assertEqual(double_metaphone('Shute', 4), ('XT', ''))
3171
        self.assertEqual(double_metaphone('Sibley', 4), ('SPL', ''))
3172
        self.assertEqual(double_metaphone('Silver', 4), ('SLFR', ''))
3173
        self.assertEqual(double_metaphone('Simes', 4), ('SMS', ''))
3174
        self.assertEqual(double_metaphone('Sinken', 4), ('SNKN', ''))
3175
        self.assertEqual(double_metaphone('Sinn', 4), ('SN', ''))
3176
        self.assertEqual(double_metaphone('Skelton', 4), ('SKLT', ''))
3177
        self.assertEqual(double_metaphone('Skiffe', 4), ('SKF', ''))
3178
        self.assertEqual(double_metaphone('Skotkonung', 4), ('SKTK', ''))
3179
        self.assertEqual(double_metaphone('Slade', 4), ('SLT', 'XLT'))
3180
        self.assertEqual(double_metaphone('Slye', 4), ('SL', 'XL'))
3181
        self.assertEqual(double_metaphone('Smedley', 4), ('SMTL', 'XMTL'))
3182
        self.assertEqual(double_metaphone('Smith', 4), ('SM0', 'XMT'))
3183
        self.assertEqual(double_metaphone('Snow', 4), ('SN', 'XNF'))
3184
        self.assertEqual(double_metaphone('Soole', 4), ('SL', ''))
3185
        self.assertEqual(double_metaphone('Soule', 4), ('SL', ''))
3186
        self.assertEqual(double_metaphone('Southworth', 4), ('S0R0', 'STRT'))
3187
        self.assertEqual(double_metaphone('Sowles', 4), ('SLS', ''))
3188
        self.assertEqual(double_metaphone('Spalding', 4), ('SPLT', ''))
3189
        self.assertEqual(double_metaphone('Spark', 4), ('SPRK', ''))
3190
        self.assertEqual(double_metaphone('Spencer', 4), ('SPNS', ''))
3191
        self.assertEqual(double_metaphone('Sperry', 4), ('SPR', ''))
3192
        self.assertEqual(double_metaphone('Spofford', 4), ('SPFR', ''))
3193
        self.assertEqual(double_metaphone('Spooner', 4), ('SPNR', ''))
3194
        self.assertEqual(double_metaphone('Sprague', 4), ('SPRK', ''))
3195
        self.assertEqual(double_metaphone('Springer', 4), ('SPRN', ''))
3196
        self.assertEqual(double_metaphone('St. Clair', 4), ('STKL', ''))
3197
        self.assertEqual(double_metaphone('St. Claire', 4), ('STKL', ''))
3198
        self.assertEqual(double_metaphone('St. Leger', 4), ('STLJ', 'STLK'))
3199
        self.assertEqual(double_metaphone('St. Omer', 4), ('STMR', ''))
3200
        self.assertEqual(double_metaphone('Stafferton', 4), ('STFR', ''))
3201
        self.assertEqual(double_metaphone('Stafford', 4), ('STFR', ''))
3202
        self.assertEqual(double_metaphone('Stalham', 4), ('STLM', ''))
3203
        self.assertEqual(double_metaphone('Stanford', 4), ('STNF', ''))
3204
        self.assertEqual(double_metaphone('Stanton', 4), ('STNT', ''))
3205
        self.assertEqual(double_metaphone('Star', 4), ('STR', ''))
3206
        self.assertEqual(double_metaphone('Starbuck', 4), ('STRP', ''))
3207
        self.assertEqual(double_metaphone('Starkey', 4), ('STRK', ''))
3208
        self.assertEqual(double_metaphone('Starkweather', 4), ('STRK', ''))
3209
        self.assertEqual(double_metaphone('Stearns', 4), ('STRN', ''))
3210
        self.assertEqual(double_metaphone('Stebbins', 4), ('STPN', ''))
3211
        self.assertEqual(double_metaphone('Steele', 4), ('STL', ''))
3212
        self.assertEqual(double_metaphone('Stephenson', 4), ('STFN', ''))
3213
        self.assertEqual(double_metaphone('Stevens', 4), ('STFN', ''))
3214
        self.assertEqual(double_metaphone('Stoddard', 4), ('STTR', ''))
3215
        self.assertEqual(double_metaphone('Stodder', 4), ('STTR', ''))
3216
        self.assertEqual(double_metaphone('Stone', 4), ('STN', ''))
3217
        self.assertEqual(double_metaphone('Storey', 4), ('STR', ''))
3218
        self.assertEqual(double_metaphone('Storrada', 4), ('STRT', ''))
3219
        self.assertEqual(double_metaphone('Story', 4), ('STR', ''))
3220
        self.assertEqual(double_metaphone('Stoughton', 4), ('STFT', ''))
3221
        self.assertEqual(double_metaphone('Stout', 4), ('STT', ''))
3222
        self.assertEqual(double_metaphone('Stow', 4), ('ST', 'STF'))
3223
        self.assertEqual(double_metaphone('Strong', 4), ('STRN', ''))
3224
        self.assertEqual(double_metaphone('Strutt', 4), ('STRT', ''))
3225
        self.assertEqual(double_metaphone('Stryker', 4), ('STRK', ''))
3226
        self.assertEqual(double_metaphone('Stuckeley', 4), ('STKL', ''))
3227
        self.assertEqual(double_metaphone('Sturges', 4), ('STRJ', 'STRK'))
3228
        self.assertEqual(double_metaphone('Sturgess', 4), ('STRJ', 'STRK'))
3229
        self.assertEqual(double_metaphone('Sturgis', 4), ('STRJ', 'STRK'))
3230
        self.assertEqual(double_metaphone('Suevain', 4), ('SFN', ''))
3231
        self.assertEqual(double_metaphone('Sulyard', 4), ('SLRT', ''))
3232
        self.assertEqual(double_metaphone('Sutton', 4), ('STN', ''))
3233
        self.assertEqual(double_metaphone('Swain', 4), ('SN', 'XN'))
3234
        self.assertEqual(double_metaphone('Swayne', 4), ('SN', 'XN'))
3235
        self.assertEqual(double_metaphone('Swayze', 4), ('SS', 'XTS'))
3236
        self.assertEqual(double_metaphone('Swift', 4), ('SFT', 'XFT'))
3237
        self.assertEqual(double_metaphone('Taber', 4), ('TPR', ''))
3238
        self.assertEqual(double_metaphone('Talcott', 4), ('TLKT', ''))
3239
        self.assertEqual(double_metaphone('Tarne', 4), ('TRN', ''))
3240
        self.assertEqual(double_metaphone('Tatum', 4), ('TTM', ''))
3241
        self.assertEqual(double_metaphone('Taverner', 4), ('TFRN', ''))
3242
        self.assertEqual(double_metaphone('Taylor', 4), ('TLR', ''))
3243
        self.assertEqual(double_metaphone('Tenney', 4), ('TN', ''))
3244
        self.assertEqual(double_metaphone('Thayer', 4), ('0R', 'TR'))
3245
        self.assertEqual(double_metaphone('Thember', 4), ('0MPR', 'TMPR'))
3246
        self.assertEqual(double_metaphone('Thomas', 4), ('TMS', ''))
3247
        self.assertEqual(double_metaphone('Thompson', 4), ('TMPS', ''))
3248
        self.assertEqual(double_metaphone('Thorne', 4), ('0RN', 'TRN'))
3249
        self.assertEqual(double_metaphone('Thornycraft', 4), ('0RNK', 'TRNK'))
3250
        self.assertEqual(double_metaphone('Threlkeld', 4), ('0RLK', 'TRLK'))
3251
        self.assertEqual(double_metaphone('Throckmorton', 4), ('0RKM', 'TRKM'))
3252
        self.assertEqual(double_metaphone('Thwaits', 4), ('0TS', 'TTS'))
3253
        self.assertEqual(double_metaphone('Tibbetts', 4), ('TPTS', ''))
3254
        self.assertEqual(double_metaphone('Tidd', 4), ('TT', ''))
3255
        self.assertEqual(double_metaphone('Tierney', 4), ('TRN', ''))
3256
        self.assertEqual(double_metaphone('Tilley', 4), ('TL', ''))
3257
        self.assertEqual(double_metaphone('Tillieres', 4), ('TLRS', ''))
3258
        self.assertEqual(double_metaphone('Tilly', 4), ('TL', ''))
3259
        self.assertEqual(double_metaphone('Tisdale', 4), ('TSTL', ''))
3260
        self.assertEqual(double_metaphone('Titus', 4), ('TTS', ''))
3261
        self.assertEqual(double_metaphone('Tobey', 4), ('TP', ''))
3262
        self.assertEqual(double_metaphone('Tooker', 4), ('TKR', ''))
3263
        self.assertEqual(double_metaphone('Towle', 4), ('TL', ''))
3264
        self.assertEqual(double_metaphone('Towne', 4), ('TN', ''))
3265
        self.assertEqual(double_metaphone('Townsend', 4), ('TNSN', ''))
3266
        self.assertEqual(double_metaphone('Treadway', 4), ('TRT', ''))
3267
        self.assertEqual(double_metaphone('Trelawney', 4), ('TRLN', ''))
3268
        self.assertEqual(double_metaphone('Trinder', 4), ('TRNT', ''))
3269
        self.assertEqual(double_metaphone('Tripp', 4), ('TRP', ''))
3270
        self.assertEqual(double_metaphone('Trippe', 4), ('TRP', ''))
3271
        self.assertEqual(double_metaphone('Trott', 4), ('TRT', ''))
3272
        self.assertEqual(double_metaphone('True', 4), ('TR', ''))
3273
        self.assertEqual(double_metaphone('Trussebut', 4), ('TRSP', ''))
3274
        self.assertEqual(double_metaphone('Tucker', 4), ('TKR', ''))
3275
        self.assertEqual(double_metaphone('Turgeon', 4), ('TRJN', 'TRKN'))
3276
        self.assertEqual(double_metaphone('Turner', 4), ('TRNR', ''))
3277
        self.assertEqual(double_metaphone('Tuttle', 4), ('TTL', ''))
3278
        self.assertEqual(double_metaphone('Tyler', 4), ('TLR', ''))
3279
        self.assertEqual(double_metaphone('Tylle', 4), ('TL', ''))
3280
        self.assertEqual(double_metaphone('Tyrrel', 4), ('TRL', ''))
3281
        self.assertEqual(double_metaphone('Ua Tuathail', 4), ('AT0L', 'ATTL'))
3282
        self.assertEqual(double_metaphone('Ulrich', 4), ('ALRX', 'ALRK'))
3283
        self.assertEqual(double_metaphone('Underhill', 4), ('ANTR', ''))
3284
        self.assertEqual(double_metaphone('Underwood', 4), ('ANTR', ''))
3285
        self.assertEqual(double_metaphone('Unknown', 4), ('ANKN', ''))
3286
        self.assertEqual(double_metaphone('Valentine', 4), ('FLNT', ''))
3287
        self.assertEqual(double_metaphone('Van Egmond', 4), ('FNKM', ''))
3288
        self.assertEqual(double_metaphone('Van der Beek', 4), ('FNTR', ''))
3289
        self.assertEqual(double_metaphone('Vaughan', 4), ('FKN', ''))
3290
        self.assertEqual(double_metaphone('Vermenlen', 4), ('FRMN', ''))
3291
        self.assertEqual(double_metaphone('Vincent', 4), ('FNSN', ''))
3292
        self.assertEqual(double_metaphone('Volentine', 4), ('FLNT', ''))
3293
        self.assertEqual(double_metaphone('Wagner', 4), ('AKNR', 'FKNR'))
3294
        self.assertEqual(double_metaphone('Waite', 4), ('AT', 'FT'))
3295
        self.assertEqual(double_metaphone('Walker', 4), ('ALKR', 'FLKR'))
3296
        self.assertEqual(double_metaphone('Walter', 4), ('ALTR', 'FLTR'))
3297
        self.assertEqual(double_metaphone('Wandell', 4), ('ANTL', 'FNTL'))
3298
        self.assertEqual(double_metaphone('Wandesford', 4), ('ANTS', 'FNTS'))
3299
        self.assertEqual(double_metaphone('Warbleton', 4), ('ARPL', 'FRPL'))
3300
        self.assertEqual(double_metaphone('Ward', 4), ('ART', 'FRT'))
3301
        self.assertEqual(double_metaphone('Warde', 4), ('ART', 'FRT'))
3302
        self.assertEqual(double_metaphone('Ware', 4), ('AR', 'FR'))
3303
        self.assertEqual(double_metaphone('Wareham', 4), ('ARHM', 'FRHM'))
3304
        self.assertEqual(double_metaphone('Warner', 4), ('ARNR', 'FRNR'))
3305
        self.assertEqual(double_metaphone('Warren', 4), ('ARN', 'FRN'))
3306
        self.assertEqual(double_metaphone('Washburne', 4), ('AXPR', 'FXPR'))
3307
        self.assertEqual(double_metaphone('Waterbury', 4), ('ATRP', 'FTRP'))
3308
        self.assertEqual(double_metaphone('Watson', 4), ('ATSN', 'FTSN'))
3309
        self.assertEqual(double_metaphone('WatsonEllithorpe', 4),
3310
                         ('ATSN', 'FTSN'))
3311
        self.assertEqual(double_metaphone('Watts', 4), ('ATS', 'FTS'))
3312
        self.assertEqual(double_metaphone('Wayne', 4), ('AN', 'FN'))
3313
        self.assertEqual(double_metaphone('Webb', 4), ('AP', 'FP'))
3314
        self.assertEqual(double_metaphone('Weber', 4), ('APR', 'FPR'))
3315
        self.assertEqual(double_metaphone('Webster', 4), ('APST', 'FPST'))
3316
        self.assertEqual(double_metaphone('Weed', 4), ('AT', 'FT'))
3317
        self.assertEqual(double_metaphone('Weeks', 4), ('AKS', 'FKS'))
3318
        self.assertEqual(double_metaphone('Wells', 4), ('ALS', 'FLS'))
3319
        self.assertEqual(double_metaphone('Wenzell', 4), ('ANSL', 'FNTS'))
3320
        self.assertEqual(double_metaphone('West', 4), ('AST', 'FST'))
3321
        self.assertEqual(double_metaphone('Westbury', 4), ('ASTP', 'FSTP'))
3322
        self.assertEqual(double_metaphone('Whatlocke', 4), ('ATLK', ''))
3323
        self.assertEqual(double_metaphone('Wheeler', 4), ('ALR', ''))
3324
        self.assertEqual(double_metaphone('Whiston', 4), ('ASTN', ''))
3325
        self.assertEqual(double_metaphone('White', 4), ('AT', ''))
3326
        self.assertEqual(double_metaphone('Whitman', 4), ('ATMN', ''))
3327
        self.assertEqual(double_metaphone('Whiton', 4), ('ATN', ''))
3328
        self.assertEqual(double_metaphone('Whitson', 4), ('ATSN', ''))
3329
        self.assertEqual(double_metaphone('Wickes', 4), ('AKS', 'FKS'))
3330
        self.assertEqual(double_metaphone('Wilbur', 4), ('ALPR', 'FLPR'))
3331
        self.assertEqual(double_metaphone('Wilcotes', 4), ('ALKT', 'FLKT'))
3332
        self.assertEqual(double_metaphone('Wilkinson', 4), ('ALKN', 'FLKN'))
3333
        self.assertEqual(double_metaphone('Willets', 4), ('ALTS', 'FLTS'))
3334
        self.assertEqual(double_metaphone('Willett', 4), ('ALT', 'FLT'))
3335
        self.assertEqual(double_metaphone('Willey', 4), ('AL', 'FL'))
3336
        self.assertEqual(double_metaphone('Williams', 4), ('ALMS', 'FLMS'))
3337
        self.assertEqual(double_metaphone('Williston', 4), ('ALST', 'FLST'))
3338
        self.assertEqual(double_metaphone('Wilson', 4), ('ALSN', 'FLSN'))
3339
        self.assertEqual(double_metaphone('Wimes', 4), ('AMS', 'FMS'))
3340
        self.assertEqual(double_metaphone('Winch', 4), ('ANX', 'FNK'))
3341
        self.assertEqual(double_metaphone('Winegar', 4), ('ANKR', 'FNKR'))
3342
        self.assertEqual(double_metaphone('Wing', 4), ('ANK', 'FNK'))
3343
        self.assertEqual(double_metaphone('Winsley', 4), ('ANSL', 'FNSL'))
3344
        self.assertEqual(double_metaphone('Winslow', 4), ('ANSL', 'FNSL'))
3345
        self.assertEqual(double_metaphone('Winthrop', 4), ('AN0R', 'FNTR'))
3346
        self.assertEqual(double_metaphone('Wise', 4), ('AS', 'FS'))
3347
        self.assertEqual(double_metaphone('Wood', 4), ('AT', 'FT'))
3348
        self.assertEqual(double_metaphone('Woodbridge', 4), ('ATPR', 'FTPR'))
3349
        self.assertEqual(double_metaphone('Woodward', 4), ('ATRT', 'FTRT'))
3350
        self.assertEqual(double_metaphone('Wooley', 4), ('AL', 'FL'))
3351
        self.assertEqual(double_metaphone('Woolley', 4), ('AL', 'FL'))
3352
        self.assertEqual(double_metaphone('Worth', 4), ('AR0', 'FRT'))
3353
        self.assertEqual(double_metaphone('Worthen', 4), ('AR0N', 'FRTN'))
3354
        self.assertEqual(double_metaphone('Worthley', 4), ('AR0L', 'FRTL'))
3355
        self.assertEqual(double_metaphone('Wright', 4), ('RT', ''))
3356
        self.assertEqual(double_metaphone('Wyer', 4), ('AR', 'FR'))
3357
        self.assertEqual(double_metaphone('Wyere', 4), ('AR', 'FR'))
3358
        self.assertEqual(double_metaphone('Wynkoop', 4), ('ANKP', 'FNKP'))
3359
        self.assertEqual(double_metaphone('Yarnall', 4), ('ARNL', ''))
3360
        self.assertEqual(double_metaphone('Yeoman', 4), ('AMN', ''))
3361
        self.assertEqual(double_metaphone('Yorke', 4), ('ARK', ''))
3362
        self.assertEqual(double_metaphone('Young', 4), ('ANK', ''))
3363
        self.assertEqual(double_metaphone('ab Wennonwen', 4), ('APNN', ''))
3364
        self.assertEqual(double_metaphone('ap Llewellyn', 4), ('APLL', ''))
3365
        self.assertEqual(double_metaphone('ap Lorwerth', 4), ('APLR', ''))
3366
        self.assertEqual(double_metaphone('d\'Angouleme', 4), ('TNKL', ''))
3367
        self.assertEqual(double_metaphone('de Audeham', 4), ('TTHM', ''))
3368
        self.assertEqual(double_metaphone('de Bavant', 4), ('TPFN', ''))
3369
        self.assertEqual(double_metaphone('de Beauchamp', 4), ('TPXM', 'TPKM'))
3370
        self.assertEqual(double_metaphone('de Beaumont', 4), ('TPMN', ''))
3371
        self.assertEqual(double_metaphone('de Bolbec', 4), ('TPLP', ''))
3372
        self.assertEqual(double_metaphone('de Braiose', 4), ('TPRS', ''))
3373
        self.assertEqual(double_metaphone('de Braose', 4), ('TPRS', ''))
3374
        self.assertEqual(double_metaphone('de Briwere', 4), ('TPRR', ''))
3375
        self.assertEqual(double_metaphone('de Cantelou', 4), ('TKNT', ''))
3376
        self.assertEqual(double_metaphone('de Cherelton', 4), ('TXRL', 'TKRL'))
3377
        self.assertEqual(double_metaphone('de Cherleton', 4), ('TXRL', 'TKRL'))
3378
        self.assertEqual(double_metaphone('de Clare', 4), ('TKLR', ''))
3379
        self.assertEqual(double_metaphone('de Claremont', 4), ('TKLR', ''))
3380
        self.assertEqual(double_metaphone('de Clifford', 4), ('TKLF', ''))
3381
        self.assertEqual(double_metaphone('de Colville', 4), ('TKLF', ''))
3382
        self.assertEqual(double_metaphone('de Courtenay', 4), ('TKRT', ''))
3383
        self.assertEqual(double_metaphone('de Fauconberg', 4), ('TFKN', ''))
3384
        self.assertEqual(double_metaphone('de Forest', 4), ('TFRS', ''))
3385
        self.assertEqual(double_metaphone('de Gai', 4), ('TK', ''))
3386
        self.assertEqual(double_metaphone('de Grey', 4), ('TKR', ''))
3387
        self.assertEqual(double_metaphone('de Guernons', 4), ('TKRN', ''))
3388
        self.assertEqual(double_metaphone('de Haia', 4), ('T', ''))
3389
        self.assertEqual(double_metaphone('de Harcourt', 4), ('TRKR', ''))
3390
        self.assertEqual(double_metaphone('de Hastings', 4), ('TSTN', ''))
3391
        self.assertEqual(double_metaphone('de Hoke', 4), ('TK', ''))
3392
        self.assertEqual(double_metaphone('de Hooch', 4), ('TK', ''))
3393
        self.assertEqual(double_metaphone('de Hugelville', 4),
3394
                         ('TJLF', 'TKLF'))
3395
        self.assertEqual(double_metaphone('de Huntingdon', 4), ('TNTN', ''))
3396
        self.assertEqual(double_metaphone('de Insula', 4), ('TNSL', ''))
3397
        self.assertEqual(double_metaphone('de Keynes', 4), ('TKNS', ''))
3398
        self.assertEqual(double_metaphone('de Lacy', 4), ('TLS', ''))
3399
        self.assertEqual(double_metaphone('de Lexington', 4), ('TLKS', ''))
3400
        self.assertEqual(double_metaphone('de Lusignan', 4), ('TLSN', 'TLSK'))
3401
        self.assertEqual(double_metaphone('de Manvers', 4), ('TMNF', ''))
3402
        self.assertEqual(double_metaphone('de Montagu', 4), ('TMNT', ''))
3403
        self.assertEqual(double_metaphone('de Montault', 4), ('TMNT', ''))
3404
        self.assertEqual(double_metaphone('de Montfort', 4), ('TMNT', ''))
3405
        self.assertEqual(double_metaphone('de Mortimer', 4), ('TMRT', ''))
3406
        self.assertEqual(double_metaphone('de Morville', 4), ('TMRF', ''))
3407
        self.assertEqual(double_metaphone('de Morvois', 4), ('TMRF', ''))
3408
        self.assertEqual(double_metaphone('de Neufmarche', 4), ('TNFM', ''))
3409
        self.assertEqual(double_metaphone('de Odingsells', 4), ('TTNK', ''))
3410
        self.assertEqual(double_metaphone('de Odyngsells', 4), ('TTNK', ''))
3411
        self.assertEqual(double_metaphone('de Percy', 4), ('TPRS', ''))
3412
        self.assertEqual(double_metaphone('de Pierrepont', 4), ('TPRP', ''))
3413
        self.assertEqual(double_metaphone('de Plessetis', 4), ('TPLS', ''))
3414
        self.assertEqual(double_metaphone('de Porhoet', 4), ('TPRT', ''))
3415
        self.assertEqual(double_metaphone('de Prouz', 4), ('TPRS', ''))
3416
        self.assertEqual(double_metaphone('de Quincy', 4), ('TKNS', ''))
3417
        self.assertEqual(double_metaphone('de Ripellis', 4), ('TRPL', ''))
3418
        self.assertEqual(double_metaphone('de Ros', 4), ('TRS', ''))
3419
        self.assertEqual(double_metaphone('de Salisbury', 4), ('TSLS', ''))
3420
        self.assertEqual(double_metaphone('de Sanford', 4), ('TSNF', ''))
3421
        self.assertEqual(double_metaphone('de Somery', 4), ('TSMR', ''))
3422
        self.assertEqual(double_metaphone('de St. Hilary', 4), ('TSTL', ''))
3423
        self.assertEqual(double_metaphone('de St. Liz', 4), ('TSTL', ''))
3424
        self.assertEqual(double_metaphone('de Sutton', 4), ('TSTN', ''))
3425
        self.assertEqual(double_metaphone('de Toeni', 4), ('TTN', ''))
3426
        self.assertEqual(double_metaphone('de Tony', 4), ('TTN', ''))
3427
        self.assertEqual(double_metaphone('de Umfreville', 4), ('TMFR', ''))
3428
        self.assertEqual(double_metaphone('de Valognes', 4), ('TFLN', 'TFLK'))
3429
        self.assertEqual(double_metaphone('de Vaux', 4), ('TF', ''))
3430
        self.assertEqual(double_metaphone('de Vere', 4), ('TFR', ''))
3431
        self.assertEqual(double_metaphone('de Vermandois', 4), ('TFRM', ''))
3432
        self.assertEqual(double_metaphone('de Vernon', 4), ('TFRN', ''))
3433
        self.assertEqual(double_metaphone('de Vexin', 4), ('TFKS', ''))
3434
        self.assertEqual(double_metaphone('de Vitre', 4), ('TFTR', ''))
3435
        self.assertEqual(double_metaphone('de Wandesford', 4), ('TNTS', ''))
3436
        self.assertEqual(double_metaphone('de Warenne', 4), ('TRN', ''))
3437
        self.assertEqual(double_metaphone('de Westbury', 4), ('TSTP', ''))
3438
        self.assertEqual(double_metaphone('di Saluzzo', 4), ('TSLS', 'TSLT'))
3439
        self.assertEqual(double_metaphone('fitz Alan', 4), ('FTSL', ''))
3440
        self.assertEqual(double_metaphone('fitz Geoffrey', 4),
3441
                         ('FTSJ', 'FTSK'))
3442
        self.assertEqual(double_metaphone('fitz Herbert', 4), ('FTSR', ''))
3443
        self.assertEqual(double_metaphone('fitz John', 4), ('FTSJ', ''))
3444
        self.assertEqual(double_metaphone('fitz Patrick', 4), ('FTSP', ''))
3445
        self.assertEqual(double_metaphone('fitz Payn', 4), ('FTSP', ''))
3446
        self.assertEqual(double_metaphone('fitz Piers', 4), ('FTSP', ''))
3447
        self.assertEqual(double_metaphone('fitz Randolph', 4), ('FTSR', ''))
3448
        self.assertEqual(double_metaphone('fitz Richard', 4), ('FTSR', ''))
3449
        self.assertEqual(double_metaphone('fitz Robert', 4), ('FTSR', ''))
3450
        self.assertEqual(double_metaphone('fitz Roy', 4), ('FTSR', ''))
3451
        self.assertEqual(double_metaphone('fitz Scrob', 4), ('FTSS', ''))
3452
        self.assertEqual(double_metaphone('fitz Walter', 4), ('FTSL', ''))
3453
        self.assertEqual(double_metaphone('fitz Warin', 4), ('FTSR', ''))
3454
        self.assertEqual(double_metaphone('fitz Williams', 4), ('FTSL', ''))
3455
        self.assertEqual(double_metaphone('la Zouche', 4), ('LSX', 'LSK'))
3456
        self.assertEqual(double_metaphone('le Botiller', 4), ('LPTL', ''))
3457
        self.assertEqual(double_metaphone('le Despenser', 4), ('LTSP', ''))
3458
        self.assertEqual(double_metaphone('le deSpencer', 4), ('LTSP', ''))
3459
        self.assertEqual(double_metaphone('of Allendale', 4), ('AFLN', ''))
3460
        self.assertEqual(double_metaphone('of Angouleme', 4), ('AFNK', ''))
3461
        self.assertEqual(double_metaphone('of Anjou', 4), ('AFNJ', ''))
3462
        self.assertEqual(double_metaphone('of Aquitaine', 4), ('AFKT', ''))
3463
        self.assertEqual(double_metaphone('of Aumale', 4), ('AFML', ''))
3464
        self.assertEqual(double_metaphone('of Bavaria', 4), ('AFPF', ''))
3465
        self.assertEqual(double_metaphone('of Boulogne', 4), ('AFPL', ''))
3466
        self.assertEqual(double_metaphone('of Brittany', 4), ('AFPR', ''))
3467
        self.assertEqual(double_metaphone('of Brittary', 4), ('AFPR', ''))
3468
        self.assertEqual(double_metaphone('of Castile', 4), ('AFKS', ''))
3469
        self.assertEqual(double_metaphone('of Chester', 4), ('AFXS', 'AFKS'))
3470
        self.assertEqual(double_metaphone('of Clermont', 4), ('AFKL', ''))
3471
        self.assertEqual(double_metaphone('of Cologne', 4), ('AFKL', ''))
3472
        self.assertEqual(double_metaphone('of Dinan', 4), ('AFTN', ''))
3473
        self.assertEqual(double_metaphone('of Dunbar', 4), ('AFTN', ''))
3474
        self.assertEqual(double_metaphone('of England', 4), ('AFNK', ''))
3475
        self.assertEqual(double_metaphone('of Essex', 4), ('AFSK', ''))
3476
        self.assertEqual(double_metaphone('of Falaise', 4), ('AFFL', ''))
3477
        self.assertEqual(double_metaphone('of Flanders', 4), ('AFFL', ''))
3478
        self.assertEqual(double_metaphone('of Galloway', 4), ('AFKL', ''))
3479
        self.assertEqual(double_metaphone('of Germany', 4), ('AFKR', 'AFJR'))
3480
        self.assertEqual(double_metaphone('of Gloucester', 4), ('AFKL', ''))
3481
        self.assertEqual(double_metaphone('of Heristal', 4), ('AFRS', ''))
3482
        self.assertEqual(double_metaphone('of Hungary', 4), ('AFNK', ''))
3483
        self.assertEqual(double_metaphone('of Huntington', 4), ('AFNT', ''))
3484
        self.assertEqual(double_metaphone('of Kiev', 4), ('AFKF', ''))
3485
        self.assertEqual(double_metaphone('of Kuno', 4), ('AFKN', ''))
3486
        self.assertEqual(double_metaphone('of Landen', 4), ('AFLN', ''))
3487
        self.assertEqual(double_metaphone('of Laon', 4), ('AFLN', ''))
3488
        self.assertEqual(double_metaphone('of Leinster', 4), ('AFLN', ''))
3489
        self.assertEqual(double_metaphone('of Lens', 4), ('AFLN', ''))
3490
        self.assertEqual(double_metaphone('of Lorraine', 4), ('AFLR', ''))
3491
        self.assertEqual(double_metaphone('of Louvain', 4), ('AFLF', ''))
3492
        self.assertEqual(double_metaphone('of Mercia', 4), ('AFMR', ''))
3493
        self.assertEqual(double_metaphone('of Metz', 4), ('AFMT', ''))
3494
        self.assertEqual(double_metaphone('of Meulan', 4), ('AFML', ''))
3495
        self.assertEqual(double_metaphone('of Nass', 4), ('AFNS', ''))
3496
        self.assertEqual(double_metaphone('of Normandy', 4), ('AFNR', ''))
3497
        self.assertEqual(double_metaphone('of Ohningen', 4), ('AFNN', ''))
3498
        self.assertEqual(double_metaphone('of Orleans', 4), ('AFRL', ''))
3499
        self.assertEqual(double_metaphone('of Poitou', 4), ('AFPT', ''))
3500
        self.assertEqual(double_metaphone('of Polotzk', 4), ('AFPL', ''))
3501
        self.assertEqual(double_metaphone('of Provence', 4), ('AFPR', ''))
3502
        self.assertEqual(double_metaphone('of Ringelheim', 4), ('AFRN', ''))
3503
        self.assertEqual(double_metaphone('of Salisbury', 4), ('AFSL', ''))
3504
        self.assertEqual(double_metaphone('of Saxony', 4), ('AFSK', ''))
3505
        self.assertEqual(double_metaphone('of Scotland', 4), ('AFSK', ''))
3506
        self.assertEqual(double_metaphone('of Senlis', 4), ('AFSN', ''))
3507
        self.assertEqual(double_metaphone('of Stafford', 4), ('AFST', ''))
3508
        self.assertEqual(double_metaphone('of Swabia', 4), ('AFSP', ''))
3509
        self.assertEqual(double_metaphone('of Tongres', 4), ('AFTN', ''))
3510
        self.assertEqual(double_metaphone('of the Tributes', 4),
3511
                         ('AF0T', 'AFTT'))
3512
        self.assertEqual(double_metaphone('unknown', 4), ('ANKN', ''))
3513
        self.assertEqual(double_metaphone('van der Gouda', 4), ('FNTR', ''))
3514
        self.assertEqual(double_metaphone('von Adenbaugh', 4), ('FNTN', ''))
3515
        self.assertEqual(double_metaphone('ARCHITure', 4), ('ARKT', ''))
3516
        self.assertEqual(double_metaphone('Arnoff', 4), ('ARNF', ''))
3517
        self.assertEqual(double_metaphone('Arnow', 4), ('ARN', 'ARNF'))
3518
        self.assertEqual(double_metaphone('DANGER', 4), ('TNJR', 'TNKR'))
3519
        self.assertEqual(double_metaphone('Jankelowicz', 4), ('JNKL', 'ANKL'))
3520
        self.assertEqual(double_metaphone('MANGER', 4), ('MNJR', 'MNKR'))
3521
        self.assertEqual(double_metaphone('McClellan', 4), ('MKLL', ''))
3522
        self.assertEqual(double_metaphone('McHugh', 4), ('MK', ''))
3523
        self.assertEqual(double_metaphone('McLaughlin', 4), ('MKLF', ''))
3524
        self.assertEqual(double_metaphone('ORCHEStra', 4), ('ARKS', ''))
3525
        self.assertEqual(double_metaphone('ORCHID', 4), ('ARKT', ''))
3526
        self.assertEqual(double_metaphone('Pierce', 4), ('PRS', ''))
3527
        self.assertEqual(double_metaphone('RANGER', 4), ('RNJR', 'RNKR'))
3528
        self.assertEqual(double_metaphone('Schlesinger', 4), ('XLSN', 'SLSN'))
3529
        self.assertEqual(double_metaphone('Uomo', 4), ('AM', ''))
3530
        self.assertEqual(double_metaphone('Vasserman', 4), ('FSRM', ''))
3531
        self.assertEqual(double_metaphone('Wasserman', 4), ('ASRM', 'FSRM'))
3532
        self.assertEqual(double_metaphone('Womo', 4), ('AM', 'FM'))
3533
        self.assertEqual(double_metaphone('Yankelovich', 4), ('ANKL', ''))
3534
        self.assertEqual(double_metaphone('accede', 4), ('AKST', ''))
3535
        self.assertEqual(double_metaphone('accident', 4), ('AKST', ''))
3536
        self.assertEqual(double_metaphone('adelsheim', 4), ('ATLS', ''))
3537
        self.assertEqual(double_metaphone('aged', 4), ('AJT', 'AKT'))
3538
        self.assertEqual(double_metaphone('ageless', 4), ('AJLS', 'AKLS'))
3539
        self.assertEqual(double_metaphone('agency', 4), ('AJNS', 'AKNS'))
3540
        self.assertEqual(double_metaphone('aghast', 4), ('AKST', ''))
3541
        self.assertEqual(double_metaphone('agio', 4), ('AJ', 'AK'))
3542
        self.assertEqual(double_metaphone('agrimony', 4), ('AKRM', ''))
3543
        self.assertEqual(double_metaphone('album', 4), ('ALPM', ''))
3544
        self.assertEqual(double_metaphone('alcmene', 4), ('ALKM', ''))
3545
        self.assertEqual(double_metaphone('alehouse', 4), ('ALHS', ''))
3546
        self.assertEqual(double_metaphone('antique', 4), ('ANTK', ''))
3547
        self.assertEqual(double_metaphone('artois', 4), ('ART', 'ARTS'))
3548
        self.assertEqual(double_metaphone('automation', 4), ('ATMX', ''))
3549
        self.assertEqual(double_metaphone('bacchus', 4), ('PKS', ''))
3550
        self.assertEqual(double_metaphone('bacci', 4), ('PX', ''))
3551
        self.assertEqual(double_metaphone('bajador', 4), ('PJTR', 'PHTR'))
3552
        self.assertEqual(double_metaphone('bellocchio', 4), ('PLX', ''))
3553
        self.assertEqual(double_metaphone('bertucci', 4), ('PRTX', ''))
3554
        self.assertEqual(double_metaphone('biaggi', 4), ('PJ', 'PK'))
3555
        self.assertEqual(double_metaphone('bough', 4), ('P', ''))
3556
        self.assertEqual(double_metaphone('breaux', 4), ('PR', ''))
3557
        self.assertEqual(double_metaphone('broughton', 4), ('PRTN', ''))
3558
        self.assertEqual(double_metaphone('cabrillo', 4), ('KPRL', 'KPR'))
3559
        self.assertEqual(double_metaphone('caesar', 4), ('SSR', ''))
3560
        self.assertEqual(double_metaphone('cagney', 4), ('KKN', ''))
3561
        self.assertEqual(double_metaphone('campbell', 4), ('KMPL', ''))
3562
        self.assertEqual(double_metaphone('carlisle', 4), ('KRLL', ''))
3563
        self.assertEqual(double_metaphone('carlysle', 4), ('KRLL', ''))
3564
        self.assertEqual(double_metaphone('chemistry', 4), ('KMST', ''))
3565
        self.assertEqual(double_metaphone('chianti', 4), ('KNT', ''))
3566
        self.assertEqual(double_metaphone('chorus', 4), ('KRS', ''))
3567
        self.assertEqual(double_metaphone('cough', 4), ('KF', ''))
3568
        self.assertEqual(double_metaphone('czerny', 4), ('SRN', 'XRN'))
3569
        self.assertEqual(double_metaphone('deffenbacher', 4), ('TFNP', ''))
3570
        self.assertEqual(double_metaphone('dumb', 4), ('TM', ''))
3571
        self.assertEqual(double_metaphone('edgar', 4), ('ATKR', ''))
3572
        self.assertEqual(double_metaphone('edge', 4), ('AJ', ''))
3573
        self.assertEqual(double_metaphone('filipowicz', 4), ('FLPT', 'FLPF'))
3574
        self.assertEqual(double_metaphone('focaccia', 4), ('FKX', ''))
3575
        self.assertEqual(double_metaphone('gallegos', 4), ('KLKS', 'KKS'))
3576
        self.assertEqual(double_metaphone('gambrelli', 4), ('KMPR', ''))
3577
        self.assertEqual(double_metaphone('geithain', 4), ('K0N', 'JTN'))
3578
        self.assertEqual(double_metaphone('ghiradelli', 4), ('JRTL', ''))
3579
        self.assertEqual(double_metaphone('ghislane', 4), ('JLN', ''))
3580
        self.assertEqual(double_metaphone('gough', 4), ('KF', ''))
3581
        self.assertEqual(double_metaphone('hartheim', 4), ('HR0M', 'HRTM'))
3582
        self.assertEqual(double_metaphone('heimsheim', 4), ('HMSM', ''))
3583
        self.assertEqual(double_metaphone('hochmeier', 4), ('HKMR', ''))
3584
        self.assertEqual(double_metaphone('hugh', 4), ('H', ''))
3585
        self.assertEqual(double_metaphone('hunger', 4), ('HNKR', 'HNJR'))
3586
        self.assertEqual(double_metaphone('hungry', 4), ('HNKR', ''))
3587
        self.assertEqual(double_metaphone('island', 4), ('ALNT', ''))
3588
        self.assertEqual(double_metaphone('isle', 4), ('AL', ''))
3589
        self.assertEqual(double_metaphone('jose', 4), ('HS', ''))
3590
        self.assertEqual(double_metaphone('laugh', 4), ('LF', ''))
3591
        self.assertEqual(double_metaphone('mac caffrey', 4), ('MKFR', ''))
3592
        self.assertEqual(double_metaphone('mac gregor', 4), ('MKRK', ''))
3593
        self.assertEqual(double_metaphone('pegnitz', 4), ('PNTS', 'PKNT'))
3594
        self.assertEqual(double_metaphone('piskowitz', 4), ('PSKT', 'PSKF'))
3595
        self.assertEqual(double_metaphone('queen', 4), ('KN', ''))
3596
        self.assertEqual(double_metaphone('raspberry', 4), ('RSPR', ''))
3597
        self.assertEqual(double_metaphone('resnais', 4), ('RSN', 'RSNS'))
3598
        self.assertEqual(double_metaphone('rogier', 4), ('RJ', 'RJR'))
3599
        self.assertEqual(double_metaphone('rough', 4), ('RF', ''))
3600
        self.assertEqual(double_metaphone('san jacinto', 4), ('SNHS', ''))
3601
        self.assertEqual(double_metaphone('schenker', 4), ('XNKR', 'SKNK'))
3602
        self.assertEqual(double_metaphone('schermerhorn', 4), ('XRMR', 'SKRM'))
3603
        self.assertEqual(double_metaphone('schmidt', 4), ('XMT', 'SMT'))
3604
        self.assertEqual(double_metaphone('schneider', 4), ('XNTR', 'SNTR'))
3605
        self.assertEqual(double_metaphone('school', 4), ('SKL', ''))
3606
        self.assertEqual(double_metaphone('schooner', 4), ('SKNR', ''))
3607
        self.assertEqual(double_metaphone('schrozberg', 4), ('XRSP', 'SRSP'))
3608
        self.assertEqual(double_metaphone('schulman', 4), ('XLMN', ''))
3609
        self.assertEqual(double_metaphone('schwabach', 4), ('XPK', 'XFPK'))
3610
        self.assertEqual(double_metaphone('schwarzach', 4), ('XRSK', 'XFRT'))
3611
        self.assertEqual(double_metaphone('smith', 4), ('SM0', 'XMT'))
3612
        self.assertEqual(double_metaphone('snider', 4), ('SNTR', 'XNTR'))
3613
        self.assertEqual(double_metaphone('succeed', 4), ('SKST', ''))
3614
        self.assertEqual(double_metaphone('sugarcane', 4), ('XKRK', 'SKRK'))
3615
        self.assertEqual(double_metaphone('svobodka', 4), ('SFPT', ''))
3616
        self.assertEqual(double_metaphone('tagliaro', 4), ('TKLR', 'TLR'))
3617
        self.assertEqual(double_metaphone('thames', 4), ('TMS', ''))
3618
        self.assertEqual(double_metaphone('theilheim', 4), ('0LM', 'TLM'))
3619
        self.assertEqual(double_metaphone('thomas', 4), ('TMS', ''))
3620
        self.assertEqual(double_metaphone('thumb', 4), ('0M', 'TM'))
3621
        self.assertEqual(double_metaphone('tichner', 4), ('TXNR', 'TKNR'))
3622
        self.assertEqual(double_metaphone('tough', 4), ('TF', ''))
3623
        self.assertEqual(double_metaphone('umbrella', 4), ('AMPR', ''))
3624
        self.assertEqual(double_metaphone('vilshofen', 4), ('FLXF', ''))
3625
        self.assertEqual(double_metaphone('von schuller', 4), ('FNXL', ''))
3626
        self.assertEqual(double_metaphone('wachtler', 4), ('AKTL', 'FKTL'))
3627
        self.assertEqual(double_metaphone('wechsler', 4), ('AKSL', 'FKSL'))
3628
        self.assertEqual(double_metaphone('weikersheim', 4), ('AKRS', 'FKRS'))
3629
        self.assertEqual(double_metaphone('zhao', 4), ('J', ''))
3630
3631
3632
class CaverphoneTestCases(unittest.TestCase):
3633
    """Test Caverphone functions.
3634
3635
    test cases for abydos.phonetic.caverphone
3636
    """
3637
3638
    def test_caverphone2(self):
3639
        """Test abydos.phonetic.caverphone (Caverphone 2)."""
3640
        self.assertEqual(caverphone(''), '1111111111')
3641
        self.assertEqual(caverphone('', 2), '1111111111')
3642
        self.assertEqual(caverphone('', version=2), '1111111111')
3643
3644
        # http://ntz-develop.blogspot.com/2011/03/phonetic-algorithms.html
3645
        self.assertEqual(caverphone('Henrichsen'), 'ANRKSN1111')
3646
        self.assertEqual(caverphone('Henricsson'), 'ANRKSN1111')
3647
        self.assertEqual(caverphone('Henriksson'), 'ANRKSN1111')
3648
        self.assertEqual(caverphone('Hinrichsen'), 'ANRKSN1111')
3649
        self.assertEqual(caverphone('Izchaki'), 'ASKKA11111')
3650
        self.assertEqual(caverphone('Maclaverty'), 'MKLFTA1111')
3651
        self.assertEqual(caverphone('Mccleverty'), 'MKLFTA1111')
3652
        self.assertEqual(caverphone('Mcclifferty'), 'MKLFTA1111')
3653
        self.assertEqual(caverphone('Mclafferty'), 'MKLFTA1111')
3654
        self.assertEqual(caverphone('Mclaverty'), 'MKLFTA1111')
3655
        self.assertEqual(caverphone('Slocomb'), 'SLKM111111')
3656
        self.assertEqual(caverphone('Slocombe'), 'SLKM111111')
3657
        self.assertEqual(caverphone('Slocumb'), 'SLKM111111')
3658
        self.assertEqual(caverphone('Whitlam'), 'WTLM111111')
3659
3660
        # http://caversham.otago.ac.nz/files/working/ctp150804.pdf
3661
        self.assertEqual(caverphone('Stevenson'), 'STFNSN1111')
3662
        self.assertEqual(caverphone('Peter'), 'PTA1111111')
3663
        for word in ('Darda', 'Datha', 'Dedie', 'Deedee', 'Deerdre', 'Deidre',
3664
                     'Deirdre', 'Detta', 'Didi', 'Didier', 'Dido', 'Dierdre',
3665
                     'Dieter', 'Dita', 'Ditter', 'Dodi', 'Dodie', 'Dody',
3666
                     'Doherty', 'Dorthea', 'Dorthy', 'Doti', 'Dotti', 'Dottie',
3667
                     'Dotty', 'Doty', 'Doughty', 'Douty', 'Dowdell', 'Duthie',
3668
                     'Tada', 'Taddeo', 'Tadeo', 'Tadio', 'Tati', 'Teador',
3669
                     'Tedda', 'Tedder', 'Teddi', 'Teddie', 'Teddy', 'Tedi',
3670
                     'Tedie', 'Teeter', 'Teodoor', 'Teodor', 'Terti', 'Theda',
3671
                     'Theodor', 'Theodore', 'Theta', 'Thilda', 'Thordia',
3672
                     'Tilda', 'Tildi', 'Tildie', 'Tildy', 'Tita', 'Tito',
3673
                     'Tjader', 'Toddie', 'Toddy', 'Torto', 'Tuddor', 'Tudor',
3674
                     'Turtle', 'Tuttle', 'Tutto'):
3675
            self.assertEqual(caverphone(word), 'TTA1111111')
3676
            self.assertEqual(caverphone(word, 2), 'TTA1111111')
3677
            self.assertEqual(caverphone(word, version=2), 'TTA1111111')
3678
        for word in ('Cailean', 'Calan', 'Calen', 'Callahan', 'Callan',
3679
                     'Callean', 'Carleen', 'Carlen', 'Carlene', 'Carlin',
3680
                     'Carline', 'Carlyn', 'Carlynn', 'Carlynne', 'Charlean',
3681
                     'Charleen', 'Charlene', 'Charline', 'Cherlyn', 'Chirlin',
3682
                     'Clein', 'Cleon', 'Cline', 'Cohleen', 'Colan', 'Coleen',
3683
                     'Colene', 'Colin', 'Colleen', 'Collen', 'Collin',
3684
                     'Colline', 'Colon', 'Cullan', 'Cullen', 'Cullin',
3685
                     'Gaelan', 'Galan', 'Galen', 'Garlan', 'Garlen', 'Gaulin',
3686
                     'Gayleen', 'Gaylene', 'Giliane', 'Gillan', 'Gillian',
3687
                     'Glen', 'Glenn', 'Glyn', 'Glynn', 'Gollin', 'Gorlin',
3688
                     'Kalin', 'Karlan', 'Karleen', 'Karlen', 'Karlene',
3689
                     'Karlin', 'Karlyn', 'Kaylyn', 'Keelin', 'Kellen',
3690
                     'Kellene', 'Kellyann', 'Kellyn', 'Khalin', 'Kilan',
3691
                     'Kilian', 'Killen', 'Killian', 'Killion', 'Klein',
3692
                     'Kleon', 'Kline', 'Koerlin', 'Kylen', 'Kylynn', 'Quillan',
3693
                     'Quillon', 'Qulllon', 'Xylon'):
3694
            self.assertEqual(caverphone(word), 'KLN1111111')
3695
            self.assertEqual(caverphone(word, 2), 'KLN1111111')
3696
            self.assertEqual(caverphone(word, version=2), 'KLN1111111')
3697
        for word in ('Dan', 'Dane', 'Dann', 'Darn', 'Daune', 'Dawn', 'Ddene',
3698
                     'Dean', 'Deane', 'Deanne', 'DeeAnn', 'Deeann', 'Deeanne',
3699
                     'Deeyn', 'Den', 'Dene', 'Denn', 'Deonne', 'Diahann',
3700
                     'Dian', 'Diane', 'Diann', 'Dianne', 'Diannne', 'Dine',
3701
                     'Dion', 'Dione', 'Dionne', 'Doane', 'Doehne', 'Don',
3702
                     'Donn', 'Doone', 'Dorn', 'Down', 'Downe', 'Duane', 'Dun',
3703
                     'Dunn', 'Duyne', 'Dyan', 'Dyane', 'Dyann', 'Dyanne',
3704
                     'Dyun', 'Tan', 'Tann', 'Teahan', 'Ten', 'Tenn', 'Terhune',
3705
                     'Thain', 'Thaine', 'Thane', 'Thanh', 'Thayne', 'Theone',
3706
                     'Thin', 'Thorn', 'Thorne', 'Thun', 'Thynne', 'Tien',
3707
                     'Tine', 'Tjon', 'Town', 'Towne', 'Turne', 'Tyne'):
3708
            self.assertEqual(caverphone(word), 'TN11111111')
3709
            self.assertEqual(caverphone(word, 2), 'TN11111111')
3710
            self.assertEqual(caverphone(word, version=2), 'TN11111111')
3711
3712
        # etc. (for code coverage)
3713
        self.assertEqual(caverphone('enough'), 'ANF1111111')
3714
        self.assertEqual(caverphone('trough'), 'TRF1111111')
3715
        self.assertEqual(caverphone('gnu'), 'NA11111111')
3716
3717
    def test_caverphone2_php_testset(self):
3718
        """Test abydos.phonetic.caverphone (PHP version testset)."""
3719
        # https://raw.githubusercontent.com/kiphughes/caverphone/master/unit_tests.php
3720
        with open(TESTDIR + '/corpora/php_caverphone.csv') as php_testset:
3721
            for php_line in php_testset:
3722
                (word, caver) = php_line.strip().split(',')
3723
                self.assertEqual(caverphone(word), caver)
3724
3725
    def test_caverphone1(self):
3726
        """Test abydos.phonetic.caverphone (Caverphone 1)."""
3727
        self.assertEqual(caverphone('', 1), '111111')
3728
        self.assertEqual(caverphone('', version=1), '111111')
3729
3730
        # http://caversham.otago.ac.nz/files/working/ctp060902.pdf
3731
        self.assertEqual(caverphone('David', version=1), 'TFT111')
3732
        self.assertEqual(caverphone('Whittle', version=1), 'WTL111')
3733
3734
    def test_caversham(self):
3735
        """Test using Caversham test set (SoundEx, Metaphone, & Caverphone)."""
3736
        with open(TESTDIR + '/corpora/variantNames.csv') as cav_testset:
3737
            next(cav_testset)
3738
            for cav_line in cav_testset:
3739
                (name1, soundex1, metaphone1, caverphone1,
3740
                 name2, soundex2, metaphone2, caverphone2,
3741
                 soundex_same, metaphone_same, caverphone_same) = \
3742
                 cav_line.strip().split(',')
3743
3744
                self.assertEqual(soundex(name1), soundex1)
3745
                self.assertEqual(soundex(name2), soundex2)
3746
                if soundex_same == '1':
3747
                    self.assertEqual(soundex(name1), soundex(name2))
3748
                else:
3749
                    self.assertNotEqual(soundex(name1), soundex(name2))
3750
3751
                self.assertEqual(metaphone(name1), metaphone1)
3752
                self.assertEqual(metaphone(name2), metaphone2)
3753
                if metaphone_same == '1':
3754
                    self.assertEqual(metaphone(name1), metaphone(name2))
3755
                else:
3756
                    self.assertNotEqual(metaphone(name1), metaphone(name2))
3757
3758
                self.assertEqual(caverphone(name1), caverphone1)
3759
                self.assertEqual(caverphone(name2), caverphone2)
3760
                if caverphone_same == '1':
3761
                    self.assertEqual(caverphone(name1), caverphone(name2))
3762
                else:
3763
                    self.assertNotEqual(caverphone(name1), caverphone(name2))
3764
3765
3766
class AlphaSisTestCases(unittest.TestCase):
3767
    """Test Alpha-SIS functions.
3768
3769
    test cases for abydos.phonetic.alpha_sis
3770
    """
3771
3772
    def test_alpha_sis(self):
3773
        """Test abydos.phonetic.alpha_sis."""
3774
        self.assertEqual(alpha_sis('')[0], '00000000000000')
3775
3776
        self.assertEqual(alpha_sis('Rodgers')[0], '04740000000000')
3777
        self.assertEqual(alpha_sis('Rogers')[0], '04740000000000')
3778
        self.assertEqual(alpha_sis('Kant')[0], '07210000000000')
3779
        self.assertEqual(alpha_sis('Knuth')[0], '02100000000000')
3780
        self.assertEqual(alpha_sis('Harper')[0], '24940000000000')
3781
        self.assertEqual(alpha_sis('Collier')[0], '07540000000000')
3782
        self.assertEqual(alpha_sis('Schultz')[0], '06500000000000')
3783
        self.assertEqual(alpha_sis('Livingston')[0], '05827012000000')
3784
3785
        # tests of repeated letters
3786
        self.assertEqual(alpha_sis('Colllier')[0], '07554000000000')
3787
        self.assertEqual(alpha_sis('Collllier')[0], '07554000000000')
3788
        self.assertEqual(alpha_sis('Colllllier')[0], '07555400000000')
3789
        self.assertEqual(alpha_sis('Collllllier')[0], '07555400000000')
3790
        self.assertEqual(alpha_sis('Colalalier')[0], '07555400000000')
3791
3792
        # maxlength bounds tests
3793
        self.assertEqual(alpha_sis('Niall', maxlength=float('inf'))[0],
3794
                         '02500000000000000000000000000000000000000000000000' +
3795
                         '00000000000000')
3796
        self.assertEqual(alpha_sis('Niall', maxlength=None)[0],
3797
                         '02500000000000000000000000000000000000000000000000' +
3798
                         '00000000000000')
3799
        self.assertEqual(alpha_sis('Niall', maxlength=0)[0], '0250')
3800
3801
3802
class FuzzySoundexTestCases(unittest.TestCase):
3803
    """Test Fuzzy Soundex functions.
3804
3805
    test cases for abydos.phonetic.fuzzy_soundex
3806
    """
3807
3808
    def test_fuzzy_soundex(self):
3809
        """Test abydos.phonetic.fuzzy_soundex."""
3810
        self.assertEqual(fuzzy_soundex(''), '00000')
3811
        # http://wayback.archive.org/web/20100629121128/http://www.ir.iit.edu/publications/downloads/IEEESoundexV5.pdf
3812
        self.assertEqual(fuzzy_soundex('Kristen'), 'K6935')
3813
        self.assertEqual(fuzzy_soundex('Krissy'), 'K6900')
3814
        self.assertEqual(fuzzy_soundex('Christen'), 'K6935')
3815
3816
        # http://books.google.com/books?id=LZrT6eWf9NMC&lpg=PA76&ots=Tex3FqNwGP&dq=%22phonix%20algorithm%22&pg=PA75#v=onepage&q=%22phonix%20algorithm%22&f=false
3817
        self.assertEqual(fuzzy_soundex('peter', 4), 'P360')
3818
        self.assertEqual(fuzzy_soundex('pete', 4), 'P300')
3819
        self.assertEqual(fuzzy_soundex('pedro', 4), 'P360')
3820
        self.assertEqual(fuzzy_soundex('stephen', 4), 'S315')
3821
        self.assertEqual(fuzzy_soundex('steve', 4), 'S310')
3822
        self.assertEqual(fuzzy_soundex('smith', 4), 'S530')
3823
        self.assertEqual(fuzzy_soundex('smythe', 4), 'S530')
3824
        self.assertEqual(fuzzy_soundex('gail', 4), 'G400')
3825
        self.assertEqual(fuzzy_soundex('gayle', 4), 'G400')
3826
        self.assertEqual(fuzzy_soundex('christine', 4), 'K693')
3827
        self.assertEqual(fuzzy_soundex('christina', 4), 'K693')
3828
        self.assertEqual(fuzzy_soundex('kristina', 4), 'K693')
3829
3830
        # etc. (for code coverage)
3831
        self.assertEqual(fuzzy_soundex('Wight'), 'W3000')
3832
        self.assertEqual(fuzzy_soundex('Hardt'), 'H6000')
3833
        self.assertEqual(fuzzy_soundex('Knight'), 'N3000')
3834
        self.assertEqual(fuzzy_soundex('Czech'), 'S7000')
3835
        self.assertEqual(fuzzy_soundex('Tsech'), 'S7000')
3836
        self.assertEqual(fuzzy_soundex('gnomic'), 'N5900')
3837
        self.assertEqual(fuzzy_soundex('Wright'), 'R3000')
3838
        self.assertEqual(fuzzy_soundex('Hrothgar'), 'R3760')
3839
        self.assertEqual(fuzzy_soundex('Hwaet'), 'W3000')
3840
        self.assertEqual(fuzzy_soundex('Grant'), 'G6300')
3841
        self.assertEqual(fuzzy_soundex('Hart'), 'H6000')
3842
        self.assertEqual(fuzzy_soundex('Hardt'), 'H6000')
3843
3844
        # maxlength bounds tests
3845
        self.assertEqual(fuzzy_soundex('Niall', maxlength=float('inf')),
3846
                         'N4000000000000000000000000000000000000000000000000' +
3847
                         '00000000000000')
3848
        self.assertEqual(fuzzy_soundex('Niall', maxlength=None),
3849
                         'N4000000000000000000000000000000000000000000000000' +
3850
                         '00000000000000')
3851
        self.assertEqual(fuzzy_soundex('Niall', maxlength=0), 'N400')
3852
3853
        # zero_pad tests
3854
        self.assertEqual(fuzzy_soundex('Niall', maxlength=float('inf'),
3855
                                       zero_pad=False), 'N4')
3856
        self.assertEqual(fuzzy_soundex('Niall', maxlength=None,
3857
                                       zero_pad=False), 'N4')
3858
        self.assertEqual(fuzzy_soundex('Niall', maxlength=0,
3859
                                       zero_pad=False), 'N4')
3860
        self.assertEqual(fuzzy_soundex('Niall', maxlength=0,
3861
                                       zero_pad=True), 'N400')
3862
        self.assertEqual(fuzzy_soundex('', maxlength=4, zero_pad=False), '0')
3863
        self.assertEqual(fuzzy_soundex('', maxlength=4, zero_pad=True), '0000')
3864
3865
3866
class PhonexTestCases(unittest.TestCase):
3867
    """Test Phonex functions.
3868
3869
    test cases for abydos.phonetic.phonex
3870
    """
3871
3872
    def test_phonex(self):
3873
        """Test abydos.phonetic.phonex."""
3874
        self.assertEqual(phonex(''), '0000')
3875
3876
        # http://homepages.cs.ncl.ac.uk/brian.randell/Genealogy/NameMatching.pdf
3877
        self.assertEqual(phonex('Ewell'), 'A400')
3878
        self.assertEqual(phonex('Filp'), 'F100')
3879
        self.assertEqual(phonex('Heames'), 'A500')
3880
        self.assertEqual(phonex('Kneves'), 'N100')
3881
        self.assertEqual(phonex('River'), 'R160')
3882
        self.assertEqual(phonex('Corley'), 'C400')
3883
        self.assertEqual(phonex('Carton'), 'C350')
3884
        self.assertEqual(phonex('Cachpole'), 'C214')
3885
3886
        self.assertEqual(phonex('Ewell'), phonex('Ule'))
3887
        self.assertEqual(phonex('Filp'), phonex('Philp'))
3888
        self.assertEqual(phonex('Yule'), phonex('Ewell'))
3889
        self.assertEqual(phonex('Heames'), phonex('Eames'))
3890
        self.assertEqual(phonex('Kneves'), phonex('Neves'))
3891
        self.assertEqual(phonex('River'), phonex('Rivers'))
3892
        self.assertEqual(phonex('Corley'), phonex('Coley'))
3893
        self.assertEqual(phonex('Carton'), phonex('Carlton'))
3894
        self.assertEqual(phonex('Cachpole'), phonex('Catchpole'))
3895
3896
        # etc. (for code coverage)
3897
        self.assertEqual(phonex('Saxon'), 'S250')
3898
        self.assertEqual(phonex('Wright'), 'R230')
3899
        self.assertEqual(phonex('Ai'), 'A000')
3900
        self.assertEqual(phonex('Barth'), 'B300')
3901
        self.assertEqual(phonex('Perry'), 'B600')
3902
        self.assertEqual(phonex('Garth'), 'G300')
3903
        self.assertEqual(phonex('Jerry'), 'G600')
3904
        self.assertEqual(phonex('Gerry'), 'G600')
3905
        self.assertEqual(phonex('Camden'), 'C500')
3906
        self.assertEqual(phonex('Ganges'), 'G500')
3907
        self.assertEqual(phonex('A-1'), 'A000')
3908
3909
        # maxlength bounds tests
3910
        self.assertEqual(phonex('Niall', maxlength=float('inf')),
3911
                         'N4000000000000000000000000000000000000000000000000' +
3912
                         '00000000000000')
3913
        self.assertEqual(phonex('Niall', maxlength=None),
3914
                         'N4000000000000000000000000000000000000000000000000' +
3915
                         '00000000000000')
3916
        self.assertEqual(phonex('Niall', maxlength=0), 'N400')
3917
3918
        # zero_pad tests
3919
        self.assertEqual(phonex('Niall', maxlength=float('inf'),
3920
                                zero_pad=False), 'N4')
3921
        self.assertEqual(phonex('Niall', maxlength=None, zero_pad=False),
3922
                         'N4')
3923
        self.assertEqual(phonex('Niall', maxlength=0, zero_pad=False),
3924
                         'N4')
3925
        self.assertEqual(phonex('Niall', maxlength=0, zero_pad=True),
3926
                         'N400')
3927
        self.assertEqual(phonex('', maxlength=4, zero_pad=False), '0')
3928
        self.assertEqual(phonex('', maxlength=4, zero_pad=True), '0000')
3929
3930
3931
class PhonemTestCases(unittest.TestCase):
3932
    """Test Phonem functions.
3933
3934
    test cases for abydos.phonetic.phonem
3935
    """
3936
3937
    def test_phonem(self):
3938
        """Test abydos.phonetic.phonem."""
3939
        self.assertEqual(phonem(''), '')
3940
3941
        # http://phonetik.phil-fak.uni-koeln.de/fileadmin/home/ritters/Allgemeine_Dateien/Martin_Wilz.pdf
3942
        self.assertEqual(phonem('müller'), 'MYLR')
3943
        self.assertEqual(phonem('schmidt'), 'CMYD')
3944
        self.assertEqual(phonem('schneider'), 'CNAYDR')
3945
        self.assertEqual(phonem('fischer'), 'VYCR')
3946
        self.assertEqual(phonem('weber'), 'VBR')
3947
        self.assertEqual(phonem('meyer'), 'MAYR')
3948
        self.assertEqual(phonem('wagner'), 'VACNR')
3949
        self.assertEqual(phonem('schulz'), 'CULC')
3950
        self.assertEqual(phonem('becker'), 'BCR')
3951
        self.assertEqual(phonem('hoffmann'), 'OVMAN')
3952
        self.assertEqual(phonem('schäfer'), 'CVR')
3953
3954
        # http://cpansearch.perl.org/src/MAROS/Text-Phonetic-2.05/t/008_phonem.t
3955
        self.assertEqual(phonem('mair'), 'MAYR')
3956
        self.assertEqual(phonem('bäker'), 'BCR')
3957
        self.assertEqual(phonem('schaeffer'), 'CVR')
3958
        self.assertEqual(phonem('computer'), 'COMBUDR')
3959
        self.assertEqual(phonem('pfeifer'), 'VAYVR')
3960
        self.assertEqual(phonem('pfeiffer'), 'VAYVR')
3961
3962
3963
class PhonixTestCases(unittest.TestCase):
3964
    """Test Phonix functions.
3965
3966
    test cases for abydos.phonetic.phonix
3967
    """
3968
3969
    def test_phonix(self):
3970
        """Test abydos.phonetic.phonix."""
3971
        self.assertEqual(phonix(''), '0000')
3972
3973
        # http://cpansearch.perl.org/src/MAROS/Text-Phonetic-2.05/t/007_phonix.t
3974
        self.assertEqual(phonix('Müller'), 'M400')
3975
        self.assertEqual(phonix('schneider'), 'S530')
3976
        self.assertEqual(phonix('fischer'), 'F800')
3977
        self.assertEqual(phonix('weber'), 'W100')
3978
        self.assertEqual(phonix('meyer'), 'M000')
3979
        self.assertEqual(phonix('wagner'), 'W250')
3980
        self.assertEqual(phonix('schulz'), 'S480')
3981
        self.assertEqual(phonix('becker'), 'B200')
3982
        self.assertEqual(phonix('hoffmann'), 'H755')
3983
        self.assertEqual(phonix('schäfer'), 'S700')
3984
        self.assertEqual(phonix('schmidt'), 'S530')
3985
3986
        # http://cpansearch.perl.org/src/MAROS/Text-Phonetic-2.05/t/007_phonix.t:
3987
        # testcases from Wais Module
3988
        self.assertEqual(phonix('computer'), 'K513')
3989
        self.assertEqual(phonix('computers'), 'K513')
3990
        self.assertEqual(phonix('computers', 5), 'K5138')
3991
        self.assertEqual(phonix('pfeifer'), 'F700')
3992
        self.assertEqual(phonix('pfeiffer'), 'F700')
3993
        self.assertEqual(phonix('knight'), 'N300')
3994
        self.assertEqual(phonix('night'), 'N300')
3995
3996
        # http://cpansearch.perl.org/src/MAROS/Text-Phonetic-2.05/t/007_phonix.t:
3997
        # testcases from
3998
        # http://www.cl.uni-heidelberg.de/~bormann/documents/phono/
3999
        # They use a sliglty different algorithm (first char is not included in
4000
        # num code here)
4001
        self.assertEqual(phonix('wait'), 'W300')
4002
        self.assertEqual(phonix('weight'), 'W300')
4003
        self.assertEqual(phonix('gnome'), 'N500')
4004
        self.assertEqual(phonix('noam'), 'N500')
4005
        self.assertEqual(phonix('rees'), 'R800')
4006
        self.assertEqual(phonix('reece'), 'R800')
4007
        self.assertEqual(phonix('yaeger'), 'v200')
4008
4009
        # http://books.google.com/books?id=xtWPI7Is9wIC&lpg=PA29&ots=DXhaL7ZkvK&dq=phonix%20gadd&pg=PA29#v=onepage&q=phonix%20gadd&f=false
4010
        self.assertEqual(phonix('alam'), 'v450')
4011
        self.assertEqual(phonix('berkpakaian'), 'B212')
4012
        self.assertEqual(phonix('capaian'), 'K150')
4013
4014
        # http://books.google.com/books?id=LZrT6eWf9NMC&lpg=PA76&ots=Tex3FqNwGP&dq=%22phonix%20algorithm%22&pg=PA75#v=onepage&q=%22phonix%20algorithm%22&f=false
4015
        self.assertEqual(phonix('peter'), 'P300')
4016
        self.assertEqual(phonix('pete'), 'P300')
4017
        self.assertEqual(phonix('pedro'), 'P360')
4018
        self.assertEqual(phonix('stephen'), 'S375')
4019
        self.assertEqual(phonix('steve'), 'S370')
4020
        self.assertEqual(phonix('smith'), 'S530')
4021
        self.assertEqual(phonix('smythe'), 'S530')
4022
        self.assertEqual(phonix('gail'), 'G400')
4023
        self.assertEqual(phonix('gayle'), 'G400')
4024
        self.assertEqual(phonix('christine'), 'K683')
4025
        self.assertEqual(phonix('christina'), 'K683')
4026
        self.assertEqual(phonix('kristina'), 'K683')
4027
4028
        # maxlength bounds tests
4029
        self.assertEqual(phonix('Niall', maxlength=float('inf')), 'N4'+'0'*62)
4030
        self.assertEqual(phonix('Niall', maxlength=None), 'N4'+'0'*62)
4031
        self.assertEqual(phonix('Niall', maxlength=0), 'N400')
4032
4033
        # zero_pad tests
4034
        self.assertEqual(phonix('Niall', maxlength=float('inf'),
4035
                                zero_pad=False), 'N4')
4036
        self.assertEqual(phonix('Niall', maxlength=None, zero_pad=False),
4037
                         'N4')
4038
        self.assertEqual(phonix('Niall', maxlength=0, zero_pad=False),
4039
                         'N4')
4040
        self.assertEqual(phonix('Niall', maxlength=0, zero_pad=True),
4041
                         'N400')
4042
        self.assertEqual(phonix('', maxlength=4, zero_pad=False), '0')
4043
        self.assertEqual(phonix('', maxlength=4, zero_pad=True), '0000')
4044
4045
4046
class SfinxBisTestCases(unittest.TestCase):
4047
    """Test SfinxBis functions.
4048
4049
    test cases for abydos.phonetic.sfinxbis
4050
    """
4051
4052
    def test_sfinxbis(self):
4053
        """Test abydos.phonetic.sfinxbis."""
4054
        self.assertEqual(sfinxbis(''), ('',))
4055
4056
        # http://www.swami.se/download/18.248ad5af12aa81365338000106/TestSfinx.txt
4057
        # cases where the gold standard gave clearly wrong values have been
4058
        # corrected below (marked with '# wrong'
4059
        self.assertEqual(sfinxbis('af Sandeberg'), ('S53162',))
4060
        self.assertEqual(sfinxbis('av Ekenstam'), ('$25835',))
4061
        self.assertEqual(sfinxbis('Da Costa'), ('K83',))
4062
        self.assertEqual(sfinxbis('Das Neves'), ('D8', 'N78'))
4063
        self.assertEqual(sfinxbis('de Besche'), ('B8',))
4064
        self.assertEqual(sfinxbis('de la Motte'), ('M3',))
4065
        self.assertEqual(sfinxbis('de Las Heras'), ('H68',))  # wrong
4066
        self.assertEqual(sfinxbis('de Los Santos'), ('S538',))
4067
        self.assertEqual(sfinxbis('del Rosario'), ('R862',))
4068
        self.assertEqual(sfinxbis('Den Boer'), ('B6',))
4069
        self.assertEqual(sfinxbis('Der de Kazinczy'),
4070
                         ('D6', 'K8528',))  # wrong
4071
        self.assertEqual(sfinxbis('des Rieux'), ('R28',))
4072
        self.assertEqual(sfinxbis('Di Luca'), ('L2',))
4073
        self.assertEqual(sfinxbis('Do Rosario'), ('R862',))
4074
        self.assertEqual(sfinxbis('Don Lind'), ('L53',))
4075
        self.assertEqual(sfinxbis('Dos Santos'), ('S538',))
4076
        self.assertEqual(sfinxbis('du Rietz'), ('R38',))
4077
        self.assertEqual(sfinxbis('in de Betou'), ('B3',))
4078
        self.assertEqual(sfinxbis('La Fleur'), ('F46',))
4079
        self.assertEqual(sfinxbis('Le Grand'), ('G653',))
4080
        self.assertEqual(sfinxbis('li Puma'), ('L', 'P5'))
4081
        self.assertEqual(sfinxbis('lo Martire'), ('L', 'M636'))
4082
        self.assertEqual(sfinxbis('mac Donald'), ('D543',))
4083
        self.assertEqual(sfinxbis('mc Intosh'), ('$538',))
4084
        self.assertEqual(sfinxbis('S:t Cyr'), ('S6',))
4085
        self.assertEqual(sfinxbis('Van Doom'), ('D5',))
4086
        self.assertEqual(sfinxbis('Van de Peppel'), ('P14',))
4087
        self.assertEqual(sfinxbis('Van den Berg'), ('B62',))
4088
        self.assertEqual(sfinxbis('Van Der Kwast'), ('K783',))
4089
        self.assertEqual(sfinxbis('von Ahn'), ('$5',))
4090
        self.assertEqual(sfinxbis('von Dem Knesebeck'), ('K5812',))
4091
        self.assertEqual(sfinxbis('von Der Burg'), ('B62',))
4092
        self.assertEqual(sfinxbis('D\'Angelo'), ('D524',))
4093
        self.assertEqual(sfinxbis('O\'Conner'), ('$256',))
4094
        self.assertEqual(sfinxbis('Los'), ('L8',))
4095
        self.assertEqual(sfinxbis('Mac'), ('M2',))
4096
        self.assertEqual(sfinxbis('Till'), ('T4',))
4097
        self.assertEqual(sfinxbis('Van'), ('V5',))
4098
        self.assertEqual(sfinxbis('Von'), ('V5',))
4099
        self.assertEqual(sfinxbis('Bernadotte af Wisborg'), ('B6533', 'V8162'))
4100
        self.assertEqual(sfinxbis('Hjort af Ornäs'), ('J63', '$658'))
4101
        self.assertEqual(sfinxbis('Horn af Åminne'), ('H65', '$55'))
4102
        self.assertEqual(sfinxbis('Horn av Åminne'), ('H65', '$55'))
4103
        self.assertEqual(sfinxbis('Hård af Segerstad'), ('H63', 'S26833'))
4104
        self.assertEqual(sfinxbis('Hård av Segerstad'), ('H63', 'S26833'))
4105
        self.assertEqual(sfinxbis('Stael von Holstein'), ('S34', 'H48325'))
4106
        self.assertEqual(sfinxbis('de Oliveira e Silva'), ('$4726', 'S47'))
4107
        self.assertEqual(sfinxbis('de Alfaro y Gómez'), ('$476', 'G58'))
4108
        self.assertEqual(sfinxbis('Arjaliès-de la Lande'), ('$6248', 'L53'))
4109
        self.assertEqual(sfinxbis('Dominicus van den Bussche'),
4110
                         ('D5528', 'B8'))
4111
        self.assertEqual(sfinxbis('Edebol Eeg-Olofsson'),
4112
                         ('$314', '$2', '$4785'))
4113
        self.assertEqual(sfinxbis('Jonsson-Blomqvist'), ('J585', 'B452783'))
4114
        self.assertEqual(sfinxbis('Kiviniemi Birgersson'), ('#755', 'B62685'))
4115
        self.assertEqual(sfinxbis('Massena Serpa dos Santos'),
4116
                         ('M85', 'S61', 'S538'))
4117
        self.assertEqual(sfinxbis('S:t Clair Renard'), ('K426', 'R563'))
4118
        self.assertEqual(sfinxbis('Skoog H Andersson'), ('S22', 'H', '$53685'))
4119
        self.assertEqual(sfinxbis('von Post-Skagegård'), ('P83', 'S22263'))
4120
        self.assertEqual(sfinxbis('von Zur-Mühlen'), ('S6', 'M45'))
4121
        self.assertEqual(sfinxbis('Waltå O:son'), ('V43', '$85'))
4122
        self.assertEqual(sfinxbis('Zardán Gómez de la Torre'),
4123
                         ('S635', 'G58', 'T6'))
4124
        self.assertEqual(sfinxbis('af Jochnick'), ('J252',))
4125
        self.assertEqual(sfinxbis('af Ioscnick'), ('J8252',))
4126
        self.assertEqual(sfinxbis('Aabakken'), ('$125',))
4127
        self.assertEqual(sfinxbis('Åbacken'), ('$125',))
4128
        self.assertEqual(sfinxbis('Ahlen'), ('$45',))
4129
        self.assertEqual(sfinxbis('Aleen'), ('$45',))
4130
        self.assertEqual(sfinxbis('Braunerhielm'), ('B656245',))
4131
        self.assertEqual(sfinxbis('Branneerhielm'), ('B656245',))
4132
        self.assertEqual(sfinxbis('Carlzon'), ('K6485',))
4133
        self.assertEqual(sfinxbis('Karlsson'), ('K6485',))
4134
        self.assertEqual(sfinxbis('Enochsson'), ('$5285',))
4135
        self.assertEqual(sfinxbis('Ericsson'), ('$6285',))
4136
        self.assertEqual(sfinxbis('Ericksson'), ('$6285',))
4137
        self.assertEqual(sfinxbis('Erixson'), ('$6285',))
4138
        self.assertEqual(sfinxbis('Filipsson'), ('F4185',))
4139
        self.assertEqual(sfinxbis('Philipson'), ('F4185',))
4140
        self.assertEqual(sfinxbis('Flycht'), ('F423',))
4141
        self.assertEqual(sfinxbis('Flygt'), ('F423',))
4142
        self.assertEqual(sfinxbis('Flykt'), ('F423',))
4143
        self.assertEqual(sfinxbis('Fröijer'), ('F626',))
4144
        self.assertEqual(sfinxbis('Fröjer'), ('F626',))
4145
        self.assertEqual(sfinxbis('Gertner'), ('J6356',))
4146
        self.assertEqual(sfinxbis('Hiertner'), ('J6356',))
4147
        self.assertEqual(sfinxbis('Hirch'), ('H62',))
4148
        self.assertEqual(sfinxbis('Hirsch'), ('H68',))
4149
        self.assertEqual(sfinxbis('Haegermarck'), ('H26562',))
4150
        self.assertEqual(sfinxbis('Hägermark'), ('H26562',))
4151
        self.assertEqual(sfinxbis('Isaxon'), ('$8285',))
4152
        self.assertEqual(sfinxbis('Isacsson'), ('$8285',))
4153
        self.assertEqual(sfinxbis('Joachimsson'), ('J2585',))
4154
        self.assertEqual(sfinxbis('Joakimson'), ('J2585',))
4155
        self.assertEqual(sfinxbis('Kjell'), ('#4',))
4156
        self.assertEqual(sfinxbis('Käll'), ('#4',))
4157
        self.assertEqual(sfinxbis('Knapp'), ('K51',))
4158
        self.assertEqual(sfinxbis('Krans'), ('K658',))
4159
        self.assertEqual(sfinxbis('Krantz'), ('K6538',))
4160
        self.assertEqual(sfinxbis('Kvist'), ('K783',))
4161
        self.assertEqual(sfinxbis('Quist'), ('K783',))
4162
        self.assertEqual(sfinxbis('Lidbeck'), ('L312',))
4163
        self.assertEqual(sfinxbis('Lidbäck'), ('L312',))
4164
        self.assertEqual(sfinxbis('Linnér'), ('L56',))
4165
        self.assertEqual(sfinxbis('Linner'), ('L56',))
4166
        self.assertEqual(sfinxbis('Lorenzsonn'), ('L6585',))
4167
        self.assertEqual(sfinxbis('Lorentzon'), ('L65385',))
4168
        self.assertEqual(sfinxbis('Lorenßon'), ('L6585',))
4169
        self.assertEqual(sfinxbis('Lyxell'), ('L284',))
4170
        self.assertEqual(sfinxbis('Lycksell'), ('L284',))
4171
        self.assertEqual(sfinxbis('Marcström'), ('M628365',))
4172
        self.assertEqual(sfinxbis('Markström'), ('M628365',))
4173
        self.assertEqual(sfinxbis('Michaelsson'), ('M2485',))
4174
        self.assertEqual(sfinxbis('Mikaelson'), ('M2485',))
4175
        self.assertEqual(sfinxbis('Mörch'), ('M62',))
4176
        self.assertEqual(sfinxbis('Mörck'), ('M62',))
4177
        self.assertEqual(sfinxbis('Mörk'), ('M62',))
4178
        self.assertEqual(sfinxbis('Mørk'), ('M62',))
4179
        self.assertEqual(sfinxbis('Nääs'), ('N8',))
4180
        self.assertEqual(sfinxbis('Naess'), ('N8',))
4181
        self.assertEqual(sfinxbis('Nordstedt'), ('N63833',))
4182
        self.assertEqual(sfinxbis('Oxenstierna'), ('$28583265',))
4183
        self.assertEqual(sfinxbis('Palmçrañtz'), ('P4526538',))
4184
        self.assertEqual(sfinxbis('Palmcrantz'), ('P4526538',))
4185
        self.assertEqual(sfinxbis('Palmkrantz'), ('P4526538',))
4186
        self.assertEqual(sfinxbis('Preuss'), ('P68',))
4187
        self.assertEqual(sfinxbis('Preutz'), ('P638',))
4188
        self.assertEqual(sfinxbis('Richardson'), ('R26385',))
4189
        self.assertEqual(sfinxbis('Rikardson'), ('R26385',))
4190
        self.assertEqual(sfinxbis('Ruuth'), ('R3',))
4191
        self.assertEqual(sfinxbis('Ruth'), ('R3',))
4192
        self.assertEqual(sfinxbis('Sæter'), ('S36',))
4193
        self.assertEqual(sfinxbis('Zäter'), ('S36',))
4194
        self.assertEqual(sfinxbis('Schedin'), ('#35',))
4195
        self.assertEqual(sfinxbis('Sjödin'), ('#35',))
4196
        self.assertEqual(sfinxbis('Siöö'), ('#',))
4197
        self.assertEqual(sfinxbis('Sjöh'), ('#',))
4198
        self.assertEqual(sfinxbis('Svedberg'), ('S73162',))
4199
        self.assertEqual(sfinxbis('Zwedberg'), ('S73162',))
4200
        self.assertEqual(sfinxbis('Tjäder'), ('#36',))
4201
        self.assertEqual(sfinxbis('þornquist'), ('T652783',))
4202
        self.assertEqual(sfinxbis('Thörnqvist'), ('T652783',))
4203
        self.assertEqual(sfinxbis('Törnkvist'), ('T652783',))
4204
        self.assertEqual(sfinxbis('Wichman'), ('V255',))
4205
        self.assertEqual(sfinxbis('Wickman'), ('V255',))
4206
        self.assertEqual(sfinxbis('Wictorin'), ('V2365',))
4207
        self.assertEqual(sfinxbis('Wictorsson'), ('V23685',))
4208
        self.assertEqual(sfinxbis('Viktorson'), ('V23685',))
4209
        self.assertEqual(sfinxbis('Zachrisson'), ('S2685',))
4210
        self.assertEqual(sfinxbis('Zakrison'), ('S2685',))
4211
        self.assertEqual(sfinxbis('Övragård'), ('$76263',))
4212
        self.assertEqual(sfinxbis('Öfvragårdh'), ('$76263',))
4213
        self.assertEqual(sfinxbis('Bogdanovic'), ('B23572',))
4214
        self.assertEqual(sfinxbis('Bogdanovitch'), ('B235732',))
4215
        self.assertEqual(sfinxbis('Dieterich'), ('D362',))
4216
        self.assertEqual(sfinxbis('Eichorn'), ('$265',))
4217
        self.assertEqual(sfinxbis('Friedrich'), ('F6362',))
4218
        self.assertEqual(sfinxbis('Grantcharova'), ('G653267',))
4219
        self.assertEqual(sfinxbis('Ilichev'), ('$427',))
4220
        self.assertEqual(sfinxbis('Ivankovic'), ('$75272',))
4221
        self.assertEqual(sfinxbis('Ivangurich'), ('$75262',))
4222
        self.assertEqual(sfinxbis('Kinch'), ('#52',))
4223
        self.assertEqual(sfinxbis('Kirchmann'), ('#6255',))
4224
        self.assertEqual(sfinxbis('Machado'), ('M23',))
4225
        self.assertEqual(sfinxbis('Reich'), ('R2',))
4226
        self.assertEqual(sfinxbis('Roche'), ('R2',))
4227
        self.assertEqual(sfinxbis('Rubaszkin'), ('R1825',))
4228
        self.assertEqual(sfinxbis('Rubaschkin'), ('R1825',))
4229
        self.assertEqual(sfinxbis('Sanchez'), ('S528',))
4230
        self.assertEqual(sfinxbis('Walukiewicz'), ('V42728',))
4231
        self.assertEqual(sfinxbis('Valukievitch'), ('V42732',))
4232
        self.assertEqual(sfinxbis('K'), ('K',))
4233
        self.assertEqual(sfinxbis('2010'), ('',))
4234
        self.assertEqual(sfinxbis('cese'), ('S8',))
4235
4236
        # a few maxlength tests
4237
        self.assertEqual(sfinxbis('Kiviniemi Birgersson', 3), ('#75', 'B62'))
4238
        self.assertEqual(sfinxbis('Eichorn', 4), ('$265',))
4239
        self.assertEqual(sfinxbis('Friedrich', 4), ('F636',))
4240
        self.assertEqual(sfinxbis('Grantcharova', 4), ('G653',))
4241
        self.assertEqual(sfinxbis('Ilichev', 4), ('$427',))
4242
        self.assertEqual(sfinxbis('Ivankovic', 4), ('$752',))
4243
        self.assertEqual(sfinxbis('Ivangurich', 4), ('$752',))
4244
        self.assertEqual(sfinxbis('Kinch', 4), ('#52',))
4245
        self.assertEqual(sfinxbis('Kirchmann', 4), ('#625',))
4246
        self.assertEqual(sfinxbis('Machado', 4), ('M23',))
4247
        self.assertEqual(sfinxbis('Reich', 4), ('R2',))
4248
        self.assertEqual(sfinxbis('Roche', 4), ('R2',))
4249
        self.assertEqual(sfinxbis('Rubaszkin', 4), ('R182',))
4250
        self.assertEqual(sfinxbis('Rubaschkin', 4), ('R182',))
4251
        self.assertEqual(sfinxbis('Sanchez', 4), ('S528',))
4252
        self.assertEqual(sfinxbis('Walukiewicz', 4), ('V427',))
4253
        self.assertEqual(sfinxbis('Valukievitch', 4), ('V427',))
4254
        self.assertEqual(sfinxbis('K', 4), ('K',))
4255
        self.assertEqual(sfinxbis('2010', 4), ('',))
4256
        self.assertEqual(sfinxbis('cese', 4), ('S8',))
4257
4258
        # etc. (for code coverage)
4259
        self.assertEqual(sfinxbis('chans'), ('#58',))
4260
        self.assertEqual(sfinxbis('ljud'), ('J3',))
4261
        self.assertEqual(sfinxbis('qi'), ('K',))
4262
        self.assertEqual(sfinxbis('xavier'), ('S76',))
4263
        self.assertEqual(sfinxbis('skjul'), ('#4',))
4264
        self.assertEqual(sfinxbis('schul'), ('#4',))
4265
        self.assertEqual(sfinxbis('skil'), ('#4',))
4266
4267
        # maxlength bounds tests
4268
        self.assertEqual(sfinxbis('Niall', maxlength=float('inf')), ('N4',))
4269
        self.assertEqual(sfinxbis('Niall', maxlength=None), ('N4',))
4270
        self.assertEqual(sfinxbis('Niall', maxlength=0), ('N4',))
4271
4272
4273
class PhonetTestCases(unittest.TestCase):
4274
    """Test Phonet functions.
4275
4276
    test cases for abydos.phonetic.phonet
4277
    """
4278
4279
    def test_phonet_german(self):
4280
        """Test abydos.phonetic.phonet (German)."""
4281
        self.assertEqual(phonet(''), '')
4282
4283
        # https://code.google.com/p/phonet4java/source/browse/trunk/src/test/java/com/googlecode/phonet4java/Phonet1Test.java
4284
        self.assertEqual(phonet('', 1), '')
4285
        self.assertEqual(phonet('Zedlitz', 1), 'ZETLIZ')
4286
        self.assertEqual(phonet('Bremerhaven', 1), 'BREMAHAFN')
4287
        self.assertEqual(phonet('Hamburger Hafen', 1), 'HAMBURGA HAFN')
4288
        self.assertEqual(phonet('Jesper', 1), 'IESPA')
4289
        self.assertEqual(phonet('elisabeth', 1), 'ELISABET')
4290
        self.assertEqual(phonet('elisabet', 1), 'ELISABET')
4291
        self.assertEqual(phonet('Ziegler', 1), 'ZIKLA')
4292
        self.assertEqual(phonet('Scherer', 1), 'SHERA')
4293
        self.assertEqual(phonet('Bartels', 1), 'BARTLS')
4294
        self.assertEqual(phonet('Jansen', 1), 'IANSN')
4295
        self.assertEqual(phonet('Sievers', 1), 'SIWAS')
4296
        self.assertEqual(phonet('Michels', 1), 'MICHLS')
4297
        self.assertEqual(phonet('Ewers', 1), 'EWERS')
4298
        self.assertEqual(phonet('Evers', 1), 'EWERS')
4299
        self.assertEqual(phonet('Wessels', 1), 'WESLS')
4300
        self.assertEqual(phonet('Gottschalk', 1), 'GOSHALK')
4301
        self.assertEqual(phonet('Brückmann', 1), 'BRÜKMAN')
4302
        self.assertEqual(phonet('Blechschmidt', 1), 'BLECHSHMIT')
4303
        self.assertEqual(phonet('Kolodziej', 1), 'KOLOTZI')
4304
        self.assertEqual(phonet('Krauße', 1), 'KRAUSE')
4305
        self.assertEqual(phonet('Cachel', 1), 'KESHL')
4306
4307
        self.assertEqual(phonet('', 2), '')
4308
        self.assertEqual(phonet('Zedlitz', 2), 'ZETLIZ')
4309
        self.assertEqual(phonet('Bremerhaven', 2), 'BRENAFN')
4310
        self.assertEqual(phonet('Schönberg', 2), 'ZÖNBAK')
4311
        self.assertEqual(phonet('Hamburger Hafen', 2), 'ANBURKA AFN')
4312
        self.assertEqual(phonet('Ziegler', 2), 'ZIKLA')
4313
        self.assertEqual(phonet('Scherer', 2), 'ZERA')
4314
        self.assertEqual(phonet('Jansen', 2), 'IANZN')
4315
        self.assertEqual(phonet('Eberhardt', 2), 'EBART')
4316
        self.assertEqual(phonet('Gottschalk', 2), 'KUZALK')
4317
        self.assertEqual(phonet('Brückmann', 2), 'BRIKNAN')
4318
        self.assertEqual(phonet('Blechschmidt', 2), 'BLEKZNIT')
4319
        self.assertEqual(phonet('Kolodziej', 2), 'KULUTZI')
4320
        self.assertEqual(phonet('Krauße', 2), 'KRAUZE')
4321
4322
        # etc. (for code coverage)
4323
        self.assertEqual(phonet('Jesper', 1), 'IESPA')
4324
        self.assertEqual(phonet('Glacéhandschuh', 1), 'GLAZANSHU')
4325
        self.assertEqual(phonet('Blechschmidt', 1), 'BLECHSHMIT')
4326
        self.assertEqual(phonet('Burgdorf', 1), 'BURKDORF')
4327
        self.assertEqual(phonet('Holzschuh', 1), 'HOLSHU')
4328
        self.assertEqual(phonet('Aachen', 1), 'ACHN')
4329
        self.assertEqual(phonet('Abendspaziergang', 1), 'ABENTSPAZIRGANK')
4330
4331
    def test_phonet_nolang(self):
4332
        """Test abydos.phonetic.phonet (no language)."""
4333
        self.assertEqual(phonet('', lang='none'), '')
4334
4335
        # https://code.google.com/p/phonet4java/source/browse/trunk/src/test/java/com/googlecode/phonet4java/Phonet1Test.java
4336
        self.assertEqual(phonet('', 1, 'none'), '')
4337
        self.assertEqual(phonet('Zedlitz', 1, 'none'), 'ZEDLITZ')
4338
        self.assertEqual(phonet('Bremerhaven', 1, 'none'), 'BREMERHAVEN')
4339
        self.assertEqual(phonet('Schönberg', 2, 'none'), 'SCHOENBERG')
4340
        self.assertEqual(phonet('Brückmann', 1, 'none'), 'BRUECKMAN')
4341
        self.assertEqual(phonet('Krauße', 1, 'none'), 'KRAUSE')
4342
4343
        self.assertEqual(phonet('', 2, 'none'), '')
4344
        self.assertEqual(phonet('Zedlitz', 2, 'none'), 'ZEDLITZ')
4345
        self.assertEqual(phonet('Bremerhaven', 2, 'none'), 'BREMERHAVEN')
4346
        self.assertEqual(phonet('Schönberg', 2, 'none'), 'SCHOENBERG')
4347
        self.assertEqual(phonet('Brückmann', 2, 'none'), 'BRUECKMAN')
4348
        self.assertEqual(phonet('Krauße', 2, 'none'), 'KRAUSE')
4349
4350
    def test_phonet_nachnamen(self):
4351
        """Test abydos.phonetic.phonet (Nachnamen set)."""
4352
        if not ALLOW_RANDOM:
4353
            return
4354
        with codecs.open(TESTDIR + '/corpora/nachnamen.csv',
4355
                         encoding='utf-8') as nachnamen_testset:
4356
            for nn_line in nachnamen_testset:
4357
                if nn_line[0] != '#':
4358
                    nn_line = nn_line.strip().split(',')
4359
                    # This test set is very large (~10000 entries)
4360
                    # so let's just randomly select about 100 for testing
4361
                    if len(nn_line) >= 3 and one_in(100):
4362
                        (term, ph1, ph2) = nn_line
4363
                        self.assertEqual(phonet(term, 1), ph1)
4364
                        self.assertEqual(phonet(term, 2), ph2)
4365
4366
    def test_phonet_ngerman(self):
4367
        """Test abydos.phonetic.phonet (ngerman set)."""
4368
        if not ALLOW_RANDOM:
4369
            return
4370
        with codecs.open(TESTDIR + '/corpora/ngerman.csv',
4371
                         encoding='utf-8') as ngerman_testset:
4372
            for ng_line in ngerman_testset:
4373
                if ng_line[0] != '#':
4374
                    ng_line = ng_line.strip().split(',')
4375
                    # This test set is very large (~3000000 entries)
4376
                    # so let's just randomly select about 30 for testing
4377
                    if len(ng_line) >= 3 and one_in(10000):
4378
                        (term, ph1, ph2) = ng_line
4379
                        self.assertEqual(phonet(term, 1), ph1)
4380
                        self.assertEqual(phonet(term, 2), ph2)
4381
4382
4383
class SPFCTestCases(unittest.TestCase):
4384
    """Test SPFC functions.
4385
4386
    test cases for abydos.phonetic.spfc
4387
    """
4388
4389
    def test_spfc(self):
4390
        """Test abydos.phonetic.spfc."""
4391
        self.assertEqual(spfc(''), '')
4392
4393
        # https://archive.org/stream/accessingindivid00moor#page/19/mode/1up
4394
        self.assertEqual(spfc(('J', 'KUHNS')), '16760')
4395
        self.assertEqual(spfc(('G', 'ALTSHULER')), '35797')
4396
        self.assertEqual(spfc('J KUHNS'), '16760')
4397
        self.assertEqual(spfc('G ALTSHULER'), '35797')
4398
        self.assertEqual(spfc('J. KUHNS'), '16760')
4399
        self.assertEqual(spfc('G. ALTSHULER'), '35797')
4400
        self.assertEqual(spfc('J. Kuhns'), '16760')
4401
        self.assertEqual(spfc('G. Altshuler'), '35797')
4402
        self.assertEqual(spfc('T. Vines'), '16760')
4403
        self.assertEqual(spfc('J. Butler'), '35779')
4404
        self.assertNotEqual(spfc('J. Kuhns'), spfc('J. Kuntz'))
4405
        self.assertEqual(spfc('Jon Kuhns'), '16760')
4406
        self.assertEqual(spfc('James Kuhns'), '16760')
4407
4408
        self.assertRaises(AttributeError, spfc, ('J', 'A', 'Kuhns'))
4409
        self.assertRaises(AttributeError, spfc, 'JKuhns')
4410
        self.assertRaises(AttributeError, spfc, 5)
4411
4412
        # etc. (for code coverage)
4413
        self.assertEqual(spfc('James Goldstein'), '78795')
4414
        self.assertEqual(spfc('James Hansen'), '58760')
4415
        self.assertEqual(spfc('James Hester'), '59700')
4416
        self.assertEqual(spfc('James Bardot'), '31745')
4417
        self.assertEqual(spfc('James Windsor'), '29765')
4418
        self.assertEqual(spfc('James Wenders'), '27760')
4419
        self.assertEqual(spfc('James Ventor'), '17760')
4420
        self.assertEqual(spfc('þ þ'), '00')
4421
4422
4423
class StatisticsCanadaTestCases(unittest.TestCase):
4424
    """Test Statistics Canada functions.
4425
4426
    test cases for abydos.phonetic.statistics_canada
4427
    """
4428
4429
    def test_statistics_canada(self):
4430
        """Test abydos.phonetic.statistics_canada."""
4431
        self.assertEqual(statistics_canada(''), '')
4432
4433
        # https://naldc.nal.usda.gov/download/27833/PDF
4434
        self.assertEqual(statistics_canada('Daves'), 'DVS')
4435
        self.assertEqual(statistics_canada('Davies'), 'DVS')
4436
        self.assertEqual(statistics_canada('Devese'), 'DVS')
4437
        self.assertEqual(statistics_canada('Devies'), 'DVS')
4438
        self.assertEqual(statistics_canada('Devos'), 'DVS')
4439
4440
        self.assertEqual(statistics_canada('Smathers'), 'SMTH')
4441
        self.assertEqual(statistics_canada('Smithart'), 'SMTH')
4442
        self.assertEqual(statistics_canada('Smithbower'), 'SMTH')
4443
        self.assertEqual(statistics_canada('Smitherman'), 'SMTH')
4444
        self.assertEqual(statistics_canada('Smithey'), 'SMTH')
4445
        self.assertEqual(statistics_canada('Smithgall'), 'SMTH')
4446
        self.assertEqual(statistics_canada('Smithingall'), 'SMTH')
4447
        self.assertEqual(statistics_canada('Smithmyer'), 'SMTH')
4448
        self.assertEqual(statistics_canada('Smithpeter'), 'SMTH')
4449
        self.assertEqual(statistics_canada('Smithson'), 'SMTH')
4450
        self.assertEqual(statistics_canada('Smithy'), 'SMTH')
4451
        self.assertEqual(statistics_canada('Smotherman'), 'SMTH')
4452
        self.assertEqual(statistics_canada('Smothers'), 'SMTH')
4453
        self.assertEqual(statistics_canada('Smyth'), 'SMTH')
4454
4455
        # Additional tests from @Yomguithereal's talisman
4456
        # https://github.com/Yomguithereal/talisman/blob/master/test/phonetics/statcan.js
4457
        self.assertEqual(statistics_canada('Guillaume'), 'GLM')
4458
        self.assertEqual(statistics_canada('Arlène'), 'ARLN')
4459
        self.assertEqual(statistics_canada('Lüdenscheidt'), 'LDNS')
4460
4461
4462
class LeinTestCases(unittest.TestCase):
4463
    """Test Lein functions.
4464
4465
    test cases for abydos.phonetic.lein
4466
    """
4467
4468
    def test_lein(self):
4469
        """Test abydos.phonetic.lein."""
4470
        self.assertEqual(lein(''), '')
4471
4472
        # https://naldc.nal.usda.gov/download/27833/PDF
4473
        self.assertEqual(lein('Dubose'), 'D450')
4474
        self.assertEqual(lein('Dubs'), 'D450')
4475
        self.assertEqual(lein('Dubbs'), 'D450')
4476
        self.assertEqual(lein('Doviak'), 'D450')
4477
        self.assertEqual(lein('Dubke'), 'D450')
4478
        self.assertEqual(lein('Dubus'), 'D450')
4479
        self.assertEqual(lein('Dubois'), 'D450')
4480
        self.assertEqual(lein('Duboise'), 'D450')
4481
        self.assertEqual(lein('Doubek'), 'D450')
4482
        self.assertEqual(lein('Defigh'), 'D450')
4483
        self.assertEqual(lein('Defazio'), 'D450')
4484
        self.assertEqual(lein('Debaca'), 'D450')
4485
        self.assertEqual(lein('Dabbs'), 'D450')
4486
        self.assertEqual(lein('Davies'), 'D450')
4487
        self.assertEqual(lein('Dubukey'), 'D450')
4488
        self.assertEqual(lein('Debus'), 'D450')
4489
        self.assertEqual(lein('Debose'), 'D450')
4490
        self.assertEqual(lein('Daves'), 'D450')
4491
        self.assertEqual(lein('Dipiazza'), 'D450')
4492
        self.assertEqual(lein('Dobbs'), 'D450')
4493
        self.assertEqual(lein('Dobak'), 'D450')
4494
        self.assertEqual(lein('Dobis'), 'D450')
4495
        self.assertEqual(lein('Dobish'), 'D450')
4496
        self.assertEqual(lein('Doepke'), 'D450')
4497
        self.assertEqual(lein('Divish'), 'D450')
4498
        self.assertEqual(lein('Dobosh'), 'D450')
4499
        self.assertEqual(lein('Dupois'), 'D450')
4500
        self.assertEqual(lein('Dufek'), 'D450')
4501
        self.assertEqual(lein('Duffek'), 'D450')
4502
        self.assertEqual(lein('Dupuis'), 'D450')
4503
        self.assertEqual(lein('Dupas'), 'D450')
4504
        self.assertEqual(lein('Devese'), 'D450')
4505
        self.assertEqual(lein('Devos'), 'D450')
4506
        self.assertEqual(lein('Deveaux'), 'D450')
4507
        self.assertEqual(lein('Devies'), 'D450')
4508
4509
        self.assertEqual(lein('Sand'), 'S210')
4510
        self.assertEqual(lein('Sandau'), 'S210')
4511
        self.assertEqual(lein('Sande'), 'S210')
4512
        self.assertEqual(lein('Sandia'), 'S210')
4513
        self.assertEqual(lein('Sando'), 'S210')
4514
        self.assertEqual(lein('Sandoe'), 'S210')
4515
        self.assertEqual(lein('Sandy'), 'S210')
4516
        self.assertEqual(lein('Santee'), 'S210')
4517
        self.assertEqual(lein('Santi'), 'S210')
4518
        self.assertEqual(lein('Santo'), 'S210')
4519
        self.assertEqual(lein('Send'), 'S210')
4520
        self.assertEqual(lein('Sennet'), 'S210')
4521
        self.assertEqual(lein('Shemoit'), 'S210')
4522
        self.assertEqual(lein('Shenot'), 'S210')
4523
        self.assertEqual(lein('Shumate'), 'S210')
4524
        self.assertEqual(lein('Simmet'), 'S210')
4525
        self.assertEqual(lein('Simot'), 'S210')
4526
        self.assertEqual(lein('Sineath'), 'S210')
4527
        self.assertEqual(lein('Sinnott'), 'S210')
4528
        self.assertEqual(lein('Sintay'), 'S210')
4529
        self.assertEqual(lein('Smead'), 'S210')
4530
        self.assertEqual(lein('Smeda'), 'S210')
4531
        self.assertEqual(lein('Smit'), 'S210')
4532
4533
        # Additional tests from @Yomguithereal's talisman
4534
        # https://github.com/Yomguithereal/talisman/blob/master/test/phonetics/lein.js
4535
        self.assertEqual(lein('Guillaume'), 'G320')
4536
        self.assertEqual(lein('Arlène'), 'A332')
4537
        self.assertEqual(lein('Lüdenscheidt'), 'L125')
4538
4539
        # Coverage
4540
        self.assertEqual(lein('Lüdenscheidt', zero_pad=False), 'L125')
4541
        self.assertEqual(lein('Smith', zero_pad=False), 'S21')
4542
4543
4544
class RogerRootTestCases(unittest.TestCase):
4545
    """Test Roger Root functions.
4546
4547
    test cases for abydos.phonetic.roger_root
4548
    """
4549
4550
    def test_roger_root(self):
4551
        """Test abydos.phonetic.roger_root."""
4552
        self.assertEqual(roger_root(''), '00000')
4553
4554
        # https://naldc.nal.usda.gov/download/27833/PDF
4555
        self.assertEqual(roger_root('BROWNER'), '09424')
4556
        self.assertEqual(roger_root('STANLEY'), '00125')
4557
        self.assertEqual(roger_root('CHALMAN'), '06532')
4558
        self.assertEqual(roger_root('CHING'), '06270')
4559
        self.assertEqual(roger_root('ANDERSON'), '12140')
4560
        self.assertEqual(roger_root('OVERSTREET'), '18401')
4561
        self.assertEqual(roger_root('HECKEL'), '27500')
4562
        self.assertEqual(roger_root('WYSZYNSKI'), '40207')
4563
        self.assertEqual(roger_root('WHITTED'), '41100')
4564
        self.assertEqual(roger_root('ONGOQO'), '12770')  # PDF had a typo?
4565
        self.assertEqual(roger_root('JOHNSON'), '32020')
4566
        self.assertEqual(roger_root('WILLIAMS'), '45300')
4567
        self.assertEqual(roger_root('SMITH'), '00310')
4568
        self.assertEqual(roger_root('JONES'), '32000')
4569
        self.assertEqual(roger_root('BROWN'), '09420')
4570
        self.assertEqual(roger_root('DAVIS'), '01800')
4571
        self.assertEqual(roger_root('JACKSON'), '37020')
4572
        self.assertEqual(roger_root('WILSON'), '45020')
4573
        self.assertEqual(roger_root('LEE'), '05000')
4574
        self.assertEqual(roger_root('THOMAS'), '01300')
4575
4576
        self.assertEqual(roger_root('Defouw'), '01800')
4577
        self.assertEqual(roger_root('Dauphi'), '01800')
4578
        self.assertEqual(roger_root('Defazio'), '01800')
4579
        self.assertEqual(roger_root('Defay'), '01800')
4580
        self.assertEqual(roger_root('Davy'), '01800')
4581
        self.assertEqual(roger_root('Defee'), '01800')
4582
        self.assertEqual(roger_root('Dayhoff'), '01800')
4583
        self.assertEqual(roger_root('Davie'), '01800')
4584
        self.assertEqual(roger_root('Davey'), '01800')
4585
        self.assertEqual(roger_root('Davies'), '01800')
4586
        self.assertEqual(roger_root('Daves'), '01800')
4587
        self.assertEqual(roger_root('Deife'), '01800')
4588
        self.assertEqual(roger_root('Dehoff'), '01800')
4589
        self.assertEqual(roger_root('Devese'), '01800')
4590
        self.assertEqual(roger_root('Devoe'), '01800')
4591
        self.assertEqual(roger_root('Devee'), '01800')
4592
        self.assertEqual(roger_root('Devies'), '01800')
4593
        self.assertEqual(roger_root('Devos'), '01800')
4594
        self.assertEqual(roger_root('Dafoe'), '01800')
4595
        self.assertEqual(roger_root('Dove'), '01800')
4596
        self.assertEqual(roger_root('Duff'), '01800')
4597
        self.assertEqual(roger_root('Duffey'), '01800')
4598
        self.assertEqual(roger_root('Duffie'), '01800')
4599
        self.assertEqual(roger_root('Duffy'), '01800')
4600
        self.assertEqual(roger_root('Duyava'), '01800')
4601
        self.assertEqual(roger_root('Tafoya'), '01800')
4602
        self.assertEqual(roger_root('Tevis'), '01800')
4603
        self.assertEqual(roger_root('Tiffee'), '01800')
4604
        self.assertEqual(roger_root('Tivis'), '01800')
4605
        self.assertEqual(roger_root('Thevis'), '01800')
4606
        self.assertEqual(roger_root('Tovey'), '01800')
4607
        self.assertEqual(roger_root('Toeves'), '01800')
4608
        self.assertEqual(roger_root('Tuffs'), '01800')
4609
4610
        self.assertEqual(roger_root('Samotid'), '00311')
4611
        self.assertEqual(roger_root('Simmet'), '00310')
4612
        self.assertEqual(roger_root('Simot'), '00310')
4613
        self.assertEqual(roger_root('Smead'), '00310')
4614
        self.assertEqual(roger_root('Smeda'), '00310')
4615
        self.assertEqual(roger_root('Smit'), '00310')
4616
        self.assertEqual(roger_root('Smite'), '00310')
4617
        self.assertEqual(roger_root('Smithe'), '00310')
4618
        self.assertEqual(roger_root('Smithey'), '00310')
4619
        self.assertEqual(roger_root('Smithson'), '00310')
4620
        self.assertEqual(roger_root('Smithy'), '00310')
4621
        self.assertEqual(roger_root('Smoot'), '00310')
4622
        self.assertEqual(roger_root('Smyth'), '00310')
4623
        self.assertEqual(roger_root('Szmodis'), '00310')
4624
        self.assertEqual(roger_root('Zemaitis'), '00310')
4625
        self.assertEqual(roger_root('Zmuda'), '00310')
4626
4627
        # Additional tests from @Yomguithereal's talisman
4628
        # https://github.com/Yomguithereal/talisman/blob/master/test/phonetics/roger-root.js
4629
        self.assertEqual(roger_root('Guillaume'), '07530')
4630
        self.assertEqual(roger_root('Arlène'), '14520')
4631
        self.assertEqual(roger_root('Lüdenscheidt'), '05126')
4632
4633
        # no zero_pad
4634
        self.assertEqual(roger_root('BROWNER', zero_pad=False), '09424')
4635
        self.assertEqual(roger_root('STANLEY', zero_pad=False), '00125')
4636
        self.assertEqual(roger_root('CHALMAN', zero_pad=False), '06532')
4637
        self.assertEqual(roger_root('CHING', zero_pad=False), '0627')
4638
        self.assertEqual(roger_root('ANDERSON', zero_pad=False), '12140')
4639
        self.assertEqual(roger_root('OVERSTREET, zero_pad=False'), '18401')
4640
        self.assertEqual(roger_root('HECKEL', zero_pad=False), '275')
4641
        self.assertEqual(roger_root('WYSZYNSKI', zero_pad=False), '40207')
4642
        self.assertEqual(roger_root('WHITTED', zero_pad=False), '411')
4643
        self.assertEqual(roger_root('ONGOQO', zero_pad=False), '1277')
4644
        self.assertEqual(roger_root('JOHNSON', zero_pad=False), '3202')
4645
        self.assertEqual(roger_root('WILLIAMS', zero_pad=False), '4530')
4646
        self.assertEqual(roger_root('SMITH', zero_pad=False), '0031')
4647
        self.assertEqual(roger_root('JONES', zero_pad=False), '320')
4648
        self.assertEqual(roger_root('BROWN', zero_pad=False), '0942')
4649
        self.assertEqual(roger_root('DAVIS', zero_pad=False), '0180')
4650
        self.assertEqual(roger_root('JACKSON', zero_pad=False), '3702')
4651
        self.assertEqual(roger_root('WILSON', zero_pad=False), '4502')
4652
        self.assertEqual(roger_root('LEE', zero_pad=False), '05')
4653
        self.assertEqual(roger_root('THOMAS', zero_pad=False), '0130')
4654
4655
4656
class ONCATestCases(unittest.TestCase):
4657
    """Test ONCA functions.
4658
4659
    test cases for abydos.phonetic.onca
4660
    """
4661
4662
    def test_onca(self):
4663
        """Test abydos.phonetic.onca."""
4664
        # https://nces.ed.gov/FCSM/pdf/RLT97.pdf
4665
        self.assertEqual(onca('HALL'), 'H400')
4666
        self.assertEqual(onca('SMITH'), 'S530')
4667
4668
        # http://nchod.uhce.ox.ac.uk/NCHOD%20Oxford%20E5%20Report%201st%20Feb_VerAM2.pdf
4669
        self.assertEqual(onca('HAWTON'), 'H350')
4670
        self.assertEqual(onca('HORTON'), 'H635')
4671
        self.assertEqual(onca('HOUGHTON'), 'H235')
4672
4673
4674
class EudexTestCases(unittest.TestCase):
4675
    """Test eudex functions.
4676
4677
    test cases for abydos.phonetic.eudex
4678
    """
4679
4680
    def test_eudex(self):
4681
        """Test abydos.phonetic.eudex."""
4682
        # base cases
4683
        self.assertEqual(eudex(''), 18374686479671623680)
4684
        self.assertEqual(eudex(' '), 18374686479671623680)
4685
4686
        # exact & mismatch cases from
4687
        # https://github.com/ticki/eudex/blob/master/src/tests.rs
4688
        self.assertEqual(eudex('JAva'), eudex('jAva'))
4689
        self.assertEqual(eudex('co!mputer'), eudex('computer'))
4690
        self.assertEqual(eudex('comp-uter'), eudex('computer'))
4691
        self.assertEqual(eudex('comp@u#te?r'), eudex('computer'))
4692
        self.assertEqual(eudex('lal'), eudex('lel'))
4693
        self.assertEqual(eudex('rindom'), eudex('ryndom'))
4694
        self.assertEqual(eudex('riiiindom'), eudex('ryyyyyndom'))
4695
        self.assertEqual(eudex('riyiyiiindom'), eudex('ryyyyyndom'))
4696
        self.assertEqual(eudex('triggered'), eudex('TRIGGERED'))
4697
        self.assertEqual(eudex('repert'), eudex('ropert'))
4698
4699
        self.assertNotEqual(eudex('reddit'), eudex('eddit'))
4700
        self.assertNotEqual(eudex('lol'), eudex('lulz'))
4701
        self.assertNotEqual(eudex('ijava'), eudex('java'))
4702
        self.assertNotEqual(eudex('jiva'), eudex('java'))
4703
        self.assertNotEqual(eudex('jesus'), eudex('iesus'))
4704
        self.assertNotEqual(eudex('aesus'), eudex('iesus'))
4705
        self.assertNotEqual(eudex('iesus'), eudex('yesus'))
4706
        self.assertNotEqual(eudex('rupirt'), eudex('ropert'))
4707
        self.assertNotEqual(eudex('ripert'), eudex('ropyrt'))
4708
        self.assertNotEqual(eudex('rrr'), eudex('rraaaa'))
4709
        self.assertNotEqual(eudex('randomal'), eudex('randomai'))
4710
4711
        # manually checked against algorithm
4712
        self.assertEqual(eudex('guillaume'), 288230383131034112)
4713
        self.assertEqual(eudex('niall'), 648518346341351840)
4714
        self.assertEqual(eudex('hello'), 144115188075896832)
4715
        self.assertEqual(eudex('christopher'), 433648490138894409)
4716
        self.assertEqual(eudex('colin'), 432345564238053650)
4717
4718
4719
class HaasePhonetikTestCases(unittest.TestCase):
4720
    """Test Haase Phonetik functions.
4721
4722
    test cases for abydos.phonetic.haase_phonetik
4723
    """
4724
4725
    def test_haase_phonetik(self):
4726
        """Test abydos.phonetic.haase_phonetik."""
4727
        # Base cases
4728
        self.assertEqual(haase_phonetik(''), ('',))
4729
4730
        # equivalents
4731
        self.assertEqual(haase_phonetik('Häschen'), haase_phonetik('Haeschen'))
4732
        self.assertEqual(haase_phonetik('Schloß'), haase_phonetik('Schloss'))
4733
        self.assertEqual(haase_phonetik('üben'), haase_phonetik('ueben'))
4734
        self.assertEqual(haase_phonetik('Eichörnchen'),
4735
                         haase_phonetik('Eichoernchen'))
4736
4737
        # coverage completion
4738
        self.assertEqual(haase_phonetik('Häschen'), ('9896', '9496'))
4739
        self.assertEqual(haase_phonetik('Häschen', primary_only=True),
4740
                         ('9896',))
4741
        self.assertEqual(haase_phonetik('Eichörnchen'), ('94976496',))
4742
        self.assertEqual(haase_phonetik('Hexe'), ('9489',))
4743
        self.assertEqual(haase_phonetik('Chemie'), ('4969', '8969'))
4744
4745
        self.assertEqual(haase_phonetik('Brille'), ('17959', '179'))
4746
        self.assertEqual(haase_phonetik('Brilleille'),
4747
                         ('1795959', '17959', '179'))
4748
        self.assertEqual(haase_phonetik('Niveau'), ('6939',))
4749
        self.assertEqual(haase_phonetik('Korb'), ('4971', '4973'))
4750
        self.assertEqual(haase_phonetik('Heino'), ('969', '9693'))
4751
        self.assertEqual(haase_phonetik('Nekka'), ('6949', '69497'))
4752
        self.assertEqual(haase_phonetik('Aleph'), ('9593',))
4753
        self.assertEqual(haase_phonetik('Aleppo'), ('95919', '959193'))
4754
        self.assertEqual(haase_phonetik('Endzipfel'), ('96891395',))
4755
        self.assertEqual(haase_phonetik('verbrandt'), ('39717962', '39737962'))
4756
        self.assertEqual(haase_phonetik('Cent'), ('8962',))
4757
        self.assertEqual(haase_phonetik('addiscendae'), ('92989629',))
4758
        self.assertEqual(haase_phonetik('kickx'), ('4948',))
4759
        self.assertEqual(haase_phonetik('sanctionen'), ('896829696',))
4760
4761
4762
class RethSchekTestCases(unittest.TestCase):
4763
    """Test Reth-Schek Phonetik functions.
4764
4765
    test cases for abydos.phonetic.reth_schek_phonetik
4766
    """
4767
4768
    def test_reth_schek_phonetik(self):
4769
        """Test abydos.phonetic.reth_schek_phonetik."""
4770
        # Base cases
4771
        self.assertEqual(reth_schek_phonetik(''), '')
4772
4773
        # equivalents
4774
        self.assertEqual(reth_schek_phonetik('Häschen'),
4775
                         reth_schek_phonetik('Haeschen'))
4776
        self.assertEqual(reth_schek_phonetik('Schloß'),
4777
                         reth_schek_phonetik('Schloss'))
4778
        self.assertEqual(reth_schek_phonetik('üben'),
4779
                         reth_schek_phonetik('ueben'))
4780
        self.assertEqual(reth_schek_phonetik('Eichörnchen'),
4781
                         reth_schek_phonetik('Eichoernchen'))
4782
4783
        self.assertEqual(reth_schek_phonetik('Häschen'), 'HESCHEN')
4784
        self.assertEqual(reth_schek_phonetik('Eichörnchen'), 'AIGHOERNGHEN')
4785
        self.assertEqual(reth_schek_phonetik('Hexe'), 'HEXE')
4786
        self.assertEqual(reth_schek_phonetik('Chemie'), 'GHEMI')
4787
        self.assertEqual(reth_schek_phonetik('Brille'), 'BRILE')
4788
        self.assertEqual(reth_schek_phonetik('Brilleille'), 'BRILAILE')
4789
        self.assertEqual(reth_schek_phonetik('Niveau'), 'NIFEAU')
4790
        self.assertEqual(reth_schek_phonetik('Korb'), 'GORB')
4791
        self.assertEqual(reth_schek_phonetik('Heino'), 'HAINO')
4792
        self.assertEqual(reth_schek_phonetik('Nekka'), 'NEKA')
4793
        self.assertEqual(reth_schek_phonetik('Aleph'), 'ALEF')
4794
        self.assertEqual(reth_schek_phonetik('Aleppo'), 'ALEBO')
4795
        self.assertEqual(reth_schek_phonetik('Endzipfel'), 'ENDZIBFL')
4796
        self.assertEqual(reth_schek_phonetik('verbrandt'), 'FERBRAND')
4797
        self.assertEqual(reth_schek_phonetik('Cent'), 'GEND')
4798
        self.assertEqual(reth_schek_phonetik('addiscendae'), 'ADISGENDE')
4799
        self.assertEqual(reth_schek_phonetik('kickx'), 'GIGX')
4800
        self.assertEqual(reth_schek_phonetik('sanctionen'), 'SANGDIONEN')
4801
        self.assertEqual(reth_schek_phonetik('Kuh'), 'GU')
4802
        self.assertEqual(reth_schek_phonetik('lecker'), 'LEGR')
4803
        self.assertEqual(reth_schek_phonetik('rödlich'), 'ROEDLIG')
4804
4805
4806
class FonemTestCases(unittest.TestCase):
4807
    """Test FONEM functions.
4808
4809
    test cases for abydos.phonetic.fonem
4810
    """
4811
4812
    def test_fonem(self):
4813
        """Test abydos.phonetic.fonem."""
4814
        # Base cases
4815
        self.assertEqual(fonem(''), '')
4816
4817
        # Test cases, mostly from the FONEM specification,
4818
        # but copied from Talisman:
4819
        # https://github.com/Yomguithereal/talisman/blob/master/test/phonetics/french/fonem.js
4820
        test_cases = (
4821
            ('BEAULAC', 'BOLAK'),
4822
            ('BAULAC', 'BOLAK'),
4823
            ('IMBEAULT', 'INBO'),
4824
            ('DUFAUT', 'DUFO'),
4825
            ('THIBOUTOT', 'TIBOUTOT'),
4826
            ('DEVAUX', 'DEVO'),
4827
            ('RONDEAUX', 'RONDO'),
4828
            ('BOURGAULX', 'BOURGO'),
4829
            ('PINCHAUD', 'PINCHO'),
4830
            ('PEDNAULD', 'PEDNO'),
4831
            ('MAZENOD', 'MASENOD'),
4832
            ('ARNOLD', 'ARNOL'),
4833
            ('BERTOLD', 'BERTOL'),
4834
            ('BELLAY', 'BELE'),
4835
            ('SANDAY', 'SENDE'),
4836
            ('GAY', 'GAI'),
4837
            ('FAYARD', 'FAYAR'),
4838
            ('LEMIEUX', 'LEMIEU'),
4839
            ('LHEUREUX', 'LEUREU'),
4840
            ('BELLEY', 'BELE'),
4841
            ('WELLEY', 'WELE'),
4842
            ('MEYER', 'MEYER'),
4843
            ('BOILY', 'BOILI'),
4844
            ('LOYSEAU', 'LOISO'),
4845
            ('MAYRAND', 'MAIREN'),
4846
            ('GUYON', 'GUYON'),
4847
            ('FAILLARD', 'FAYAR'),
4848
            ('FAIARD', 'FAYAR'),
4849
            ('MEIER', 'MEYER'),
4850
            ('MEILLER', 'MEYER'),
4851
            ('GUILLON', 'GUYON'),
4852
            ('LAVILLE', 'LAVILLE'),
4853
            ('COUET', 'CWET'),
4854
            ('EDOUARD', 'EDWAR'),
4855
            ('GIROUARD', 'JIRWAR'),
4856
            ('OZOUADE', 'OSWADE'),  # differs from test set
4857
            ('BOUILLE', 'BOUYE'),
4858
            ('POUYEZ', 'POUYES'),  # differs from test set
4859
            ('LEMEE', 'LEME'),
4860
            ('ABRAAM', 'ABRAM'),
4861
            ('ARCHEMBAULT', 'ARCHENBO'),
4862
            ('AMTHIME', 'ENTIME'),
4863
            ('ROMPRE', 'RONPRE'),
4864
            ('BOMSECOURS', 'BONSECOURS'),
4865
            ('BOULANGER', 'BOULENJER'),
4866
            ('TANCREDE', 'TENKREDE'),
4867
            ('BLAIN', 'BLIN'),
4868
            ('BLAINVILLE', 'BLINVILLE'),
4869
            ('MAINARD', 'MAINAR'),
4870
            ('RAIMOND', 'RAIMON'),
4871
            ('BLACKBORN', 'BLAKBURN'),
4872
            ('SEABOURNE', 'SEABURN'),
4873
            ('IMBO', 'INBO'),
4874
            ('RIMFRET', 'RINFRET'),
4875
            ('LEFEBVRE', 'LEFEVRE'),
4876
            ('MACE', 'MASSE'),
4877
            ('MACON', 'MACON'),
4878
            ('MARCELIN', 'MARSELIN'),
4879
            ('MARCEAU', 'MARSO'),
4880
            ('VINCELETTE', 'VINSELETE'),
4881
            ('FORCADE', 'FORCADE'),
4882
            ('CELINE', 'SELINE'),
4883
            ('CERAPHIN', 'SERAFIN'),
4884
            ('CAMILLE', 'KAMILLE'),
4885
            ('CAYETTE', 'KAYETE'),
4886
            ('CARINE', 'KARINE'),
4887
            ('LUC', 'LUK'),
4888
            ('LEBLANC', 'LEBLEN'),
4889
            ('VICTOR', 'VIKTOR'),
4890
            ('LACCOULINE', 'LAKOULINE'),
4891
            ('MACCIMILIEN', 'MAXIMILIEN'),
4892
            ('MAGELLA', 'MAJELA'),
4893
            ('GINETTE', 'JINETE'),
4894
            ('GANDET', 'GANDET'),
4895
            ('GEORGES', 'JORJES'),
4896
            ('GEOFFROID', 'JOFROID'),
4897
            ('PAGEAU', 'PAJO'),
4898
            ('GAGNION', 'GAGNON'),
4899
            ('MIGNIER', 'MIGNER'),
4900
            ('HALLEY', 'ALE'),
4901
            ('GAUTHIER', 'GOTIER'),
4902
            ('CHARTIER', 'CHARTIER'),
4903
            ('JEANNE', 'JANE'),
4904
            ('MACGREGOR', 'MACGREGOR'),
4905
            ('MACKAY', 'MACKE'),
4906
            ('MCNICOL', 'MACNICOL'),
4907
            ('MCNEIL', 'MACNEIL'),
4908
            ('PHANEUF', 'FANEUF'),
4909
            ('PHILIPPE', 'FILIPE'),
4910
            ('QUENNEVILLE', 'KENEVILLE'),
4911
            ('LAROCQUE', 'LAROKE'),
4912
            ('SCIPION', 'SIPION'),
4913
            ('ASCELIN', 'ASSELIN'),
4914
            ('VASCO', 'VASKO'),
4915
            ('PASCALINE', 'PASKALINE'),
4916
            ('ESHEMBACK', 'ECHENBAK'),
4917
            ('ASHED', 'ACHED'),
4918
            ('GRATIA', 'GRASSIA'),
4919
            ('PATRITIA', 'PATRISSIA'),
4920
            ('BERTIO', 'BERTIO'),
4921
            ('MATIEU', 'MATIEU'),
4922
            ('BERTIAUME', 'BERTIOME'),
4923
            ('MUNROW', 'MUNRO'),
4924
            ('BRANISLAW', 'BRANISLA'),
4925
            ('LOWMEN', 'LOMEN'),
4926
            ('ANDREW', 'ENDREW'),
4927
            ('EXCEL', 'EXEL'),
4928
            ('EXCERINE', 'EXERINE'),
4929
            ('EXSILDA', 'EXILDA'),
4930
            ('EXZELDA', 'EXELDA'),
4931
            ('CAZEAU', 'KASO'),
4932
            ('BRAZEAU', 'BRASO'),
4933
            ('FITZPATRICK', 'FITSPATRIK'),
4934
            ('SINGELAIS', 'ST-JELAIS'),
4935
            ('CINQMARS', 'ST-MARS'),
4936
            ('SAINT-AMAND', 'ST-AMEN'),
4937
            ('SAINTECROIX', 'STE-KROIX'),
4938
            ('ST-HILAIRE', 'ST-ILAIRE'),
4939
            ('STE-CROIX', 'STE-KROIX'),
4940
            ('LAVALLEE', 'LAVALE'),
4941
            ('CORINNE', 'KORINE'),
4942
            ('DUTILE', 'DUTILLE')
4943
        )
4944
        for name, encoding in test_cases:
4945
            self.assertEqual(fonem(name), encoding)
4946
4947
4948
class ParmarKumbharanaTestCases(unittest.TestCase):
4949
    """Test Parmar-Kumbharana functions.
4950
4951
    test cases for abydos.phonetic.parmar_kumbharana
4952
    """
4953
4954
    def test_parmar_kumbharana(self):
4955
        """Test abydos.phonetic.parmar_kumbharana."""
4956
        # Base cases
4957
        self.assertEqual(fonem(''), '')
4958
4959
        # Test cases from Parmar & Kumbharana (2014)
4960
        test_cases = (
4961
            ('Week', 'WK'),
4962
            ('Weak', 'WK'),
4963
            ('Piece', 'PS'),
4964
            ('Peace', 'PS'),
4965
            ('Bed', 'BD'),
4966
            ('Bad', 'BD'),
4967
            ('Would', 'WD'),
4968
            ('Wood', 'WD'),
4969
            ('Sun', 'SN'),
4970
            ('Son', 'SN'),
4971
            ('Ship', 'SP'),
4972
            ('Sheep', 'SP'),
4973
            ('Later', 'LTR'),
4974
            ('Letter', 'LTR'),
4975
            ('Low', 'LW'),
4976
            ('Law', 'LW'),
4977
            ('She', 'S'),
4978
            ('See', 'S'),
4979
            ('Sea', 'S'),
4980
            ('Case', 'CS'),
4981
            ('Cash', 'CS'),
4982
            ('Of', 'OF'),
4983
            ('Off', 'OF'),
4984
            ('Live', 'LV'),
4985
            ('Leave', 'LV'),
4986
            ('Sign', 'SN'),
4987
            ('Sine', 'SN'),
4988
            ('Sin', 'SN'),
4989
            ('Seen', 'SN'),
4990
            ('By', 'B'),
4991
            ('Bye', 'B'),
4992
            ('Reach', 'RCH'),
4993
            ('Rich', 'RCH'),
4994
            ('Sort', 'SRT'),
4995
            ('Short', 'SRT'),
4996
            ('Center', 'SNTR'),
4997
            ('Centre', 'SNTR'),
4998
            ('Full', 'FL'),
4999
            ('Fool', 'FL'),
5000
            ('Then', 'THN'),
5001
            ('Than', 'THN'),
5002
            ('Fill', 'FL'),
5003
            ('Feel', 'FL'),
5004
            ('Two', 'TW'),
5005
            ('To', 'T'),
5006
            ('Too', 'T'),
5007
            ('Four', 'FR'),
5008
            ('For', 'FR'),
5009
            ('Mat', 'MT'),
5010
            ('Met', 'MT'),
5011
            ('Merry', 'MR'),
5012
            ('Marry', 'MR')
5013
        )
5014
        for word, encoding in test_cases:
5015
            self.assertEqual(parmar_kumbharana(word), encoding)
5016
5017
5018
class DavidsonTestCases(unittest.TestCase):
5019
    """Test class Davidson functions.
5020
5021
    test cases for abydos.phonetic.davidson
5022
    """
5023
5024
    def test_davidson(self):
5025
        """Test abydos.phonetic.davidson."""
5026
        # Base cases
5027
        self.assertEqual(davidson('', omit_fname=True), '    ')
5028
        self.assertEqual(davidson(''), '    .')
5029
5030
        # Test cases from Gadd (1988) "'Fisching fore werds': phonetic
5031
        # retrieval of written text in information systems." Program,
5032
        # 22(3). 222--237.
5033
        # doi:10.1108/eb046999
5034
        test_cases = (
5035
            ('WAIT', 'WT  '),
5036
            ('WEIGHT', 'WGT '),
5037
            ('KNIGHT', 'KNGT'),
5038
            ('NIGHT', 'NGT '),
5039
            ('NITE', 'NT  '),
5040
            ('GNOME', 'GNM '),
5041
            ('NOAM', 'NM  '),
5042
            ('SMIDT', 'SMDT'),
5043
            ('SMIT', 'SMT '),
5044
            ('SMITH', 'SMT '),
5045
            ('SCHMIT', 'SCMT'),
5046
            ('CRAFT', 'CRFT'),
5047
            ('KRAFT', 'KRFT'),
5048
            ('REES', 'RS  '),
5049
            ('REECE', 'RC  '),
5050
        )
5051
        for word, encoding in test_cases:
5052
            self.assertEqual(davidson(word, omit_fname=True), encoding)
5053
5054
5055
class SoundDTestCases(unittest.TestCase):
5056
    """Test class SoundD functions.
5057
5058
    test cases for abydos.phonetic.sound_d
5059
    """
5060
5061
    def test_sound_d(self):
5062
        """Test abydos.phonetic.sound_d."""
5063
        # Base cases
5064
        self.assertEqual(sound_d(''), '0000')
5065
        self.assertEqual(sound_d('', maxlength=6), '000000')
5066
5067
        self.assertEqual(sound_d('knight'), '5300')
5068
        self.assertEqual(sound_d('accept'), '2130')
5069
        self.assertEqual(sound_d('pneuma'), '5500')
5070
        self.assertEqual(sound_d('ax'), '2000')
5071
        self.assertEqual(sound_d('wherever'), '6160')
5072
        self.assertEqual(sound_d('pox'), '1200')
5073
        self.assertEqual(sound_d('anywhere'), '5600')
5074
        self.assertEqual(sound_d('adenosine'), '3525')
5075
        self.assertEqual(sound_d('judge'), '2200')
5076
        self.assertEqual(sound_d('rough'), '6000')
5077
        self.assertEqual(sound_d('x-ray'), '2600')
5078
        self.assertEqual(sound_d('acetylcholine', maxlength=None), '234245')
5079
        self.assertEqual(sound_d('rough', maxlength=None), '6')
5080
5081
5082
class PSHPSoundexTestCases(unittest.TestCase):
5083
    """Test PSHP Soundex functions.
5084
5085
    test cases for abydos.phonetic.pshp_soundex_last & pshp_soundex_first
5086
    """
5087
5088
    def test_pshp_soundex_last(self):
5089
        """Test abydos.phonetic.pshp_soundex_last."""
5090
        # Base case
5091
        self.assertEqual(pshp_soundex_last(''), '0000')
5092
5093
        self.assertEqual(pshp_soundex_last('JAMES'), 'J500')
5094
        self.assertEqual(pshp_soundex_last('JOHN'), 'J500')
5095
        self.assertEqual(pshp_soundex_last('PAT'), 'P300')
5096
        self.assertEqual(pshp_soundex_last('PETER'), 'P350')
5097
5098
        self.assertEqual(pshp_soundex_last('Smith'), 'S530')
5099
        self.assertEqual(pshp_soundex_last('van Damme'), 'D500')
5100
        self.assertEqual(pshp_soundex_last('MacNeil'), 'M400')
5101
        self.assertEqual(pshp_soundex_last('McNeil'), 'M400')
5102
        self.assertEqual(pshp_soundex_last('Edwards'), 'A353')
5103
        self.assertEqual(pshp_soundex_last('Gin'), 'J500')
5104
        self.assertEqual(pshp_soundex_last('Cillian'), 'S450')
5105
        self.assertEqual(pshp_soundex_last('Christopher'), 'K523')
5106
        self.assertEqual(pshp_soundex_last('Carme'), 'K500')
5107
        self.assertEqual(pshp_soundex_last('Knight'), 'N230')
5108
        self.assertEqual(pshp_soundex_last('Phillip'), 'F410')
5109
        self.assertEqual(pshp_soundex_last('Wein'), 'V500')
5110
        self.assertEqual(pshp_soundex_last('Wagner', german=True), 'V255')
5111
        self.assertEqual(pshp_soundex_last('Pence'), 'P500')
5112
        self.assertEqual(pshp_soundex_last('Less'), 'L000')
5113
        self.assertEqual(pshp_soundex_last('Simpson'), 'S525')
5114
        self.assertEqual(pshp_soundex_last('Samson'), 'S250')
5115
        self.assertEqual(pshp_soundex_last('Lang'), 'L500')
5116
        self.assertEqual(pshp_soundex_last('Hagan'), 'H500')
5117
        self.assertEqual(pshp_soundex_last('Cartes', german=True), 'K500')
5118
        self.assertEqual(pshp_soundex_last('Kats', german=True), 'K000')
5119
        self.assertEqual(pshp_soundex_last('Schultze', german=True), 'S400')
5120
        self.assertEqual(pshp_soundex_last('Alze', german=True), 'A400')
5121
        self.assertEqual(pshp_soundex_last('Galz', german=True), 'G400')
5122
        self.assertEqual(pshp_soundex_last('Alte', german=True), 'A400')
5123
        self.assertEqual(pshp_soundex_last('Alte', maxlength=None), 'A43')
5124
        self.assertEqual(pshp_soundex_last('Altemaier', maxlength=None),
5125
                         'A4355')
5126
5127
    def test_pshp_soundex_first(self):
5128
        """Test abydos.phonetic.pshp_soundex_first."""
5129
        # Base case
5130
        self.assertEqual(pshp_soundex_first(''), '0000')
5131
5132
        # Examples given in defining paper (Hershberg, et al. 1976)
5133
        self.assertEqual(pshp_soundex_first('JAMES'), 'J700')
5134
        self.assertEqual(pshp_soundex_first('JOHN'), 'J500')
5135
        self.assertEqual(pshp_soundex_first('PAT'), 'P700')
5136
        self.assertEqual(pshp_soundex_first('PETER'), 'P300')
5137
5138
        # Additions for coverage
5139
        self.assertEqual(pshp_soundex_first('Giles'), 'J400')
5140
        self.assertEqual(pshp_soundex_first('Cy'), 'S000')
5141
        self.assertEqual(pshp_soundex_first('Chris'), 'K500')
5142
        self.assertEqual(pshp_soundex_first('Caleb'), 'K400')
5143
        self.assertEqual(pshp_soundex_first('Knabe'), 'N100')
5144
        self.assertEqual(pshp_soundex_first('Phil'), 'F400')
5145
        self.assertEqual(pshp_soundex_first('Wieland'), 'V400')
5146
        self.assertEqual(pshp_soundex_first('Wayne', german=True), 'V500')
5147
        self.assertEqual(pshp_soundex_first('Christopher', maxlength=None),
5148
                         'K5')
5149
        self.assertEqual(pshp_soundex_first('Asdaananndsjsjasd',
5150
                                            maxlength=None), 'A23553223')
5151
        self.assertEqual(pshp_soundex_first('Asdaananndsjsjasd'), 'A235')
5152
5153
5154
class HenryCodeTestCases(unittest.TestCase):
5155
    """Test Henry Code functions.
5156
5157
    test cases for abydos.phonetic.henry_early
5158
    """
5159
5160
    def test_henry_early(self):
5161
        """Test abydos.phonetic.henry_early."""
5162
        # Base case
5163
        self.assertEqual(henry_early(''), '')
5164
5165
        # Examples from Legare 1972 paper
5166
        self.assertEqual(henry_early('Descarry'), 'DKR')
5167
        self.assertEqual(henry_early('Descaries'), 'DKR')
5168
        self.assertEqual(henry_early('Campo'), 'KP')
5169
        self.assertEqual(henry_early('Campot'), 'KP')
5170
        self.assertEqual(henry_early('Gausselin'), 'GSL')
5171
        self.assertEqual(henry_early('Gosselin'), 'GSL')
5172
        self.assertEqual(henry_early('Bergeron'), 'BRJ')
5173
        self.assertEqual(henry_early('Bergereau'), 'BRJ')
5174
        self.assertEqual(henry_early('Bosseron'), 'BSR')
5175
        self.assertEqual(henry_early('Cicire'), 'SSR')
5176
        self.assertEqual(henry_early('Lechevalier'), 'LCV')
5177
        self.assertEqual(henry_early('Chevalier'), 'CVL')
5178
        self.assertEqual(henry_early('Peloy'), 'PL')
5179
        self.assertEqual(henry_early('Beloy'), 'BL')
5180
        self.assertEqual(henry_early('Beret'), 'BR')
5181
        self.assertEqual(henry_early('Benet'), 'BN')
5182
        self.assertEqual(henry_early('Turcot'), 'TRK')
5183
        self.assertEqual(henry_early('Turgot'), 'TRG')
5184
        self.assertEqual(henry_early('Vigier'), 'VJ')
5185
        self.assertEqual(henry_early('Vigiere'), 'VJR')
5186
        self.assertEqual(henry_early('Dodin'), 'DD')
5187
        self.assertEqual(henry_early('Dodelin'), 'DDL')
5188
5189
        # Tests to complete coverage
5190
        self.assertEqual(henry_early('Anil'), 'ANL')
5191
        self.assertEqual(henry_early('Emmanuel'), 'AMN')
5192
        self.assertEqual(henry_early('Ainu'), 'EN')
5193
        self.assertEqual(henry_early('Oeuf'), 'OF')
5194
        self.assertEqual(henry_early('Yves'), 'IV')
5195
        self.assertEqual(henry_early('Yo'), 'I')
5196
        self.assertEqual(henry_early('Umman'), 'EM')
5197
        self.assertEqual(henry_early('Omman'), 'OM')
5198
        self.assertEqual(henry_early('Zoe'), 'S')
5199
        self.assertEqual(henry_early('Beauchamp'), 'BCP')
5200
        self.assertEqual(henry_early('Chloe'), 'KL')
5201
        self.assertEqual(henry_early('Gerard'), 'JRR')
5202
        self.assertEqual(henry_early('Agnes'), 'ANN')
5203
        self.assertEqual(henry_early('Pinot'), 'PN')
5204
        self.assertEqual(henry_early('Philo'), 'FL')
5205
        self.assertEqual(henry_early('Quisling'), 'GL')
5206
        self.assertEqual(henry_early('Qualite'), 'KLT')
5207
        self.assertEqual(henry_early('Sainte-Marie'), 'XMR')
5208
        self.assertEqual(henry_early('Saint-Jean'), 'XJ')
5209
        self.assertEqual(henry_early('Ste-Marie'), 'XMR')
5210
        self.assertEqual(henry_early('St-Jean'), 'XJ')
5211
        self.assertEqual(henry_early('Cloe'), 'KL')
5212
        self.assertEqual(henry_early('Ahch-To'), 'AKT')
5213
        self.assertEqual(henry_early('Zdavros'), 'SDV')
5214
        self.assertEqual(henry_early('Sdavros'), 'DVR')
5215
        self.assertEqual(henry_early('Coulomb'), 'KLB')
5216
        self.assertEqual(henry_early('Calm'), 'K')
5217
        self.assertEqual(henry_early('Omnia'), 'ON')
5218
        self.assertEqual(henry_early('Ramps'), 'RPS')
5219
        self.assertEqual(henry_early('Renault'), 'RN')
5220
        self.assertEqual(henry_early('Czech'), 'CSK')
5221
        self.assertEqual(henry_early('Imran'), 'ER')
5222
        self.assertEqual(henry_early('Christopher', maxlength=None), 'KRXF')
5223
5224
5225
class NorphoneTestCases(unittest.TestCase):
5226
    """Test Norphone functions.
5227
5228
    test cases for abydos.phonetic.norphone
5229
    """
5230
5231
    def test_norphone(self):
5232
        """Test abydos.phonetic.norphone."""
5233
        # Base case
5234
        self.assertEqual(norphone(''), '')
5235
5236
        # Examples given at
5237
        # https://github.com/larsga/Duke/blob/master/duke-core/src/test/java/no/priv/garshol/duke/comparators/NorphoneComparatorTest.java
5238
        self.assertEqual(norphone('Aarestad'), norphone('\u00C5rrestad'))
5239
        self.assertEqual(norphone('Andreasen'), norphone('Andreassen'))
5240
        self.assertEqual(norphone('Arntsen'), norphone('Arntzen'))
5241
        self.assertEqual(norphone('Bache'), norphone('Bakke'))
5242
        self.assertEqual(norphone('Frank'), norphone('Franck'))
5243
        self.assertEqual(norphone('Christian'), norphone('Kristian'))
5244
        self.assertEqual(norphone('Kielland'), norphone('Kjelland'))
5245
        self.assertEqual(norphone('Krogh'), norphone('Krog'))
5246
        self.assertEqual(norphone('Krog'), norphone('Krohg'))
5247
        self.assertEqual(norphone('Jendal'), norphone('Jendahl'))
5248
        self.assertEqual(norphone('Jendal'), norphone('Hjendal'))
5249
        self.assertEqual(norphone('Jendal'), norphone('Gjendal'))
5250
        self.assertEqual(norphone('Vold'), norphone('Wold'))
5251
        self.assertEqual(norphone('Thomas'), norphone('Tomas'))
5252
        self.assertEqual(norphone('Aamodt'), norphone('Aamot'))
5253
        self.assertEqual(norphone('Aksel'), norphone('Axel'))
5254
        self.assertEqual(norphone('Kristoffersen'), norphone('Christophersen'))
5255
        self.assertEqual(norphone('Voll'), norphone('Vold'))
5256
        self.assertEqual(norphone('Granli'), norphone('Granlid'))
5257
        self.assertEqual(norphone('Gjever'), norphone('Giever'))
5258
        self.assertEqual(norphone('Sannerhaugen'), norphone('Sanderhaugen'))
5259
        self.assertEqual(norphone('Jahren'), norphone('Jaren'))
5260
        self.assertEqual(norphone('Amundsrud'), norphone('Amundsr\u00F8d'))
5261
        self.assertEqual(norphone('Karlson'), norphone('Carlson'))
5262
5263
        # Additional tests to increase coverage
5264
        self.assertEqual(norphone('Århus'), 'ÅRHS')
5265
        self.assertEqual(norphone('Skyrim'), 'XRM')
5266
        self.assertEqual(norphone('kyss'), 'XS')
5267
        self.assertEqual(norphone('Äthelwulf'), 'ÆTLVLF')
5268
        self.assertEqual(norphone('eit'), 'ÆT')
5269
        self.assertEqual(norphone('Öl'), 'ØL')
5270
5271
        # test cases by larsga (the algorithm's author) posted to Reddit
5272
        # https://www.reddit.com/r/norge/comments/vksb5/norphone_mitt_forslag_til_en_norsk_soundex_vel/
5273
        # modified, where necessary to match the "not implemented" rules
5274
        # and rule added after the Reddit post
5275
        reddit_tests = (('MKLSN', ('MICHALSEN', 'MIKKELSEN', 'MIKALSEN',
5276
                                   'MICHAELSEN', 'MIKAELSEN', 'MICKAELSEN',
5277
                                   'MICHELSEN', 'MIKELSEN')),
5278
                        ('BRKR', ('BERGER', 'BORGERUD', 'BURGER', 'BORGER',
5279
                                  'BORGAR', 'BIRGER', 'BRAGER', 'BERGERUD')),
5280
                        ('TMS', ('TOMMAS', 'THOMAS', 'THAMS', 'TOUMAS',
5281
                                 'THOMMAS', 'TIMMS', 'TOMAS', 'TUOMAS')),
5282
                        ('HLR', ('HOLER', 'HELLERUD', 'HALLRE', 'HOLLERUD',
5283
                                 'HILLER', 'HALLERUD', 'HOLLER', 'HALLER')),
5284
                        ('MS', ('MASS', 'MMS', 'MSS', 'MOES', 'MEZZO', 'MESA',
5285
                                'MESSE', 'MOSS')),
5286
                        ('HRST', ('HIRSTI', 'HAARSETH', 'HAARSTAD', 'HARSTAD',
5287
                                  'HARESTUA', 'HERSETH', 'HERSTAD',
5288
                                  'HERSTUA')),
5289
                        ('SVN', ('SWANN', 'SVENI', 'SWAN', 'SVEN', 'SVEIN',
5290
                                 'SVEEN', 'SVENN', 'SVANE')),
5291
                        ('SLT', ('SELTE', 'SALT', 'SALTE', 'SLOTT', 'SLAATTO',
5292
                                 'SLETT', 'SLETTA', 'SLETTE')),
5293
                        ('JNSN', ('JANSSEN', 'JANSEN', 'JENSEN', 'JONASSEN',
5294
                                  'JANSON', 'JONSON', 'JENSSEN', 'JONSSON')),
5295
                        ('ANRSN', ('ANDRESSEN', 'ANDERSSON', 'ANDRESEN',
5296
                                   'ANDREASSEN', 'ANDERSEN', 'ANDERSON',
5297
                                   'ANDORSEN', 'ANDERSSEN')),
5298
                        ('BRK', ('BREKKE', 'BORCH', 'BRAKKE', 'BORK', 'BRECKE',
5299
                                 'BROCH', 'BRICK', 'BRUK')),
5300
                        ('LN', ('LINDE', 'LENDE', 'LUND', 'LAND', 'LINDA',
5301
                                'LANDE', 'LIND', 'LUNDE')),
5302
                        ('SF', ('SOPHIE', 'SFE', 'SEFF', 'SEAFOOD', 'SOFIE',
5303
                                'SAFE', 'SOFI', 'SOPHIA')),
5304
                        ('BRST', ('BRUASET', 'BUERSTAD', 'BARSTAD', 'BAARSTAD',
5305
                                  'BRUSETH', 'BERSTAD', 'BORSTAD', 'BRUSTAD')),
5306
                        ('OLSN', ('OHLSSON', 'OLESEN', 'OLSSON', 'OLAUSSON',
5307
                                  'OLAUSEN', 'OLAUSSEN', 'OLSEN', 'OLSON')),
5308
                        ('MKL', ('MIKAEL', 'MICHELA', 'MEIKLE', 'MIKAL',
5309
                                 'MIKKEL', 'MICHEL', 'MICHAL', 'MICHAEL')),
5310
                        ('HR', ('HEIER', 'HAR', 'HEER', 'HARRY', 'HEIR',
5311
                                'HURRE', 'HERO', 'HUURRE')),
5312
                        ('VLM', ('VILLUM', 'WOLLUM', 'WILLIAM', 'WILLAM',
5313
                                 'WALLEM', 'WILLUM', 'VALUM', 'WILMO')),
5314
                        ('SNS', ('SYNNES', 'SINUS', 'SNUS', 'SNEIS', 'SANNES',
5315
                                 'SUNAAS', 'SUNNAAS', 'SAINES')),
5316
                        ('SNL', ('SANDAL', 'SANDAHL', 'SUNDEL', 'SANDLI',
5317
                                 'SUNNDAL', 'SANDELL', 'SANDLIE', 'SUNDAL')),
5318
                        ('VK', ('VEKA', 'VIKA', 'WIIK', 'WOK', 'WIKE', 'WEEK',
5319
                                'VIK', 'VIAK')),
5320
                        ('MTS', ('METSO', 'MOTHES', 'MATHIAS', 'MATHIS',
5321
                                 'MATTIS', 'MYTHES', 'METOS', 'MATS')))
5322
        for encoded, names in reddit_tests:
5323
            for name in names:
5324
                self.assertEqual(encoded, norphone(name))
5325
5326
5327
class DolbyTestCases(unittest.TestCase):
5328
    """Test Dolby functions.
5329
5330
    test cases for abydos.phonetic.dolby
5331
    """
5332
5333
    def test_dolby(self):
5334
        """Test abydos.phonetic.dolby."""
5335
        # Base case
5336
        self.assertEqual(dolby(''), '')
5337
5338
        # Tests from Dolby (1970) pp. 264--274
5339
        # https://ejournals.bc.edu/ojs/index.php/ital/article/download/5259/4734
5340
        # Checked against Cunningham, et al. (1969) pp. 127--136, as needed.
5341
        # https://files.eric.ed.gov/fulltext/ED029679.pdf
5342
        test_cases = (('*BL', 'Abel', 'Abele', 'Abell', 'Able'),
5343
                      ('*BRMS', 'Abrahams', 'Abrams'),
5344
                      ('*BRMSN', 'Abrahamson', 'Abramson'),
5345
                      ('*D', 'Eddy', 'Eddie'),
5346
                      ('*DMNS', 'Edmonds', 'Edmunds'),
5347
                      ('*DMNSN', 'Edmondson', 'Edmundson'),
5348
                      ('*DMS', 'Adams', 'Addems'),
5349
                      ('*GN', 'Eagen', 'Egan', 'Eggen'),
5350
                      ('*GR', '!Jaeger', 'Yaeger', 'Yeager'),
5351
                      ('*KN', 'Aiken', 'Aikin', 'Aitken'),
5352
                      ('*KNS', 'Adkins', 'Akins'),
5353
                      ('*KR', 'Acker', 'Aker'),
5354
                      ('*KR', 'Eckard', 'Eckardt', 'Eckart', 'Eckert',
5355
                       'Eckhardt'),
5356
                      ('*KS', 'Oakes', 'Oaks', 'Ochs'),
5357
                      ('*LBRD', 'Albright', 'Allbright'),
5358
                      ('*LD', 'Elliot', 'Elliott'),
5359
                      ('*LN', 'Allan', 'Allen', 'Allyn'),
5360
                      ('*LSN', 'Ohlsen', 'Olesen', 'Olsen', 'Olson', 'Olsson'),
5361
                      ('*LVR', 'Oliveira', 'Olivera', 'Olivero'),
5362
                      ('*MS', 'Ames', 'Eames'),
5363
                      ('*NGL', 'Engel', 'Engle', 'Ingle'),
5364
                      ('*NL', 'O\'Neal', 'O\'Neil', 'O\'Neill'),
5365
                      ('*NRS', 'Andrews', 'Andrus'),
5366
                      ('*NRSN', 'Andersen', 'Anderson', 'Andreasen'),
5367
                      ('*NS', 'Ennis', 'Enos'),
5368
                      # Corrected: 'Enrichsen' below was an error
5369
                      # (It's correct in Cunningham, et al. 1969.)
5370
                      ('*RKSN', 'Erichsen', 'Erickson', 'Ericson', 'Ericsson',
5371
                       'Eriksen'),
5372
                      ('*RL', 'Earley', 'Early'),
5373
                      ('*RN', 'Erwin', 'Irwin'),
5374
                      ('*RNS', 'Aarons', 'Ahrends', 'Ahrens', 'Arens',
5375
                       'Arentz', 'Arons'),
5376
                      ('*RS', 'Ayers', 'Ayres'),
5377
                      ('*RVN', 'Ervin', 'Ervine', 'Irvin', 'Irvine'),
5378
                      ('*RVNG', 'Erving', 'Irving'),
5379
                      ('*SBRN', 'Osborn', 'Osborne', 'Osbourne', 'Osburn'),
5380
                      ('B*D', 'Beatie', 'Beattie', 'Beatty', 'Beaty',
5381
                       'Beedie'),
5382
                      ('B*DS', 'Betts', 'Betz'),
5383
                      ('B*KMN', 'Bachman', 'Bachmann', 'Backman'),
5384
                      ('B*L', 'Bailey', 'Baillie', 'Bailly', 'Baily',
5385
                       'Bayley'),
5386
                      ('B*L', 'Beal', 'Beale', 'Beall', 'Biehl'),
5387
                      ('B*L', 'Belew', 'Ballou', 'Bellew'),
5388
                      ('B*L', 'Buhl', 'Buell'),
5389
                      ('B*L', 'Belle', 'Bell'),
5390
                      # Corrected: No reason for D to disappear
5391
                      ('B*LDN', 'Bolton', 'Boulton'),
5392
                      ('B*M', 'Baum', 'Bohm', 'Bohme'),
5393
                      ('B*MN', 'Bauman', 'Bowman'),
5394
                      ('B*N', 'Bain', 'Bane', 'Bayne'),
5395
                      ('B*ND', 'Bennet', 'Bennett'),
5396
                      ('B*R', 'Baer', 'Bahr', 'Baier', 'Bair', 'Bare', 'Bear',
5397
                       'Beare', 'Behr', 'Beier', 'Bier', '!Bryer'),
5398
                      ('B*R', 'Barry', 'Beare', 'Beery', 'Berry'),
5399
                      ('B*R', 'Bauer', 'Baur', 'Bower'),
5400
                      ('B*R', 'Bird', 'Burd', 'Byrd'),
5401
                      ('B*RBR', 'Barbour', 'Barber'),
5402
                      ('B*RG', 'Berg', 'Bergh', 'Burge'),
5403
                      ('B*RGR', 'Berger', 'Burger'),
5404
                      ('B*RK', 'Boerke', 'Birk', 'Bourke', 'Burk', 'Burke'),
5405
                      ('B*RN', 'Burn', 'Byrne'),
5406
                      ('B*RNR', 'Bernard', 'Bernhard', 'Bernhardt',
5407
                       'Bernhart'),
5408
                      ('B*RNS', 'Berns', 'Birns', 'Burns', 'Byrns', 'Byrnes'),
5409
                      ('B*RNSN', 'Bernstein', 'Bornstein'),
5410
                      # Corrected: 'RCH' -> 'RH' in rule 2
5411
                      ('B*RS', 'Bertsch', '!Birch', '!Burch'),
5412
                      ('BL*KBRN', 'Blackburn', '!Blagburn'),
5413
                      ('BL*M', 'Blom', 'Bloom', 'Bluhm', 'Blum', 'Blume'),
5414
                      ('BR*D', 'Brode', 'Brodie', 'Brody'),
5415
                      ('BR*N', 'Braun', 'Brown', 'Browne'),
5416
                      ('BR*N', 'Brand', 'Brandt', 'Brant'),
5417
                      # Corrected: 'Diezt' -> 'D*SD', so reversed zt -> tz
5418
                      # (Correct in Cunningham, et al. 1969.)
5419
                      ('D*DS', 'Dietz', 'Ditz'),
5420
                      ('D*F', 'Duffie', 'Duffy'),
5421
                      ('D*GN', 'Dougan', 'Dugan', 'Duggan'),
5422
                      ('D*K', 'Dickey', 'Dicke'),
5423
                      ('D*KNSN', 'Dickenson', '!Dickerson', 'Dickinson',
5424
                       '!Dickison'),
5425
                      ('D*KSN', 'Dickson', 'Dixon', 'Dixson'),
5426
                      ('D*L', 'Dailey', 'Daily', 'Daley', 'Daly'),
5427
                      ('D*L', 'Dahl', 'Dahle', 'Dall', 'Doll'),
5428
                      ('D*L', 'Deahl', 'Deal', 'Diehl'),
5429
                      ('D*MN', 'Diamond', 'Dimond', 'Dymond'),
5430
                      ('D*N', 'Dean', 'Deane', 'Deen'),
5431
                      ('D*N', 'Denney', 'Denny'),
5432
                      ('D*N', 'Donahoo', 'Donahue', 'Donoho', 'Donohoe',
5433
                       'Donohoo,'),
5434
                      ('D*N', 'Donohue', 'Dunnahoo'),
5435
                      ('D*N', 'Downey', 'Downie'),
5436
                      ('D*N', 'Dunn', 'Dunne'),
5437
                      ('D*NL', 'Donley', 'Donnelley', 'Donnelly'),
5438
                      ('D*R', 'Daugherty', 'Doherty', 'Dougherty'),
5439
                      ('D*R', 'Dyar', 'Dyer'),
5440
                      ('D*RM', 'Derham', 'Durham'),
5441
                      ('D*VDSN', 'Davidsen', 'Davidson', '!Davison'),
5442
                      ('D*VS', 'Davies', 'Davis'),
5443
                      ('DR*SL', 'Driscoll', 'Driskell'),
5444
                      ('F*', 'Fay', 'Fahay', 'Fahey'),
5445
                      ('F*FR', 'Fifer', 'Pfeffer', 'Pfeiffer'),
5446
                      ('F*GN', 'Fagan', 'Feigan', 'Fegan'),
5447
                      ('F*L', 'Feil', 'Pfeil'),
5448
                      # Corrected: T -> D after LD -> D
5449
                      ('F*L', 'Feld', 'Feldt', '!Felt'),
5450
                      ('F*LKNR', 'Faulkner', 'Falconer'),
5451
                      ('F*LPS', 'Philips', 'Phillips'),
5452
                      ('F*NGN', 'Finnegan', 'Finnigan'),
5453
                      ('F*NL', 'Finlay', 'Finley'),
5454
                      ('F*RL', 'Farrell', 'Ferrell'),
5455
                      ('F*RR', 'Ferrara', 'Ferreira', 'Ferriera'),
5456
                      # Corrected: No reason for S to be eliminated
5457
                      ('F*RSR', 'Foerster', 'Forester', 'Forrester',
5458
                       'Forster'),
5459
                      ('F*RS', 'Forrest', 'Forest'),
5460
                      ('F*RS', 'Faris', 'Farriss', 'Ferris', 'Ferriss'),
5461
                      ('F*RS', 'First', 'Fuerst', 'Furst'),
5462
                      ('F*SR', 'Fischer', 'Fisher'),
5463
                      ('FL*N', 'Flinn', 'Flynn'),
5464
                      ('FL*NGN', 'Flanagan', 'Flanigan', 'Flannigan'),
5465
                      ('FR*', 'Frei', 'Frey', 'Fry', 'Frye'),
5466
                      ('FR*DMN', 'Freedman', 'Friedman'),
5467
                      # Corrected: Fredickson -> Fredrickson
5468
                      # (Correct in Cunningham, et al. 1969.)
5469
                      ('FR*DRKSN', 'Frederickson', 'Frederiksen',
5470
                       'Fredrickson', 'Fredriksson'),
5471
                      # Corrected: NK would not reduce to K because of rule 4
5472
                      ('FR*NK', 'Franck', 'Frank'),
5473
                      ('FR*NS', 'France', 'Frantz', 'Franz'),
5474
                      # Corrected: vowel deletion happens after double
5475
                      # consonant deletion
5476
                      ('FR*NSS', 'Frances', 'Francis'),
5477
                      ('FR*S', 'Freeze', 'Freese', 'Fries'),
5478
                      ('FR*SR', 'Fraser', 'Frasier', 'Frazer', 'Frazier'),
5479
                      ('G*D', 'Good', 'Goode'),
5480
                      ('G*DS', 'Getz', 'Goetz', 'Goetze'),
5481
                      ('G*F', 'Goff', 'Gough'),
5482
                      ('G*L', 'Gold', 'Goold', 'Gould'),
5483
                      ('G*LMR', 'Gilmer', 'Gilmore', 'Gilmour'),
5484
                      ('G*LR', 'Gallagher', 'Gallaher', 'Galleher'),
5485
                      ('G*MS', 'Gomes', 'Gomez'),
5486
                      ('G*NR', 'Guenther', 'Gunther'),
5487
                      ('G*NSLS', 'Gonzales', 'Gonzalez'),
5488
                      # Corrected: 'Consalves' for the first case likely a typo
5489
                      # (Correct in Cunningham, et al. 1969.)
5490
                      ('G*NSLVS', 'Gonsalves', 'Gonzalves'),
5491
                      ('G*RD', 'Garratt', 'Garrett'),
5492
                      ('G*RD', 'Garrity', 'Geraghty', 'Geraty', 'Gerrity'),
5493
                      ('G*RN', 'Gorden', 'Gordohn', 'Gordon'),
5494
                      ('G*RNR', 'Gardiner', 'Gardner', 'Gartner'),
5495
                      ('G*RR', 'Garrard', 'Gerard', 'Gerrard', 'Girard'),
5496
                      ('G*S', 'Gauss', 'Goss'),
5497
                      ('GR*', 'Gray', 'Grey'),
5498
                      ('GR*FD', 'Griffeth', 'Griffith'),
5499
                      ('GR*N', 'Green', 'Greene'),
5500
                      ('GR*S', 'Gros', 'Grose', 'Gross'),
5501
                      ('H*D', 'Hyde', 'Heidt'),
5502
                      ('H*F', 'Hoff', 'Hough', 'Huff'),
5503
                      ('H*FMN', 'Hoffman', 'Hoffmann', 'Hofman', 'Hofmann',
5504
                       'Huffman'),
5505
                      ('H*G', 'Hoag', 'Hoge', 'Hogue'),
5506
                      ('H*GN', 'Hagan', 'Hagen'),
5507
                      ('H*K', 'Hauch', 'Hauck', 'Hauk', 'Hauke'),
5508
                      ('H*KSN', 'Hutcheson', 'Hutchison'),
5509
                      ('H*L', 'Holley', 'Holly'),
5510
                      ('H*L', 'Holl', 'Hall'),
5511
                      ('H*L', 'Halley', 'Haley'),
5512
                      ('H*L', 'Haile', 'Hale'),
5513
                      ('H*LD', 'Holiday', 'Halliday', 'Holladay', 'Holliday'),
5514
                      ('H*LG', 'Helwig', 'Hellwig'),
5515
                      ('H*LM', 'Holm', '!Home'),
5516
                      ('H*LMS', 'Holmes', '!Homes'),
5517
                      ('H*LN', 'Highland', 'Hyland'),
5518
                      ('H*M', 'Ham', 'Hamm'),
5519
                      ('H*MR', 'Hammar', 'Hammer'),
5520
                      ('H*N', 'Hanna', 'Hannah'),
5521
                      ('H*N', 'Hahn', 'Hahne', 'Hann', 'Haun'),
5522
                      ('H*NN', 'Hanan', 'Hannan', 'Hannon'),
5523
                      ('H*NRKS', 'Hendricks', 'Hendrix', 'Henriques'),
5524
                      ('H*NRKSN', 'Hendrickson', 'Henriksen', 'Henrikson'),
5525
                      ('H*NS', 'Heintz', 'Heinz', 'Heinze', 'Hindes', 'Hinds',
5526
                       'Hines', 'Hinze'),
5527
                      ('H*NS', 'Haines', 'Haynes'),
5528
                      ('H*NSN', 'Henson', 'Hansen', 'Hanson', 'Hanssen',
5529
                       'Hansson', 'Hanszen'),
5530
                      ('H*R', 'Herd', 'Heard', 'Hird', 'Hurd'),
5531
                      ('H*R', 'Hart', 'Hardt', 'Harte', 'Heart'),
5532
                      ('H*R', 'Hare', 'Hair'),
5533
                      ('H*R', 'Hardey', 'Hardie', 'Hardy'),
5534
                      ('H*RMN', 'Hartman', 'Hardmen', 'Hardman', 'Hartmann'),
5535
                      ('H*RMN', 'Herman', 'Hermann', 'Herrmann'),
5536
                      ('H*RMN', 'Harman', 'Harmon'),
5537
                      ('H*RN', 'Heron', 'Herrin', 'Herron'),
5538
                      ('H*RN', 'Hardin', 'Harden'),
5539
                      ('H*RN', 'Horn', 'Horne'),
5540
                      ('H*RNGDN', 'Herrington', 'Harrington'),
5541
                      ('H*S', 'Haas', 'Haase', 'Hasse'),
5542
                      ('H*S', 'Howes', 'House', 'Howse'),
5543
                      ('H*S', 'Hays', 'Hayes'),
5544
                      ('H*SN', 'Houston', 'Huston'),
5545
                      ('H*VR', 'Hoover', 'Hover'),
5546
                      ('J*', 'Jew', 'Jue'),
5547
                      ('J*FR', 'Jeffery', 'Jeffrey'),
5548
                      ('J*FRS', 'Jefferies', 'Jefferis', 'Jefferys',
5549
                       'Jeffreys'),
5550
                      ('J*KB', 'Jacobi', 'Jacoby'),
5551
                      ('J*KBSN', 'Jacobsen', 'Jacobson', 'Jackobsen'),
5552
                      ('J*KS', 'Jacques', 'Jacks', 'Jaques'),
5553
                      ('J*L', 'Jewell', 'Juhl'),
5554
                      ('J*MS', 'Jaimes', 'James'),
5555
                      ('J*MSN', 'Jameson', 'Jamieson', 'Jamison'),
5556
                      ('J*NSN', 'Jahnsen', 'Jansen', 'Jansohn', 'Janssen',
5557
                       'Jansson,', 'Janzen', 'Jensen', 'Jenson'),
5558
                      ('J*S', 'Joice', 'Joyce'),
5559
                      ('K*', 'Kay', 'Kaye'),
5560
                      ('K*F', 'Coffee', 'Coffey'),
5561
                      ('K*FMN', 'Coffman', 'Kauffman', 'Kaufman', 'Kaufmann'),
5562
                      ('K*K', 'Cook', 'Cooke', 'Koch', 'Koche'),
5563
                      ('K*K', 'Cook', 'Cooke', 'Koch', 'Koche'),
5564
                      ('K*L', 'Cole', 'Kohl', 'Koll'),
5565
                      ('K*L', 'Cole', 'Kohl', 'Koll'),
5566
                      ('K*L', 'Kelley', 'Kelly'),
5567
                      ('K*LMN', 'Coleman', 'Colman'),
5568
                      ('K*LR', 'Koehler', 'Koeller', 'Kohler', 'Koller'),
5569
                      ('K*MBRLN', 'Chamberlain', 'Chamberlin'),
5570
                      ('K*MBS', 'Combs', 'Coombes', 'Coombs'),
5571
                      ('K*MP', 'Camp', 'Kampe', 'Kampf'),
5572
                      ('K*MPS', 'Campos', 'Campus'),
5573
                      ('K*N', 'Cahn', 'Conn', 'Kahn'),
5574
                      ('K*N', 'Cahen', 'Cain', 'Caine', 'Cane', 'Kain',
5575
                       'Kane'),
5576
                      ('K*N', 'Chin', 'Chinn'),
5577
                      ('K*N', 'Chaney', 'Cheney'),
5578
                      ('K*N', 'Coen', 'Cohan', 'Cohen', 'Cohn', 'Cone',
5579
                       'Koehn', 'Kahn'),
5580
                      ('K*N', 'Coon', 'Kuhn', 'Kuhne'),
5581
                      ('K*N', 'Kenney', 'Kenny', 'Kinney'),
5582
                      ('K*NL', 'Conley', 'Conly', 'Connelly', 'Connolly'),
5583
                      ('K*NR', 'Conner', 'Connor'),
5584
                      ('K*NS', 'Coons', 'Koontz', 'Kuhns', 'Kuns', 'Kuntz',
5585
                       'Kunz'),
5586
                      ('K*P', 'Coop', 'Co-op', 'Coope', 'Coupe', 'Koop'),
5587
                      ('K*PL', 'Chapel', 'Chapell', 'Chappel', 'Chappell',
5588
                       'Chappelle', 'Chapple'),
5589
                      ('K*R', 'Carrie', 'Carey', 'Cary'),
5590
                      ('K*R', 'Corey', 'Cory'),
5591
                      ('K*R', 'Carr', 'Kar', 'Karr'),
5592
                      # Corrected: No reason to strip S
5593
                      ('K*RS', 'Kurtz', 'Kurz'),
5594
                      ('K*R', 'Kehr', 'Ker', 'Kerr'),
5595
                      ('K*RD', 'Cartwright', 'Cortright'),
5596
                      # Corrected: No reason to strip D
5597
                      ('K*RLDN', 'Carleton', 'Carlton'),
5598
                      # Corrected: CE -> SE
5599
                      ('K*RN', 'Carney', '!Cerney', 'Kearney'),
5600
                      # Corrected: RC -> R
5601
                      ('K*RSNR', 'Kirschner', '!Kirchner'),
5602
                      ('K*S', 'Chace', 'Chase'),
5603
                      ('K*S', 'Cass', 'Kass'),
5604
                      ('K*S', 'Kees', 'Keyes', 'Keys'),
5605
                      ('K*SL', 'Cassel', 'Cassell', 'Castle'),
5606
                      ('K*SLR', 'Kesler', 'Kessler', 'Kestler'),
5607
                      ('K*SR', 'Kaiser', 'Kayser', 'Keizer', 'Keyser',
5608
                       'Kieser', 'Kiser', 'Kizer'),
5609
                      ('KL*N', 'Cline', 'Klein', 'Kleine', 'Kline'),
5610
                      ('KL*RK', 'Clark', 'Clarke'),
5611
                      ('KL*SN', 'Claussen', 'Clausen', 'Clawson', 'Closson'),
5612
                      ('KR*', 'Crow', 'Crowe'),
5613
                      ('KR*GR', 'Krieger', 'Kroeger', 'Krueger', 'Kruger'),
5614
                      ('KR*MR', 'Creamer', 'Cramer', 'Kraemer', 'Kramer',
5615
                       'Kremer'),
5616
                      ('KR*N', 'Craine', 'Crane'),
5617
                      ('KR*S', 'Christie', 'Christy', 'Kristee'),
5618
                      ('KR*S', 'Crouss', 'Kraus', 'Krausch', 'Krause',
5619
                       'Krouse'),
5620
                      ('KR*S', 'Cross', 'Krost'),
5621
                      ('KR*S', 'Crews', 'Cruz', 'Kruse'),
5622
                      ('KR*SNSN', 'Christensen', 'Christiansen',
5623
                       'Christianson'),
5624
                      ('L*', 'Loe', 'Loewe', 'Low', 'Lowe'),
5625
                      ('L*', 'Lea', 'Lee', '!Leigh'),
5626
                      ('L*D', 'Lloyd', 'Loyd'),
5627
                      ('L*DL', 'Litle', 'Littell', 'Little', 'Lytle'),
5628
                      ('L*DRMN', 'Ledterman', 'Letterman'),
5629
                      ('L*K', 'Leach', 'Leech', 'Leitch'),
5630
                      ('L*KS', 'Lucas', 'Lukas'),
5631
                      ('L*LN', 'Laughlin', 'Loughlin'),
5632
                      ('L*LR', 'Lawler', 'Lawlor'),
5633
                      ('L*MB', 'Lamb', '!Lamm'),
5634
                      ('L*MN', 'Lemen', 'Lemmon', 'Lemon'),
5635
                      ('L*MN', 'Layman', 'Lehman', 'Lehmann'),
5636
                      ('L*N', 'Lind', 'Lynd', 'Lynde'),
5637
                      ('L*N', 'Lion', 'Lyon'),
5638
                      ('L*N', 'Lin', 'Linn', 'Lynn', 'Lynne'),
5639
                      # Corrected: NG -> NG (!N)
5640
                      ('L*N', 'Lain', 'Laine', '!Laing', 'Lane', 'Layne'),
5641
                      ('L*NG', 'Lang', 'Lange'),
5642
                      ('L*NN', 'London', 'Lundin'),
5643
                      ('L*NS', 'Lindsay', 'Lindsey', '!Lindsley', '!Linsley'),
5644
                      ('L*R', 'Lawry', 'Lowery', 'Lowrey', 'Lowry'),
5645
                      ('L*RNS', 'Lawrence', 'Lowrance'),
5646
                      ('L*RNS', 'Laurence', 'Lawrance', 'Lawrence', 'Lorence',
5647
                       'Lorenz'),
5648
                      ('L*RSN', 'Larsen', 'Larson'),
5649
                      ('L*S', 'Lewis', 'Louis', 'Luis', 'Luiz'),
5650
                      ('L*S', 'Lacey', 'Lacy'),
5651
                      ('L*SR', '!Leicester', 'Lester'),
5652
                      ('L*V', 'Levey', 'Levi', 'Levy'),
5653
                      ('L*VD', 'Leavett', 'Leavitt', 'Levit'),
5654
                      ('L*VL', 'Lavell', 'Lavelle', 'Leavelle', 'Loveall',
5655
                       'Lovell'),
5656
                      ('L*VN', 'Lavin', 'Levin', 'Levine'),
5657
                      ('M*D', 'Mead', 'Meade'),
5658
                      # Corrected: RT*N -> R*N -> RN
5659
                      ('M*RN', '!Moretton', 'Morton'),
5660
                      ('M*DS', 'Mathews', 'Matthews'),
5661
                      ('M*DSN', 'Madison', 'Madsen', 'Matson', 'Matteson',
5662
                       'Mattison', 'Mattson'),
5663
                      ('M*KL', 'Michael', 'Michel'),
5664
                      ('M*KM', 'Meacham', 'Mechem'),
5665
                      # Corrected: RQ*S -> RKS, not KS
5666
                      ('M*RKS', 'Marques', 'Marquez', 'Marquis', 'Marquiss'),
5667
                      # Corrected: RKS does not compress to KS
5668
                      ('M*RKS', 'Marcks', 'Marks', 'Marx'),
5669
                      ('M*LN', 'Maloney', 'Moloney', 'Molony'),
5670
                      ('M*LN', 'Mullan', 'Mullen', 'Mullin'),
5671
                      ('M*LR', 'Mallery', 'Mallory'),
5672
                      ('M*LR', 'Moeller', 'Moller', 'Mueller', 'Muller'),
5673
                      ('M*LR', 'Millar', 'Miller'),
5674
                      ('M*LS', 'Miles', 'Myles'),
5675
                      ('M*N', 'Mahan', 'Mann'),
5676
                      ('M*NR', 'Miner', 'Minor'),
5677
                      ('M*NR', 'Monroe', 'Munro'),
5678
                      ('M*NSN', 'Monson', 'Munson'),
5679
                      ('M*R', 'Murray', 'Murrey'),
5680
                      ('M*R', 'Maher', 'Maier', 'Mayer'),
5681
                      ('M*R', 'Mohr', 'Moor', 'Moore'),
5682
                      # Corrected: No reason to eliminate final S
5683
                      ('M*RS', 'Meyers', 'Myers'),
5684
                      ('M*R', 'Meier', 'Meyer', 'Mieir', 'Myhre'),
5685
                      ('M*RF', 'Murphey', 'Murphy'),
5686
                      ('M*RL', 'Merrell', 'Merrill'),
5687
                      ('M*RN', 'Marten', 'Martin', 'Martine', 'Martyn'),
5688
                      ('M*RS', 'Meyers', 'Myers'),
5689
                      ('M*RS', 'Maurice', 'Morris', 'Morse'),
5690
                      ('MK*', 'McCoy', 'McCaughey'),
5691
                      ('MK*', 'Magee', 'McGee', 'McGehee', 'McGhie'),
5692
                      ('MK*', 'Mackey', 'MacKay', 'Mackie', 'McKay'),
5693
                      ('MK*', 'McCue', '!McHugh'),
5694
                      ('MK*L', 'Magill', 'McGill'),
5695
                      ('MK*LF', 'McCollough', '!McCullah', 'McCullough'),
5696
                      ('MK*LM', 'McCallum', 'McCollum', 'McColm'),
5697
                      ('MK*N', 'McKenney', 'McKinney'),
5698
                      ('MK*NR', 'Macintyre', 'McEntire', 'Mcintire',
5699
                       'Mcintyre'),
5700
                      ('MK*NS', 'MacKenzie', 'McKenzie'),
5701
                      ('MK*NS', 'Maginnis', 'McGinnis', 'McGuinness',
5702
                       'Mcinnes', 'Mcinnis'),
5703
                      ('MK*R', 'Maguire', 'McGuire'),
5704
                      ('MK*R', 'McCarthy', 'McCarty'),
5705
                      ('MKD*NL', 'MacDonald', 'McDonald', 'McDonnell'),
5706
                      ('MKF*RLN', 'MacFarland', 'MacFarlane', 'McFarland',
5707
                       'McFarlane'),
5708
                      ('MKF*RSN', 'MacPherson', 'McPherson'),
5709
                      ('MKL*D', 'MacLeod', 'McCloud', 'McLeod'),
5710
                      ('MKL*KLN', 'MacLachlan', 'Maclachlin', 'McLachlan',
5711
                       '!McLaughlin,', '!McLoughlin'),
5712
                      ('MKL*LN', 'McClellan', 'McClelland', 'McLellan'),
5713
                      ('MKL*N', 'McClain', 'McClaine', 'McLain', 'McLane'),
5714
                      ('MKL*N', 'MacLean', 'McClean', 'McLean'),
5715
                      ('MKL*S', 'McCloskey', 'McClosky', 'McCluskey'),
5716
                      ('MKM*LN', 'MacMillan', 'McMillan', 'McMillin'),
5717
                      ('MKN*L', 'MacNeal', 'McNeal', 'McNeil', 'McNeill'),
5718
                      ('MKR*D', 'Magrath', 'McGrath'),
5719
                      ('N*KL', 'Nichol', 'Nicholl', 'Nickel', 'Nickle',
5720
                       'Nicol', 'Nicoll'),
5721
                      ('N*KLS', 'Nicholls', 'Nichols', 'Nickels', 'Nickles',
5722
                       'Nicols'),
5723
                      ('N*KLS', 'Nicholas', 'Nicolas'),
5724
                      ('N*KLSN', 'Nicholsen', 'Nicholson', 'Nicolaisen',
5725
                       'Nicolson'),
5726
                      ('N*KSN', 'Nickson', 'Nixon'),
5727
                      ('N*L', 'Neal', 'Neale', 'Neall', 'Neel', 'Neil',
5728
                       'Neill'),
5729
                      ('N*LSN', 'Neilsen', 'Neilson', 'Nelsen', 'Nelson',
5730
                       'Nielsen', 'Nielson,', 'Nilson', 'Nilssen', 'Nilsson'),
5731
                      ('N*MN', 'Neumann', 'Newman'),
5732
                      ('N*RS', 'Norris', 'Nourse'),
5733
                      ('N*SBD', 'Nesbit', 'Nesbitt', 'Nisbet'),
5734
                      ('P*D', 'Pettee', 'Petty'),
5735
                      ('P*DRSN', 'Peterson', 'Pederson', 'Pedersen',
5736
                       'Petersen', 'Petterson'),
5737
                      ('P*G', 'Page', 'Paige'),
5738
                      ('P*LK', 'Polak', 'Pollack', 'Pollak', 'Pollock'),
5739
                      ('P*LSN', 'Polson', 'Paulsen', 'Paulson', 'Poulsen',
5740
                       'Poulsson'),
5741
                      ('P*N', 'Paine', 'Payn', 'Payne'),
5742
                      ('P*R', 'Parry', 'Perry'),
5743
                      ('P*R', 'Parr', 'Paar'),
5744
                      ('P*RK', 'Park', 'Parke'),
5745
                      ('P*RKS', 'Parks', 'Parkes'),
5746
                      # Corrected: RC -> R
5747
                      ('P*R', 'Pierce', 'Pearce', 'Peirce', '!Piers'),
5748
                      ('P*RS', 'Parish', 'Parrish'),
5749
                      ('P*RS', 'Paris', 'Parris'),
5750
                      ('P*RSN', 'Pierson', 'Pearson', 'Pehrson', 'Peirson'),
5751
                      ('PR*KR', 'Prichard', 'Pritchard'),
5752
                      ('PR*NS', 'Prince', 'Prinz'),
5753
                      ('PR*R', 'Prior', 'Pryor'),
5754
                      ('R*', 'Roe', 'Rowe'),
5755
                      ('R*', 'Rae', 'Ray', 'Raye', 'Rea', 'Rey', 'Wray'),
5756
                      ('R*BNSN', 'Robinson', '!Robison'),
5757
                      ('R*D', 'Rothe', 'Roth'),
5758
                      ('R*D', 'Rudd', 'Rood', 'Rude'),
5759
                      ('R*D', 'Reed', 'Read', 'Reade', 'Reid'),
5760
                      ('R*DR', 'Rider', 'Ryder'),
5761
                      ('R*DS', 'Rhoades', 'Rhoads', 'Rhodes'),
5762
                      ('R*GN', 'Regan', 'Ragon', 'Reagan'),
5763
                      # Corrected: No reason to drop final S
5764
                      ('R*GRS', 'Rodgers', 'Rogers'),
5765
                      ('R*K', 'Richey', 'Ritchey', 'Ritchie'),
5766
                      ('R*K', 'Reich', 'Reiche'),
5767
                      ('R*KR', 'Reichardt', 'Richert', 'Rickard'),
5768
                      ('R*L', 'Reilley', 'Reilly', 'Reilli', 'Riley'),
5769
                      # Corrected: T -> D
5770
                      ('R*MNGDN', 'Remington', 'Rimington'),
5771
                      ('R*MR', 'Reamer', 'Reimer', 'Riemer', 'Rimmer'),
5772
                      ('R*MS', 'Ramsay', 'Ramsey'),
5773
                      ('R*N', 'Rhein', 'Rhine', 'Ryan'),
5774
                      ('R*NR', 'Reinhard', 'Reinhardt', 'Reinhart',
5775
                       'Rhinehart', 'Rinehart'),
5776
                      ('R*S', 'Reas', 'Reece', 'Rees', 'Reese', 'Reis',
5777
                       'Reiss', 'Ries'),
5778
                      ('R*S', '!Rauch', 'Rausch', '!Roach', '!Roche', 'Roush'),
5779
                      ('R*S', 'Rush', 'Rusch'),
5780
                      ('R*S', 'Russ', 'Rus'),
5781
                      ('R*VS', 'Reaves', 'Reeves'),
5782
                      ('S*BR', 'Seibert', 'Siebert'),
5783
                      ('S*FL', 'Schofield', 'Scofield'),
5784
                      ('S*FN', 'Stefan', 'Steffan', 'Steffen', 'Stephan',
5785
                       'Stephen'),
5786
                      ('S*FNS', 'Steffens', 'Stephens', '!Stevens'),
5787
                      ('S*FNSN', 'Steffensen', 'Steffenson', 'Stephenson',
5788
                       '!Stevenson'),
5789
                      ('S*FR', 'Schaefer', 'Schaeffer', 'Schafer', 'Schaffer',
5790
                       'Schafer,', 'Shaffer', 'Sheaffer'),
5791
                      ('S*FR', 'Stauffer', 'Stouffer'),
5792
                      ('S*GL', 'Siegal', 'Sigal'),
5793
                      ('S*GLR', 'Sigler', 'Ziegler'),
5794
                      ('S*K', 'Schuck', 'Shuck'),
5795
                      ('S*KS', 'Sachs', 'Sacks', 'Saks', 'Sax', 'Saxe'),
5796
                      ('S*L', 'Seeley', 'Seely', 'Seley'),
5797
                      ('S*L', 'Schell', 'Shell'),
5798
                      ('S*LR', 'Schuler', 'Schuller'),
5799
                      # Corrected: LD -> L precedes T -> D
5800
                      ('S*LDS', 'Schultz', 'Schultze', '!Schulz', '!Schulze',
5801
                       'Shults', 'Shultz'),
5802
                      ('S*LV', 'Silva', 'Sylva'),
5803
                      ('S*LVR', 'Silveira', 'Silvera', 'Silveria'),
5804
                      ('S*MKR', 'Schomaker', 'Schumacher', 'Schumaker',
5805
                       'Shoemaker,', 'Shumaker'),
5806
                      ('S*MN', 'Simon', 'Symon'),
5807
                      ('S*MN', 'Seaman', 'Seemann', 'Semon'),
5808
                      ('S*MRS', 'Somers', 'Sommars', 'Sommers', 'Summers'),
5809
                      ('S*MS', 'Simms', 'Sims'),
5810
                      ('S*N', 'Stein', 'Stine'),
5811
                      ('S*N', 'Sweeney', 'Sweeny', 'Sweney'),
5812
                      ('S*NR', 'Senter', 'Center'),
5813
                      ('S*NRS', 'Sanders', 'Saunders'),
5814
                      ('S*PR', 'Shepard', '!Shephard', '!Shepheard',
5815
                       '!Shepherd', 'Sheppard'),
5816
                      ('S*R', 'Stahr', 'Star', 'Starr'),
5817
                      ('S*R', 'Stewart', 'Stuart'),
5818
                      ('S*R', 'Storey', 'Story'),
5819
                      ('S*R', 'Saier', 'Sayre'),
5820
                      # Corrected: No reason to strip final S
5821
                      ('S*RS', 'Schwartz', 'Schwarz', 'Schwarze', 'Swartz'),
5822
                      ('S*RL', 'Schirle', 'Shirley'),
5823
                      ('S*RLNG', 'Sterling', 'Stirling'),
5824
                      ('S*RMN', 'Scheuermann', 'Schurman', 'Sherman'),
5825
                      ('S*RN', 'Stearn', 'Stern'),
5826
                      ('S*RR', 'Scherer', 'Shearer', 'Sharer', 'Sherer',
5827
                       'Sheerer'),
5828
                      ('S*S', 'Sousa', 'Souza'),
5829
                      ('SM*D', 'Smith', 'Smyth', 'Smythe'),
5830
                      ('SM*D', 'Schmid', 'Schmidt', 'Schmit', 'Schmitt',
5831
                       'Smit'),
5832
                      ('SN*DR', 'Schneider', 'Schnieder', 'Snaider', 'Snider',
5833
                       'Snyder'),
5834
                      ('SN*L', 'Schnell', 'Snell'),
5835
                      ('SP*LNG', 'Spalding', 'Spaulding'),
5836
                      ('SP*R', 'Spear', 'Speer', '!Speirer'),
5837
                      # Corrected: No reason to strip final S
5838
                      ('SP*RS', 'Spears', 'Speers'),
5839
                      ('SR*DR', 'Schroder', 'Schroeder', 'Schroeter'),
5840
                      ('SR*DR', 'Schrader', 'Shrader'),
5841
                      # Corrected: Everywhere else, rule 3 applies to char 1
5842
                      ('D*D', 'Tait', 'Tate'),
5843
                      ('D*MSN', 'Thomason', '!Thompson', 'Thomsen', 'Thomson',
5844
                       'Tomson'),
5845
                      ('D*RL', 'Terrel', 'Terrell', 'Terrill'),
5846
                      ('DR*S', 'Tracey', 'Tracy'),
5847
                      ('V*L', 'Vail', 'Vaile', 'Vale'),
5848
                      ('V*L', 'Valley', 'Valle'),
5849
                      ('V*R', 'Vieira', 'Vierra'),
5850
                      ('W*D', 'White', 'Wight'),
5851
                      ('W*DKR', 'Whitacre', 'Whitaker', 'Whiteaker',
5852
                       'Whittaker'),
5853
                      ('W*DL', 'Whiteley', 'Whitley'),
5854
                      ('W*DMN', 'Whitman', 'Wittman'),
5855
                      ('W*DR', 'Woodard', 'Woodward'),
5856
                      ('W*DRS', 'Waters', 'Watters'),
5857
                      ('W*GNR', 'Wagener', 'Waggener', 'Wagoner', 'Wagner',
5858
                       'Wegner,', 'Waggoner'),
5859
                      ('W*L', 'Willey', 'Willi'),
5860
                      ('W*L', 'Wiley', 'Wylie'),
5861
                      ('W*L', 'Wahl', 'Wall'),
5862
                      ('W*LBR', 'Wilber', 'Wilbur'),
5863
                      ('W*LF', 'Wolf', 'Wolfe', 'Wolff', 'Woolf', 'Woulfe',
5864
                       'Wulf', 'Wulff'),
5865
                      ('W*LKNS', 'Wilkens', 'Wilkins'),
5866
                      ('W*LKS', 'Wilkes', 'Wilks'),
5867
                      ('W*LN', 'Whalen', 'Whelan'),
5868
                      # Corrected: LD -> L precedes T -> D
5869
                      ('W*LDR', 'Walter', 'Walther', 'Wolter'),
5870
                      ('W*LDRS', 'Walters', 'Walthers', 'Wolters'),
5871
                      ('W*LS', 'Wallace', 'Wallis'),
5872
                      ('W*LS', 'Welch', 'Welsh'),
5873
                      ('W*LS', 'Welles', 'Wells'),
5874
                      ('W*LSN', 'Willson', 'Wilson'),
5875
                      ('W*N', 'Winn', 'Wynn', 'Wynne'),
5876
                      ('W*R', 'Worth', 'Wirth'),
5877
                      ('W*R', 'Ware', 'Wear', 'Weir', 'Wier'),
5878
                      ('W*RL', 'Wehrle', 'Wehrlie', 'Werle', 'Worley'),
5879
                      ('W*RNR', 'Warner', 'Werner'),
5880
                      ('W*S', 'Weis', 'Weiss', 'Wiese', 'Wise', 'Wyss'),
5881
                      ('W*SMN', 'Weismann', 'Weissman', 'Weseman', 'Wiseman,',
5882
                       'Wismonn', 'Wissman'))
5883
5884
        for tests in test_cases:
5885
            result, names = tests[0], tests[1:]
5886
            for name in names:
5887
                if name[0] == '!':
5888
                    self.assertNotEqual(result, dolby(name[1:]))
5889
                else:
5890
                    self.assertEqual(result, dolby(name))
5891
5892
        # Additional tests to improve coverage
5893
        self.assertEqual(dolby('Rune'), 'R*N')
5894
        self.assertEqual(dolby('Rune', keep_vowels=True), 'R*N*')
5895
        self.assertEqual(dolby('Rune', vowel_char=''), 'RN')
5896
        self.assertEqual(dolby('Rune', vowel_char='A'), 'RAN')
5897
        self.assertEqual(dolby('Rune', maxlength=2), 'R*')
5898
        self.assertEqual(dolby('Rune', maxlength=2), 'R*')
5899
        self.assertEqual(dolby('Wassermann', maxlength=4), 'W*SR')
5900
        self.assertEqual(dolby('Wassermanns', maxlength=4, keep_vowels=True),
5901
                         'W*S*')
5902
        self.assertEqual(dolby('Wassermanns'), 'W*SRMNS')
5903
5904
5905
class PhoneticSpanishTestCases(unittest.TestCase):
5906
    """Test PhoneticSpanish functions.
5907
5908
    test cases for abydos.phonetic.phonetic_spanish
5909
    """
5910
5911
    def test_phonetic_spanish(self):
5912
        """Test abydos.phonetic.phonetic_spanish."""
5913
        # Base case
5914
        self.assertEqual(phonetic_spanish(''), '')
5915
5916
        # Examples given in
5917
        self.assertEqual(phonetic_spanish('Giraldo'), '8953')
5918
        self.assertEqual(phonetic_spanish('Jiraldo'), '8953')
5919
        self.assertEqual(phonetic_spanish('Halla'), '25')
5920
        self.assertEqual(phonetic_spanish('Haya'), '25')
5921
        self.assertEqual(phonetic_spanish('Cielo'), '45')
5922
        self.assertEqual(phonetic_spanish('Sielo'), '45')
5923
5924
        # Test to maximize coverage
5925
        self.assertEqual(phonetic_spanish('Giraldo', maxlength=2), '89')
5926
5927
5928
class SpanishMetaphoneTestCases(unittest.TestCase):
5929
    """Test Spanish Metaphone functions.
5930
5931
    test cases for abydos.phonetic.spanish_metaphone
5932
    """
5933
5934
    def test_spanish_metaphone(self):
5935
        """Test abydos.phonetic.spanish_metaphone."""
5936
        # Base case
5937
        self.assertEqual(spanish_metaphone(''), '')
5938
5939
        # Examples given in
5940
        # https://github.com/amsqr/Spanish-Metaphone/blob/master/phonetic_algorithms_es.py
5941
        self.assertEqual(spanish_metaphone('X'), 'X')
5942
        self.assertEqual(spanish_metaphone('xplosion'), 'EXPLSN')
5943
        self.assertEqual(spanish_metaphone('escalera'), 'ESKLR')
5944
        self.assertEqual(spanish_metaphone('scalera'), 'ESKLR')
5945
        self.assertEqual(spanish_metaphone('mi'), 'M')
5946
        self.assertEqual(spanish_metaphone('tu'), 'T')
5947
        self.assertEqual(spanish_metaphone('su'), 'S')
5948
        self.assertEqual(spanish_metaphone('te'), 'T')
5949
        self.assertEqual(spanish_metaphone('ochooomiiiillllllll'), 'OXMYY')
5950
        self.assertEqual(spanish_metaphone('complicado'), 'KMPLKD')
5951
        self.assertEqual(spanish_metaphone('ácaro'), 'AKR')
5952
        self.assertEqual(spanish_metaphone('ácido'), 'AZD')
5953
        self.assertEqual(spanish_metaphone('clown'), 'KLUN')
5954
        self.assertEqual(spanish_metaphone('down'), 'DUN')
5955
        self.assertEqual(spanish_metaphone('col'), 'KL')
5956
        self.assertEqual(spanish_metaphone('clon'), 'KLN')
5957
        self.assertEqual(spanish_metaphone('waterpolo'), 'UTRPL')
5958
        self.assertEqual(spanish_metaphone('aquino'), 'AKN')
5959
        self.assertEqual(spanish_metaphone('rebosar'), 'RVSR')
5960
        self.assertEqual(spanish_metaphone('rebozar'), 'RVZR')
5961
        self.assertEqual(spanish_metaphone('grajea'), 'GRJ')
5962
        self.assertEqual(spanish_metaphone('gragea'), 'GRJ')
5963
        self.assertEqual(spanish_metaphone('encima'), 'ENZM')
5964
        self.assertEqual(spanish_metaphone('enzima'), 'ENZM')
5965
        self.assertEqual(spanish_metaphone('alhamar'), 'ALAMR')
5966
        self.assertEqual(spanish_metaphone('abollar'), 'AVYR')
5967
        self.assertEqual(spanish_metaphone('aboyar'), 'AVYR')
5968
        self.assertEqual(spanish_metaphone('huevo'), 'UV')
5969
        self.assertEqual(spanish_metaphone('webo'), 'UV')
5970
        self.assertEqual(spanish_metaphone('macho'), 'MX')
5971
        self.assertEqual(spanish_metaphone('xocolate'), 'XKLT')
5972
        self.assertEqual(spanish_metaphone('chocolate'), 'XKLT')
5973
        self.assertEqual(spanish_metaphone('axioma'), 'AXM')
5974
        self.assertEqual(spanish_metaphone('abedul'), 'AVDL')
5975
        self.assertEqual(spanish_metaphone('a'), 'A')
5976
        self.assertEqual(spanish_metaphone('gengibre'), 'JNJVR')
5977
        self.assertEqual(spanish_metaphone('yema'), 'YM')
5978
        self.assertEqual(spanish_metaphone('wHISKY'), 'UISKY')
5979
        self.assertEqual(spanish_metaphone('google'), 'GGL')
5980
        self.assertEqual(spanish_metaphone('xilófono'), 'XLFN')
5981
        self.assertEqual(spanish_metaphone('web'), 'UV')
5982
        self.assertEqual(spanish_metaphone('guerra'), 'GRR')
5983
        self.assertEqual(spanish_metaphone('pingüino'), 'PNUN')
5984
        self.assertEqual(spanish_metaphone('si'), 'S')
5985
        self.assertEqual(spanish_metaphone('ke'), 'K')
5986
        self.assertEqual(spanish_metaphone('que'), 'K')
5987
        self.assertEqual(spanish_metaphone('tu'), 'T')
5988
        self.assertEqual(spanish_metaphone('gato'), 'GT')
5989
        self.assertEqual(spanish_metaphone('gitano'), 'JTN')
5990
        self.assertEqual(spanish_metaphone('queso'), 'KS')
5991
        self.assertEqual(spanish_metaphone('paquete'), 'PKT')
5992
        self.assertEqual(spanish_metaphone('cuco'), 'KK')
5993
        self.assertEqual(spanish_metaphone('perro'), 'PRR')
5994
        self.assertEqual(spanish_metaphone('pero'), 'PR')
5995
        self.assertEqual(spanish_metaphone('arrebato'), 'ARRVT')
5996
        self.assertEqual(spanish_metaphone('hola'), 'OL')
5997
        self.assertEqual(spanish_metaphone('zapato'), 'ZPT')
5998
        self.assertEqual(spanish_metaphone('españa'), 'ESPNY')
5999
        self.assertEqual(spanish_metaphone('garrulo'), 'GRRL')
6000
        self.assertEqual(spanish_metaphone('expansión'), 'EXPNSN')
6001
        self.assertEqual(spanish_metaphone('membrillo'), 'MMVRY')
6002
        self.assertEqual(spanish_metaphone('jamón'), 'JMN')
6003
        self.assertEqual(spanish_metaphone('risa'), 'RS')
6004
        self.assertEqual(spanish_metaphone('caricia'), 'KRZ')
6005
        self.assertEqual(spanish_metaphone('llaves'), 'YVS')
6006
        self.assertEqual(spanish_metaphone('paella'), 'PY')
6007
        self.assertEqual(spanish_metaphone('cerilla'), 'ZRY')
6008
6009
        # tests from file:///home/chrislit/Downloads/ICTRS_2016_12.pdf
6010
        # including of the modified version of the algorithm
6011
        self.assertEqual(spanish_metaphone('Caricia'), 'KRZ')
6012
        self.assertEqual(spanish_metaphone('Caricia', modified=True), 'KRZ')
6013
        self.assertEqual(spanish_metaphone('Llaves'), 'YVS')
6014
        self.assertEqual(spanish_metaphone('Llaves', modified=True), 'YVZ')
6015
        self.assertEqual(spanish_metaphone('Paella'), 'PY')
6016
        self.assertEqual(spanish_metaphone('Paella', modified=True), 'PY')
6017
        self.assertEqual(spanish_metaphone('Cerilla'), 'ZRY')
6018
        self.assertEqual(spanish_metaphone('Cerilla', modified=True), 'ZRY')
6019
        self.assertEqual(spanish_metaphone('Empeorar'), 'EMPRR')
6020
        self.assertEqual(spanish_metaphone('Empeorar', modified=True), 'ENPRR')
6021
        self.assertEqual(spanish_metaphone('Embotellar'), 'EMVTYR')
6022
        self.assertEqual(spanish_metaphone('Embotellar', modified=True),
6023
                         'ENVTYR')
6024
        self.assertEqual(spanish_metaphone('Hoy'), 'OY')
6025
        self.assertEqual(spanish_metaphone('Hoy', modified=True), 'OY')
6026
        self.assertEqual(spanish_metaphone('Xochimilco'), 'XXMLK')
6027
        self.assertEqual(spanish_metaphone('Xochimilco', modified=True),
6028
                         'XXMLK')
6029
        self.assertEqual(spanish_metaphone('Psiquiatra'), 'PSKTR')
6030
        self.assertEqual(spanish_metaphone('Psiquiatra', modified=True),
6031
                         'ZKTR')
6032
        self.assertEqual(spanish_metaphone('siquiatra'), 'SKTR')
6033
        self.assertEqual(spanish_metaphone('siquiatra', modified=True), 'ZKTR')
6034
        self.assertEqual(spanish_metaphone('Obscuro'), 'OVSKR')
6035
        self.assertEqual(spanish_metaphone('Obscuro', modified=True), 'OZKR')
6036
        self.assertEqual(spanish_metaphone('Oscuro'), 'OSKR')
6037
        self.assertEqual(spanish_metaphone('Oscuro', modified=True), 'OZKR')
6038
        self.assertEqual(spanish_metaphone('Combate'), 'KMVT')
6039
        self.assertEqual(spanish_metaphone('Combate', modified=True), 'KNVT')
6040
        self.assertEqual(spanish_metaphone('Convate'), 'KNVT')
6041
        self.assertEqual(spanish_metaphone('Convate', modified=True), 'KNVT')
6042
        self.assertEqual(spanish_metaphone('Conbate'), 'KNVT')
6043
        self.assertEqual(spanish_metaphone('Conbate', modified=True), 'KNVT')
6044
        self.assertEqual(spanish_metaphone('Comportar'), 'KMPRTR')
6045
        self.assertEqual(spanish_metaphone('Comportar', modified=True),
6046
                         'KNPRTR')
6047
        self.assertEqual(spanish_metaphone('Conportar'), 'KNPRTR')
6048
        self.assertEqual(spanish_metaphone('Conportar', modified=True),
6049
                         'KNPRTR')
6050
        self.assertEqual(spanish_metaphone('Zapato'), 'ZPT')
6051
        self.assertEqual(spanish_metaphone('Zapato', modified=True), 'ZPT')
6052
        self.assertEqual(spanish_metaphone('Sapato'), 'SPT')
6053
        self.assertEqual(spanish_metaphone('Sapato', modified=True), 'ZPT')
6054
        self.assertEqual(spanish_metaphone('Escalera'), 'ESKLR')
6055
        self.assertEqual(spanish_metaphone('Escalera', modified=True), 'EZKLR')
6056
        self.assertEqual(spanish_metaphone('scalera'), 'ESKLR')
6057
        self.assertEqual(spanish_metaphone('scalera', modified=True), 'EZKLR')
6058
6059
        # terms from algorithm/source
6060
        self.assertEqual(spanish_metaphone('acción'), 'AXN')
6061
        self.assertEqual(spanish_metaphone('reacción'), 'RXN')
6062
        self.assertEqual(spanish_metaphone('cesar'), 'ZSR')
6063
        self.assertEqual(spanish_metaphone('cien'), 'ZN')
6064
        self.assertEqual(spanish_metaphone('cid'), 'ZD')
6065
        self.assertEqual(spanish_metaphone('conciencia'), 'KNZNZ')
6066
        self.assertEqual(spanish_metaphone('gente'), 'JNT')
6067
        self.assertEqual(spanish_metaphone('ecologia'), 'EKLJ')
6068
6069
        # completing coverage
6070
        self.assertEqual(spanish_metaphone('hola'), 'OL')
6071
        self.assertEqual(spanish_metaphone('aqi'), 'AK')
6072
        self.assertEqual(spanish_metaphone('hjordis'), 'HJRDS')
6073
6074
6075
class MetaSoundexTestCases(unittest.TestCase):
6076
    """Test MetaSoundex functions.
6077
6078
    test cases for abydos.phonetic.metasoundex
6079
    """
6080
6081
    def test_metasoundex(self):
6082
        """Test abydos.phonetic.metasoundex."""
6083
        # Base cases
6084
        self.assertEqual(metasoundex(''), '0000')
6085
        self.assertEqual(metasoundex('', lang='en'), '0000')
6086
        self.assertEqual(metasoundex('', lang='es'), '')
6087
6088
        # Top 10 Anglo surnames in US
6089
        self.assertEqual(metasoundex('Smith', lang='en'), '4500')
6090
        self.assertEqual(metasoundex('Johnson', lang='en'), '1525')
6091
        self.assertEqual(metasoundex('Williams', lang='en'), '7452')
6092
        self.assertEqual(metasoundex('Brown', lang='en'), '7650')
6093
        self.assertEqual(metasoundex('Jones', lang='en'), '1520')
6094
        self.assertEqual(metasoundex('Miller', lang='en'), '6460')
6095
        self.assertEqual(metasoundex('Davis', lang='en'), '3120')
6096
        self.assertEqual(metasoundex('Wilson', lang='en'), '7425')
6097
        self.assertEqual(metasoundex('Anderson', lang='en'), '0536')
6098
        self.assertEqual(metasoundex('Thomas', lang='en'), '6200')
6099
6100
        self.assertEqual(metasoundex('Smith', lang='es'), '4632')
6101
        self.assertEqual(metasoundex('Johnson', lang='es'), '82646')
6102
        self.assertEqual(metasoundex('Williams', lang='es'), '564')
6103
        self.assertEqual(metasoundex('Brown', lang='es'), '196')
6104
        self.assertEqual(metasoundex('Jones', lang='es'), '864')
6105
        self.assertEqual(metasoundex('Miller', lang='es'), '659')
6106
        self.assertEqual(metasoundex('Davis', lang='es'), '314')
6107
        self.assertEqual(metasoundex('Wilson', lang='es'), '546')
6108
        self.assertEqual(metasoundex('Anderson', lang='es'), '63946')
6109
        self.assertEqual(metasoundex('Thomas', lang='es'), '364')
6110
6111
        # Top 10 Mexican surnames
6112
        self.assertEqual(metasoundex('Hernández', lang='en'), '5653')
6113
        self.assertEqual(metasoundex('García', lang='en'), '5620')
6114
        self.assertEqual(metasoundex('Lòpez', lang='en'), '8120')
6115
        self.assertEqual(metasoundex('Martìnez', lang='en'), '6635')
6116
        self.assertEqual(metasoundex('Rodrìguez', lang='en'), '9362')
6117
        self.assertEqual(metasoundex('González', lang='en'), '5524')
6118
        self.assertEqual(metasoundex('Pérez', lang='en'), '7620')
6119
        self.assertEqual(metasoundex('Sánchez', lang='en'), '4520')
6120
        self.assertEqual(metasoundex('Gómez', lang='en'), '5520')
6121
        self.assertEqual(metasoundex('Flores', lang='en'), '7462')
6122
6123
        self.assertEqual(metasoundex('Hernández', lang='es'), '96634')
6124
        self.assertEqual(metasoundex('García', lang='es'), '894')
6125
        self.assertEqual(metasoundex('Lòpez', lang='es'), '504')
6126
        self.assertEqual(metasoundex('Martìnez', lang='es'), '69364')
6127
        self.assertEqual(metasoundex('Rodrìguez', lang='es'), '93984')
6128
        self.assertEqual(metasoundex('González', lang='es'), '86454')
6129
        self.assertEqual(metasoundex('Pérez', lang='es'), '094')
6130
        self.assertEqual(metasoundex('Sánchez', lang='es'), '4644')
6131
        self.assertEqual(metasoundex('Gómez', lang='es'), '864')
6132
        self.assertEqual(metasoundex('Flores', lang='es'), '2594')
6133
6134
6135
class SoundexBRTestCases(unittest.TestCase):
6136
    """Test SoundexBR functions.
6137
6138
    test cases for abydos.phonetic.soundex_br
6139
    """
6140
6141
    def test_soundex_br(self):
6142
        """Test abydos.phonetic.soundex_br."""
6143
        # Base case
6144
        self.assertEqual(soundex_br(''), '0000')
6145
6146
        # Examples given at https://github.com/danielmarcelino/SoundexBR
6147
        self.assertEqual(soundex_br('Ana Karolina Kuhnen'), 'A526')
6148
        self.assertEqual(soundex_br('Ana Carolina Kuhnen'), 'A526')
6149
        self.assertEqual(soundex_br('Ana Karolina'), 'A526')
6150
        self.assertEqual(soundex_br('João Souza'), 'J220')
6151
        self.assertEqual(soundex_br('Dilma Vana Rousseff'), 'D451')
6152
        self.assertEqual(soundex_br('Dilma Rousef'), 'D456')
6153
        self.assertEqual(soundex_br('Aécio Neves'), 'A251')
6154
        self.assertEqual(soundex_br('Aecio Neves'), 'A251')
6155
        self.assertEqual(soundex_br('HILBERT'), 'I416')
6156
        self.assertEqual(soundex_br('Heilbronn'), 'E416')
6157
        self.assertEqual(soundex_br('Gauss'), 'G200')
6158
        self.assertEqual(soundex_br('Kant'), 'C530')
6159
6160
        # Tests to complete coverage
6161
        self.assertEqual(soundex_br('Wasser'), 'V260')
6162
        self.assertEqual(soundex_br('Cici'), 'S200')
6163
        self.assertEqual(soundex_br('Gerard'), 'J663')
6164
        self.assertEqual(soundex_br('Yglesias'), 'I242')
6165
        self.assertEqual(soundex_br('Cici', zero_pad=False), 'S2')
6166
6167
6168
class NRLTestCases(unittest.TestCase):
6169
    """Test Naval Research Laboratory phonetic encoding functions.
6170
6171
    test cases for abydos.phonetic.nrl
6172
    """
6173
6174
    def test_nrl(self):
6175
        """Test abydos.phonetic.nrl."""
6176
        # Base case
6177
        self.assertEqual(soundex_br(''), '0000')
6178
6179
        # common English words
6180
        self.assertEqual(nrl('the'), 'DHAX')
6181
        self.assertEqual(nrl('of'), 'AXv')
6182
        self.assertEqual(nrl('and'), 'AEnd')
6183
        self.assertEqual(nrl('a'), 'AX')
6184
        self.assertEqual(nrl('to'), 'tUW')
6185
        self.assertEqual(nrl('in'), 'IHn')
6186
        self.assertEqual(nrl('is'), 'IHz')
6187
        self.assertEqual(nrl('you'), 'yUW')
6188
        self.assertEqual(nrl('that'), 'DHAEt')
6189
        self.assertEqual(nrl('it'), 'IHt')
6190
        self.assertEqual(nrl('he'), 'hIY')
6191
        self.assertEqual(nrl('was'), 'wAAz')
6192
        self.assertEqual(nrl('for'), 'fAOr')
6193
        self.assertEqual(nrl('on'), 'AAn')
6194
        self.assertEqual(nrl('are'), 'AAr')
6195
        self.assertEqual(nrl('as'), 'AEz')
6196
        self.assertEqual(nrl('with'), 'wIHTH')
6197
        self.assertEqual(nrl('his'), 'hIHz')
6198
        self.assertEqual(nrl('they'), 'DHEY')
6199
        self.assertEqual(nrl('I'), 'AY')
6200
        self.assertEqual(nrl('at'), 'AEt')
6201
        self.assertEqual(nrl('be'), 'bIY')
6202
        self.assertEqual(nrl('this'), 'DHIHs')
6203
        self.assertEqual(nrl('have'), 'hAEv')
6204
        self.assertEqual(nrl('from'), 'frAAm')
6205
        self.assertEqual(nrl('or'), 'AOr')
6206
        self.assertEqual(nrl('one'), 'wAHn')
6207
        self.assertEqual(nrl('had'), 'hAEd')
6208
        self.assertEqual(nrl('by'), 'bAY')
6209
        self.assertEqual(nrl('word'), 'wERd')
6210
        self.assertEqual(nrl('but'), 'bAHt')
6211
        self.assertEqual(nrl('not'), 'nAAt')
6212
        self.assertEqual(nrl('what'), 'WHAAt')
6213
        self.assertEqual(nrl('all'), 'AOl')
6214
        self.assertEqual(nrl('were'), 'wER')
6215
        self.assertEqual(nrl('we'), 'wIY')
6216
        self.assertEqual(nrl('when'), 'WHEHn')
6217
        self.assertEqual(nrl('your'), 'yUWr')
6218
        self.assertEqual(nrl('can'), 'kAEn')
6219
        self.assertEqual(nrl('said'), 'sEHd')
6220
        self.assertEqual(nrl('there'), 'DHEHr')
6221
        self.assertEqual(nrl('use'), 'yUWz')
6222
        self.assertEqual(nrl('an'), 'AEn')
6223
        self.assertEqual(nrl('each'), 'IYCH')
6224
        self.assertEqual(nrl('which'), 'WHIHCH')
6225
        self.assertEqual(nrl('she'), 'SHIY')
6226
        self.assertEqual(nrl('do'), 'dUW')
6227
        self.assertEqual(nrl('how'), 'hAW')
6228
        self.assertEqual(nrl('their'), 'DHEHr')
6229
        self.assertEqual(nrl('if'), 'IHf')
6230
        self.assertEqual(nrl('will'), 'wIHl')
6231
        self.assertEqual(nrl('up'), 'AHp')
6232
        self.assertEqual(nrl('other'), 'AHDHER')
6233
        self.assertEqual(nrl('about'), 'AEbAWt')
6234
        self.assertEqual(nrl('out'), 'AWt')
6235
        self.assertEqual(nrl('many'), 'mEHnIY')
6236
        self.assertEqual(nrl('then'), 'DHEHn')
6237
        self.assertEqual(nrl('them'), 'DHEHm')
6238
        self.assertEqual(nrl('these'), 'DHIYz')
6239
        self.assertEqual(nrl('so'), 'sOW')
6240
        self.assertEqual(nrl('some'), 'sAHm')
6241
        self.assertEqual(nrl('her'), 'hER')
6242
        self.assertEqual(nrl('would'), 'wUHd')
6243
        self.assertEqual(nrl('make'), 'mEYk')
6244
        self.assertEqual(nrl('like'), 'lAYk')
6245
        self.assertEqual(nrl('him'), 'hIHm')
6246
        self.assertEqual(nrl('into'), 'IHntUW')
6247
        self.assertEqual(nrl('time'), 'tAYm')
6248
        self.assertEqual(nrl('has'), 'hAEz')
6249
        self.assertEqual(nrl('look'), 'lUHk')
6250
        self.assertEqual(nrl('two'), 'tUW')
6251
        self.assertEqual(nrl('more'), 'mAOr')
6252
        self.assertEqual(nrl('write'), 'rAYt')
6253
        self.assertEqual(nrl('go'), 'gOW')
6254
        self.assertEqual(nrl('see'), 'sIY')
6255
        self.assertEqual(nrl('number'), 'nAHmbER')
6256
        self.assertEqual(nrl('no'), 'nOW')
6257
        self.assertEqual(nrl('way'), 'wEY')
6258
        self.assertEqual(nrl('could'), 'kUHd')
6259
        self.assertEqual(nrl('people'), 'pIYpl')
6260
        self.assertEqual(nrl('my'), 'mAY')
6261
        self.assertEqual(nrl('than'), 'DHAEn')
6262
        self.assertEqual(nrl('first'), 'fERst')
6263
        self.assertEqual(nrl('water'), 'wAAtER')
6264
        self.assertEqual(nrl('been'), 'bIYn')
6265
        self.assertEqual(nrl('call'), 'kAOl')
6266
        self.assertEqual(nrl('who'), 'hUW')
6267
        self.assertEqual(nrl('oil'), 'OYl')
6268
        self.assertEqual(nrl('its'), 'IHtz')
6269
        self.assertEqual(nrl('now'), 'nAW')
6270
        self.assertEqual(nrl('find'), 'fAYnd')
6271
        self.assertEqual(nrl('long'), 'lAONG')
6272
        self.assertEqual(nrl('down'), 'dAWn')
6273
        self.assertEqual(nrl('day'), 'dEY')
6274
        self.assertEqual(nrl('did'), 'dIHd')
6275
        self.assertEqual(nrl('get'), 'gEHt')
6276
        self.assertEqual(nrl('come'), 'kAHm')
6277
        self.assertEqual(nrl('made'), 'mEYd')
6278
        self.assertEqual(nrl('may'), 'mEY')
6279
        self.assertEqual(nrl('part'), 'pAArt')
6280
        self.assertEqual(nrl('supply'), 'sAHpplIH')
6281
        self.assertEqual(nrl('corner'), 'kAOrnER')
6282
        self.assertEqual(nrl('electric'), 'IYlEHktrIHk')
6283
        self.assertEqual(nrl('insects'), 'IHnsEHktz')
6284
        self.assertEqual(nrl('crops'), 'krAAps')
6285
        self.assertEqual(nrl('tone'), 'tOWn')
6286
        self.assertEqual(nrl('hit'), 'hIHt')
6287
        self.assertEqual(nrl('sand'), 'sAEnd')
6288
        self.assertEqual(nrl('doctor'), 'dAAktER')
6289
        self.assertEqual(nrl('provide'), 'prAHvAYd')
6290
        self.assertEqual(nrl('thus'), 'DHAHs')
6291
        self.assertEqual(nrl('won\'t'), 'wOWnt')
6292
        self.assertEqual(nrl('cook'), 'kUHk')
6293
        self.assertEqual(nrl('bones'), 'bOWnz')
6294
        self.assertEqual(nrl('tail'), 'tEYl')
6295
        self.assertEqual(nrl('board'), 'bOWrd')
6296
        self.assertEqual(nrl('modern'), 'mOWdERn')
6297
        self.assertEqual(nrl('compound'), 'kAAmpAWnd')
6298
        self.assertEqual(nrl('mine'), 'mAYn')
6299
        self.assertEqual(nrl('wasn\'t'), 'wAAzAXnt')
6300
        self.assertEqual(nrl('fit'), 'fIHt')
6301
        self.assertEqual(nrl('addition'), 'AEddIHSHAXn')
6302
        self.assertEqual(nrl('belong'), 'bIHlAONG')
6303
        self.assertEqual(nrl('safe'), 'sEYf')
6304
        self.assertEqual(nrl('soldiers'), 'sOWldIYERs')
6305
        self.assertEqual(nrl('guess'), 'gEHs')
6306
        self.assertEqual(nrl('silent'), 'sAYlEHnt')
6307
        self.assertEqual(nrl('trade'), 'trEYd')
6308
        self.assertEqual(nrl('rather'), 'rAEDHER')
6309
        self.assertEqual(nrl('compare'), 'kAAmpEHr')
6310
        self.assertEqual(nrl('crowd'), 'krOWd')
6311
        self.assertEqual(nrl('poem'), 'pOWEHm')
6312
        self.assertEqual(nrl('enjoy'), 'EHnjOY')
6313
        self.assertEqual(nrl('elements'), 'IYlIYmEHntz')
6314
        self.assertEqual(nrl('indicate'), 'IHndIHkEYt')
6315
        self.assertEqual(nrl('except'), 'EHkssEHpt')
6316
        self.assertEqual(nrl('expect'), 'EHkspEHkt')
6317
        self.assertEqual(nrl('flat'), 'flAEt')
6318
        self.assertEqual(nrl('seven'), 'sIYvEHn')
6319
        self.assertEqual(nrl('interest'), 'IHntIYrEHst')
6320
        self.assertEqual(nrl('sense'), 'sEHns')
6321
        self.assertEqual(nrl('string'), 'strIHNG')
6322
        self.assertEqual(nrl('blow'), 'blOW')
6323
        self.assertEqual(nrl('famous'), 'fAEmAXs')
6324
        self.assertEqual(nrl('value'), 'vAElUW')
6325
        self.assertEqual(nrl('wings'), 'wIHNGz')
6326
        self.assertEqual(nrl('movement'), 'mUWvIYmEHnt')
6327
        self.assertEqual(nrl('pole'), 'pOWl')
6328
        self.assertEqual(nrl('exciting'), 'EHkssAYtIHNG')
6329
        self.assertEqual(nrl('branches'), 'brAEnCHIHz')
6330
        self.assertEqual(nrl('thick'), 'THIHk')
6331
        self.assertEqual(nrl('blood'), 'blUHd')
6332
        self.assertEqual(nrl('lie'), 'lAY')
6333
        self.assertEqual(nrl('spot'), 'spAAt')
6334
        self.assertEqual(nrl('bell'), 'bEHl')
6335
        self.assertEqual(nrl('fun'), 'fAHn')
6336
        self.assertEqual(nrl('loud'), 'lAWd')
6337
        self.assertEqual(nrl('consider'), 'kAAnsAYdER')
6338
        self.assertEqual(nrl('suggested'), 'sAHgjEHstIHd')
6339
        self.assertEqual(nrl('thin'), 'THIHn')
6340
        self.assertEqual(nrl('position'), 'pAAzIHSHAXn')
6341
        self.assertEqual(nrl('entered'), 'EHntIYrd')
6342
        self.assertEqual(nrl('fruit'), 'frUWIHt')
6343
        self.assertEqual(nrl('tied'), 'tAYd')
6344
        self.assertEqual(nrl('rich'), 'rIHCH')
6345
        self.assertEqual(nrl('dollars'), 'dAAlAArs')
6346
        self.assertEqual(nrl('send'), 'sEHnd')
6347
        self.assertEqual(nrl('sight'), 'sAYt')
6348
        self.assertEqual(nrl('chief'), 'CHAYEHf')
6349
        self.assertEqual(nrl('Japanese'), 'jAEpAEnIYz')
6350
        self.assertEqual(nrl('stream'), 'strIYm')
6351
        self.assertEqual(nrl('plants'), 'plAEntz')
6352
        self.assertEqual(nrl('rhythm'), 'rIHTHm')
6353
        self.assertEqual(nrl('eight'), 'EYt')
6354
        self.assertEqual(nrl('science'), 'sAYEHns')
6355
        self.assertEqual(nrl('major'), 'mAEjER')
6356
        self.assertEqual(nrl('observe'), 'AAbsERv')
6357
        self.assertEqual(nrl('tube'), 'tUWb')
6358
        self.assertEqual(nrl('necessary'), 'nIYsEHsAArIH')
6359
        self.assertEqual(nrl('weight'), 'wEYt')
6360
        self.assertEqual(nrl('meat'), 'mIYt')
6361
        self.assertEqual(nrl('lifted'), 'lIHftIHd')
6362
        self.assertEqual(nrl('process'), 'prOWsEHs')
6363
        self.assertEqual(nrl('army'), 'AArmIY')
6364
        self.assertEqual(nrl('hat'), 'hAEt')
6365
        self.assertEqual(nrl('property'), 'prOWpERtIH')
6366
        self.assertEqual(nrl('particular'), 'pAArtIHkyUWlER')
6367
        self.assertEqual(nrl('swim'), 'swIHm')
6368
        self.assertEqual(nrl('terms'), 'tERmz')
6369
        self.assertEqual(nrl('current'), 'kERrEHnt')
6370
        self.assertEqual(nrl('park'), 'pAArk')
6371
        self.assertEqual(nrl('sell'), 'sEHl')
6372
        self.assertEqual(nrl('shoulder'), 'SHUHdER')
6373
        self.assertEqual(nrl('industry'), 'IHndAHstrIH')
6374
        self.assertEqual(nrl('wash'), 'wAASH')
6375
        self.assertEqual(nrl('block'), 'blAAk')
6376
        self.assertEqual(nrl('spread'), 'sprEHd')
6377
        self.assertEqual(nrl('cattle'), 'kAEttl')
6378
        self.assertEqual(nrl('wife'), 'wAYf')
6379
        self.assertEqual(nrl('sharp'), 'SHAArp')
6380
        self.assertEqual(nrl('company'), 'kAAmpAEnIH')
6381
        self.assertEqual(nrl('radio'), 'rEYdIHOW')
6382
        self.assertEqual(nrl('we\'ll'), 'wEHl')
6383
        self.assertEqual(nrl('action'), 'AEkSHAXn')
6384
        self.assertEqual(nrl('capital'), 'kAEpIHtAXl')
6385
        self.assertEqual(nrl('factories'), 'fAEktAOrIYs')
6386
        self.assertEqual(nrl('settled'), 'sEHttld')
6387
        self.assertEqual(nrl('yellow'), 'yEHlOW')
6388
        self.assertEqual(nrl('isn\'t'), 'IHzAXnt')
6389
        self.assertEqual(nrl('southern'), 'sAWDHERn')
6390
        self.assertEqual(nrl('truck'), 'trAHk')
6391
        self.assertEqual(nrl('train'), 'trEYn')
6392
        self.assertEqual(nrl('printed'), 'prIHntIHd')
6393
        self.assertEqual(nrl('wouldn\'t'), 'wUHdnt')
6394
        self.assertEqual(nrl('ahead'), 'EYhEHd')
6395
        self.assertEqual(nrl('chance'), 'CHAEns')
6396
        self.assertEqual(nrl('born'), 'bAOrn')
6397
        self.assertEqual(nrl('level'), 'lIYvEHl')
6398
        self.assertEqual(nrl('triangle'), 'trIHAENGgAXl')
6399
        self.assertEqual(nrl('molecules'), 'mOWlEHkyUWlz')
6400
        self.assertEqual(nrl('France'), 'frAEns')
6401
        self.assertEqual(nrl('repeated'), 'rIYpIYtIHd')
6402
        self.assertEqual(nrl('column'), 'kAAlAHmn')
6403
        self.assertEqual(nrl('western'), 'wEHstERn')
6404
        self.assertEqual(nrl('church'), 'CHERCH')
6405
        self.assertEqual(nrl('sister'), 'sIHstER')
6406
        self.assertEqual(nrl('oxygen'), 'AAksIHjEHn')
6407
        self.assertEqual(nrl('plural'), 'plUHrAXl')
6408
        self.assertEqual(nrl('various'), 'vEHrIHAXs')
6409
        self.assertEqual(nrl('agreed'), 'AEgrIYd')
6410
        self.assertEqual(nrl('opposite'), 'AAppAAzAYt')
6411
        self.assertEqual(nrl('wrong'), 'rAONG')
6412
        self.assertEqual(nrl('chart'), 'CHAArt')
6413
        self.assertEqual(nrl('prepared'), 'prEHpEHrd')
6414
        self.assertEqual(nrl('pretty'), 'prEHttIH')
6415
        self.assertEqual(nrl('solution'), 'sAAlUWSHAXn')
6416
        self.assertEqual(nrl('fresh'), 'frEHSH')
6417
        self.assertEqual(nrl('shop'), 'SHAAp')
6418
        self.assertEqual(nrl('suffix'), 'sAHffIHks')
6419
        self.assertEqual(nrl('especially'), 'EHspEHSHAXlIY')
6420
        self.assertEqual(nrl('shoes'), 'SHOWz')
6421
        self.assertEqual(nrl('actually'), 'AEkCHUWAXlIY')
6422
        self.assertEqual(nrl('nose'), 'nOWz')
6423
        self.assertEqual(nrl('afraid'), 'AEfrEYd')
6424
        self.assertEqual(nrl('dead'), 'dEHd')
6425
        self.assertEqual(nrl('sugar'), 'sUWgER')
6426
        self.assertEqual(nrl('adjective'), 'AEdjEHktAYv')
6427
        self.assertEqual(nrl('fig'), 'fIHg')
6428
        self.assertEqual(nrl('office'), 'AOffIHs')
6429
        self.assertEqual(nrl('huge'), 'hyUWj')
6430
        self.assertEqual(nrl('gun'), 'gAHn')
6431
        self.assertEqual(nrl('similar'), 'sIHmIHlER')
6432
        self.assertEqual(nrl('death'), 'dIYTH')
6433
        self.assertEqual(nrl('score'), 'skAOr')
6434
        self.assertEqual(nrl('forward'), 'fAOrwAOrd')
6435
        self.assertEqual(nrl('stretched'), 'strEHtCHd')
6436
        self.assertEqual(nrl('experience'), 'EHkspIYrIYEHns')
6437
        self.assertEqual(nrl('rose'), 'rOWz')
6438
        self.assertEqual(nrl('allow'), 'AOlOW')
6439
        self.assertEqual(nrl('fear'), 'fIYr')
6440
        self.assertEqual(nrl('workers'), 'wERkERs')
6441
        self.assertEqual(nrl('Washington'), 'wAASHIHNGtAXn')
6442
        self.assertEqual(nrl('Greek'), 'grIYk')
6443
        self.assertEqual(nrl('women'), 'wOWmEHn')
6444
        self.assertEqual(nrl('brought'), 'brAOt')
6445
        self.assertEqual(nrl('led'), 'lEHd')
6446
        self.assertEqual(nrl('march'), 'mAArCH')
6447
        self.assertEqual(nrl('northern'), 'nAOrDHERn')
6448
        self.assertEqual(nrl('create'), 'krIYt')
6449
        self.assertEqual(nrl('British'), 'brAYtIHSH')
6450
        self.assertEqual(nrl('difficult'), 'dIHffIHkAHlt')
6451
        self.assertEqual(nrl('match'), 'mAEtCH')
6452
        self.assertEqual(nrl('win'), 'wIHn')
6453
        self.assertEqual(nrl('doesn\'t'), 'dAHznt')
6454
        self.assertEqual(nrl('steel'), 'stIYl')
6455
        self.assertEqual(nrl('total'), 'tAAtAXl')
6456
        self.assertEqual(nrl('deal'), 'dIYl')
6457
        self.assertEqual(nrl('determine'), 'dIHtERmAYn')
6458
        self.assertEqual(nrl('evening'), 'IYvIYnIHNG')
6459
        self.assertEqual(nrl('nor'), 'nAOr')
6460
        self.assertEqual(nrl('rope'), 'rOWp')
6461
        self.assertEqual(nrl('cotton'), 'kAAttAXn')
6462
        self.assertEqual(nrl('apple'), 'AEppAXl')
6463
        self.assertEqual(nrl('details'), 'dIHtEYlz')
6464
        self.assertEqual(nrl('entire'), 'EHntAYr')
6465
        self.assertEqual(nrl('corn'), 'kAOrn')
6466
        self.assertEqual(nrl('substances'), 'sAHbstAEnsIHz')
6467
        self.assertEqual(nrl('smell'), 'smEHl')
6468
        self.assertEqual(nrl('tools'), 'tUWlz')
6469
        self.assertEqual(nrl('conditions'), 'kAAndIHSHAXnz')
6470
        self.assertEqual(nrl('cows'), 'kOWz')
6471
        self.assertEqual(nrl('track'), 'trAEk')
6472
        self.assertEqual(nrl('arrived'), 'AXrIHvd')
6473
        self.assertEqual(nrl('located'), 'lOWkEYtIHd')
6474
        self.assertEqual(nrl('sir'), 'sER')
6475
        self.assertEqual(nrl('seat'), 'sIYt')
6476
        self.assertEqual(nrl('division'), 'dIHvIHZHAXn')
6477
        self.assertEqual(nrl('effect'), 'EHffEHkt')
6478
        self.assertEqual(nrl('underline'), 'AHndERlAYn')
6479
        self.assertEqual(nrl('view'), 'vyUW')
6480
6481
        # non-English words (with letters not used in English)
6482
        self.assertEqual(nrl('garçon'), 'gAArÇAAn')
6483
        self.assertEqual(nrl('ðæt'), 'ÐÆt')
6484
        self.assertEqual(nrl('wünschen'), 'wÜnsCHEHn')
6485
        self.assertEqual(nrl('øl'), 'Øl')
6486
6487
6488
class BeiderMorseTestCases(unittest.TestCase):
6489
    """Test BMPM functions.
6490
6491
    test cases for abydos.phonetic.bmpm and abydos.bm.*
6492
    """
6493
6494
    def test_bmpm(self):
6495
        """Test abydos.phonetic.bmpm.
6496
6497
        Most test cases from:
6498
        http://svn.apache.org/viewvc/commons/proper/codec/trunk/src/test/java/org/apache/commons/codec/language/bm/
6499
6500
        As a rule, the test cases are copied from the above code, but the
6501
        resultant values are not. This is largely because this Python port
6502
        follows the PHP reference implementation much more closely than the
6503
        Java port in Apache Commons Codec does. As a result, these tests have
6504
        been conformed to the output produced by the PHP implementation,
6505
        particularly in terms of formatting and ordering.
6506
        """
6507
        # base cases
6508
        self.assertEqual(bmpm(''), '')
6509
6510
        for langs in ('', 1, 'spanish', 'english,italian', 3):
6511
            for name_mode in ('gen', 'ash', 'sep'):
6512
                for match_mode in ('approx', 'exact'):
6513
                    for concat in (False, True):
6514
                        if (isinstance(langs, text_type) and
6515
                            ((name_mode == 'ash' and 'italian' in langs) or
6516
                             (name_mode == 'sep' and 'english' in langs))):
6517
                            self.assertRaises(ValueError, bmpm, '', langs,
6518
                                              name_mode, match_mode, concat)
6519
                        else:
6520
                            self.assertEqual(bmpm('', langs, name_mode,
6521
                                                  match_mode, concat), '')
6522
6523
        # testSolrGENERIC
6524
        # concat is true, ruleType is EXACT
6525
        self.assertEqual(bmpm('Angelo', '', 'gen', 'exact', True),
6526
                         'angelo anxelo anhelo anjelo anZelo andZelo')
6527
        self.assertEqual(bmpm('D\'Angelo', '', 'gen', 'exact', True),
6528
                         'angelo anxelo anhelo anjelo anZelo andZelo dangelo' +
6529
                         ' danxelo danhelo danjelo danZelo dandZelo')
6530
        self.assertEqual(bmpm('Angelo', 'italian,greek,spanish', 'gen',
6531
                              'exact', True),
6532
                         'angelo anxelo andZelo')
6533
        self.assertEqual(bmpm('1234', '', 'gen', 'exact', True), '')
6534
6535
        # concat is false, ruleType is EXACT
6536
        self.assertEqual(bmpm('Angelo', '', 'gen', 'exact', False),
6537
                         'angelo anxelo anhelo anjelo anZelo andZelo')
6538
        self.assertEqual(bmpm('D\'Angelo', '', 'gen', 'exact', False),
6539
                         'angelo anxelo anhelo anjelo anZelo andZelo dangelo' +
6540
                         ' danxelo danhelo danjelo danZelo dandZelo')
6541
        self.assertEqual(bmpm('Angelo', 'italian,greek,spanish', 'gen',
6542
                              'exact', False),
6543
                         'angelo anxelo andZelo')
6544
        self.assertEqual(bmpm('1234', '', 'gen', 'exact', False), '')
6545
6546
        # concat is true, ruleType is APPROX
6547
        self.assertEqual(bmpm('Angelo', '', 'gen', 'approx', True),
6548
                         'angilo angYlo agilo ongilo ongYlo ogilo Yngilo' +
6549
                         ' YngYlo anxilo onxilo anilo onilo aniilo oniilo' +
6550
                         ' anzilo onzilo')
6551
        self.assertEqual(bmpm('D\'Angelo', '', 'gen', 'approx', True),
6552
                         'angilo angYlo agilo ongilo ongYlo ogilo Yngilo' +
6553
                         ' YngYlo anxilo onxilo anilo onilo aniilo oniilo' +
6554
                         ' anzilo onzilo dangilo dangYlo dagilo dongilo' +
6555
                         ' dongYlo dogilo dYngilo dYngYlo danxilo donxilo' +
6556
                         ' danilo donilo daniilo doniilo danzilo donzilo')
6557
        self.assertEqual(bmpm('Angelo', 'italian,greek,spanish', 'gen',
6558
                              'approx', True),
6559
                         'angilo ongilo anxilo onxilo anzilo onzilo')
6560
        self.assertEqual(bmpm('1234', '', 'gen', 'approx', True), '')
6561
6562
        # concat is false, ruleType is APPROX
6563
        self.assertEqual(bmpm('Angelo', '', 'gen', 'approx', False),
6564
                         'angilo angYlo agilo ongilo ongYlo ogilo Yngilo' +
6565
                         ' YngYlo anxilo onxilo anilo onilo aniilo oniilo' +
6566
                         ' anzilo onzilo')
6567
        self.assertEqual(bmpm('D\'Angelo', '', 'gen', 'approx', False),
6568
                         'angilo angYlo agilo ongilo ongYlo ogilo Yngilo' +
6569
                         ' YngYlo anxilo onxilo anilo onilo aniilo oniilo' +
6570
                         ' anzilo onzilo dangilo dangYlo dagilo dongilo' +
6571
                         ' dongYlo dogilo dYngilo dYngYlo danxilo donxilo' +
6572
                         ' danilo donilo daniilo doniilo danzilo donzilo')
6573
        self.assertEqual(bmpm('Angelo', 'italian,greek,spanish', 'gen',
6574
                              'approx', False),
6575
                         'angilo ongilo anxilo onxilo anzilo onzilo')
6576
        self.assertEqual(bmpm('1234', '', 'gen', 'approx', False), '')
6577
6578
        # testSolrASHKENAZI
6579
        # concat is true, ruleType is EXACT
6580
        self.assertEqual(bmpm('Angelo', '', 'ash', 'exact', True),
6581
                         'angelo andZelo anhelo anxelo')
6582
        self.assertEqual(bmpm('D\'Angelo', '', 'ash', 'exact', True),
6583
                         'dangelo dandZelo danhelo danxelo')
6584
        self.assertRaises(ValueError, bmpm, 'Angelo', 'italian,greek,spanish',
6585
                          'ash', 'exact', True)
6586
        self.assertEqual(bmpm('Angelo', 'italian,greek,spanish', 'ash',
6587
                              'exact', True, True), 'anxelo angelo')
6588
        self.assertEqual(bmpm('1234', '', 'ash', 'exact', True), '')
6589
6590
        # concat is false, ruleType is EXACT
6591
        self.assertEqual(bmpm('Angelo', '', 'ash', 'exact', False),
6592
                         'angelo andZelo anhelo anxelo')
6593
        self.assertEqual(bmpm('D\'Angelo', '', 'ash', 'exact', False),
6594
                         'dangelo dandZelo danhelo danxelo')
6595
        self.assertRaises(ValueError, bmpm, 'Angelo', 'italian,greek,spanish',
6596
                          'ash', 'exact', False)
6597
        self.assertEqual(bmpm('Angelo', 'italian,greek,spanish', 'ash',
6598
                              'exact', False, True), 'anxelo angelo')
6599
        self.assertEqual(bmpm('1234', '', 'ash', 'exact', False), '')
6600
6601
        # concat is true, ruleType is APPROX
6602
        self.assertEqual(bmpm('Angelo', '', 'ash', 'approx', True),
6603
                         'angilo angYlo ongilo ongYlo Yngilo YngYlo anzilo' +
6604
                         ' onzilo anilo onilo anxilo onxilo')
6605
        self.assertEqual(bmpm('D\'Angelo', '', 'ash', 'approx', True),
6606
                         'dangilo dangYlo dongilo dongYlo dYngilo dYngYlo' +
6607
                         ' danzilo donzilo danilo donilo danxilo donxilo')
6608
        self.assertRaises(ValueError, bmpm, 'Angelo', 'italian,greek,spanish',
6609
                          'ash', 'approx', True)
6610
        self.assertEqual(bmpm('Angelo', 'italian,greek,spanish', 'ash',
6611
                              'approx', True, True),
6612
                         'anxYlo anxilo onxYlo onxilo angYlo angilo ongYlo' +
6613
                         ' ongilo')
6614
        self.assertEqual(bmpm('1234', '', 'ash', 'approx', True), '')
6615
6616
        # concat is false, ruleType is APPROX
6617
        self.assertEqual(bmpm('Angelo', '', 'ash', 'approx', False),
6618
                         'angilo angYlo ongilo ongYlo Yngilo YngYlo anzilo' +
6619
                         ' onzilo anilo onilo anxilo onxilo')
6620
        self.assertEqual(bmpm('D\'Angelo', '', 'ash', 'approx', False),
6621
                         'dangilo dangYlo dongilo dongYlo dYngilo dYngYlo' +
6622
                         ' danzilo donzilo danilo donilo danxilo donxilo')
6623
        self.assertRaises(ValueError, bmpm, 'Angelo', 'italian,greek,spanish',
6624
                          'ash', 'approx', False)
6625
        self.assertEqual(bmpm('Angelo', 'italian,greek,spanish', 'ash',
6626
                              'approx', False, True),
6627
                         'anxYlo anxilo onxYlo onxilo angYlo angilo ongYlo' +
6628
                         ' ongilo')
6629
        self.assertEqual(bmpm('1234', '', 'ash', 'approx', False), '')
6630
6631
        # testSolrSEPHARDIC
6632
        # concat is true, ruleType is EXACT
6633
        self.assertEqual(bmpm('Angelo', '', 'sep', 'exact', True),
6634
                         'anZelo andZelo anxelo')
6635
        self.assertEqual(bmpm('D\'Angelo', '', 'sep', 'exact', True),
6636
                         'anZelo andZelo anxelo')
6637
        self.assertRaises(ValueError, bmpm, 'Angelo', 'italian,greek,spanish',
6638
                          'sep', 'exact', True)
6639
        self.assertEqual(bmpm('Angelo', 'italian,greek,spanish', 'sep',
6640
                              'exact', True, True),
6641
                         'andZelo anxelo')
6642
        self.assertEqual(bmpm('1234', '', 'sep', 'exact', True), '')
6643
6644
        # concat is false, ruleType is EXACT
6645
        self.assertEqual(bmpm('Angelo', '', 'sep', 'exact', False),
6646
                         'anZelo andZelo anxelo')
6647
        self.assertEqual(bmpm('D\'Angelo', '', 'sep', 'exact', False),
6648
                         'anZelo andZelo anxelo')
6649
        self.assertRaises(ValueError, bmpm, 'Angelo', 'italian,greek,spanish',
6650
                          'sep', 'exact', False)
6651
        self.assertEqual(bmpm('Angelo', 'italian,greek,spanish', 'sep',
6652
                              'exact', False, True), 'andZelo anxelo')
6653
        self.assertEqual(bmpm('1234', '', 'sep', 'exact', False), '')
6654
6655
        # concat is true, ruleType is APPROX
6656
        self.assertEqual(bmpm('Angelo', '', 'sep', 'approx', True),
6657
                         'anzila anzilu nzila nzilu anhila anhilu nhila nhilu')
6658
        self.assertEqual(bmpm('D\'Angelo', '', 'sep', 'approx', True),
6659
                         'anzila anzilu nzila nzilu anhila anhilu nhila nhilu')
6660
        self.assertRaises(ValueError, bmpm, 'Angelo', 'italian,greek,spanish',
6661
                          'sep', 'approx', True)
6662
        self.assertEqual(bmpm('Angelo', 'italian,greek,spanish', 'sep',
6663
                              'approx', True, True),
6664
                         'anzila anzilu nzila nzilu anhila anhilu nhila nhilu')
6665
        self.assertEqual(bmpm('1234', '', 'sep', 'approx', True), '')
6666
6667
        # concat is false, ruleType is APPROX
6668
        self.assertEqual(bmpm('Angelo', '', 'sep', 'approx', False),
6669
                         'anzila anzilu nzila nzilu anhila anhilu nhila nhilu')
6670
        self.assertEqual(bmpm('D\'Angelo', '', 'sep', 'approx', False),
6671
                         'anzila anzilu nzila nzilu anhila anhilu nhila nhilu')
6672
        self.assertRaises(ValueError, bmpm, 'Angelo', 'italian,greek,spanish',
6673
                          'sep', 'approx', False)
6674
        self.assertEqual(bmpm('Angelo', 'italian,greek,spanish', 'sep',
6675
                              'approx', False, True),
6676
                         'anzila anzilu nzila nzilu anhila anhilu nhila nhilu')
6677
        self.assertEqual(bmpm('1234', '', 'sep', 'approx', False), '')
6678
6679
        # testCompatibilityWithOriginalVersion
6680
        self.assertEqual(bmpm('abram', '', 'gen', 'approx', False),
6681
                         'abram abrom avram avrom obram obrom ovram ovrom' +
6682
                         ' Ybram Ybrom abran abron obran obron')
6683
        self.assertEqual(bmpm('Bendzin', '', 'gen', 'approx', False),
6684
                         'binzn bindzn vindzn bintsn vintsn')
6685
        self.assertEqual(bmpm('abram', '', 'ash', 'approx', False),
6686
                         'abram abrom avram avrom obram obrom ovram ovrom' +
6687
                         ' Ybram Ybrom ombram ombrom imbram imbrom')
6688
        self.assertEqual(bmpm('Halpern', '', 'ash', 'approx', False),
6689
                         'alpirn alpYrn olpirn olpYrn Ylpirn YlpYrn xalpirn' +
6690
                         ' xolpirn')
6691
6692
        # PhoneticEngineTest
6693
        self.assertEqual(bmpm('Renault', '', 'gen', 'approx', True),
6694
                         'rinolt rino rinDlt rinalt rinult rinD rina rinu')
6695
        self.assertEqual(bmpm('Renault', '', 'ash', 'approx', True),
6696
                         'rinDlt rinalt rinult rYnDlt rYnalt rYnult rinolt')
6697
        self.assertEqual(bmpm('Renault', '', 'sep', 'approx', True),
6698
                         'rinDlt')
6699
        self.assertEqual(bmpm('SntJohn-Smith', '', 'gen', 'exact', True),
6700
                         'sntjonsmit')
6701
        self.assertEqual(bmpm('d\'ortley', '', 'gen', 'exact', True),
6702
                         'ortlaj ortlej dortlaj dortlej')
6703
        self.assertEqual(bmpm('van helsing', '', 'gen', 'exact', False),
6704
                         'helSink helsink helzink xelsink elSink elsink' +
6705
                         ' vanhelsink vanhelzink vanjelsink fanhelsink' +
6706
                         ' fanhelzink banhelsink')
6707
6708
    def test_bmpm_misc(self):
6709
        """Test abydos.phonetic.bmpm (miscellaneous tests).
6710
6711
        The purpose of this test set is to achieve higher code coverage
6712
        and to hit some of the test cases noted in the BMPM reference code.
6713
        """
6714
        # test of Ashkenazi with discardable prefix
6715
        self.assertEqual(bmpm('bar Hayim', name_mode='ash'), 'Dm xDm')
6716
6717
        # tests of concat behavior
6718
        self.assertEqual(bmpm('Rodham Clinton', concat=False),
6719
                         'rodam rodom rYdam rYdom rodan rodon rodxam rodxom' +
6720
                         ' rodxan rodxon rudam rudom klinton klnton klintun' +
6721
                         ' klntun tzlinton tzlnton tzlintun tzlntun zlinton' +
6722
                         ' zlnton')
6723
        self.assertEqual(bmpm('Rodham Clinton', concat=True),
6724
                         'rodamklinton rodomklinton rodamklnton rodomklnton' +
6725
                         ' rodamklintun rodomklintun rodamklntun rodomklntun' +
6726
                         ' rodamtzlinton rodomtzlinton rodamtzlnton' +
6727
                         ' rodomtzlnton rodamtzlintun rodomtzlintun' +
6728
                         ' rodamtzlntun rodomtzlntun rodamzlinton' +
6729
                         ' rodomzlinton rodamzlnton rodomzlnton rodanklinton' +
6730
                         ' rodonklinton rodanklnton rodonklnton' +
6731
                         ' rodxamklinton rodxomklinton rodxamklnton' +
6732
                         ' rodxomklnton rodxanklinton rodxonklinton' +
6733
                         ' rodxanklnton rodxonklnton rudamklinton' +
6734
                         ' rudomklinton rudamklnton rudomklnton rudamklintun' +
6735
                         ' rudomklintun rudamklntun rudomklntun' +
6736
                         ' rudamtzlinton rudomtzlinton rudamtzlnton' +
6737
                         ' rudomtzlnton rudamtzlintun rudomtzlintun' +
6738
                         ' rudamtzlntun rudomtzlntun')
6739
6740
        # tests of name_mode values
6741
        self.assertEqual(bmpm('bar Hayim', name_mode='ash'), 'Dm xDm')
6742
        self.assertEqual(bmpm('bar Hayim', name_mode='ashkenazi'), 'Dm xDm')
6743
        self.assertEqual(bmpm('bar Hayim', name_mode='Ashkenazi'), 'Dm xDm')
6744
        self.assertEqual(bmpm('bar Hayim', name_mode='gen', concat=True),
6745
                         'barDm borDm bYrDm varDm vorDm barDn borDn barxDm' +
6746
                         ' borxDm varxDm vorxDm barxDn borxDn')
6747
        self.assertEqual(bmpm('bar Hayim', name_mode='general', concat=True),
6748
                         'barDm borDm bYrDm varDm vorDm barDn borDn barxDm' +
6749
                         ' borxDm varxDm vorxDm barxDn borxDn')
6750
        self.assertEqual(bmpm('bar Hayim', name_mode='Mizrahi', concat=True),
6751
                         'barDm borDm bYrDm varDm vorDm barDn borDn barxDm' +
6752
                         ' borxDm varxDm vorxDm barxDn borxDn')
6753
        self.assertEqual(bmpm('bar Hayim', name_mode='mizrahi', concat=True),
6754
                         'barDm borDm bYrDm varDm vorDm barDn borDn barxDm' +
6755
                         ' borxDm varxDm vorxDm barxDn borxDn')
6756
        self.assertEqual(bmpm('bar Hayim', name_mode='miz', concat=True),
6757
                         'barDm borDm bYrDm varDm vorDm barDn borDn barxDm' +
6758
                         ' borxDm varxDm vorxDm barxDn borxDn')
6759
6760
        # test that out-of-range language_arg results in L_ANY
6761
        self.assertEqual(bmpm('Rodham Clinton', language_arg=2**32),
6762
                         'rodam rodom rYdam rYdom rodan rodon rodxam rodxom' +
6763
                         ' rodxan rodxon rudam rudom klinton klnton klintun' +
6764
                         ' klntun tzlinton tzlnton tzlintun tzlntun zlinton' +
6765
                         ' zlnton')
6766
        self.assertEqual(bmpm('Rodham Clinton', language_arg=-4),
6767
                         'rodam rodom rYdam rYdom rodan rodon rodxam rodxom' +
6768
                         ' rodxan rodxon rudam rudom klinton klnton klintun' +
6769
                         ' klntun tzlinton tzlnton tzlintun tzlntun zlinton' +
6770
                         ' zlnton')
6771
6772
        # etc. (for code coverage)
6773
        self.assertEqual(bmpm('van Damme', name_mode='sep'), 'dami mi dam m')
6774
6775 View Code Duplication
    def test_bmpm_nachnamen(self):
0 ignored issues
show
Duplication introduced by
This code seems to be duplicated in your project.
Loading history...
6776
        """Test abydos.phonetic.bmpm (Nachnamen set)."""
6777
        if not ALLOW_RANDOM:
6778
            return
6779
        with codecs.open(TESTDIR + '/corpora/nachnamen.bm.csv',
6780
                         encoding='utf-8') as nachnamen_testset:
6781
            next(nachnamen_testset)
6782
            for nn_line in nachnamen_testset:
6783
                nn_line = nn_line.strip().split(',')
6784
                # This test set is very large (~10000 entries)
6785
                # so let's just randomly select about 20 for testing
6786
                if nn_line[0] != '#' and one_in(500):
6787
                    self.assertEqual(bmpm(nn_line[0], language_arg='german'),
6788
                                     nn_line[1])
6789
                    self.assertEqual(bmpm(nn_line[0]), nn_line[2])
6790
6791 View Code Duplication
    def test_bmpm_nachnamen_cc(self):
0 ignored issues
show
Duplication introduced by
This code seems to be duplicated in your project.
Loading history...
6792
        """Test abydos.phonetic.bmpm (Nachnamen set, corner cases)."""
6793
        with codecs.open(TESTDIR + '/corpora/nachnamen.bm.cc.csv',
6794
                         encoding='utf-8') as nachnamen_testset:
6795
            next(nachnamen_testset)
6796
            for nn_line in nachnamen_testset:
6797
                nn_line = nn_line.strip().split(',')
6798
                # This test set is very large (~10000 entries)
6799
                # so let's just randomly select about 20 for testing
6800
                if nn_line[0] != '#':
6801
                    self.assertEqual(bmpm(nn_line[0], language_arg='german'),
6802
                                     nn_line[1])
6803
                    self.assertEqual(bmpm(nn_line[0]), nn_line[2])
6804
6805 View Code Duplication
    def test_bmpm_uscensus2000(self):
0 ignored issues
show
Duplication introduced by
This code seems to be duplicated in your project.
Loading history...
6806
        """Test abydos.phonetic.bmpm (US Census 2000 set)."""
6807
        if not ALLOW_RANDOM:
6808
            return
6809
        with open(TESTDIR + '/corpora/uscensus2000.bm.csv') as uscensus_ts:
6810
            next(uscensus_ts)
6811
            for cen_line in uscensus_ts:
6812
                cen_line = cen_line.strip().split(',')
6813
                # This test set is very large (~150000 entries)
6814
                # so let's just randomly select about 20 for testing
6815
                if cen_line[0] != '#' and one_in(7500):
6816
                    self.assertEqual(bmpm(cen_line[0], match_mode='approx',
6817
                                          name_mode='gen'), cen_line[1])
6818
                    self.assertEqual(bmpm(cen_line[0], match_mode='approx',
6819
                                          name_mode='ash'), cen_line[2])
6820
                    self.assertEqual(bmpm(cen_line[0], match_mode='approx',
6821
                                          name_mode='sep'), cen_line[3])
6822
                    self.assertEqual(bmpm(cen_line[0], match_mode='exact',
6823
                                          name_mode='gen'), cen_line[4])
6824
                    self.assertEqual(bmpm(cen_line[0], match_mode='exact',
6825
                                          name_mode='ash'), cen_line[5])
6826
                    self.assertEqual(bmpm(cen_line[0], match_mode='exact',
6827
                                          name_mode='sep'), cen_line[6])
6828
6829 View Code Duplication
    def test_bmpm_uscensus2000_cc(self):
0 ignored issues
show
Duplication introduced by
This code seems to be duplicated in your project.
Loading history...
6830
        """Test abydos.phonetic.bmpm (US Census 2000 set, corner cases)."""
6831
        with open(TESTDIR + '/corpora/uscensus2000.bm.cc.csv') as uscensus_ts:
6832
            next(uscensus_ts)
6833
            for cen_line in uscensus_ts:
6834
                cen_line = cen_line.strip().split(',')
6835
                # This test set is very large (~150000 entries)
6836
                # so let's just randomly select about 20 for testing
6837
                if cen_line[0] != '#' and one_in(10):
6838
                    self.assertEqual(bmpm(cen_line[0], match_mode='approx',
6839
                                          name_mode='gen'), cen_line[1])
6840
                    self.assertEqual(bmpm(cen_line[0], match_mode='approx',
6841
                                          name_mode='ash'), cen_line[2])
6842
                    self.assertEqual(bmpm(cen_line[0], match_mode='approx',
6843
                                          name_mode='sep'), cen_line[3])
6844
                    self.assertEqual(bmpm(cen_line[0], match_mode='exact',
6845
                                          name_mode='gen'), cen_line[4])
6846
                    self.assertEqual(bmpm(cen_line[0], match_mode='exact',
6847
                                          name_mode='ash'), cen_line[5])
6848
                    self.assertEqual(bmpm(cen_line[0], match_mode='exact',
6849
                                          name_mode='sep'), cen_line[6])
6850
6851
    def test_bm_phonetic_number(self):
6852
        """Test abydos.bm._bm_phonetic_number."""
6853
        self.assertEqual(_bm_phonetic_number(''), '')
6854
        self.assertEqual(_bm_phonetic_number('abcd'), 'abcd')
6855
        self.assertEqual(_bm_phonetic_number('abcd[123]'), 'abcd')
6856
        self.assertEqual(_bm_phonetic_number('abcd[123'), 'abcd')
6857
        self.assertEqual(_bm_phonetic_number('abcd['), 'abcd')
6858
        self.assertEqual(_bm_phonetic_number('abcd[[[123]]]'), 'abcd')
6859
6860
    def test_bm_apply_rule_if_compat(self):
6861
        """Test abydos.bm._bm_apply_rule_if_compat."""
6862
        self.assertEqual(_bm_apply_rule_if_compat('abc', 'def', 4), 'abcdef')
6863
        self.assertEqual(_bm_apply_rule_if_compat('abc', 'def[6]', 4),
6864
                         'abcdef[4]')
6865
        self.assertEqual(_bm_apply_rule_if_compat('abc', 'def[4]', 4),
6866
                         'abcdef[4]')
6867
        self.assertEqual(_bm_apply_rule_if_compat('abc', 'def[0]', 4), None)
6868
        self.assertEqual(_bm_apply_rule_if_compat('abc', 'def[8]', 4), None)
6869
        self.assertEqual(_bm_apply_rule_if_compat('abc', 'def', 1), 'abcdef')
6870
        self.assertEqual(_bm_apply_rule_if_compat('abc', 'def[4]', 1),
6871
                         'abcdef[4]')
6872
6873
    def test_bm_language(self):
6874
        """Test abydos.bm._bm_language.
6875
6876
        Most test cases from:
6877
        http://svn.apache.org/viewvc/commons/proper/codec/trunk/src/test/java/org/apache/commons/codec/language/bm/LanguageGuessingTest.java?view=markup
6878
        """
6879
        self.assertEqual(_bm_language('Renault', 'gen'), L_FRENCH)
6880
        self.assertEqual(_bm_language('Mickiewicz', 'gen'), L_POLISH)
6881
        self.assertEqual(_bm_language('Thompson', 'gen') & L_ENGLISH,
6882
                         L_ENGLISH)
6883
        self.assertEqual(_bm_language('Nuñez', 'gen'), L_SPANISH)
6884
        self.assertEqual(_bm_language('Carvalho', 'gen'), L_PORTUGUESE)
6885
        self.assertEqual(_bm_language('Čapek', 'gen'), L_CZECH | L_LATVIAN)
6886
        self.assertEqual(_bm_language('Sjneijder', 'gen'), L_DUTCH)
6887
        self.assertEqual(_bm_language('Klausewitz', 'gen'), L_GERMAN)
6888
        self.assertEqual(_bm_language('Küçük', 'gen'), L_TURKISH)
6889
        self.assertEqual(_bm_language('Giacometti', 'gen'), L_ITALIAN)
6890
        self.assertEqual(_bm_language('Nagy', 'gen'), L_HUNGARIAN)
6891
        self.assertEqual(_bm_language('Ceauşescu', 'gen'), L_ROMANIAN)
6892
        self.assertEqual(_bm_language('Angelopoulos', 'gen'), L_GREEKLATIN)
6893
        self.assertEqual(_bm_language('Αγγελόπουλος', 'gen'), L_GREEK)
6894
        self.assertEqual(_bm_language('Пушкин', 'gen'), L_CYRILLIC)
6895
        self.assertEqual(_bm_language('כהן', 'gen'), L_HEBREW)
6896
        self.assertEqual(_bm_language('ácz', 'gen'), L_ANY)
6897
        self.assertEqual(_bm_language('átz', 'gen'), L_ANY)
6898
6899
    def test_bm_expand_alternates(self):
6900
        """Test abydos.bm._bm_expand_alternates."""
6901
        self.assertEqual(_bm_expand_alternates(''), '')
6902
        self.assertEqual(_bm_expand_alternates('aa'), 'aa')
6903
        self.assertEqual(_bm_expand_alternates('aa|bb'), 'aa|bb')
6904
        self.assertEqual(_bm_expand_alternates('aa|aa'), 'aa|aa')
6905
6906
        self.assertEqual(_bm_expand_alternates('(aa)(bb)'), 'aabb')
6907
        self.assertEqual(_bm_expand_alternates('(aa)(bb[0])'), '')
6908
        self.assertEqual(_bm_expand_alternates('(aa)(bb[4])'), 'aabb[4]')
6909
        self.assertEqual(_bm_expand_alternates('(aa[0])(bb)'), '')
6910
        self.assertEqual(_bm_expand_alternates('(aa[4])(bb)'), 'aabb[4]')
6911
6912
        self.assertEqual(_bm_expand_alternates('(a|b|c)(a|b|c)'),
6913
                         'aa|ab|ac|ba|bb|bc|ca|cb|cc')
6914
        self.assertEqual(_bm_expand_alternates('(a[1]|b[2])(c|d)'),
6915
                         'ac[1]|ad[1]|bc[2]|bd[2]')
6916
        self.assertEqual(_bm_expand_alternates('(a[1]|b[2])(c[4]|d)'),
6917
                         'ad[1]|bd[2]')
6918
6919
    def test_bm_remove_dupes(self):
6920
        """Test abydos.bm._bm_remove_dupes."""
6921
        self.assertEqual(_bm_remove_dupes(''), '')
6922
        self.assertEqual(_bm_remove_dupes('aa'), 'aa')
6923
        self.assertEqual(_bm_remove_dupes('aa|bb'), 'aa|bb')
6924
        self.assertEqual(_bm_remove_dupes('aa|aa'), 'aa')
6925
        self.assertEqual(_bm_remove_dupes('aa|aa|aa|bb|aa'), 'aa|bb')
6926
        self.assertEqual(_bm_remove_dupes('bb|aa|bb|aa|bb'), 'bb|aa')
6927
6928
    def test_bm_normalize_lang_attrs(self):
6929
        """Test abydos.bm._bm_normalize_language_attributes."""
6930
        self.assertEqual(_bm_normalize_lang_attrs('', False), '')
6931
        self.assertEqual(_bm_normalize_lang_attrs('', True), '')
6932
6933
        self.assertRaises(ValueError, _bm_normalize_lang_attrs, 'a[1', False)
6934
        self.assertRaises(ValueError, _bm_normalize_lang_attrs, 'a[1', True)
6935
6936
        self.assertEqual(_bm_normalize_lang_attrs('abc', False), 'abc')
6937
        self.assertEqual(_bm_normalize_lang_attrs('abc[0]', False), '[0]')
6938
        self.assertEqual(_bm_normalize_lang_attrs('abc[2]', False), 'abc[2]')
6939
        self.assertEqual(_bm_normalize_lang_attrs('abc[2][4]', False), '[0]')
6940
        self.assertEqual(_bm_normalize_lang_attrs('abc[2][6]', False),
6941
                         'abc[2]')
6942
        self.assertEqual(_bm_normalize_lang_attrs('ab[2]c[4]', False), '[0]')
6943
        self.assertEqual(_bm_normalize_lang_attrs('ab[2]c[6]', False),
6944
                         'abc[2]')
6945
6946
        self.assertEqual(_bm_normalize_lang_attrs('abc', True), 'abc')
6947
        self.assertEqual(_bm_normalize_lang_attrs('abc[0]', True), 'abc')
6948
        self.assertEqual(_bm_normalize_lang_attrs('abc[2]', True), 'abc')
6949
        self.assertEqual(_bm_normalize_lang_attrs('abc[2][4]', True), 'abc')
6950
        self.assertEqual(_bm_normalize_lang_attrs('abc[2][6]', True), 'abc')
6951
        self.assertEqual(_bm_normalize_lang_attrs('ab[2]c[4]', True), 'abc')
6952
        self.assertEqual(_bm_normalize_lang_attrs('ab[2]c[6]', True), 'abc')
6953
6954
6955
if __name__ == '__main__':
6956
    unittest.main()
6957