|
@@ 6758-6772 (lines=15) @@
|
| 6755 |
|
# etc. (for code coverage) |
| 6756 |
|
self.assertEqual(bmpm('van Damme', name_mode='sep'), 'dami mi dam m') |
| 6757 |
|
|
| 6758 |
|
def test_bmpm_nachnamen(self):
    """Test abydos.phonetic.bmpm (Nachnamen set).

    Spot-checks bmpm against the expected encodings stored in
    corpora/nachnamen.bm.csv. The test body only runs when ALLOW_RANDOM
    is truthy; otherwise the method returns without asserting anything.

    Each row is split on commas and used as follows:
      * field 0 -- the name passed to bmpm
      * field 1 -- expected result of bmpm(name, language_arg='german')
      * field 2 -- expected result of bmpm(name) with default arguments
    """
    if ALLOW_RANDOM:
        corpus_path = TESTDIR + '/corpora/nachnamen.bm.csv'
        with codecs.open(corpus_path, encoding='utf-8') as corpus:
            # Discard the first line of the file (presumably a header row).
            next(corpus)
            for record in corpus:
                fields = record.strip().split(',')
                # Rows whose first field is exactly '#' are not test data.
                if fields[0] == '#':
                    continue
                # The corpus is very large (~10000 entries), so only about
                # one row in 500 (roughly 20 rows overall) is exercised.
                if not _one_in(500):
                    continue
                surname = fields[0]
                self.assertEqual(bmpm(surname, language_arg='german'),
                                 fields[1])
                self.assertEqual(bmpm(surname), fields[2])
| 6773 |
|
|
| 6774 |
|
def test_bmpm_nachnamen_cc(self): |
| 6775 |
|
"""Test abydos.phonetic.bmpm (Nachnamen set, corner cases).""" |
|
@@ 6774-6786 (lines=13) @@
|
| 6771 |
|
nn_line[1]) |
| 6772 |
|
self.assertEqual(bmpm(nn_line[0]), nn_line[2]) |
| 6773 |
|
|
| 6774 |
|
def test_bmpm_nachnamen_cc(self):
    """Test abydos.phonetic.bmpm (Nachnamen set, corner cases).

    Checks bmpm against the expected encodings stored in
    corpora/nachnamen.bm.cc.csv. Unlike a randomly sampled test, every
    data row of this file is checked on every run.

    Each row is split on commas and used as follows:
      * field 0 -- the name passed to bmpm
      * field 1 -- expected result of bmpm(name, language_arg='german')
      * field 2 -- expected result of bmpm(name) with default arguments
    """
    corpus_path = TESTDIR + '/corpora/nachnamen.bm.cc.csv'
    with codecs.open(corpus_path, encoding='utf-8') as corpus:
        # Discard the first line of the file (presumably a header row).
        next(corpus)
        for record in corpus:
            fields = record.strip().split(',')
            # Rows whose first field is exactly '#' are not test data.
            if fields[0] == '#':
                continue
            surname = fields[0]
            self.assertEqual(bmpm(surname, language_arg='german'),
                             fields[1])
            self.assertEqual(bmpm(surname), fields[2])
| 6787 |
|
|
| 6788 |
|
def test_bmpm_uscensus2000(self): |
| 6789 |
|
"""Test abydos.phonetic.bmpm (US Census 2000 set).""" |