@@ 6044-6058 (lines=15) @@ | ||
6041 | # etc. (for code coverage) |
|
6042 | self.assertEqual(bmpm('van Damme', name_mode='sep'), 'dami mi dam m') |
|
6043 | ||
def test_bmpm_nachnamen(self):
    """Test abydos.phonetic.bmpm (Nachnamen set).

    Compares bmpm output against the expected values stored in
    corpora/nachnamen.bm.csv: the second field of a row is the expected
    result with language_arg='german', the third field is the expected
    result with default arguments.

    The test does nothing unless ALLOW_RANDOM is truthy, because rows
    are sampled via one_in.
    """
    if not ALLOW_RANDOM:
        return

    corpus_path = TESTDIR + '/corpora/nachnamen.bm.csv'
    with codecs.open(corpus_path, encoding='utf-8') as nachnamen_testset:
        # Discard the first line of the file (presumably a header row).
        next(nachnamen_testset)

        for raw_line in nachnamen_testset:
            fields = raw_line.strip().split(',')
            surname = fields[0]

            # Rows whose first field is exactly '#' are not test data.
            if surname == '#':
                continue

            # This test set is very large (~10000 entries), so only a
            # random sample of about 20 rows is checked on each run.
            if not one_in(500):
                continue

            self.assertEqual(
                bmpm(surname, language_arg='german'), fields[1]
            )
            self.assertEqual(bmpm(surname), fields[2])
|
6059 | ||
6060 | def test_bmpm_nachnamen_cc(self): |
|
6061 | """Test abydos.phonetic.bmpm (Nachnamen set, corner cases).""" |
|
@@ 6060-6072 (lines=13) @@ | ||
6057 | nn_line[1]) |
|
6058 | self.assertEqual(bmpm(nn_line[0]), nn_line[2]) |
|
6059 | ||
def test_bmpm_nachnamen_cc(self):
    """Test abydos.phonetic.bmpm (Nachnamen set, corner cases).

    Compares bmpm output against the expected values stored in
    corpora/nachnamen.bm.cc.csv: the second field of a row is the
    expected result with language_arg='german', the third field is the
    expected result with default arguments.

    Every data row of the file is checked; no random sampling is done.
    """
    corpus_path = TESTDIR + '/corpora/nachnamen.bm.cc.csv'
    with codecs.open(corpus_path, encoding='utf-8') as nachnamen_testset:
        # Discard the first line of the file (presumably a header row).
        next(nachnamen_testset)

        for raw_line in nachnamen_testset:
            fields = raw_line.strip().split(',')
            surname = fields[0]

            # Rows whose first field is exactly '#' are not test data.
            if surname == '#':
                continue

            self.assertEqual(
                bmpm(surname, language_arg='german'), fields[1]
            )
            self.assertEqual(bmpm(surname), fields[2])
|
6073 | ||
6074 | def test_bmpm_uscensus2000(self): |
|
6075 | """Test abydos.phonetic.bmpm (US Census 2000 set).""" |