abydos.phonetic._phonem - Code Metrics - Inspection of "0.3.6" - chrislit/abydos - Measure and Improve Code Quality continuously with Scrutinizer

Completed

Pull Request — master (#141)

by Chris

created 2018-11-17 01:00 UTC

abydos.phonetic._phonem A

↳ Parent: Project

Complexity

Total Complexity

Size/Duplication

Total Lines	154
Duplicated Lines	0 %

Test Coverage

Coverage

100%

Importance

Changes

Metric	Value
eloc	49
dl	0
loc	154
ccs	18
cts	18
cp	1
rs	10
c	0
b	0
f	0
wmc	3

1 Method

Rating	Name	Duplication	Size	Complexity
A	Phonem.encode()	0	35	2

1 Function

Rating	Name	Duplication	Size	Complexity
A	phonem()	0	28	1

# -*- coding: utf-8 -*-

# Copyright 2014-2018 by Christopher C. Little.
# This file is part of Abydos.
#
# Abydos is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# Abydos is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with Abydos. If not, see <http://www.gnu.org/licenses/>.

"""abydos.phonetic._phonem.

Phonem
"""

from __future__ import (
    absolute_import,
    division,
    print_function,
    unicode_literals,
)

from unicodedata import normalize as unicode_normalize

from six import text_type

from ._phonetic import Phonetic

# Names exported by ``from ... import *``: the encoder class and its
# function-style wrapper.
__all__ = ['Phonem', 'phonem']


class Phonem(Phonetic):
    """Phonem phonetic encoder.

    The algorithm is defined in :cite:`Wilde:1988`. This implementation
    follows the Perl version documented at :cite:`Wilz:2005` and adds some
    enhancements presented in the Java port at :cite:`dcm4che:2011`.

    Phonem is intended chiefly for German names/words.
    """

    # Multi-character rewrites, applied one after another, in this order, to
    # the upper-cased word. '§' is a temporary marker that the translation
    # table below turns into 'U'.
    _substitutions = (
        ('SC', 'C'),
        ('SZ', 'C'),
        ('CZ', 'C'),
        ('TZ', 'C'),
        ('TS', 'C'),
        ('KS', 'X'),
        ('PF', 'V'),
        ('QU', 'KW'),
        ('PH', 'V'),
        ('UE', 'Y'),
        ('AE', 'E'),
        ('OE', 'Ö'),
        ('EI', 'AY'),
        ('EY', 'AY'),
        ('EU', 'OY'),
        ('AU', 'A§'),
        ('OU', '§'),
    )

    # Single-character translation table (code point -> replacement
    # character), applied after the substitutions above. The two strings are
    # paired position by position.
    _trans = {
        ord(source): target
        for source, target in zip(
            'ZKGQÇÑßFWPTÁÀÂÃÅÄÆÉÈÊËIJÌÍÎÏÜÝ§ÚÙÛÔÒÓÕØ',
            'CCCCCNSVVBDAAAAAEEEEEEYYYYYYYYUUUUOOOOÖ',
        )
    }

    # Only these characters may appear in the final code; every other
    # character is dropped.
    _uc_set = set('ABCDLMNORSUVWXYÖ')

    def encode(self, word):
        """Return the Phonem code for a word.

        Parameters
        ----------
        word : str
            The word to transform

        Returns
        -------
        str
            The Phonem value

        Examples
        --------
        >>> pe = Phonem()
        >>> pe.encode('Christopher')
        'CRYSDOVR'
        >>> pe.encode('Niall')
        'NYAL'
        >>> pe.encode('Smith')
        'SMYD'
        >>> pe.encode('Schmidt')
        'CMYD'

        """
        # Upper-case first, then compose to NFC so accented letters are
        # single code points that the translation table can match.
        uppercased = text_type(word.upper())
        code = unicode_normalize('NFC', uppercased)

        # Digraph rewrites come before the per-character translation.
        for pattern, replacement in self._substitutions:
            code = code.replace(pattern, replacement)
        code = code.translate(self._trans)

        # _delete_consecutive_repeats is not defined in this class
        # (presumably inherited from Phonetic -- confirm); judging by its
        # name it collapses runs of a repeated character.
        collapsed = self._delete_consecutive_repeats(code)
        allowed = self._uc_set
        return ''.join([char for char in collapsed if char in allowed])


def phonem(word):
    """Return the Phonem code for a word.

    Convenience wrapper that creates a :py:class:`Phonem` instance and
    delegates to :py:meth:`Phonem.encode`.

    Parameters
    ----------
    word : str
        The word to transform

    Returns
    -------
    str
        The Phonem value

    Examples
    --------
    >>> phonem('Christopher')
    'CRYSDOVR'
    >>> phonem('Niall')
    'NYAL'
    >>> phonem('Smith')
    'SMYD'
    >>> phonem('Schmidt')
    'CMYD'

    """
    encoder = Phonem()
    return encoder.encode(word)


if __name__ == '__main__':
    # When executed as a script, run the doctest examples embedded in this
    # module's docstrings.
    from doctest import testmod

    testmod()


1		# -*- coding: utf-8 -*-
2
3		# Copyright 2014-2018 by Christopher C. Little.
4		# This file is part of Abydos.
5		#
6		# Abydos is free software: you can redistribute it and/or modify
7		# it under the terms of the GNU General Public License as published by
8		# the Free Software Foundation, either version 3 of the License, or
9		# (at your option) any later version.
10		#
11		# Abydos is distributed in the hope that it will be useful,
12		# but WITHOUT ANY WARRANTY; without even the implied warranty of
13		# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14		# GNU General Public License for more details.
15		#
16		# You should have received a copy of the GNU General Public License
17		# along with Abydos. If not, see <http://www.gnu.org/licenses/>.
18
19	1	"""abydos.phonetic._phonem.
20
21		Phonem
22		"""
23
24	1	from __future__ import (
25		absolute_import,
26		division,
27		print_function,
28		unicode_literals,
29		)
30
31	1	from unicodedata import normalize as unicode_normalize
32
33	1	from six import text_type
34
35	1	from ._phonetic import Phonetic
36
37	1	__all__ = ['Phonem', 'phonem']
38
39
40	1	class Phonem(Phonetic):
		0 ignored issues – show Unused Code introduced 2018-11-10 01:42 UTC by Report Bug Copy Issue Report The variable `__class__` seems to be unused. Loading history...
41		"""Phonem.
42
43		Phonem is defined in :cite:`Wilde:1988`.
44
45		This version is based on the Perl implementation documented at
46		:cite:`Wilz:2005`.
47		It includes some enhancements presented in the Java port at
48		:cite:`dcm4che:2011`.
49
50		Phonem is intended chiefly for German names/words.
51		"""
52
53	1	_substitutions = (
54		('SC', 'C'),
55		('SZ', 'C'),
56		('CZ', 'C'),
57		('TZ', 'C'),
58		('TS', 'C'),
59		('KS', 'X'),
60		('PF', 'V'),
61		('QU', 'KW'),
62		('PH', 'V'),
63		('UE', 'Y'),
64		('AE', 'E'),
65		('OE', 'Ö'),
66		('EI', 'AY'),
67		('EY', 'AY'),
68		('EU', 'OY'),
69		('AU', 'A§'),
70		('OU', '§'),
71		)
72
73	1	_trans = dict(
74		zip(
75		(ord(_) for _ in 'ZKGQÇÑßFWPTÁÀÂÃÅÄÆÉÈÊËIJÌÍÎÏÜÝ§ÚÙÛÔÒÓÕØ'),
		0 ignored issues – show Comprehensibility Best Practice introduced 2018-10-24 06:00 UTC by Report Bug Copy Issue Report The variable `_` does not seem to be defined. Loading history...
76		'CCCCCNSVVBDAAAAAEEEEEEYYYYYYYYUUUUOOOOÖ',
77		)
78		)
79
80	1	_uc_set = set('ABCDLMNORSUVWXYÖ')
81
82	1	def encode(self, word):
83		"""Return the Phonem code for a word.
84
85		Parameters
86		----------
87		word : str
88		The word to transform
89
90		Returns
91		-------
92		str
93		The Phonem value
94
95		Examples
96		--------
97		>>> pe = Phonem()
98		>>> pe.encode('Christopher')
99		'CRYSDOVR'
100		>>> pe.encode('Niall')
101		'NYAL'
102		>>> pe.encode('Smith')
103		'SMYD'
104		>>> pe.encode('Schmidt')
105		'CMYD'
106
107		"""
108	1	word = unicode_normalize('NFC', text_type(word.upper()))
109	1	for i, j in self._substitutions:
110	1	word = word.replace(i, j)
111	1	word = word.translate(self._trans)
112
113	1	return ''.join(
114		c
115		for c in self._delete_consecutive_repeats(word)
116		if c in self._uc_set
117		)
118
119
120	1	def phonem(word):
121		"""Return the Phonem code for a word.
122
123		This is a wrapper for :py:meth:`Phonem.encode`.
124
125		Parameters
126		----------
127		word : str
128		The word to transform
129
130		Returns
131		-------
132		str
133		The Phonem value
134
135		Examples
136		--------
137		>>> phonem('Christopher')
138		'CRYSDOVR'
139		>>> phonem('Niall')
140		'NYAL'
141		>>> phonem('Smith')
142		'SMYD'
143		>>> phonem('Schmidt')
144		'CMYD'
145
146		"""
147	1	return Phonem().encode(word)
148
149
150		if __name__ == '__main__':
151		import doctest
152
153		doctest.testmod()
154

chrislit / abydos

Pull Request — master (#141)

abydos.phonetic._phonem A

Complexity

Size/Duplication

Test Coverage

Importance

1 Method

1 Function

Duplication Side-by-Side

Filter issues like