abydos.phonetic._parmar_kumbharana.parmar_kumbharana() - Code Metrics - Inspection of "78a222a9f7d8976f6744d263e3d6d01a2a991c27" - chrislit/abydos - Measure and Improve Code Quality continuously with Scrutinizer

Completed

Branch — master (78a222)

by Chris

created 2018-10-26 11:30 UTC

parmar_kumbharana() B

↳ Parent: abydos.phonetic._parmar_kumbharana

Complexity

Conditions

Size

Total Lines	57
Code Lines	31

Duplication

Lines	0
Ratio	0 %

Code Coverage

Tests	16
CRAP Score	5

Importance

Changes

Metric	Value
eloc	31
dl	0
loc	57
ccs	16
cts	16
cp	1
rs	8.6693
c	0
b	0
f	0
cc	5
nop	1
crap	5

How to fix Long Method

# -*- coding: utf-8 -*-

# Copyright 2018 by Christopher C. Little.
# This file is part of Abydos.
#
# Abydos is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# Abydos is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with Abydos. If not, see <http://www.gnu.org/licenses/>.

"""abydos.phonetic._parmar_kumbharana.

The phonetic._parmar_kumbharana module implements the Parmar-Kumbharana
phonetic algorithm.
"""

from __future__ import unicode_literals

from six.moves import range

from ._util import _delete_consecutive_repeats

__all__ = ['parmar_kumbharana']


def parmar_kumbharana(word):
    """Encode a word with the Parmar-Kumbharana phonetic algorithm.

    The implementation follows the algorithm proposed in
    :cite:`Parmar:2014`. The word is uppercased, runs of repeated
    characters are collapsed, multi-letter patterns are replaced (longest
    pattern first at each position), and finally every vowel (including
    ``Y``) after the first character is dropped.

    :param str word: the word to transform
    :returns: the Parmar-Kumbharana encoding
    :rtype: str

    >>> parmar_kumbharana('Gough')
    'GF'
    >>> parmar_kumbharana('pneuma')
    'NM'
    >>> parmar_kumbharana('knight')
    'NT'
    >>> parmar_kumbharana('trice')
    'TRS'
    >>> parmar_kumbharana('judge')
    'JJ'
    """
    # Substitution patterns, grouped by pattern length so that the longest
    # candidate can be tried first at every position.
    substitutions = {
        4: {'OUGH': 'F'},
        3: {'DGE': 'J', 'OUL': 'U', 'GHT': 'T'},
        2: {
            'CE': 'S',
            'CI': 'S',
            'CY': 'S',
            'GE': 'J',
            'GI': 'J',
            'GY': 'J',
            'WR': 'R',
            'GN': 'N',
            'KN': 'N',
            'PN': 'N',
            'CK': 'K',
            'SH': 'S',
        },
    }
    # Translation table deleting A, E, I, O, U and Y.
    drop_vowels = {ord(letter): '' for letter in 'AEIOUY'}

    # Rule 3 (uppercase) followed by Rule 4 (collapse consecutive repeats)
    source = _delete_consecutive_repeats(word.upper())

    # Rule 5: scan left to right. Text already emitted is never rescanned,
    # so collecting output pieces is equivalent to splicing the word in
    # place and skipping past each replacement.
    pieces = []
    pos = 0
    end = len(source)
    while pos < end:
        for width in (4, 3, 2):
            replacement = substitutions[width].get(source[pos : pos + width])
            if replacement is not None:
                pieces.append(replacement)
                pos += width
                break
        else:
            # No pattern starts here; keep the character unchanged.
            pieces.append(source[pos])
            pos += 1
    encoded = ''.join(pieces)

    # Rule 6: the leading character is always kept; vowels after it go.
    head, tail = encoded[:1], encoded[1:]
    return head + tail.translate(drop_vowels)


if __name__ == '__main__':
    # Executed as a script: run the doctest examples embedded in this module.
    from doctest import testmod

    testmod()


1		# -*- coding: utf-8 -*-
2
3		# Copyright 2018 by Christopher C. Little.
4		# This file is part of Abydos.
5		#
6		# Abydos is free software: you can redistribute it and/or modify
7		# it under the terms of the GNU General Public License as published by
8		# the Free Software Foundation, either version 3 of the License, or
9		# (at your option) any later version.
10		#
11		# Abydos is distributed in the hope that it will be useful,
12		# but WITHOUT ANY WARRANTY; without even the implied warranty of
13		# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14		# GNU General Public License for more details.
15		#
16		# You should have received a copy of the GNU General Public License
17		# along with Abydos. If not, see <http://www.gnu.org/licenses/>.
18
19	1	"""abydos.phonetic._parmar_kumbharana.
20
21		The phonetic._parmar_kumbharana module implements the Parmar-Kumbharana
22		phonetic algorithm.
23		"""
24
25	1	from __future__ import unicode_literals
26
27	1	from six.moves import range
28
29	1	from ._util import _delete_consecutive_repeats
30
31	1	__all__ = ['parmar_kumbharana']
32
33
34	1	def parmar_kumbharana(word):
35		    """Return the Parmar-Kumbharana encoding of a word.
36
37		    This is based on the phonetic algorithm proposed in :cite:`Parmar:2014`.
38
39		    :param str word: the word to transform
40		    :returns: the Parmar-Kumbharana encoding
41		    :rtype: str
42
43		    >>> parmar_kumbharana('Gough')
44		    'GF'
45		    >>> parmar_kumbharana('pneuma')
46		    'NM'
47		    >>> parmar_kumbharana('knight')
48		    'NT'
49		    >>> parmar_kumbharana('trice')
50		    'TRS'
51		    >>> parmar_kumbharana('judge')
52		    'JJ'
53		    """
54	1	    rule_table = {
55		        4: {'OUGH': 'F'},
56		        3: {'DGE': 'J', 'OUL': 'U', 'GHT': 'T'},
57		        2: {
58		            'CE': 'S',
59		            'CI': 'S',
60		            'CY': 'S',
61		            'GE': 'J',
62		            'GI': 'J',
63		            'GY': 'J',
64		            'WR': 'R',
65		            'GN': 'N',
66		            'KN': 'N',
67		            'PN': 'N',
68		            'CK': 'K',
69		            'SH': 'S',
70		        },
71		    }
72	1	    vowel_trans = {65: '', 69: '', 73: '', 79: '', 85: '', 89: ''}
73
74	1	    word = word.upper()  # Rule 3
75	1	    word = _delete_consecutive_repeats(word)  # Rule 4
76
77		    # Rule 5
78	1	    i = 0
79	1	    while i < len(word):
80	1	        for match_len in range(4, 1, -1):
81	1	            if word[i : i + match_len] in rule_table[match_len]:
82	1	                repl = rule_table[match_len][word[i : i + match_len]]
83	1	                word = word[:i] + repl + word[i + match_len :]
84	1	                i += len(repl)
85	1	                break
86		        else:
87	1	            i += 1
88
89	1	    word = word[:1] + word[1:].translate(vowel_trans)  # Rule 6
90	1	    return word
91
92
93		if __name__ == '__main__':
94		    import doctest
95
96		    doctest.testmod()
97

chrislit / abydos

Branch — master (78a222)

parmar_kumbharana() B

Complexity

Size

Duplication

Code Coverage

Importance

How to fix Long Method

Long Method

Duplication Side-by-Side

Filter issues like