mandos.analysis.distances._elle() - Code Metrics - Inspection of "build(deps-dev): bump sphinx-copybutton from 0.3.3..." - dmyersturnbull/mandos - Measure and Improve Code Quality continuously with Scrutinizer

Passed

Push — dependabot/pip/sphinx-copybutt... ( c72176 )

unknown

created 2021-07-05 03:05 UTC

mandos.analysis.distances._elle() A

↳ Parent: mandos.analysis.distances

Complexity

Conditions

Size

Total Lines	2
Code Lines	2

Duplication

Lines	0
Ratio	0 %

Importance

Changes

Metric	Value
cc	1
eloc	2
nop	1
dl	0
loc	2
rs	10
c	0
b	0
f	0

"""
Calculations of concordance between annotations.
"""
import abc
import math
from collections import defaultdict
from typing import Collection, Sequence

import numpy as np


from mandos.analysis import AnalysisUtils as Au
from mandos.analysis import SimilarityDf
from mandos.model.hits import AbstractHit

# note that most of these math functions are much faster than their numpy counterparts
# if we're not broadcasting, it's almost always better to use them
# some are more accurate, too
# e.g. we're using fsum rather than sum


class MatrixCalculator(metaclass=abc.ABCMeta):
    """
    Base class for calculators that turn a sequence of hits into a similarity matrix.
    """

    def calc(self, hits: Sequence[AbstractHit]) -> SimilarityDf:
        """
        Calculates a similarity matrix from ``hits``.

        This base implementation does no work; subclasses are expected to override it.

        Args:
            hits: The hits to compare

        Returns:
            The similarity matrix, as a ``SimilarityDf``

        Raises:
            NotImplementedError: Always, unless overridden by a subclass
        """
        # ``NotImplemented`` is a non-callable sentinel meant for binary operators;
        # calling it raises a ``TypeError``, so raise the proper exception type instead
        raise NotImplementedError()



class JPrimeMatrixCalculator(MatrixCalculator):
    """
    Calculates a pairwise similarity matrix between compounds,
    where hits are grouped into compounds by their ``origin_inchikey``.
    """

    def calc(self, hits: Sequence[AbstractHit]) -> SimilarityDf:
        """
        Calculates the similarity between every pair of compounds found in ``hits``.

        Args:
            hits: The hits to compare; grouped by ``origin_inchikey``

        Returns:
            A ``SimilarityDf`` built from a nested dict ``{compound1: {compound2: value}}``
        """
        inchikey_to_hits = Au.hit_multidict(hits, "origin_inchikey")
        data = defaultdict(dict)
        # compare every compound against every compound (including itself);
        # zipping the items with themselves would only fill the diagonal
        for c1, hits1 in inchikey_to_hits.items():
            for c2, hits2 in inchikey_to_hits.items():
                data[c1][c2] = self._j_prime(hits1, hits2)
        return SimilarityDf.from_dict(data)

    def _j_prime(self, hits1: Collection[AbstractHit], hits2: Collection[AbstractHit]) -> float:
        """
        Averages ``_jx`` over the data sources that the two collections of hits share.

        Args:
            hits1: The hits for the first compound
            hits2: The hits for the second compound

        Returns:
            The mean of the per-source values, or NaN if no data source is shared
        """
        sources = {h.data_source for h in hits1}.intersection({h.data_source for h in hits2})
        if not sources:
            return np.nan
        values = [
            self._jx(
                [h for h in hits1 if h.data_source == source],
                # the second argument must be drawn from hits2;
                # otherwise hits1 would only ever be compared with itself
                [h for h in hits2 if h.data_source == source],
            )
            for source in sources
        ]
        return float(math.fsum(values) / len(values))

    def _jx(self, hits1: Collection[AbstractHit], hits2: Collection[AbstractHit]) -> float:
        """
        Averages ``_wedge / _vee`` over the weight pairs from ``Au.weights_of_pairs``.

        Args:
            hits1: The hits for the first compound
            hits2: The hits for the second compound

        Returns:
            The mean of the per-pair ratios
        """
        # NOTE(review): raises ZeroDivisionError if there are no pairs or if ``_vee`` is 0;
        # confirm whether ``Au.weights_of_pairs`` can return an empty mapping
        pair_to_weights = Au.weights_of_pairs(hits1, hits2)
        values = [self._wedge(ca, cb) / self._vee(ca, cb) for ca, cb in pair_to_weights.values()]
        return float(math.fsum(values) / len(values))

    def _wedge(self, ca: float, cb: float) -> float:
        """
        Returns the geometric mean of ``Au.elle(ca)`` and ``Au.elle(cb)``.
        """
        return math.sqrt(Au.elle(ca) * Au.elle(cb))

    def _vee(self, ca: float, cb: float) -> float:
        """
        Returns ``Au.elle(ca) + Au.elle(cb)`` minus their geometric mean.
        """
        return Au.elle(ca) + Au.elle(cb) - math.sqrt(Au.elle(ca) * Au.elle(cb))


# public names exported by a wildcard import of this module
__all__ = ["MatrixCalculator", "JPrimeMatrixCalculator"]


1			"""
2			Calculations of concordance between annotations.
3			"""
4			import abc
5			import math
6			from collections import defaultdict
7			from typing import Collection, Sequence
8
9			import numpy as np
			0 ignored issues – show introduced 2021-06-30 04:51 UTC by Report Bug Copy Issue Report Unable to import 'numpy' Loading history...
10
11			from mandos.analysis import AnalysisUtils as Au
12			from mandos.analysis import SimilarityDf
13			from mandos.model.hits import AbstractHit
14
15			# note that most of these math functions are much faster than their numpy counterparts
16			# if we're not broadcasting, it's almost always better to use them
17			# some are more accurate, too
18			# e.g. we're using fsum rather than sum
19
20
21			class MatrixCalculator(metaclass=abc.ABCMeta):
			0 ignored issues – show introduced 2021-06-30 04:51 UTC by Report Bug Copy Issue Report Missing class docstring Loading history...
22			def calc(self, hits: Sequence[AbstractHit]) -> SimilarityDf:
			0 ignored issues – show Coding Style introduced 2021-06-30 04:51 UTC by Report Bug Copy Issue Report This method could be written as a function/class method. If a method does not access any attributes of the class, it could also be implemented as a function or static method. This can help improve readability. For example class Foo: def some_method(self, x, y): return x + y; could be written as class Foo: @classmethod def some_method(cls, x, y): return x + y; Loading history... introduced 2021-06-30 04:51 UTC by Report Bug Copy Issue Report Missing function or method docstring Loading history...
23			raise NotImplemented()
			0 ignored issues – show Bug introduced 2021-06-30 04:51 UTC by Report Bug Copy Issue Report `NotImplemented` does not seem to be callable. Loading history... Best Practice introduced 2021-06-30 04:51 UTC by Report Bug Copy Issue Report NotImplemented raised - should raise NotImplementedError Loading history...
24
25
26			class JPrimeMatrixCalculator(MatrixCalculator):
			0 ignored issues – show introduced 2021-06-30 04:51 UTC by Report Bug Copy Issue Report Missing class docstring Loading history...
27			def calc(self, hits: Sequence[AbstractHit]) -> SimilarityDf:
28			inchikey_to_hits = Au.hit_multidict(hits, "origin_inchikey")
29			data = defaultdict(dict)
30			for (c1, hits1), (c2, hits2) in zip(inchikey_to_hits.items(), inchikey_to_hits.items()):
			0 ignored issues – show Coding Style Naming introduced 2021-06-30 04:51 UTC by Report Bug Copy Issue Report Variable name "c1" doesn't conform to snake_case naming style ('([^\\W\\dA-Z][^\\WA-Z]2,\|_[^\\WA-Z]\|__[^\\WA-Z\\d_][^\\WA-Z]+__)$' pattern) This check looks for invalid names for a range of different identifiers. You can set regular expressions to which the identifiers must conform if the defaults do not match your requirements. If your project includes a Pylint configuration file, the settings contained in that file take precedence. To find out more about Pylint, please refer to their site. Loading history... Coding Style Naming introduced 2021-06-30 04:51 UTC by Report Bug Copy Issue Report Variable name "c2" doesn't conform to snake_case naming style ('([^\\W\\dA-Z][^\\WA-Z]2,\|_[^\\WA-Z]\|__[^\\WA-Z\\d_][^\\WA-Z]+__)$' pattern) This check looks for invalid names for a range of different identifiers. You can set regular expressions to which the identifiers must conform if the defaults do not match your requirements. If your project includes a Pylint configuration file, the settings contained in that file take precedence. To find out more about Pylint, please refer to their site. Loading history...
31			data[c1][c2] = self._j_prime(hits1, hits2)
32			return SimilarityDf.from_dict(data)
33
34			def _j_prime(self, hits1: Collection[AbstractHit], hits2: Collection[AbstractHit]) -> float:
35			sources = {h.data_source for h in hits1}.intersection({h.data_source for h in hits2})
36			if len(sources) == 0:
37			return np.nan
38			values = [
39			self._jx(
40			[h for h in hits1 if h.data_source == source],
41			[h for h in hits1 if h.data_source == source],
42			)
43			for source in sources
44			]
45			return float(math.fsum(values) / len(values))
46
47			def _jx(self, hits1: Collection[AbstractHit], hits2: Collection[AbstractHit]) -> float:
48			pair_to_weights = Au.weights_of_pairs(hits1, hits2)
49			values = [self._wedge(ca, cb) / self._vee(ca, cb) for ca, cb in pair_to_weights.values()]
50			return float(math.fsum(values) / len(values))
51
52			def _wedge(self, ca: float, cb: float) -> float:
			0 ignored issues – show Coding Style Naming introduced 2021-06-30 04:51 UTC by Report Bug Copy Issue Report Argument name "ca" doesn't conform to snake_case naming style ('([^\\W\\dA-Z][^\\WA-Z]2,\|_[^\\WA-Z]\|__[^\\WA-Z\\d_][^\\WA-Z]+__)$' pattern) This check looks for invalid names for a range of different identifiers. You can set regular expressions to which the identifiers must conform if the defaults do not match your requirements. If your project includes a Pylint configuration file, the settings contained in that file take precedence. To find out more about Pylint, please refer to their site. Loading history... Coding Style Naming introduced 2021-06-30 04:51 UTC by Report Bug Copy Issue Report Argument name "cb" doesn't conform to snake_case naming style ('([^\\W\\dA-Z][^\\WA-Z]2,\|_[^\\WA-Z]\|__[^\\WA-Z\\d_][^\\WA-Z]+__)$' pattern) This check looks for invalid names for a range of different identifiers. You can set regular expressions to which the identifiers must conform if the defaults do not match your requirements. If your project includes a Pylint configuration file, the settings contained in that file take precedence. To find out more about Pylint, please refer to their site. Loading history... Coding Style introduced 2021-06-30 04:51 UTC by Report Bug Copy Issue Report This method could be written as a function/class method. If a method does not access any attributes of the class, it could also be implemented as a function or static method. This can help improve readability. For example class Foo: def some_method(self, x, y): return x + y; could be written as class Foo: @classmethod def some_method(cls, x, y): return x + y; Loading history...
53			return math.sqrt(Au.elle(ca) * Au.elle(cb))
54
55			def _vee(self, ca: float, cb: float) -> float:
			0 ignored issues – show Coding Style Naming introduced 2021-06-30 04:51 UTC by Report Bug Copy Issue Report Argument name "ca" doesn't conform to snake_case naming style ('([^\\W\\dA-Z][^\\WA-Z]2,\|_[^\\WA-Z]\|__[^\\WA-Z\\d_][^\\WA-Z]+__)$' pattern) This check looks for invalid names for a range of different identifiers. You can set regular expressions to which the identifiers must conform if the defaults do not match your requirements. If your project includes a Pylint configuration file, the settings contained in that file take precedence. To find out more about Pylint, please refer to their site. Loading history... Coding Style Naming introduced 2021-06-30 04:51 UTC by Report Bug Copy Issue Report Argument name "cb" doesn't conform to snake_case naming style ('([^\\W\\dA-Z][^\\WA-Z]2,\|_[^\\WA-Z]\|__[^\\WA-Z\\d_][^\\WA-Z]+__)$' pattern) This check looks for invalid names for a range of different identifiers. You can set regular expressions to which the identifiers must conform if the defaults do not match your requirements. If your project includes a Pylint configuration file, the settings contained in that file take precedence. To find out more about Pylint, please refer to their site. Loading history... Coding Style introduced 2021-06-30 04:51 UTC by Report Bug Copy Issue Report This method could be written as a function/class method. If a method does not access any attributes of the class, it could also be implemented as a function or static method. This can help improve readability. For example class Foo: def some_method(self, x, y): return x + y; could be written as class Foo: @classmethod def some_method(cls, x, y): return x + y; Loading history...
56			return Au.elle(ca) + Au.elle(cb) - math.sqrt(Au.elle(ca) * Au.elle(cb))
57
58
59			__all__ = ["MatrixCalculator", "JPrimeMatrixCalculator"]
60

dmyersturnbull / mandos

Push — dependabot/pip/sphinx-copybutt... ( c72176 )

mandos.analysis.distances._elle() A

Complexity

Size

Duplication

Importance

Duplication Side-by-Side

Filter issues like