1
|
|
|
import os |
|
|
|
|
2
|
|
|
import stanza |
|
|
|
|
3
|
|
|
import logging |
|
|
|
|
4
|
|
|
|
5
|
|
|
from pathlib import Path |
|
|
|
|
6
|
|
|
|
7
|
|
|
from e2edutch import util |
8
|
|
|
from e2edutch import coref_model as cm |
|
|
|
|
9
|
|
|
from e2edutch.download import download_data |
10
|
|
|
from e2edutch.predict import Predictor |
11
|
|
|
|
12
|
|
|
from stanza.pipeline.processor import Processor, register_processor |
|
|
|
|
13
|
|
|
from stanza.models.common.doc import Document |
|
|
|
|
14
|
|
|
|
15
|
|
|
import tensorflow.compat.v1 as tf |
|
|
|
|
16
|
|
|
|
17
|
|
|
# Package-level logger used by the processor below.
# NOTE(review): setting a level and attaching a StreamHandler at import
# time is unusual for library code — normally the host application
# configures logging and libraries only call getLogger(). Confirm this
# eager configuration is intended.
logger = logging.getLogger('e2edutch')
logger.setLevel(logging.INFO)
logger.addHandler(logging.StreamHandler())
20
|
|
|
|
21
|
|
|
|
22
|
|
|
@register_processor('coref')
class CorefProcessor(Processor):
    """Stanza processor that appends coreference information.

    Wraps the e2edutch ``Predictor``: construction resolves the e2edutch
    configuration, points its data/log paths at the Stanza resources
    directory (next to ``config['model_path']``), downloads the model
    data if missing, and warms the model cache by opening and closing
    one session.
    """
    # Tokenized input is required; this processor contributes 'coref'.
    _requires = set(['tokenize'])
    _provides = set(['coref'])

    def __init__(self, config, pipeline, use_gpu):
        """Initialize the e2edutch configuration and model data.

        Parameters
        ----------
        config : dict
            Stanza processor config; only ``config['model_path']`` is
            read — its parent directory becomes the e2edutch data root.
        pipeline : stanza.Pipeline
            The owning pipeline (unused here, required by the interface).
        use_gpu : bool
            Stanza's GPU preference (currently not forwarded, see below).
        """
        # Make e2edutch follow Stanza's GPU settings:
        # set the environment value for GPU, so that initialize_from_env
        # picks it up.
        # if use_gpu:
        #     os.environ['GPU'] = ' '.join(tf.config.experimental.list_physical_devices('GPU'))
        # else:
        #     if 'GPU' in os.environ['GPU']:
        #         os.environ.pop('GPU')

        self.e2econfig = util.initialize_from_env(model_name='final')

        # Override datapath and log_root:
        # store e2edata with the Stanza resources, i.e. a
        # 'stanza_resources/nl/coref' directory.
        self.e2econfig['datapath'] = Path(config['model_path']).parent
        self.e2econfig['log_root'] = Path(config['model_path']).parent

        # Download data files if not present.
        download_data(self.e2econfig)

        # Start and stop a session once so all models are cached.
        predictor = Predictor(config=self.e2econfig)
        predictor.end_session()

    def _set_up_model(self, *args):
        # All model setup happens in __init__; nothing to do here.
        # (Removed a stray debug print() that wrote to stdout.)
        pass

    def process(self, doc):
        """Run coreference prediction over ``doc`` and return it.

        Parameters
        ----------
        doc : stanza.models.common.doc.Document
            A tokenized document ('tokenize' must have run).

        Returns
        -------
        stanza.models.common.doc.Document
            The same document. NOTE(review): the predicted clusters are
            currently only logged, not attached to the document —
            presumably attaching them is still TODO.
        """
        predictor = Predictor(config=self.e2econfig)
        try:
            # Build the example argument for predict:
            # example (dict): dict with the following fields:
            #   sentences ([[str]])
            #   doc_id (str)
            #   clusters ([[(int, int)]]) (optional)
            example = {}
            # BUG FIX: predict() expects tokenized sentences ([[str]],
            # per the format documented above), not raw sentence text
            # (one str per sentence, as the original code passed).
            example['sentences'] = [
                [word.text for word in sentence.words]
                for sentence in doc.sentences
            ]
            example['doc_id'] = 'document_from_stanza'
            example['doc_key'] = 'undocumented'

            predicted_clusters = predictor.predict(example)
            # Log via the module logger instead of print(); library code
            # should not write directly to stdout.
            logger.info('Predicted coreference clusters: %s',
                        predicted_clusters)
        finally:
            # Always release the TF session, even if prediction raises.
            predictor.end_session()

        return doc
75
|
|
|
|