| Total Complexity | 5 |
| Total Lines | 54 |
| Duplicated Lines | 0 % |
| Changes | 0 | ||
| 1 | #!/usr/bin/env python |
||
| 2 | |||
| 3 | import argparse |
||
| 4 | from topic_modeling_toolkit.reporting import ModelReporter |
||
| 5 | from topic_modeling_toolkit.reporting.reporter import InvalidMetricException |
||
| 6 | |||
| 7 | |||
def get_cli_arguments():
    """Build the CLI parser and return the parsed command-line arguments.

    Expects one positional argument (the collection/dataset name) and an
    optional ``--sort``/``-s`` metric defaulting to ``'perplexity'``.
    """
    arg_parser = argparse.ArgumentParser(
        prog='report_models.py',
        description='Reports on the trained models for the specified collection (dataset)',
        formatter_class=argparse.ArgumentDefaultsHelpFormatter,
    )
    arg_parser.add_argument(
        'dataset',
        metavar='collection_name',
        help='the collection to report models trained on',
    )
    # parser.add_argument('--details', '-d', default=False, action='store_true', help='Switch to show details about the models')
    arg_parser.add_argument(
        '--sort', '-s',
        default='perplexity',
        help='Whether to sort the found experiments by checking the desired metric against the corresponding models',
    )
    return arg_parser.parse_args()
||
| 14 | |||
| 15 | |||
def main():
    """Report on the models trained on the requested collection.

    Reads the collection name and sort metric from the command line, locates
    the collections root via the COLLECTIONS_DIR environment variable, and
    prints a formatted report. If the requested sort metric is invalid, keeps
    prompting the user for another metric until one is accepted.

    Raises:
        RuntimeError: if the COLLECTIONS_DIR environment variable is unset/empty.
    """
    # Columns rendered for every discovered model/experiment.
    COLUMNS = [
        'nb-topics',
        'collection-passes',
        'document-passes',
        # 'total-phi-updates',
        'perplexity',
        'kernel-size',
        'kernel-coherence',
        'kernel-contrast',
        'kernel-purity',
        'top-tokens-coherence',
        'sparsity-phi',
        'sparsity-theta',
        'background-tokens-ratio',
        'regularizers'
    ]

    cli_args = get_cli_arguments()
    sort_metric = cli_args.sort

    collections_dir = os.getenv('COLLECTIONS_DIR')
    if not collections_dir:
        raise RuntimeError(
            "Please set the COLLECTIONS_DIR environment variable with the path to a directory containing collections/datasets")
    model_reporter = ModelReporter(collections_dir)
    while True:
        try:
            s = model_reporter.get_formatted_string(cli_args.dataset, columns=COLUMNS, metric=sort_metric, verbose=True)
            print('\n{}'.format(s))
            break
        except InvalidMetricException as e:
            print(e)
            # Blank input falls back to 'perplexity', as the prompt promises.
            sort_metric = input("Please input another metric to sort (blank for 'perplexity'): ") or 'perplexity'
||
| 50 | |||
| 51 | |||
# Only run the report when executed as a script, not when imported.
if __name__ == '__main__':
    main()
||
| 54 |