Build passed
Push — master ( e7a955...cd6747 ), by Simon, created 04:58

gradient_free_optimizers.optimizers.smb_opt.forest_optimizer (rating: A)

Complexity
    Total Complexity: 6

Size/Duplication
    Total Lines: 80
    Duplicated Lines: 45 of 80 (56.25 %)

Importance
    Changes: 0

Metric                          Value
wmc  (weighted method count)    6
eloc (executable lines of code) 55
dl   (duplicated lines)         45
loc  (lines of code)            80
rs                              10
c                               0
b                               0
f                               0

3 Methods

Rating  Name                                      Duplication  Size  Complexity
A       ForestOptimizer.__init__()                23           23    1
A       ForestOptimizer._training()               9            9     2
A       ForestOptimizer._expected_improvement()   6            6     1

1 Function

Rating  Name         Duplication  Size  Complexity
A       normalize()  0            8     2

How to fix: Duplicated Code

Duplicate code is one of the most pungent code smells. A rule that is often used is to restructure code once it is duplicated in three or more places. Common fixes include extracting the shared logic into a helper method or pulling it up into a common base class, as sketched below.
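As a concrete illustration, the duplicated constructor reported for ForestOptimizer.__init__() could be shared with sibling surrogate-model optimizers through a common intermediate class. This is only a hypothetical sketch: _TreeSurrogateOptimizer does not exist in the package, and SMBO and tree_regressor_dict refer to the names in the listing below.

# Hypothetical refactoring sketch (not part of the analyzed code): pull the
# duplicated constructor up into a shared intermediate class so that each
# sibling optimizer only declares what actually differs.
class _TreeSurrogateOptimizer(SMBO):            # hypothetical base class
    regressor_dict = {}                         # overridden by subclasses

    def __init__(self, *args, tree_regressor="extra_tree", tree_para=None,
                 xi=0.03, **kwargs):
        super().__init__(*args, **kwargs)
        self.tree_regressor = tree_regressor
        # avoid a mutable default argument while keeping the same behavior
        self.tree_para = {"n_estimators": 100} if tree_para is None else tree_para
        self.regr = self.regressor_dict[tree_regressor](**self.tree_para)
        self.xi = xi


class ForestOptimizer(_TreeSurrogateOptimizer):
    name = "Forest Optimization"
    _name_ = "forest_optimization"
    regressor_dict = tree_regressor_dict        # reuses the mapping defined below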

# Author: Simon Blanke
# Email: [email protected]
# License: MIT License

import numpy as np
from scipy.stats import norm


from .smbo import SMBO
from .surrogate_models import (
    RandomForestRegressor,
    ExtraTreesRegressor,
    GradientBoostingRegressor,
)
from .acquisition_function import ExpectedImprovement


tree_regressor_dict = {
    "random_forest": RandomForestRegressor,
    "extra_tree": ExtraTreesRegressor,
    "gradient_boost": GradientBoostingRegressor,
}


def normalize(array):
    num = array - array.min()
    den = array.max() - array.min()

    if den == 0:
        return np.random.random_sample(array.shape)
    else:
        return ((num / den) + 0) / 1


[View Code Duplication: this code seems to be duplicated in your project]
class ForestOptimizer(SMBO):
    name = "Forest Optimization"
    _name_ = "forest_optimization"
    """Based on the forest-optimizer in the scikit-optimize package"""

    def __init__(
        self,
        *args,
        tree_regressor="extra_tree",
        tree_para={"n_estimators": 100},
        xi=0.03,
        warm_start_smbo=None,
        max_sample_size=10000000,
        sampling={"random": 1000000},
        warnings=100000000,
        **kwargs
    ):
        super().__init__(*args, **kwargs)
        self.tree_regressor = tree_regressor
        self.tree_para = tree_para
        self.regr = tree_regressor_dict[tree_regressor](**self.tree_para)
        self.xi = xi
        self.warm_start_smbo = warm_start_smbo
        self.max_sample_size = max_sample_size
        self.sampling = sampling
        self.warnings = warnings

        self.init_warm_start_smbo()

    def _expected_improvement(self):
        all_pos_comb = self._all_possible_pos()
        self.pos_comb = self._sampling(all_pos_comb)

        acqu_func = ExpectedImprovement(self.regr, self.pos_comb, self.xi)
        return acqu_func.calculate(self.X_sample, self.Y_sample)

    def _training(self):
        X_sample = np.array(self.X_sample)
        Y_sample = np.array(self.Y_sample)

        if len(Y_sample) == 0:
            return self.move_random()

        Y_sample = normalize(Y_sample).reshape(-1, 1)
        self.regr.fit(X_sample, Y_sample)
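For context, a minimal usage sketch of how this optimizer is typically driven through the package's public interface. It assumes the top-level gradient_free_optimizers API (a search-space dictionary of numpy arrays and an objective function that is maximized) and that the public wrapper forwards the keyword arguments of the constructor shown above.

import numpy as np
from gradient_free_optimizers import ForestOptimizer

# Objective to maximize: an inverted parabola with its optimum at x = 0.
def parabola(para):
    return -(para["x"] ** 2)

search_space = {"x": np.arange(-10, 10, 0.1)}

# tree_regressor and xi mirror the parameters of the constructor analyzed above.
opt = ForestOptimizer(search_space, tree_regressor="extra_tree", xi=0.03)
opt.search(parabola, n_iter=30)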