| Total Complexity | 2 |
| Total Lines | 30 |
| Duplicated Lines | 0 % |
| Changes | 0 | ||
| 1 | # Author: Simon Blanke |
||
| 2 | # Email: [email protected] |
||
| 3 | # License: MIT License |
||
| 4 | |||
| 5 | import numpy as np |
||
| 6 | import pandas as pd |
||
| 7 | |||
| 8 | |||
class DatasetFeatures:
    """Collect basic size metadata about a feature array ``X`` and a target ``y``."""

    def __init__(self, X, y):
        """Store the data whose metadata will be summarised.

        Parameters
        ----------
        X : array-like
            Feature data.
        y : array-like
            Target data.
        """
        self.X = X
        self.y = y

    def get_features(self):
        """Return element count, per-item byte size and ndim of ``X`` and ``y``.

        Returns
        -------
        pandas.DataFrame
            A single-row frame with the columns ``X_size``, ``X_byte_size``,
            ``X_ndim``, ``y_size``, ``y_byte_size`` and ``y_ndim``.
        """
        # np.asarray returns ndarrays unchanged and lets other array-likes
        # (lists, pandas objects) expose size/itemsize/ndim as well.
        X = np.asarray(self.X)
        y = np.asarray(self.y)

        features_X_list = [X.size, X.itemsize, X.ndim]
        features_y_list = [y.size, y.itemsize, y.ndim]

        # The six values describe ONE observation, so lay them out as a
        # (1, 6) row. A flat (6,) array is read by pandas as six rows of a
        # single column, which cannot be matched to six column names.
        features_np = np.array(features_X_list + features_y_list).reshape(1, -1)

        col_names = [
            "X_size",
            "X_byte_size",
            "X_ndim",
            "y_size",
            "y_byte_size",
            "y_ndim",
        ]

        return pd.DataFrame(features_np, columns=col_names)
||
| 30 |