|
@@ 41-57 (lines=17) @@
|
| 38 |
|
self.assertEqual(train_dev_test_split(self.data_split, target='Col2', |
| 39 |
|
dev_size=0.5, test_size=0)[i].shape, expected_results[i]) |
| 40 |
|
|
| 41 |
|
def test_train_dev_test_split_series(self):
    """Check the shapes returned when the target is passed as a Series.

    ``self.data_target`` is handed to ``train_dev_test_split`` through the
    ``target`` keyword together with ``self.data_split``. Each case lists
    the expected ``.shape`` of every returned piece, in return order.
    """
    # Test the proper splitting in train, dev and test sets
    cases = [
        # (keyword arguments for the split, expected shape of each piece)
        ({'dev_size': 0.2, 'test_size': 0.2},
         [(6, 5), (2, 5), (2, 5), (6,), (2,), (2,)]),
        # One of the sizes set to 0: only four pieces are checked.
        ({'dev_size': 0, 'test_size': 0.2},
         [(8, 5), (2, 5), (8,), (2,)]),
        ({'dev_size': 0.5, 'test_size': 0},
         [(5, 5), (5, 5), (5,), (5,)]),
    ]

    for split_kwargs, expected_results in cases:
        # Split once per case so that every piece checked below comes from
        # the same call, instead of re-running the split for each index.
        splits = train_dev_test_split(self.data_split,
                                      target=self.data_target,
                                      **split_kwargs)
        # Index explicitly (rather than zip) so a result with too few
        # pieces still fails loudly with an IndexError.
        for i, expected_shape in enumerate(expected_results):
            self.assertEqual(
                splits[i].shape, expected_shape,
                msg='piece {} with arguments {}'.format(i, split_kwargs))
| 58 |
|
|
|
@@ 23-38 (lines=16) @@
|
| 20 |
|
columns=['Col1', 'Col2', 'Col3', 'Col4', 'Col5']) |
| 21 |
|
cls.data_target = pd.Series([1, 0, 1, 0, 0, 1, 1, 0, 1, 1]) |
| 22 |
|
|
| 23 |
|
def test_train_dev_test_split_col(self):
    """Check the shapes returned when the target is given as a column name.

    The target is identified by the name ``'Col2'`` and the expected
    feature pieces have four columns. Each case lists the expected
    ``.shape`` of every returned piece, in return order.

    NOTE(review): the four-column expectation presumably reflects the
    target column being removed from the features -- confirm against
    ``train_dev_test_split``.
    """
    # Test the proper splitting in train, dev and test sets
    cases = [
        # (extra positional args, keyword args, expected shape of each piece)
        # Target passed positionally, dev_size/test_size left at the
        # function's defaults, random_state pinned to 1234.
        (('Col2',), {'random_state': 1234},
         [(8, 4), (1, 4), (1, 4), (8,), (1,), (1,)]),
        # One of the sizes set to 0: only four pieces are checked.
        ((), {'target': 'Col2', 'dev_size': 0, 'test_size': 0.2},
         [(8, 4), (2, 4), (8,), (2,)]),
        ((), {'target': 'Col2', 'dev_size': 0.5, 'test_size': 0},
         [(5, 4), (5, 4), (5,), (5,)]),
    ]

    for extra_args, split_kwargs, expected_results in cases:
        # Split once per case so that every piece checked below comes from
        # the same call, instead of re-running the split for each index.
        splits = train_dev_test_split(self.data_split,
                                      *extra_args, **split_kwargs)
        # Index explicitly (rather than zip) so a result with too few
        # pieces still fails loudly with an IndexError.
        for i, expected_shape in enumerate(expected_results):
            self.assertEqual(
                splits[i].shape, expected_shape,
                msg='piece {} with arguments {} {}'.format(
                    i, extra_args, split_kwargs))
| 40 |
|
|
| 41 |
|
def test_train_dev_test_split_series(self): |