|
1
|
|
|
from fuel.datasets import H5PYDataset |
|
2
|
|
|
from fuel.transformers.defaults import uint8_pixels_to_floatX |
|
3
|
|
|
from fuel.utils import find_in_data_path |
|
4
|
|
|
|
|
5
|
|
|
|
|
6
|
|
|
class CelebA(H5PYDataset): |
|
7
|
|
|
"""The CelebFaces Attributes Dataset (CelebA) dataset. |
|
8
|
|
|
|
|
9
|
|
|
CelebA is a large-scale face |
|
10
|
|
|
attributes dataset with more than 200K celebrity images, each |
|
11
|
|
|
with 40 attribute annotations. The images in this dataset cover |
|
12
|
|
|
large pose variations and background clutter. CelebA has large |
|
13
|
|
|
diversities, large quantities, and rich annotations, including: |
|
14
|
|
|
|
|
15
|
|
|
* 10,177 number of identities |
|
16
|
|
|
* 202,599 number of face images |
|
17
|
|
|
* 5 landmark locations per image |
|
18
|
|
|
* 40 binary attributes annotations per image. |
|
19
|
|
|
|
|
20
|
|
|
The dataset can be employed as the training and test sets for |
|
21
|
|
|
the following computer vision tasks: |
|
22
|
|
|
|
|
23
|
|
|
* face attribute recognition |
|
24
|
|
|
* face detection |
|
25
|
|
|
* landmark (or facial part) localization |
|
26
|
|
|
|
|
27
|
|
|
Parameters |
|
28
|
|
|
---------- |
|
29
|
|
|
which_format : {'aligned_cropped, '64'} |
|
30
|
|
|
Either the aligned and cropped version of CelebA, or |
|
31
|
|
|
a 64x64 version of it. |
|
32
|
|
|
which_sets : tuple of str |
|
33
|
|
|
Which split to load. Valid values are 'train', 'valid' and |
|
34
|
|
|
'test' corresponding to the training set (162,770 examples), the |
|
35
|
|
|
validation set (19,867 examples) and the test set (19,962 |
|
36
|
|
|
examples). |
|
37
|
|
|
|
|
38
|
|
|
""" |
|
39
|
|
|
_filename = 'celeba_{}.hdf5' |
|
40
|
|
|
default_transformers = uint8_pixels_to_floatX(('features',)) |
|
41
|
|
|
|
|
42
|
|
|
def __init__(self, which_format, which_sets, **kwargs): |
|
43
|
|
|
self.which_format = which_format |
|
44
|
|
|
super(CelebA, self).__init__( |
|
45
|
|
|
file_or_path=find_in_data_path(self.filename), |
|
46
|
|
|
which_sets=which_sets, **kwargs) |
|
47
|
|
|
|
|
48
|
|
|
@property |
|
49
|
|
|
def filename(self): |
|
50
|
|
|
return self._filename.format(self.which_format) |
|
51
|
|
|
|