GitHub Repository: hackassin/learnopencv
Path: blob/master/FaceMaskOverlay/lib/datasets/face300w.py
# ------------------------------------------------------------------------------
# Copyright (c) Microsoft
# Licensed under the MIT License.
# Created by Tianheng Cheng([email protected]), Yang Zhao
# ------------------------------------------------------------------------------

import os
import random

import torch
import torch.utils.data as data
import pandas as pd
from PIL import Image
import numpy as np

from ..utils.transforms import fliplr_joints, crop, generate_target, transform_pixel
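
# NOTE (added comment, not in the original file): the relative import above
# means this module is intended to be imported as part of its package
# (lib.datasets), e.g. by the project's training scripts; running the file
# directly as a standalone script would fail with an "attempted relative
# import" error.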


class Face300W(data.Dataset):

    def __init__(self, cfg, is_train=True, transform=None):
        # specify annotation file for dataset
        if is_train:
            self.csv_file = cfg.DATASET.TRAINSET
        else:
            self.csv_file = cfg.DATASET.TESTSET

        self.is_train = is_train
        self.transform = transform
        self.data_root = cfg.DATASET.ROOT
        self.input_size = cfg.MODEL.IMAGE_SIZE
        self.output_size = cfg.MODEL.HEATMAP_SIZE
        self.sigma = cfg.MODEL.SIGMA
        self.scale_factor = cfg.DATASET.SCALE_FACTOR
        self.rot_factor = cfg.DATASET.ROT_FACTOR
        self.label_type = cfg.MODEL.TARGET_TYPE
        self.flip = cfg.DATASET.FLIP

        # load annotations
        # each CSV row holds: image path, scale, center_w, center_h, followed
        # by the flattened (x, y) landmark coordinates (see __getitem__)
        self.landmarks_frame = pd.read_csv(self.csv_file)

        # ImageNet channel-wise mean/std used to normalize input images
        self.mean = np.array([0.485, 0.456, 0.406], dtype=np.float32)
        self.std = np.array([0.229, 0.224, 0.225], dtype=np.float32)

    def __len__(self):
        return len(self.landmarks_frame)

    def __getitem__(self, idx):

        image_path = os.path.join(self.data_root,
                                  self.landmarks_frame.iloc[idx, 0])
        scale = self.landmarks_frame.iloc[idx, 1]

        center_w = self.landmarks_frame.iloc[idx, 2]
        center_h = self.landmarks_frame.iloc[idx, 3]
        center = torch.Tensor([center_w, center_h])

        pts = self.landmarks_frame.iloc[idx, 4:].values
        pts = pts.astype('float').reshape(-1, 2)

        scale *= 1.25
        nparts = pts.shape[0]
        img = np.array(Image.open(image_path).convert('RGB'), dtype=np.float32)

        # random scale, rotation, and horizontal-flip augmentation (training only)
        r = 0
        if self.is_train:
            scale = scale * (random.uniform(1 - self.scale_factor,
                                            1 + self.scale_factor))
            r = random.uniform(-self.rot_factor, self.rot_factor) \
                if random.random() <= 0.6 else 0
            if random.random() <= 0.5 and self.flip:
                img = np.fliplr(img)
                pts = fliplr_joints(pts, width=img.shape[1], dataset='300W')
                center[0] = img.shape[1] - center[0]

        # crop a face-centered patch and resize it to the network input size
        img = crop(img, center, scale, self.input_size, rot=r)

        # build one Gaussian heatmap per landmark at the heatmap resolution
        target = np.zeros((nparts, self.output_size[0], self.output_size[1]))
        tpts = pts.copy()

        for i in range(nparts):
            if tpts[i, 1] > 0:
                tpts[i, 0:2] = transform_pixel(tpts[i, 0:2]+1, center,
                                               scale, self.output_size, rot=r)
                target[i] = generate_target(target[i], tpts[i]-1, self.sigma,
                                            label_type=self.label_type)

        # normalize with ImageNet statistics and convert HWC -> CHW
        img = img.astype(np.float32)
        img = (img/255.0 - self.mean) / self.std
        img = img.transpose([2, 0, 1])
        target = torch.Tensor(target)
        tpts = torch.Tensor(tpts)
        center = torch.Tensor(center)

        meta = {'index': idx, 'center': center, 'scale': scale,
                'pts': torch.Tensor(pts), 'tpts': tpts}

        return img, target, meta
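

# ------------------------------------------------------------------------------
# Usage sketch (added, not part of the original file): illustrates how this
# dataset class is typically wrapped in a torch DataLoader. `cfg` is assumed
# to be a yacs-style config exposing the DATASET.* and MODEL.* keys read in
# __init__; the function name below is hypothetical and for illustration only.
# ------------------------------------------------------------------------------
def _example_train_loader(cfg, batch_size=16):
    """Build a training DataLoader over Face300W (illustrative sketch only)."""
    from torch.utils.data import DataLoader

    dataset = Face300W(cfg, is_train=True)
    loader = DataLoader(dataset, batch_size=batch_size,
                        shuffle=True, num_workers=4, pin_memory=True)
    # each batch yields:
    #   img:    float tensor [B, 3, H, W], ImageNet-normalized
    #   target: float tensor [B, N, Hh, Wh], one Gaussian heatmap per landmark
    #   meta:   dict with 'index', 'center', 'scale', 'pts', 'tpts'
    return loader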


if __name__ == '__main__':
    pass