-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathcustom_transforms.py
More file actions
64 lines (55 loc) · 2.32 KB
/
custom_transforms.py
File metadata and controls
64 lines (55 loc) · 2.32 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
import random
import numpy as np
from PIL import Image
import torch
class Compose(object):
def __init__(self, transforms):
self.transforms = transforms
def __call__(self, images, intrinsics):
for t in self.transforms:
images, intrinsics = t(images, intrinsics)
return images, intrinsics
class Normalize(object):
def __init__(self, mean, std):
self.mean = mean
self.std = std
def __call__(self, images, intrinsics):
for tensor in images:
for t, m, s in zip(tensor, self.mean, self.std):
t.sub_(m).div_(s)
return images, intrinsics
class ArrayToTensor(object):
def __call__(self, images, intrinsics):
tensors = []
for im in images:
im = np.transpose(im, (2, 0, 1)) # HWC to CHW format
tensors.append(torch.from_numpy(im).float()/255)
return tensors, intrinsics
class RandomHorizontalFlip(object):
def __call__(self, images, intrinsics):
assert intrinsics is not None
if random.random() < 0.5:
output_intrinsics = np.copy(intrinsics)
output_images = [np.copy(np.fliplr(im)) for im in images]
w = output_images[0].shape[1]
output_intrinsics[0, 2] = w - output_intrinsics[0, 2]
else:
output_images = images
output_intrinsics = intrinsics
return output_images, output_intrinsics
class RandomScaleCrop(object):
def __call__(self, images, intrinsics):
assert intrinsics is not None
output_intrinsics = np.copy(intrinsics)
in_h, in_w, _ = images[0].shape
x_scaling, y_scaling = np.random.uniform(1, 1.15, 2)
scaled_h, scaled_w = int(in_h * y_scaling), int(in_w * x_scaling)
output_intrinsics[0] *= x_scaling
output_intrinsics[1] *= y_scaling
scaled_images = [np.array(Image.fromarray(im.astype(np.uint8)).resize((scaled_w, scaled_h))).astype(np.float32) for im in images]
offset_y = np.random.randint(scaled_h - in_h + 1)
offset_x = np.random.randint(scaled_w - in_w + 1)
cropped_images = [im[offset_y:offset_y + in_h, offset_x:offset_x + in_w] for im in scaled_images]
output_intrinsics[0, 2] -= offset_x
output_intrinsics[1, 2] -= offset_y
return cropped_images, output_intrinsics