forked from dome272/VQGAN-pytorch
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathutils.py
74 lines (58 loc) · 2.49 KB
/
utils.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
import os
import albumentations
import numpy as np
import torch.nn as nn
from PIL import Image
from torch.utils.data import Dataset, DataLoader
import matplotlib.pyplot as plt
# --------------------------------------------- #
# Data Utils
# --------------------------------------------- #
class ImagePaths(Dataset):
def __init__(self, path, size=None):
self.size = size
self.images = [os.path.join(path, file) for file in os.listdir(path)]
self._length = len(self.images)
self.rescaler = albumentations.SmallestMaxSize(max_size=self.size)
self.cropper = albumentations.CenterCrop(height=self.size, width=self.size)
self.preprocessor = albumentations.Compose([self.rescaler, self.cropper])
def __len__(self):
return self._length
def preprocess_image(self, image_path):
image = Image.open(image_path)
if not image.mode == "RGB":
image = image.convert("RGB")
image = np.array(image).astype(np.uint8)
image = self.preprocessor(image=image)["image"]
image = (image / 127.5 - 1.0).astype(np.float32)
image = image.transpose(2, 0, 1)
return image
def __getitem__(self, i):
example = self.preprocess_image(self.images[i])
return example
def load_data(args):
train_data = ImagePaths(args.dataset_path, size=256)
train_loader = DataLoader(train_data, batch_size=args.batch_size, shuffle=False)
return train_loader
# --------------------------------------------- #
# Module Utils
# for Encoder, Decoder etc.
# --------------------------------------------- #
def weights_init(m):
classname = m.__class__.__name__
if classname.find('Conv') != -1:
nn.init.normal_(m.weight.data, 0.0, 0.02)
elif classname.find('BatchNorm') != -1:
nn.init.normal_(m.weight.data, 1.0, 0.02)
nn.init.constant_(m.bias.data, 0)
def plot_images(images):
x = images["input"]
reconstruction = images["rec"]
half_sample = images["half_sample"]
full_sample = images["full_sample"]
fig, axarr = plt.subplots(1, 4)
axarr[0].imshow(x.cpu().detach().numpy()[0].transpose(1, 2, 0))
axarr[1].imshow(reconstruction.cpu().detach().numpy()[0].transpose(1, 2, 0))
axarr[2].imshow(half_sample.cpu().detach().numpy()[0].transpose(1, 2, 0))
axarr[3].imshow(full_sample.cpu().detach().numpy()[0].transpose(1, 2, 0))
plt.show()