forked from adamian98/pulse
-
Notifications
You must be signed in to change notification settings - Fork 0
/
run.py
executable file
·84 lines (72 loc) · 4.27 KB
/
run.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
#!/usr/bin/python3
from PULSE import PULSE
from torch.utils.data import Dataset, DataLoader
from torch.nn import DataParallel
from pathlib import Path
from PIL import Image
import torchvision
from math import log10, ceil
import argparse
class Images(Dataset):
def __init__(self, root_dir, duplicates):
self.root_path = Path(root_dir)
self.image_list = list(self.root_path.glob("*.png"))
self.duplicates = duplicates # Number of times to duplicate the image in the dataset to produce multiple HR images
def __len__(self):
return self.duplicates*len(self.image_list)
def __getitem__(self, idx):
img_path = self.image_list[idx//self.duplicates]
image = torchvision.transforms.ToTensor()(Image.open(img_path))
if(self.duplicates == 1):
return image,img_path.stem
else:
return image,img_path.stem+f"_{(idx % self.duplicates)+1}"
parser = argparse.ArgumentParser(description='PULSE')
#I/O arguments
parser.add_argument('-input_dir', type=str, default='input', help='input data directory')
parser.add_argument('-output_dir', type=str, default='runs', help='output data directory')
parser.add_argument('-cache_dir', type=str, default='cache', help='cache directory for model weights')
parser.add_argument('-duplicates', type=int, default=1, help='How many HR images to produce for every image in the input directory')
parser.add_argument('-batch_size', type=int, default=1, help='Batch size to use during optimization')
#PULSE arguments
parser.add_argument('-seed', type=int, help='manual seed to use')
parser.add_argument('-loss_str', type=str, default="100*L2+0.05*GEOCROSS+1*FACE", help='Loss function to use')
parser.add_argument('-eps', type=float, default=2e-3, help='Target for downscaling loss (L2)')
parser.add_argument('-distance', type=float, default=0.6, help='Face distance')
parser.add_argument('-noise_type', type=str, default='trainable', help='zero, fixed, or trainable')
parser.add_argument('-num_trainable_noise_layers', type=int, default=20, help='Number of noise layers to optimize')
parser.add_argument('-tile_latent', action='store_true', help='Whether to forcibly tile the same latent 18 times')
parser.add_argument('-bad_noise_layers', type=str, default="17", help='List of noise layers to zero out to improve image quality')
parser.add_argument('-opt_name', type=str, default='adam', help='Optimizer to use in projected gradient descent')
parser.add_argument('-learning_rate', type=float, default=0.4, help='Learning rate to use during optimization')
parser.add_argument('-steps', type=int, default=1000, help='Number of optimization steps')
parser.add_argument('-lr_schedule', type=str, default='linear1cycledrop', help='fixed, linear1cycledrop, linear1cycle')
parser.add_argument('-save_intermediate', action='store_true', help='Whether to store and save intermediate HR and LR images during optimization')
kwargs = vars(parser.parse_args())
dataset = Images(kwargs["input_dir"], duplicates=kwargs["duplicates"])
out_path = Path(kwargs["output_dir"])
out_path.mkdir(parents=True, exist_ok=True)
dataloader = DataLoader(dataset, batch_size=kwargs["batch_size"])
model = PULSE(cache_dir=kwargs["cache_dir"])
model = DataParallel(model)
toPIL = torchvision.transforms.ToPILImage()
for ref_im, ref_im_name in dataloader:
if(kwargs["save_intermediate"]):
padding = ceil(log10(100))
for i in range(kwargs["batch_size"]):
int_path_HR = Path(out_path / ref_im_name[i] / "HR")
int_path_LR = Path(out_path / ref_im_name[i] / "LR")
int_path_HR.mkdir(parents=True, exist_ok=True)
int_path_LR.mkdir(parents=True, exist_ok=True)
for j,(HR,LR) in enumerate(model(ref_im,**kwargs)):
for i in range(kwargs["batch_size"]):
toPIL(HR[i].cpu().detach().clamp(0, 1)).save(
int_path_HR / f"{ref_im_name[i]}_{j:0{padding}}.png")
toPIL(LR[i].cpu().detach().clamp(0, 1)).save(
int_path_LR / f"{ref_im_name[i]}_{j:0{padding}}.png")
else:
#out_im = model(ref_im,**kwargs)
for j,(HR,LR) in enumerate(model(ref_im,**kwargs)):
for i in range(kwargs["batch_size"]):
toPIL(HR[i].cpu().detach().clamp(0, 1)).save(
out_path / f"{ref_im_name[i]}.png")