-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathstylegan2_handler.py
executable file
·260 lines (199 loc) · 8.42 KB
/
stylegan2_handler.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
import pickle, pickletools
import numpy as np
import tensorflow as tf
from timeit import default_timer as timer
import PIL.Image
import numpy as np
import PIL.Image
import dnnlib
import dnnlib.tflib as tflib
import pickle
import os
import reconnector
def convert_images_to_uint8(images, drange=(-1, 1), nchw_to_nhwc=False, shrink=1):
    """Convert a minibatch of images from float32 to uint8 with configurable dynamic range.

    Can be used as an output transformation for Network.run().
    Taken from dnnlib/tflib/tfutil.py.

    Args:
        images: Image minibatch; it is cast to float32 first. The pooling
            and transpose steps below treat it as NCHW.
        drange: Pair ``(low, high)`` giving the value range of ``images``
            that is mapped linearly onto the uint8 range. Only indexed,
            never modified.
        nchw_to_nhwc: When true, transpose the axes with ``[0, 2, 3, 1]``.
        shrink: When greater than 1, average-pool the two trailing axes
            with a ``shrink`` x ``shrink`` window and equal stride.

    Returns:
        The converted images, saturate-cast to ``tf.uint8``.
    """
    images = tf.cast(images, tf.float32)
    if shrink > 1:
        ksize = [1, 1, shrink, shrink]
        images = tf.nn.avg_pool(images, ksize=ksize, strides=ksize, padding="VALID", data_format="NCHW")
    if nchw_to_nhwc:
        images = tf.transpose(images, [0, 2, 3, 1])
    low, high = drange[0], drange[1]
    scale = 255 / (high - low)
    # The extra 0.5 makes the truncating cast below behave like rounding.
    images = images * scale + (0.5 - low * scale)
    return tf.saturate_cast(images, tf.uint8)
class StyleGAN2_Handler:
    """Handles a trained StyleGAN2 model.

    Loads a pickled ``(G, D, Gs)`` network triple, samples latent vectors,
    runs inference through ``Gs`` and offers a few helpers that edit the
    weights of ``Gs`` in place.
    """

    def __init__(self, settings, args, truncation_psi=0.9):
        """Create the model, load it and run one inference to build the graph.

        Args:
            settings: Stored on the instance as ``self.settings``.
            args: Object providing ``model_path`` (path of the pickled
                networks) and ``multiple_nets``.
            truncation_psi: Value passed as ``truncation_psi`` to every
                ``Gs.run`` call made by :meth:`infer`.
        """
        self.settings = settings
        print("Init handler with path =", args.model_path)

        # Model identifier = file name with the ".pkl" / ".pt" markers removed.
        _, name = os.path.split(args.model_path)
        name = str(name).replace(".pkl", "")
        name = str(name).replace(".pt", "")
        self.model_name_id = name

        self.truncation_psi = truncation_psi

        # Load and create a model
        self._create_model(args.model_path)

        # Load other networks (if we set these)
        self.multiple_nets_paths = args.multiple_nets
        self.multiple_nets = None
        # Compare by value: identity checks against a string literal are
        # implementation-dependent and raise a SyntaxWarning on Python 3.8+.
        if self.multiple_nets_paths != "":
            # TODO: loading of additional networks is not implemented yet.
            pass

        self.latent_vector_size = self._Gs.input_shapes[0][1]

        # Infer once to build up the graph (the first inference takes
        # roughly 2 sec of extra time).
        print("Testing with an example to build the graph")
        self.set_noise()
        self.noise_changing = False
        self._example_input = self.example_input(verbose=False)
        self._example_output = self.infer(self._example_input, verbose=False)

        # Network altering: original values of every tensor edited through
        # change_net(), keyed by tensor name.
        self.original_weights = {}

    def _create_model(self, model_path):
        """Start a TensorFlow session and unpickle the networks from ``model_path``.

        Sets ``self._G``, ``self._D`` and ``self._Gs``.
        """
        tf.InteractiveSession()
        tflib.init_tf()
        # NOTE(security): pickle.load can execute arbitrary code contained
        # in the file - only load model files from a trusted source.
        with open(model_path, 'rb') as stream:
            self._G, self._D, self._Gs = pickle.load(stream, encoding='latin1')

    def report(self):
        """Print the latent size and the shapes of the cached example input/output."""
        print("[StyleGAN2_Handler Status report]")
        print("\t- latent_vector_size:", self.latent_vector_size)
        print("\t- typical input shape is:", self._example_input.shape)
        print("\t- typical output shape is:", self._example_output.shape)

    def example_input(self, how_many=1, seed=None, verbose=True):
        """Sample standard-normal latent vectors.

        Args:
            how_many: Number of latent vectors to draw.
            seed: Seed for a dedicated ``RandomState``. ``None`` draws from
                NumPy's global generator instead. ``0`` is a valid seed.
            verbose: Print progress messages.

        Returns:
            Array of shape ``(how_many, self.latent_vector_size)``.
        """
        if seed is not None:
            if verbose:
                print("Generating random input (from seed=", seed, ")")
            latents = np.random.RandomState(seed).randn(how_many, self.latent_vector_size)
        else:
            if verbose:
                print("Generating random input")
            latents = np.random.randn(how_many, self.latent_vector_size)

        if verbose:
            print("example input is ...", latents.shape)
        return latents

    def set_noise(self, seed=None):
        """Fill every synthesis variable whose name starts with 'noise' with random normal values.

        Args:
            seed: Seed for the ``RandomState`` used to draw the values.
        """
        noise_vars = [
            var
            for name, var in self._Gs.components.synthesis.vars.items()
            if name.startswith('noise')
        ]
        rnd = np.random.RandomState(seed)
        tflib.set_vars({var: rnd.randn(*var.shape.as_list()) for var in noise_vars})  # [height, width]

    def infer(self, input_latents, verbose=True):
        """Run ``Gs`` on ``input_latents`` and return the generated images.

        When ``self.noise_changing`` is set, the noise variables are
        re-drawn before the run.

        Returns:
            Output of ``Gs.run`` after the uint8 / NHWC output transform,
            i.e. [minibatch, height, width, channel].
        """
        if self.noise_changing:
            self.set_noise()

        images = self._Gs.run(
            input_latents,
            None,
            truncation_psi=self.truncation_psi,
            randomize_noise=False,
            output_transform=dict(func=convert_images_to_uint8, nchw_to_nhwc=True),
        )  # [minibatch, height, width, channel]

        if verbose:
            print("Generated", images.shape)
        return images

    def save_image(self, image, name="foo.jpg"):
        """Save ``image`` (an array accepted by ``PIL.Image.fromarray``) to the file ``name``."""
        im = PIL.Image.fromarray(image)
        im.save(name)

    def toggleStylegan2Noise(self):
        """Flip the flag that makes :meth:`infer` re-draw the noise on every call."""
        self.noise_changing = not self.noise_changing

    def times_a(self, a, np_arr):
        """Return ``a * np_arr``."""
        return a * np_arr

    def change_net(self, target_tensor, operation, *kwargs):
        """Reset all previously edited tensors, then apply ``operation`` to one tensor.

        PS: Changing the weights is faster than generating an image.

        Args:
            target_tensor: Name of the ``Gs`` variable to edit.
            operation: Callable invoked as ``operation(original_value, extra)``
                where ``extra`` is the tuple of additional positional
                arguments given to this method; its return value is written
                back to the variable.
            *kwargs: Extra positional arguments, forwarded as ONE tuple
                (not unpacked).
        """
        net = self._Gs

        # Restore old weights so edits never stack on top of each other.
        for tensor_key, orig_val in self.original_weights.items():
            net.set_var(tensor_key, orig_val)

        if target_tensor not in self.original_weights:
            # We haven't changed this tensor yet - load it from the network (slow).
            self.original_weights[target_tensor] = net.get_var(target_tensor)

        np_arr = self.original_weights[target_tensor]
        print("tensor as np_arr:", type(np_arr), np_arr.shape)

        # NOTE(review): the cached original is handed over directly; an
        # operation that mutates its argument in place would corrupt the
        # cache - confirm all operations return a new array.
        np_arr = operation(np_arr, kwargs)
        net.set_var(target_tensor, np_arr)
        self._Gs = net

    def restore(self):
        """Replace ``Gs`` with the result of ``reconnector.restore_net(Gs)``."""
        self._Gs = reconnector.restore_net(self._Gs)

    def reconnect(self, target_tensor, percent_change=30):
        """Replace ``Gs`` with the result of ``reconnector.reconnect`` for ``target_tensor``."""
        self._Gs = reconnector.reconnect(self._Gs, target_tensor, percent_change)

    def reconnect_simulate_random_weights(self, target_tensor, percent_change=30):
        """Replace ``Gs`` with the result of ``reconnector.reconnect_simulate_random_weights``."""
        self._Gs = reconnector.reconnect_simulate_random_weights(self._Gs, target_tensor, percent_change)

    def savenet(self):
        """Pickle the current (usually edited) ``Gs`` to ``renders/haxed_gs.pkl``."""
        out_path = "renders/haxed_gs.pkl"
        # Create the output folder on demand so saving does not fail on a
        # fresh checkout.
        os.makedirs(os.path.dirname(out_path), exist_ok=True)
        with open(out_path, 'wb') as file:
            pickle.dump(self._Gs, file, protocol=pickle.HIGHEST_PROTOCOL)

    def DEBUG(self):
        """Print ``Gs`` and replace it with the result of ``blender.test(Gs)``."""
        print("####DEBUG####")
        print(self._Gs)  # < is a Network from dnnlib/tflib/network.py

        # Imported lazily; presumably a project-local module - TODO confirm.
        import blender
        self._Gs = blender.test(self._Gs)
        print("#############")

    def alphablendmodels_slow(self, alpha):
        """Replace ``Gs`` with ``blender.slow_blend_from_saved_weights(Gs, alpha)``."""
        # Imported lazily; presumably a project-local module - TODO confirm.
        import blender
        self._Gs = blender.slow_blend_from_saved_weights(self._Gs, alpha)
"""
# Example of usage:
from unittest import mock
args = mock.Mock()
settings = mock.Mock()
args.model_path = "../stylegan2/stylegan2-ffhq-config-f.pkl"
args.multiple_nets = ""
# truncation_psi is a constructor argument; the handler does not read it from args
style2_handler = StyleGAN2_Handler(settings, args, truncation_psi=0.5)
style2_handler.report()
example_input = style2_handler.example_input()
example_output = style2_handler.infer(example_input)
print("example_output:", example_output.shape)
from timeit import default_timer as timer
# Basic measurements
repeats = 15
times = []
for repeat_i in range(repeats):
t_infer = timer()
example_input = style2_handler.example_input(verbose=False)
example_output = style2_handler.infer(example_input, verbose=False)
t_infer = timer() - t_infer
if repeat_i > 0:
times.append(t_infer)
#print("Prediction (of 1 sample) took", t_infer, "sec.")
times = np.asarray(times)
print("Statistics:")
print("prediction time - avg +- std =", np.mean(times), "+-", np.std(times), "sec.")
# Batch measurements
how_many = 4 # too big? gpu mem explodes
repeats = 15
times = []
for repeat_i in range(repeats):
t_infer = timer()
example_inputs = style2_handler.example_input(how_many = how_many, verbose=False)
example_outputs = style2_handler.infer(example_inputs, verbose=False)
t_infer = timer() - t_infer
if repeat_i > 0:
times.append(t_infer)
#print("Prediction (of",how_many,"samples) took", t_infer, "sec.")
times = np.asarray(times)
print("Statistics:")
print("prediction of whole",how_many," took time - avg +- std =", np.mean(times), "+-", np.std(times), "sec.")
print("prediction as divided for one - avg +- std =", np.mean(times/how_many), "+-", np.std(times/how_many), "sec.")
"""