Create generate_regularized_class_specific_samples.py

alexstoken · alexstoken · commit e0072a2da6f9 · 2020-03-10T08:22:57.000-05:00
Create new file with regularized class specific image generator in it
diff --git a/src/generate_regularized_class_specific_samples.py b/src/generate_regularized_class_specific_samples.py
@@ -0,0 +1,116 @@
+"""
+Created on Tues Mar 10 08:13:15 2020
+@author: Alex Stoken - https://github.com/alexstoken
+
+Last tested with torchvision 0.5.0 with image and model on cpu
+"""
+import os
+import numpy as np
+
+import torch
+from torch.optim import SGD
+from torchvision import models
+
+from misc_functions import preprocess_image, recreate_image, save_image
+
+
+class RegularizedClassSpecificImageGeneration():
+    """
+        Produces an image that maximizes a certain class with gradient ascent. Uses Gaussian blur, weight decay, and clipping.
+
+        The image starts as uniform random noise and is updated by SGD on the
+        negated class score, so each optimizer step increases the model output
+        for `target_class`. Snapshots and a run summary are written below
+        `../generated/`.
+    """
+
+    def __init__(self, model, target_class):
+        """Stores the model (switched to eval mode) and creates the start image.
+
+        Arguments:
+            model -- Network whose output for `target_class` is maximized
+            target_class {int} -- Index into the model output to maximize
+        """
+        # Not read anywhere in this class; presumably the inverse of the
+        # ImageNet normalization constants -- confirm against misc_functions.
+        self.mean = [-0.485, -0.456, -0.406]
+        self.std = [1/0.229, 1/0.224, 1/0.225]
+        self.model = model
+        self.model.eval()
+        self.target_class = target_class
+        # Generate a random image
+        self.created_image = np.uint8(np.random.uniform(0, 255, (224, 224, 3)))
+        # Create the folder to export images; exist_ok avoids the
+        # check-then-create race of a separate os.path.exists() test
+        os.makedirs(f'../generated/class_{self.target_class}', exist_ok=True)
+
+    def generate(self, iterations=150, blur_freq=4, blur_rad=1, wd=0.0001, clipping_value=0.1):
+        """Generates class specific image with enhancements to improve image quality.
+        See https://arxiv.org/abs/1506.06579 for details on each argument's effect on output quality.
+
+        Play around with combinations of arguments. Besides the defaults, this combination has produced good images:
+        blur_freq=6, blur_rad=0.8, wd = 0.05
+
+        Progress is printed and a snapshot is saved at ten evenly spaced
+        iterations and always at the last one. The loss embedded in a file
+        name is the one computed before that iteration's optimizer step.
+        When the run finishes, `run_details.txt` is written and the output
+        folder is renamed to include the regularization settings.
+
+        Keyword Arguments:
+            iterations {int} -- Total iterations for gradient ascent, must be >= 1 (default: {150})
+            blur_freq {int} -- Frequency of Gaussian blur effect, in iterations; 0 or None disables blurring (default: {4})
+            blur_rad {float} -- Radius for gaussian blur, passed on to preprocess_image (default: {1})
+            wd {float} -- Weight decay value for Stochastic Gradient Ascent (default: {0.0001})
+            clipping_value {None or float} -- Value for gradient clipping (default: {0.1})
+
+        Returns:
+            The processed image of the last iteration, i.e. the object returned by
+            preprocess_image after the final optimizer step (not the array kept in
+            self.created_image)
+
+        Raises:
+            ValueError -- If iterations is smaller than 1
+            OSError -- If the output folder cannot be renamed, e.g. because a folder
+                from an earlier run with the same settings already exists
+        """
+        if iterations < 1:
+            # Without at least one step there is no image or loss to save
+            raise ValueError('iterations must be at least 1')
+
+        output_dir = f'../generated/class_{self.target_class}'
+        # __init__ created this folder, but an earlier generate() call on the
+        # same instance has renamed it away; make sure it is there again
+        os.makedirs(output_dir, exist_ok=True)
+
+        initial_learning_rate = 6
+        # Iterations at which progress is reported; computed once instead of
+        # rebuilding the linspace array twice per iteration
+        checkpoints = set(np.linspace(0, iterations, 10, dtype=int).tolist())
+
+        # Run exactly `iterations` steps so the last checkpoint (== iterations)
+        # is actually reached
+        for i in range(1, iterations + 1):
+            # Process image and return variable
+
+            #implement gaussian blurring every blur_freq-th iteration
+            #to improve output
+            if blur_freq and i % blur_freq == 0:
+                self.processed_image = preprocess_image(
+                    self.created_image, False, blur_rad)
+            else:
+                self.processed_image = preprocess_image(
+                    self.created_image, False)
+
+            # Define optimizer for the image - use weight decay to add regularization
+            # in SGD, wd = 2 * L2 regularization (https://bbabenko.github.io/weight-decay/)
+            optimizer = SGD([self.processed_image],
+                            lr=initial_learning_rate, weight_decay=wd)
+            # Forward
+            output = self.model(self.processed_image)
+            # Target specific class; negated so that minimizing maximizes the score
+            class_loss = -output[0, self.target_class]
+
+            report_now = i in checkpoints or i == iterations
+            if report_now:
+                # detach().cpu() keeps this working for tensors that are not on the cpu
+                loss_value = class_loss.detach().cpu().numpy()
+                print('Iteration:', str(i), 'Loss',
+                      "{0:.2f}".format(loss_value))
+            # Zero grads
+            self.model.zero_grad()
+            # Backward
+            class_loss.backward()
+
+            if clipping_value:
+                # NOTE(review): this clips the gradients of the model parameters,
+                # which the optimizer above does not update; the gradient of
+                # self.processed_image is left unclipped. Confirm whether the
+                # image gradient was meant to be clipped instead.
+                torch.nn.utils.clip_grad_norm_(
+                    self.model.parameters(), clipping_value)
+            # Update image
+            optimizer.step()
+            # Recreate image
+            self.created_image = recreate_image(self.processed_image)
+            if report_now:
+                # Save image (the final iteration is always saved here)
+                im_path = f'{output_dir}/c_{self.target_class}_iter_{i}_loss_{loss_value}.jpg'
+                save_image(self.created_image, im_path)
+
+        #write file with regularization details
+        with open(f'{output_dir}/run_details.txt', 'w') as f:
+            f.write(f'Iterations: {iterations}\n')
+            f.write(f'Blur freq: {blur_freq}\n')
+            f.write(f'Blur radius: {blur_rad}\n')
+            f.write(f'Weight decay: {wd}\n')
+            f.write(f'Clip value: {clipping_value}\n')
+
+        #rename folder path with regularization details for easy access
+        os.rename(output_dir,
+                  f'../generated/class_{self.target_class}_blurfreq_{blur_freq}_blurrad_{blur_rad}_wd{wd}')
+        return self.processed_image
+
+
+if __name__ == '__main__':
+    # Example run: maximize the flamingo class of a pretrained AlexNet
+    target_class = 130  # Flamingo
+    pretrained_model = models.alexnet(pretrained=True)
+    # Use the class defined in this file; the previous name
+    # ClassSpecificImageGeneration is not defined here and raised NameError
+    csig = RegularizedClassSpecificImageGeneration(pretrained_model, target_class)
+    csig.generate()