Add BinaryGAN Example #4

Merged · 6 commits · May 1, 2019
4 changes: 3 additions & 1 deletion .travis.yml
@@ -41,6 +41,8 @@ jobs:
script:
# Test GMAN
- travis_wait python gman/gman.py --cpu 1 -b 32 -s 16 -e 1

# Test BinaryGAN
- travis_wait python binarygan/binarygan.py --cpu 1 -b 32 -s 16 -e 1

after_success: # nothing to do

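Note: the CI entry above doubles as a quick local smoke test. Assuming MNIST can be downloaded into the default data directory, a one-epoch CPU run is:

    python binarygan/binarygan.py --cpu 1 -b 32 -s 16 -e 1
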
4 changes: 4 additions & 0 deletions README.md
@@ -8,6 +8,10 @@ Collection of Generative Adversarial Networks developed using TorchGAN
[Link to Paper](https://arxiv.org/pdf/1611.01673.pdf)\
Requires the `torchgan` master.

2. Training Generative Adversarial Networks with Binary Neurons by End-to-end Backpropagation\
[Link to Paper](https://arxiv.org/pdf/1810.04714.pdf)\
Requires the `torchgan` master.

## Contribution Guidelines

We are open to accepting any model that you have built. The only things
231 changes: 231 additions & 0 deletions binarygan/binarygan.py
@@ -0,0 +1,231 @@
import argparse

import torch
import torch.nn as nn
import torch.utils.data as data
import torchvision.datasets as dsets
import torchvision.transforms as transforms
from torch.optim import Adam
from torchgan.losses import (WassersteinDiscriminatorLoss,
WassersteinGeneratorLoss,
WassersteinGradientPenalty)
from torchgan.models import DCGANDiscriminator, DCGANGenerator
from torchgan.trainer import ParallelTrainer, Trainer


# Binary Neurons
class Binarize(torch.autograd.Function):
@staticmethod
def forward(ctx, input, mode, threshold=None, dist=None):
x = torch.sigmoid(input)
x_clone = x.clone()
ctx.save_for_backward(x_clone)
if mode == 'd':
x[x >= threshold] = 1.0
x[x < threshold] = 0.0
elif mode == 's':
z = dist.sample(x.size()).to(x.device)
x[x >= z] = 1.0
x[x < z] = 0.0
return x

@staticmethod
def backward(ctx, grad_output):
# Straight-through-style estimator: backpropagate through the sigmoid
# only, ignoring the non-differentiable thresholding step
x, = ctx.saved_tensors
return grad_output * x * (1.0 - x), None, None, None


class BinaryNeurons(nn.Module):
r"""Implements the Binary Neurons as described in
https://arxiv.org/pdf/1810.04714.pdf

Args:
mode (str, optional): 2 choices - 'd' for Deterministic Binary Neurons
and 's' for Stochastic Binary Neurons. Any other choice will result
in the preactivation output.
threshold (float, optional): The probability threshold for the
deterministic mode; unused when mode is 's'.
"""

def __init__(self, mode='d', threshold=0.5):
super(BinaryNeurons, self).__init__()
self.function = Binarize.apply
self.mode = mode
if self.mode == 'd':
self.threshold = threshold
self.dist = None
elif self.mode == 's':
self.dist = torch.distributions.uniform.Uniform(0.0, 1.0)
self.threshold = None

def forward(self, x):
return self.function(x, self.mode, self.threshold, self.dist)

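# Illustrative usage (a sketch, not executed by this script):
#
#   neurons = BinaryNeurons(mode='d', threshold=0.5)
#   x = torch.randn(4, 1, 32, 32, requires_grad=True)
#   out = neurons(x)         # entries are exactly 0.0 or 1.0
#   out.sum().backward()     # gradients flow through the sigmoid surrogate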

if __name__ == "__main__":
parser = argparse.ArgumentParser()
parser.add_argument(
"-f",
"--data_dir",
help="directory where mnist will be downloaded/is available",
default="./")
parser.add_argument(
"-sc",
"--step_channels",
help="step channels for the generator and discriminators",
type=int,
default=16)
parser.add_argument(
"-t",
"--threshold",
help="The threshold for binarization",
type=float,
default=0.5)
parser.add_argument(
"--type",
help="Type of Binarization to be used",
choices=['s', 'd'],
default='s')
parser.add_argument(
"-lr",
"--learning_rate",
help="The learning rate for the optimizers",
type=float,
default=0.0002)
parser.add_argument(
"--cpu",
type=int,
help="Set it to 1 if cpu is to be used for training",
default=0)
parser.add_argument(
"-m",
"--multigpu",
choices=[0, 1],
type=int,
help="Choose 1 if multiple GPUs are available for training",
default=0)
parser.add_argument(
"-l",
"--list_gpus",
type=int,
nargs='+',
help="List of GPUs to be used for training. Used iff -m is set to 1",
default=[0, 1])
parser.add_argument(
"-b",
"--batch_size",
type=int,
help="Batch Size for training",
default=32)
parser.add_argument(
"-s",
"--sample_size",
type=int,
help="Number of Images Generated per Epoch",
default=64)
parser.add_argument(
"-c",
"--checkpoint",
help="Place to store the trained model",
default="./gman_")
parser.add_argument(
"-r",
"--reconstructions",
help="Directory to store the generated images",
default="./gman_images")
parser.add_argument(
"-e",
"--epochs",
help="Total epochs for which the model will be trained",
default=20,
type=int)
args = parser.parse_args()

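# torchgan builds networks from a nested config: the model class under
# "name", its constructor arguments under "args", and a per-network
# optimizer spec. The only departure from a plain DCGAN is the generator's
# last_nonlinearity, replaced by BinaryNeurons so that samples are binary.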
network_config = {
"generator": {
"name": DCGANGenerator,
"args": {
"encoding_dims":
100,
"out_channels":
1,
"step_channels":
args.step_channels,
"last_nonlinearity":
BinaryNeurons(mode=args.type, threshold=args.threshold)
},
"optimizer": {
"name": Adam,
"args": {
"lr": args.learning_rate,
"betas": (0.5, 0.999)
}
}
},
"discriminator": {
"name": DCGANDiscriminator,
"args": {
"in_channels": 1,
"step_channels": args.step_channels
},
"optimizer": {
"name": Adam,
"args": {
"lr": args.learning_rate,
"betas": (0.5, 0.999)
}
}
}
}

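# WGAN-GP objective: Wasserstein losses for the generator and the
# discriminator, plus a gradient penalty on the discriminator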
losses_list = [
WassersteinGeneratorLoss(),
WassersteinDiscriminatorLoss(),
WassersteinGradientPenalty()
]

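# Use torchgan's ParallelTrainer across the listed GPUs when requested;
# otherwise fall back to the single-device Trainer (CPU if --cpu 1, else cuda:0)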
if args.cpu == 0 and args.multigpu == 1:
trainer = ParallelTrainer(
network_config,
losses_list,
args.list_gpus,
epochs=args.epochs,
sample_size=args.sample_size,
checkpoints=args.checkpoint,
retain_checkpoints=1,
recon=args.reconstructions,
)
else:
if args.cpu == 1:
device = torch.device("cpu")
else:
device = torch.device("cuda:0")
trainer = Trainer(
network_config,
losses_list,
device=device,
epochs=args.epochs,
sample_size=args.sample_size,
checkpoints=args.checkpoint,
retain_checkpoints=1,
recon=args.reconstructions,
)

# Binarize MNIST: PIL mode '1' yields 1-bit images, so the real data is
# binary like the generator's output
dataset = dsets.MNIST(
root=args.data_dir,
train=True,
transform=transforms.Compose([
transforms.Resize((32, 32)),
transforms.Lambda(lambda x: x.convert('1')),
transforms.ToTensor()
]),
download=True)

dataloader = data.DataLoader(
dataset, batch_size=args.batch_size, shuffle=True)

trainer(dataloader)

trainer.complete()