Add 1D VariationalAutoencoder (#401)

vballoli · BradLarson · web-flow · commit 89abc7eb82ea · 2020-04-28T12:19:52.000-05:00
* Add 1D VariationalAutoencoder

* Add Autoencoder CMake

* Updating for Batcher.

* Reformat main.swift and update the target name in the README.

* Rework test dataset usage.

* Fix CMakeLists.

Co-authored-by: Brad Larson <bradlarson@google.com>
diff --git a/Autoencoder/Autoencoder1D/CMakeLists.txt b/Autoencoder/Autoencoder1D/CMakeLists.txt
@@ -0,0 +1,9 @@
+add_executable(Autoencoder1D  # Executable target built from this directory's main.swift.
+  main.swift)
+target_link_libraries(Autoencoder1D PRIVATE  # Link the Datasets and ModelSupport targets.
+  Datasets
+  ModelSupport)
+
+
+install(TARGETS Autoencoder1D  # Install the built executable into the `bin` destination.
+  DESTINATION bin)
diff --git a/Autoencoder/Autoencoder2D/CMakeLists.txt b/Autoencoder/Autoencoder2D/CMakeLists.txt
@@ -0,0 +1,9 @@
+add_executable(Autoencoder2D  # Executable target built from this directory's main.swift.
+  main.swift)
+target_link_libraries(Autoencoder2D PRIVATE  # Link the Datasets and ModelSupport targets.
+  Datasets
+  ModelSupport)
+
+
+install(TARGETS Autoencoder2D  # Install the built executable into the `bin` destination.
+  DESTINATION bin)
diff --git a/Autoencoder/CMakeLists.txt b/Autoencoder/CMakeLists.txt
@@ -0,0 +1,3 @@
+add_subdirectory(Autoencoder1D)  # Each subdirectory provides its own CMakeLists.txt.
+add_subdirectory(Autoencoder2D)
+add_subdirectory(VAE1D)  # Defines the VariationalAutoencoder1D executable.
diff --git a/Autoencoder/VAE1D/CMakeLists.txt b/Autoencoder/VAE1D/CMakeLists.txt
@@ -0,0 +1,9 @@
+add_executable(VariationalAutoencoder1D  # Executable target built from this directory's main.swift.
+  main.swift)
+target_link_libraries(VariationalAutoencoder1D PRIVATE  # Link the Datasets and ModelSupport targets.
+  Datasets
+  ModelSupport)
+
+
+install(TARGETS VariationalAutoencoder1D  # Install the built executable into the `bin` destination.
+  DESTINATION bin)
diff --git a/Autoencoder/VAE1D/README.md b/Autoencoder/VAE1D/README.md
@@ -0,0 +1,34 @@
+# 1D Variational Autoencoder
+
+This is an example of a simple 1-dimensional Variational Autoencoder model, using MNIST as a training dataset. The Variational Autoencoder is based on the paper "Auto-Encoding Variational Bayes" by [Kingma and Welling](https://arxiv.org/abs/1312.6114). It should produce output similar to the following:
+
+### Epoch 1
+<p align="center">
+<img src="images/epoch-1-input.jpg" height="270" width="360">
+<img src="images/epoch-1-output.jpg" height="270" width="360">
+</p>
+
+### Epoch 10
+<p align="center">
+<img src="images/epoch-10-input.jpg" height="270" width="360">
+<img src="images/epoch-10-output.jpg" height="270" width="360">
+</p>
+
+
+## Setup
+
+To begin, you'll need the [latest version of Swift for
+TensorFlow](https://github.com/tensorflow/swift/blob/master/Installation.md)
+installed. Make sure you've added the correct version of `swift` to your path.
+
+To train the model, run:
+
+```
+swift run -c release VariationalAutoencoder1D
+```
+
+## Key implementations
+
+1. The reparameterization trick is implemented inside the VAE model.
+2. The VAE model returns an `Array` of `Tensor<Float>` values (`[output, mu, logVar]`). `Array` conforms to `Differentiable` when its elements do, so gradients flow through all three. (Reference: [S4TF API Docs](https://www.tensorflow.org/swift/api_docs/Extensions/Array))
+3. The loss function combines the `sigmoidCrossEntropy` between the model output and the input with the KL divergence computed from the latent mean and log-variance.
diff --git a/Autoencoder/VAE1D/images/epoch-1-input.jpg b/Autoencoder/VAE1D/images/epoch-1-input.jpg
diff --git a/Autoencoder/VAE1D/images/epoch-1-output.jpg b/Autoencoder/VAE1D/images/epoch-1-output.jpg
diff --git a/Autoencoder/VAE1D/images/epoch-10-input.jpg b/Autoencoder/VAE1D/images/epoch-10-input.jpg
diff --git a/Autoencoder/VAE1D/images/epoch-10-output.jpg b/Autoencoder/VAE1D/images/epoch-10-output.jpg
diff --git a/Autoencoder/VAE1D/main.swift b/Autoencoder/VAE1D/main.swift
@@ -0,0 +1,134 @@
+// Copyright 2019 The TensorFlow Authors. All Rights Reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+// Based on the paper: "Auto-Encoding Variational Bayes"
+// by Diederik P Kingma and Max Welling
+// Reference implementation: https://github.com/pytorch/examples/blob/master/vae/main.py
+
+import Datasets
+import Foundation
+import ModelSupport
+import TensorFlow
+
+// Number of passes of the outer training loop.
+let epochCount = 10
+// Image dimensions used when reshaping and saving sample images.
+let imageHeight = 28
+let imageWidth = 28
+
+// Directory that sample input/output images are written to.
+let outputFolder = "./output/"
+// Training data, requested in batches of 128 with `flattening: true`.
+let dataset = MNIST(batchSize: 128, flattening: true)
+
+// Width of the model's input layer. Derived from the image dimensions (28 * 28 = 784)
+// so it cannot drift from the shape used when reshaping test images.
+let inputDim = imageHeight * imageWidth
+// Width of the hidden layer in both the encoder and the decoder.
+let hiddenDim = 400
+// Width of the latent mean and log-variance vectors.
+let latentDim = 20
+
+/// A variational autoencoder built from dense layers.
+///
+/// The encoder maps an `inputDim`-wide input to the mean and log-variance of a latent
+/// Gaussian, a latent sample is drawn with the reparameterization trick, and the decoder
+/// maps that sample back to `inputDim` values.
+public struct VAE: Layer {
+    // Encoder: one shared hidden layer followed by two parallel heads.
+    public var encoderDense1: Dense<Float>
+    /// Head whose output is used as the latent mean (`mu`).
+    public var encoderDense2_1: Dense<Float>
+    /// Head whose output is used as the latent log-variance (`logVar`).
+    public var encoderDense2_2: Dense<Float>
+    // Decoder: hidden layer followed by the output layer.
+    public var decoderDense1: Dense<Float>
+    public var decoderDense2: Dense<Float>
+
+    /// Creates the model with layer sizes taken from the file-level `inputDim`,
+    /// `hiddenDim`, and `latentDim` constants.
+    public init() {
+        encoderDense1 = Dense<Float>(inputSize: inputDim, outputSize: hiddenDim, activation: relu)
+        encoderDense2_1 = Dense<Float>(inputSize: hiddenDim, outputSize: latentDim)
+        encoderDense2_2 = Dense<Float>(inputSize: hiddenDim, outputSize: latentDim)
+
+        decoderDense1 = Dense<Float>(inputSize: latentDim, outputSize: hiddenDim, activation: relu)
+        decoderDense2 = Dense<Float>(inputSize: hiddenDim, outputSize: inputDim)
+    }
+
+    /// Encodes `input`, samples a latent vector, and decodes it.
+    ///
+    /// - Parameter input: The tensor fed to the first encoder layer.
+    /// - Returns: `[output, mu, logVar]`: the result of the final decoder layer, followed by
+    ///   the two encoder head outputs used as the latent mean and log-variance.
+    @differentiable
+    public func callAsFunction(_ input: Tensor<Float>) -> [Tensor<Float>] {
+        // Encode: the shared hidden features feed both encoder heads.
+        let hidden = encoderDense1(input)
+        let mu = encoderDense2_1(hidden)
+        let logVar = encoderDense2_2(hidden)
+
+        // Reparameterization trick: z = mu + sigma * noise, with sigma = exp(logVar / 2) and
+        // noise drawn from a normal distribution, so the randomness sits outside the
+        // learned parameters.
+        let sigma = exp(0.5 * logVar)
+        let noise = Tensor<Float>(randomNormal: sigma.shape)
+        let z = mu + noise * sigma
+
+        // Decode: apply the two decoder layers in order.
+        let decoderHidden = decoderDense1(z)
+        let output = decoderDense2(decoderHidden)
+        return [output, mu, logVar]
+    }
+}
+
+var vae = VAE()  // `var`: the optimizer updates the model in place on every training step.
+let optimizer = Adam(for: vae, learningRate: 1e-3)  // Adam optimizer for `vae`, learning rate 1e-3.
+
+/// Computes the VAE loss: a reconstruction term plus a KL divergence term.
+///
+/// - Parameters:
+///   - input: The original input, passed to the cross entropy as `labels`.
+///   - output: The model's reconstruction, passed to the cross entropy as `logits`.
+///   - mu: The latent mean produced by the encoder.
+///   - logVar: The latent log-variance produced by the encoder.
+/// - Returns: The sum of the `_sum`-reduced sigmoid cross entropy between the input and its
+///   reconstruction and the KL divergence computed from `mu` and `logVar`.
+func vaeLossFunction(
+    input: Tensor<Float>, output: Tensor<Float>, mu: Tensor<Float>, logVar: Tensor<Float>
+) -> Tensor<Float> {
+    // Reconstruction term.
+    let reconstructionLoss = sigmoidCrossEntropy(logits: output, labels: input, reduction: _sum)
+
+    // KL term: -0.5 * sum(1 + logVar - mu^2 - exp(logVar)).
+    let klElements = 1 + logVar - pow(mu, 2) - exp(logVar)
+    let klDivergence = -0.5 * klElements.sum()
+
+    return reconstructionLoss + klDivergence
+}
+
+// TODO: Find a cleaner way of extracting individual images that doesn't require a second dataset.
+let singleImageDataset = MNIST(batchSize: 1, flattening: true)  // Batch size 1: presumably one image per batch.
+let individualTestImages = singleImageDataset.test  // The dataset's `test` member.
+var testImageIterator = individualTestImages.sequenced()  // `var`: advanced with `next()` once per epoch.
+
+// Training loop: each epoch first runs the model on one test image (optionally saving
+// the input and output as images), then iterates over the training batches.
+for epoch in 1...epochCount {
+    // Run the model on the next single test image before this epoch's training pass.
+    if let testBatch = testImageIterator.next() {
+        let sampleImage = Tensor(
+            shape: [1, imageHeight * imageWidth], scalars: testBatch.first.scalars)
+
+        // The model returns [output, mu, logVar].
+        let testOutputs = vae(sampleImage)
+        let (testImage, testMu, testLogVar) = (testOutputs[0], testOutputs[1], testOutputs[2])
+
+        // Only write images on the first epoch and on every tenth epoch.
+        let shouldSaveImages = epoch == 1 || epoch % 10 == 0
+        if shouldSaveImages {
+            do {
+                try saveImage(
+                    sampleImage, shape: (imageWidth, imageHeight), format: .grayscale,
+                    directory: outputFolder, name: "epoch-\(epoch)-input")
+                try saveImage(
+                    testImage, shape: (imageWidth, imageHeight), format: .grayscale,
+                    directory: outputFolder, name: "epoch-\(epoch)-output")
+            } catch {
+                // Saving is best-effort: report the failure and keep training.
+                print("Could not save image with error: \(error)")
+            }
+        }
+
+        let sampleLoss = vaeLossFunction(
+            input: sampleImage, output: testImage, mu: testMu, logVar: testLogVar)
+        print("[Epoch: \(epoch)] Loss: \(sampleLoss)")
+    }
+
+    // Training pass: one optimizer step per batch.
+    for batch in dataset.training.sequenced() {
+        let images = batch.first
+
+        // Gradient of the VAE loss with respect to the model parameters.
+        let gradients = TensorFlow.gradient(at: vae) { model -> Tensor<Float> in
+            let outputs = model(images)
+            return vaeLossFunction(
+                input: images, output: outputs[0], mu: outputs[1], logVar: outputs[2])
+        }
+
+        optimizer.update(&vae, along: gradients)
+    }
+}
diff --git a/CMakeLists.txt b/CMakeLists.txt
@@ -86,6 +86,7 @@ set_target_properties(SwiftProtobuf PROPERTIES
   INTERFACE_INCLUDE_DIRECTORIES ${CMAKE_Swift_MODULE_DIRECTORY})
 add_dependencies(SwiftProtobuf swift-protobuf-install)
 
+add_subdirectory(Autoencoder)
 add_subdirectory(Support)
 add_subdirectory(Batcher)
 add_subdirectory(Datasets)
diff --git a/Package.swift b/Package.swift
@@ -56,6 +56,9 @@ let package = Package(
         .target(
             name: "Autoencoder2D", dependencies: ["Datasets", "ModelSupport"],
             path: "Autoencoder/Autoencoder2D"),
+        .target(
+            name: "VariationalAutoencoder1D", dependencies: ["Datasets", "ModelSupport"],
+            path: "Autoencoder/VAE1D"),
         .target(name: "Catch", path: "Catch"),
         .target(name: "Gym-FrozenLake", path: "Gym/FrozenLake"),
         .target(name: "Gym-CartPole", path: "Gym/CartPole"),

Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+add_subdirectory(Autoencoder1D)`
	`2`	`+add_subdirectory(Autoencoder2D)`
	`3`	`+add_subdirectory(VAE1D)`