update experiments

jaanli · jaanli · commit 567ec7475914 · 2016-08-15T11:50:08.000-07:00
diff --git a/README.md b/README.md
@@ -1,2 +1,4 @@
 # vae
 Variational Autoencoder or Deep Latent Gaussian Model demo
+
+Blog post: https://jaan.io/unreasonable-confusion/
diff --git a/vae.py b/vae.py
@@ -1,12 +1,17 @@
+import itertools
+import matplotlib as mpl
 import numpy as np
 import os
 import tensorflow as tf
 import tensorflow.contrib.slim as slim
 import time
+import seaborn as sns
 
+from matplotlib import pyplot as plt
 from scipy.misc import imsave
 from tensorflow.contrib.learn.python.learn.datasets.mnist import read_data_sets
 
+sns.set_style('whitegrid')
 
 sg = tf.contrib.bayesflow.stochastic_graph
 distributions = tf.contrib.distributions
@@ -15,10 +20,11 @@
 flags = tf.app.flags
 flags.DEFINE_string('data_dir', '/tmp/data/', 'Directory for storing data')
 flags.DEFINE_string('logdir', '/tmp/logs/', 'Directory for storing data')
-flags.DEFINE_integer('latent_dim', 100, 'Latent dimensionality of model')
+flags.DEFINE_integer('latent_dim', 2, 'Latent dimensionality of model')
 flags.DEFINE_integer('batch_size', 64, 'Minibatch size')
 flags.DEFINE_integer('n_samples', 10, 'Number of samples to save')
-flags.DEFINE_integer('print_every', 1000, 'Print every n iterations')
+flags.DEFINE_integer('print_every', 10, 'Print every n iterations')
+flags.DEFINE_integer('hidden_size', 200, 'Hidden size for neural networks')
 
 FLAGS = flags.FLAGS
 
@@ -41,7 +47,10 @@ def inference_network(x, latent_dim, hidden_size):
     net = slim.fully_connected(net, hidden_size)
     gaussian_params = slim.fully_connected(
         net, latent_dim * 2, activation_fn=None)
+  # The mean parameter is unconstrained
   mu = gaussian_params[:, :latent_dim]
+  # The standard deviation must be positive. Parametrize with a softplus and
+  # add a small epsilon for numerical stability
   sigma = 1e-6 + tf.nn.softplus(gaussian_params[:, latent_dim:])
   return mu, sigma
 
@@ -67,7 +76,7 @@ def generative_network(z, hidden_size):
 def train():
   # Train a Variational Autoencoder on MNIST
 
-  # Input placehoolders
+  # Input placeholders
   with tf.name_scope('data'):
     x = tf.placeholder(tf.float32, [None, 28, 28, 1])
     tf.image_summary('data', x, max_images=10)
@@ -76,39 +85,52 @@ def train():
   with tf.variable_scope('variational'):
     q_mu, q_sigma = inference_network(x=x,
                                       latent_dim=FLAGS.latent_dim,
-                                      hidden_size=200)
+                                      hidden_size=FLAGS.hidden_size)
     with sg.value_type(sg.SampleAndReshapeValue()):
+      # The variational distribution is a Normal with mean and standard
+      # deviation given by the inference network
       q_z = sg.DistributionTensor(distributions.Normal, mu=q_mu, sigma=q_sigma)
 
   with tf.variable_scope('model'):
-    p_x_given_z_logits = generative_network(z=q_z, hidden_size=200)
-    posterior_predictive = distributions.Bernoulli(logits=p_x_given_z_logits)
-    posterior_predictive_samples = posterior_predictive.sample()
+    # The likelihood is Bernoulli-distributed with logits given by the
+    # generative network
+    p_x_given_z_logits = generative_network(z=q_z,
+                                            hidden_size=FLAGS.hidden_size)
+    p_x_given_z = distributions.Bernoulli(logits=p_x_given_z_logits)
+    posterior_predictive_samples = p_x_given_z.sample()
     tf.image_summary('posterior_predictive',
                      tf.cast(posterior_predictive_samples, tf.float32),
                      max_images=10)
 
-
+  # Take samples from the prior
   with tf.variable_scope('model', reuse=True):
     p_z = distributions.Normal(mu=np.zeros(FLAGS.latent_dim, dtype=np.float32),
                                sigma=np.ones(FLAGS.latent_dim, dtype=np.float32))
     p_z_sample = p_z.sample_n(FLAGS.n_samples)
-    p_x_given_z_logits = generative_network(z=p_z_sample, hidden_size=200)
+    p_x_given_z_logits = generative_network(z=p_z_sample,
+                                            hidden_size=FLAGS.hidden_size)
     prior_predictive = distributions.Bernoulli(logits=p_x_given_z_logits)
     prior_predictive_samples = prior_predictive.sample()
     tf.image_summary('prior_predictive',
                      tf.cast(prior_predictive_samples, tf.float32),
                      max_images=10)
 
+  # Sample images for latent values fed in through a placeholder
+  with tf.variable_scope('model', reuse=True):
+    z_input = tf.placeholder(tf.float32, [None, FLAGS.latent_dim])
+    p_x_given_z_logits = generative_network(z=z_input,
+                                            hidden_size=FLAGS.hidden_size)
+    prior_predictive_inp = distributions.Bernoulli(logits=p_x_given_z_logits)
+    prior_predictive_inp_sample = prior_predictive_inp.sample()
 
   # Build the evidence lower bound (ELBO) or the negative loss
   kl = tf.reduce_sum(distributions.kl(q_z.distribution, p_z), 1)
-  expected_log_likelihood = tf.reduce_sum(posterior_predictive.log_pmf(x),
+  expected_log_likelihood = tf.reduce_sum(p_x_given_z.log_pmf(x),
                                           [1, 2, 3])
 
   elbo = tf.reduce_sum(expected_log_likelihood - kl, 0)
 
-  optimizer = tf.train.AdamOptimizer(learning_rate=0.001)
+  optimizer = tf.train.RMSPropOptimizer(learning_rate=0.001)
 
   train_op = optimizer.minimize(-elbo)
 
@@ -126,11 +148,17 @@ def train():
   print('Saving TensorBoard summaries and images to: %s' % FLAGS.logdir)
   train_writer = tf.train.SummaryWriter(FLAGS.logdir, sess.graph)
 
-  for i in range(100000):
+  # Get fixed MNIST digits for plotting posterior means during training
+  np_x_fixed, np_y = mnist.test.next_batch(5000)
+  np_x_fixed = np_x_fixed.reshape(5000, 28, 28, 1)
+  np_x_fixed = (np_x_fixed > 0.5).astype(np.float32)
+
+  for i in range(1000):
+    # Re-binarize the data at every batch; this improves results
     np_x, _ = mnist.train.next_batch(FLAGS.batch_size)
     np_x = np_x.reshape(FLAGS.batch_size, 28, 28, 1)
     np_x = (np_x > 0.5).astype(np.float32)
-    sess.run(train_op, feed_dict={x: np_x})
+    sess.run(train_op, {x: np_x})
 
     # Print progress and save samples every so often
     t0 = time.time()
@@ -157,6 +185,47 @@ def train():
             FLAGS.logdir, 'iter_%d_prior_predictive_%d.jpg' % (i, k))
         imsave(f_name, np_prior_samples[k, :, :, 0])
 
+      # Plot the posterior means of the fixed test digits in latent space
+      if FLAGS.latent_dim == 2:
+        np_q_mu = sess.run(q_mu, {x: np_x_fixed})
+        cmap = mpl.colors.ListedColormap(sns.color_palette("husl"))
+        f, ax = plt.subplots(1, figsize=(6 * 1.1618, 6))
+        im = ax.scatter(np_q_mu[:, 0], np_q_mu[:, 1], c=np.argmax(np_y, 1), cmap=cmap,
+                    alpha=0.7)
+        ax.set_xlabel('First dimension of sampled latent variable $z_1$')
+        ax.set_ylabel('Second dimension of sampled latent variable mean $z_2$')
+        ax.set_xlim([-10., 10.])
+        ax.set_ylim([-10., 10.])
+        f.colorbar(im, ax=ax, label='Digit class')
+        plt.tight_layout()
+        plt.savefig(os.path.join(FLAGS.logdir,
+                                 'posterior_predictive_map_frame_%d.png' % i))
+        plt.close()
+
+        nx = ny = 20
+        x_values = np.linspace(-3, 3, nx)
+        y_values = np.linspace(-3, 3, ny)
+        canvas = np.empty((28*ny, 28*nx))
+        for ii, yi in enumerate(x_values):
+          for j, xi in enumerate(y_values):
+            np_z = np.array([[xi, yi]])
+            x_mean = sess.run(prior_predictive_inp_sample, {z_input: np_z})
+            canvas[(nx-ii-1)*28:(nx-ii)*28, j*28:(j+1)*28] = x_mean[0].reshape(28, 28)
+        imsave(os.path.join(FLAGS.logdir,
+                            'prior_predictive_map_frame_%d.png' % i), canvas)
+        # plt.figure(figsize=(8, 10))
+        # Xi, Yi = np.meshgrid(x_values, y_values)
+        # plt.imshow(canvas, origin="upper")
+        # plt.tight_layout()
+        # plt.savefig()
+
+  # Make the gifs
+  os.system(
+      'convert -delay 15 -loop 0 {0}/posterior_predictive_map_frame*png {0}/posterior_predictive.gif'
+          .format(FLAGS.logdir))
+  os.system(
+      'convert -delay 15 -loop 0 {0}/prior_predictive_map_frame*png {0}/prior_predictive.gif'
+          .format(FLAGS.logdir))
 
 def main(_):
   if tf.gfile.Exists(FLAGS.logdir):

-Original file line number
+Diff line change
@@ @@ -1,2 +1,4 @@ @@
 # vae
 Variational Autoencoder or Deep Latent Gaussian Model demo
++
 +Blog post: https://jaan.io/unreasonable-confusion/