Examples tested and updated, NSF example added

VincentStimper · VincentStimper · commit 733ce34f4629 · 2021-11-25T15:51:16.000+01:00
diff --git a/example/neural-spline-flow.ipynb b/example/neural-spline-flow.ipynb
@@ -0,0 +1,199 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Neural Spline Flow"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Import required packages\n",
+    "import torch\n",
+    "import numpy as np\n",
+    "import normflow as nf\n",
+    "\n",
+    "from sklearn.datasets import make_moons\n",
+    "\n",
+    "from matplotlib import pyplot as plt\n",
+    "\n",
+    "from tqdm import tqdm"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "scrolled": false
+   },
+   "outputs": [],
+   "source": [
+    "# Set up model\n",
+    "\n",
+    "# Define flows\n",
+    "K = 16\n",
+    "torch.manual_seed(0)\n",
+    "\n",
+    "latent_size = 2\n",
+    "hidden_units = 128\n",
+    "hidden_layers = 2\n",
+    "\n",
+    "flows = []\n",
+    "for i in range(K):\n",
+    "    flows += [nf.flows.AutoregressiveRationalQuadraticSpline(latent_size, hidden_layers, hidden_units)]\n",
+    "    flows += [nf.flows.InvertibleAffine(latent_size)]\n",
+    "\n",
+    "# Set prior and q0\n",
+    "q0 = nf.distributions.DiagGaussian(2, trainable=False)\n",
+    "    \n",
+    "# Construct flow model\n",
+    "nfm = nf.NormalizingFlow(q0=q0, flows=flows)\n",
+    "\n",
+    "# Move model on GPU if available\n",
+    "enable_cuda = True\n",
+    "device = torch.device('cuda' if torch.cuda.is_available() and enable_cuda else 'cpu')\n",
+    "nfm = nfm.to(device)\n",
+    "\n",
+    "# Initialize ActNorm\n",
+    "x_np, _ = make_moons(2 ** 9, noise=0.1)\n",
+    "x = torch.tensor(x_np).float().to(device)\n",
+    "_ = nfm.log_prob(x)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "scrolled": false
+   },
+   "outputs": [],
+   "source": [
+    "# Plot prior distribution\n",
+    "x_np, _ = make_moons(2 ** 20, noise=0.1)\n",
+    "plt.figure(figsize=(15, 15))\n",
+    "plt.hist2d(x_np[:, 0], x_np[:, 1], bins=200)\n",
+    "plt.show()\n",
+    "\n",
+    "# Plot initial posterior distribution\n",
+    "grid_size = 100\n",
+    "xx, yy = torch.meshgrid(torch.linspace(-1.5, 2.5, grid_size), torch.linspace(-2, 2, grid_size))\n",
+    "zz = torch.cat([xx.unsqueeze(2), yy.unsqueeze(2)], 2).view(-1, 2)\n",
+    "zz = zz.to(device)\n",
+    "\n",
+    "nfm.eval()\n",
+    "log_prob = nfm.log_prob(zz).to('cpu').view(*xx.shape)\n",
+    "nfm.train()\n",
+    "prob = torch.exp(log_prob)\n",
+    "prob[torch.isnan(prob)] = 0\n",
+    "\n",
+    "plt.figure(figsize=(15, 15))\n",
+    "plt.pcolormesh(xx, yy, prob.data.numpy())\n",
+    "plt.gca().set_aspect('equal', 'box')\n",
+    "plt.show()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "scrolled": false
+   },
+   "outputs": [],
+   "source": [
+    "# Train model\n",
+    "max_iter = 10000\n",
+    "num_samples = 2 ** 9\n",
+    "show_iter = 500\n",
+    "\n",
+    "\n",
+    "loss_hist = np.array([])\n",
+    "\n",
+    "optimizer = torch.optim.Adam(nfm.parameters(), lr=1e-3, weight_decay=1e-5)\n",
+    "for it in tqdm(range(max_iter)):\n",
+    "    optimizer.zero_grad()\n",
+    "    \n",
+    "    # Get training samples\n",
+    "    x_np, _ = make_moons(num_samples, noise=0.1)\n",
+    "    x = torch.tensor(x_np).float().to(device)\n",
+    "    \n",
+    "    # Compute loss\n",
+    "    loss = nfm.forward_kld(x)\n",
+    "    \n",
+    "    # Do backprop and optimizer step\n",
+    "    if ~(torch.isnan(loss) | torch.isinf(loss)):\n",
+    "        loss.backward()\n",
+    "        optimizer.step()\n",
+    "    \n",
+    "    # Make layers Lipschitz continuous\n",
+    "    nf.utils.update_lipschitz(nfm, 5)\n",
+    "    \n",
+    "    # Log loss\n",
+    "    loss_hist = np.append(loss_hist, loss.to('cpu').data.numpy())\n",
+    "    \n",
+    "    # Plot learned posterior\n",
+    "    if (it + 1) % show_iter == 0:\n",
+    "        nfm.eval()\n",
+    "        log_prob = nfm.log_prob(zz)\n",
+    "        nfm.train()\n",
+    "        prob = torch.exp(log_prob.to('cpu').view(*xx.shape))\n",
+    "        prob[torch.isnan(prob)] = 0\n",
+    "\n",
+    "        plt.figure(figsize=(15, 15))\n",
+    "        plt.pcolormesh(xx, yy, prob.data.numpy())\n",
+    "        plt.gca().set_aspect('equal', 'box')\n",
+    "        plt.show()\n",
+    "\n",
+    "# Plot loss\n",
+    "plt.figure(figsize=(10, 10))\n",
+    "plt.plot(loss_hist, label='loss')\n",
+    "plt.legend()\n",
+    "plt.show()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Plot learned posterior distribution\n",
+    "nfm.eval()\n",
+    "log_prob = nfm.log_prob(zz).to('cpu').view(*xx.shape)\n",
+    "nfm.train()\n",
+    "prob = torch.exp(log_prob)\n",
+    "prob[torch.isnan(prob)] = 0\n",
+    "\n",
+    "plt.figure(figsize=(15, 15))\n",
+    "plt.pcolormesh(xx, yy, prob.data.numpy())\n",
+    "plt.gca().set_aspect('equal', 'box')\n",
+    "plt.show()"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3 (ipykernel)",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.8.11"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 4
+}
diff --git a/example/planar.ipynb b/example/planar.ipynb
@@ -38,15 +38,10 @@
     "flows = []\n",
     "for i in range(K):\n",
     "    flows += [nf.flows.Planar((2,))]\n",
-    "#prior = nf.distributions.Sinusoidal(0.2, 4)\n",
-    "prior = nf.distributions.TwoModes(2, 0.1)\n",
-    "#prior = torch.distributions.MultivariateNormal(torch.tensor(np.zeros(2), device=device), \n",
-    "#                                               torch.tensor(np.eye(2), device=device))\n",
-    "#hidden_units_encoder = np.array([2, 4])\n",
-    "#encoder_nn = nf.nets.MLP(hidden_units_encoder)\n",
-    "#q0 = nf.distributions.NNDiagGaussian(encoder_nn)\n",
+    "target = nf.distributions.TwoModes(2, 0.1)\n",
+    "\n",
     "q0 = nf.distributions.DiagGaussian(2)\n",
-    "nfm = nf.NormalizingFlow(q0=q0, flows=flows, p=prior)\n",
+    "nfm = nf.NormalizingFlow(q0=q0, flows=flows, p=target)\n",
     "nfm.to(device)"
    ]
   },
@@ -58,11 +53,11 @@
    },
    "outputs": [],
    "source": [
-    "# Plot prior distribution\n",
+    "# Plot target distribution\n",
     "grid_size = 200\n",
     "xx, yy = torch.meshgrid(torch.linspace(-3, 3, grid_size), torch.linspace(-3, 3, grid_size))\n",
     "z = torch.cat([xx.unsqueeze(2), yy.unsqueeze(2)], 2).view(-1, 2)\n",
-    "log_prob = prior.log_prob(z.to(device)).to('cpu').view(*xx.shape)\n",
+    "log_prob = target.log_prob(z.to(device)).to('cpu').view(*xx.shape)\n",
     "prob = torch.exp(log_prob)\n",
     "\n",
     "plt.figure(figsize=(10, 10))\n",
@@ -142,7 +137,7 @@
  ],
  "metadata": {
   "kernelspec": {
-   "display_name": "Python 3",
+   "display_name": "Python 3 (ipykernel)",
    "language": "python",
    "name": "python3"
   },
@@ -156,7 +151,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.7.6"
+   "version": "3.8.11"
   },
   "pycharm": {
    "stem_cell": {
diff --git a/example/residual.ipynb b/example/residual.ipynb
@@ -193,7 +193,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.8.12"
+   "version": "3.8.11"
   }
  },
  "nbformat": 4,

Original file line number	Diff line number	Diff line change
`@@ -193,7 +193,7 @@`
`193`	`193`	`"name": "python",`
`194`	`194`	`"nbconvert_exporter": "python",`
`195`	`195`	`"pygments_lexer": "ipython3",`
`196`		`- "version": "3.8.12"`
	`196`	`+ "version": "3.8.11"`
`197`	`197`	`}`
`198`	`198`	`},`
`199`	`199`	`"nbformat": 4,`