From e6d3815ce248970db17fd5adaabdd27e5ae719c5 Mon Sep 17 00:00:00 2001
From: GaelVaroquaux <gael.varoquaux@normalesup.org>
Date: Mon, 21 Jan 2013 17:56:10 +0100
Subject: [PATCH 1/7] COSMIT

---
 reconstruction/tv_denoising.py | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/reconstruction/tv_denoising.py b/reconstruction/tv_denoising.py
index 3493bae..235d675 100644
--- a/reconstruction/tv_denoising.py
+++ b/reconstruction/tv_denoising.py
@@ -11,8 +11,9 @@ def div(grad):
         this_res[-1] -= this_grad[-2]
     return res
 
+
 def gradient(img):
-    """ 
+    """
     Compute gradient of an image
 
     Parameters
@@ -26,7 +27,7 @@ def gradient(img):
         Gradient of the image: the i-th component along the first
         axis is the gradient along the i-th axis of the original
         array img
-"""
+    """
     shape = [img.ndim, ] + list(img.shape)
     gradient = np.zeros(shape, dtype=img.dtype)
     # 'Clever' code to have a view of the gradient with dimension i stop
@@ -69,6 +70,7 @@ def dual_gap(im, new, gap, weight):
     dual_gap = (gap**2).sum() + tv_new - im_norm + (new**2).sum()
     return 0.5 / im_norm * dual_gap
 
+
 def tv_denoise_fista(im, weight=50, eps=5.e-5, n_iter_max=200,
                                 check_gap_frequency=3):
 

From d4fa34faecc39cc96dfdaf7e6c6327fd99cb8ef7 Mon Sep 17 00:00:00 2001
From: GaelVaroquaux <gael.varoquaux@normalesup.org>
Date: Mon, 21 Jan 2013 19:33:00 +0100
Subject: [PATCH 2/7] ENH: Add bound constraints in TV

---
 demo_tv_bounds_reconstruction.py      | 75 +++++++++++++++++++++++++++
 reconstruction/forward_backward_tv.py | 15 +++++-
 reconstruction/tv_denoising.py        | 31 ++++++++---
 3 files changed, 113 insertions(+), 8 deletions(-)
 create mode 100644 demo_tv_bounds_reconstruction.py

diff --git a/demo_tv_bounds_reconstruction.py b/demo_tv_bounds_reconstruction.py
new file mode 100644
index 0000000..4eefefc
--- /dev/null
+++ b/demo_tv_bounds_reconstruction.py
@@ -0,0 +1,75 @@
+"""
+Total-variation penalization and bound constraints for tomography reconstruction
+================================================================================
+
+In this example, we reconstruct an image from its tomography projections
+with an uncomplete set of projections (l/8 angles, where l is the linear
+size of the image. For a correct reconstruction without a-priori information,
+one would usually require l or more angles). In addition, noise is added to
+the projections.
+
+In order to reconstruct the original image, we minimize a function that
+is the sum of (i) a L2 data fit term, and (ii) the total variation of the
+image, and bound constraints on the pixel values. Proximal iterations
+using the FISTA scheme are used.
+
+We compare with and without the bounds
+
+This example should take around 1mn to run and plot the results.
+"""
+
+print __doc__
+
+import numpy as np
+from reconstruction.forward_backward_tv import fista_tv
+from reconstruction.projections import build_projection_operator
+from reconstruction.util import generate_synthetic_data
+from time import time
+import matplotlib.pyplot as plt
+
+# Synthetic data
+l = 512
+np.random.seed(0)
+x = generate_synthetic_data(l)
+
+
+# Projection operator and projections data, with noise
+H = build_projection_operator(l, l / 32)
+y = H * x.ravel()[:, np.newaxis]
+y += 5 * np.random.randn(*y.shape)
+
+# Display original data
+plt.figure(figsize=(12, 5))
+plt.subplot(2, 3, 1)
+plt.imshow(x, cmap=plt.cm.gnuplot2, interpolation='nearest', vmin=-.1, vmax=1.2)
+plt.title('original data (256x256)')
+plt.axis('off')
+
+for idx, (val_min, val_max, name) in enumerate([
+                                        (None, None, 'TV'),
+                                        (0, 1, 'TV + interval'),
+                                    ]):
+    # Reconstruction
+    t1 = time()
+    res, energies = fista_tv(y, 50, 100, H, val_min=val_min,
+                             val_max=val_max)
+    t2 = time()
+
+    # Fraction of errors of segmented image wrt ground truth
+    err = np.abs(x - (res[-1] > 0.5)).mean()
+    print "%s: reconstruction done in %f s, %.3f%% segmentation error" % (
+                name, t2 - t1, 100 * err)
+
+    plt.subplot(2, 3, 2 + idx)
+    plt.imshow(res[-1], cmap=plt.cm.gnuplot2, interpolation='nearest', vmin=-.1,
+                vmax=1.2)
+    plt.title('reconstruction with %s' % name)
+    plt.axis('off')
+    ax = plt.subplot(2, 3, 5 + idx)
+    ax.yaxis.set_scale('log')
+    plt.hist(res[-1].ravel(), bins=20, normed=True)
+    plt.yticks(())
+    plt.title('Histogram of pixel intensity')
+    plt.axis('tight')
+
+plt.show()
diff --git a/reconstruction/forward_backward_tv.py b/reconstruction/forward_backward_tv.py
index 692aaa7..f2e50b7 100644
--- a/reconstruction/forward_backward_tv.py
+++ b/reconstruction/forward_backward_tv.py
@@ -11,6 +11,7 @@ def tv_norm(im):
     grad_x2 = np.diff(im, axis=1)
     return np.sqrt(grad_x1[:, :-1]**2 + grad_x2[:-1, :]**2).sum()
 
+
 def tv_norm_anisotropic(im):
     """Compute the anisotropic TV norm of an image"""
     grad_x1 = np.diff(im, axis=0)
@@ -19,7 +20,8 @@ def tv_norm_anisotropic(im):
 
 # ------------------ Proximal iterators ----------------------------
 
-def fista_tv(y, beta, niter, H, verbose=0, mask=None):
+def fista_tv(y, beta, niter, H, verbose=0, mask=None,
+             val_min=None, val_max=None):
     """
     TV regression using FISTA algorithm
     (Fast Iterative Shrinkage/Thresholding Algorithm)
@@ -42,6 +44,12 @@ def fista_tv(y, beta, niter, H, verbose=0, mask=None):
 
     mask : array of bools
 
+    val_min: None or float, optional
+        an optional lower bound constraint on the reconstructed image
+
+    val_max: None or float, optional
+        an optional upper bound constraint on the reconstructed image
+
     Returns
     -------
 
@@ -102,7 +110,8 @@ def fista_tv(y, beta, niter, H, verbose=0, mask=None):
         else:
             tmp2d = tmp.reshape((l, l))
         u_n = tv_denoise_fista(tmp2d,
-                weight=beta*gamma, eps=eps)
+                weight=beta*gamma, eps=eps, val_min=val_min,
+                val_max=val_max)
         t_new = (1 + np.sqrt(1 + 4 * t_old**2))/2.
         t_old = t_new
         x = u_n + (t_old - 1)/t_new * (u_n - u_old)
@@ -218,6 +227,7 @@ def ista_tv(y, beta, niter, H=None):
         energies.append(energy)
     return res, energies
 
+
 def gfb_tv(y, beta, niter, H=None, val_min=0, val_max=1, x0=None,
            stop_tol=1.e-4):
     """
@@ -332,6 +342,7 @@ def gfb_tv(y, beta, niter, H=None, val_min=0, val_max=1, x0=None,
             break
     return res, energies
 
+
 def gfb_tv_local(y, beta, niter, mask_pix, mask_reg, H=None,
                                 val_min=0, val_max=1, x0=None):
     """
diff --git a/reconstruction/tv_denoising.py b/reconstruction/tv_denoising.py
index 235d675..b227a71 100644
--- a/reconstruction/tv_denoising.py
+++ b/reconstruction/tv_denoising.py
@@ -72,8 +72,7 @@ def dual_gap(im, new, gap, weight):
 
 
 def tv_denoise_fista(im, weight=50, eps=5.e-5, n_iter_max=200,
-                                check_gap_frequency=3):
-
+                     check_gap_frequency=3, val_min=None, val_max=None):
     """
     Perform total-variation denoising on 2-d and 3-d images
 
@@ -101,6 +100,12 @@ def tv_denoise_fista(im, weight=50, eps=5.e-5, n_iter_max=200,
     n_iter_max: int, optional
         maximal number of iterations used for the optimization.
 
+    val_min: None or float, optional
+        an optional lower bound constraint on the reconstructed image
+
+    val_max: None or float, optional
+        an optional upper bound constraint on the reconstructed image
+
     Returns
     -------
     out: ndarray
@@ -131,6 +136,7 @@ def tv_denoise_fista(im, weight=50, eps=5.e-5, n_iter_max=200,
     t = 1.
     i = 0
     while i < n_iter_max:
+        # error is the dual variable
         error = weight * div(grad_aux) - im
         grad_tmp = gradient(error)
         grad_tmp *= 1./ (8 * weight)
@@ -141,13 +147,26 @@ def tv_denoise_fista(im, weight=50, eps=5.e-5, n_iter_max=200,
         grad_aux = (1 + t_factor) * grad_tmp - t_factor * grad_im
         grad_im = grad_tmp
         t = t_new
-        if (i % check_gap_frequency) == 0:
+        if (val_min is not None or val_max is not None or
+                                (i % check_gap_frequency) == 0):
             gap = weight * div(grad_im)
+            # Compute the primal variable
             new = im - gap
-            dgap = dual_gap(im, new, gap, weight)
-            if dgap < eps:
-                break
+            if (val_min is not None or val_max is not None):
+                new = new.clip(val_min, val_max, out=new)
+                # Now we need to recompute the dual variable
+                grad_im = gradient(new)
+            if (i % check_gap_frequency) == 0:
+                # In the case of bound constraints, the dual gap as we
+                # computed it may not go to zero.
+                dgap = dual_gap(im, new, gap, weight)
+                if dgap < eps:
+                    break
         i += 1
+    # Compute the primal variable
+    new = im - gap
+    if (val_min is not None or val_max is not None):
+        new = new.clip(val_min, val_max, out=new)
     return new
 
 

From 3f79b118d93032f7ee3e74e8a66d45f93c46cf02 Mon Sep 17 00:00:00 2001
From: GaelVaroquaux <gael.varoquaux@normalesup.org>
Date: Tue, 29 Jan 2013 16:02:13 +0100
Subject: [PATCH 3/7] BUG: Fix tv_denoising fista for 3D

The lipschitz constant was wrong
---
 reconstruction/tv_denoising.py | 47 +++++++++++++++++++++++++++++++---
 1 file changed, 44 insertions(+), 3 deletions(-)

diff --git a/reconstruction/tv_denoising.py b/reconstruction/tv_denoising.py
index b227a71..06d7870 100644
--- a/reconstruction/tv_denoising.py
+++ b/reconstruction/tv_denoising.py
@@ -72,7 +72,8 @@ def dual_gap(im, new, gap, weight):
 
 
 def tv_denoise_fista(im, weight=50, eps=5.e-5, n_iter_max=200,
-                     check_gap_frequency=3, val_min=None, val_max=None):
+                     check_gap_frequency=3, val_min=None, val_max=None,
+                     verbose=False):
     """
     Perform total-variation denoising on 2-d and 3-d images
 
@@ -106,6 +107,9 @@ def tv_denoise_fista(im, weight=50, eps=5.e-5, n_iter_max=200,
     val_max: None or float, optional
         an optional upper bound constraint on the reconstructed image
 
+    verbose: bool, optional
+        if True, plot the dual gap of the optimization
+
     Returns
     -------
     out: ndarray
@@ -135,11 +139,19 @@ def tv_denoise_fista(im, weight=50, eps=5.e-5, n_iter_max=200,
     grad_aux = np.zeros(shape)
     t = 1.
     i = 0
+    if im.ndim == 2:
+        # Upper bound on the Lipschitz constant
+        lipschitz_constant = 9
+    elif im.ndim == 3:
+        lipschitz_constant = 12
+    else:
+        raise ValueError('Cannot compute TV for images that are not '
+                         '2D or 3D')
     while i < n_iter_max:
         # error is the dual variable
         error = weight * div(grad_aux) - im
         grad_tmp = gradient(error)
-        grad_tmp *= 1./ (8 * weight)
+        grad_tmp *= 1./ (lipschitz_constant * weight)
         grad_aux += grad_tmp
         grad_tmp = _projector_on_dual(grad_aux)
         t_new = 1. / 2 * (1 + np.sqrt(1 + 4 * t**2))
@@ -160,6 +172,8 @@ def tv_denoise_fista(im, weight=50, eps=5.e-5, n_iter_max=200,
                 # In the case of bound constraints, the dual gap as we
                 # computed it may not go to zero.
                 dgap = dual_gap(im, new, gap, weight)
+                if verbose:
+                    print 'Iteration % 2i, dual gap: % 6.3e' % (i, dgap)
                 if dgap < eps:
                     break
         i += 1
@@ -170,16 +184,32 @@ def tv_denoise_fista(im, weight=50, eps=5.e-5, n_iter_max=200,
     return new
 
 
+def test_grad_div_adjoint(size=12, random_state=42):
+    # We need to check that <D x, y> = <x, DT y> for x and y random vectors
+    random_state = np.random.RandomState(random_state)
+
+    x = np.random.normal(size=(size, size, size))
+    y = np.random.normal(size=(3, size, size, size))
+
+    np.testing.assert_almost_equal(np.sum(gradient(x) * y),
+                                   -np.sum(x * div(y)))
+
+
+
 if __name__ == '__main__':
+    # First our test
+    test_grad_div_adjoint()
     from scipy.misc import lena
     import matplotlib.pyplot as plt
     from time import time
+
+    # Smoke test on lena
     l = lena().astype(np.float)
     # normalize image between 0 and 1
     l /= l.max()
     l += 0.1 * l.std() * np.random.randn(*l.shape)
     t0 = time()
-    res = tv_denoise_fista(l, weight=0.05, eps=5.e-5)
+    res = tv_denoise_fista(l, weight=2.5, eps=5.e-5, verbose=True)
     t1 = time()
     print t1 - t0
     plt.figure()
@@ -187,4 +217,15 @@ def tv_denoise_fista(im, weight=50, eps=5.e-5, n_iter_max=200,
     plt.imshow(l, cmap='gray')
     plt.subplot(122)
     plt.imshow(res, cmap='gray')
+
+    # Smoke test on a 3D random image with hidden structure
+    img = np.random.normal(size=(12, 24, 24))
+    img[4:8, 8:16, 8:16] += 1.5
+    res = tv_denoise_fista(img, weight=1.5, eps=5.e-5, verbose=True)
+    plt.figure()
+    plt.subplot(121)
+    plt.imshow(img[6], cmap='gray')
+    plt.subplot(122)
+    plt.imshow(res[6], cmap='gray')
+
     plt.show()

From becf21599d022ad98a1dacbb84bbd0b3dd20990b Mon Sep 17 00:00:00 2001
From: GaelVaroquaux <gael.varoquaux@normalesup.org>
Date: Wed, 30 Jan 2013 17:22:30 +0100
Subject: [PATCH 4/7] BUG: fix the constraint TV

---
 reconstruction/tv_denoising.py | 94 +++++++++++++++++++++++-----------
 1 file changed, 64 insertions(+), 30 deletions(-)

diff --git a/reconstruction/tv_denoising.py b/reconstruction/tv_denoising.py
index 06d7870..6a006b1 100644
--- a/reconstruction/tv_denoising.py
+++ b/reconstruction/tv_denoising.py
@@ -131,26 +131,42 @@ def tv_denoise_fista(im, weight=50, eps=5.e-5, n_iter_max=200,
     total variation denoising in "Fast gradient-based algorithms for
     constrained total variation image denoising and deblurring problems"
     (2009).
+
+    For details on implementing the bound constraints, read the Beck and
+    Teboulle paper.
     """
-    if not im.dtype.kind == 'f':
-        im = im.astype(np.float)
-    shape = [im.ndim, ] + list(im.shape)
+    input_img = im
+    if not input_img.dtype.kind == 'f':
+        input_img = input_img.astype(np.float)
+    shape = [input_img.ndim, ] + list(input_img.shape)
     grad_im = np.zeros(shape)
     grad_aux = np.zeros(shape)
     t = 1.
     i = 0
-    if im.ndim == 2:
+    if input_img.ndim == 2:
         # Upper bound on the Lipschitz constant
         lipschitz_constant = 9
-    elif im.ndim == 3:
+    elif input_img.ndim == 3:
         lipschitz_constant = 12
     else:
         raise ValueError('Cannot compute TV for images that are not '
                          '2D or 3D')
+    # negated_output is the negated primal variable in the optimization
+    # loop
+    negated_output = -input_img
+    # Clipping values for the inner loop
+    negated_val_min = np.inf
+    negated_val_max = -np.inf
+    if val_min is not None:
+        negated_val_min = -val_min
+    if val_max is not None:
+        negated_val_max = -val_max
+    if (val_min is not None or val_max is not None):
+        # With bound constraints, the stopping criterion is on the
+        # evolution of the output
+        negated_output_old = negated_output.copy()
     while i < n_iter_max:
-        # error is the dual variable
-        error = weight * div(grad_aux) - im
-        grad_tmp = gradient(error)
+        grad_tmp = gradient(negated_output)
         grad_tmp *= 1./ (lipschitz_constant * weight)
         grad_aux += grad_tmp
         grad_tmp = _projector_on_dual(grad_aux)
@@ -159,29 +175,37 @@ def tv_denoise_fista(im, weight=50, eps=5.e-5, n_iter_max=200,
         grad_aux = (1 + t_factor) * grad_tmp - t_factor * grad_im
         grad_im = grad_tmp
         t = t_new
-        if (val_min is not None or val_max is not None or
-                                (i % check_gap_frequency) == 0):
-            gap = weight * div(grad_im)
-            # Compute the primal variable
-            new = im - gap
-            if (val_min is not None or val_max is not None):
-                new = new.clip(val_min, val_max, out=new)
-                # Now we need to recompute the dual variable
-                grad_im = gradient(new)
-            if (i % check_gap_frequency) == 0:
-                # In the case of bound constraints, the dual gap as we
-                # computed it may not go to zero.
-                dgap = dual_gap(im, new, gap, weight)
+        gap = weight * div(grad_im)
+        # Compute the primal variable
+        negated_output = gap - input_img
+        if (val_min is not None or val_max is not None):
+            negated_output = negated_output.clip(negated_val_max,
+                                negated_val_min,
+                                out=negated_output)
+        if (i % check_gap_frequency) == 0:
+            if val_min is None and val_max is None:
+                # In the case of bound constraints, we don't have
+                # the dual gap
+                dgap = dual_gap(input_img, -negated_output, gap, weight)
                 if verbose:
                     print 'Iteration % 2i, dual gap: % 6.3e' % (i, dgap)
                 if dgap < eps:
                     break
+            else:
+                diff = np.max(np.abs(negated_output_old - negated_output))
+                diff /= np.max(np.abs(negated_output))
+                if verbose:
+                    print 'Iteration % 2i, relative difference: % 6.3e' % (i,
+                                diff)
+                if diff < eps:
+                    break
+                negated_output_old = negated_output
         i += 1
     # Compute the primal variable
-    new = im - gap
+    output = input_img - gap
     if (val_min is not None or val_max is not None):
-        new = new.clip(val_min, val_max, out=new)
-    return new
+        output = output.clip(val_min, val_max, out=output)
+    return output
 
 
 def test_grad_div_adjoint(size=12, random_state=42):
@@ -219,13 +243,23 @@ def test_grad_div_adjoint(size=12, random_state=42):
     plt.imshow(res, cmap='gray')
 
     # Smoke test on a 3D random image with hidden structure
+    np.random.seed(42)
     img = np.random.normal(size=(12, 24, 24))
     img[4:8, 8:16, 8:16] += 1.5
-    res = tv_denoise_fista(img, weight=1.5, eps=5.e-5, verbose=True)
-    plt.figure()
-    plt.subplot(121)
-    plt.imshow(img[6], cmap='gray')
-    plt.subplot(122)
-    plt.imshow(res[6], cmap='gray')
+    res = tv_denoise_fista(img, weight=.6, eps=5.e-5, verbose=True)
+    plt.figure(figsize=(9, 3))
+    plt.subplot(131)
+    plt.imshow(img[6], cmap='gist_earth')
+    plt.title('Original data')
+    plt.subplot(132)
+    plt.imshow(res[6], cmap='gist_earth', vmin=-.1, vmax=.3)
+    plt.title('TV')
+
+    # add constraints
+    res_cons = tv_denoise_fista(img, weight=.6, eps=5.e-5, verbose=True,
+                           val_min=0, val_max=1.5)
+    plt.subplot(133)
+    plt.imshow(res_cons[6], cmap='gist_earth', vmin=-.1, vmax=.3)
+    plt.title('TV + interval')
 
     plt.show()

From b8d16176845bd00e3db5a52f02622675543a5208 Mon Sep 17 00:00:00 2001
From: Alexandre Abraham <abraham.alexandre@gmail.com>
Date: Mon, 4 Feb 2013 11:26:36 +0100
Subject: [PATCH 5/7] BUG: Fix clipping if val_min or val_max is None

---
 reconstruction/tv_denoising.py | 24 ++++++++++++------------
 1 file changed, 12 insertions(+), 12 deletions(-)

diff --git a/reconstruction/tv_denoising.py b/reconstruction/tv_denoising.py
index 6a006b1..3dcc88c 100644
--- a/reconstruction/tv_denoising.py
+++ b/reconstruction/tv_denoising.py
@@ -1,5 +1,6 @@
 import numpy as np
 
+
 def div(grad):
     """ Compute divergence of image gradient """
     res = np.zeros(grad.shape[1:])
@@ -32,7 +33,7 @@ def gradient(img):
     gradient = np.zeros(shape, dtype=img.dtype)
     # 'Clever' code to have a view of the gradient with dimension i stop
     # at -1
-    slice_all = [0, slice(None, -1),]
+    slice_all = [0, slice(None, -1), ]
     for d in range(img.ndim):
         gradient[slice_all] = np.diff(img, axis=d)
         slice_all[0] = d + 1
@@ -45,7 +46,7 @@ def _projector_on_dual(grad):
     modifies in place the gradient to project it
     on the L2 unit ball
     """
-    norm = np.maximum(np.sqrt(np.sum(grad**2, 0)), 1.)
+    norm = np.maximum(np.sqrt(np.sum(grad ** 2, 0)), 1.)
     for grad_comp in grad:
         grad_comp /= norm
     return grad
@@ -57,17 +58,17 @@ def dual_gap(im, new, gap, weight):
     see "Total variation regularization for fMRI-based prediction of behavior",
     by Michel et al. (2011) for a derivation of the dual gap
     """
-    im_norm = (im**2).sum()
+    im_norm = (im ** 2).sum()
     gx, gy = np.zeros_like(new), np.zeros_like(new)
     gx[:-1] = np.diff(new, axis=0)
     gy[:, :-1] = np.diff(new, axis=1)
     if im.ndim == 3:
         gz = np.zeros_like(new)
         gz[..., :-1] = np.diff(new, axis=2)
-        tv_new = 2 * weight * np.sqrt(gx**2 + gy**2 + gz**2).sum()
+        tv_new = 2 * weight * np.sqrt(gx ** 2 + gy ** 2 + gz ** 2).sum()
     else:
-        tv_new = 2 * weight * np.sqrt(gx**2 + gy**2).sum()
-    dual_gap = (gap**2).sum() + tv_new - im_norm + (new**2).sum()
+        tv_new = 2 * weight * np.sqrt(gx ** 2 + gy ** 2).sum()
+    dual_gap = (gap ** 2).sum() + tv_new - im_norm + (new ** 2).sum()
     return 0.5 / im_norm * dual_gap
 
 
@@ -155,8 +156,8 @@ def tv_denoise_fista(im, weight=50, eps=5.e-5, n_iter_max=200,
     # loop
     negated_output = -input_img
     # Clipping values for the inner loop
-    negated_val_min = np.inf
-    negated_val_max = -np.inf
+    negated_val_min = np.nan
+    negated_val_max = np.nan
     if val_min is not None:
         negated_val_min = -val_min
     if val_max is not None:
@@ -167,10 +168,10 @@ def tv_denoise_fista(im, weight=50, eps=5.e-5, n_iter_max=200,
         negated_output_old = negated_output.copy()
     while i < n_iter_max:
         grad_tmp = gradient(negated_output)
-        grad_tmp *= 1./ (lipschitz_constant * weight)
+        grad_tmp *= 1. / (lipschitz_constant * weight)
         grad_aux += grad_tmp
         grad_tmp = _projector_on_dual(grad_aux)
-        t_new = 1. / 2 * (1 + np.sqrt(1 + 4 * t**2))
+        t_new = 1. / 2 * (1 + np.sqrt(1 + 4 * t ** 2))
         t_factor = (t - 1) / t_new
         grad_aux = (1 + t_factor) * grad_tmp - t_factor * grad_im
         grad_im = grad_tmp
@@ -204,7 +205,7 @@ def tv_denoise_fista(im, weight=50, eps=5.e-5, n_iter_max=200,
     # Compute the primal variable
     output = input_img - gap
     if (val_min is not None or val_max is not None):
-        output = output.clip(val_min, val_max, out=output)
+        output = output.clip(-negated_val_min, -negated_val_max, out=output)
     return output
 
 
@@ -219,7 +220,6 @@ def test_grad_div_adjoint(size=12, random_state=42):
                                    -np.sum(x * div(y)))
 
 
-
 if __name__ == '__main__':
     # First our test
     test_grad_div_adjoint()

From 71e9d57506f7aa823b687579f0e7a5d745b984cb Mon Sep 17 00:00:00 2001
From: GaelVaroquaux <gael.varoquaux@normalesup.org>
Date: Mon, 4 Feb 2013 17:16:58 +0100
Subject: [PATCH 6/7] ENH: Prox TV+l1

---
 reconstruction/tv_l1.py | 278 ++++++++++++++++++++++++++++++++++++++++
 1 file changed, 278 insertions(+)
 create mode 100644 reconstruction/tv_l1.py

diff --git a/reconstruction/tv_l1.py b/reconstruction/tv_l1.py
new file mode 100644
index 0000000..3640c21
--- /dev/null
+++ b/reconstruction/tv_l1.py
@@ -0,0 +1,278 @@
+""" LV + l1 proximal operator
+
+The core idea here is to modify the analysis operator in the Beck &
+Teboulle approach (actually Chambolle) to keep the identity and thus to
+end up with an l1.
+"""
+
+import numpy as np
+
+
+def div_id(grad, l1_ratio=1.):
+    """ Compute divergence + id of image gradient + id"""
+    res = np.zeros(grad.shape[1:])
+    # The divergence part
+    for d in range(grad.shape[0] - 1):
+        this_grad = np.rollaxis(grad[d], d)
+        this_res = np.rollaxis(res, d)
+        this_res[:-1] += this_grad[:-1]
+        this_res[1:-1] -= this_grad[:-2]
+        this_res[-1] -= this_grad[-2]
+    # The identity part
+    res -= l1_ratio * grad[-1]
+    return res
+
+
+def gradient_id(img, l1_ratio=1.):
+    """
+    Compute gradient + id of an image
+
+    Parameters
+    ===========
+    img: ndarray
+        N-dimensional image
+
+    Returns
+    =======
+    gradient: ndarray
+        Gradient of the image: the i-th component along the first
+        axis is the gradient along the i-th axis of the original
+        array img
+    """
+    shape = [img.ndim + 1, ] + list(img.shape)
+    gradient = np.zeros(shape, dtype=img.dtype)
+    # The gradient part: 'Clever' code to have a view of the gradient
+    # with dimension i stop at -1
+    slice_all = [0, slice(None, -1),]
+    for d in range(img.ndim):
+        gradient[slice_all] = np.diff(img, axis=d)
+        slice_all[0] = d + 1
+        slice_all.insert(1, slice(None))
+    # The identity part
+    gradient[-1] = l1_ratio * img
+    return gradient
+
+
+def _projector_on_dual(grad):
+    """
+    modifies in place the gradient + id to project it
+    on the l21 unit ball in the gradient direction and the l1 ball in the
+    identity direction
+    """
+    # The l21 ball for the gradient direction
+    norm = np.maximum(np.sqrt(np.sum(grad[:-1]**2, 0)), 1.)
+    for grad_comp in grad[:-1]:
+        grad_comp /= norm
+    # The l1 ball for the identity direction
+    grad[-1] /= np.maximum(np.abs(grad[-1]), 1.)
+    return grad
+
+
+def total_variation(gradient):
+    """ Our total-variation like norm
+    """
+    return (np.sum(np.sqrt(np.sum(gradient[:-1]**2, axis=0)))
+            + np.sum(np.abs(gradient[-1])))
+
+
+def dual_gap(im, new, gap, weight, l1_ratio=1.):
+    """
+    dual gap of total variation denoising
+    see "Total variation regularization for fMRI-based prediction of behavior",
+    by Michel et al. (2011) for a derivation of the dual gap
+    """
+    im_norm = (im**2).sum()
+    tv_new = total_variation(gradient_id(new, l1_ratio=l1_ratio))
+    d_gap = (gap**2).sum() + 2*weight*tv_new - im_norm + (new**2).sum()
+    return 0.5 / im_norm * d_gap
+
+
+def _objective_function(input_img, output_img, gradient, weight):
+    return (.5 * ((input_img - output_img)**2).sum()
+            + weight * total_variation(gradient))
+
+
+def tv_l1_fista(im, l1_ratio=.05, weight=50, eps=5.e-5, n_iter_max=200,
+                     check_gap_frequency=3, val_min=None, val_max=None,
+                     verbose=False, fista=True):
+    """
+    Perform total-variation denoising on 2-d and 3-d images
+
+    Find the argmin `res` of
+        1/2 * ||im - res||^2 + weight * TV(res),
+
+    where TV is the isotropic l1 norm of the gradient.
+
+    Parameters
+    ----------
+    im: ndarray of floats (2-d or 3-d)
+        input data to be denoised. `im` can be of any numeric type,
+        but it is cast into an ndarray of floats for the computation
+        of the denoised image.
+
+    weight: float, optional
+        denoising weight. The greater ``weight``, the more denoising (at
+        the expense of fidelity to ``input``)
+
+    eps: float, optional
+        precision required. The distance to the exact solution is computed
+        by the dual gap of the optimization problem and rescaled by the l2
+        norm of the image (for contrast invariance).
+
+    n_iter_max: int, optional
+        maximal number of iterations used for the optimization.
+
+    val_min: None or float, optional
+        an optional lower bound constraint on the reconstructed image
+
+    val_max: None or float, optional
+        an optional upper bound constraint on the reconstructed image
+
+    verbose: bool, optional
+        if True, plot the dual gap of the optimization
+
+    Returns
+    -------
+    out: ndarray
+        denoised array
+
+    Notes
+    -----
+    The principle of total variation denoising is explained in
+    http://en.wikipedia.org/wiki/Total_variation_denoising
+
+    The principle of total variation denoising is to minimize the
+    total variation of the image, which can be roughly described as
+    the integral of the norm of the image gradient. Total variation
+    denoising tends to produce "cartoon-like" images, that is,
+    piecewise-constant images.
+
+    This function implements the FISTA (Fast Iterative Shrinkage
+    Thresholding Algorithm) algorithm of Beck et Teboulle, adapted to
+    total variation denoising in "Fast gradient-based algorithms for
+    constrained total variation image denoising and deblurring problems"
+    (2009).
+
+    For details on implementing the bound constraints, read the Beck and
+    Teboulle paper.
+    """
+    weight = float(weight)
+    input_img = im
+    if not input_img.dtype.kind == 'f':
+        input_img = input_img.astype(np.float)
+    shape = [input_img.ndim + 1, ] + list(input_img.shape)
+    grad_im = np.zeros(shape)
+    grad_aux = np.zeros(shape)
+    t = 1.
+    i = 0
+    if input_img.ndim == 2:
+        # Upper bound on the Lipschitz constant
+        # Theory tells us that the Lipschitz constant of div * grad is 8
+        lipschitz_constant = 1.1 * (8 + l1_ratio**2)
+    elif input_img.ndim == 3:
+        # Theory tells us that the Lipschitz constant of div * grad is 12
+        lipschitz_constant = 1.1 * (12 + l1_ratio**2)
+    else:
+        raise ValueError('Cannot compute TV for images that are not '
+                         '2D or 3D')
+    # negated_output is the negated primal variable in the optimization
+    # loop
+    negated_output = -input_img
+    # Clipping values for the inner loop
+    negated_val_min = np.inf
+    negated_val_max = -np.inf
+    if val_min is not None:
+        negated_val_min = -val_min
+    if val_max is not None:
+        negated_val_max = -val_max
+    if True or (val_min is not None or val_max is not None):
+        # With bound constraints, the stopping criterion is on the
+        # evolution of the output
+        negated_output_old = negated_output.copy()
+    while i < n_iter_max:
+        grad_tmp = gradient_id(negated_output, l1_ratio=l1_ratio)
+        grad_tmp *= 1. / (lipschitz_constant * weight)
+        grad_aux += grad_tmp
+        grad_tmp = _projector_on_dual(grad_aux)
+        t_new = 1. / 2 * (1 + np.sqrt(1 + 4 * t**2))
+        t_factor = (t - 1) / t_new
+        if fista:
+            grad_aux = (1 + t_factor) * grad_tmp - t_factor * grad_im
+        else:
+            grad_aux = grad_tmp
+        grad_im = grad_tmp
+        t = t_new
+        gap = weight * div_id(grad_aux, l1_ratio=l1_ratio)
+        # Compute the primal variable
+        negated_output = gap - input_img
+        if (val_min is not None or val_max is not None):
+            negated_output = negated_output.clip(negated_val_max,
+                                negated_val_min,
+                                out=negated_output)
+        if (i % check_gap_frequency) == 0:
+            if val_min is None and val_max is None:
+                # In the case of bound constraints, we don't have
+                # the dual gap
+                dgap = dual_gap(input_img, -negated_output, gap, weight,
+                                l1_ratio=l1_ratio)
+                if verbose:
+                    print 'Iteration % 2i, dual gap: % 6.3e' % (i, dgap)
+                if dgap < eps:
+                    break
+            else:
+                diff = np.max(np.abs(negated_output_old - negated_output))
+                diff /= np.max(np.abs(negated_output))
+                if verbose:
+                    print ('Iteration % 2i, relative difference: % 6.3e,'
+                           'energy: % 6.3e, %s' % (i, diff,
+                           _objective_function(input_img,
+                           -negated_output,
+                           gradient_id(negated_output, l1_ratio=l1_ratio),
+                           weight)))
+                if diff < eps:
+                    break
+                negated_output_old = negated_output
+        i += 1
+    # Compute the primal variable, however, here we must use the ista
+    # value, not the fista one
+    output = input_img - weight * div_id(grad_im, l1_ratio=l1_ratio)
+    if (val_min is not None or val_max is not None):
+        output = output.clip(val_min, val_max, out=output)
+    return output
+
+
+def test_grad_div_adjoint(size=12, random_state=42):
+    # We need to check that <D x, y> = <x, DT y> for x and y random vectors
+    random_state = np.random.RandomState(random_state)
+
+    x = np.random.normal(size=(size, size, size))
+    y = np.random.normal(size=(4, size, size, size))
+
+    np.testing.assert_almost_equal(np.sum(gradient_id(x, l1_ratio=2.) * y),
+                                   -np.sum(x * div_id(y, l1_ratio=2.)))
+
+
+if __name__ == '__main__':
+    # First our test
+    test_grad_div_adjoint()
+    import matplotlib.pyplot as plt
+    from time import time
+
+    np.random.seed(0)
+    l = np.zeros((256, 256))
+    l[10:50, 10:50] = 1.2
+    l[-60:-30, 120:220] = 2.
+    l_noisy = l + 3 * l.std() * np.random.randn(*l.shape)
+    t0 = time()
+    res = tv_l1_fista(l, weight=2.5, l1_ratio=.02, eps=1.e-5, verbose=True,
+                      fista=True, n_iter_max=5000)
+    t1 = time()
+    print t1 - t0
+    plt.figure()
+    plt.subplot(121)
+    plt.imshow(l, cmap=plt.cm.gist_earth, vmin=-1., vmax=5.)
+    plt.subplot(122)
+    plt.imshow(res, cmap=plt.cm.gist_earth, vmin=-1., vmax=5.)
+    plt.show()
+
+

From 6431dae2424450273b8cc54868c73b87e60b259a Mon Sep 17 00:00:00 2001
From: GaelVaroquaux <gael.varoquaux@normalesup.org>
Date: Wed, 13 Feb 2013 15:55:27 +0100
Subject: [PATCH 7/7] Small optims in tv_l1 + dual gap

---
 reconstruction/tv_l1.py | 69 +++++++++++++++++++++++++----------------
 1 file changed, 43 insertions(+), 26 deletions(-)

diff --git a/reconstruction/tv_l1.py b/reconstruction/tv_l1.py
index 3640c21..19336aa 100644
--- a/reconstruction/tv_l1.py
+++ b/reconstruction/tv_l1.py
@@ -55,16 +55,19 @@ def gradient_id(img, l1_ratio=1.):
 
 def _projector_on_dual(grad):
     """
-    modifies in place the gradient + id to project it
+    modifies IN PLACE the gradient + id to project it
     on the l21 unit ball in the gradient direction and the l1 ball in the
     identity direction
     """
     # The l21 ball for the gradient direction
-    norm = np.maximum(np.sqrt(np.sum(grad[:-1]**2, 0)), 1.)
+    norm = np.sqrt(np.sum(grad[:-1]**2, 0))
+    norm.clip(1., out=norm)
     for grad_comp in grad[:-1]:
         grad_comp /= norm
     # The l1 ball for the identity direction
-    grad[-1] /= np.maximum(np.abs(grad[-1]), 1.)
+    norm = np.abs(grad[-1])
+    norm.clip(1., out=norm)
+    grad[-1] /= norm
     return grad
 
 
@@ -75,16 +78,15 @@ def total_variation(gradient):
             + np.sum(np.abs(gradient[-1])))
 
 
-def dual_gap(im, new, gap, weight, l1_ratio=1.):
+def dual_gap(input_img_norm, new, gap, weight, l1_ratio=1.):
     """
     dual gap of total variation denoising
     see "Total variation regularization for fMRI-based prediction of behavior",
     by Michel et al. (2011) for a derivation of the dual gap
     """
-    im_norm = (im**2).sum()
     tv_new = total_variation(gradient_id(new, l1_ratio=l1_ratio))
-    d_gap = (gap**2).sum() + 2*weight*tv_new - im_norm + (new**2).sum()
-    return 0.5 / im_norm * d_gap
+    d_gap = (gap**2).sum() + 2*weight*tv_new - input_img_norm + (new**2).sum()
+    return 0.5 / input_img_norm * d_gap
 
 
 def _objective_function(input_img, output_img, gradient, weight):
@@ -92,9 +94,11 @@ def _objective_function(input_img, output_img, gradient, weight):
             + weight * total_variation(gradient))
 
 
-def tv_l1_fista(im, l1_ratio=.05, weight=50, eps=5.e-5, n_iter_max=200,
-                     check_gap_frequency=3, val_min=None, val_max=None,
-                     verbose=False, fista=True):
+@profile
+def tv_l1_fista(im, l1_ratio=.05, weight=50, dgap_tol=5.e-5, x_tol=None,
+                     n_iter_max=200,
+                     check_gap_frequency=4, val_min=None, val_max=None,
+                     verbose=True, fista=True):
     """
     Perform total-variation denoising on 2-d and 3-d images
 
@@ -114,10 +118,15 @@ def tv_l1_fista(im, l1_ratio=.05, weight=50, eps=5.e-5, n_iter_max=200,
         denoising weight. The greater ``weight``, the more denoising (at
         the expense of fidelity to ``input``)
 
-    eps: float, optional
+    dgap_tol: float, optional
         precision required. The distance to the exact solution is computed
-        by the dual gap of the optimization problem and rescaled by the l2
-        norm of the image (for contrast invariance).
+        by the dual gap of the optimization problem and rescaled by the
+        squared l2 norm of the image (for contrast invariance).
+
+    x_tol: float or None, optional
+        The maximal relative difference between input and output. If
+        specified, this specifies a stopping criterion on x, rather than
+        the dual gap
 
     n_iter_max: int, optional
         maximal number of iterations used for the optimization.
@@ -158,6 +167,7 @@ def tv_l1_fista(im, l1_ratio=.05, weight=50, eps=5.e-5, n_iter_max=200,
     """
     weight = float(weight)
     input_img = im
+    input_img_norm = (im ** 2).sum()
     if not input_img.dtype.kind == 'f':
         input_img = input_img.astype(np.float)
     shape = [input_img.ndim + 1, ] + list(input_img.shape)
@@ -189,11 +199,15 @@ def tv_l1_fista(im, l1_ratio=.05, weight=50, eps=5.e-5, n_iter_max=200,
         # With bound constraints, the stopping criterion is on the
         # evolution of the output
         negated_output_old = negated_output.copy()
+    grad_tmp = None
     while i < n_iter_max:
         grad_tmp = gradient_id(negated_output, l1_ratio=l1_ratio)
         grad_tmp *= 1. / (lipschitz_constant * weight)
         grad_aux += grad_tmp
         grad_tmp = _projector_on_dual(grad_aux)
+        # Carefull, in the next few lines, grad_tmp and grad_aux are a
+        # view on the same array, as _projector_on_dual returns a view
+        # on the input array
         t_new = 1. / 2 * (1 + np.sqrt(1 + 4 * t**2))
         t_factor = (t - 1) / t_new
         if fista:
@@ -210,26 +224,29 @@ def tv_l1_fista(im, l1_ratio=.05, weight=50, eps=5.e-5, n_iter_max=200,
                                 negated_val_min,
                                 out=negated_output)
         if (i % check_gap_frequency) == 0:
-            if val_min is None and val_max is None:
-                # In the case of bound constraints, we don't have
-                # the dual gap
-                dgap = dual_gap(input_img, -negated_output, gap, weight,
-                                l1_ratio=l1_ratio)
+            if x_tol is None:
+                # Stopping criterion based on the dual_gap
+                if val_min is not None or val_max is not None:
+                    # We need to recompute the dual variable
+                    gap = negated_output + input_img
+                dgap = dual_gap(input_img_norm, -negated_output,
+                                gap, weight, l1_ratio=l1_ratio)
                 if verbose:
                     print 'Iteration % 2i, dual gap: % 6.3e' % (i, dgap)
-                if dgap < eps:
+                if dgap < dgap_tol:
                     break
             else:
+                # Stopping criterion based on x_tol
                 diff = np.max(np.abs(negated_output_old - negated_output))
                 diff /= np.max(np.abs(negated_output))
                 if verbose:
                     print ('Iteration % 2i, relative difference: % 6.3e,'
-                           'energy: % 6.3e, %s' % (i, diff,
+                           'energy: % 6.3e' % (i, diff,
                            _objective_function(input_img,
-                           -negated_output,
-                           gradient_id(negated_output, l1_ratio=l1_ratio),
-                           weight)))
-                if diff < eps:
+                                -negated_output,
+                                gradient_id(negated_output, l1_ratio=l1_ratio),
+                                weight)))
+                if diff < x_tol:
                     break
                 negated_output_old = negated_output
         i += 1
@@ -264,8 +281,8 @@ def test_grad_div_adjoint(size=12, random_state=42):
     l[-60:-30, 120:220] = 2.
     l_noisy = l + 3 * l.std() * np.random.randn(*l.shape)
     t0 = time()
-    res = tv_l1_fista(l, weight=2.5, l1_ratio=.02, eps=1.e-5, verbose=True,
-                      fista=True, n_iter_max=5000)
+    res = tv_l1_fista(l, weight=2.5, l1_ratio=.02, dgap_tol=1.e-5,
+                      verbose=True, fista=True, n_iter_max=5000)
     t1 = time()
     print t1 - t0
     plt.figure()