[gegl] move lohalo to nohalo and replace lohalo internals with Mitchell-Netravali + EWA Robidoux

From: Nicolas Robidoux <nrobidoux src gnome org>
To: commits-list gnome org
Cc:
Subject: [gegl] move lohalo to nohalo and replace lohalo internals with Mitchell-Netravali + EWA Robidoux
Date: Mon, 31 Dec 2012 19:23:35 +0000 (UTC)
commit 9a73547158c4b5b834d8a31b2a6e015f92656fa4
Author: Nicolas Robidoux <nrobidoux git gnome org>
Date:   Mon Dec 31 13:57:33 2012 -0500

    move lohalo to nohalo and replace lohalo internals with Mitchell-Netravali + EWA Robidoux

 gegl/buffer/Makefile.am               |    2 +
 gegl/buffer/gegl-buffer-access.c      |    1 +
 gegl/buffer/gegl-buffer.c             |    3 +-
 gegl/buffer/gegl-buffer.h             |    6 +-
 gegl/buffer/gegl-sampler-lohalo.c     | 2951 ++++++++++-----------------------
 gegl/buffer/gegl-sampler-nohalo.c     | 2677 ++++++++++++++++++++++++++++++
 gegl/buffer/gegl-sampler-nohalo.h     |   49 +
 gegl/buffer/gegl-sampler.c            |    6 +
 gegl/gegl-enums.h                     |    1 +
 operations/common/polar-coordinates.c |    2 +-
 operations/transform/transform-core.c |    2 +-
 operations/workshop/fractal-trace.c   |   16 +-
 operations/workshop/whirl-pinch.c     |    2 +-
 13 files changed, 3651 insertions(+), 2067 deletions(-)
---
diff --git a/gegl/buffer/Makefile.am b/gegl/buffer/Makefile.am
index 1a76bbb..806a717 100644
--- a/gegl/buffer/Makefile.am
+++ b/gegl/buffer/Makefile.am
@@ -30,6 +30,7 @@ libbuffer_la_SOURCES = \
     gegl-sampler-cubic.c	\
     gegl-sampler-linear.c	\
     gegl-sampler-nearest.c	\
+    gegl-sampler-nohalo.c       \
     gegl-sampler-lohalo.c       \
     gegl-region-generic.c	\
     gegl-tile.c			\
@@ -59,6 +60,7 @@ libbuffer_la_SOURCES = \
     gegl-sampler-cubic.h	\
     gegl-sampler-linear.h	\
     gegl-sampler-nearest.h	\
+    gegl-sampler-nohalo.h       \
     gegl-sampler-lohalo.h       \
     gegl-region.h		\
     gegl-region-generic.h	\
diff --git a/gegl/buffer/gegl-buffer-access.c b/gegl/buffer/gegl-buffer-access.c
index 359bd5e..6aa7e09 100644
--- a/gegl/buffer/gegl-buffer-access.c
+++ b/gegl/buffer/gegl-buffer-access.c
@@ -35,6 +35,7 @@
 #include "gegl-sampler-nearest.h"
 #include "gegl-sampler-linear.h"
 #include "gegl-sampler-cubic.h"
+#include "gegl-sampler-nohalo.h"
 #include "gegl-sampler-lohalo.h"
 #include "gegl-buffer-index.h"
 #include "gegl-tile-backend.h"
diff --git a/gegl/buffer/gegl-buffer.c b/gegl/buffer/gegl-buffer.c
index 874eede..ec4537c 100644
--- a/gegl/buffer/gegl-buffer.c
+++ b/gegl/buffer/gegl-buffer.c
@@ -56,6 +56,7 @@
 #include "gegl-sampler-nearest.h"
 #include "gegl-sampler-linear.h"
 #include "gegl-sampler-cubic.h"
+#include "gegl-sampler-nohalo.h"
 #include "gegl-sampler-lohalo.h"
 #include "gegl-types-internal.h"
 #include "gegl-utils.h"
@@ -745,7 +746,7 @@ gegl_buffer_constructor (GType                  type,
       /* Don't have the abyss track the extent if the intersection is
        * not the entire extent. Otherwise, setting the extent identical
        * to itself could suddenly make the abyss bigger. */
-      if (buffer->abyss_tracks_extent && 
+      if (buffer->abyss_tracks_extent &&
           (buffer->extent.x      != self.x ||
            buffer->extent.y      != self.y ||
            buffer->extent.width  != self.width ||
diff --git a/gegl/buffer/gegl-buffer.h b/gegl/buffer/gegl-buffer.h
index 0d2d507..cdb0e45 100644
--- a/gegl/buffer/gegl-buffer.h
+++ b/gegl/buffer/gegl-buffer.h
@@ -405,7 +405,8 @@ GeglBuffer *    gegl_buffer_dup               (GeglBuffer       *buffer);
  * @format: the format to store the sampled color in.
  * @sampler_type: the sampler type to use,
  * to be ported from working code. Valid values: GEGL_SAMPLER_NEAREST,
- * GEGL_SAMPLER_LINEAR, GEGL_SAMPLER_CUBIC and GEGL_SAMPLER_LOHALO
+ * GEGL_SAMPLER_LINEAR, GEGL_SAMPLER_CUBIC, GEGL_SAMPLER_NOHALO and
+ * GEGL_SAMPLER_LOHALO
  * @repeat_mode: how requests outside the buffer extent are handled.
  * Valid values: GEGL_ABYSS_NONE (abyss pixels are zeroed), GEGL_ABYSS_WHITE
  * (abyss pixels are white), GEGL_ABYSS_BLACK (abyss pixels are black),
@@ -455,7 +456,8 @@ GeglSamplerType gegl_sampler_type_from_string (const gchar *string);
  * @format: format we want data back in
  * @sampler_type: the sampler type to use,
  * to be ported from working code. Valid values: GEGL_SAMPLER_NEAREST,
- * GEGL_SAMPLER_LINEAR, GEGL_SAMPLER_CUBIC and GEGL_SAMPLER_LOHALO
+ * GEGL_SAMPLER_LINEAR, GEGL_SAMPLER_CUBIC, GEGL_SAMPLER_NOHALO and
+ * GEGL_SAMPLER_LOHALO
  *
  * Create a new sampler, when you are done with the sampler, g_object_unref
  * it.
diff --git a/gegl/buffer/gegl-sampler-lohalo.c b/gegl/buffer/gegl-sampler-lohalo.c
index acf17ae..fa03a59 100644
--- a/gegl/buffer/gegl-sampler-lohalo.c
+++ b/gegl/buffer/gegl-sampler-lohalo.c
@@ -15,8 +15,6 @@
  * <http://www.gnu.org/licenses/>.
  *
  * 2012 (c) Nicolas Robidoux
- * 2009-2011 (c) Nicolas Robidoux, Adam Turcotte, Chantal Racette,
- * Anthony Thyssen, John Cupitt and Ãyvind KolÃs.
  */
 
 /*
@@ -25,14 +23,19 @@
  * ==============
  *
  * The Lohalo ("Low Halo") sampler is a Jacobian-adaptive blend of
- * LBB-Nohalo (Nohalo subdivision with Locally Bounded Bicubic
- * interpolation) and Clamped EWA (Elliptical Weighted Averaging)
- * filtering with the "teepee" (radial tent, that is, conical) kernel.
+ * sigmoidized tensor filtering with the Mitchell-Netravali Keys cubic
+ * filter used as an upsampler (thus is unscaled), with
+ * non-sigmoidized (plain linear light) EWA (Elliptical Weighted
+ * Averaging) filtering with the Robidoux Keys cubic, which is used
+ * whenever some downsampling occurs and consequently is appropriately
+ * scaled.
  *
  * WARNING: This version of Lohalo only gives top quality results down
- * to about a downsampling of about ratio 1/(LOHALO_OFFSET_0+0.5).
+ * to about a downsampling of about ratio 2/(LOHALO_OFFSET_0+0.5).
  * Beyond that, the quality is somewhat lower (due to the use of
- * higher level mipmap data).
+ * higher level mipmap data instead of "level 0" unfiltered input
+ * data). (The "2" in the numerator is because the radius of the
+ * Robidoux EWA filter is 2.)
  *
  * The use of mipmap data is not a feature of the resampling methods
  * themselves: It is done to accommodate GEGL's preferred pixel data
@@ -40,69 +43,64 @@
  */
 
 /*
- * Reference:
+ * Credits and thanks:
  *
- * Nohalo subdivision (with bilinear instead of LBB "finish") is
- * documented in
+ * This code owes a lot to R&D performed for ImageMagick by
+ * N. Robidoux and Anthony Thyssen, and student research performed by
+ * A. Turcotte and C. Racette.
  *
- *   Robidoux, N., Gong, M., Cupitt, J., Turcotte, A., and Martinez,
- *   K.  CPU, SMP and GPU implementations of Nohalo level 1, a fast
- *   co-convex antialiasing image resampler.  In Proceedings of
- *   C3S2E. 2009, 185-195.
- */
-
-/*
- * Credits and thanks:
+ * Sigmoidization was invented by N. Robidoux as a method of
+ * minimizing the over and undershoots that arise out of filtering
+ * with kernel with one more negative lobe. It basically consists of
+ * resampling through a colorspace in which gamut extremes are "far"
+ * from midtones.
  *
  * Jacobian adaptive resampling was developed by N. Robidoux and
  * A. Turcotte of the Department of Mathematics and Computer Science
  * of Laurentian University in the course of A. Turcotte's Masters in
- * Computational Sciences. Later development was done while
- * N. Robidoux was an independent consultant.
+ * Computational Sciences (even though the eventual thesis did not
+ * include this topic). Ãyvind KolÃs and Michael Natterer contributed
+ * much to the GEGL implementation.
  *
- * Nohalo with LBB finishing scheme was developed by N. Robidoux and
- * C. Racette of the Department of Mathematics and Computer Science of
- * Laurentian University in the course of C. Racette's Masters in
- * Computational Sciences. Preliminary work on Nohalo and monotone
- * interpolation was performed by C. Racette and N. Robidoux in the
- * course of her honours thesis, by N. Robidoux, A. Turcotte and Eric
- * Daoust during Google Summer of Code 2009, and is based on 2009 work
- * by N. Robidoux, A. Turcotte, J. Cupitt, Minglun Gong and Kirk
- * Martinez. The Better Image Resampling project was started by
- * Minglun Gong, A. Turcotte and N. Robidoux in 2007.
+ * The Robidoux Keys cubic filter was developed by N. Robidoux and is
+ * based on earlier research by A. Thyssen on the use of cubic
+ * filters, like Mitchell-Netravali, for Elliptical Weighted
+ * Averaging.
  *
- * Clamped EWA with the teepee (radial version of the (Mexican) "hat"
- * or "triangle") filter kernel was developed by N. Robidoux and
- * A. Thyssen the assistance of C. Racette and Frederick Weinhaus. It
- * is based on methods of Paul Heckbert and Andreas Gustaffson (and
- * possibly others).
+ * Clamped EWA was developed by N. Robidoux and A. Thyssen with the
+ * assistance of Chantal Racette and Frederick Weinhaus. It is based
+ * on methods of Paul Heckbert, Andreas Gustaffson and almost
+ * certainly other researchers.
  *
- * N. Robidoux's early research on Nohalo funded in part by an NSERC
- * (National Science and Engineering Research Council of Canada)
- * Discovery Grant awarded to him (298424--2004). This, together with
- * M. Gong's own Discovery grant and A. Turcotte's NSERC USRA
- * (Undergraduate Summer Research Assistantship) funded the very
- * earliest stages of this project.
+ * Fast computation methods for Keys cubic weights were developed by
+ * N. Robidoux. Variants are used by the VIPS and ImageMagick
+ * libraries.
  *
- * A. Turcotte's image resampling research on reduced halo methods and
- * jacobian adaptive methods funded in part by an OGS (Ontario
- * Graduate Scholarship) and an NSERC Alexander Graham Bell Canada
- * Graduate Scholarhip awarded to him, by GSoC (Google Summer of Code)
- * 2010 funding awarded to GIMP (Gnu Image Manipulation Program), and
- * by Laurentian University research funding provided by N. Robidoux
- * and Ralf Meyer.
+ * A. Turcotte's image resampling research on Jacobian adaptive
+ * methods funded in part by an OGS (Ontario Graduate Scholarship) and
+ * an NSERC Alexander Graham Bell Canada Graduate Scholarhip awarded
+ * to him, by GSoC (Google Summer of Code) 2010 funding awarded to
+ * GIMP (Gnu Image Manipulation Program), and by Laurentian University
+ * research funding provided by N. Robidoux and Ralf Meyer.
  *
  * C. Racette's image resampling research and programming funded in
  * part by a NSERC Discovery Grant awarded to Julien Dompierre
  * (20-61098) and by a NSERC Alexander Graham Bell Canada Graduate
  * Scholarship awarded to her.
  *
- * E. Daoust's image resampling programming was funded by GSoC 2010
- * funding awarded to GIMP.
+ * N. Robidoux's development of fast formulas for the computation of
+ * Mitchell-Netravali Keys cubic weights was funded in part by Pixel
+ * Analytics Ltd.
  *
- * N. Robidoux thanks his co-authors, and Ralf Meyer, Geert Jordaens,
- * Craig DeForest, Massimo Valentini, Sven Neumann and Mitch Natterer
- * for useful comments.
+ * The programming of this and other GEGL samplers by N. Robidoux was
+ * funded by a large number of freedomsponsors.org patrons, including
+ * A. Prokoudine.
+ *
+ * In addition to the above, N. Robidoux thanks Craig DeForest,
+ * Mathias Rauen, John Cupitt, Henry HO and Massimo Valentini for
+ * useful comments, with special thanks to Cristy, the lead developer
+ * of ImageMagick, for making it available as a platform for research
+ * in image processing.
  */
 
 /*
@@ -117,9 +115,6 @@
  * pixel indices match the position of the top left corner of the
  * corresponding pixel, so that the center of pixel (i,j) is located
  * at (i+1/2,j+1/2), pixel center positions do NOT match their index.
- * Earlier versions of this code did not follow this convention: They
- * assumed that the location of the center of a pixel matched its
- * index.
  */
 
 #include "config.h"
@@ -132,49 +127,6 @@
 
 #include "gegl-sampler-lohalo.h"
 
-/*
- * LOHALO_MINMOD is an implementation of the minmod function which
- * only needs two "conditional moves."
- * LOHALO_MINMOD(a,b,a_times_a,a_times_b) "returns"
- * minmod(a,b). The macro parameter ("input") a_times_a is assumed to
- * contain the square of a; a_times_b, the product of a and b.
- *
- * For uncompressed natural images in high bit depth (images for which
- * the slopes a and b are unlikely to be equal to zero or be equal to
- * each other), or chips with good branch prediction, the following
- * version of the minmod function may work well:
- *
- * ( (a_times_b)>=0. ? ( (a_times_b)<(a_times_a) ? (b) : (a) ) : 0. )
- *
- * In this version, the forward branch of the second conditional move
- * is taken when |b|>|a| and when a*b<0. However, the "else" branch is
- * taken when a=0 (or when a=b), which is why the above version is not
- * as effective for images with regions with constant pixel values (or
- * regions with pixel values which vary linearly or bilinearly) since
- * we apply minmod to pairs of differences.
- *
- * The following version is more suitable for images with flat
- * (constant) colour areas, since a, which is a pixel difference, will
- * often be 0, in which case both forward branches are likely. This
- * may be preferable if "branch flag look ahead" does not work so
- * well.
- *
- * ( (a_times_b)>=0. ? ( (a_times_a)<=(a_times_b) ? (a) : (b) ) : 0. )
- *
- * This last version appears to be slightly better than the former in
- * speed tests performed on a recent multicore Intel chip, especially
- * when enlarging a sharp image by a large factor, hence the choice.
- */
-
-/* #define LOHALO_MINMOD(a,b,a_times_a,a_times_b) \ */
-/*   (                                            \ */
-/*     (a_times_b) >= (gfloat) 0.                 \ */
-/*     ?                                          \ */
-/*     ( (a_times_b) < (a_times_a) ? (b) : (a) )  \ */
-/*     :                                          \ */
-/*     (gfloat) 0.                                \ */
-/*   )                                              */
-
 #define LOHALO_MINMOD(_a_,_b_,_a_times_a_,_a_times_b_) \
   (                                                    \
     (_a_times_b_) >= (gfloat) 0.                       \
@@ -190,11 +142,11 @@
  */
 #define LOHALO_MIN(_x_,_y_) ( (_x_) <= (_y_) ? (_x_) : (_y_) )
 #define LOHALO_MAX(_x_,_y_) ( (_x_) >= (_y_) ? (_x_) : (_y_) )
-#define LOHALO_ABS(_x_)   ( (_x_) >= (gfloat) 0. ? (_x_) : -(_x_) )
-#define LOHALO_SIGN(_x_)  ( (_x_) >= (gfloat) 0. ? (gfloat) 1. : (gfloat) -1. )
+#define LOHALO_ABS(_x_)  ( (_x_) >= (gfloat) 0. ? (_x_) : -(_x_) )
+#define LOHALO_SIGN(_x_) ( (_x_) >= (gfloat) 0. ? (gfloat) 1. : (gfloat) -1. )
 
 /*
- * Special case of of Knuth's floored division, that is:
+ * Special case of Knuth's floored division, that is:
  *
  * FLOORED_DIVISION(a,b) (((a) - ((a)<0 ? (b)-1 : 0)) / (b))
  *
@@ -210,7 +162,7 @@
 
 /*
  * Convenience macros. _level_ and _previous_level_ must be a plain
- * integers (like "1", "2" etc) because it it literally replaced (note
+ * integers (like "1", "2" etc) because it is literally replaced (note
  * the "##_level").
  */
 
@@ -371,9 +323,14 @@ gegl_sampler_lohalo_class_init (GeglSamplerLohaloClass *klass)
  * Because things are kept centered, the stencil width/height is 1 +
  * twice the (size of) the offset.
  *
- * 5x5 is the smallest "level 0" context_rect that works with the
- * LBB-Nohalo component of the sampler. Because 5 = 1+2*2,
- * LOHALO_OFFSET_0 must be >= 2.
+ * The Mitchell-Netravali cubic filter uses 4 pixels in each
+ * direction. Because we anchor ourselves at the closest pixel, we
+ * need 2 pixels on both sides, because we don't know ahead of time
+ * which way things will be reflected. So, we need the size to be at
+ * least 5x5. 4x4 would be enough if we did not perform reflections in
+ * order to keep things as centered as possible between mipmap
+ * levels. In any case, as the code runs, LOHALO_OFFSET_0 must be >=
+ * 2.
  *
  * Speed/quality trade-off:
  *
@@ -390,7 +347,7 @@ gegl_sampler_lohalo_class_init (GeglSamplerLohaloClass *klass)
 /*
  * IMPORTANT: LOHALO_OFFSET_0 SHOULD BE AN INTEGER >= 2.
  */
-#define LOHALO_OFFSET_0 (11)
+#define LOHALO_OFFSET_0 (12)
 #define LOHALO_SIZE_0 (1+2*LOHALO_OFFSET_0)
 
 /*
@@ -403,7 +360,7 @@ gegl_sampler_lohalo_class_init (GeglSamplerLohaloClass *klass)
  * mipmap level's offset should almost never be smaller than half the
  * previous level's offset.
  */
-#define LOHALO_OFFSET_MIPMAP (11)
+#define LOHALO_OFFSET_MIPMAP (12)
 #define LOHALO_SIZE_MIPMAP (1+2*LOHALO_OFFSET_MIPMAP)
 
 #define LOHALO_OFFSET_1 LOHALO_OFFSET_MIPMAP
@@ -477,890 +434,71 @@ gegl_sampler_lohalo_init (GeglSamplerLohalo *self)
   GEGL_SAMPLER (self)->interpolate_format = babl_format ("RaGaBaA float");
 }
 
-static void inline
-nohalo_subdivision (const gfloat           uno_two,
-                    const gfloat           uno_thr,
-                    const gfloat           uno_fou,
-                    const gfloat           dos_one,
-                    const gfloat           dos_two,
-                    const gfloat           dos_thr,
-                    const gfloat           dos_fou,
-                    const gfloat           dos_fiv,
-                    const gfloat           tre_one,
-                    const gfloat           tre_two,
-                    const gfloat           tre_thr,
-                    const gfloat           tre_fou,
-                    const gfloat           tre_fiv,
-                    const gfloat           qua_one,
-                    const gfloat           qua_two,
-                    const gfloat           qua_thr,
-                    const gfloat           qua_fou,
-                    const gfloat           qua_fiv,
-                    const gfloat           cin_two,
-                    const gfloat           cin_thr,
-                    const gfloat           cin_fou,
-                          gfloat* restrict uno_one_1,
-                          gfloat* restrict uno_two_1,
-                          gfloat* restrict uno_thr_1,
-                          gfloat* restrict uno_fou_1,
-                          gfloat* restrict dos_one_1,
-                          gfloat* restrict dos_two_1,
-                          gfloat* restrict dos_thr_1,
-                          gfloat* restrict dos_fou_1,
-                          gfloat* restrict tre_one_1,
-                          gfloat* restrict tre_two_1,
-                          gfloat* restrict tre_thr_1,
-                          gfloat* restrict tre_fou_1,
-                          gfloat* restrict qua_one_1,
-                          gfloat* restrict qua_two_1,
-                          gfloat* restrict qua_thr_1,
-                          gfloat* restrict qua_fou_1)
-{
-  /*
-   * nohalo_subdivision calculates the missing twelve float density
-   * pixel values, and also returns the "already known" four, so that
-   * the sixteen values which make up the stencil of LBB are
-   * available.
-   */
-  /*
-   * THE STENCIL OF INPUT VALUES:
-   *
-   * Pointer arithmetic is used to implicitly reflect the input
-   * stencil about tre_thr---assumed closer to the sampling location
-   * than other pixels (ties are OK)---in such a way that after
-   * reflection the sampling point is to the bottom right of tre_thr.
-   *
-   * The following code and picture assumes that the stencil reflexion
-   * has already been performed.
-   *
-   *               (ix-1,iy-2)  (ix,iy-2)    (ix+1,iy-2)
-   *               =uno_two     = uno_thr    = uno_fou
-   *
-   *
-   *
-   *  (ix-2,iy-1)  (ix-1,iy-1)  (ix,iy-1)    (ix+1,iy-1)  (ix+2,iy-1)
-   *  = dos_one    = dos_two    = dos_thr    = dos_fou    = dos_fiv
-   *
-   *
-   *
-   *  (ix-2,iy)    (ix-1,iy)    (ix,iy)      (ix+1,iy)    (ix+2,iy)
-   *  = tre_one    = tre_two    = tre_thr    = tre_fou    = tre_fiv
-   *                                    X
-   *
-   *
-   *  (ix-2,iy+1)  (ix-1,iy+1)  (ix,iy+1)    (ix+1,iy+1)  (ix+2,iy+1)
-   *  = qua_one    = qua_two    = qua_thr    = qua_fou    = qua_fiv
-   *
-   *
-   *
-   *               (ix-1,iy+2)  (ix,iy+2)    (ix+1,iy+2)
-   *               = cin_two    = cin_thr    = cin_fou
-   *
-   *
-   * The above input pixel values are the ones needed in order to make
-   * available the following values, needed by LBB:
-   *
-   *  uno_one_1 =      uno_two_1 =  uno_thr_1 =      uno_fou_1 =
-   *  (ix-1/2,iy-1/2)  (ix,iy-1/2)  (ix+1/2,iy-1/2)  (ix+1,iy-1/2)
-   *
-   *
-   *
-   *
-   *  dos_one_1 =      dos_two_1 =  dos_thr_1 =      dos_fou_1 =
-   *  (ix-1/2,iy)      (ix,iy)      (ix+1/2,iy)      (ix+1,iy)
-   *
-   *                             X
-   *
-   *
-   *  tre_one_1 =      tre_two_1 =  tre_thr_1 =      tre_fou_1 =
-   *  (ix-1/2,iy+1/2)  (ix,iy+1/2)  (ix+1/2,iy+1/2)  (ix+1,iy+1/2)
-   *
-   *
-   *
-   *
-   *  qua_one_1 =      qua_two_1 =  qua_thr_1 =      qua_fou_1 =
-   *  (ix-1/2,iy+1)    (ix,iy+1)    (ix+1/2,iy+1)    (ix+1,iy+1)
-   *
-   */
-
-  /*
-   * Computation of the nonlinear slopes: If two consecutive pixel
-   * value differences have the same sign, the smallest one (in
-   * absolute value) is taken to be the corresponding slope; if the
-   * two consecutive pixel value differences don't have the same sign,
-   * the corresponding slope is set to 0.
-   *
-   * In other words: Apply minmod to consecutive differences.
-   */
-  /*
-   * Two vertical simple differences:
-   */
-  const gfloat d_unodos_two = dos_two - uno_two;
-  const gfloat d_dostre_two = tre_two - dos_two;
-  const gfloat d_trequa_two = qua_two - tre_two;
-  const gfloat d_quacin_two = cin_two - qua_two;
-  /*
-   * Thr(ee) vertical differences:
-   */
-  const gfloat d_unodos_thr = dos_thr - uno_thr;
-  const gfloat d_dostre_thr = tre_thr - dos_thr;
-  const gfloat d_trequa_thr = qua_thr - tre_thr;
-  const gfloat d_quacin_thr = cin_thr - qua_thr;
-  /*
-   * Fou(r) vertical differences:
-   */
-  const gfloat d_unodos_fou = dos_fou - uno_fou;
-  const gfloat d_dostre_fou = tre_fou - dos_fou;
-  const gfloat d_trequa_fou = qua_fou - tre_fou;
-  const gfloat d_quacin_fou = cin_fou - qua_fou;
-  /*
-   * Dos horizontal differences:
-   */
-  const gfloat d_dos_onetwo = dos_two - dos_one;
-  const gfloat d_dos_twothr = dos_thr - dos_two;
-  const gfloat d_dos_thrfou = dos_fou - dos_thr;
-  const gfloat d_dos_foufiv = dos_fiv - dos_fou;
-  /*
-   * Tre(s) horizontal differences:
-   */
-  const gfloat d_tre_onetwo = tre_two - tre_one;
-  const gfloat d_tre_twothr = tre_thr - tre_two;
-  const gfloat d_tre_thrfou = tre_fou - tre_thr;
-  const gfloat d_tre_foufiv = tre_fiv - tre_fou;
-  /*
-   * Qua(ttro) horizontal differences:
-   */
-  const gfloat d_qua_onetwo = qua_two - qua_one;
-  const gfloat d_qua_twothr = qua_thr - qua_two;
-  const gfloat d_qua_thrfou = qua_fou - qua_thr;
-  const gfloat d_qua_foufiv = qua_fiv - qua_fou;
-
-  /*
-   * Recyclable vertical products and squares:
-   */
-  const gfloat d_unodos_times_dostre_two = d_unodos_two * d_dostre_two;
-  const gfloat d_dostre_two_sq           = d_dostre_two * d_dostre_two;
-  const gfloat d_dostre_times_trequa_two = d_dostre_two * d_trequa_two;
-  const gfloat d_trequa_times_quacin_two = d_quacin_two * d_trequa_two;
-  const gfloat d_quacin_two_sq           = d_quacin_two * d_quacin_two;
-
-  const gfloat d_unodos_times_dostre_thr = d_unodos_thr * d_dostre_thr;
-  const gfloat d_dostre_thr_sq           = d_dostre_thr * d_dostre_thr;
-  const gfloat d_dostre_times_trequa_thr = d_trequa_thr * d_dostre_thr;
-  const gfloat d_trequa_times_quacin_thr = d_trequa_thr * d_quacin_thr;
-  const gfloat d_quacin_thr_sq           = d_quacin_thr * d_quacin_thr;
-
-  const gfloat d_unodos_times_dostre_fou = d_unodos_fou * d_dostre_fou;
-  const gfloat d_dostre_fou_sq           = d_dostre_fou * d_dostre_fou;
-  const gfloat d_dostre_times_trequa_fou = d_trequa_fou * d_dostre_fou;
-  const gfloat d_trequa_times_quacin_fou = d_trequa_fou * d_quacin_fou;
-  const gfloat d_quacin_fou_sq           = d_quacin_fou * d_quacin_fou;
-  /*
-   * Recyclable horizontal products and squares:
-   */
-  const gfloat d_dos_onetwo_times_twothr = d_dos_onetwo * d_dos_twothr;
-  const gfloat d_dos_twothr_sq           = d_dos_twothr * d_dos_twothr;
-  const gfloat d_dos_twothr_times_thrfou = d_dos_twothr * d_dos_thrfou;
-  const gfloat d_dos_thrfou_times_foufiv = d_dos_thrfou * d_dos_foufiv;
-  const gfloat d_dos_foufiv_sq           = d_dos_foufiv * d_dos_foufiv;
-
-  const gfloat d_tre_onetwo_times_twothr = d_tre_onetwo * d_tre_twothr;
-  const gfloat d_tre_twothr_sq           = d_tre_twothr * d_tre_twothr;
-  const gfloat d_tre_twothr_times_thrfou = d_tre_thrfou * d_tre_twothr;
-  const gfloat d_tre_thrfou_times_foufiv = d_tre_thrfou * d_tre_foufiv;
-  const gfloat d_tre_foufiv_sq           = d_tre_foufiv * d_tre_foufiv;
-
-  const gfloat d_qua_onetwo_times_twothr = d_qua_onetwo * d_qua_twothr;
-  const gfloat d_qua_twothr_sq           = d_qua_twothr * d_qua_twothr;
-  const gfloat d_qua_twothr_times_thrfou = d_qua_thrfou * d_qua_twothr;
-  const gfloat d_qua_thrfou_times_foufiv = d_qua_thrfou * d_qua_foufiv;
-  const gfloat d_qua_foufiv_sq           = d_qua_foufiv * d_qua_foufiv;
-
-  /*
-   * Minmod slopes and first level pixel values:
-   */
-  const gfloat dos_thr_y = LOHALO_MINMOD( d_dostre_thr, d_unodos_thr,
-                                          d_dostre_thr_sq,
-                                          d_unodos_times_dostre_thr );
-  const gfloat tre_thr_y = LOHALO_MINMOD( d_dostre_thr, d_trequa_thr,
-                                          d_dostre_thr_sq,
-                                          d_dostre_times_trequa_thr );
-
-  const gfloat newval_uno_two =
-    (gfloat) 0.5
-    *
-    ( dos_thr + tre_thr + (gfloat) 0.5 * ( dos_thr_y - tre_thr_y ) );
-
-  const gfloat qua_thr_y = LOHALO_MINMOD( d_quacin_thr, d_trequa_thr,
-                                          d_quacin_thr_sq,
-                                          d_trequa_times_quacin_thr );
-
-  const gfloat newval_tre_two =
-    (gfloat) 0.5
-    *
-    ( tre_thr + qua_thr + (gfloat) 0.5 * ( tre_thr_y - qua_thr_y ) );
-
-  const gfloat tre_fou_y = LOHALO_MINMOD( d_dostre_fou, d_trequa_fou,
-                                          d_dostre_fou_sq,
-                                          d_dostre_times_trequa_fou );
-  const gfloat qua_fou_y = LOHALO_MINMOD( d_quacin_fou, d_trequa_fou,
-                                          d_quacin_fou_sq,
-                                          d_trequa_times_quacin_fou );
-
-  const gfloat newval_tre_fou =
-    (gfloat) 0.5
-    *
-    ( tre_fou + qua_fou + (gfloat) 0.5 * ( tre_fou_y - qua_fou_y ) );
-
-  const gfloat dos_fou_y = LOHALO_MINMOD( d_dostre_fou, d_unodos_fou,
-                                          d_dostre_fou_sq,
-                                          d_unodos_times_dostre_fou );
-
-  const gfloat newval_uno_fou =
-    (gfloat) 0.5
-    *
-    ( dos_fou + tre_fou + (gfloat) 0.5 * (dos_fou_y - tre_fou_y ) );
-
-  const gfloat tre_two_x = LOHALO_MINMOD( d_tre_twothr, d_tre_onetwo,
-                                          d_tre_twothr_sq,
-                                          d_tre_onetwo_times_twothr );
-  const gfloat tre_thr_x = LOHALO_MINMOD( d_tre_twothr, d_tre_thrfou,
-                                          d_tre_twothr_sq,
-                                          d_tre_twothr_times_thrfou );
-
-  const gfloat newval_dos_one =
-    (gfloat) 0.5
-    *
-    ( tre_two + tre_thr + (gfloat) 0.5 * ( tre_two_x - tre_thr_x ) );
-
-  const gfloat tre_fou_x = LOHALO_MINMOD( d_tre_foufiv, d_tre_thrfou,
-                                          d_tre_foufiv_sq,
-                                          d_tre_thrfou_times_foufiv );
-
-  const gfloat tre_thr_x_minus_tre_fou_x =
-    tre_thr_x - tre_fou_x;
-
-  const gfloat newval_dos_thr =
-    (gfloat) 0.5
-    *
-    ( tre_thr + tre_fou + (gfloat) 0.5 * tre_thr_x_minus_tre_fou_x );
-
-  const gfloat qua_thr_x = LOHALO_MINMOD( d_qua_twothr, d_qua_thrfou,
-                                          d_qua_twothr_sq,
-                                          d_qua_twothr_times_thrfou );
-  const gfloat qua_fou_x = LOHALO_MINMOD( d_qua_foufiv, d_qua_thrfou,
-                                          d_qua_foufiv_sq,
-                                          d_qua_thrfou_times_foufiv );
-
-  const gfloat qua_thr_x_minus_qua_fou_x =
-    qua_thr_x - qua_fou_x;
-
-  const gfloat newval_qua_thr =
-    (gfloat) 0.5
-    *
-    ( qua_thr + qua_fou + (gfloat) 0.5 * qua_thr_x_minus_qua_fou_x );
-
-  const gfloat qua_two_x = LOHALO_MINMOD( d_qua_twothr, d_qua_onetwo,
-                                          d_qua_twothr_sq,
-                                          d_qua_onetwo_times_twothr );
-
-  const gfloat newval_qua_one =
-    (gfloat) 0.5
-    *
-    ( qua_two + qua_thr + (gfloat) 0.5 * ( qua_two_x - qua_thr_x ) );
-
-  const gfloat newval_tre_thr =
-    (gfloat) 0.5
-    *
-    (
-      newval_tre_two + newval_tre_fou
-      +
-      (gfloat) 0.25 * ( tre_thr_x_minus_tre_fou_x + qua_thr_x_minus_qua_fou_x )
-    );
-
-  const gfloat dos_thr_x = LOHALO_MINMOD( d_dos_twothr, d_dos_thrfou,
-                                          d_dos_twothr_sq,
-                                          d_dos_twothr_times_thrfou );
-  const gfloat dos_fou_x = LOHALO_MINMOD( d_dos_foufiv, d_dos_thrfou,
-                                          d_dos_foufiv_sq,
-                                          d_dos_thrfou_times_foufiv );
-
-  const gfloat newval_uno_thr =
-    (gfloat) 0.5
-    *
-    (
-      newval_uno_two + newval_dos_thr
-      +
-      (gfloat) 0.5
-      *
-      (
-        dos_fou - tre_thr
-        +
-        (gfloat) 0.5 * ( dos_fou_y - tre_fou_y + dos_thr_x - dos_fou_x )
-      )
-    );
-
-  const gfloat tre_two_y = LOHALO_MINMOD( d_dostre_two, d_trequa_two,
-                                          d_dostre_two_sq,
-                                          d_dostre_times_trequa_two );
-  const gfloat qua_two_y = LOHALO_MINMOD( d_quacin_two, d_trequa_two,
-                                          d_quacin_two_sq,
-                                          d_trequa_times_quacin_two );
-
-  const gfloat newval_tre_one =
-    (gfloat) 0.5
-    *
-    (
-      newval_dos_one + newval_tre_two
-      +
-      (gfloat) 0.5
-      *
-      (
-        qua_two - tre_thr
-        +
-        (gfloat) 0.5 * ( qua_two_x - qua_thr_x + tre_two_y - qua_two_y )
-      )
-    );
-
-
-  const gfloat dos_two_x = LOHALO_MINMOD( d_dos_twothr, d_dos_onetwo,
-                                          d_dos_twothr_sq,
-                                          d_dos_onetwo_times_twothr );
-  const gfloat dos_two_y = LOHALO_MINMOD( d_dostre_two, d_unodos_two,
-                                          d_dostre_two_sq,
-                                          d_unodos_times_dostre_two );
-
-  const gfloat newval_uno_one =
-    (gfloat) 0.25
-    *
-    (
-      dos_two + dos_thr + tre_two + tre_thr
-      +
-      (gfloat) 0.5
-      *
-      (
-        dos_two_x - dos_thr_x + tre_two_x - tre_thr_x
-        +
-        dos_two_y + dos_thr_y - tre_two_y - tre_thr_y
-      )
-    );
-
-  /*
-   * Return the sixteen LBB stencil values:
-   */
-  *uno_one_1 = newval_uno_one;
-  *uno_two_1 = newval_uno_two;
-  *uno_thr_1 = newval_uno_thr;
-  *uno_fou_1 = newval_uno_fou;
-  *dos_one_1 = newval_dos_one;
-  *dos_two_1 =        tre_thr;
-  *dos_thr_1 = newval_dos_thr;
-  *dos_fou_1 =        tre_fou;
-  *tre_one_1 = newval_tre_one;
-  *tre_two_1 = newval_tre_two;
-  *tre_thr_1 = newval_tre_thr;
-  *tre_fou_1 = newval_tre_fou;
-  *qua_one_1 = newval_qua_one;
-  *qua_two_1 =        qua_thr;
-  *qua_thr_1 = newval_qua_thr;
-  *qua_fou_1 =        qua_fou;
-}
-
 static inline gfloat
-lbb (const gfloat c00,
-     const gfloat c10,
-     const gfloat c01,
-     const gfloat c11,
-     const gfloat c00dx,
-     const gfloat c10dx,
-     const gfloat c01dx,
-     const gfloat c11dx,
-     const gfloat c00dy,
-     const gfloat c10dy,
-     const gfloat c01dy,
-     const gfloat c11dy,
-     const gfloat c00dxdy,
-     const gfloat c10dxdy,
-     const gfloat c01dxdy,
-     const gfloat c11dxdy,
-     const gfloat uno_one,
-     const gfloat uno_two,
-     const gfloat uno_thr,
-     const gfloat uno_fou,
-     const gfloat dos_one,
-     const gfloat dos_two,
-     const gfloat dos_thr,
-     const gfloat dos_fou,
-     const gfloat tre_one,
-     const gfloat tre_two,
-     const gfloat tre_thr,
-     const gfloat tre_fou,
-     const gfloat qua_one,
-     const gfloat qua_two,
-     const gfloat qua_thr,
-     const gfloat qua_fou )
+robidoux (const gfloat c_major_x,
+          const gfloat c_major_y,
+          const gfloat c_minor_x,
+          const gfloat c_minor_y,
+          const gfloat s,
+          const gfloat t)
 {
   /*
-   * LBB (Locally Bounded Bicubic) is a high quality nonlinear variant
-   * of Catmull-Rom. Images resampled with LBB have much smaller halos
-   * than images resampled with windowed sincs or other interpolatory
-   * cubic spline filters. Specifically, LBB halos are narrower and
-   * the over/undershoot amplitude is smaller. This is accomplished
-   * without a significant reduction in the smoothness of the result
-   * (compared to Catmull-Rom).
-   *
-   * Another important property is that the resampled values are
-   * contained within the range of nearby input values. Consequently,
-   * no final clamping is needed to stay "in range" (e.g., 0-255 for
-   * standard 8-bit images).
-   *
-   * LBB was developed by Nicolas Robidoux and Chantal Racette of the
-   * Department of Mathematics and Computer Science of Laurentian
-   * University in the course of Chantal's Masters in Computational
-   * Sciences.
-   */
-  /*
-   * LBB is a novel method with the following properties:
-   *
-   * --LBB is a Hermite bicubic method: The bicubic surface is
-   *   defined, one convex hull of four nearby input points at a time,
-   *   using four point values, four x-derivatives, four
-   *   y-derivatives, and four cross-derivatives.
-   *
-   * --The stencil for values in a square patch is the usual 4x4.
-   *
-   * --LBB is interpolatory.
-   *
-   * --It is C^1 with continuous cross-derivatives.
-   *
-   * --When the limiters are inactive, LBB gives the same results as
-   *   Catmull-Rom.
-   *
-   * --When used on binary images, LBB gives results similar to
-   *   bicubic Hermite with all first derivatives---but not
-   *   necessarily the cross-derivatives--at the input pixel locations
-   *   set to zero.
-   *
-   * --The LBB reconstruction is locally bounded: Over each square
-   *   patch, the surface is contained between the minimum and the
-   *   maximum values among the 16 nearest input pixel values (those
-   *   in the stencil).
-   *
-   * --Consequently, the LBB reconstruction is globally bounded
-   *   between the very smallest input pixel value and the very
-   *   largest input pixel value. (It is not necessary to clamp
-   *   results.)
-   *
-   * The LBB method is based on the method of Ken Brodlie, Petros
-   * Mashwama and Sohail Butt for constraining Hermite interpolants
-   * between globally defined planes:
-   *
-   *   Visualization of surface data to preserve positivity and other
-   *   simple constraints. Computer & Graphics, Vol. 19, Number 4,
-   *   pages 585-594, 1995. DOI: 10.1016/0097-8493(95)00036-C.
-   *
-   * Instead of forcing the reconstructed surface to lie between two
-   * GLOBALLY defined planes, LBB constrains one patch at a time to
-   * lie between LOCALLY defined planes. This is accomplished by
-   * constraining the derivatives (x, y and cross) at each input pixel
-   * location so that if the constraint was applied everywhere the
-   * surface would fit between the min and max of the values at the 9
-   * closest pixel locations. Because this is done with each of the
-   * four pixel locations which define the bicubic patch, this forces
-   * the reconstructed surface to lie between the min and max of the
-   * values at the 16 closest values pixel locations. (Each corner
-   * defines its own 3x3 subgroup of the 4x4 stencil. Consequently,
-   * the surface is necessarily above the minimum of the four minima,
-   * which happens to be the minimum over the 4x4. Similarly with the
-   * maxima.)
-   *
-   * The above paragraph described the "soft" version of LBB, which is
-   * the only one used by lohalo.
-   */
-  /*
-   * STENCIL (FOOTPRINT) OF INPUT VALUES:
-   *
-   * The stencil of LBB is the same as for any standard Hermite
-   * bicubic (e.g., Catmull-Rom):
-   *
-   *  (ix-1,iy-1)  (ix,iy-1)    (ix+1,iy-1)  (ix+2,iy-1)
-   *  = uno_one    = uno_two    = uno_thr    = uno_fou
-   *
-   *  (ix-1,iy)    (ix,iy)      (ix+1,iy)    (ix+2,iy)
-   *  = dos_one    = dos_two    = dos_thr    = dos_fou
-   *                        X
-   *  (ix-1,iy+1)  (ix,iy+1)    (ix+1,iy+1)  (ix+2,iy+1)
-   *  = tre_one    = tre_two    = tre_thr    = tre_fou
-   *
-   *  (ix-1,iy+2)  (ix,iy+2)    (ix+1,iy+2)  (ix+2,iy+2)
-   *  = qua_one    = qua_two    = qua_thr    = qua_fou
-   *
-   * where ix is the floor of the requested left-to-right location
-   * ("X"), and iy is the floor of the requested up-to-down location.
-   */
-
-  /*
-   * Computation of the four min and four max over 3x3 input data
-   * sub-blocks of the 4x4 input stencil.
-   *
-   * Surprisingly, we have not succeeded in reducing the number of "?
-   * :" even though the data comes from the (co-monotone) method
-   * Nohalo so that it is known ahead of time that
-   *
-   *  dos_thr is between dos_two and dos_fou
+   * This function computes -398/(7+72sqrt(2)) times the Robidoux
+   * cubic. The factor is to remove one flop; it is harmless because
+   * the final results is normalized by the sum of the weights, which
+   * means nonzero multiplicative factors have no impact.
    *
-   *  tre_two is between dos_two and qua_two
+   * The Robidoux cubic is the Keys cubic defined, as a BC-spline, by
    *
-   *  tre_fou is between dos_fou and qua_fou
+   * B = 1656 / ( 1592 + 597 * sqrt(2) )
    *
-   *  qua_thr is between qua_two and qua_fou
+   * and
    *
-   *  tre_thr is in the convex hull of dos_two, dos_fou, qua_two and qua_fou
+   * C = 15407 / ( 35422 + 42984 * sqrt(2) ).
    *
-   *  to minimize the number of flags and conditional moves.
+   * Keys cubics are the BC-splines with B+2C=1.
    *
-   * (The "between" are not strict: "a between b and c" means
-   *
-   * "min(b,c) <= a <= max(b,c)".)
-   *
-   * We have, however, succeeded in eliminating one flag computation
-   * (one comparison) and one use of an intermediate result. See the
-   * two commented out lines below.
-   *
-   * Overall, only 27 comparisons are needed (to compute 4 mins and 4
-   * maxes!). Without the simplification, 28 comparisons would be
-   * used. Either way, the number of "? :" used is 34. If you can
-   * figure how to do this more efficiently, let us know.
-   */
-  const gfloat m1    = (dos_two <= dos_thr) ? dos_two : dos_thr  ;
-  const gfloat M1    = (dos_two <= dos_thr) ? dos_thr : dos_two  ;
-  const gfloat m2    = (tre_two <= tre_thr) ? tre_two : tre_thr  ;
-  const gfloat M2    = (tre_two <= tre_thr) ? tre_thr : tre_two  ;
-  const gfloat m4    = (qua_two <= qua_thr) ? qua_two : qua_thr  ;
-  const gfloat M4    = (qua_two <= qua_thr) ? qua_thr : qua_two  ;
-  const gfloat m3    = (uno_two <= uno_thr) ? uno_two : uno_thr  ;
-  const gfloat M3    = (uno_two <= uno_thr) ? uno_thr : uno_two  ;
-  const gfloat m5    = LOHALO_MIN(            m1,       m2      );
-  const gfloat M5    = LOHALO_MAX(            M1,       M2      );
-  const gfloat m6    = (dos_one <= tre_one) ? dos_one : tre_one  ;
-  const gfloat M6    = (dos_one <= tre_one) ? tre_one : dos_one  ;
-  const gfloat m7    = (dos_fou <= tre_fou) ? dos_fou : tre_fou  ;
-  const gfloat M7    = (dos_fou <= tre_fou) ? tre_fou : dos_fou  ;
-  const gfloat m13   = (dos_fou <= qua_fou) ? dos_fou : qua_fou  ;
-  const gfloat M13   = (dos_fou <= qua_fou) ? qua_fou : dos_fou  ;
-  /*
-   * Because the data comes from Nohalo subdivision, the following two
-   * lines can be replaced by the above, "simpler," two lines without
-   * changing the results.
+   * The Robidoux cubic is the unique Keys cubic with the property
+   * that it preserves images which pixel values constant along
+   * columns (or rows) under no-op EWA resampling. Informally, it is
+   * the unique Keys cubic for which a vertical or horizontal line or
+   * boundary does not "bleed" into neighbouring original pixel
+   * locations when used, as an EWA filter kernel, to resample without
+   * downsampling.
    *
-   * const gfloat m13   = LOHALO_MIN(            m7,       qua_fou );
-   * const gfloat M13   = LOHALO_MAX(            M7,       qua_fou );
-   *
-   * This allows for the comparisons to be reordered to put breathing
-   * room between the computation of a result and its use.
-   */
-  const gfloat m9    = LOHALO_MIN(            m5,       m4      );
-  const gfloat M9    = LOHALO_MAX(            M5,       M4      );
-  const gfloat m11   = LOHALO_MIN(            m6,       qua_one );
-  const gfloat M11   = LOHALO_MAX(            M6,       qua_one );
-  const gfloat m10   = LOHALO_MIN(            m6,       uno_one );
-  const gfloat M10   = LOHALO_MAX(            M6,       uno_one );
-  const gfloat m8    = LOHALO_MIN(            m5,       m3      );
-  const gfloat M8    = LOHALO_MAX(            M5,       M3      );
-  const gfloat m12   = LOHALO_MIN(            m7,       uno_fou );
-  const gfloat M12   = LOHALO_MAX(            M7,       uno_fou );
-  const gfloat min11 = LOHALO_MIN(            m9,       m13     );
-  const gfloat max11 = LOHALO_MAX(            M9,       M13     );
-  const gfloat min01 = LOHALO_MIN(            m9,       m11     );
-  const gfloat max01 = LOHALO_MAX(            M9,       M11     );
-  const gfloat min00 = LOHALO_MIN(            m8,       m10     );
-  const gfloat max00 = LOHALO_MAX(            M8,       M10     );
-  const gfloat min10 = LOHALO_MIN(            m8,       m12     );
-  const gfloat max10 = LOHALO_MAX(            M8,       M12     );
-
-  /*
-   * The remainder of the "per channel" computation involves the
-   * computation of:
-   *
-   * --8 conditional moves,
-   *
-   * --8 signs (in which the sign of zero is unimportant),
-   *
-   * --12 minima of two values,
-   *
-   * --8 maxima of two values,
-   *
-   * --8 absolute values,
-   *
-   * for a grand total of 29 minima, 25 maxima, 8 conditional moves, 8
-   * signs, and 8 absolute values. If everything is done with
-   * conditional moves, "only" 28+8+8+12+8+8=72 flags are involved
-   * (because initial min and max can be computed with one flag).
-   *
-   * The "per channel" part of the computation also involves 107
-   * arithmetic operations (54 *, 21 +, 42 -).
-   */
-
-  /*
-   * Distances to the local min and max:
-   */
-  const gfloat u11 = tre_thr - min11;
-  const gfloat v11 = max11 - tre_thr;
-  const gfloat u01 = tre_two - min01;
-  const gfloat v01 = max01 - tre_two;
-  const gfloat u00 = dos_two - min00;
-  const gfloat v00 = max00 - dos_two;
-  const gfloat u10 = dos_thr - min10;
-  const gfloat v10 = max10 - dos_thr;
-
-  /*
-   * Initial values of the derivatives computed with centered
-   * differences. Factors of 1/2 are left out because they are folded
-   * in later:
-   */
-  const gfloat dble_dzdx00i = dos_thr - dos_one;
-  const gfloat dble_dzdy11i = qua_thr - dos_thr;
-  const gfloat dble_dzdx10i = dos_fou - dos_two;
-  const gfloat dble_dzdy01i = qua_two - dos_two;
-  const gfloat dble_dzdx01i = tre_thr - tre_one;
-  const gfloat dble_dzdy10i = tre_thr - uno_thr;
-  const gfloat dble_dzdx11i = tre_fou - tre_two;
-  const gfloat dble_dzdy00i = tre_two - uno_two;
-
-  /*
-   * Signs of the derivatives. The upcoming clamping does not change
-   * them (except if the clamping sends a negative derivative to 0, in
-   * which case the sign does not matter anyway).
-   */
-  const gfloat sign_dzdx00 = LOHALO_SIGN( dble_dzdx00i );
-  const gfloat sign_dzdx10 = LOHALO_SIGN( dble_dzdx10i );
-  const gfloat sign_dzdx01 = LOHALO_SIGN( dble_dzdx01i );
-  const gfloat sign_dzdx11 = LOHALO_SIGN( dble_dzdx11i );
-
-  const gfloat sign_dzdy00 = LOHALO_SIGN( dble_dzdy00i );
-  const gfloat sign_dzdy10 = LOHALO_SIGN( dble_dzdy10i );
-  const gfloat sign_dzdy01 = LOHALO_SIGN( dble_dzdy01i );
-  const gfloat sign_dzdy11 = LOHALO_SIGN( dble_dzdy11i );
-
-  /*
-   * Initial values of the cross-derivatives. Factors of 1/4 are left
-   * out because folded in later:
-   */
-  const gfloat quad_d2zdxdy00i = uno_one - uno_thr + dble_dzdx01i;
-  const gfloat quad_d2zdxdy10i = uno_two - uno_fou + dble_dzdx11i;
-  const gfloat quad_d2zdxdy01i = qua_thr - qua_one - dble_dzdx00i;
-  const gfloat quad_d2zdxdy11i = qua_fou - qua_two - dble_dzdx10i;
-
-  /*
-   * Slope limiters. The key multiplier is 3 but we fold a factor of
-   * 2, hence 6:
-   */
-  const gfloat dble_slopelimit_00 = (gfloat) 6.0 * LOHALO_MIN( u00, v00 );
-  const gfloat dble_slopelimit_10 = (gfloat) 6.0 * LOHALO_MIN( u10, v10 );
-  const gfloat dble_slopelimit_01 = (gfloat) 6.0 * LOHALO_MIN( u01, v01 );
-  const gfloat dble_slopelimit_11 = (gfloat) 6.0 * LOHALO_MIN( u11, v11 );
-
-  /*
-   * Clamped first derivatives:
-   */
-  const gfloat dble_dzdx00 =
-    ( sign_dzdx00 * dble_dzdx00i <= dble_slopelimit_00 )
-    ? dble_dzdx00i :  sign_dzdx00 * dble_slopelimit_00;
-  const gfloat dble_dzdy00 =
-    ( sign_dzdy00 * dble_dzdy00i <= dble_slopelimit_00 )
-    ? dble_dzdy00i :  sign_dzdy00 * dble_slopelimit_00;
-  const gfloat dble_dzdx10 =
-    ( sign_dzdx10 * dble_dzdx10i <= dble_slopelimit_10 )
-    ? dble_dzdx10i :  sign_dzdx10 * dble_slopelimit_10;
-  const gfloat dble_dzdy10 =
-    ( sign_dzdy10 * dble_dzdy10i <= dble_slopelimit_10 )
-    ? dble_dzdy10i :  sign_dzdy10 * dble_slopelimit_10;
-  const gfloat dble_dzdx01 =
-    ( sign_dzdx01 * dble_dzdx01i <= dble_slopelimit_01 )
-    ? dble_dzdx01i :  sign_dzdx01 * dble_slopelimit_01;
-  const gfloat dble_dzdy01 =
-    ( sign_dzdy01 * dble_dzdy01i <= dble_slopelimit_01 )
-    ? dble_dzdy01i :  sign_dzdy01 * dble_slopelimit_01;
-  const gfloat dble_dzdx11 =
-    ( sign_dzdx11 * dble_dzdx11i <= dble_slopelimit_11 )
-    ? dble_dzdx11i :  sign_dzdx11 * dble_slopelimit_11;
-  const gfloat dble_dzdy11 =
-    ( sign_dzdy11 * dble_dzdy11i <= dble_slopelimit_11 )
-    ? dble_dzdy11i :  sign_dzdy11 * dble_slopelimit_11;
-
-  /*
-   * Sums and differences of first derivatives:
-   */
-  const gfloat twelve_sum00 = (gfloat) 6.0 * ( dble_dzdx00 + dble_dzdy00 );
-  const gfloat twelve_dif00 = (gfloat) 6.0 * ( dble_dzdx00 - dble_dzdy00 );
-  const gfloat twelve_sum10 = (gfloat) 6.0 * ( dble_dzdx10 + dble_dzdy10 );
-  const gfloat twelve_dif10 = (gfloat) 6.0 * ( dble_dzdx10 - dble_dzdy10 );
-  const gfloat twelve_sum01 = (gfloat) 6.0 * ( dble_dzdx01 + dble_dzdy01 );
-  const gfloat twelve_dif01 = (gfloat) 6.0 * ( dble_dzdx01 - dble_dzdy01 );
-  const gfloat twelve_sum11 = (gfloat) 6.0 * ( dble_dzdx11 + dble_dzdy11 );
-  const gfloat twelve_dif11 = (gfloat) 6.0 * ( dble_dzdx11 - dble_dzdy11 );
-
-  /*
-   * Absolute values of the sums:
-   */
-  const gfloat twelve_abs_sum00 = LOHALO_ABS( twelve_sum00 );
-  const gfloat twelve_abs_sum10 = LOHALO_ABS( twelve_sum10 );
-  const gfloat twelve_abs_sum01 = LOHALO_ABS( twelve_sum01 );
-  const gfloat twelve_abs_sum11 = LOHALO_ABS( twelve_sum11 );
-
-  /*
-   * Scaled distances to the min:
+   * An internal panel of web designers at a private company preferred
+   * EWA Robidoux over Mitchell-Netravali and a number of alternatives
+   * for reducing images and producing thumbnails in 8-bit sRGB
+   * (without going through linear light).
    */
-  const gfloat u00_times_36 = (gfloat) 36.0 * u00;
-  const gfloat u10_times_36 = (gfloat) 36.0 * u10;
-  const gfloat u01_times_36 = (gfloat) 36.0 * u01;
-  const gfloat u11_times_36 = (gfloat) 36.0 * u11;
-
-  /*
-   * First cross-derivative limiter:
-   */
-  const gfloat first_limit00 = twelve_abs_sum00 - u00_times_36;
-  const gfloat first_limit10 = twelve_abs_sum10 - u10_times_36;
-  const gfloat first_limit01 = twelve_abs_sum01 - u01_times_36;
-  const gfloat first_limit11 = twelve_abs_sum11 - u11_times_36;
-
-  const gfloat quad_d2zdxdy00ii = LOHALO_MAX( quad_d2zdxdy00i, first_limit00 );
-  const gfloat quad_d2zdxdy10ii = LOHALO_MAX( quad_d2zdxdy10i, first_limit10 );
-  const gfloat quad_d2zdxdy01ii = LOHALO_MAX( quad_d2zdxdy01i, first_limit01 );
-  const gfloat quad_d2zdxdy11ii = LOHALO_MAX( quad_d2zdxdy11i, first_limit11 );
-
-  /*
-   * Scaled distances to the max:
-   */
-  const gfloat v00_times_36 = (gfloat) 36.0 * v00;
-  const gfloat v10_times_36 = (gfloat) 36.0 * v10;
-  const gfloat v01_times_36 = (gfloat) 36.0 * v01;
-  const gfloat v11_times_36 = (gfloat) 36.0 * v11;
-
-  /*
-   * Second cross-derivative limiter:
-   */
-  const gfloat second_limit00 = v00_times_36 - twelve_abs_sum00;
-  const gfloat second_limit10 = v10_times_36 - twelve_abs_sum10;
-  const gfloat second_limit01 = v01_times_36 - twelve_abs_sum01;
-  const gfloat second_limit11 = v11_times_36 - twelve_abs_sum11;
-
-  const gfloat quad_d2zdxdy00iii =
-    LOHALO_MIN( quad_d2zdxdy00ii, second_limit00 );
-  const gfloat quad_d2zdxdy10iii =
-    LOHALO_MIN( quad_d2zdxdy10ii, second_limit10 );
-  const gfloat quad_d2zdxdy01iii =
-    LOHALO_MIN( quad_d2zdxdy01ii, second_limit01 );
-  const gfloat quad_d2zdxdy11iii =
-    LOHALO_MIN( quad_d2zdxdy11ii, second_limit11 );
-
-  /*
-   * Absolute values of the differences:
-   */
-  const gfloat twelve_abs_dif00 = LOHALO_ABS( twelve_dif00 );
-  const gfloat twelve_abs_dif10 = LOHALO_ABS( twelve_dif10 );
-  const gfloat twelve_abs_dif01 = LOHALO_ABS( twelve_dif01 );
-  const gfloat twelve_abs_dif11 = LOHALO_ABS( twelve_dif11 );
-
-  /*
-   * Third cross-derivative limiter:
-   */
-  const gfloat third_limit00 = twelve_abs_dif00 - v00_times_36;
-  const gfloat third_limit10 = twelve_abs_dif10 - v10_times_36;
-  const gfloat third_limit01 = twelve_abs_dif01 - v01_times_36;
-  const gfloat third_limit11 = twelve_abs_dif11 - v11_times_36;
-
-  const gfloat quad_d2zdxdy00iiii =
-    LOHALO_MAX( quad_d2zdxdy00iii, third_limit00);
-  const gfloat quad_d2zdxdy10iiii =
-    LOHALO_MAX( quad_d2zdxdy10iii, third_limit10);
-  const gfloat quad_d2zdxdy01iiii =
-    LOHALO_MAX( quad_d2zdxdy01iii, third_limit01);
-  const gfloat quad_d2zdxdy11iiii =
-    LOHALO_MAX( quad_d2zdxdy11iii, third_limit11);
-
-  /*
-   * Fourth cross-derivative limiter:
-   */
-  const gfloat fourth_limit00 = u00_times_36 - twelve_abs_dif00;
-  const gfloat fourth_limit10 = u10_times_36 - twelve_abs_dif10;
-  const gfloat fourth_limit01 = u01_times_36 - twelve_abs_dif01;
-  const gfloat fourth_limit11 = u11_times_36 - twelve_abs_dif11;
-
-  const gfloat quad_d2zdxdy00 = LOHALO_MIN( quad_d2zdxdy00iiii, fourth_limit00);
-  const gfloat quad_d2zdxdy10 = LOHALO_MIN( quad_d2zdxdy10iiii, fourth_limit10);
-  const gfloat quad_d2zdxdy01 = LOHALO_MIN( quad_d2zdxdy01iiii, fourth_limit01);
-  const gfloat quad_d2zdxdy11 = LOHALO_MIN( quad_d2zdxdy11iiii, fourth_limit11);
+  const gfloat q1 = s * c_major_x + t * c_major_y;
+  const gfloat q2 = s * c_minor_x + t * c_minor_y;
 
-  /*
-   * Part of the result that does not need derivatives:
-   */
-  const gfloat newval1 = c00 * dos_two
-                         +
-                         c10 * dos_thr
-                         +
-                         c01 * tre_two
-                         +
-                         c11 * tre_thr;
+  const gfloat r2 = q1 * q1 + q2 * q2;
 
-  /*
-   * Twice the part of the result that only needs first derivatives.
-   */
-  const gfloat newval2 = c00dx * dble_dzdx00
-                         +
-                         c10dx * dble_dzdx10
-                         +
-                         c01dx * dble_dzdx01
-                         +
-                         c11dx * dble_dzdx11
-                         +
-                         c00dy * dble_dzdy00
-                         +
-                         c10dy * dble_dzdy10
-                         +
-                         c01dy * dble_dzdy01
-                         +
-                         c11dy * dble_dzdy11;
+  if (r2 >= (gfloat) 4.)
+    return (gfloat) 0.;
 
-  /*
-   * Four times the part of the result that only uses
-   * cross-derivatives:
-   */
-  const gfloat newval3 = c00dxdy * quad_d2zdxdy00
-                         +
-                         c10dxdy * quad_d2zdxdy10
-                         +
-                         c01dxdy * quad_d2zdxdy01
-                         +
-                         c11dxdy * quad_d2zdxdy11;
-
-  const gfloat newval =
-    newval1 + (gfloat) 0.5 * ( newval2 + (gfloat) 0.5 * newval3 );
-
-  return newval;
-}
+  {
+    const gfloat r = sqrtf ((float) r2);
 
-static inline gfloat
-teepee (const gfloat c_major_x,
-        const gfloat c_major_y,
-        const gfloat c_minor_x,
-        const gfloat c_minor_y,
-        const gfloat s,
-        const gfloat t)
-{
-  const gfloat q1 = s * c_major_x + t * c_major_y;
-  const gfloat q2 = s * c_minor_x + t * c_minor_y;
+    const gfloat minus_inner_root =
+      ( -103. - 36. * sqrt(2.) ) / ( 7. + 72. * sqrt(2.) );
+    const gfloat minus_outer_root = -2.;
 
-  const float r2 = q1 * q1 + q2 * q2;
+    const gfloat a3 = -3.;
+    const gfloat a2 = ( 45739. +   7164. * sqrt(2.) ) / 10319.;
+    const gfloat a0 = ( -8926. + -14328. * sqrt(2.) ) / 10319.;
 
-  const gfloat weight =
-    r2 < (float) 1.
-    ?
-    (gfloat) ( (float) 1. - sqrtf( r2 ) )
-    :
-    (gfloat) 0.;
+    const gfloat weight =
+      (r2 >= (float) 1.)
+      ?
+      (r + minus_inner_root) * (r + minus_outer_root) * (r + minus_outer_root)
+      :
+      r2 * (a3 * r + a2) + a0;
 
-  return weight;
+    return weight;
+  }
 }
 
 static inline void
@@ -1380,12 +518,12 @@ ewa_update (const gint              j,
 {
   const gint skip = j * channels + i * row_skip;
 
-  const gfloat weight = teepee (c_major_x,
-                                c_major_y,
-                                c_minor_x,
-                                c_minor_y,
-                                x_0 - (gfloat) j,
-                                y_0 - (gfloat) i);
+  const gfloat weight = robidoux (c_major_x,
+                                  c_major_y,
+                                  c_minor_x,
+                                  c_minor_y,
+                                  x_0 - (gfloat) j,
+                                  y_0 - (gfloat) i);
 
   *total_weight += weight;
   ewa_newval[0] += weight * input_bptr[ skip     ];
@@ -1410,21 +548,21 @@ mipmap_ewa_update (const gint              level,
                          gdouble* restrict total_weight,
                          gfloat*  restrict ewa_newval)
 {
-  const gint skip = j * channels + i * row_skip;
-
   /*
-   * The factor of "2^(2*level)" = "4 << level" is because level
-   * mipmap values are averages of that many level 0 pixel values, and
-   * the "1 << level" factor in the index is because the absolute
-   * positions are correspondingly "stretched".
+   * The factor of "4^level" = "4 << level" is because level mipmap
+   * values are averages of that many level 0 pixel values, and the "1
+   * << level" factor in the index is because the absolute positions
+   * are correspondingly "stretched".
    */
   const gfloat weight = (gfloat) ( 4 << level ) *
-                        teepee (c_major_x,
-                                c_major_y,
-                                c_minor_x,
-                                c_minor_y,
-                                x - (gfloat) ( (gint) ( 1 << level ) * j),
-                                y - (gfloat) ( (gint) ( 1 << level ) * i));
+                        robidoux (c_major_x,
+                                  c_major_y,
+                                  c_minor_x,
+                                  c_minor_y,
+                                  x - (gfloat) ( (gint) ( 1 << level ) * j),
+                                  y - (gfloat) ( (gint) ( 1 << level ) * i));
+
+  const gint skip = j * channels + i * row_skip;
 
   *total_weight += weight;
   ewa_newval[0] += weight * input_bptr[ skip     ];
@@ -1467,6 +605,19 @@ gegl_sampler_lohalo_get (      GeglSampler*    restrict  self,
   const gint iy_0 = floor ((double) absolute_y);
 
   /*
+   * Using the neareast anchor pixel position is not the most
+   * efficient choice for a tensor bicubic for which anchoring an
+   * asymetrical 4 point stencil at the second pixel location in both
+   * directions is best. For one thing, it requires having at least a
+   * 5x5 stencil when dealing with possible reflexions. The reason for
+   * this less efficient choice for the upsampling component of lohalo
+   * is that we use multiple mipmap levels when downsampling, and
+   * keeping things as centered as possible minimizes the impact of
+   * the slight geometrical shifts introduced by the use of pyramid
+   * levels.
+   */
+
+  /*
    * This is the pointer we use to pull pixel from "base" mipmap level
    * (level "0"), the one with scale=1.0.
    */
@@ -1500,1127 +651,820 @@ gegl_sampler_lohalo_get (      GeglSampler*    restrict  self,
   const gint shift_back_1_pix = -shift_forw_1_pix;
   const gint shift_back_1_row = -shift_forw_1_row;
 
-  const gint shift_back_2_pix = 2 * shift_back_1_pix;
-  const gint shift_back_2_row = 2 * shift_back_1_row;
   const gint shift_forw_2_pix = 2 * shift_forw_1_pix;
   const gint shift_forw_2_row = 2 * shift_forw_1_row;
 
-  const gint uno_two_shift = shift_back_1_pix + shift_back_2_row;
-  const gint uno_thr_shift =                    shift_back_2_row;
-  const gint uno_fou_shift = shift_forw_1_pix + shift_back_2_row;
-
-  const gint dos_one_shift = shift_back_2_pix + shift_back_1_row;
-  const gint dos_two_shift = shift_back_1_pix + shift_back_1_row;
-  const gint dos_thr_shift =                    shift_back_1_row;
-  const gint dos_fou_shift = shift_forw_1_pix + shift_back_1_row;
-  const gint dos_fiv_shift = shift_forw_2_pix + shift_back_1_row;
+  const gint uno_one_shift = shift_back_1_pix + shift_back_1_row;
+  const gint uno_two_shift =                    shift_back_1_row;
+  const gint uno_thr_shift = shift_forw_1_pix + shift_back_1_row;
+  const gint uno_fou_shift = shift_forw_2_pix + shift_back_1_row;
 
-  const gint tre_one_shift = shift_back_2_pix;
-  const gint tre_two_shift = shift_back_1_pix;
-  const gint tre_thr_shift = 0;
-  const gint tre_fou_shift = shift_forw_1_pix;
-  const gint tre_fiv_shift = shift_forw_2_pix;
+  const gint dos_one_shift = shift_back_1_pix;
+  const gint dos_two_shift = 0;
+  const gint dos_thr_shift = shift_forw_1_pix;
+  const gint dos_fou_shift = shift_forw_2_pix;
 
-  const gint qua_one_shift = shift_back_2_pix + shift_forw_1_row;
-  const gint qua_two_shift = shift_back_1_pix + shift_forw_1_row;
-  const gint qua_thr_shift =                    shift_forw_1_row;
-  const gint qua_fou_shift = shift_forw_1_pix + shift_forw_1_row;
-  const gint qua_fiv_shift = shift_forw_2_pix + shift_forw_1_row;
+  const gint tre_one_shift = shift_back_1_pix + shift_forw_1_row;
+  const gint tre_two_shift =                    shift_forw_1_row;
+  const gint tre_thr_shift = shift_forw_1_pix + shift_forw_1_row;
+  const gint tre_fou_shift = shift_forw_2_pix + shift_forw_1_row;
 
-  const gint cin_two_shift = shift_back_1_pix + shift_forw_2_row;
-  const gint cin_thr_shift =                    shift_forw_2_row;
-  const gint cin_fou_shift = shift_forw_1_pix + shift_forw_2_row;
+  const gint qua_one_shift = shift_back_1_pix + shift_forw_2_row;
+  const gint qua_two_shift =                    shift_forw_2_row;
+  const gint qua_thr_shift = shift_forw_1_pix + shift_forw_2_row;
+  const gint qua_fou_shift = shift_forw_2_pix + shift_forw_2_row;
 
   /*
-   * Channel by channel computation of the new pixel values:
+   * Flip coordinates so we can assume we are in the interval [0,1].
+   */
+  const gfloat ax = x_0 >= (gfloat) 0. ? x_0 : -x_0;
+  const gfloat ay = y_0 >= (gfloat) 0. ? y_0 : -y_0;
+  /*
+   * Computation of the Mitchell-Netravali weights using an original
+   * method of N. Robidoux that only requires 13 flops to compute each
+   * group of four weights.
    */
-  gfloat uno_one_0, uno_two_0, uno_thr_0, uno_fou_0;
-  gfloat dos_one_0, dos_two_0, dos_thr_0, dos_fou_0;
-  gfloat tre_one_0, tre_two_0, tre_thr_0, tre_fou_0;
-  gfloat qua_one_0, qua_two_0, qua_thr_0, qua_fou_0;
-
-  gfloat uno_one_1, uno_two_1, uno_thr_1, uno_fou_1;
-  gfloat dos_one_1, dos_two_1, dos_thr_1, dos_fou_1;
-  gfloat tre_one_1, tre_two_1, tre_thr_1, tre_fou_1;
-  gfloat qua_one_1, qua_two_1, qua_thr_1, qua_fou_1;
-
-  gfloat uno_one_2, uno_two_2, uno_thr_2, uno_fou_2;
-  gfloat dos_one_2, dos_two_2, dos_thr_2, dos_fou_2;
-  gfloat tre_one_2, tre_two_2, tre_thr_2, tre_fou_2;
-  gfloat qua_one_2, qua_two_2, qua_thr_2, qua_fou_2;
-
-  gfloat uno_one_3, uno_two_3, uno_thr_3, uno_fou_3;
-  gfloat dos_one_3, dos_two_3, dos_thr_3, dos_fou_3;
-  gfloat tre_one_3, tre_two_3, tre_thr_3, tre_fou_3;
-  gfloat qua_one_3, qua_two_3, qua_thr_3, qua_fou_3;
+  const gfloat xt1 = (gfloat) (7./18.) * ax;
+  const gfloat yt1 = (gfloat) (7./18.) * ay;
+  const gfloat xt2 = (gfloat) 1. - ax;
+  const gfloat yt2 = (gfloat) 1. - ay;
+  const gfloat fou = ( xt1 + (gfloat) (-1./3.) ) * ax * ax;
+  const gfloat qua = ( yt1 + (gfloat) (-1./3.) ) * ay * ay;
+  const gfloat one = ( (gfloat) (1./18.) - xt1 ) * xt2 * xt2;
+  const gfloat uno = ( (gfloat) (1./18.) - yt1 ) * yt2 * yt2;
+  const gfloat xt3 = fou - one;
+  const gfloat yt3 = qua - uno;
+  const gfloat thr = ax - fou - xt3;
+  const gfloat tre = ay - qua - yt3;
+  const gfloat two = xt2 - one + xt3;
+  const gfloat dos = yt2 - uno + yt3;
 
   /*
    * The newval array will contain one computed resampled value per
    * channel:
    */
   gfloat newval[channels];
-
-  /*
-   * First channel:
-   */
-  nohalo_subdivision (input_bptr[ uno_two_shift ],
-                      input_bptr[ uno_thr_shift ],
-                      input_bptr[ uno_fou_shift ],
-                      input_bptr[ dos_one_shift ],
-                      input_bptr[ dos_two_shift ],
-                      input_bptr[ dos_thr_shift ],
-                      input_bptr[ dos_fou_shift ],
-                      input_bptr[ dos_fiv_shift ],
-                      input_bptr[ tre_one_shift ],
-                      input_bptr[ tre_two_shift ],
-                      input_bptr[ tre_thr_shift ],
-                      input_bptr[ tre_fou_shift ],
-                      input_bptr[ tre_fiv_shift ],
-                      input_bptr[ qua_one_shift ],
-                      input_bptr[ qua_two_shift ],
-                      input_bptr[ qua_thr_shift ],
-                      input_bptr[ qua_fou_shift ],
-                      input_bptr[ qua_fiv_shift ],
-                      input_bptr[ cin_two_shift ],
-                      input_bptr[ cin_thr_shift ],
-                      input_bptr[ cin_fou_shift ],
-                      &uno_one_0,
-                      &uno_two_0,
-                      &uno_thr_0,
-                      &uno_fou_0,
-                      &dos_one_0,
-                      &dos_two_0,
-                      &dos_thr_0,
-                      &dos_fou_0,
-                      &tre_one_0,
-                      &tre_two_0,
-                      &tre_thr_0,
-                      &tre_fou_0,
-                      &qua_one_0,
-                      &qua_two_0,
-                      &qua_thr_0,
-                      &qua_fou_0);
+  newval[0] = uno * ( one * input_bptr[ uno_one_shift ] +
+                      two * input_bptr[ uno_two_shift ] +
+                      thr * input_bptr[ uno_thr_shift ] +
+                      fou * input_bptr[ uno_fou_shift ] ) +
+              dos * ( one * input_bptr[ dos_one_shift ] +
+                      two * input_bptr[ dos_two_shift ] +
+                      thr * input_bptr[ dos_thr_shift ] +
+                      fou * input_bptr[ dos_fou_shift ] ) +
+              tre * ( one * input_bptr[ tre_one_shift ] +
+                      two * input_bptr[ tre_two_shift ] +
+                      thr * input_bptr[ tre_thr_shift ] +
+                      fou * input_bptr[ tre_fou_shift ] ) +
+              qua * ( one * input_bptr[ qua_one_shift ] +
+                      two * input_bptr[ qua_two_shift ] +
+                      thr * input_bptr[ qua_thr_shift ] +
+                      fou * input_bptr[ qua_fou_shift ] );
+  newval[1] = uno * ( one * input_bptr[ uno_one_shift + 1 ] +
+                      two * input_bptr[ uno_two_shift + 1 ] +
+                      thr * input_bptr[ uno_thr_shift + 1 ] +
+                      fou * input_bptr[ uno_fou_shift + 1 ] ) +
+              dos * ( one * input_bptr[ dos_one_shift + 1 ] +
+                      two * input_bptr[ dos_two_shift + 1 ] +
+                      thr * input_bptr[ dos_thr_shift + 1 ] +
+                      fou * input_bptr[ dos_fou_shift + 1 ] ) +
+              tre * ( one * input_bptr[ tre_one_shift + 1 ] +
+                      two * input_bptr[ tre_two_shift + 1 ] +
+                      thr * input_bptr[ tre_thr_shift + 1 ] +
+                      fou * input_bptr[ tre_fou_shift + 1 ] ) +
+              qua * ( one * input_bptr[ qua_one_shift + 1 ] +
+                      two * input_bptr[ qua_two_shift + 1 ] +
+                      thr * input_bptr[ qua_thr_shift + 1 ] +
+                      fou * input_bptr[ qua_fou_shift + 1 ] );
+  newval[2] = uno * ( one * input_bptr[ uno_one_shift + 2 ] +
+                      two * input_bptr[ uno_two_shift + 2 ] +
+                      thr * input_bptr[ uno_thr_shift + 2 ] +
+                      fou * input_bptr[ uno_fou_shift + 2 ] ) +
+              dos * ( one * input_bptr[ dos_one_shift + 2 ] +
+                      two * input_bptr[ dos_two_shift + 2 ] +
+                      thr * input_bptr[ dos_thr_shift + 2 ] +
+                      fou * input_bptr[ dos_fou_shift + 2 ] ) +
+              tre * ( one * input_bptr[ tre_one_shift + 2 ] +
+                      two * input_bptr[ tre_two_shift + 2 ] +
+                      thr * input_bptr[ tre_thr_shift + 2 ] +
+                      fou * input_bptr[ tre_fou_shift + 2 ] ) +
+              qua * ( one * input_bptr[ qua_one_shift + 2 ] +
+                      two * input_bptr[ qua_two_shift + 2 ] +
+                      thr * input_bptr[ qua_thr_shift + 2 ] +
+                      fou * input_bptr[ qua_fou_shift + 2 ] );
+  newval[3] = uno * ( one * input_bptr[ uno_one_shift + 3 ] +
+                      two * input_bptr[ uno_two_shift + 3 ] +
+                      thr * input_bptr[ uno_thr_shift + 3 ] +
+                      fou * input_bptr[ uno_fou_shift + 3 ] ) +
+              dos * ( one * input_bptr[ dos_one_shift + 3 ] +
+                      two * input_bptr[ dos_two_shift + 3 ] +
+                      thr * input_bptr[ dos_thr_shift + 3 ] +
+                      fou * input_bptr[ dos_fou_shift + 3 ] ) +
+              tre * ( one * input_bptr[ tre_one_shift + 3 ] +
+                      two * input_bptr[ tre_two_shift + 3 ] +
+                      thr * input_bptr[ tre_thr_shift + 3 ] +
+                      fou * input_bptr[ tre_fou_shift + 3 ] ) +
+              qua * ( one * input_bptr[ qua_one_shift + 3 ] +
+                      two * input_bptr[ qua_two_shift + 3 ] +
+                      thr * input_bptr[ qua_thr_shift + 3 ] +
+                      fou * input_bptr[ qua_fou_shift + 3 ] );
 
   {
     /*
-     * Computation of the needed weights (coefficients).
+     * Determine whether Mitchell-Netravali needs to be blended with
+     * the downsampling method (Clamped EWA with the Robidoux
+     * filter).
+     *
+     * This is done by taking the 2x2 matrix Jinv (the exact or
+     * approximate inverse Jacobian of the transformation at the
+     * location under consideration:
+     *
+     * Jinv = [ a b ] = [ dx/dX dx/dY ]
+     *        [ c d ] = [ dy/dX dy/dY ]
+     *
+     * and computes from it the major and minor axis vectors
+     * [major_x, major_y] and [minor_x,minor_y] of the smallest
+     * ellipse containing both the unit disk and the ellipse which
+     * is the image of the unit disk by the linear transformation
+     *
+     * [ a b ] [S] = [s]
+     * [ c d ] [T] = [t]
+     *
+     * The vector [S,T] is the difference between a position in
+     * output space and [X,Y], the output location under
+     * consideration; the vector [s,t] is the difference between a
+     * position in input space and [x,y], the corresponding input
+     * location.
+     *
      */
-    const gfloat xp1over2   = ( 2 * sign_of_x_0 ) * x_0;
-    const gfloat xm1over2   = xp1over2 + (gfloat) (-1.0);
-    const gfloat onepx      = (gfloat) 0.5 + xp1over2;
-    const gfloat onemx      = (gfloat) 1.5 - xp1over2;
-    const gfloat xp1over2sq = xp1over2 * xp1over2;
-
-    const gfloat yp1over2   = ( 2 * sign_of_y_0 ) * y_0;
-    const gfloat ym1over2   = yp1over2 + (gfloat) (-1.0);
-    const gfloat onepy      = (gfloat) 0.5 + yp1over2;
-    const gfloat onemy      = (gfloat) 1.5 - yp1over2;
-    const gfloat yp1over2sq = yp1over2 * yp1over2;
-
-    const gfloat xm1over2sq = xm1over2 * xm1over2;
-    const gfloat ym1over2sq = ym1over2 * ym1over2;
-
-    const gfloat twice1px = onepx + onepx;
-    const gfloat twice1py = onepy + onepy;
-    const gfloat twice1mx = onemx + onemx;
-    const gfloat twice1my = onemy + onemy;
-
-    const gfloat xm1over2sq_times_ym1over2sq = xm1over2sq * ym1over2sq;
-    const gfloat xp1over2sq_times_ym1over2sq = xp1over2sq * ym1over2sq;
-    const gfloat xp1over2sq_times_yp1over2sq = xp1over2sq * yp1over2sq;
-    const gfloat xm1over2sq_times_yp1over2sq = xm1over2sq * yp1over2sq;
-
-    const gfloat four_times_1px_times_1py = twice1px * twice1py;
-    const gfloat four_times_1mx_times_1py = twice1mx * twice1py;
-    const gfloat twice_xp1over2_times_1py = xp1over2 * twice1py;
-    const gfloat twice_xm1over2_times_1py = xm1over2 * twice1py;
-
-    const gfloat twice_xm1over2_times_1my = xm1over2 * twice1my;
-    const gfloat twice_xp1over2_times_1my = xp1over2 * twice1my;
-    const gfloat four_times_1mx_times_1my = twice1mx * twice1my;
-    const gfloat four_times_1px_times_1my = twice1px * twice1my;
-
-    const gfloat twice_1px_times_ym1over2 = twice1px * ym1over2;
-    const gfloat twice_1mx_times_ym1over2 = twice1mx * ym1over2;
-    const gfloat xp1over2_times_ym1over2  = xp1over2 * ym1over2;
-    const gfloat xm1over2_times_ym1over2  = xm1over2 * ym1over2;
-
-    const gfloat xm1over2_times_yp1over2  = xm1over2 * yp1over2;
-    const gfloat xp1over2_times_yp1over2  = xp1over2 * yp1over2;
-    const gfloat twice_1mx_times_yp1over2 = twice1mx * yp1over2;
-    const gfloat twice_1px_times_yp1over2 = twice1px * yp1over2;
-
-    const gfloat c00     =
-      four_times_1px_times_1py * xm1over2sq_times_ym1over2sq;
-    const gfloat c00dx   =
-      twice_xp1over2_times_1py * xm1over2sq_times_ym1over2sq;
-    const gfloat c00dy   =
-      twice_1px_times_yp1over2 * xm1over2sq_times_ym1over2sq;
-    const gfloat c00dxdy =
-       xp1over2_times_yp1over2 * xm1over2sq_times_ym1over2sq;
-
-    const gfloat c10     =
-      four_times_1mx_times_1py * xp1over2sq_times_ym1over2sq;
-    const gfloat c10dx   =
-      twice_xm1over2_times_1py * xp1over2sq_times_ym1over2sq;
-    const gfloat c10dy   =
-      twice_1mx_times_yp1over2 * xp1over2sq_times_ym1over2sq;
-    const gfloat c10dxdy =
-       xm1over2_times_yp1over2 * xp1over2sq_times_ym1over2sq;
-
-    const gfloat c01     =
-      four_times_1px_times_1my * xm1over2sq_times_yp1over2sq;
-    const gfloat c01dx   =
-      twice_xp1over2_times_1my * xm1over2sq_times_yp1over2sq;
-    const gfloat c01dy   =
-      twice_1px_times_ym1over2 * xm1over2sq_times_yp1over2sq;
-    const gfloat c01dxdy =
-      xp1over2_times_ym1over2 * xm1over2sq_times_yp1over2sq;
-
-    const gfloat c11     =
-      four_times_1mx_times_1my * xp1over2sq_times_yp1over2sq;
-    const gfloat c11dx   =
-      twice_xm1over2_times_1my * xp1over2sq_times_yp1over2sq;
-    const gfloat c11dy   =
-      twice_1mx_times_ym1over2 * xp1over2sq_times_yp1over2sq;
-    const gfloat c11dxdy =
-      xm1over2_times_ym1over2 * xp1over2sq_times_yp1over2sq;
-
-    newval[0] = lbb (c00,
-                     c10,
-                     c01,
-                     c11,
-                     c00dx,
-                     c10dx,
-                     c01dx,
-                     c11dx,
-                     c00dy,
-                     c10dy,
-                     c01dy,
-                     c11dy,
-                     c00dxdy,
-                     c10dxdy,
-                     c01dxdy,
-                     c11dxdy,
-                     uno_one_0,
-                     uno_two_0,
-                     uno_thr_0,
-                     uno_fou_0,
-                     dos_one_0,
-                     dos_two_0,
-                     dos_thr_0,
-                     dos_fou_0,
-                     tre_one_0,
-                     tre_two_0,
-                     tre_thr_0,
-                     tre_fou_0,
-                     qua_one_0,
-                     qua_two_0,
-                     qua_thr_0,
-                     qua_fou_0);
     /*
-     * Second channel:
+     * GOAL:
+     * Fix things so that the pullback, in input space, of a disk of
+     * radius r in output space is an ellipse which contains, at
+     * least, a disc of radius r. (Make this hold for any r>0.)
+     *
+     * ESSENCE OF THE METHOD:
+     * Compute the product of the first two factors of an SVD of the
+     * linear transformation defining the ellipse and make sure that
+     * both its columns have norm at least 1.  Because rotations and
+     * reflexions map disks to themselves, it is not necessary to
+     * compute the third (rightmost) factor of the SVD.
+     *
+     * DETAILS:
+     * Find the singular values and (unit) left singular vectors of
+     * Jinv, clamping up the singular values to 1, and multiply the
+     * unit left singular vectors by the new singular values in
+     * order to get the minor and major ellipse axis vectors.
+     *
+     * Image resampling context:
+     *
+     * The Jacobian matrix of the transformation at the output point
+     * under consideration is defined as follows:
+     *
+     * Consider the transformation (x,y) -> (X,Y) from input
+     * locations to output locations.
+     *
+     * The Jacobian matrix of the transformation at (x,y) is equal
+     * to
+     *
+     *   J = [ A, B ] = [ dX/dx, dX/dy ]
+     *       [ C, D ]   [ dY/dx, dY/dy ]
+     *
+     * that is, the vector [A,C] is the tangent vector corresponding
+     * to input changes in the horizontal direction, and the vector
+     * [B,D] is the tangent vector corresponding to input changes in
+     * the vertical direction.
+     *
+     * In the context of resampling, it is natural to use the
+     * inverse Jacobian matrix Jinv because resampling is generally
+     * performed by pulling pixel locations in the output image back
+     * to locations in the input image. Jinv is
+     *
+     *   Jinv = [ a, b ] = [ dx/dX, dx/dY ]
+     *          [ c, d ]   [ dy/dX, dy/dY ]
+     *
+     * Note: Jinv can be computed from J with the following matrix
+     * formula:
+     *
+     *   Jinv = 1/(A*D-B*C) [  D, -B ]
+     *                      [ -C,  A ]
+     *
+     * What we do is modify Jinv so that it generates an ellipse
+     * which is as close as possible to the original but which
+     * contains the unit disk. This can be accomplished as follows:
+     *
+     * Let
+     *
+     *   Jinv = U Sigma V^T
+     *
+     * be an SVD decomposition of Jinv. (The SVD is not unique, but
+     * the final ellipse does not depend on the particular SVD.)
+     *
+     * We could clamp up the entries of the diagonal matrix Sigma so
+     * that they are at least 1, and then set
+     *
+     *   Jinv = U newSigma V^T.
+     *
+     * However, we do not need to compute V for the following
+     * reason: V^T is an orthogonal matrix (that is, it represents a
+     * combination of rotations and reflexions) so that it maps the
+     * unit circle to itself. For this reason, the exact value of V
+     * does not affect the final ellipse, and we can choose V to be
+     * the identity matrix. This gives
+     *
+     *   Jinv = U newSigma.
+     *
+     * In the end, we return the two diagonal entries of newSigma
+     * together with the two columns of U.
+     *
      */
-    nohalo_subdivision (input_bptr[ uno_two_shift + 1 ],
-                        input_bptr[ uno_thr_shift + 1 ],
-                        input_bptr[ uno_fou_shift + 1 ],
-                        input_bptr[ dos_one_shift + 1 ],
-                        input_bptr[ dos_two_shift + 1 ],
-                        input_bptr[ dos_thr_shift + 1 ],
-                        input_bptr[ dos_fou_shift + 1 ],
-                        input_bptr[ dos_fiv_shift + 1 ],
-                        input_bptr[ tre_one_shift + 1 ],
-                        input_bptr[ tre_two_shift + 1 ],
-                        input_bptr[ tre_thr_shift + 1 ],
-                        input_bptr[ tre_fou_shift + 1 ],
-                        input_bptr[ tre_fiv_shift + 1 ],
-                        input_bptr[ qua_one_shift + 1 ],
-                        input_bptr[ qua_two_shift + 1 ],
-                        input_bptr[ qua_thr_shift + 1 ],
-                        input_bptr[ qua_fou_shift + 1 ],
-                        input_bptr[ qua_fiv_shift + 1 ],
-                        input_bptr[ cin_two_shift + 1 ],
-                        input_bptr[ cin_thr_shift + 1 ],
-                        input_bptr[ cin_fou_shift + 1 ],
-                        &uno_one_1,
-                        &uno_two_1,
-                        &uno_thr_1,
-                        &uno_fou_1,
-                        &dos_one_1,
-                        &dos_two_1,
-                        &dos_thr_1,
-                        &dos_fou_1,
-                        &tre_one_1,
-                        &tre_two_1,
-                        &tre_thr_1,
-                        &tre_fou_1,
-                        &qua_one_1,
-                        &qua_two_1,
-                        &qua_thr_1,
-                        &qua_fou_1);
-    newval[1] = lbb (c00,
-                     c10,
-                     c01,
-                     c11,
-                     c00dx,
-                     c10dx,
-                     c01dx,
-                     c11dx,
-                     c00dy,
-                     c10dy,
-                     c01dy,
-                     c11dy,
-                     c00dxdy,
-                     c10dxdy,
-                     c01dxdy,
-                     c11dxdy,
-                     uno_one_1,
-                     uno_two_1,
-                     uno_thr_1,
-                     uno_fou_1,
-                     dos_one_1,
-                     dos_two_1,
-                     dos_thr_1,
-                     dos_fou_1,
-                     tre_one_1,
-                     tre_two_1,
-                     tre_thr_1,
-                     tre_fou_1,
-                     qua_one_1,
-                     qua_two_1,
-                     qua_thr_1,
-                     qua_fou_1);
     /*
-     * Third channel:
+     * We compute:
+     *
+     * major_mag: half-length of the major axis of the "new"
+     *            (post-clamping) ellipse.
+     *
+     * minor_mag: half-length of the minor axis of the "new"
+     *            ellipse.
+     *
+     * major_unit_x: x-coordinate of the major axis direction vector
+     *               of both the "old" and "new" ellipses.
+     *
+     * major_unit_y: y-coordinate of the major axis direction
+     *               vector.
+     *
+     * minor_unit_x: x-coordinate of the minor axis direction
+     *               vector.
+     *
+     * minor_unit_y: y-coordinate of the minor axis direction
+     *               vector.
+     *
+     * Unit vectors are useful for computing projections, in
+     * particular, to compute the distance between a point in output
+     * space and the center of a unit disk in output space, using
+     * the position of the corresponding point [s,t] in input space.
+     * Following the clamping, the square of this distance is
+     *
+     * ( ( s * major_unit_x + t * major_unit_y ) / major_mag )^2
+     * +
+     * ( ( s * minor_unit_x + t * minor_unit_y ) / minor_mag )^2
+     *
+     * If such distances will be computed for many [s,t]'s, it makes
+     * sense to actually compute the reciprocal of major_mag and
+     * minor_mag and multiply them by the above unit lengths.
      */
-    nohalo_subdivision (input_bptr[ uno_two_shift + 2 ],
-                        input_bptr[ uno_thr_shift + 2 ],
-                        input_bptr[ uno_fou_shift + 2 ],
-                        input_bptr[ dos_one_shift + 2 ],
-                        input_bptr[ dos_two_shift + 2 ],
-                        input_bptr[ dos_thr_shift + 2 ],
-                        input_bptr[ dos_fou_shift + 2 ],
-                        input_bptr[ dos_fiv_shift + 2 ],
-                        input_bptr[ tre_one_shift + 2 ],
-                        input_bptr[ tre_two_shift + 2 ],
-                        input_bptr[ tre_thr_shift + 2 ],
-                        input_bptr[ tre_fou_shift + 2 ],
-                        input_bptr[ tre_fiv_shift + 2 ],
-                        input_bptr[ qua_one_shift + 2 ],
-                        input_bptr[ qua_two_shift + 2 ],
-                        input_bptr[ qua_thr_shift + 2 ],
-                        input_bptr[ qua_fou_shift + 2 ],
-                        input_bptr[ qua_fiv_shift + 2 ],
-                        input_bptr[ cin_two_shift + 2 ],
-                        input_bptr[ cin_thr_shift + 2 ],
-                        input_bptr[ cin_fou_shift + 2 ],
-                        &uno_one_2,
-                        &uno_two_2,
-                        &uno_thr_2,
-                        &uno_fou_2,
-                        &dos_one_2,
-                        &dos_two_2,
-                        &dos_thr_2,
-                        &dos_fou_2,
-                        &tre_one_2,
-                        &tre_two_2,
-                        &tre_thr_2,
-                        &tre_fou_2,
-                        &qua_one_2,
-                        &qua_two_2,
-                        &qua_thr_2,
-                        &qua_fou_2);
-    newval[2] = lbb (c00,
-                     c10,
-                     c01,
-                     c11,
-                     c00dx,
-                     c10dx,
-                     c01dx,
-                     c11dx,
-                     c00dy,
-                     c10dy,
-                     c01dy,
-                     c11dy,
-                     c00dxdy,
-                     c10dxdy,
-                     c01dxdy,
-                     c11dxdy,
-                     uno_one_2,
-                     uno_two_2,
-                     uno_thr_2,
-                     uno_fou_2,
-                     dos_one_2,
-                     dos_two_2,
-                     dos_thr_2,
-                     dos_fou_2,
-                     tre_one_2,
-                     tre_two_2,
-                     tre_thr_2,
-                     tre_fou_2,
-                     qua_one_2,
-                     qua_two_2,
-                     qua_thr_2,
-                     qua_fou_2);
     /*
-     * Fourth channel:
+     * History:
+     *
+     * ClampUpAxes, the ImageMagick function (found in resample.c)
+     * on which this is based, was written by Nicolas Robidoux and
+     * Chantal Racette of Laurentian University with insightful
+     * suggestions from Anthony Thyssen and funding from the
+     * National Science and Engineering Research Council of
+     * Canada. It is distinguished from its predecessors by its
+     * efficient handling of degenerate cases.
+     *
+     * The idea of clamping up the EWA ellipse's major and minor
+     * axes so that the result contains the reconstruction kernel
+     * filter support is taken from Andreas Gustaffson's Masters
+     * thesis "Interactive Image Warping", Helsinki University of
+     * Technology, Faculty of Information Technology, 59 pages, 1993
+     * (see Section 3.6).
+     *
+     * The use of the SVD to clamp up the singular values of the
+     * Jacobian matrix of the pullback transformation for EWA
+     * resampling is taken from the astrophysicist Craig DeForest.
+     * It is implemented in his PDL::Transform code (PDL = Perl Data
+     * Language).
+     *
+     * SVD reference:
+     * "We Recommend Singular Value Decomposition" by David Austin
+     * http://www.ams.org/samplings/feature-column/fcarc-svd
+     *
+     * Ellipse reference:
+     * http://en.wikipedia.org/wiki/Ellipse#Canonical_form
      */
-    nohalo_subdivision (input_bptr[ uno_two_shift + 3 ],
-                        input_bptr[ uno_thr_shift + 3 ],
-                        input_bptr[ uno_fou_shift + 3 ],
-                        input_bptr[ dos_one_shift + 3 ],
-                        input_bptr[ dos_two_shift + 3 ],
-                        input_bptr[ dos_thr_shift + 3 ],
-                        input_bptr[ dos_fou_shift + 3 ],
-                        input_bptr[ dos_fiv_shift + 3 ],
-                        input_bptr[ tre_one_shift + 3 ],
-                        input_bptr[ tre_two_shift + 3 ],
-                        input_bptr[ tre_thr_shift + 3 ],
-                        input_bptr[ tre_fou_shift + 3 ],
-                        input_bptr[ tre_fiv_shift + 3 ],
-                        input_bptr[ qua_one_shift + 3 ],
-                        input_bptr[ qua_two_shift + 3 ],
-                        input_bptr[ qua_thr_shift + 3 ],
-                        input_bptr[ qua_fou_shift + 3 ],
-                        input_bptr[ qua_fiv_shift + 3 ],
-                        input_bptr[ cin_two_shift + 3 ],
-                        input_bptr[ cin_thr_shift + 3 ],
-                        input_bptr[ cin_fou_shift + 3 ],
-                        &uno_one_3,
-                        &uno_two_3,
-                        &uno_thr_3,
-                        &uno_fou_3,
-                        &dos_one_3,
-                        &dos_two_3,
-                        &dos_thr_3,
-                        &dos_fou_3,
-                        &tre_one_3,
-                        &tre_two_3,
-                        &tre_thr_3,
-                        &tre_fou_3,
-                        &qua_one_3,
-                        &qua_two_3,
-                        &qua_thr_3,
-                        &qua_fou_3);
-    newval[3] = lbb (c00,
-                     c10,
-                     c01,
-                     c11,
-                     c00dx,
-                     c10dx,
-                     c01dx,
-                     c11dx,
-                     c00dy,
-                     c10dy,
-                     c01dy,
-                     c11dy,
-                     c00dxdy,
-                     c10dxdy,
-                     c01dxdy,
-                     c11dxdy,
-                     uno_one_3,
-                     uno_two_3,
-                     uno_thr_3,
-                     uno_fou_3,
-                     dos_one_3,
-                     dos_two_3,
-                     dos_thr_3,
-                     dos_fou_3,
-                     tre_one_3,
-                     tre_two_3,
-                     tre_thr_3,
-                     tre_fou_3,
-                     qua_one_3,
-                     qua_two_3,
-                     qua_thr_3,
-                     qua_fou_3);
-
-    {
-      /*
-       * Determine whether LBB-Nohalo needs to be blended with the
-       * downsampling method (Clamped EWA with the tent filter).
-       *
-       * This is done by taking the 2x2 matrix Jinv (the exact or
-       * approximate inverse Jacobian of the transformation at the
-       * location under consideration:
-       *
-       * Jinv = [ a b ] = [ dx/dX dx/dY ]
-       *        [ c d ] = [ dy/dX dy/dY ]
-       *
-       * and computes from it the major and minor axis vectors
-       * [major_x, major_y] and [minor_x,minor_y] of the smallest
-       * ellipse containing both the unit disk and the ellipse which
-       * is the image of the unit disk by the linear transformation
-       *
-       * [ a b ] [S] = [s]
-       * [ c d ] [T] = [t]
-       *
-       * The vector [S,T] is the difference between a position in
-       * output space and [X,Y], the output location under
-       * consideration; the vector [s,t] is the difference between a
-       * position in input space and [x,y], the corresponding input
-       * location.
-       *
-       */
-      /*
-       * GOAL:
-       * Fix things so that the pullback, in input space, of a disk of
-       * radius r in output space is an ellipse which contains, at
-       * least, a disc of radius r. (Make this hold for any r>0.)
-       *
-       * ESSENCE OF THE METHOD:
-       * Compute the product of the first two factors of an SVD of the
-       * linear transformation defining the ellipse and make sure that
-       * both its columns have norm at least 1.  Because rotations and
-       * reflexions map disks to themselves, it is not necessary to
-       * compute the third (rightmost) factor of the SVD.
-       *
-       * DETAILS:
-       * Find the singular values and (unit) left singular vectors of
-       * Jinv, clamping up the singular values to 1, and multiply the
-       * unit left singular vectors by the new singular values in
-       * order to get the minor and major ellipse axis vectors.
-       *
-       * Image resampling context:
-       *
-       * The Jacobian matrix of the transformation at the output point
-       * under consideration is defined as follows:
-       *
-       * Consider the transformation (x,y) -> (X,Y) from input
-       * locations to output locations.
-       *
-       * The Jacobian matrix of the transformation at (x,y) is equal
-       * to
-       *
-       *   J = [ A, B ] = [ dX/dx, dX/dy ]
-       *       [ C, D ]   [ dY/dx, dY/dy ]
-       *
-       * that is, the vector [A,C] is the tangent vector corresponding
-       * to input changes in the horizontal direction, and the vector
-       * [B,D] is the tangent vector corresponding to input changes in
-       * the vertical direction.
-       *
-       * In the context of resampling, it is natural to use the
-       * inverse Jacobian matrix Jinv because resampling is generally
-       * performed by pulling pixel locations in the output image back
-       * to locations in the input image. Jinv is
-       *
-       *   Jinv = [ a, b ] = [ dx/dX, dx/dY ]
-       *          [ c, d ]   [ dy/dX, dy/dY ]
-       *
-       * Note: Jinv can be computed from J with the following matrix
-       * formula:
-       *
-       *   Jinv = 1/(A*D-B*C) [  D, -B ]
-       *                      [ -C,  A ]
-       *
-       * What we do is modify Jinv so that it generates an ellipse
-       * which is as close as possible to the original but which
-       * contains the unit disk. This can be accomplished as follows:
-       *
-       * Let
-       *
-       *   Jinv = U Sigma V^T
-       *
-       * be an SVD decomposition of Jinv. (The SVD is not unique, but
-       * the final ellipse does not depend on the particular SVD.)
-       *
-       * We could clamp up the entries of the diagonal matrix Sigma so
-       * that they are at least 1, and then set
-       *
-       *   Jinv = U newSigma V^T.
-       *
-       * However, we do not need to compute V for the following
-       * reason: V^T is an orthogonal matrix (that is, it represents a
-       * combination of rotations and reflexions) so that it maps the
-       * unit circle to itself. For this reason, the exact value of V
-       * does not affect the final ellipse, and we can choose V to be
-       * the identity matrix. This gives
-       *
-       *   Jinv = U newSigma.
-       *
-       * In the end, we return the two diagonal entries of newSigma
-       * together with the two columns of U.
-       *
-       */
-      /*
-       * We compute:
-       *
-       * major_mag: half-length of the major axis of the "new"
-       *            (post-clamping) ellipse.
-       *
-       * minor_mag: half-length of the minor axis of the "new"
-       *            ellipse.
-       *
-       * major_unit_x: x-coordinate of the major axis direction vector
-       *               of both the "old" and "new" ellipses.
-       *
-       * major_unit_y: y-coordinate of the major axis direction
-       *               vector.
-       *
-       * minor_unit_x: x-coordinate of the minor axis direction
-       *               vector.
-       *
-       * minor_unit_y: y-coordinate of the minor axis direction
-       *               vector.
-       *
-       * Unit vectors are useful for computing projections, in
-       * particular, to compute the distance between a point in output
-       * space and the center of a unit disk in output space, using
-       * the position of the corresponding point [s,t] in input space.
-       * Following the clamping, the square of this distance is
-       *
-       * ( ( s * major_unit_x + t * major_unit_y ) / major_mag )^2
-       * +
-       * ( ( s * minor_unit_x + t * minor_unit_y ) / minor_mag )^2
-       *
-       * If such distances will be computed for many [s,t]'s, it makes
-       * sense to actually compute the reciprocal of major_mag and
-       * minor_mag and multiply them by the above unit lengths.
-       */
-      /*
-       * History:
-       *
-       * ClampUpAxes, the ImageMagick function (found in resample.c)
-       * on which this is based, was written by Nicolas Robidoux and
-       * Chantal Racette of Laurentian University with insightful
-       * suggestions from Anthony Thyssen and funding from the
-       * National Science and Engineering Research Council of
-       * Canada. It is distinguished from its predecessors by its
-       * efficient handling of degenerate cases.
-       *
-       * The idea of clamping up the EWA ellipse's major and minor
-       * axes so that the result contains the reconstruction kernel
-       * filter support is taken from Andreas Gustaffson's Masters
-       * thesis "Interactive Image Warping", Helsinki University of
-       * Technology, Faculty of Information Technology, 59 pages, 1993
-       * (see Section 3.6).
-       *
-       * The use of the SVD to clamp up the singular values of the
-       * Jacobian matrix of the pullback transformation for EWA
-       * resampling is taken from the astrophysicist Craig DeForest.
-       * It is implemented in his PDL::Transform code (PDL = Perl Data
-       * Language).
-       *
-       * SVD reference:
-       * "We Recommend Singular Value Decomposition" by David Austin
-       * http://www.ams.org/samplings/feature-column/fcarc-svd
-       *
-       * Ellipse reference:
-       * http://en.wikipedia.org/wiki/Ellipse#Canonical_form
-       */
-      const gdouble a = scale?scale->coeff[0][0]:1;
-      const gdouble b = scale?scale->coeff[0][1]:0;
-      const gdouble c = scale?scale->coeff[1][0]:0;
-      const gdouble d = scale?scale->coeff[1][1]:1;
-
-      /*
-       * Computations are done in double precision because "direct"
-       * SVD computations are prone to round off error. (Computing in
-       * single precision most likely would be fine.)
-       */
-      /*
-       * n is the matrix Jinv * transpose(Jinv). Eigenvalues of n are
-       * the squares of the singular values of Jinv.
-       */
-      const gdouble aa = a * a;
-      const gdouble bb = b * b;
-      const gdouble cc = c * c;
-      const gdouble dd = d * d;
-      /*
-       * Eigenvectors of n are left singular vectors of Jinv.
-       */
-      const gdouble n11 = aa + bb;
-      const gdouble n12 = a * c + b * d;
-      const gdouble n21 = n12;
-      const gdouble n22 = cc + dd;
-      const double det = a * d - b * c;
-      const double twice_det = det + det;
-      const double frobenius_squared = n11 + n22;
-      const double discriminant =
-        ( frobenius_squared + twice_det ) * ( frobenius_squared - twice_det );
-      /*
-       * In exact arithmetic, the discriminant cannot be negative. In
-       * floating point, it can, leading a non-deterministic bug in
-       * ImageMagick (now fixed, thanks to Cristy).
-       */
-      const double sqrt_discriminant =
-        sqrt (discriminant > 0. ? discriminant : 0.);
-
-      /*
-       * Initially, we only compute the squares of the singular
-       * values.
-       */
-      /*
-       * s1 is the largest singular value of the inverse Jacobian
-       * matrix. In other words, its reciprocal is the smallest
-       * singular value of the Jacobian matrix itself.  If s1 = 0,
-       * both singular values are 0, and any orthogonal pair of left
-       * and right factors produces a singular decomposition of Jinv.
-       */
-      const gdouble twice_s1s1 = frobenius_squared + sqrt_discriminant;
-      /*
-       * If s1 <= 1, the forward transformation is not downsampling in
-       * any direction, and consequently we do not need the
-       * downsampling scheme at all.
-       */
-
-      if (twice_s1s1 > (gdouble) 2.)
-        {
-          /*
-           * The result (most likely) has a nonzero teepee component.
-           */
-          const gdouble s1s1 = (gdouble) 0.5 * twice_s1s1;
-          /*
-           * s2 the smallest singular value of the inverse Jacobian
-           * matrix. Its reciprocal is the largest singular value of
-           * the Jacobian matrix itself.
-           */
-          const gdouble s2s2 = 0.5 * ( frobenius_squared - sqrt_discriminant );
-
-          const gdouble s1s1minusn11 = s1s1 - n11;
-          const gdouble s1s1minusn22 = s1s1 - n22;
-          /*
-           * u1, the first column of the U factor of a singular
-           * decomposition of Jinv, is a (non-normalized) left
-           * singular vector corresponding to s1. It has entries u11
-           * and u21. We compute u1 from the fact that it is an
-           * eigenvector of n corresponding to the eigenvalue s1^2.
-           */
-          const gdouble s1s1minusn11_squared = s1s1minusn11 * s1s1minusn11;
-          const gdouble s1s1minusn22_squared = s1s1minusn22 * s1s1minusn22;
-          /*
-           * The following selects the largest row of n-s1^2 I ("I"
-           * being the 2x2 identity matrix) as the one which is used
-           * to find the eigenvector. If both s1^2-n11 and s1^2-n22
-           * are zero, n-s1^2 I is the zero matrix.  In that case, any
-           * vector is an eigenvector; in addition, norm below is
-           * equal to zero, and, in exact arithmetic, this is the only
-           * case in which norm = 0. So, setting u1 to the simple but
-           * arbitrary vector [1,0] if norm = 0 safely takes care of
-           * all cases.
-           */
-          const gdouble temp_u11 =
-            s1s1minusn11_squared >= s1s1minusn22_squared
-            ?
-            n12
-            :
-            s1s1minusn22;
-          const gdouble temp_u21 =
-            s1s1minusn11_squared >= s1s1minusn22_squared
-            ?
-            s1s1minusn11
-            :
-            n21;
-          const gdouble norm =
-            sqrt( temp_u11 * temp_u11 + temp_u21 * temp_u21 );
-          /*
-           * Finalize the entries of first left singular vector
-           * (associated with the largest singular value).
-           */
-          const gdouble u11 =
-            norm > (gdouble) 0.0 ? temp_u11 / norm : (gdouble) 1.0;
-          const gdouble u21 =
-            norm > (gdouble) 0.0 ? temp_u21 / norm : (gdouble) 0.0;
-          /*
-           * Clamp the singular values up to 1:
-           */
-          const gdouble major_mag =
-            s1s1 <= (gdouble) 1.0 ? (gdouble) 1.0 : sqrt( s1s1 );
-          const gdouble minor_mag =
-            s2s2 <= (gdouble) 1.0 ? (gdouble) 1.0 : sqrt( s2s2 );
-          /*
-           * Unit major and minor axis direction vectors:
-           */
-          const gdouble major_unit_x =  u11;
-          const gdouble major_unit_y =  u21;
-          const gdouble minor_unit_x = -u21;
-          const gdouble minor_unit_y =  u11;
+    /*
+     * Use the scale object if defined. Otherwise, assume that the
+     * inverse Jacobian matrix is the identity.
+     */
+    const gdouble a = scale ? scale->coeff[0][0] : 1;
+    const gdouble b = scale ? scale->coeff[0][1] : 0;
+    const gdouble c = scale ? scale->coeff[1][0] : 0;
+    const gdouble d = scale ? scale->coeff[1][1] : 1;
 
-          /*
-           * The square of the distance to the key location in output
-           * place of a point [s,t] in input space is the square root of
-           *
-           * ( s * c_major_x + t * c_major_y )^2
-           * +
-           * ( s * c_minor_x + t * c_minor_y )^2.
-           */
-          const gfloat c_major_x = major_unit_x / major_mag;
-          const gfloat c_major_y = major_unit_y / major_mag;
-          const gfloat c_minor_x = minor_unit_x / minor_mag;
-          const gfloat c_minor_y = minor_unit_y / minor_mag;
+    /*
+     * Computations are done in double precision because "direct"
+     * SVD computations are prone to round off error. (Computing in
+     * single precision most likely would be fine.)
+     */
+    /*
+     * n is the matrix Jinv * transpose(Jinv). Eigenvalues of n are
+     * the squares of the singular values of Jinv.
+     */
+    const gdouble aa = a * a;
+    const gdouble bb = b * b;
+    const gdouble cc = c * c;
+    const gdouble dd = d * d;
+    /*
+     * Eigenvectors of n are left singular vectors of Jinv.
+     */
+    const gdouble n11 = aa + bb;
+    const gdouble n12 = a * c + b * d;
+    const gdouble n21 = n12;
+    const gdouble n22 = cc + dd;
+    const double det = a * d - b * c;
+    const double twice_det = det + det;
+    const double frobenius_squared = n11 + n22;
+    const double discriminant =
+      ( frobenius_squared + twice_det ) * ( frobenius_squared - twice_det );
+    /*
+     * In exact arithmetic, the discriminant cannot be negative. In
+     * floating point, it can, leading a non-deterministic bug in
+     * ImageMagick (now fixed, thanks to Cristy, the lead dev).
+     */
+    const double sqrt_discriminant =
+      sqrt (discriminant > 0. ? discriminant : 0.);
 
-          /*
-           * Remainder of the ellipse geometry computation:
-           */
-          /*
-           * Major and minor axis direction vectors:
-           */
-          const gdouble major_x = major_mag * major_unit_x;
-          const gdouble major_y = major_mag * major_unit_y;
-          const gdouble minor_x = minor_mag * minor_unit_x;
-          const gdouble minor_y = minor_mag * minor_unit_y;
+    /*
+     * Initially, we only compute the squares of the singular
+     * values.
+     */
+    /*
+     * s1 is the largest singular value of the inverse Jacobian
+     * matrix. In other words, its reciprocal is the smallest
+     * singular value of the Jacobian matrix itself.  If s1 = 0,
+     * both singular values are 0, and any orthogonal pair of left
+     * and right factors produces a singular decomposition of Jinv.
+     */
+    const gdouble twice_s1s1 = frobenius_squared + sqrt_discriminant;
+    /*
+     * If s1 <= 1, the forward transformation is not downsampling in
+     * any direction, and consequently we do not need the
+     * downsampling scheme at all.
+     */
 
-          /*
-           * Ellipse coefficients:
-           */
-          const gdouble ellipse_a =
-            major_y * major_y + minor_y * minor_y;
-          const gdouble folded_ellipse_b =
-            major_x * major_y + minor_x * minor_y;
-          const gdouble ellipse_c =
-            major_x * major_x + minor_x * minor_x;
-          const gdouble ellipse_f = major_mag * minor_mag;
+    if (twice_s1s1 > (gdouble) 2.)
+      {
+        /*
+         * The result (most likely) has a nonzero EWA component.
+         */
+        const gdouble s1s1 = (gdouble) 0.5 * twice_s1s1;
+        /*
+         * s2 the smallest singular value of the inverse Jacobian
+         * matrix. Its reciprocal is the largest singular value of
+         * the Jacobian matrix itself.
+         */
+        const gdouble s2s2 = 0.5 * ( frobenius_squared - sqrt_discriminant );
+
+        const gdouble s1s1minusn11 = s1s1 - n11;
+        const gdouble s1s1minusn22 = s1s1 - n22;
+        /*
+         * u1, the first column of the U factor of a singular
+         * decomposition of Jinv, is a (non-normalized) left
+         * singular vector corresponding to s1. It has entries u11
+         * and u21. We compute u1 from the fact that it is an
+         * eigenvector of n corresponding to the eigenvalue s1^2.
+         */
+        const gdouble s1s1minusn11_squared = s1s1minusn11 * s1s1minusn11;
+        const gdouble s1s1minusn22_squared = s1s1minusn22 * s1s1minusn22;
+        /*
+         * The following selects the largest row of n-s1^2 I ("I"
+         * being the 2x2 identity matrix) as the one which is used
+         * to find the eigenvector. If both s1^2-n11 and s1^2-n22
+         * are zero, n-s1^2 I is the zero matrix.  In that case, any
+         * vector is an eigenvector; in addition, norm below is
+         * equal to zero, and, in exact arithmetic, this is the only
+         * case in which norm = 0. So, setting u1 to the simple but
+         * arbitrary vector [1,0] if norm = 0 safely takes care of
+         * all cases.
+         */
+        const gdouble temp_u11 =
+          s1s1minusn11_squared >= s1s1minusn22_squared
+          ?
+          n12
+          :
+          s1s1minusn22;
+        const gdouble temp_u21 =
+          s1s1minusn11_squared >= s1s1minusn22_squared
+          ?
+          s1s1minusn11
+          :
+          n21;
+        const gdouble norm =
+          sqrt( temp_u11 * temp_u11 + temp_u21 * temp_u21 );
+        /*
+         * Finalize the entries of first left singular vector
+         * (associated with the largest singular value).
+         */
+        const gdouble u11 =
+          norm > (gdouble) 0.0 ? temp_u11 / norm : (gdouble) 1.0;
+        const gdouble u21 =
+          norm > (gdouble) 0.0 ? temp_u21 / norm : (gdouble) 0.0;
+        /*
+         * Clamp the singular values up to 1:
+         */
+        const gdouble major_mag =
+          s1s1 <= (gdouble) 1.0 ? (gdouble) 1.0 : sqrt( s1s1 );
+        const gdouble minor_mag =
+          s2s2 <= (gdouble) 1.0 ? (gdouble) 1.0 : sqrt( s2s2 );
+        /*
+         * Unit major and minor axis direction vectors:
+         */
+        const gdouble major_unit_x =  u11;
+        const gdouble major_unit_y =  u21;
+        const gdouble minor_unit_x = -u21;
+        const gdouble minor_unit_y =  u11;
+
+        /*
+         * The square of the distance to the key location in output
+         * place of a point [s,t] in input space is the square root of
+         *
+         * ( s * c_major_x + t * c_major_y )^2
+         * +
+         * ( s * c_minor_x + t * c_minor_y )^2.
+         */
+        const gfloat c_major_x = major_unit_x / major_mag;
+        const gfloat c_major_y = major_unit_y / major_mag;
+        const gfloat c_minor_x = minor_unit_x / minor_mag;
+        const gfloat c_minor_y = minor_unit_y / minor_mag;
+
+        /*
+         * Remainder of the ellipse geometry computation:
+         */
+        /*
+         * Major and minor axis direction vectors:
+         */
+        const gdouble major_x = major_mag * major_unit_x;
+        const gdouble major_y = major_mag * major_unit_y;
+        const gdouble minor_x = minor_mag * minor_unit_x;
+        const gdouble minor_y = minor_mag * minor_unit_y;
+
+        /*
+         * Ellipse coefficients:
+         */
+        const gdouble ellipse_a =
+          major_y * major_y + minor_y * minor_y;
+        const gdouble folded_ellipse_b =
+          major_x * major_y + minor_x * minor_y;
+        const gdouble ellipse_c =
+          major_x * major_x + minor_x * minor_x;
+        const gdouble ellipse_f = major_mag * minor_mag;
 
           /*
-           * Bounding box of the ellipse:
+           * ewa_radius is the unscaled radius, which here is 2
+           * because we use EWA Robidoux, which is based on a Keys
+           * cubic.
            */
-          const gdouble bounding_box_factor =
-            ellipse_f * ellipse_f /
-            ( ellipse_c * ellipse_a - folded_ellipse_b * folded_ellipse_b );
-          const gfloat bounding_box_half_width =
-            sqrtf( (gfloat) (ellipse_c * bounding_box_factor) );
-          const gfloat bounding_box_half_height =
-            sqrtf( (gfloat) (ellipse_a * bounding_box_factor) );
+          const gfloat ewa_radius = 2.;
+        /*
+         * Bounding box of the ellipse:
+         */
+        const gdouble bounding_box_factor =
+          ellipse_f * ellipse_f /
+          ( ellipse_c * ellipse_a - folded_ellipse_b * folded_ellipse_b );
+        const gfloat bounding_box_half_width =
+          ewa_radius * sqrtf( (gfloat) (ellipse_c * bounding_box_factor) );
+        const gfloat bounding_box_half_height =
+          ewa_radius * sqrtf( (gfloat) (ellipse_a * bounding_box_factor) );
+
+        /*
+         * Relative weight of the contribution of
+         * Mitchell-Netravali:
+         */
+        const gfloat theta = (gfloat) ( (gdouble) 1. / ellipse_f );
+
+        /*
+         * Grab the pixel values located within the level 0
+         * context_rect.  Farther ones will be accessed through
+         * higher mipmap levels.
+         */
+        const gint out_left_0 =
+          LOHALO_MAX
+          (
+            (gint) ceilf  ( (double) ( x_0 - bounding_box_half_width  ) )
+            ,
+            -LOHALO_OFFSET_0
+          );
+        const gint out_rite_0 =
+          LOHALO_MIN
+          (
+            (gint) floorf ( (double) ( x_0 + bounding_box_half_width  ) )
+            ,
+            LOHALO_OFFSET_0
+          );
+        const gint out_top_0 =
+          LOHALO_MAX
+          (
+            (gint) ceilf  ( (double) ( y_0 - bounding_box_half_height ) )
+            ,
+            -LOHALO_OFFSET_0
+          );
+        const gint out_bot_0 =
+          LOHALO_MIN
+          (
+            (gint) floorf ( (double) ( y_0 + bounding_box_half_height ) )
+            ,
+            LOHALO_OFFSET_0
+          );
+
+        /*
+         * Accumulator for the EWA weights:
+         */
+        gdouble total_weight = (gdouble) 0.0;
+        /*
+         * Storage for the EWA contribution:
+         */
+        gfloat ewa_newval[channels];
+        ewa_newval[0] = (gfloat) 0;
+        ewa_newval[1] = (gfloat) 0;
+        ewa_newval[2] = (gfloat) 0;
+        ewa_newval[3] = (gfloat) 0;
 
-          /*
-           * Relative weight of the contribution of LBB-Nohalo:
-           */
-          const gfloat theta = (gfloat) ( (gdouble) 1. / ellipse_f );
+        {
+          gint i = out_top_0;
+          do {
+            gint j = out_left_0;
+            do {
+              ewa_update (j,
+                          i,
+                          c_major_x,
+                          c_major_y,
+                          c_minor_x,
+                          c_minor_y,
+                          x_0,
+                          y_0,
+                          channels,
+                          row_skip,
+                          input_bptr,
+                          &total_weight,
+                          ewa_newval);
+            } while ( ++j <= out_rite_0 );
+          } while ( ++i <= out_bot_0 );
+        }
 
+        {
           /*
-           * Grab the pixel values located within the level 0
-           * context_rect.  Farther ones will be accessed through
-           * higher mipmap levels.
+           * In order to know whether we use higher mipmap level
+           * values, we need to check whether there is a level 1
+           * mipmap location within the ellipse. So, we need to
+           * determine the alignment of the level 1 mipmap level
+           * w.r.t. the current level 0.
+           *
+           * At level 0, we can access pixels which are at most
+           * LOHALO_OFFSET_0 away from the anchor pixel location in
+           * box distance.
            */
-          const gint out_left_0 =
-            LOHALO_MAX
-            (
-              (gint) ceilf  ( (double) ( x_0 - bounding_box_half_width  ) )
-              ,
-              -LOHALO_OFFSET_0
-            );
-          const gint out_rite_0 =
-            LOHALO_MIN
-            (
-              (gint) floorf ( (double) ( x_0 + bounding_box_half_width  ) )
-              ,
-              LOHALO_OFFSET_0
-            );
-          const gint out_top_0 =
-            LOHALO_MAX
-            (
-              (gint) ceilf  ( (double) ( y_0 - bounding_box_half_height ) )
-              ,
-              -LOHALO_OFFSET_0
-            );
-          const gint out_bot_0 =
-            LOHALO_MIN
-            (
-              (gint) floorf ( (double) ( y_0 + bounding_box_half_height ) )
-              ,
-              LOHALO_OFFSET_0
-            );
-
           /*
-           * Accumulator for the EWA weights:
+           * Determine whether the anchor level_0 pixel locations
+           * are odd (VS even):
            */
-          gdouble total_weight = (gdouble) 0.0;
+          const gint odd_ix_0 = ix_0 % 2;
+          const gint odd_iy_0 = iy_0 % 2;
           /*
-           * Storage for the EWA contribution:
+           * Find the closest locations, on all four sides, of level 1
+           * pixels which involve data not found in the level 0
+           * LOHALO_SIZE_0xLOHALO_SIZE_0.
            */
-          gfloat ewa_newval[channels];
-          ewa_newval[0] = (gfloat) 0;
-          ewa_newval[1] = (gfloat) 0;
-          ewa_newval[2] = (gfloat) 0;
-          ewa_newval[3] = (gfloat) 0;
-
-          {
-            gint i = out_top_0;
-            do {
-              gint j = out_left_0;
-              do {
-                ewa_update (j,
-                            i,
-                            c_major_x,
-                            c_major_y,
-                            c_minor_x,
-                            c_minor_y,
-                            x_0,
-                            y_0,
-                            channels,
-                            row_skip,
-                            input_bptr,
-                            &total_weight,
-                            ewa_newval);
-              } while ( ++j <= out_rite_0 );
-            } while ( ++i <= out_bot_0 );
-          }
+          LOHALO_FIND_CLOSEST_LOCATIONS(0,1)
 
-          {
-            /*
-             * In order to know whether we use higher mipmap level
-             * values, we need to check whether there is a level 1
-             * mipmap location within the ellipse. So, we need to
-             * determine the alignment of the level 1 mipmap level
-             * w.r.t. the current level 0.
-             *
-             * At level 0, we can access pixels which are at most
-             * LOHALO_OFFSET_0 away from the anchor pixel location in
-             * box distance.
-             */
-            /*
-             * Determine whether the anchor level_0 pixel locations
-             * are odd (VS even):
-             */
-            const gint odd_ix_0 = ix_0 % 2;
-            const gint odd_iy_0 = iy_0 % 2;
-            /*
-             * Find the closest locations, on all four sides, of level 1
-             * pixels which involve data not found in the level 0
-             * LOHALO_SIZE_0xLOHALO_SIZE_0.
-             */
-            LOHALO_FIND_CLOSEST_LOCATIONS(0,1)
+          if (( x_0 - bounding_box_half_width  < closest_left_1 ) ||
+              ( x_0 + bounding_box_half_width  > closest_rite_1 ) ||
+              ( y_0 - bounding_box_half_height < closest_top_1  ) ||
+              ( y_0 + bounding_box_half_height > closest_bot_1  ))
+            {
+              /*
+               * We most likely need higher mipmap level(s) because
+               * the bounding box of the ellipse covers mipmap pixel
+               * locations which involve data not "covered" by the
+               * level 0 context_rect. (The ellipse may still fail
+               * to involve mipmap level 1 values--in which case all
+               * mipmap pixel values will get 0 coefficients--but we
+               * used a quick and dirty bounding box test which lets
+               * through false positives.)
+               */
+              /*
+               * Nearest mipmap anchor pixel location:
+               */
+              const gint ix_1 = LOHALO_FLOORED_DIVISION_BY_2(ix_0);
+              const gint iy_1 = LOHALO_FLOORED_DIVISION_BY_2(iy_0);
+              /*
+               * Get pointer to mipmap level 1 data:
+               */
+              const gfloat* restrict input_bptr_1 =
+                (gfloat*) gegl_sampler_get_from_mipmap (self,
+                                                        ix_1,
+                                                        iy_1,
+                                                        (gint) 1,
+                                                        repeat_mode);
+              /*
+               * Position of the sampling location in the coordinate
+               * system defined by the mipmap "pixel locations"
+               * relative to the level 1 anchor pixel location. The
+               * "-1/2"s are because the center of a level 0 pixel
+               * is at a box distance of 1/2 from the center of the
+               * closest level 1 pixel.
+               */
+              const gfloat x_1 =
+                x_0 + (gfloat) ( ix_0 - 2 * ix_1 ) - (gfloat) 0.5;
+              const gfloat y_1 =
+                y_0 + (gfloat) ( iy_0 - 2 * iy_1 ) - (gfloat) 0.5;
+              /*
+               * Key index ranges:
+               */
+              /*
+               * The "in" indices are the closest relative mipmap 1
+               * indices of needed mipmap values:
+               */
+              LOHALO_FIND_CLOSEST_INDICES(0,1)
+              /*
+               * The "out" indices are the farthest relative mipmap 1
+               * indices we use at this level:
+               */
+              LOHALO_FIND_FARTHEST_INDICES(1)
+              /*
+               * Update using mipmap level 1 values.
+               */
+              LOHALO_MIPMAP_EWA_UPDATE(1)
 
-            if (( x_0 - bounding_box_half_width  < closest_left_1 ) ||
-                ( x_0 + bounding_box_half_width  > closest_rite_1 ) ||
-                ( y_0 - bounding_box_half_height < closest_top_1  ) ||
-                ( y_0 + bounding_box_half_height > closest_bot_1  ))
               {
-                /*
-                 * We most likely need higher mipmap level(s) because
-                 * the bounding box of the ellipse covers mipmap pixel
-                 * locations which involve data not "covered" by the
-                 * level 0 context_rect. (The ellipse may still fail
-                 * to involve mipmap level 1 values--in which case all
-                 * mipmap pixel values will get 0 coefficients--but we
-                 * used a quick and dirty bounding box test which lets
-                 * through false positives.)
-                 */
-                /*
-                 * Nearest mipmap anchor pixel location:
-                 */
-                const gint ix_1 = LOHALO_FLOORED_DIVISION_BY_2(ix_0);
-                const gint iy_1 = LOHALO_FLOORED_DIVISION_BY_2(iy_0);
-                /*
-                 * Get pointer to mipmap level 1 data:
-                 */
-                const gfloat* restrict input_bptr_1 =
+              /*
+               * Second mipmap level.
+               */
+              const gint odd_ix_1 = ix_1 % 2;
+              const gint odd_iy_1 = iy_1 % 2;
+              LOHALO_FIND_CLOSEST_LOCATIONS(1,2)
+              if (( x_1 - bounding_box_half_width  < closest_left_2 ) ||
+                  ( x_1 + bounding_box_half_width  > closest_rite_2 ) ||
+                  ( y_1 - bounding_box_half_height < closest_top_2  ) ||
+                  ( y_1 + bounding_box_half_height > closest_bot_2  ))
+                {
+                const gint ix_2 = LOHALO_FLOORED_DIVISION_BY_2(ix_1);
+                const gint iy_2 = LOHALO_FLOORED_DIVISION_BY_2(iy_1);
+                const gfloat* restrict input_bptr_2 =
                   (gfloat*) gegl_sampler_get_from_mipmap (self,
-                                                          ix_1,
-                                                          iy_1,
-                                                          (gint) 1,
+                                                          ix_2,
+                                                          iy_2,
+                                                          (gint) 2,
                                                           repeat_mode);
-                /*
-                 * Position of the sampling location in the coordinate
-                 * system defined by the mipmap "pixel locations"
-                 * relative to the level 1 anchor pixel location. The
-                 * "-1/2"s are because the center of a level 0 pixel
-                 * is at a box distance of 1/2 from the center of the
-                 * closest level 1 pixel.
-                 */
-                const gfloat x_1 =
-                  x_0 + (gfloat) ( ix_0 - 2 * ix_1 ) - (gfloat) 0.5;
-                const gfloat y_1 =
-                  y_0 + (gfloat) ( iy_0 - 2 * iy_1 ) - (gfloat) 0.5;
-                /*
-                 * Key index ranges:
-                 */
-                /*
-                 * The "in" indices are the closest relative mipmap 1
-                 * indices of needed mipmap values:
-                 */
-                LOHALO_FIND_CLOSEST_INDICES(0,1)
-                /*
-                 * The "out" indices are the farthest relative mipmap 1
-                 * indices we use at this level:
-                 */
-                LOHALO_FIND_FARTHEST_INDICES(1)
-                /*
-                 * Update using mipmap level 1 values.
-                 */
-                LOHALO_MIPMAP_EWA_UPDATE(1)
+                const gfloat x_2 =
+                  x_1 + (gfloat) ( 2 * ( ix_1 - 2 * ix_2 ) - 1 );
+                const gfloat y_2 =
+                  y_1 + (gfloat) ( 2 * ( iy_1 - 2 * iy_2 ) - 1 );
+                LOHALO_FIND_CLOSEST_INDICES(1,2)
+                LOHALO_FIND_FARTHEST_INDICES(2)
+                LOHALO_MIPMAP_EWA_UPDATE(2)
 
                 {
                 /*
-                 * Second mipmap level.
+                 * Third mipmap level.
                  */
-                const gint odd_ix_1 = ix_1 % 2;
-                const gint odd_iy_1 = iy_1 % 2;
-                LOHALO_FIND_CLOSEST_LOCATIONS(1,2)
-                if (( x_1 - bounding_box_half_width  < closest_left_2 ) ||
-                    ( x_1 + bounding_box_half_width  > closest_rite_2 ) ||
-                    ( y_1 - bounding_box_half_height < closest_top_2  ) ||
-                    ( y_1 + bounding_box_half_height > closest_bot_2  ))
+                const gint odd_ix_2 = ix_2 % 2;
+                const gint odd_iy_2 = iy_2 % 2;
+                LOHALO_FIND_CLOSEST_LOCATIONS(2,3)
+                if (( x_2 - bounding_box_half_width  < closest_left_3 ) ||
+                    ( x_2 + bounding_box_half_width  > closest_rite_3 ) ||
+                    ( y_2 - bounding_box_half_height < closest_top_3  ) ||
+                    ( y_2 + bounding_box_half_height > closest_bot_3  ))
                   {
-                  const gint ix_2 = LOHALO_FLOORED_DIVISION_BY_2(ix_1);
-                  const gint iy_2 = LOHALO_FLOORED_DIVISION_BY_2(iy_1);
-                  const gfloat* restrict input_bptr_2 =
+                  const gint ix_3 = LOHALO_FLOORED_DIVISION_BY_2(ix_2);
+                  const gint iy_3 = LOHALO_FLOORED_DIVISION_BY_2(iy_2);
+                  const gfloat* restrict input_bptr_3 =
                     (gfloat*) gegl_sampler_get_from_mipmap (self,
-                                                            ix_2,
-                                                            iy_2,
-                                                            (gint) 2,
+                                                            ix_3,
+                                                            iy_3,
+                                                            (gint) 3,
                                                             repeat_mode);
-                  const gfloat x_2 =
-                    x_1 + (gfloat) ( 2 * ( ix_1 - 2 * ix_2 ) - 1 );
-                  const gfloat y_2 =
-                    y_1 + (gfloat) ( 2 * ( iy_1 - 2 * iy_2 ) - 1 );
-                  LOHALO_FIND_CLOSEST_INDICES(1,2)
-                  LOHALO_FIND_FARTHEST_INDICES(2)
-                  LOHALO_MIPMAP_EWA_UPDATE(2)
+                  const gfloat x_3 =
+                    x_2 + (gfloat) ( 2 * ( ix_2 - 2 * ix_3 ) - 1 );
+                  const gfloat y_3 =
+                    y_2 + (gfloat) ( 2 * ( iy_2 - 2 * iy_3 ) - 1 );
+                  LOHALO_FIND_CLOSEST_INDICES(2,3)
+                  LOHALO_FIND_FARTHEST_INDICES(3)
+                  LOHALO_MIPMAP_EWA_UPDATE(3)
 
                   {
                   /*
-                   * Third mipmap level.
+                   * Fourth mipmap level.
                    */
-                  const gint odd_ix_2 = ix_2 % 2;
-                  const gint odd_iy_2 = iy_2 % 2;
-                  LOHALO_FIND_CLOSEST_LOCATIONS(2,3)
-                  if (( x_2 - bounding_box_half_width  < closest_left_3 ) ||
-                      ( x_2 + bounding_box_half_width  > closest_rite_3 ) ||
-                      ( y_2 - bounding_box_half_height < closest_top_3  ) ||
-                      ( y_2 + bounding_box_half_height > closest_bot_3  ))
+                  const gint odd_ix_3 = ix_3 % 2;
+                  const gint odd_iy_3 = iy_3 % 2;
+                  LOHALO_FIND_CLOSEST_LOCATIONS(3,4)
+                  if (( x_3 - bounding_box_half_width  < closest_left_4 ) ||
+                      ( x_3 + bounding_box_half_width  > closest_rite_4 ) ||
+                      ( y_3 - bounding_box_half_height < closest_top_4  ) ||
+                      ( y_3 + bounding_box_half_height > closest_bot_4  ))
                     {
-                    const gint ix_3 = LOHALO_FLOORED_DIVISION_BY_2(ix_2);
-                    const gint iy_3 = LOHALO_FLOORED_DIVISION_BY_2(iy_2);
-                    const gfloat* restrict input_bptr_3 =
+                    const gint ix_4 = LOHALO_FLOORED_DIVISION_BY_2(ix_3);
+                    const gint iy_4 = LOHALO_FLOORED_DIVISION_BY_2(iy_3);
+                    const gfloat* restrict input_bptr_4 =
                       (gfloat*) gegl_sampler_get_from_mipmap (self,
-                                                              ix_3,
-                                                              iy_3,
-                                                              (gint) 3,
+                                                              ix_4,
+                                                              iy_4,
+                                                              (gint) 4,
                                                               repeat_mode);
-                    const gfloat x_3 =
-                      x_2 + (gfloat) ( 2 * ( ix_2 - 2 * ix_3 ) - 1 );
-                    const gfloat y_3 =
-                      y_2 + (gfloat) ( 2 * ( iy_2 - 2 * iy_3 ) - 1 );
-                    LOHALO_FIND_CLOSEST_INDICES(2,3)
-                    LOHALO_FIND_FARTHEST_INDICES(3)
-                    LOHALO_MIPMAP_EWA_UPDATE(3)
+                    const gfloat x_4 =
+                      x_3 + (gfloat) ( 2 * ( ix_3 - 2 * ix_4 ) - 1 );
+                    const gfloat y_4 =
+                      y_3 + (gfloat) ( 2 * ( iy_3 - 2 * iy_4 ) - 1 );
+                    LOHALO_FIND_CLOSEST_INDICES(3,4)
+                    LOHALO_FIND_FARTHEST_INDICES(4)
+                    LOHALO_MIPMAP_EWA_UPDATE(4)
 
                     {
                     /*
-                     * Fourth mipmap level.
+                     * Fifth mipmap level.
                      */
-                    const gint odd_ix_3 = ix_3 % 2;
-                    const gint odd_iy_3 = iy_3 % 2;
-                    LOHALO_FIND_CLOSEST_LOCATIONS(3,4)
-                    if (( x_3 - bounding_box_half_width  < closest_left_4 ) ||
-                        ( x_3 + bounding_box_half_width  > closest_rite_4 ) ||
-                        ( y_3 - bounding_box_half_height < closest_top_4  ) ||
-                        ( y_3 + bounding_box_half_height > closest_bot_4  ))
+                    const gint odd_ix_4 = ix_4 % 2;
+                    const gint odd_iy_4 = iy_4 % 2;
+                    LOHALO_FIND_CLOSEST_LOCATIONS(4,5)
+                    if (( x_4 - bounding_box_half_width  < closest_left_5 ) ||
+                        ( x_4 + bounding_box_half_width  > closest_rite_5 ) ||
+                        ( y_4 - bounding_box_half_height < closest_top_5  ) ||
+                        ( y_4 + bounding_box_half_height > closest_bot_5  ))
                       {
-                      const gint ix_4 = LOHALO_FLOORED_DIVISION_BY_2(ix_3);
-                      const gint iy_4 = LOHALO_FLOORED_DIVISION_BY_2(iy_3);
-                      const gfloat* restrict input_bptr_4 =
+                      const gint ix_5 = LOHALO_FLOORED_DIVISION_BY_2(ix_4);
+                      const gint iy_5 = LOHALO_FLOORED_DIVISION_BY_2(iy_4);
+                      const gfloat* restrict input_bptr_5 =
                         (gfloat*) gegl_sampler_get_from_mipmap (self,
-                                                                ix_4,
-                                                                iy_4,
-                                                                (gint) 4,
+                                                                ix_5,
+                                                                iy_5,
+                                                                (gint) 5,
                                                                 repeat_mode);
-                      const gfloat x_4 =
-                        x_3 + (gfloat) ( 2 * ( ix_3 - 2 * ix_4 ) - 1 );
-                      const gfloat y_4 =
-                        y_3 + (gfloat) ( 2 * ( iy_3 - 2 * iy_4 ) - 1 );
-                      LOHALO_FIND_CLOSEST_INDICES(3,4)
-                      LOHALO_FIND_FARTHEST_INDICES(4)
-                      LOHALO_MIPMAP_EWA_UPDATE(4)
+                      const gfloat x_5 =
+                        x_4 + (gfloat) ( 2 * ( ix_4 - 2 * ix_5 ) - 1 );
+                      const gfloat y_5 =
+                        y_4 + (gfloat) ( 2 * ( iy_4 - 2 * iy_5 ) - 1 );
+                      LOHALO_FIND_CLOSEST_INDICES(4,5)
+                      LOHALO_FIND_FARTHEST_INDICES(5)
+                      LOHALO_MIPMAP_EWA_UPDATE(5)
 
                       {
                       /*
-                       * Fifth mipmap level.
+                       * Sixth mipmap level.
                        */
-                      const gint odd_ix_4 = ix_4 % 2;
-                      const gint odd_iy_4 = iy_4 % 2;
-                      LOHALO_FIND_CLOSEST_LOCATIONS(4,5)
-                      if (( x_4 - bounding_box_half_width  < closest_left_5 ) ||
-                          ( x_4 + bounding_box_half_width  > closest_rite_5 ) ||
-                          ( y_4 - bounding_box_half_height < closest_top_5  ) ||
-                          ( y_4 + bounding_box_half_height > closest_bot_5  ))
+                      const gint odd_ix_5 = ix_5 % 2;
+                      const gint odd_iy_5 = iy_5 % 2;
+                      LOHALO_FIND_CLOSEST_LOCATIONS(5,6)
+                      if (( x_5 - bounding_box_half_width
+                            < closest_left_6 ) ||
+                          ( x_5 + bounding_box_half_width
+                            > closest_rite_6 ) ||
+                          ( y_5 - bounding_box_half_height
+                            < closest_top_6  ) ||
+                          ( y_5 + bounding_box_half_height
+                            > closest_bot_6  ))
                         {
-                        const gint ix_5 = LOHALO_FLOORED_DIVISION_BY_2(ix_4);
-                        const gint iy_5 = LOHALO_FLOORED_DIVISION_BY_2(iy_4);
-                        const gfloat* restrict input_bptr_5 =
-                          (gfloat*) gegl_sampler_get_from_mipmap (self,
-                                                                  ix_5,
-                                                                  iy_5,
-                                                                  (gint) 5,
-                                                                  repeat_mode);
-                        const gfloat x_5 =
-                          x_4 + (gfloat) ( 2 * ( ix_4 - 2 * ix_5 ) - 1 );
-                        const gfloat y_5 =
-                          y_4 + (gfloat) ( 2 * ( iy_4 - 2 * iy_5 ) - 1 );
-                        LOHALO_FIND_CLOSEST_INDICES(4,5)
-                        LOHALO_FIND_FARTHEST_INDICES(5)
-                        LOHALO_MIPMAP_EWA_UPDATE(5)
+                        const gint ix_6 = LOHALO_FLOORED_DIVISION_BY_2(ix_5);
+                        const gint iy_6 = LOHALO_FLOORED_DIVISION_BY_2(iy_5);
+                        const gfloat* restrict input_bptr_6 = (gfloat*)
+                          gegl_sampler_get_from_mipmap (self,
+                                                        ix_6,
+                                                        iy_6,
+                                                        (gint) 6,
+                                                        repeat_mode);
+                        const gfloat x_6 =
+                          x_5 + (gfloat) ( 2 * ( ix_5 - 2 * ix_6 ) - 1 );
+                        const gfloat y_6 =
+                          y_5 + (gfloat) ( 2 * ( iy_5 - 2 * iy_6 ) - 1 );
+                        LOHALO_FIND_CLOSEST_INDICES(5,6)
+                        LOHALO_FIND_FARTHEST_INDICES(6)
+                        LOHALO_MIPMAP_EWA_UPDATE(6)
 
                         {
                         /*
-                         * Sixth mipmap level.
+                         * Seventh mipmap level (eight if counted
+                         * from zero = "straight up").
                          */
-                        const gint odd_ix_5 = ix_5 % 2;
-                        const gint odd_iy_5 = iy_5 % 2;
-                        LOHALO_FIND_CLOSEST_LOCATIONS(5,6)
-                        if (( x_5 - bounding_box_half_width
-                              < closest_left_6 ) ||
-                            ( x_5 + bounding_box_half_width
-                              > closest_rite_6 ) ||
-                            ( y_5 - bounding_box_half_height
-                              < closest_top_6  ) ||
-                            ( y_5 + bounding_box_half_height
-                              > closest_bot_6  ))
+                        const gint odd_ix_6 = ix_6 % 2;
+                        const gint odd_iy_6 = iy_6 % 2;
+                        LOHALO_FIND_CLOSEST_LOCATIONS(6,7)
+                        if (( x_6 - bounding_box_half_width
+                              < closest_left_7 ) ||
+                            ( x_6 + bounding_box_half_width
+                              > closest_rite_7 ) ||
+                            ( y_6 - bounding_box_half_height
+                              < closest_top_7  ) ||
+                            ( y_6 + bounding_box_half_height
+                              > closest_bot_7  ))
                           {
-                          const gint ix_6 = LOHALO_FLOORED_DIVISION_BY_2(ix_5);
-                          const gint iy_6 = LOHALO_FLOORED_DIVISION_BY_2(iy_5);
-                          const gfloat* restrict input_bptr_6 = (gfloat*)
+                          const gint ix_7 =
+                            LOHALO_FLOORED_DIVISION_BY_2(ix_6);
+                          const gint iy_7 =
+                            LOHALO_FLOORED_DIVISION_BY_2(iy_6);
+                          const gfloat* restrict input_bptr_7 = (gfloat*)
                             gegl_sampler_get_from_mipmap (self,
-                                                          ix_6,
-                                                          iy_6,
-                                                          (gint) 6,
+                                                          ix_7,
+                                                          iy_7,
+                                                          (gint) 7,
                                                           repeat_mode);
-                          const gfloat x_6 =
-                            x_5 + (gfloat) ( 2 * ( ix_5 - 2 * ix_6 ) - 1 );
-                          const gfloat y_6 =
-                            y_5 + (gfloat) ( 2 * ( iy_5 - 2 * iy_6 ) - 1 );
-                          LOHALO_FIND_CLOSEST_INDICES(5,6)
-                          LOHALO_FIND_FARTHEST_INDICES(6)
-                          LOHALO_MIPMAP_EWA_UPDATE(6)
-
-                          {
-                          /*
-                           * Seventh mipmap level (eight if counted
-                           * from zero = "straight up").
-                           */
-                          const gint odd_ix_6 = ix_6 % 2;
-                          const gint odd_iy_6 = iy_6 % 2;
-                          LOHALO_FIND_CLOSEST_LOCATIONS(6,7)
-                          if (( x_6 - bounding_box_half_width
-                                < closest_left_7 ) ||
-                              ( x_6 + bounding_box_half_width
-                                > closest_rite_7 ) ||
-                              ( y_6 - bounding_box_half_height
-                                < closest_top_7  ) ||
-                              ( y_6 + bounding_box_half_height
-                                > closest_bot_7  ))
-                            {
-                            const gint ix_7 =
-                              LOHALO_FLOORED_DIVISION_BY_2(ix_6);
-                            const gint iy_7 =
-                              LOHALO_FLOORED_DIVISION_BY_2(iy_6);
-                            const gfloat* restrict input_bptr_7 = (gfloat*)
-                              gegl_sampler_get_from_mipmap (self,
-                                                            ix_7,
-                                                            iy_7,
-                                                            (gint) 7,
-                                                            repeat_mode);
-                            const gfloat x_7 =
-                              x_6 + (gfloat) ( 2 * ( ix_6 - 2 * ix_7 ) - 1 );
-                            const gfloat y_7 =
-                              y_6 + (gfloat) ( 2 * ( iy_6 - 2 * iy_7 ) - 1 );
-                            LOHALO_FIND_CLOSEST_INDICES(6,7)
-                            LOHALO_FIND_FARTHEST_INDICES(7)
-                            LOHALO_MIPMAP_EWA_UPDATE(7)
-                            }
-                          }
+                          const gfloat x_7 =
+                            x_6 + (gfloat) ( 2 * ( ix_6 - 2 * ix_7 ) - 1 );
+                          const gfloat y_7 =
+                            y_6 + (gfloat) ( 2 * ( iy_6 - 2 * iy_7 ) - 1 );
+                          LOHALO_FIND_CLOSEST_INDICES(6,7)
+                          LOHALO_FIND_FARTHEST_INDICES(7)
+                          LOHALO_MIPMAP_EWA_UPDATE(7)
                           }
                         }
                         }
@@ -2631,27 +1475,28 @@ gegl_sampler_lohalo_get (      GeglSampler*    restrict  self,
                   }
                   }
                 }
+                }
               }
-
-            {
-              /*
-               * Blend the LBB-Nohalo and EWA results:
-               */
-              const gfloat beta =
-                (gfloat) ( ( (gdouble) 1.0 - theta ) / total_weight );
-              newval[0] = theta * newval[0] + beta * ewa_newval[0];
-              newval[1] = theta * newval[1] + beta * ewa_newval[1];
-              newval[2] = theta * newval[2] + beta * ewa_newval[2];
-              newval[3] = theta * newval[3] + beta * ewa_newval[3];
             }
+
+          {
+            /*
+             * Blend the Mitchell-Netravali and EWA Robidoux results:
+             */
+            const gfloat beta =
+              (gfloat) ( ( (gdouble) 1.0 - theta ) / total_weight );
+            newval[0] = theta * newval[0] + beta * ewa_newval[0];
+            newval[1] = theta * newval[1] + beta * ewa_newval[1];
+            newval[2] = theta * newval[2] + beta * ewa_newval[2];
+            newval[3] = theta * newval[3] + beta * ewa_newval[3];
           }
         }
+      }
 
-      /*
-       * Ship out the result:
-       */
-      babl_process (self->fish, newval, output, 1);
-      return;
-    }
+    /*
+     * Ship out the result:
+     */
+    babl_process (self->fish, newval, output, 1);
+    return;
   }
 }
diff --git a/gegl/buffer/gegl-sampler-nohalo.c b/gegl/buffer/gegl-sampler-nohalo.c
new file mode 100644
index 0000000..9a0944d
--- /dev/null
+++ b/gegl/buffer/gegl-sampler-nohalo.c
@@ -0,0 +1,2677 @@
+/* This file is part of GEGL
+ *
+ * GEGL is free software; you can redistribute it and/or modify it
+ * under the terms of the GNU Lesser General Public License as
+ * published by the Free Software Foundation; either version 3 of the
+ * License, or (at your option) any later version.
+ *
+ * GEGL is distributed in the hope that it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
+ * or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General
+ * Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with GEGL; if not, see
+ * <http://www.gnu.org/licenses/>.
+ *
+ * 2012 (c) Nicolas Robidoux
+ * 2009-2011 (c) Nicolas Robidoux, Adam Turcotte, Chantal Racette,
+ * Anthony Thyssen, John Cupitt and Ãyvind KolÃs.
+ */
+
+/*
+ * ==============
+ * NOHALO SAMPLER
+ * ==============
+ *
+ * The Nohalo ("No Halo") sampler is a Jacobian-adaptive blend of
+ * LBB-Nohalo (Nohalo subdivision with Locally Bounded Bicubic
+ * interpolation) used as an upsampler (hence "unscaled") and Clamped
+ * EWA (Elliptical Weighted Averaging) filtering with the "teepee"
+ * (radial tent, that is, conical) kernel, which is used whenever some
+ * downsampling occurs and consequently is appropriately scaled.
+ *
+ * WARNING: This version of Nohalo only gives top quality results down
+ * to about a downsampling of about ratio 1/(NOHALO_OFFSET_0+0.5).
+ * Beyond that, the quality is somewhat lower (due to the use of
+ * higher level mipmap data instead of "level 0" unfiltered input
+ * data).
+ *
+ * The use of mipmap data is not a feature of the resampling methods
+ * themselves: It is done to accommodate GEGL's preferred pixel data
+ * management system.
+ *
+ * TODO: The teepee filter probably should be replaced by filtering
+ * with the triangle (bilinear, Mexican hat function) filter, using
+ * clamped parallelograms instead of clamped ellipses (which I believe
+ * has never been done, even though it's a fairly obvious thing to
+ * do). It has better antialiasing, and is not much blurrier, although
+ * the slight added blur is probably a good thing when downsampling
+ * just a little bit.
+ */
+
+/*
+ * Reference:
+ *
+ * Nohalo subdivision (with bilinear instead of LBB "finish") is
+ * documented in
+ *
+ *   Robidoux, N., Gong, M., Cupitt, J., Turcotte, A., and Martinez,
+ *   K.  CPU, SMP and GPU implementations of Nohalo level 1, a fast
+ *   co-convex antialiasing image resampler.  In Proceedings of
+ *   C3S2E. 2009, 185-195.
+ */
+
+/*
+ * Credits and thanks:
+ *
+ * This code owes a lot to R&D performed for ImageMagick and VIPS
+ * (Virtual Image Processing System) by N. Robidoux, A. Thyssen and
+ * J. Cupitt, and student research performed by A. Turcotte and
+ * C. Racette.
+ *
+ * Jacobian adaptive resampling was developed by N. Robidoux and
+ * A. Turcotte of the Department of Mathematics and Computer Science
+ * of Laurentian University in the course of A. Turcotte's Masters in
+ * Computational Sciences (even though the eventual thesis did not
+ * include this topic). Ã. KolÃs and Michael Natterer contributed much
+ * to the GEGL implementation.
+ *
+ * Nohalo with LBB finishing scheme was developed by N. Robidoux and
+ * C. Racette of the Department of Mathematics and Computer Science of
+ * Laurentian University in the course of C. Racette's Masters in
+ * Computational Sciences. Preliminary work on Nohalo and monotone
+ * interpolation was performed by C. Racette and N. Robidoux in the
+ * course of her honours thesis, by N. Robidoux, A. Turcotte and Eric
+ * Daoust during Google Summer of Code 2009, and is based on 2009 work
+ * by N. Robidoux, A. Turcotte, J. Cupitt, Minglun Gong and Kirk
+ * Martinez. The Better Image Resampling project was started by
+ * Minglun Gong, A. Turcotte and N. Robidoux in 2007.
+ *
+ * Clamped EWA with the teepee (radial version of the (Mexican) "hat"
+ * or "triangle") filter kernel was developed by N. Robidoux and
+ * A. Thyssen the assistance of C. Racette and Frederick Weinhaus. It
+ * is based on methods of Paul Heckbert and Andreas Gustaffson (and
+ * possibly others).
+ *
+ * The programming of this and other GEGL samplers by N. Robidoux was
+ * funded by a large number of freedomsponsors.org patrons, including
+ * A. Prokoudine.
+ *
+ * N. Robidoux's early research on Nohalo funded in part by an NSERC
+ * (National Science and Engineering Research Council of Canada)
+ * Discovery Grant awarded to him (298424--2004). This, together with
+ * M. Gong's own Discovery grant and A. Turcotte's NSERC USRA
+ * (Undergraduate Summer Research Assistantship) funded the very
+ * earliest stages of this project.
+ *
+ * A. Turcotte's image resampling research on reduced halo methods and
+ * Jacobian adaptive methods funded in part by an OGS (Ontario
+ * Graduate Scholarship) and an NSERC Alexander Graham Bell Canada
+ * Graduate Scholarhip awarded to him, by GSoC (Google Summer of Code)
+ * 2010 funding awarded to GIMP (Gnu Image Manipulation Program) and
+ * by Laurentian University research funding provided by N. Robidoux
+ * and Ralf Meyer.
+ *
+ * C. Racette's image resampling research and programming funded in
+ * part by a NSERC Discovery Grant awarded to Julien Dompierre
+ * (20-61098) and by a NSERC Alexander Graham Bell Canada Graduate
+ * Scholarship awarded to her.
+ *
+ * E. Daoust's image resampling programming was funded by GSoC 2010
+ * funding awarded to GIMP.
+ *
+ * N. Robidoux thanks the above and Massimo Valentini, Geert Jordaens,
+ * Craig DeForest, Sven Neumann and R. Meyer for useful comments.
+ */
+
+/*
+ * General convention:
+ *
+ * Looking at the image as a (linear algebra) matrix, the index j has
+ * to do with the x-coordinate, that is, horizontal position, and the
+ * index i has to do with the y-coordinate (which runs from top to
+ * bottom), that is, the vertical position.
+ *
+ * However, in order to match the GIMP convention that states that
+ * pixel indices match the position of the top left corner of the
+ * corresponding pixel, so that the center of pixel (i,j) is located
+ * at (i+1/2,j+1/2), pixel center positions do NOT match their index.
+ * Earlier versions of this code did not follow this convention: They
+ * assumed that the location of the center of a pixel matched its
+ * index.
+ */
+
+#include "config.h"
+#include <glib-object.h>
+#include <math.h>
+
+#include "gegl.h"
+#include "gegl-types-internal.h"
+#include "gegl-buffer-private.h"
+
+#include "gegl-sampler-nohalo.h"
+
+/*
+ * NOHALO_MINMOD is an implementation of the minmod function which
+ * only needs two "conditional moves."
+ * NOHALO_MINMOD(a,b,a_times_a,a_times_b) "returns"
+ * minmod(a,b). The macro parameter ("input") a_times_a is assumed to
+ * contain the square of a; a_times_b, the product of a and b.
+ *
+ * For uncompressed natural images in high bit depth (images for which
+ * the slopes a and b are unlikely to be equal to zero or be equal to
+ * each other), or chips with good branch prediction, the following
+ * version of the minmod function may work well:
+ *
+ * ( (a_times_b)>=0. ? ( (a_times_b)<(a_times_a) ? (b) : (a) ) : 0. )
+ *
+ * In this version, the forward branch of the second conditional move
+ * is taken when |b|>|a| and when a*b<0. However, the "else" branch is
+ * taken when a=0 (or when a=b), which is why the above version is not
+ * as effective for images with regions with constant pixel values (or
+ * regions with pixel values which vary linearly or bilinearly) since
+ * we apply minmod to pairs of differences.
+ *
+ * The following version is more suitable for images with flat
+ * (constant) colour areas, since a, which is a pixel difference, will
+ * often be 0, in which case both forward branches are likely. This
+ * may be preferable if "branch flag look ahead" does not work so
+ * well.
+ *
+ * ( (a_times_b)>=0. ? ( (a_times_a)<=(a_times_b) ? (a) : (b) ) : 0. )
+ *
+ * This last version appears to be slightly better than the former in
+ * speed tests performed on a recent multicore Intel chip, especially
+ * when enlarging a sharp image by a large factor, hence the choice.
+ */
+
+/* #define NOHALO_MINMOD(a,b,a_times_a,a_times_b) \ */
+/*   (                                            \ */
+/*     (a_times_b) >= (gfloat) 0.                 \ */
+/*     ?                                          \ */
+/*     ( (a_times_b) < (a_times_a) ? (b) : (a) )  \ */
+/*     :                                          \ */
+/*     (gfloat) 0.                                \ */
+/*   )                                              */
+
+#define NOHALO_MINMOD(_a_,_b_,_a_times_a_,_a_times_b_) \
+  (                                                    \
+    (_a_times_b_) >= (gfloat) 0.                       \
+    ?                                                  \
+    ( (_a_times_a_) <= (_a_times_b_) ? (_a_) : (_b_) ) \
+    :                                                  \
+    (gfloat) 0.                                        \
+  )
+
+/*
+ * Macros set up so the likely winner in in the first argument
+ * (forward branch likely etc):
+ */
+#define NOHALO_MIN(_x_,_y_) ( (_x_) <= (_y_) ? (_x_) : (_y_) )
+#define NOHALO_MAX(_x_,_y_) ( (_x_) >= (_y_) ? (_x_) : (_y_) )
+#define NOHALO_ABS(_x_)  ( (_x_) >= (gfloat) 0. ? (_x_) : -(_x_) )
+#define NOHALO_SIGN(_x_) ( (_x_) >= (gfloat) 0. ? (gfloat) 1. : (gfloat) -1. )
+
+/*
+ * Special case of Knuth's floored division, that is:
+ *
+ * FLOORED_DIVISION(a,b) (((a) - ((a)<0 ? (b)-1 : 0)) / (b))
+ *
+ * When b is 2, this gives, for example,
+ *
+ * FLOORED_DIVISION_BY_2(a) (((a) - ((a)>=0 ? 0 : 1)) / 2)
+ *
+ * On a two's complement machine, this is even simpler:
+ *
+ * FLOORED_DIVISION_BY_2(a) ( (a)>>1 )
+ */
+#define NOHALO_FLOORED_DIVISION_BY_2(_a_) ( (_a_)>>1 )
+
+/*
+ * Convenience macros. _level_ and _previous_level_ must be a plain
+ * integers (like "1", "2" etc) because it is literally replaced (note
+ * the "##_level").
+ */
+
+#define NOHALO_FIND_CLOSEST_LOCATIONS(_previous_level_,_level_) \
+  const gfloat closest_left_##_level_ =                         \
+    odd_ix_##_previous_level_                                   \
+    ?                                                           \
+    (gfloat) ( -( NOHALO_OFFSET_##_previous_level_ + 1.5 ) )    \
+    :                                                           \
+    (gfloat) ( -( NOHALO_OFFSET_##_previous_level_ + 0.5 ) );   \
+  const gfloat closest_rite_##_level_ =                         \
+    odd_ix_##_previous_level_                                   \
+    ?                                                           \
+    (gfloat) (  ( NOHALO_OFFSET_##_previous_level_ + 0.5 ) )    \
+    :                                                           \
+    (gfloat) (  ( NOHALO_OFFSET_##_previous_level_ + 1.5 ) );   \
+  const gfloat closest_top_##_level_  =                         \
+    odd_iy_##_previous_level_                                   \
+    ?                                                           \
+    (gfloat) ( -( NOHALO_OFFSET_##_previous_level_ + 1.5 ) )    \
+    :                                                           \
+    (gfloat) ( -( NOHALO_OFFSET_##_previous_level_ + 0.5 ) );   \
+  const gfloat closest_bot_##_level_  =                         \
+    odd_iy_##_previous_level_                                   \
+    ?                                                           \
+    (gfloat) (  ( NOHALO_OFFSET_##_previous_level_ + 0.5 ) )    \
+    :                                                           \
+    (gfloat) (  ( NOHALO_OFFSET_##_previous_level_ + 1.5 ) );
+
+#define NOHALO_FIND_CLOSEST_INDICES(_previous_level_,_level_)             \
+  const gint in_left_##_level_ =                                          \
+    -NOHALO_OFFSET_##_previous_level_        + odd_ix_##_previous_level_; \
+  const gint in_rite_##_level_ =                                          \
+    ( NOHALO_OFFSET_##_previous_level_ - 1 ) + odd_ix_##_previous_level_; \
+  const gint in_top_##_level_  =                                          \
+    -NOHALO_OFFSET_##_previous_level_        + odd_iy_##_previous_level_; \
+  const gint in_bot_##_level_  =                                          \
+    ( NOHALO_OFFSET_##_previous_level_ - 1 ) + odd_iy_##_previous_level_;
+
+#define NOHALO_FIND_FARTHEST_INDICES(_level_)                            \
+  const gint out_left_##_level_ =                                        \
+    NOHALO_MAX                                                           \
+    (                                                                    \
+      (gint) ceilf  (                                                    \
+        (float)                                                          \
+          ( ( x_##_level_ - bounding_box_half_width  ) * (gfloat) 0.5 )) \
+      ,                                                                  \
+      -NOHALO_OFFSET_MIPMAP                                              \
+    );                                                                   \
+  const gint out_rite_##_level_ =                                        \
+    NOHALO_MIN                                                           \
+    (                                                                    \
+      (gint) floorf (                                                    \
+        (float)                                                          \
+          ( ( x_##_level_ + bounding_box_half_width  ) * (gfloat) 0.5 )) \
+      ,                                                                  \
+      NOHALO_OFFSET_MIPMAP                                               \
+    );                                                                   \
+  const gint out_top_##_level_ =                                         \
+    NOHALO_MAX                                                           \
+    (                                                                    \
+      (gint) ceilf  (                                                    \
+        (float)                                                          \
+          ( ( y_##_level_ - bounding_box_half_height ) * (gfloat) 0.5 )) \
+      ,                                                                  \
+      -NOHALO_OFFSET_MIPMAP                                              \
+    );                                                                   \
+  const gint out_bot_##_level_ =                                         \
+    NOHALO_MIN                                                           \
+    (                                                                    \
+      (gint) floorf (                                                    \
+        (float)                                                          \
+          ( ( y_##_level_ + bounding_box_half_height ) * (gfloat) 0.5 )) \
+      ,                                                                  \
+      NOHALO_OFFSET_MIPMAP                                               \
+    );
+
+#define NOHALO_MIPMAP_EWA_UPDATE(_level_)                           \
+  {                                                                 \
+    gint i;                                                         \
+    for ( i = out_top_##_level_; i <= in_top_##_level_; i++ )       \
+      {                                                             \
+        gint j = out_left_##_level_;                                \
+        do {                                                        \
+          NOHALO_MIPMAP_PIXEL_UPDATE(_level_);                      \
+        } while ( ++j <= out_rite_##_level_ );                      \
+      }                                                             \
+  }                                                                 \
+  {                                                                 \
+    gint i = in_top_##_level_ + (gint) 1;                           \
+    do {                                                            \
+      {                                                             \
+        gint j;                                                     \
+        for ( j = out_left_##_level_; j <= in_left_##_level_; j++ ) \
+          {                                                         \
+            NOHALO_MIPMAP_PIXEL_UPDATE(_level_);                    \
+          }                                                         \
+      }                                                             \
+      {                                                             \
+        gint j;                                                     \
+        for ( j = in_rite_##_level_; j <= out_rite_##_level_; j++ ) \
+          {                                                         \
+            NOHALO_MIPMAP_PIXEL_UPDATE(_level_);                    \
+          }                                                         \
+      }                                                             \
+    } while ( ++i < in_bot_##_level_ );                             \
+  }                                                                 \
+  {                                                                 \
+    gint i;                                                         \
+    for ( i = in_bot_##_level_; i <= out_bot_##_level_; i++ )       \
+      {                                                             \
+        gint j = out_left_##_level_;                                \
+        do {                                                        \
+          NOHALO_MIPMAP_PIXEL_UPDATE(_level_);                      \
+        } while ( ++j <= out_rite_##_level_ );                      \
+      }                                                             \
+  }
+
+#define NOHALO_MIPMAP_PIXEL_UPDATE(_level_)  \
+  mipmap_ewa_update (_level_,                \
+                     j,                      \
+                     i,                      \
+                     c_major_x,              \
+                     c_major_y,              \
+                     c_minor_x,              \
+                     c_minor_y,              \
+                     x_##_level_,            \
+                     y_##_level_,            \
+                     channels,               \
+                     row_skip,               \
+                     input_bptr_##_level_,   \
+                     &total_weight,          \
+                     ewa_newval)
+
+enum
+{
+  PROP_0,
+  PROP_LAST
+};
+
+static void gegl_sampler_nohalo_get (      GeglSampler* restrict  self,
+                                     const gdouble                absolute_x,
+                                     const gdouble                absolute_y,
+                                           GeglMatrix2           *scale,
+                                           void*        restrict  output,
+                                           GeglAbyssPolicy        repeat_mode);
+
+G_DEFINE_TYPE (GeglSamplerNohalo, gegl_sampler_nohalo, GEGL_TYPE_SAMPLER)
+
+static void
+gegl_sampler_nohalo_class_init (GeglSamplerNohaloClass *klass)
+{
+  GeglSamplerClass *sampler_class = GEGL_SAMPLER_CLASS (klass);
+  sampler_class->get = gegl_sampler_nohalo_get;
+}
+
+/*
+ * Because things are kept centered, the stencil width/height is 1 +
+ * twice the (size of) the offset.
+ *
+ * 5x5 is the smallest "level 0" context_rect that works with the
+ * LBB-Nohalo component of the sampler. Because 5 = 1+2*2,
+ * NOHALO_OFFSET_0 must be >= 2.
+ *
+ * Speed/quality trade-off:
+ *
+ * Downsampling quality will decrease around ratio 1/(NOHALO_OFFSET_0
+ * + .5). In addition, the smaller NOHALO_OFFSET_0, the more
+ * noticeable the artifacts. To maintain maximum quality for the
+ * widest downsampling range possible, a somewhat large
+ * NOHALO_OFFSET_0 should be used. However, the larger the "level 0"
+ * offset, the slower Nohalo will run when no significant downsampling
+ * is done, because the width and height of context_rect is
+ * (2*NOHALO_OFFSET_0+1), and consequently there is less data "tile"
+ * reuse with large NOHALO_OFFSET_0.
+ */
+/*
+ * IMPORTANT: NOHALO_OFFSET_0 SHOULD BE AN INTEGER >= 2.
+ */
+#define NOHALO_OFFSET_0 (12)
+#define NOHALO_SIZE_0 (1+2*NOHALO_OFFSET_0)
+
+/*
+ * The higher mipmap context_rects must be set so that there is at
+ * least one higher mipmap pixel location within the higher
+ * context_rect but outside the lower context_rect, irregardless of
+ * the alignment at the sampling location. I (Nicolas) have not taken
+ * the time to find the exact inequality that must be respected so
+ * that the do whiles word properly. Almost certainly, the higher
+ * mipmap level's offset should almost never be smaller than half the
+ * previous level's offset.
+ */
+#define NOHALO_OFFSET_MIPMAP (12)
+#define NOHALO_SIZE_MIPMAP (1+2*NOHALO_OFFSET_MIPMAP)
+
+#define NOHALO_OFFSET_1 NOHALO_OFFSET_MIPMAP
+#define NOHALO_SIZE_1   NOHALO_SIZE_MIPMAP
+
+#define NOHALO_OFFSET_2 NOHALO_OFFSET_MIPMAP
+#define NOHALO_SIZE_2   NOHALO_SIZE_MIPMAP
+
+#define NOHALO_OFFSET_3 NOHALO_OFFSET_MIPMAP
+#define NOHALO_SIZE_3   NOHALO_SIZE_MIPMAP
+
+#define NOHALO_OFFSET_4 NOHALO_OFFSET_MIPMAP
+#define NOHALO_SIZE_4   NOHALO_SIZE_MIPMAP
+
+#define NOHALO_OFFSET_5 NOHALO_OFFSET_MIPMAP
+#define NOHALO_SIZE_5   NOHALO_SIZE_MIPMAP
+
+#define NOHALO_OFFSET_6 NOHALO_OFFSET_MIPMAP
+#define NOHALO_SIZE_6   NOHALO_SIZE_MIPMAP
+
+#define NOHALO_OFFSET_7 (GEGL_SAMPLER_MAXIMUM_HEIGHT/2-1)
+#define NOHALO_SIZE_7   (GEGL_SAMPLER_MAXIMUM_HEIGHT)
+
+/*
+ * Nohalo always uses some mipmap level 0 values, but not always
+ * higher mipmap values.
+ */
+static void
+gegl_sampler_nohalo_init (GeglSamplerNohalo *self)
+{
+  GEGL_SAMPLER (self)->context_rect[0].x   = -NOHALO_OFFSET_0;
+  GEGL_SAMPLER (self)->context_rect[0].y   = -NOHALO_OFFSET_0;
+  GEGL_SAMPLER (self)->context_rect[0].width  = NOHALO_SIZE_0;
+  GEGL_SAMPLER (self)->context_rect[0].height = NOHALO_SIZE_0;
+
+  GEGL_SAMPLER (self)->context_rect[1].x   = -NOHALO_OFFSET_1;
+  GEGL_SAMPLER (self)->context_rect[1].y   = -NOHALO_OFFSET_1;
+  GEGL_SAMPLER (self)->context_rect[1].width  = NOHALO_SIZE_1;
+  GEGL_SAMPLER (self)->context_rect[1].height = NOHALO_SIZE_1;
+
+  GEGL_SAMPLER (self)->context_rect[2].x   = -NOHALO_OFFSET_2;
+  GEGL_SAMPLER (self)->context_rect[2].y   = -NOHALO_OFFSET_2;
+  GEGL_SAMPLER (self)->context_rect[2].width  = NOHALO_SIZE_2;
+  GEGL_SAMPLER (self)->context_rect[2].height = NOHALO_SIZE_2;
+
+  GEGL_SAMPLER (self)->context_rect[3].x   = -NOHALO_OFFSET_3;
+  GEGL_SAMPLER (self)->context_rect[3].y   = -NOHALO_OFFSET_3;
+  GEGL_SAMPLER (self)->context_rect[3].width  = NOHALO_SIZE_3;
+  GEGL_SAMPLER (self)->context_rect[3].height = NOHALO_SIZE_3;
+
+  GEGL_SAMPLER (self)->context_rect[4].x   = -NOHALO_OFFSET_4;
+  GEGL_SAMPLER (self)->context_rect[4].y   = -NOHALO_OFFSET_4;
+  GEGL_SAMPLER (self)->context_rect[4].width  = NOHALO_SIZE_4;
+  GEGL_SAMPLER (self)->context_rect[4].height = NOHALO_SIZE_4;
+
+  GEGL_SAMPLER (self)->context_rect[5].x   = -NOHALO_OFFSET_5;
+  GEGL_SAMPLER (self)->context_rect[5].y   = -NOHALO_OFFSET_5;
+  GEGL_SAMPLER (self)->context_rect[5].width  = NOHALO_SIZE_5;
+  GEGL_SAMPLER (self)->context_rect[5].height = NOHALO_SIZE_5;
+
+  GEGL_SAMPLER (self)->context_rect[6].x   = -NOHALO_OFFSET_6;
+  GEGL_SAMPLER (self)->context_rect[6].y   = -NOHALO_OFFSET_6;
+  GEGL_SAMPLER (self)->context_rect[6].width  = NOHALO_SIZE_6;
+  GEGL_SAMPLER (self)->context_rect[6].height = NOHALO_SIZE_6;
+
+  GEGL_SAMPLER (self)->context_rect[7].x   = -NOHALO_OFFSET_7;
+  GEGL_SAMPLER (self)->context_rect[7].y   = -NOHALO_OFFSET_7;
+  GEGL_SAMPLER (self)->context_rect[7].width  = NOHALO_SIZE_7;
+  GEGL_SAMPLER (self)->context_rect[7].height = NOHALO_SIZE_7;
+
+  GEGL_SAMPLER (self)->interpolate_format = babl_format ("RaGaBaA float");
+}
+
+static void inline
+nohalo_subdivision (const gfloat           uno_two,
+                    const gfloat           uno_thr,
+                    const gfloat           uno_fou,
+                    const gfloat           dos_one,
+                    const gfloat           dos_two,
+                    const gfloat           dos_thr,
+                    const gfloat           dos_fou,
+                    const gfloat           dos_fiv,
+                    const gfloat           tre_one,
+                    const gfloat           tre_two,
+                    const gfloat           tre_thr,
+                    const gfloat           tre_fou,
+                    const gfloat           tre_fiv,
+                    const gfloat           qua_one,
+                    const gfloat           qua_two,
+                    const gfloat           qua_thr,
+                    const gfloat           qua_fou,
+                    const gfloat           qua_fiv,
+                    const gfloat           cin_two,
+                    const gfloat           cin_thr,
+                    const gfloat           cin_fou,
+                          gfloat* restrict uno_one_1,
+                          gfloat* restrict uno_two_1,
+                          gfloat* restrict uno_thr_1,
+                          gfloat* restrict uno_fou_1,
+                          gfloat* restrict dos_one_1,
+                          gfloat* restrict dos_two_1,
+                          gfloat* restrict dos_thr_1,
+                          gfloat* restrict dos_fou_1,
+                          gfloat* restrict tre_one_1,
+                          gfloat* restrict tre_two_1,
+                          gfloat* restrict tre_thr_1,
+                          gfloat* restrict tre_fou_1,
+                          gfloat* restrict qua_one_1,
+                          gfloat* restrict qua_two_1,
+                          gfloat* restrict qua_thr_1,
+                          gfloat* restrict qua_fou_1)
+{
+  /*
+   * nohalo_subdivision calculates the missing twelve float density
+   * pixel values, and also returns the "already known" four, so that
+   * the sixteen values which make up the stencil of LBB are
+   * available.
+   */
+  /*
+   * THE STENCIL OF INPUT VALUES:
+   *
+   * Pointer arithmetic is used to implicitly reflect the input
+   * stencil about tre_thr---assumed closer to the sampling location
+   * than other pixels (ties are OK)---in such a way that after
+   * reflection the sampling point is to the bottom right of tre_thr.
+   *
+   * The following code and picture assumes that the stencil reflexion
+   * has already been performed.
+   *
+   *               (ix-1,iy-2)  (ix,iy-2)    (ix+1,iy-2)
+   *               =uno_two     = uno_thr    = uno_fou
+   *
+   *
+   *
+   *  (ix-2,iy-1)  (ix-1,iy-1)  (ix,iy-1)    (ix+1,iy-1)  (ix+2,iy-1)
+   *  = dos_one    = dos_two    = dos_thr    = dos_fou    = dos_fiv
+   *
+   *
+   *
+   *  (ix-2,iy)    (ix-1,iy)    (ix,iy)      (ix+1,iy)    (ix+2,iy)
+   *  = tre_one    = tre_two    = tre_thr    = tre_fou    = tre_fiv
+   *                                    X
+   *
+   *
+   *  (ix-2,iy+1)  (ix-1,iy+1)  (ix,iy+1)    (ix+1,iy+1)  (ix+2,iy+1)
+   *  = qua_one    = qua_two    = qua_thr    = qua_fou    = qua_fiv
+   *
+   *
+   *
+   *               (ix-1,iy+2)  (ix,iy+2)    (ix+1,iy+2)
+   *               = cin_two    = cin_thr    = cin_fou
+   *
+   *
+   * The above input pixel values are the ones needed in order to make
+   * available the following values, needed by LBB:
+   *
+   *  uno_one_1 =      uno_two_1 =  uno_thr_1 =      uno_fou_1 =
+   *  (ix-1/2,iy-1/2)  (ix,iy-1/2)  (ix+1/2,iy-1/2)  (ix+1,iy-1/2)
+   *
+   *
+   *
+   *
+   *  dos_one_1 =      dos_two_1 =  dos_thr_1 =      dos_fou_1 =
+   *  (ix-1/2,iy)      (ix,iy)      (ix+1/2,iy)      (ix+1,iy)
+   *
+   *                             X
+   *
+   *
+   *  tre_one_1 =      tre_two_1 =  tre_thr_1 =      tre_fou_1 =
+   *  (ix-1/2,iy+1/2)  (ix,iy+1/2)  (ix+1/2,iy+1/2)  (ix+1,iy+1/2)
+   *
+   *
+   *
+   *
+   *  qua_one_1 =      qua_two_1 =  qua_thr_1 =      qua_fou_1 =
+   *  (ix-1/2,iy+1)    (ix,iy+1)    (ix+1/2,iy+1)    (ix+1,iy+1)
+   *
+   */
+
+  /*
+   * Computation of the nonlinear slopes: If two consecutive pixel
+   * value differences have the same sign, the smallest one (in
+   * absolute value) is taken to be the corresponding slope; if the
+   * two consecutive pixel value differences don't have the same sign,
+   * the corresponding slope is set to 0.
+   *
+   * In other words: Apply minmod to consecutive differences.
+   */
+  /*
+   * Two vertical simple differences:
+   */
+  const gfloat d_unodos_two = dos_two - uno_two;
+  const gfloat d_dostre_two = tre_two - dos_two;
+  const gfloat d_trequa_two = qua_two - tre_two;
+  const gfloat d_quacin_two = cin_two - qua_two;
+  /*
+   * Thr(ee) vertical differences:
+   */
+  const gfloat d_unodos_thr = dos_thr - uno_thr;
+  const gfloat d_dostre_thr = tre_thr - dos_thr;
+  const gfloat d_trequa_thr = qua_thr - tre_thr;
+  const gfloat d_quacin_thr = cin_thr - qua_thr;
+  /*
+   * Fou(r) vertical differences:
+   */
+  const gfloat d_unodos_fou = dos_fou - uno_fou;
+  const gfloat d_dostre_fou = tre_fou - dos_fou;
+  const gfloat d_trequa_fou = qua_fou - tre_fou;
+  const gfloat d_quacin_fou = cin_fou - qua_fou;
+  /*
+   * Dos horizontal differences:
+   */
+  const gfloat d_dos_onetwo = dos_two - dos_one;
+  const gfloat d_dos_twothr = dos_thr - dos_two;
+  const gfloat d_dos_thrfou = dos_fou - dos_thr;
+  const gfloat d_dos_foufiv = dos_fiv - dos_fou;
+  /*
+   * Tre(s) horizontal differences:
+   */
+  const gfloat d_tre_onetwo = tre_two - tre_one;
+  const gfloat d_tre_twothr = tre_thr - tre_two;
+  const gfloat d_tre_thrfou = tre_fou - tre_thr;
+  const gfloat d_tre_foufiv = tre_fiv - tre_fou;
+  /*
+   * Qua(ttro) horizontal differences:
+   */
+  const gfloat d_qua_onetwo = qua_two - qua_one;
+  const gfloat d_qua_twothr = qua_thr - qua_two;
+  const gfloat d_qua_thrfou = qua_fou - qua_thr;
+  const gfloat d_qua_foufiv = qua_fiv - qua_fou;
+
+  /*
+   * Recyclable vertical products and squares:
+   */
+  const gfloat d_unodos_times_dostre_two = d_unodos_two * d_dostre_two;
+  const gfloat d_dostre_two_sq           = d_dostre_two * d_dostre_two;
+  const gfloat d_dostre_times_trequa_two = d_dostre_two * d_trequa_two;
+  const gfloat d_trequa_times_quacin_two = d_quacin_two * d_trequa_two;
+  const gfloat d_quacin_two_sq           = d_quacin_two * d_quacin_two;
+
+  const gfloat d_unodos_times_dostre_thr = d_unodos_thr * d_dostre_thr;
+  const gfloat d_dostre_thr_sq           = d_dostre_thr * d_dostre_thr;
+  const gfloat d_dostre_times_trequa_thr = d_trequa_thr * d_dostre_thr;
+  const gfloat d_trequa_times_quacin_thr = d_trequa_thr * d_quacin_thr;
+  const gfloat d_quacin_thr_sq           = d_quacin_thr * d_quacin_thr;
+
+  const gfloat d_unodos_times_dostre_fou = d_unodos_fou * d_dostre_fou;
+  const gfloat d_dostre_fou_sq           = d_dostre_fou * d_dostre_fou;
+  const gfloat d_dostre_times_trequa_fou = d_trequa_fou * d_dostre_fou;
+  const gfloat d_trequa_times_quacin_fou = d_trequa_fou * d_quacin_fou;
+  const gfloat d_quacin_fou_sq           = d_quacin_fou * d_quacin_fou;
+  /*
+   * Recyclable horizontal products and squares:
+   */
+  const gfloat d_dos_onetwo_times_twothr = d_dos_onetwo * d_dos_twothr;
+  const gfloat d_dos_twothr_sq           = d_dos_twothr * d_dos_twothr;
+  const gfloat d_dos_twothr_times_thrfou = d_dos_twothr * d_dos_thrfou;
+  const gfloat d_dos_thrfou_times_foufiv = d_dos_thrfou * d_dos_foufiv;
+  const gfloat d_dos_foufiv_sq           = d_dos_foufiv * d_dos_foufiv;
+
+  const gfloat d_tre_onetwo_times_twothr = d_tre_onetwo * d_tre_twothr;
+  const gfloat d_tre_twothr_sq           = d_tre_twothr * d_tre_twothr;
+  const gfloat d_tre_twothr_times_thrfou = d_tre_thrfou * d_tre_twothr;
+  const gfloat d_tre_thrfou_times_foufiv = d_tre_thrfou * d_tre_foufiv;
+  const gfloat d_tre_foufiv_sq           = d_tre_foufiv * d_tre_foufiv;
+
+  const gfloat d_qua_onetwo_times_twothr = d_qua_onetwo * d_qua_twothr;
+  const gfloat d_qua_twothr_sq           = d_qua_twothr * d_qua_twothr;
+  const gfloat d_qua_twothr_times_thrfou = d_qua_thrfou * d_qua_twothr;
+  const gfloat d_qua_thrfou_times_foufiv = d_qua_thrfou * d_qua_foufiv;
+  const gfloat d_qua_foufiv_sq           = d_qua_foufiv * d_qua_foufiv;
+
+  /*
+   * Minmod slopes and first level pixel values:
+   */
+  const gfloat dos_thr_y = NOHALO_MINMOD( d_dostre_thr, d_unodos_thr,
+                                          d_dostre_thr_sq,
+                                          d_unodos_times_dostre_thr );
+  const gfloat tre_thr_y = NOHALO_MINMOD( d_dostre_thr, d_trequa_thr,
+                                          d_dostre_thr_sq,
+                                          d_dostre_times_trequa_thr );
+
+  const gfloat newval_uno_two =
+    (gfloat) 0.5
+    *
+    ( dos_thr + tre_thr + (gfloat) 0.5 * ( dos_thr_y - tre_thr_y ) );
+
+  const gfloat qua_thr_y = NOHALO_MINMOD( d_quacin_thr, d_trequa_thr,
+                                          d_quacin_thr_sq,
+                                          d_trequa_times_quacin_thr );
+
+  const gfloat newval_tre_two =
+    (gfloat) 0.5
+    *
+    ( tre_thr + qua_thr + (gfloat) 0.5 * ( tre_thr_y - qua_thr_y ) );
+
+  const gfloat tre_fou_y = NOHALO_MINMOD( d_dostre_fou, d_trequa_fou,
+                                          d_dostre_fou_sq,
+                                          d_dostre_times_trequa_fou );
+  const gfloat qua_fou_y = NOHALO_MINMOD( d_quacin_fou, d_trequa_fou,
+                                          d_quacin_fou_sq,
+                                          d_trequa_times_quacin_fou );
+
+  const gfloat newval_tre_fou =
+    (gfloat) 0.5
+    *
+    ( tre_fou + qua_fou + (gfloat) 0.5 * ( tre_fou_y - qua_fou_y ) );
+
+  const gfloat dos_fou_y = NOHALO_MINMOD( d_dostre_fou, d_unodos_fou,
+                                          d_dostre_fou_sq,
+                                          d_unodos_times_dostre_fou );
+
+  const gfloat newval_uno_fou =
+    (gfloat) 0.5
+    *
+    ( dos_fou + tre_fou + (gfloat) 0.5 * (dos_fou_y - tre_fou_y ) );
+
+  const gfloat tre_two_x = NOHALO_MINMOD( d_tre_twothr, d_tre_onetwo,
+                                          d_tre_twothr_sq,
+                                          d_tre_onetwo_times_twothr );
+  const gfloat tre_thr_x = NOHALO_MINMOD( d_tre_twothr, d_tre_thrfou,
+                                          d_tre_twothr_sq,
+                                          d_tre_twothr_times_thrfou );
+
+  const gfloat newval_dos_one =
+    (gfloat) 0.5
+    *
+    ( tre_two + tre_thr + (gfloat) 0.5 * ( tre_two_x - tre_thr_x ) );
+
+  const gfloat tre_fou_x = NOHALO_MINMOD( d_tre_foufiv, d_tre_thrfou,
+                                          d_tre_foufiv_sq,
+                                          d_tre_thrfou_times_foufiv );
+
+  const gfloat tre_thr_x_minus_tre_fou_x =
+    tre_thr_x - tre_fou_x;
+
+  const gfloat newval_dos_thr =
+    (gfloat) 0.5
+    *
+    ( tre_thr + tre_fou + (gfloat) 0.5 * tre_thr_x_minus_tre_fou_x );
+
+  const gfloat qua_thr_x = NOHALO_MINMOD( d_qua_twothr, d_qua_thrfou,
+                                          d_qua_twothr_sq,
+                                          d_qua_twothr_times_thrfou );
+  const gfloat qua_fou_x = NOHALO_MINMOD( d_qua_foufiv, d_qua_thrfou,
+                                          d_qua_foufiv_sq,
+                                          d_qua_thrfou_times_foufiv );
+
+  const gfloat qua_thr_x_minus_qua_fou_x =
+    qua_thr_x - qua_fou_x;
+
+  const gfloat newval_qua_thr =
+    (gfloat) 0.5
+    *
+    ( qua_thr + qua_fou + (gfloat) 0.5 * qua_thr_x_minus_qua_fou_x );
+
+  const gfloat qua_two_x = NOHALO_MINMOD( d_qua_twothr, d_qua_onetwo,
+                                          d_qua_twothr_sq,
+                                          d_qua_onetwo_times_twothr );
+
+  const gfloat newval_qua_one =
+    (gfloat) 0.5
+    *
+    ( qua_two + qua_thr + (gfloat) 0.5 * ( qua_two_x - qua_thr_x ) );
+
+  const gfloat newval_tre_thr =
+    (gfloat) 0.5
+    *
+    (
+      newval_tre_two + newval_tre_fou
+      +
+      (gfloat) 0.25 * ( tre_thr_x_minus_tre_fou_x + qua_thr_x_minus_qua_fou_x )
+    );
+
+  const gfloat dos_thr_x = NOHALO_MINMOD( d_dos_twothr, d_dos_thrfou,
+                                          d_dos_twothr_sq,
+                                          d_dos_twothr_times_thrfou );
+  const gfloat dos_fou_x = NOHALO_MINMOD( d_dos_foufiv, d_dos_thrfou,
+                                          d_dos_foufiv_sq,
+                                          d_dos_thrfou_times_foufiv );
+
+  const gfloat newval_uno_thr =
+    (gfloat) 0.5
+    *
+    (
+      newval_uno_two + newval_dos_thr
+      +
+      (gfloat) 0.5
+      *
+      (
+        dos_fou - tre_thr
+        +
+        (gfloat) 0.5 * ( dos_fou_y - tre_fou_y + dos_thr_x - dos_fou_x )
+      )
+    );
+
+  const gfloat tre_two_y = NOHALO_MINMOD( d_dostre_two, d_trequa_two,
+                                          d_dostre_two_sq,
+                                          d_dostre_times_trequa_two );
+  const gfloat qua_two_y = NOHALO_MINMOD( d_quacin_two, d_trequa_two,
+                                          d_quacin_two_sq,
+                                          d_trequa_times_quacin_two );
+
+  const gfloat newval_tre_one =
+    (gfloat) 0.5
+    *
+    (
+      newval_dos_one + newval_tre_two
+      +
+      (gfloat) 0.5
+      *
+      (
+        qua_two - tre_thr
+        +
+        (gfloat) 0.5 * ( qua_two_x - qua_thr_x + tre_two_y - qua_two_y )
+      )
+    );
+
+
+  const gfloat dos_two_x = NOHALO_MINMOD( d_dos_twothr, d_dos_onetwo,
+                                          d_dos_twothr_sq,
+                                          d_dos_onetwo_times_twothr );
+  const gfloat dos_two_y = NOHALO_MINMOD( d_dostre_two, d_unodos_two,
+                                          d_dostre_two_sq,
+                                          d_unodos_times_dostre_two );
+
+  const gfloat newval_uno_one =
+    (gfloat) 0.25
+    *
+    (
+      dos_two + dos_thr + tre_two + tre_thr
+      +
+      (gfloat) 0.5
+      *
+      (
+        dos_two_x - dos_thr_x + tre_two_x - tre_thr_x
+        +
+        dos_two_y + dos_thr_y - tre_two_y - tre_thr_y
+      )
+    );
+
+  /*
+   * Return the sixteen LBB stencil values:
+   */
+  *uno_one_1 = newval_uno_one;
+  *uno_two_1 = newval_uno_two;
+  *uno_thr_1 = newval_uno_thr;
+  *uno_fou_1 = newval_uno_fou;
+  *dos_one_1 = newval_dos_one;
+  *dos_two_1 =        tre_thr;
+  *dos_thr_1 = newval_dos_thr;
+  *dos_fou_1 =        tre_fou;
+  *tre_one_1 = newval_tre_one;
+  *tre_two_1 = newval_tre_two;
+  *tre_thr_1 = newval_tre_thr;
+  *tre_fou_1 = newval_tre_fou;
+  *qua_one_1 = newval_qua_one;
+  *qua_two_1 =        qua_thr;
+  *qua_thr_1 = newval_qua_thr;
+  *qua_fou_1 =        qua_fou;
+}
+
+static inline gfloat
+lbb (const gfloat c00,
+     const gfloat c10,
+     const gfloat c01,
+     const gfloat c11,
+     const gfloat c00dx,
+     const gfloat c10dx,
+     const gfloat c01dx,
+     const gfloat c11dx,
+     const gfloat c00dy,
+     const gfloat c10dy,
+     const gfloat c01dy,
+     const gfloat c11dy,
+     const gfloat c00dxdy,
+     const gfloat c10dxdy,
+     const gfloat c01dxdy,
+     const gfloat c11dxdy,
+     const gfloat uno_one,
+     const gfloat uno_two,
+     const gfloat uno_thr,
+     const gfloat uno_fou,
+     const gfloat dos_one,
+     const gfloat dos_two,
+     const gfloat dos_thr,
+     const gfloat dos_fou,
+     const gfloat tre_one,
+     const gfloat tre_two,
+     const gfloat tre_thr,
+     const gfloat tre_fou,
+     const gfloat qua_one,
+     const gfloat qua_two,
+     const gfloat qua_thr,
+     const gfloat qua_fou )
+{
+  /*
+   * LBB (Locally Bounded Bicubic) is a high quality nonlinear variant
+   * of Catmull-Rom. Images resampled with LBB have much smaller halos
+   * than images resampled with windowed sincs or other interpolatory
+   * cubic spline filters. Specifically, LBB halos are narrower and
+   * the over/undershoot amplitude is smaller. This is accomplished
+   * without a significant reduction in the smoothness of the result
+   * (compared to Catmull-Rom).
+   *
+   * Another important property is that the resampled values are
+   * contained within the range of nearby input values. Consequently,
+   * no final clamping is needed to stay "in range" (e.g., 0-255 for
+   * standard 8-bit images).
+   *
+   * LBB was developed by Nicolas Robidoux and Chantal Racette of the
+   * Department of Mathematics and Computer Science of Laurentian
+   * University in the course of Chantal's Masters in Computational
+   * Sciences.
+   */
+  /*
+   * LBB is a novel method with the following properties:
+   *
+   * --LBB is a Hermite bicubic method: The bicubic surface is
+   *   defined, one convex hull of four nearby input points at a time,
+   *   using four point values, four x-derivatives, four
+   *   y-derivatives, and four cross-derivatives.
+   *
+   * --The stencil for values in a square patch is the usual 4x4.
+   *
+   * --LBB is interpolatory.
+   *
+   * --It is C^1 with continuous cross-derivatives.
+   *
+   * --When the limiters are inactive, LBB gives the same results as
+   *   Catmull-Rom.
+   *
+   * --When used on binary images, LBB gives results similar to
+   *   bicubic Hermite with all first derivatives---but not
+   *   necessarily the cross-derivatives--at the input pixel locations
+   *   set to zero.
+   *
+   * --The LBB reconstruction is locally bounded: Over each square
+   *   patch, the surface is contained between the minimum and the
+   *   maximum values among the 16 nearest input pixel values (those
+   *   in the stencil).
+   *
+   * --Consequently, the LBB reconstruction is globally bounded
+   *   between the very smallest input pixel value and the very
+   *   largest input pixel value. (It is not necessary to clamp
+   *   results.)
+   *
+   * The LBB method is based on the method of Ken Brodlie, Petros
+   * Mashwama and Sohail Butt for constraining Hermite interpolants
+   * between globally defined planes:
+   *
+   *   Visualization of surface data to preserve positivity and other
+   *   simple constraints. Computer & Graphics, Vol. 19, Number 4,
+   *   pages 585-594, 1995. DOI: 10.1016/0097-8493(95)00036-C.
+   *
+   * Instead of forcing the reconstructed surface to lie between two
+   * GLOBALLY defined planes, LBB constrains one patch at a time to
+   * lie between LOCALLY defined planes. This is accomplished by
+   * constraining the derivatives (x, y and cross) at each input pixel
+   * location so that if the constraint was applied everywhere the
+   * surface would fit between the min and max of the values at the 9
+   * closest pixel locations. Because this is done with each of the
+   * four pixel locations which define the bicubic patch, this forces
+   * the reconstructed surface to lie between the min and max of the
+   * values at the 16 closest values pixel locations. (Each corner
+   * defines its own 3x3 subgroup of the 4x4 stencil. Consequently,
+   * the surface is necessarily above the minimum of the four minima,
+   * which happens to be the minimum over the 4x4. Similarly with the
+   * maxima.)
+   *
+   * The above paragraph described the "soft" version of LBB, which is
+   * the only one used by nohalo.
+   */
+  /*
+   * STENCIL (FOOTPRINT) OF INPUT VALUES:
+   *
+   * The stencil of LBB is the same as for any standard Hermite
+   * bicubic (e.g., Catmull-Rom):
+   *
+   *  (ix-1,iy-1)  (ix,iy-1)    (ix+1,iy-1)  (ix+2,iy-1)
+   *  = uno_one    = uno_two    = uno_thr    = uno_fou
+   *
+   *  (ix-1,iy)    (ix,iy)      (ix+1,iy)    (ix+2,iy)
+   *  = dos_one    = dos_two    = dos_thr    = dos_fou
+   *                        X
+   *  (ix-1,iy+1)  (ix,iy+1)    (ix+1,iy+1)  (ix+2,iy+1)
+   *  = tre_one    = tre_two    = tre_thr    = tre_fou
+   *
+   *  (ix-1,iy+2)  (ix,iy+2)    (ix+1,iy+2)  (ix+2,iy+2)
+   *  = qua_one    = qua_two    = qua_thr    = qua_fou
+   *
+   * where ix is the floor of the requested left-to-right location
+   * ("X"), and iy is the floor of the requested up-to-down location.
+   */
+
+  /*
+   * Computation of the four min and four max over 3x3 input data
+   * sub-blocks of the 4x4 input stencil.
+   *
+   * Surprisingly, we have not succeeded in reducing the number of "?
+   * :" even though the data comes from the (co-monotone) method
+   * Nohalo so that it is known ahead of time that
+   *
+   *  dos_thr is between dos_two and dos_fou
+   *
+   *  tre_two is between dos_two and qua_two
+   *
+   *  tre_fou is between dos_fou and qua_fou
+   *
+   *  qua_thr is between qua_two and qua_fou
+   *
+   *  tre_thr is in the convex hull of dos_two, dos_fou, qua_two and qua_fou
+   *
+   *  to minimize the number of flags and conditional moves.
+   *
+   * (The "between" are not strict: "a between b and c" means
+   *
+   * "min(b,c) <= a <= max(b,c)".)
+   *
+   * We have, however, succeeded in eliminating one flag computation
+   * (one comparison) and one use of an intermediate result. See the
+   * two commented out lines below.
+   *
+   * Overall, only 27 comparisons are needed (to compute 4 mins and 4
+   * maxes!). Without the simplification, 28 comparisons would be
+   * used. Either way, the number of "? :" used is 34. If you can
+   * figure how to do this more efficiently, let us know.
+   */
+  const gfloat m1    = (dos_two <= dos_thr) ? dos_two : dos_thr  ;
+  const gfloat M1    = (dos_two <= dos_thr) ? dos_thr : dos_two  ;
+  const gfloat m2    = (tre_two <= tre_thr) ? tre_two : tre_thr  ;
+  const gfloat M2    = (tre_two <= tre_thr) ? tre_thr : tre_two  ;
+  const gfloat m4    = (qua_two <= qua_thr) ? qua_two : qua_thr  ;
+  const gfloat M4    = (qua_two <= qua_thr) ? qua_thr : qua_two  ;
+  const gfloat m3    = (uno_two <= uno_thr) ? uno_two : uno_thr  ;
+  const gfloat M3    = (uno_two <= uno_thr) ? uno_thr : uno_two  ;
+  const gfloat m5    = NOHALO_MIN(            m1,       m2      );
+  const gfloat M5    = NOHALO_MAX(            M1,       M2      );
+  const gfloat m6    = (dos_one <= tre_one) ? dos_one : tre_one  ;
+  const gfloat M6    = (dos_one <= tre_one) ? tre_one : dos_one  ;
+  const gfloat m7    = (dos_fou <= tre_fou) ? dos_fou : tre_fou  ;
+  const gfloat M7    = (dos_fou <= tre_fou) ? tre_fou : dos_fou  ;
+  const gfloat m13   = (dos_fou <= qua_fou) ? dos_fou : qua_fou  ;
+  const gfloat M13   = (dos_fou <= qua_fou) ? qua_fou : dos_fou  ;
+  /*
+   * Because the data comes from Nohalo subdivision, the following two
+   * lines can be replaced by the above, "simpler," two lines without
+   * changing the results.
+   *
+   * const gfloat m13   = NOHALO_MIN(            m7,       qua_fou );
+   * const gfloat M13   = NOHALO_MAX(            M7,       qua_fou );
+   *
+   * This allows for the comparisons to be reordered to put breathing
+   * room between the computation of a result and its use.
+   */
+  const gfloat m9    = NOHALO_MIN(            m5,       m4      );
+  const gfloat M9    = NOHALO_MAX(            M5,       M4      );
+  const gfloat m11   = NOHALO_MIN(            m6,       qua_one );
+  const gfloat M11   = NOHALO_MAX(            M6,       qua_one );
+  const gfloat m10   = NOHALO_MIN(            m6,       uno_one );
+  const gfloat M10   = NOHALO_MAX(            M6,       uno_one );
+  const gfloat m8    = NOHALO_MIN(            m5,       m3      );
+  const gfloat M8    = NOHALO_MAX(            M5,       M3      );
+  const gfloat m12   = NOHALO_MIN(            m7,       uno_fou );
+  const gfloat M12   = NOHALO_MAX(            M7,       uno_fou );
+  const gfloat min11 = NOHALO_MIN(            m9,       m13     );
+  const gfloat max11 = NOHALO_MAX(            M9,       M13     );
+  const gfloat min01 = NOHALO_MIN(            m9,       m11     );
+  const gfloat max01 = NOHALO_MAX(            M9,       M11     );
+  const gfloat min00 = NOHALO_MIN(            m8,       m10     );
+  const gfloat max00 = NOHALO_MAX(            M8,       M10     );
+  const gfloat min10 = NOHALO_MIN(            m8,       m12     );
+  const gfloat max10 = NOHALO_MAX(            M8,       M12     );
+
+  /*
+   * The remainder of the "per channel" computation involves the
+   * computation of:
+   *
+   * --8 conditional moves,
+   *
+   * --8 signs (in which the sign of zero is unimportant),
+   *
+   * --12 minima of two values,
+   *
+   * --8 maxima of two values,
+   *
+   * --8 absolute values,
+   *
+   * for a grand total of 29 minima, 25 maxima, 8 conditional moves, 8
+   * signs, and 8 absolute values. If everything is done with
+   * conditional moves, "only" 28+8+8+12+8+8=72 flags are involved
+   * (because initial min and max can be computed with one flag).
+   *
+   * The "per channel" part of the computation also involves 107
+   * arithmetic operations (54 *, 21 +, 42 -).
+   */
+
+  /*
+   * Distances to the local min and max:
+   */
+  const gfloat u11 = tre_thr - min11;
+  const gfloat v11 = max11 - tre_thr;
+  const gfloat u01 = tre_two - min01;
+  const gfloat v01 = max01 - tre_two;
+  const gfloat u00 = dos_two - min00;
+  const gfloat v00 = max00 - dos_two;
+  const gfloat u10 = dos_thr - min10;
+  const gfloat v10 = max10 - dos_thr;
+
+  /*
+   * Initial values of the derivatives computed with centered
+   * differences. Factors of 1/2 are left out because they are folded
+   * in later:
+   */
+  const gfloat dble_dzdx00i = dos_thr - dos_one;
+  const gfloat dble_dzdy11i = qua_thr - dos_thr;
+  const gfloat dble_dzdx10i = dos_fou - dos_two;
+  const gfloat dble_dzdy01i = qua_two - dos_two;
+  const gfloat dble_dzdx01i = tre_thr - tre_one;
+  const gfloat dble_dzdy10i = tre_thr - uno_thr;
+  const gfloat dble_dzdx11i = tre_fou - tre_two;
+  const gfloat dble_dzdy00i = tre_two - uno_two;
+
+  /*
+   * Signs of the derivatives. The upcoming clamping does not change
+   * them (except if the clamping sends a negative derivative to 0, in
+   * which case the sign does not matter anyway).
+   */
+  const gfloat sign_dzdx00 = NOHALO_SIGN( dble_dzdx00i );
+  const gfloat sign_dzdx10 = NOHALO_SIGN( dble_dzdx10i );
+  const gfloat sign_dzdx01 = NOHALO_SIGN( dble_dzdx01i );
+  const gfloat sign_dzdx11 = NOHALO_SIGN( dble_dzdx11i );
+
+  const gfloat sign_dzdy00 = NOHALO_SIGN( dble_dzdy00i );
+  const gfloat sign_dzdy10 = NOHALO_SIGN( dble_dzdy10i );
+  const gfloat sign_dzdy01 = NOHALO_SIGN( dble_dzdy01i );
+  const gfloat sign_dzdy11 = NOHALO_SIGN( dble_dzdy11i );
+
+  /*
+   * Initial values of the cross-derivatives. Factors of 1/4 are left
+   * out because folded in later:
+   */
+  const gfloat quad_d2zdxdy00i = uno_one - uno_thr + dble_dzdx01i;
+  const gfloat quad_d2zdxdy10i = uno_two - uno_fou + dble_dzdx11i;
+  const gfloat quad_d2zdxdy01i = qua_thr - qua_one - dble_dzdx00i;
+  const gfloat quad_d2zdxdy11i = qua_fou - qua_two - dble_dzdx10i;
+
+  /*
+   * Slope limiters. The key multiplier is 3 but we fold a factor of
+   * 2, hence 6:
+   */
+  const gfloat dble_slopelimit_00 = (gfloat) 6.0 * NOHALO_MIN( u00, v00 );
+  const gfloat dble_slopelimit_10 = (gfloat) 6.0 * NOHALO_MIN( u10, v10 );
+  const gfloat dble_slopelimit_01 = (gfloat) 6.0 * NOHALO_MIN( u01, v01 );
+  const gfloat dble_slopelimit_11 = (gfloat) 6.0 * NOHALO_MIN( u11, v11 );
+
+  /*
+   * Clamped first derivatives:
+   */
+  const gfloat dble_dzdx00 =
+    ( sign_dzdx00 * dble_dzdx00i <= dble_slopelimit_00 )
+    ? dble_dzdx00i :  sign_dzdx00 * dble_slopelimit_00;
+  const gfloat dble_dzdy00 =
+    ( sign_dzdy00 * dble_dzdy00i <= dble_slopelimit_00 )
+    ? dble_dzdy00i :  sign_dzdy00 * dble_slopelimit_00;
+  const gfloat dble_dzdx10 =
+    ( sign_dzdx10 * dble_dzdx10i <= dble_slopelimit_10 )
+    ? dble_dzdx10i :  sign_dzdx10 * dble_slopelimit_10;
+  const gfloat dble_dzdy10 =
+    ( sign_dzdy10 * dble_dzdy10i <= dble_slopelimit_10 )
+    ? dble_dzdy10i :  sign_dzdy10 * dble_slopelimit_10;
+  const gfloat dble_dzdx01 =
+    ( sign_dzdx01 * dble_dzdx01i <= dble_slopelimit_01 )
+    ? dble_dzdx01i :  sign_dzdx01 * dble_slopelimit_01;
+  const gfloat dble_dzdy01 =
+    ( sign_dzdy01 * dble_dzdy01i <= dble_slopelimit_01 )
+    ? dble_dzdy01i :  sign_dzdy01 * dble_slopelimit_01;
+  const gfloat dble_dzdx11 =
+    ( sign_dzdx11 * dble_dzdx11i <= dble_slopelimit_11 )
+    ? dble_dzdx11i :  sign_dzdx11 * dble_slopelimit_11;
+  const gfloat dble_dzdy11 =
+    ( sign_dzdy11 * dble_dzdy11i <= dble_slopelimit_11 )
+    ? dble_dzdy11i :  sign_dzdy11 * dble_slopelimit_11;
+
+  /*
+   * Sums and differences of first derivatives:
+   */
+  const gfloat twelve_sum00 = (gfloat) 6.0 * ( dble_dzdx00 + dble_dzdy00 );
+  const gfloat twelve_dif00 = (gfloat) 6.0 * ( dble_dzdx00 - dble_dzdy00 );
+  const gfloat twelve_sum10 = (gfloat) 6.0 * ( dble_dzdx10 + dble_dzdy10 );
+  const gfloat twelve_dif10 = (gfloat) 6.0 * ( dble_dzdx10 - dble_dzdy10 );
+  const gfloat twelve_sum01 = (gfloat) 6.0 * ( dble_dzdx01 + dble_dzdy01 );
+  const gfloat twelve_dif01 = (gfloat) 6.0 * ( dble_dzdx01 - dble_dzdy01 );
+  const gfloat twelve_sum11 = (gfloat) 6.0 * ( dble_dzdx11 + dble_dzdy11 );
+  const gfloat twelve_dif11 = (gfloat) 6.0 * ( dble_dzdx11 - dble_dzdy11 );
+
+  /*
+   * Absolute values of the sums:
+   */
+  const gfloat twelve_abs_sum00 = NOHALO_ABS( twelve_sum00 );
+  const gfloat twelve_abs_sum10 = NOHALO_ABS( twelve_sum10 );
+  const gfloat twelve_abs_sum01 = NOHALO_ABS( twelve_sum01 );
+  const gfloat twelve_abs_sum11 = NOHALO_ABS( twelve_sum11 );
+
+  /*
+   * Scaled distances to the min:
+   */
+  const gfloat u00_times_36 = (gfloat) 36.0 * u00;
+  const gfloat u10_times_36 = (gfloat) 36.0 * u10;
+  const gfloat u01_times_36 = (gfloat) 36.0 * u01;
+  const gfloat u11_times_36 = (gfloat) 36.0 * u11;
+
+  /*
+   * First cross-derivative limiter:
+   */
+  const gfloat first_limit00 = twelve_abs_sum00 - u00_times_36;
+  const gfloat first_limit10 = twelve_abs_sum10 - u10_times_36;
+  const gfloat first_limit01 = twelve_abs_sum01 - u01_times_36;
+  const gfloat first_limit11 = twelve_abs_sum11 - u11_times_36;
+
+  const gfloat quad_d2zdxdy00ii = NOHALO_MAX( quad_d2zdxdy00i, first_limit00 );
+  const gfloat quad_d2zdxdy10ii = NOHALO_MAX( quad_d2zdxdy10i, first_limit10 );
+  const gfloat quad_d2zdxdy01ii = NOHALO_MAX( quad_d2zdxdy01i, first_limit01 );
+  const gfloat quad_d2zdxdy11ii = NOHALO_MAX( quad_d2zdxdy11i, first_limit11 );
+
+  /*
+   * Scaled distances to the max:
+   */
+  const gfloat v00_times_36 = (gfloat) 36.0 * v00;
+  const gfloat v10_times_36 = (gfloat) 36.0 * v10;
+  const gfloat v01_times_36 = (gfloat) 36.0 * v01;
+  const gfloat v11_times_36 = (gfloat) 36.0 * v11;
+
+  /*
+   * Second cross-derivative limiter:
+   */
+  const gfloat second_limit00 = v00_times_36 - twelve_abs_sum00;
+  const gfloat second_limit10 = v10_times_36 - twelve_abs_sum10;
+  const gfloat second_limit01 = v01_times_36 - twelve_abs_sum01;
+  const gfloat second_limit11 = v11_times_36 - twelve_abs_sum11;
+
+  const gfloat quad_d2zdxdy00iii =
+    NOHALO_MIN( quad_d2zdxdy00ii, second_limit00 );
+  const gfloat quad_d2zdxdy10iii =
+    NOHALO_MIN( quad_d2zdxdy10ii, second_limit10 );
+  const gfloat quad_d2zdxdy01iii =
+    NOHALO_MIN( quad_d2zdxdy01ii, second_limit01 );
+  const gfloat quad_d2zdxdy11iii =
+    NOHALO_MIN( quad_d2zdxdy11ii, second_limit11 );
+
+  /*
+   * Absolute values of the differences:
+   */
+  const gfloat twelve_abs_dif00 = NOHALO_ABS( twelve_dif00 );
+  const gfloat twelve_abs_dif10 = NOHALO_ABS( twelve_dif10 );
+  const gfloat twelve_abs_dif01 = NOHALO_ABS( twelve_dif01 );
+  const gfloat twelve_abs_dif11 = NOHALO_ABS( twelve_dif11 );
+
+  /*
+   * Third cross-derivative limiter:
+   */
+  const gfloat third_limit00 = twelve_abs_dif00 - v00_times_36;
+  const gfloat third_limit10 = twelve_abs_dif10 - v10_times_36;
+  const gfloat third_limit01 = twelve_abs_dif01 - v01_times_36;
+  const gfloat third_limit11 = twelve_abs_dif11 - v11_times_36;
+
+  const gfloat quad_d2zdxdy00iiii =
+    NOHALO_MAX( quad_d2zdxdy00iii, third_limit00);
+  const gfloat quad_d2zdxdy10iiii =
+    NOHALO_MAX( quad_d2zdxdy10iii, third_limit10);
+  const gfloat quad_d2zdxdy01iiii =
+    NOHALO_MAX( quad_d2zdxdy01iii, third_limit01);
+  const gfloat quad_d2zdxdy11iiii =
+    NOHALO_MAX( quad_d2zdxdy11iii, third_limit11);
+
+  /*
+   * Fourth cross-derivative limiter:
+   */
+  const gfloat fourth_limit00 = u00_times_36 - twelve_abs_dif00;
+  const gfloat fourth_limit10 = u10_times_36 - twelve_abs_dif10;
+  const gfloat fourth_limit01 = u01_times_36 - twelve_abs_dif01;
+  const gfloat fourth_limit11 = u11_times_36 - twelve_abs_dif11;
+
+  const gfloat quad_d2zdxdy00 = NOHALO_MIN( quad_d2zdxdy00iiii, fourth_limit00);
+  const gfloat quad_d2zdxdy10 = NOHALO_MIN( quad_d2zdxdy10iiii, fourth_limit10);
+  const gfloat quad_d2zdxdy01 = NOHALO_MIN( quad_d2zdxdy01iiii, fourth_limit01);
+  const gfloat quad_d2zdxdy11 = NOHALO_MIN( quad_d2zdxdy11iiii, fourth_limit11);
+
+  /*
+   * Part of the result that does not need derivatives:
+   */
+  const gfloat newval1 = c00 * dos_two
+                         +
+                         c10 * dos_thr
+                         +
+                         c01 * tre_two
+                         +
+                         c11 * tre_thr;
+
+  /*
+   * Twice the part of the result that only needs first derivatives.
+   */
+  const gfloat newval2 = c00dx * dble_dzdx00
+                         +
+                         c10dx * dble_dzdx10
+                         +
+                         c01dx * dble_dzdx01
+                         +
+                         c11dx * dble_dzdx11
+                         +
+                         c00dy * dble_dzdy00
+                         +
+                         c10dy * dble_dzdy10
+                         +
+                         c01dy * dble_dzdy01
+                         +
+                         c11dy * dble_dzdy11;
+
+  /*
+   * Four times the part of the result that only uses
+   * cross-derivatives:
+   */
+  const gfloat newval3 = c00dxdy * quad_d2zdxdy00
+                         +
+                         c10dxdy * quad_d2zdxdy10
+                         +
+                         c01dxdy * quad_d2zdxdy01
+                         +
+                         c11dxdy * quad_d2zdxdy11;
+
+  const gfloat newval =
+    newval1 + (gfloat) 0.5 * ( newval2 + (gfloat) 0.5 * newval3 );
+
+  return newval;
+}
+
+static inline gfloat
+teepee (const gfloat c_major_x,
+        const gfloat c_major_y,
+        const gfloat c_minor_x,
+        const gfloat c_minor_y,
+        const gfloat s,
+        const gfloat t)
+{
+  const gfloat q1 = s * c_major_x + t * c_major_y;
+  const gfloat q2 = s * c_minor_x + t * c_minor_y;
+
+  const float r2 = q1 * q1 + q2 * q2;
+
+  const gfloat weight =
+    r2 < (float) 1.
+    ?
+    (gfloat) ( (float) 1. - sqrtf( r2 ) )
+    :
+    (gfloat) 0.;
+
+  return weight;
+}
+
+static inline void
+ewa_update (const gint              j,
+            const gint              i,
+            const gfloat            c_major_x,
+            const gfloat            c_major_y,
+            const gfloat            c_minor_x,
+            const gfloat            c_minor_y,
+            const gfloat            x_0,
+            const gfloat            y_0,
+            const gint              channels,
+            const gint              row_skip,
+            const gfloat*  restrict input_bptr,
+                  gdouble* restrict total_weight,
+                  gfloat*  restrict ewa_newval)
+{
+  const gint skip = j * channels + i * row_skip;
+
+  const gfloat weight = teepee (c_major_x,
+                                c_major_y,
+                                c_minor_x,
+                                c_minor_y,
+                                x_0 - (gfloat) j,
+                                y_0 - (gfloat) i);
+
+  *total_weight += weight;
+  ewa_newval[0] += weight * input_bptr[ skip     ];
+  ewa_newval[1] += weight * input_bptr[ skip + 1 ];
+  ewa_newval[2] += weight * input_bptr[ skip + 2 ];
+  ewa_newval[3] += weight * input_bptr[ skip + 3 ];
+}
+
+static inline void
+mipmap_ewa_update (const gint              level,
+                   const gint              j,
+                   const gint              i,
+                   const gfloat            c_major_x,
+                   const gfloat            c_major_y,
+                   const gfloat            c_minor_x,
+                   const gfloat            c_minor_y,
+                   const gfloat            x,
+                   const gfloat            y,
+                   const gint              channels,
+                   const gint              row_skip,
+                   const gfloat*  restrict input_bptr,
+                         gdouble* restrict total_weight,
+                         gfloat*  restrict ewa_newval)
+{
+  const gint skip = j * channels + i * row_skip;
+
+  /*
+   * The factor of "2^(level+1)" = "2 << level" is because level
+   * mipmap values are averages of that many level 0 pixel values, and
+   * the "1 << level" factor in the index is because the absolute
+   * positions are correspondingly "stretched".
+   */
+  const gfloat weight = (gfloat) ( 2 << level ) *
+                        teepee (c_major_x,
+                                c_major_y,
+                                c_minor_x,
+                                c_minor_y,
+                                x - (gfloat) ( (gint) ( 1 << level ) * j),
+                                y - (gfloat) ( (gint) ( 1 << level ) * i));
+
+  *total_weight += weight;
+  ewa_newval[0] += weight * input_bptr[ skip     ];
+  ewa_newval[1] += weight * input_bptr[ skip + 1 ];
+  ewa_newval[2] += weight * input_bptr[ skip + 2 ];
+  ewa_newval[3] += weight * input_bptr[ skip + 3 ];
+}
+
+static void
+gegl_sampler_nohalo_get (      GeglSampler*    restrict  self,
+                         const gdouble                   absolute_x,
+                         const gdouble                   absolute_y,
+                               GeglMatrix2              *scale,
+                               void*           restrict  output,
+                               GeglAbyssPolicy           repeat_mode)
+{
+  /*
+   * Needed constants related to the input pixel value pointer
+   * provided by gegl_sampler_get_ptr (self, ix, iy). pixels_per_row
+   * corresponds to fetch_rectangle.width in gegl_sampler_get_ptr.
+   */
+  const gint channels       = 4;
+  const gint pixels_per_row = GEGL_SAMPLER_MAXIMUM_WIDTH;
+  const gint row_skip       = channels * pixels_per_row;
+
+  /*
+   * The consequence of the following choice of anchor pixel location
+   * is that the sampling location is at most at a box distance of .5
+   * from the anchor pixel location. That is: This computes the index
+   * of the closest pixel center (one of the closest when there are
+   * ties) within the GIMP convention.
+   *
+   * The reason why floor gives the index of the closest pixel center
+   * (with ties resolved toward -infinity) is that absolute positions
+   * are corner-based, meaning that the absolute position of the
+   * center of the pixel indexed (0,0) is (.5,.5) instead of (0,0), as
+   * it would be if absolute positions were center-based.
+   */
+  const gint ix_0 = floor ((double) absolute_x);
+  const gint iy_0 = floor ((double) absolute_y);
+
+  /*
+   * This is the pointer we use to pull pixel from "base" mipmap level
+   * (level "0"), the one with scale=1.0.
+   */
+  const gfloat* restrict input_bptr =
+    (gfloat*) gegl_sampler_get_ptr (self, ix_0, iy_0, repeat_mode);
+
+  /*
+   * First, we convert from the absolute position in the coordinate
+   * system with origin at the top left corner of the pixel with index
+   * (0,0) (the "GIMP convention" a.k.a. "corner-based"), to the
+   * position in the coordinate system with origin at the center of
+   * the pixel with index (0,0) (the "index" convention
+   * a.k.a. "center-based").
+   */
+  const gdouble iabsolute_x = absolute_x - (gdouble) 0.5;
+  const gdouble iabsolute_y = absolute_y - (gdouble) 0.5;
+
+  /*
+   * (x_0,y_0) is the relative position of the sampling location
+   * w.r.t. the anchor pixel.
+   */
+  const gfloat x_0 = iabsolute_x - ix_0;
+  const gfloat y_0 = iabsolute_y - iy_0;
+
+  const gint sign_of_x_0 = 2 * ( x_0 >= (gfloat) 0. ) - 1;
+  const gint sign_of_y_0 = 2 * ( y_0 >= (gfloat) 0. ) - 1;
+
+  const gint shift_forw_1_pix = sign_of_x_0 * channels;
+  const gint shift_forw_1_row = sign_of_y_0 * row_skip;
+
+  const gint shift_back_1_pix = -shift_forw_1_pix;
+  const gint shift_back_1_row = -shift_forw_1_row;
+
+  const gint shift_back_2_pix = 2 * shift_back_1_pix;
+  const gint shift_back_2_row = 2 * shift_back_1_row;
+  const gint shift_forw_2_pix = 2 * shift_forw_1_pix;
+  const gint shift_forw_2_row = 2 * shift_forw_1_row;
+
+  const gint uno_two_shift = shift_back_1_pix + shift_back_2_row;
+  const gint uno_thr_shift =                    shift_back_2_row;
+  const gint uno_fou_shift = shift_forw_1_pix + shift_back_2_row;
+
+  const gint dos_one_shift = shift_back_2_pix + shift_back_1_row;
+  const gint dos_two_shift = shift_back_1_pix + shift_back_1_row;
+  const gint dos_thr_shift =                    shift_back_1_row;
+  const gint dos_fou_shift = shift_forw_1_pix + shift_back_1_row;
+  const gint dos_fiv_shift = shift_forw_2_pix + shift_back_1_row;
+
+  const gint tre_one_shift = shift_back_2_pix;
+  const gint tre_two_shift = shift_back_1_pix;
+  const gint tre_thr_shift = 0;
+  const gint tre_fou_shift = shift_forw_1_pix;
+  const gint tre_fiv_shift = shift_forw_2_pix;
+
+  const gint qua_one_shift = shift_back_2_pix + shift_forw_1_row;
+  const gint qua_two_shift = shift_back_1_pix + shift_forw_1_row;
+  const gint qua_thr_shift =                    shift_forw_1_row;
+  const gint qua_fou_shift = shift_forw_1_pix + shift_forw_1_row;
+  const gint qua_fiv_shift = shift_forw_2_pix + shift_forw_1_row;
+
+  const gint cin_two_shift = shift_back_1_pix + shift_forw_2_row;
+  const gint cin_thr_shift =                    shift_forw_2_row;
+  const gint cin_fou_shift = shift_forw_1_pix + shift_forw_2_row;
+
+  /*
+   * Channel by channel computation of the new pixel values:
+   */
+  gfloat uno_one_0, uno_two_0, uno_thr_0, uno_fou_0;
+  gfloat dos_one_0, dos_two_0, dos_thr_0, dos_fou_0;
+  gfloat tre_one_0, tre_two_0, tre_thr_0, tre_fou_0;
+  gfloat qua_one_0, qua_two_0, qua_thr_0, qua_fou_0;
+
+  gfloat uno_one_1, uno_two_1, uno_thr_1, uno_fou_1;
+  gfloat dos_one_1, dos_two_1, dos_thr_1, dos_fou_1;
+  gfloat tre_one_1, tre_two_1, tre_thr_1, tre_fou_1;
+  gfloat qua_one_1, qua_two_1, qua_thr_1, qua_fou_1;
+
+  gfloat uno_one_2, uno_two_2, uno_thr_2, uno_fou_2;
+  gfloat dos_one_2, dos_two_2, dos_thr_2, dos_fou_2;
+  gfloat tre_one_2, tre_two_2, tre_thr_2, tre_fou_2;
+  gfloat qua_one_2, qua_two_2, qua_thr_2, qua_fou_2;
+
+  gfloat uno_one_3, uno_two_3, uno_thr_3, uno_fou_3;
+  gfloat dos_one_3, dos_two_3, dos_thr_3, dos_fou_3;
+  gfloat tre_one_3, tre_two_3, tre_thr_3, tre_fou_3;
+  gfloat qua_one_3, qua_two_3, qua_thr_3, qua_fou_3;
+
+  /*
+   * The newval array will contain one computed resampled value per
+   * channel:
+   */
+  gfloat newval[channels];
+
+  /*
+   * First channel:
+   */
+  nohalo_subdivision (input_bptr[ uno_two_shift ],
+                      input_bptr[ uno_thr_shift ],
+                      input_bptr[ uno_fou_shift ],
+                      input_bptr[ dos_one_shift ],
+                      input_bptr[ dos_two_shift ],
+                      input_bptr[ dos_thr_shift ],
+                      input_bptr[ dos_fou_shift ],
+                      input_bptr[ dos_fiv_shift ],
+                      input_bptr[ tre_one_shift ],
+                      input_bptr[ tre_two_shift ],
+                      input_bptr[ tre_thr_shift ],
+                      input_bptr[ tre_fou_shift ],
+                      input_bptr[ tre_fiv_shift ],
+                      input_bptr[ qua_one_shift ],
+                      input_bptr[ qua_two_shift ],
+                      input_bptr[ qua_thr_shift ],
+                      input_bptr[ qua_fou_shift ],
+                      input_bptr[ qua_fiv_shift ],
+                      input_bptr[ cin_two_shift ],
+                      input_bptr[ cin_thr_shift ],
+                      input_bptr[ cin_fou_shift ],
+                      &uno_one_0,
+                      &uno_two_0,
+                      &uno_thr_0,
+                      &uno_fou_0,
+                      &dos_one_0,
+                      &dos_two_0,
+                      &dos_thr_0,
+                      &dos_fou_0,
+                      &tre_one_0,
+                      &tre_two_0,
+                      &tre_thr_0,
+                      &tre_fou_0,
+                      &qua_one_0,
+                      &qua_two_0,
+                      &qua_thr_0,
+                      &qua_fou_0);
+
+  {
+    /*
+     * Computation of the needed weights (coefficients).
+     */
+    const gfloat xp1over2   = ( 2 * sign_of_x_0 ) * x_0;
+    const gfloat xm1over2   = xp1over2 + (gfloat) (-1.0);
+    const gfloat onepx      = (gfloat) 0.5 + xp1over2;
+    const gfloat onemx      = (gfloat) 1.5 - xp1over2;
+    const gfloat xp1over2sq = xp1over2 * xp1over2;
+
+    const gfloat yp1over2   = ( 2 * sign_of_y_0 ) * y_0;
+    const gfloat ym1over2   = yp1over2 + (gfloat) (-1.0);
+    const gfloat onepy      = (gfloat) 0.5 + yp1over2;
+    const gfloat onemy      = (gfloat) 1.5 - yp1over2;
+    const gfloat yp1over2sq = yp1over2 * yp1over2;
+
+    const gfloat xm1over2sq = xm1over2 * xm1over2;
+    const gfloat ym1over2sq = ym1over2 * ym1over2;
+
+    const gfloat twice1px = onepx + onepx;
+    const gfloat twice1py = onepy + onepy;
+    const gfloat twice1mx = onemx + onemx;
+    const gfloat twice1my = onemy + onemy;
+
+    const gfloat xm1over2sq_times_ym1over2sq = xm1over2sq * ym1over2sq;
+    const gfloat xp1over2sq_times_ym1over2sq = xp1over2sq * ym1over2sq;
+    const gfloat xp1over2sq_times_yp1over2sq = xp1over2sq * yp1over2sq;
+    const gfloat xm1over2sq_times_yp1over2sq = xm1over2sq * yp1over2sq;
+
+    const gfloat four_times_1px_times_1py = twice1px * twice1py;
+    const gfloat four_times_1mx_times_1py = twice1mx * twice1py;
+    const gfloat twice_xp1over2_times_1py = xp1over2 * twice1py;
+    const gfloat twice_xm1over2_times_1py = xm1over2 * twice1py;
+
+    const gfloat twice_xm1over2_times_1my = xm1over2 * twice1my;
+    const gfloat twice_xp1over2_times_1my = xp1over2 * twice1my;
+    const gfloat four_times_1mx_times_1my = twice1mx * twice1my;
+    const gfloat four_times_1px_times_1my = twice1px * twice1my;
+
+    const gfloat twice_1px_times_ym1over2 = twice1px * ym1over2;
+    const gfloat twice_1mx_times_ym1over2 = twice1mx * ym1over2;
+    const gfloat xp1over2_times_ym1over2  = xp1over2 * ym1over2;
+    const gfloat xm1over2_times_ym1over2  = xm1over2 * ym1over2;
+
+    const gfloat xm1over2_times_yp1over2  = xm1over2 * yp1over2;
+    const gfloat xp1over2_times_yp1over2  = xp1over2 * yp1over2;
+    const gfloat twice_1mx_times_yp1over2 = twice1mx * yp1over2;
+    const gfloat twice_1px_times_yp1over2 = twice1px * yp1over2;
+
+    const gfloat c00     =
+      four_times_1px_times_1py * xm1over2sq_times_ym1over2sq;
+    const gfloat c00dx   =
+      twice_xp1over2_times_1py * xm1over2sq_times_ym1over2sq;
+    const gfloat c00dy   =
+      twice_1px_times_yp1over2 * xm1over2sq_times_ym1over2sq;
+    const gfloat c00dxdy =
+       xp1over2_times_yp1over2 * xm1over2sq_times_ym1over2sq;
+
+    const gfloat c10     =
+      four_times_1mx_times_1py * xp1over2sq_times_ym1over2sq;
+    const gfloat c10dx   =
+      twice_xm1over2_times_1py * xp1over2sq_times_ym1over2sq;
+    const gfloat c10dy   =
+      twice_1mx_times_yp1over2 * xp1over2sq_times_ym1over2sq;
+    const gfloat c10dxdy =
+       xm1over2_times_yp1over2 * xp1over2sq_times_ym1over2sq;
+
+    const gfloat c01     =
+      four_times_1px_times_1my * xm1over2sq_times_yp1over2sq;
+    const gfloat c01dx   =
+      twice_xp1over2_times_1my * xm1over2sq_times_yp1over2sq;
+    const gfloat c01dy   =
+      twice_1px_times_ym1over2 * xm1over2sq_times_yp1over2sq;
+    const gfloat c01dxdy =
+      xp1over2_times_ym1over2 * xm1over2sq_times_yp1over2sq;
+
+    const gfloat c11     =
+      four_times_1mx_times_1my * xp1over2sq_times_yp1over2sq;
+    const gfloat c11dx   =
+      twice_xm1over2_times_1my * xp1over2sq_times_yp1over2sq;
+    const gfloat c11dy   =
+      twice_1mx_times_ym1over2 * xp1over2sq_times_yp1over2sq;
+    const gfloat c11dxdy =
+      xm1over2_times_ym1over2 * xp1over2sq_times_yp1over2sq;
+
+    newval[0] = lbb (c00,
+                     c10,
+                     c01,
+                     c11,
+                     c00dx,
+                     c10dx,
+                     c01dx,
+                     c11dx,
+                     c00dy,
+                     c10dy,
+                     c01dy,
+                     c11dy,
+                     c00dxdy,
+                     c10dxdy,
+                     c01dxdy,
+                     c11dxdy,
+                     uno_one_0,
+                     uno_two_0,
+                     uno_thr_0,
+                     uno_fou_0,
+                     dos_one_0,
+                     dos_two_0,
+                     dos_thr_0,
+                     dos_fou_0,
+                     tre_one_0,
+                     tre_two_0,
+                     tre_thr_0,
+                     tre_fou_0,
+                     qua_one_0,
+                     qua_two_0,
+                     qua_thr_0,
+                     qua_fou_0);
+    /*
+     * Second channel:
+     */
+    nohalo_subdivision (input_bptr[ uno_two_shift + 1 ],
+                        input_bptr[ uno_thr_shift + 1 ],
+                        input_bptr[ uno_fou_shift + 1 ],
+                        input_bptr[ dos_one_shift + 1 ],
+                        input_bptr[ dos_two_shift + 1 ],
+                        input_bptr[ dos_thr_shift + 1 ],
+                        input_bptr[ dos_fou_shift + 1 ],
+                        input_bptr[ dos_fiv_shift + 1 ],
+                        input_bptr[ tre_one_shift + 1 ],
+                        input_bptr[ tre_two_shift + 1 ],
+                        input_bptr[ tre_thr_shift + 1 ],
+                        input_bptr[ tre_fou_shift + 1 ],
+                        input_bptr[ tre_fiv_shift + 1 ],
+                        input_bptr[ qua_one_shift + 1 ],
+                        input_bptr[ qua_two_shift + 1 ],
+                        input_bptr[ qua_thr_shift + 1 ],
+                        input_bptr[ qua_fou_shift + 1 ],
+                        input_bptr[ qua_fiv_shift + 1 ],
+                        input_bptr[ cin_two_shift + 1 ],
+                        input_bptr[ cin_thr_shift + 1 ],
+                        input_bptr[ cin_fou_shift + 1 ],
+                        &uno_one_1,
+                        &uno_two_1,
+                        &uno_thr_1,
+                        &uno_fou_1,
+                        &dos_one_1,
+                        &dos_two_1,
+                        &dos_thr_1,
+                        &dos_fou_1,
+                        &tre_one_1,
+                        &tre_two_1,
+                        &tre_thr_1,
+                        &tre_fou_1,
+                        &qua_one_1,
+                        &qua_two_1,
+                        &qua_thr_1,
+                        &qua_fou_1);
+    newval[1] = lbb (c00,
+                     c10,
+                     c01,
+                     c11,
+                     c00dx,
+                     c10dx,
+                     c01dx,
+                     c11dx,
+                     c00dy,
+                     c10dy,
+                     c01dy,
+                     c11dy,
+                     c00dxdy,
+                     c10dxdy,
+                     c01dxdy,
+                     c11dxdy,
+                     uno_one_1,
+                     uno_two_1,
+                     uno_thr_1,
+                     uno_fou_1,
+                     dos_one_1,
+                     dos_two_1,
+                     dos_thr_1,
+                     dos_fou_1,
+                     tre_one_1,
+                     tre_two_1,
+                     tre_thr_1,
+                     tre_fou_1,
+                     qua_one_1,
+                     qua_two_1,
+                     qua_thr_1,
+                     qua_fou_1);
+    /*
+     * Third channel:
+     */
+    nohalo_subdivision (input_bptr[ uno_two_shift + 2 ],
+                        input_bptr[ uno_thr_shift + 2 ],
+                        input_bptr[ uno_fou_shift + 2 ],
+                        input_bptr[ dos_one_shift + 2 ],
+                        input_bptr[ dos_two_shift + 2 ],
+                        input_bptr[ dos_thr_shift + 2 ],
+                        input_bptr[ dos_fou_shift + 2 ],
+                        input_bptr[ dos_fiv_shift + 2 ],
+                        input_bptr[ tre_one_shift + 2 ],
+                        input_bptr[ tre_two_shift + 2 ],
+                        input_bptr[ tre_thr_shift + 2 ],
+                        input_bptr[ tre_fou_shift + 2 ],
+                        input_bptr[ tre_fiv_shift + 2 ],
+                        input_bptr[ qua_one_shift + 2 ],
+                        input_bptr[ qua_two_shift + 2 ],
+                        input_bptr[ qua_thr_shift + 2 ],
+                        input_bptr[ qua_fou_shift + 2 ],
+                        input_bptr[ qua_fiv_shift + 2 ],
+                        input_bptr[ cin_two_shift + 2 ],
+                        input_bptr[ cin_thr_shift + 2 ],
+                        input_bptr[ cin_fou_shift + 2 ],
+                        &uno_one_2,
+                        &uno_two_2,
+                        &uno_thr_2,
+                        &uno_fou_2,
+                        &dos_one_2,
+                        &dos_two_2,
+                        &dos_thr_2,
+                        &dos_fou_2,
+                        &tre_one_2,
+                        &tre_two_2,
+                        &tre_thr_2,
+                        &tre_fou_2,
+                        &qua_one_2,
+                        &qua_two_2,
+                        &qua_thr_2,
+                        &qua_fou_2);
+    newval[2] = lbb (c00,
+                     c10,
+                     c01,
+                     c11,
+                     c00dx,
+                     c10dx,
+                     c01dx,
+                     c11dx,
+                     c00dy,
+                     c10dy,
+                     c01dy,
+                     c11dy,
+                     c00dxdy,
+                     c10dxdy,
+                     c01dxdy,
+                     c11dxdy,
+                     uno_one_2,
+                     uno_two_2,
+                     uno_thr_2,
+                     uno_fou_2,
+                     dos_one_2,
+                     dos_two_2,
+                     dos_thr_2,
+                     dos_fou_2,
+                     tre_one_2,
+                     tre_two_2,
+                     tre_thr_2,
+                     tre_fou_2,
+                     qua_one_2,
+                     qua_two_2,
+                     qua_thr_2,
+                     qua_fou_2);
+    /*
+     * Fourth channel:
+     */
+    nohalo_subdivision (input_bptr[ uno_two_shift + 3 ],
+                        input_bptr[ uno_thr_shift + 3 ],
+                        input_bptr[ uno_fou_shift + 3 ],
+                        input_bptr[ dos_one_shift + 3 ],
+                        input_bptr[ dos_two_shift + 3 ],
+                        input_bptr[ dos_thr_shift + 3 ],
+                        input_bptr[ dos_fou_shift + 3 ],
+                        input_bptr[ dos_fiv_shift + 3 ],
+                        input_bptr[ tre_one_shift + 3 ],
+                        input_bptr[ tre_two_shift + 3 ],
+                        input_bptr[ tre_thr_shift + 3 ],
+                        input_bptr[ tre_fou_shift + 3 ],
+                        input_bptr[ tre_fiv_shift + 3 ],
+                        input_bptr[ qua_one_shift + 3 ],
+                        input_bptr[ qua_two_shift + 3 ],
+                        input_bptr[ qua_thr_shift + 3 ],
+                        input_bptr[ qua_fou_shift + 3 ],
+                        input_bptr[ qua_fiv_shift + 3 ],
+                        input_bptr[ cin_two_shift + 3 ],
+                        input_bptr[ cin_thr_shift + 3 ],
+                        input_bptr[ cin_fou_shift + 3 ],
+                        &uno_one_3,
+                        &uno_two_3,
+                        &uno_thr_3,
+                        &uno_fou_3,
+                        &dos_one_3,
+                        &dos_two_3,
+                        &dos_thr_3,
+                        &dos_fou_3,
+                        &tre_one_3,
+                        &tre_two_3,
+                        &tre_thr_3,
+                        &tre_fou_3,
+                        &qua_one_3,
+                        &qua_two_3,
+                        &qua_thr_3,
+                        &qua_fou_3);
+    newval[3] = lbb (c00,
+                     c10,
+                     c01,
+                     c11,
+                     c00dx,
+                     c10dx,
+                     c01dx,
+                     c11dx,
+                     c00dy,
+                     c10dy,
+                     c01dy,
+                     c11dy,
+                     c00dxdy,
+                     c10dxdy,
+                     c01dxdy,
+                     c11dxdy,
+                     uno_one_3,
+                     uno_two_3,
+                     uno_thr_3,
+                     uno_fou_3,
+                     dos_one_3,
+                     dos_two_3,
+                     dos_thr_3,
+                     dos_fou_3,
+                     tre_one_3,
+                     tre_two_3,
+                     tre_thr_3,
+                     tre_fou_3,
+                     qua_one_3,
+                     qua_two_3,
+                     qua_thr_3,
+                     qua_fou_3);
+
+    {
+      /*
+       * Determine whether LBB-Nohalo needs to be blended with the
+       * downsampling method (Clamped EWA with the tent filter).
+       *
+       * This is done by taking the 2x2 matrix Jinv (the exact or
+       * approximate inverse Jacobian of the transformation at the
+       * location under consideration:
+       *
+       * Jinv = [ a b ] = [ dx/dX dx/dY ]
+       *        [ c d ] = [ dy/dX dy/dY ]
+       *
+       * and computes from it the major and minor axis vectors
+       * [major_x, major_y] and [minor_x,minor_y] of the smallest
+       * ellipse containing both the unit disk and the ellipse which
+       * is the image of the unit disk by the linear transformation
+       *
+       * [ a b ] [S] = [s]
+       * [ c d ] [T] = [t]
+       *
+       * The vector [S,T] is the difference between a position in
+       * output space and [X,Y], the output location under
+       * consideration; the vector [s,t] is the difference between a
+       * position in input space and [x,y], the corresponding input
+       * location.
+       *
+       */
+      /*
+       * GOAL:
+       * Fix things so that the pullback, in input space, of a disk of
+       * radius r in output space is an ellipse which contains, at
+       * least, a disc of radius r. (Make this hold for any r>0.)
+       *
+       * ESSENCE OF THE METHOD:
+       * Compute the product of the first two factors of an SVD of the
+       * linear transformation defining the ellipse and make sure that
+       * both its columns have norm at least 1.  Because rotations and
+       * reflexions map disks to themselves, it is not necessary to
+       * compute the third (rightmost) factor of the SVD.
+       *
+       * DETAILS:
+       * Find the singular values and (unit) left singular vectors of
+       * Jinv, clamping up the singular values to 1, and multiply the
+       * unit left singular vectors by the new singular values in
+       * order to get the minor and major ellipse axis vectors.
+       *
+       * Image resampling context:
+       *
+       * The Jacobian matrix of the transformation at the output point
+       * under consideration is defined as follows:
+       *
+       * Consider the transformation (x,y) -> (X,Y) from input
+       * locations to output locations.
+       *
+       * The Jacobian matrix of the transformation at (x,y) is equal
+       * to
+       *
+       *   J = [ A, B ] = [ dX/dx, dX/dy ]
+       *       [ C, D ]   [ dY/dx, dY/dy ]
+       *
+       * that is, the vector [A,C] is the tangent vector corresponding
+       * to input changes in the horizontal direction, and the vector
+       * [B,D] is the tangent vector corresponding to input changes in
+       * the vertical direction.
+       *
+       * In the context of resampling, it is natural to use the
+       * inverse Jacobian matrix Jinv because resampling is generally
+       * performed by pulling pixel locations in the output image back
+       * to locations in the input image. Jinv is
+       *
+       *   Jinv = [ a, b ] = [ dx/dX, dx/dY ]
+       *          [ c, d ]   [ dy/dX, dy/dY ]
+       *
+       * Note: Jinv can be computed from J with the following matrix
+       * formula:
+       *
+       *   Jinv = 1/(A*D-B*C) [  D, -B ]
+       *                      [ -C,  A ]
+       *
+       * What we do is modify Jinv so that it generates an ellipse
+       * which is as close as possible to the original but which
+       * contains the unit disk. This can be accomplished as follows:
+       *
+       * Let
+       *
+       *   Jinv = U Sigma V^T
+       *
+       * be an SVD decomposition of Jinv. (The SVD is not unique, but
+       * the final ellipse does not depend on the particular SVD.)
+       *
+       * We could clamp up the entries of the diagonal matrix Sigma so
+       * that they are at least 1, and then set
+       *
+       *   Jinv = U newSigma V^T.
+       *
+       * However, we do not need to compute V for the following
+       * reason: V^T is an orthogonal matrix (that is, it represents a
+       * combination of rotations and reflexions) so that it maps the
+       * unit circle to itself. For this reason, the exact value of V
+       * does not affect the final ellipse, and we can choose V to be
+       * the identity matrix. This gives
+       *
+       *   Jinv = U newSigma.
+       *
+       * In the end, we return the two diagonal entries of newSigma
+       * together with the two columns of U.
+       *
+       */
+      /*
+       * We compute:
+       *
+       * major_mag: half-length of the major axis of the "new"
+       *            (post-clamping) ellipse.
+       *
+       * minor_mag: half-length of the minor axis of the "new"
+       *            ellipse.
+       *
+       * major_unit_x: x-coordinate of the major axis direction vector
+       *               of both the "old" and "new" ellipses.
+       *
+       * major_unit_y: y-coordinate of the major axis direction
+       *               vector.
+       *
+       * minor_unit_x: x-coordinate of the minor axis direction
+       *               vector.
+       *
+       * minor_unit_y: y-coordinate of the minor axis direction
+       *               vector.
+       *
+       * Unit vectors are useful for computing projections, in
+       * particular, to compute the distance between a point in output
+       * space and the center of a unit disk in output space, using
+       * the position of the corresponding point [s,t] in input space.
+       * Following the clamping, the square of this distance is
+       *
+       * ( ( s * major_unit_x + t * major_unit_y ) / major_mag )^2
+       * +
+       * ( ( s * minor_unit_x + t * minor_unit_y ) / minor_mag )^2
+       *
+       * If such distances will be computed for many [s,t]'s, it makes
+       * sense to actually compute the reciprocal of major_mag and
+       * minor_mag and multiply them by the above unit lengths.
+       */
+      /*
+       * History:
+       *
+       * ClampUpAxes, the ImageMagick function (found in resample.c)
+       * on which this is based, was written by Nicolas Robidoux and
+       * Chantal Racette of Laurentian University with insightful
+       * suggestions from Anthony Thyssen and funding from the
+       * National Science and Engineering Research Council of
+       * Canada. It is distinguished from its predecessors by its
+       * efficient handling of degenerate cases.
+       *
+       * The idea of clamping up the EWA ellipse's major and minor
+       * axes so that the result contains the reconstruction kernel
+       * filter support is taken from Andreas Gustaffson's Masters
+       * thesis "Interactive Image Warping", Helsinki University of
+       * Technology, Faculty of Information Technology, 59 pages, 1993
+       * (see Section 3.6).
+       *
+       * The use of the SVD to clamp up the singular values of the
+       * Jacobian matrix of the pullback transformation for EWA
+       * resampling is taken from the astrophysicist Craig DeForest.
+       * It is implemented in his PDL::Transform code (PDL = Perl Data
+       * Language).
+       *
+       * SVD reference:
+       * "We Recommend Singular Value Decomposition" by David Austin
+       * http://www.ams.org/samplings/feature-column/fcarc-svd
+       *
+       * Ellipse reference:
+       * http://en.wikipedia.org/wiki/Ellipse#Canonical_form
+       */
+      const gdouble a = scale?scale->coeff[0][0]:1;
+      const gdouble b = scale?scale->coeff[0][1]:0;
+      const gdouble c = scale?scale->coeff[1][0]:0;
+      const gdouble d = scale?scale->coeff[1][1]:1;
+
+      /*
+       * Computations are done in double precision because "direct"
+       * SVD computations are prone to round off error. (Computing in
+       * single precision most likely would be fine.)
+       */
+      /*
+       * n is the matrix Jinv * transpose(Jinv). Eigenvalues of n are
+       * the squares of the singular values of Jinv.
+       */
+      const gdouble aa = a * a;
+      const gdouble bb = b * b;
+      const gdouble cc = c * c;
+      const gdouble dd = d * d;
+      /*
+       * Eigenvectors of n are left singular vectors of Jinv.
+       */
+      const gdouble n11 = aa + bb;
+      const gdouble n12 = a * c + b * d;
+      const gdouble n21 = n12;
+      const gdouble n22 = cc + dd;
+      const double det = a * d - b * c;
+      const double twice_det = det + det;
+      const double frobenius_squared = n11 + n22;
+      const double discriminant =
+        ( frobenius_squared + twice_det ) * ( frobenius_squared - twice_det );
+      /*
+       * In exact arithmetic, the discriminant cannot be negative. In
+       * floating point, it can, leading a non-deterministic bug in
+       * ImageMagick (now fixed, thanks to Cristy, the lead dev).
+       */
+      const double sqrt_discriminant =
+        sqrt (discriminant > 0. ? discriminant : 0.);
+
+      /*
+       * Initially, we only compute the squares of the singular
+       * values.
+       */
+      /*
+       * s1 is the largest singular value of the inverse Jacobian
+       * matrix. In other words, its reciprocal is the smallest
+       * singular value of the Jacobian matrix itself.  If s1 = 0,
+       * both singular values are 0, and any orthogonal pair of left
+       * and right factors produces a singular decomposition of Jinv.
+       */
+      const gdouble twice_s1s1 = frobenius_squared + sqrt_discriminant;
+      /*
+       * If s1 <= 1, the forward transformation is not downsampling in
+       * any direction, and consequently we do not need the
+       * downsampling scheme at all.
+       */
+
+      if (twice_s1s1 > (gdouble) 2.)
+        {
+          /*
+           * The result (most likely) has a nonzero teepee component.
+           */
+          const gdouble s1s1 = (gdouble) 0.5 * twice_s1s1;
+          /*
+           * s2 the smallest singular value of the inverse Jacobian
+           * matrix. Its reciprocal is the largest singular value of
+           * the Jacobian matrix itself.
+           */
+          const gdouble s2s2 = 0.5 * ( frobenius_squared - sqrt_discriminant );
+
+          const gdouble s1s1minusn11 = s1s1 - n11;
+          const gdouble s1s1minusn22 = s1s1 - n22;
+          /*
+           * u1, the first column of the U factor of a singular
+           * decomposition of Jinv, is a (non-normalized) left
+           * singular vector corresponding to s1. It has entries u11
+           * and u21. We compute u1 from the fact that it is an
+           * eigenvector of n corresponding to the eigenvalue s1^2.
+           */
+          const gdouble s1s1minusn11_squared = s1s1minusn11 * s1s1minusn11;
+          const gdouble s1s1minusn22_squared = s1s1minusn22 * s1s1minusn22;
+          /*
+           * The following selects the largest row of n-s1^2 I ("I"
+           * being the 2x2 identity matrix) as the one which is used
+           * to find the eigenvector. If both s1^2-n11 and s1^2-n22
+           * are zero, n-s1^2 I is the zero matrix.  In that case, any
+           * vector is an eigenvector; in addition, norm below is
+           * equal to zero, and, in exact arithmetic, this is the only
+           * case in which norm = 0. So, setting u1 to the simple but
+           * arbitrary vector [1,0] if norm = 0 safely takes care of
+           * all cases.
+           */
+          const gdouble temp_u11 =
+            s1s1minusn11_squared >= s1s1minusn22_squared
+            ?
+            n12
+            :
+            s1s1minusn22;
+          const gdouble temp_u21 =
+            s1s1minusn11_squared >= s1s1minusn22_squared
+            ?
+            s1s1minusn11
+            :
+            n21;
+          const gdouble norm =
+            sqrt( temp_u11 * temp_u11 + temp_u21 * temp_u21 );
+          /*
+           * Finalize the entries of first left singular vector
+           * (associated with the largest singular value).
+           */
+          const gdouble u11 =
+            norm > (gdouble) 0.0 ? temp_u11 / norm : (gdouble) 1.0;
+          const gdouble u21 =
+            norm > (gdouble) 0.0 ? temp_u21 / norm : (gdouble) 0.0;
+          /*
+           * Clamp the singular values up to 1:
+           */
+          const gdouble major_mag =
+            s1s1 <= (gdouble) 1.0 ? (gdouble) 1.0 : sqrt( s1s1 );
+          const gdouble minor_mag =
+            s2s2 <= (gdouble) 1.0 ? (gdouble) 1.0 : sqrt( s2s2 );
+          /*
+           * Unit major and minor axis direction vectors:
+           */
+          const gdouble major_unit_x =  u11;
+          const gdouble major_unit_y =  u21;
+          const gdouble minor_unit_x = -u21;
+          const gdouble minor_unit_y =  u11;
+
+          /*
+           * The square of the distance to the key location in output
+           * place of a point [s,t] in input space is the square root of
+           *
+           * ( s * c_major_x + t * c_major_y )^2
+           * +
+           * ( s * c_minor_x + t * c_minor_y )^2.
+           */
+          const gfloat c_major_x = major_unit_x / major_mag;
+          const gfloat c_major_y = major_unit_y / major_mag;
+          const gfloat c_minor_x = minor_unit_x / minor_mag;
+          const gfloat c_minor_y = minor_unit_y / minor_mag;
+
+          /*
+           * Remainder of the ellipse geometry computation:
+           */
+          /*
+           * Major and minor axis direction vectors:
+           */
+          const gdouble major_x = major_mag * major_unit_x;
+          const gdouble major_y = major_mag * major_unit_y;
+          const gdouble minor_x = minor_mag * minor_unit_x;
+          const gdouble minor_y = minor_mag * minor_unit_y;
+
+          /*
+           * Ellipse coefficients:
+           */
+          const gdouble ellipse_a =
+            major_y * major_y + minor_y * minor_y;
+          const gdouble folded_ellipse_b =
+            major_x * major_y + minor_x * minor_y;
+          const gdouble ellipse_c =
+            major_x * major_x + minor_x * minor_x;
+          const gdouble ellipse_f = major_mag * minor_mag;
+
+          /*
+           * Bounding box of the ellipse:
+           */
+          const gdouble bounding_box_factor =
+            ellipse_f * ellipse_f /
+            ( ellipse_c * ellipse_a - folded_ellipse_b * folded_ellipse_b );
+          const gfloat bounding_box_half_width =
+            sqrtf( (gfloat) (ellipse_c * bounding_box_factor) );
+          const gfloat bounding_box_half_height =
+            sqrtf( (gfloat) (ellipse_a * bounding_box_factor) );
+
+          /*
+           * Relative weight of the contribution of LBB-Nohalo:
+           */
+          const gfloat theta = (gfloat) ( (gdouble) 1. / ellipse_f );
+
+          /*
+           * Grab the pixel values located within the level 0
+           * context_rect.  Farther ones will be accessed through
+           * higher mipmap levels.
+           */
+          const gint out_left_0 =
+            NOHALO_MAX
+            (
+              (gint) ceilf  ( (double) ( x_0 - bounding_box_half_width  ) )
+              ,
+              -NOHALO_OFFSET_0
+            );
+          const gint out_rite_0 =
+            NOHALO_MIN
+            (
+              (gint) floorf ( (double) ( x_0 + bounding_box_half_width  ) )
+              ,
+              NOHALO_OFFSET_0
+            );
+          const gint out_top_0 =
+            NOHALO_MAX
+            (
+              (gint) ceilf  ( (double) ( y_0 - bounding_box_half_height ) )
+              ,
+              -NOHALO_OFFSET_0
+            );
+          const gint out_bot_0 =
+            NOHALO_MIN
+            (
+              (gint) floorf ( (double) ( y_0 + bounding_box_half_height ) )
+              ,
+              NOHALO_OFFSET_0
+            );
+
+          /*
+           * Accumulator for the EWA weights:
+           */
+          gdouble total_weight = (gdouble) 0.0;
+          /*
+           * Storage for the EWA contribution:
+           */
+          gfloat ewa_newval[channels];
+          ewa_newval[0] = (gfloat) 0;
+          ewa_newval[1] = (gfloat) 0;
+          ewa_newval[2] = (gfloat) 0;
+          ewa_newval[3] = (gfloat) 0;
+
+          {
+            gint i = out_top_0;
+            do {
+              gint j = out_left_0;
+              do {
+                ewa_update (j,
+                            i,
+                            c_major_x,
+                            c_major_y,
+                            c_minor_x,
+                            c_minor_y,
+                            x_0,
+                            y_0,
+                            channels,
+                            row_skip,
+                            input_bptr,
+                            &total_weight,
+                            ewa_newval);
+              } while ( ++j <= out_rite_0 );
+            } while ( ++i <= out_bot_0 );
+          }
+
+          {
+            /*
+             * In order to know whether we use higher mipmap level
+             * values, we need to check whether there is a level 1
+             * mipmap location within the ellipse. So, we need to
+             * determine the alignment of the level 1 mipmap level
+             * w.r.t. the current level 0.
+             *
+             * At level 0, we can access pixels which are at most
+             * NOHALO_OFFSET_0 away from the anchor pixel location in
+             * box distance.
+             */
+            /*
+             * Determine whether the anchor level_0 pixel locations
+             * are odd (VS even):
+             */
+            const gint odd_ix_0 = ix_0 % 2;
+            const gint odd_iy_0 = iy_0 % 2;
+            /*
+             * Find the closest locations, on all four sides, of level 1
+             * pixels which involve data not found in the level 0
+             * NOHALO_SIZE_0xNOHALO_SIZE_0.
+             */
+            NOHALO_FIND_CLOSEST_LOCATIONS(0,1)
+
+            if (( x_0 - bounding_box_half_width  < closest_left_1 ) ||
+                ( x_0 + bounding_box_half_width  > closest_rite_1 ) ||
+                ( y_0 - bounding_box_half_height < closest_top_1  ) ||
+                ( y_0 + bounding_box_half_height > closest_bot_1  ))
+              {
+                /*
+                 * We most likely need higher mipmap level(s) because
+                 * the bounding box of the ellipse covers mipmap pixel
+                 * locations which involve data not "covered" by the
+                 * level 0 context_rect. (The ellipse may still fail
+                 * to involve mipmap level 1 values--in which case all
+                 * mipmap pixel values will get 0 coefficients--but we
+                 * used a quick and dirty bounding box test which lets
+                 * through false positives.)
+                 */
+                /*
+                 * Nearest mipmap anchor pixel location:
+                 */
+                const gint ix_1 = NOHALO_FLOORED_DIVISION_BY_2(ix_0);
+                const gint iy_1 = NOHALO_FLOORED_DIVISION_BY_2(iy_0);
+                /*
+                 * Get pointer to mipmap level 1 data:
+                 */
+                const gfloat* restrict input_bptr_1 =
+                  (gfloat*) gegl_sampler_get_from_mipmap (self,
+                                                          ix_1,
+                                                          iy_1,
+                                                          (gint) 1,
+                                                          repeat_mode);
+                /*
+                 * Position of the sampling location in the coordinate
+                 * system defined by the mipmap "pixel locations"
+                 * relative to the level 1 anchor pixel location. The
+                 * "-1/2"s are because the center of a level 0 pixel
+                 * is at a box distance of 1/2 from the center of the
+                 * closest level 1 pixel.
+                 */
+                const gfloat x_1 =
+                  x_0 + (gfloat) ( ix_0 - 2 * ix_1 ) - (gfloat) 0.5;
+                const gfloat y_1 =
+                  y_0 + (gfloat) ( iy_0 - 2 * iy_1 ) - (gfloat) 0.5;
+                /*
+                 * Key index ranges:
+                 */
+                /*
+                 * The "in" indices are the closest relative mipmap 1
+                 * indices of needed mipmap values:
+                 */
+                NOHALO_FIND_CLOSEST_INDICES(0,1)
+                /*
+                 * The "out" indices are the farthest relative mipmap 1
+                 * indices we use at this level:
+                 */
+                NOHALO_FIND_FARTHEST_INDICES(1)
+                /*
+                 * Update using mipmap level 1 values.
+                 */
+                NOHALO_MIPMAP_EWA_UPDATE(1)
+
+                {
+                /*
+                 * Second mipmap level.
+                 */
+                const gint odd_ix_1 = ix_1 % 2;
+                const gint odd_iy_1 = iy_1 % 2;
+                NOHALO_FIND_CLOSEST_LOCATIONS(1,2)
+                if (( x_1 - bounding_box_half_width  < closest_left_2 ) ||
+                    ( x_1 + bounding_box_half_width  > closest_rite_2 ) ||
+                    ( y_1 - bounding_box_half_height < closest_top_2  ) ||
+                    ( y_1 + bounding_box_half_height > closest_bot_2  ))
+                  {
+                  const gint ix_2 = NOHALO_FLOORED_DIVISION_BY_2(ix_1);
+                  const gint iy_2 = NOHALO_FLOORED_DIVISION_BY_2(iy_1);
+                  const gfloat* restrict input_bptr_2 =
+                    (gfloat*) gegl_sampler_get_from_mipmap (self,
+                                                            ix_2,
+                                                            iy_2,
+                                                            (gint) 2,
+                                                            repeat_mode);
+                  const gfloat x_2 =
+                    x_1 + (gfloat) ( 2 * ( ix_1 - 2 * ix_2 ) - 1 );
+                  const gfloat y_2 =
+                    y_1 + (gfloat) ( 2 * ( iy_1 - 2 * iy_2 ) - 1 );
+                  NOHALO_FIND_CLOSEST_INDICES(1,2)
+                  NOHALO_FIND_FARTHEST_INDICES(2)
+                  NOHALO_MIPMAP_EWA_UPDATE(2)
+
+                  {
+                  /*
+                   * Third mipmap level.
+                   */
+                  const gint odd_ix_2 = ix_2 % 2;
+                  const gint odd_iy_2 = iy_2 % 2;
+                  NOHALO_FIND_CLOSEST_LOCATIONS(2,3)
+                  if (( x_2 - bounding_box_half_width  < closest_left_3 ) ||
+                      ( x_2 + bounding_box_half_width  > closest_rite_3 ) ||
+                      ( y_2 - bounding_box_half_height < closest_top_3  ) ||
+                      ( y_2 + bounding_box_half_height > closest_bot_3  ))
+                    {
+                    const gint ix_3 = NOHALO_FLOORED_DIVISION_BY_2(ix_2);
+                    const gint iy_3 = NOHALO_FLOORED_DIVISION_BY_2(iy_2);
+                    const gfloat* restrict input_bptr_3 =
+                      (gfloat*) gegl_sampler_get_from_mipmap (self,
+                                                              ix_3,
+                                                              iy_3,
+                                                              (gint) 3,
+                                                              repeat_mode);
+                    const gfloat x_3 =
+                      x_2 + (gfloat) ( 2 * ( ix_2 - 2 * ix_3 ) - 1 );
+                    const gfloat y_3 =
+                      y_2 + (gfloat) ( 2 * ( iy_2 - 2 * iy_3 ) - 1 );
+                    NOHALO_FIND_CLOSEST_INDICES(2,3)
+                    NOHALO_FIND_FARTHEST_INDICES(3)
+                    NOHALO_MIPMAP_EWA_UPDATE(3)
+
+                    {
+                    /*
+                     * Fourth mipmap level.
+                     */
+                    const gint odd_ix_3 = ix_3 % 2;
+                    const gint odd_iy_3 = iy_3 % 2;
+                    NOHALO_FIND_CLOSEST_LOCATIONS(3,4)
+                    if (( x_3 - bounding_box_half_width  < closest_left_4 ) ||
+                        ( x_3 + bounding_box_half_width  > closest_rite_4 ) ||
+                        ( y_3 - bounding_box_half_height < closest_top_4  ) ||
+                        ( y_3 + bounding_box_half_height > closest_bot_4  ))
+                      {
+                      const gint ix_4 = NOHALO_FLOORED_DIVISION_BY_2(ix_3);
+                      const gint iy_4 = NOHALO_FLOORED_DIVISION_BY_2(iy_3);
+                      const gfloat* restrict input_bptr_4 =
+                        (gfloat*) gegl_sampler_get_from_mipmap (self,
+                                                                ix_4,
+                                                                iy_4,
+                                                                (gint) 4,
+                                                                repeat_mode);
+                      const gfloat x_4 =
+                        x_3 + (gfloat) ( 2 * ( ix_3 - 2 * ix_4 ) - 1 );
+                      const gfloat y_4 =
+                        y_3 + (gfloat) ( 2 * ( iy_3 - 2 * iy_4 ) - 1 );
+                      NOHALO_FIND_CLOSEST_INDICES(3,4)
+                      NOHALO_FIND_FARTHEST_INDICES(4)
+                      NOHALO_MIPMAP_EWA_UPDATE(4)
+
+                      {
+                      /*
+                       * Fifth mipmap level.
+                       */
+                      const gint odd_ix_4 = ix_4 % 2;
+                      const gint odd_iy_4 = iy_4 % 2;
+                      NOHALO_FIND_CLOSEST_LOCATIONS(4,5)
+                      if (( x_4 - bounding_box_half_width  < closest_left_5 ) ||
+                          ( x_4 + bounding_box_half_width  > closest_rite_5 ) ||
+                          ( y_4 - bounding_box_half_height < closest_top_5  ) ||
+                          ( y_4 + bounding_box_half_height > closest_bot_5  ))
+                        {
+                        const gint ix_5 = NOHALO_FLOORED_DIVISION_BY_2(ix_4);
+                        const gint iy_5 = NOHALO_FLOORED_DIVISION_BY_2(iy_4);
+                        const gfloat* restrict input_bptr_5 =
+                          (gfloat*) gegl_sampler_get_from_mipmap (self,
+                                                                  ix_5,
+                                                                  iy_5,
+                                                                  (gint) 5,
+                                                                  repeat_mode);
+                        const gfloat x_5 =
+                          x_4 + (gfloat) ( 2 * ( ix_4 - 2 * ix_5 ) - 1 );
+                        const gfloat y_5 =
+                          y_4 + (gfloat) ( 2 * ( iy_4 - 2 * iy_5 ) - 1 );
+                        NOHALO_FIND_CLOSEST_INDICES(4,5)
+                        NOHALO_FIND_FARTHEST_INDICES(5)
+                        NOHALO_MIPMAP_EWA_UPDATE(5)
+
+                        {
+                        /*
+                         * Sixth mipmap level.
+                         */
+                        const gint odd_ix_5 = ix_5 % 2;
+                        const gint odd_iy_5 = iy_5 % 2;
+                        NOHALO_FIND_CLOSEST_LOCATIONS(5,6)
+                        if (( x_5 - bounding_box_half_width
+                              < closest_left_6 ) ||
+                            ( x_5 + bounding_box_half_width
+                              > closest_rite_6 ) ||
+                            ( y_5 - bounding_box_half_height
+                              < closest_top_6  ) ||
+                            ( y_5 + bounding_box_half_height
+                              > closest_bot_6  ))
+                          {
+                          const gint ix_6 = NOHALO_FLOORED_DIVISION_BY_2(ix_5);
+                          const gint iy_6 = NOHALO_FLOORED_DIVISION_BY_2(iy_5);
+                          const gfloat* restrict input_bptr_6 = (gfloat*)
+                            gegl_sampler_get_from_mipmap (self,
+                                                          ix_6,
+                                                          iy_6,
+                                                          (gint) 6,
+                                                          repeat_mode);
+                          const gfloat x_6 =
+                            x_5 + (gfloat) ( 2 * ( ix_5 - 2 * ix_6 ) - 1 );
+                          const gfloat y_6 =
+                            y_5 + (gfloat) ( 2 * ( iy_5 - 2 * iy_6 ) - 1 );
+                          NOHALO_FIND_CLOSEST_INDICES(5,6)
+                          NOHALO_FIND_FARTHEST_INDICES(6)
+                          NOHALO_MIPMAP_EWA_UPDATE(6)
+
+                          {
+                          /*
+                           * Seventh mipmap level (eight if counted
+                           * from zero = "straight up").
+                           */
+                          const gint odd_ix_6 = ix_6 % 2;
+                          const gint odd_iy_6 = iy_6 % 2;
+                          NOHALO_FIND_CLOSEST_LOCATIONS(6,7)
+                          if (( x_6 - bounding_box_half_width
+                                < closest_left_7 ) ||
+                              ( x_6 + bounding_box_half_width
+                                > closest_rite_7 ) ||
+                              ( y_6 - bounding_box_half_height
+                                < closest_top_7  ) ||
+                              ( y_6 + bounding_box_half_height
+                                > closest_bot_7  ))
+                            {
+                            const gint ix_7 =
+                              NOHALO_FLOORED_DIVISION_BY_2(ix_6);
+                            const gint iy_7 =
+                              NOHALO_FLOORED_DIVISION_BY_2(iy_6);
+                            const gfloat* restrict input_bptr_7 = (gfloat*)
+                              gegl_sampler_get_from_mipmap (self,
+                                                            ix_7,
+                                                            iy_7,
+                                                            (gint) 7,
+                                                            repeat_mode);
+                            const gfloat x_7 =
+                              x_6 + (gfloat) ( 2 * ( ix_6 - 2 * ix_7 ) - 1 );
+                            const gfloat y_7 =
+                              y_6 + (gfloat) ( 2 * ( iy_6 - 2 * iy_7 ) - 1 );
+                            NOHALO_FIND_CLOSEST_INDICES(6,7)
+                            NOHALO_FIND_FARTHEST_INDICES(7)
+                            NOHALO_MIPMAP_EWA_UPDATE(7)
+                            }
+                          }
+                          }
+                        }
+                        }
+                      }
+                      }
+                    }
+                    }
+                  }
+                  }
+                }
+              }
+
+            {
+              /*
+               * Blend the LBB-Nohalo and EWA results:
+               */
+              const gfloat beta =
+                (gfloat) ( ( (gdouble) 1.0 - theta ) / total_weight );
+              newval[0] = theta * newval[0] + beta * ewa_newval[0];
+              newval[1] = theta * newval[1] + beta * ewa_newval[1];
+              newval[2] = theta * newval[2] + beta * ewa_newval[2];
+              newval[3] = theta * newval[3] + beta * ewa_newval[3];
+            }
+          }
+        }
+
+      /*
+       * Ship out the result:
+       */
+      babl_process (self->fish, newval, output, 1);
+      return;
+    }
+  }
+}
diff --git a/gegl/buffer/gegl-sampler-nohalo.h b/gegl/buffer/gegl-sampler-nohalo.h
new file mode 100644
index 0000000..3b24172
--- /dev/null
+++ b/gegl/buffer/gegl-sampler-nohalo.h
@@ -0,0 +1,49 @@
+/* This file is part of GEGL
+ *
+ * GEGL is free software; you can redistribute it and/or modify it
+ * under the terms of the GNU Lesser General Public License as
+ * published by the Free Software Foundation; either version 3 of the
+ * License, or (at your option) any later version.
+ *
+ * GEGL is distributed in the hope that it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
+ * or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General
+ * Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with GEGL; if not, see
+ * <http://www.gnu.org/licenses/>.
+ *
+ */
+#ifndef __GEGL_SAMPLER_NOHALO_H__
+#define __GEGL_SAMPLER_NOHALO_H__
+
+#include "gegl-sampler.h"
+
+G_BEGIN_DECLS
+
+#define GEGL_TYPE_SAMPLER_NOHALO            (gegl_sampler_nohalo_get_type ())
+#define GEGL_SAMPLER_NOHALO(obj)            (G_TYPE_CHECK_INSTANCE_CAST ((obj), GEGL_TYPE_SAMPLER_NOHALO, GeglSamplerNohalo))
+#define GEGL_SAMPLER_NOHALO_CLASS(klass)    (G_TYPE_CHECK_CLASS_CAST ((klass),  GEGL_TYPE_SAMPLER_NOHALO, GeglSamplerNohaloClass))
+#define GEGL_IS_SAMPLER_NOHALO(obj)         (G_TYPE_CHECK_INSTANCE_TYPE ((obj), GEGL_TYPE_SAMPLER_NOHALO))
+#define GEGL_IS_SAMPLER_NOHALO_CLASS(klass) (G_TYPE_CHECK_CLASS_TYPE ((klass),  GEGL_TYPE_SAMPLER_NOHALO))
+#define GEGL_SAMPLER_NOHALO_GET_CLASS(obj)  (G_TYPE_INSTANCE_GET_CLASS ((obj),  GEGL_TYPE_SAMPLER_NOHALO, GeglSamplerNohaloClass))
+
+typedef struct _GeglSamplerNohalo      GeglSamplerNohalo;
+typedef struct _GeglSamplerNohaloClass GeglSamplerNohaloClass;
+
+struct _GeglSamplerNohalo
+{
+  GeglSampler parent_instance;
+};
+
+struct _GeglSamplerNohaloClass
+{
+  GeglSamplerClass parent_class;
+};
+
+GType gegl_sampler_nohalo_get_type (void) G_GNUC_CONST;
+
+G_END_DECLS
+
+#endif
diff --git a/gegl/buffer/gegl-sampler.c b/gegl/buffer/gegl-sampler.c
index fa5b468..8a5ac8f 100644
--- a/gegl/buffer/gegl-sampler.c
+++ b/gegl/buffer/gegl-sampler.c
@@ -33,6 +33,7 @@
 #include "gegl-sampler-nearest.h"
 #include "gegl-sampler-linear.h"
 #include "gegl-sampler-cubic.h"
+#include "gegl-sampler-nohalo.h"
 #include "gegl-sampler-lohalo.h"
 
 enum
@@ -524,6 +525,9 @@ gegl_sampler_type_from_string (const gchar *string)
   if (g_str_equal (string, "cubic")   || g_str_equal (string, "bicubic"))
     return GEGL_SAMPLER_CUBIC;
 
+  if (g_str_equal (string, "nohalo"))
+    return GEGL_SAMPLER_NOHALO;
+
   if (g_str_equal (string, "lohalo"))
     return GEGL_SAMPLER_LOHALO;
 
@@ -541,6 +545,8 @@ gegl_sampler_gtype_from_enum (GeglSamplerType sampler_type)
         return GEGL_TYPE_SAMPLER_LINEAR;
       case GEGL_SAMPLER_CUBIC:
         return GEGL_TYPE_SAMPLER_CUBIC;
+      case GEGL_SAMPLER_NOHALO:
+        return GEGL_TYPE_SAMPLER_NOHALO;
       case GEGL_SAMPLER_LOHALO:
         return GEGL_TYPE_SAMPLER_LOHALO;
       default:
diff --git a/gegl/gegl-enums.h b/gegl/gegl-enums.h
index 648a766..66f5a05 100644
--- a/gegl/gegl-enums.h
+++ b/gegl/gegl-enums.h
@@ -35,6 +35,7 @@ typedef enum {
   GEGL_SAMPLER_NEAREST = 0,   /*< desc="nearest"      >*/
   GEGL_SAMPLER_LINEAR,        /*< desc="linear"       >*/
   GEGL_SAMPLER_CUBIC,         /*< desc="cubic"        >*/
+  GEGL_SAMPLER_NOHALO,        /*< desc="nohalo"       >*/
   GEGL_SAMPLER_LOHALO         /*< desc="lohalo"       >*/
 } GeglSamplerType;
 GType gegl_sampler_type_get_type   (void) G_GNUC_CONST;
diff --git a/operations/common/polar-coordinates.c b/operations/common/polar-coordinates.c
index 54dc3a6..2102294 100644
--- a/operations/common/polar-coordinates.c
+++ b/operations/common/polar-coordinates.c
@@ -344,7 +344,7 @@ process (GeglOperation       *operation,
 
         if (inside)
           gegl_buffer_sample (input, px, py, &scale, dest, format,
-                              GEGL_SAMPLER_LOHALO, GEGL_ABYSS_NONE);
+                              GEGL_SAMPLER_NOHALO, GEGL_ABYSS_NONE);
         else
           for (i=0; i<4; i++)
             dest[i] = 0.0;
diff --git a/operations/transform/transform-core.c b/operations/transform/transform-core.c
index ba54d9f..ed1cbca 100644
--- a/operations/transform/transform-core.c
+++ b/operations/transform/transform-core.c
@@ -178,7 +178,7 @@ op_transform_class_init (OpTransformClass *klass)
                                    g_param_spec_string (
                                      "filter",
                                      _("Filter"),
-                              _("Filter type (nearest, linear, cubic, lohalo)"),
+                      _("Filter type (nearest, linear, cubic, nohalo, lohalo)"),
                                      "linear",
                                      G_PARAM_CONSTRUCT | G_PARAM_READWRITE));
   g_object_class_install_property (gobject_class, PROP_HARD_EDGES,
diff --git a/operations/workshop/fractal-trace.c b/operations/workshop/fractal-trace.c
index 1f7647c..316393d 100644
--- a/operations/workshop/fractal-trace.c
+++ b/operations/workshop/fractal-trace.c
@@ -89,7 +89,7 @@ julia (gdouble  x,
       xx  = tmp;
 
       if ((x2 + y2) > bailout2)
-	break;
+        break;
     }
 
   *u = xx;
@@ -130,10 +130,10 @@ fractaltrace (GeglBuffer          *input,
       switch (fractal_type)
         {
         case FRACTAL_TYPE_JULIA:
-#define gegl_unmap(u,v,ud,vd) {\
-            gdouble rx, ry;                       \
-            cx = o->X1 + ((u) - picture->x) * scale_x;  \
-            cy = o->Y1 + ((v) - picture->y) * scale_y;              \
+#define gegl_unmap(u,v,ud,vd) {                                         \
+            gdouble rx, ry;                                             \
+            cx = o->X1 + ((u) - picture->x) * scale_x;                  \
+            cy = o->Y1 + ((v) - picture->y) * scale_y;                  \
             julia (cx, cy, o->JX, o->JY, &rx, &ry, o->depth, bailout2); \
             ud = (rx - o->X1) / scale_x + picture->x;                   \
             vd = (ry - o->Y1) / scale_y + picture->y;                   \
@@ -144,7 +144,7 @@ fractaltrace (GeglBuffer          *input,
         break;
 
         case FRACTAL_TYPE_MANDELBROT:
-#define gegl_unmap(u,v,ud,vd) {                 \
+#define gegl_unmap(u,v,ud,vd) {                                     \
             gdouble rx, ry;                                         \
             cx = o->X1 + ((u) - picture->x) * scale_x;              \
             cy = o->Y1 + ((v) - picture->y) * scale_y;              \
@@ -162,7 +162,7 @@ fractaltrace (GeglBuffer          *input,
         }
 
       gegl_buffer_sample (input, px, py, &scale, dest, format,
-                          GEGL_SAMPLER_LOHALO, o->abyss_policy);
+                          GEGL_SAMPLER_NOHALO, o->abyss_policy);
 
       for (i = 0; i < 4; i++)
         dst_buf[offset++] = dest[i];
@@ -176,7 +176,7 @@ process (GeglOperation       *operation,
          const GeglRectangle *result,
          gint                 level)
 {
-  GeglChantO	*o;
+  GeglChantO    *o;
   GeglRectangle  boundary;
   const Babl    *format;
   FractalType    fractal_type;
diff --git a/operations/workshop/whirl-pinch.c b/operations/workshop/whirl-pinch.c
index eb71dff..5174f96 100644
--- a/operations/workshop/whirl-pinch.c
+++ b/operations/workshop/whirl-pinch.c
@@ -141,7 +141,7 @@ apply_whirl_pinch (gdouble whirl, gdouble pinch, gdouble radius,
   scale_x = 1.0;
   scale_y = roi->width / (gdouble) roi->height;
   sampler = gegl_buffer_sampler_new (src, babl_format ("RaGaBaA float"),
-                                     GEGL_SAMPLER_LOHALO);
+                                     GEGL_SAMPLER_NOHALO);
 
   for (row = 0; row < roi->height; row++) {
     for (col = 0; col < roi->width; col++) {
[Date Prev][Date Next] [Thread Prev][Thread Next] [Thread Index] [Date Index] [Author Index]