thinplate_8c_source.html

/*

 *    This file is part of darktable,

 *    Copyright (C) 2016 Erwin Burema.

 *    Copyright (C) 2016 johannes hanika.

 *    Copyright (C) 2016 Roman Lebedev.

 *    Copyright (C) 2016 Tobias Ellinghaus.

 *    Copyright (C) 2019 Jacques Le Clerc.

 *    Copyright (C) 2020 Hubert Kowalski.

 *    Copyright (C) 2020 Pascal Obry.

 *    Copyright (C) 2021 Ralf Brown.

 *    Copyright (C) 2022 Martin Bařinka.

 *    Copyright (C) 2025 Aurélien PIERRE.

 *

 *    darktable is free software: you can redistribute it and/or modify

 *    it under the terms of the GNU General Public License as published by

 *    the Free Software Foundation, either version 3 of the License, or

 *    (at your option) any later version.

 *

 *    darktable is distributed in the hope that it will be useful,

 *    but WITHOUT ANY WARRANTY; without even the implied warranty of

 *    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

 *    GNU General Public License for more details.

 *

 *    You should have received a copy of the GNU General Public License

 *    along with darktable.  If not, see <http://www.gnu.org/licenses/>.

 */


#ifndef MAX

#define MAX(a, b) ((a) < (b) ? (b) : (a))

#endif

#ifndef MIN

#define MIN(a, b) ((a) > (b) ? (b) : (a))

#endif


#include "common/darktable.h"

#include "chart/thinplate.h"

#include "chart/deltaE.h"

#include "common/svd/svd.h"


#include <assert.h>

#include <float.h>

#include <stdlib.h>

#include <string.h>


// #define REPLACEMENT // either broken code or doesn't help at all

// #define EXACT       // use full solve instead of dot in inner loop


// Very fast, very coarse approximation of the natural logarithm.
// The bit pattern of the float is reinterpreted as an unsigned integer,
// converted back to float, then scaled and offset by two fixed constants.
// Zero, negative and non-finite inputs get no special handling.
static inline float __attribute__((__unused__)) fasterlog(float x)
{
  union
  {
    float f;
    uint32_t i;
  } bits = { x };

  // integer view of the float, scaled first and shifted second
  const float scaled = (float)bits.i * 8.2629582881927490e-8f;
  return scaled - 87.989971088f;
}


// Thin plate spline radial basis kernel phi(r) = r^2 * log(r), where r is the
// Euclidean distance between the 3D points x and y (three doubles each).
// r is clamped from below to 1e-8 before the logarithm, so coincident points
// yield zero instead of NaN. The logarithm itself is evaluated in single
// precision (logf); the product is returned as double.
static inline double thinplate_kernel(const double *x, const double *y)
{
  const double d0 = x[0] - y[0];
  const double d1 = x[1] - y[1];
  const double d2 = x[2] - y[2];
  const double r = sqrt(d0 * d0 + d1 * d1 + d2 * d2);

  // The approximate fasterlog() was tried in place of logf(), both here and
  // in the iop, but it still doesn't work so well: more precision is needed.
  return r * r * logf(MAX(1e-8f, r));
}


// Measure how well the current residuals fit, over all wd rows.
//
// Default build: the per-row error is the Euclidean norm of the
// (L, a, b) residual and the return value is the mean of those norms.
// With EXACT defined: the per-row error is the delta E 2000 between the
// tone-curved target L and the tone-curved (target L + residual L), both
// paired with the target a/b values, and the return value is their plain sum.
//
// c, target:   only read when EXACT is defined.
// residual_*:  wd residual values per channel.
// maxerr:      optional; receives the largest per-row error.
static inline double compute_error(
    const tonecurve_t *c,
    const double **target,
    const double *residual_L,
    const double *residual_a,
    const double *residual_b,
    const int wd,
    double *maxerr)
{
  double total = 0.0;
  double worst = 0.0;

  for(int row = 0; row < wd; row++)
  {
#ifdef EXACT
    const double Lt = target[0][row];
    const double L0 = tonecurve_apply(c, Lt);
    const double L1 = tonecurve_apply(c, Lt + residual_L[row]);
    dt_aligned_pixel_t Lab0 = { L0, target[1][row], target[2][row] };
    dt_aligned_pixel_t Lab1 = { L1, target[1][row], target[2][row] };
    const double localerr = dt_colorspaces_deltaE_2000(Lab0, Lab1);
    total += localerr;
#else
    const double dL = residual_L[row];
    const double da = residual_a[row];
    const double db = residual_b[row];
    const double localerr = sqrt(dL * dL + da * da + db * db);
    total += localerr / wd;
#endif
    // track the worst row
    if(worst < localerr) worst = localerr;
  }

  if(maxerr) *maxerr = worst;
  return total;
}


// Least-squares solve of As * coeff = b through the singular value
// decomposition As = u diag(w) v^t, i.e. coeff = v diag(1/w) u^t b.
//
// As:    wd x (s+1) matrix stored with row stride S. dsvd() works in place;
//        afterwards the buffer is read back as the u factor.
// w:     receives the s+1 singular values.
// v:     receives the (s+1) x (s+1) v factor.
// b:     right-hand side, wd entries.
// coeff: output, s+1 entries.
//
// Returns 0 on success. Returns 1 when w[s] (treated here as the smallest
// singular value) drops below 1e-3, or when the scratch buffer cannot be
// allocated.
static inline int solve(double *As, double *w, double *v, const double *b, double *coeff, int wd, int s, int S)
{
  const int n = s + 1; // number of active columns

  dsvd(As, wd, n, S, w, v);
  if(w[s] < 1e-3) return 1; // too close to singular, we're done

  double *tmp = malloc(sizeof(double) * S);
  if(IS_NULL_PTR(tmp)) return 1;

  // tmp = diag(1/w) * u^t * b
  for(int col = 0; col < n; col++)
  {
    double acc = 0.0;
    for(int row = 0; row < wd; row++) acc += As[row * S + col] * b[row];
    tmp[col] = acc / w[col];
  }

  // coeff = v * tmp
  for(int out = 0; out < n; out++)
  {
    double acc = 0.0;
    for(int k = 0; k < n; k++) acc += v[out * n + k] * tmp[k];
    coeff[out] = acc;
  }

  dt_free(tmp);
  return 0;
}


#pragma GCC diagnostic push

#pragma GCC diagnostic ignored "-Wvla"


// Sparse thin plate spline fit by greedy column selection.
//
// Builds the (N+4) x (N+4) system matrix
//
//   | R   P |
//   | P^t 0 |
//
// from the radial basis kernel R and a linear polynomial part P, then
// repeatedly picks the column whose normalised dot product with the current
// residuals (summed over channels) is largest, refits all chosen columns by
// least squares via solve(), and recomputes the residuals.
//
// Notes on the inputs, as used by the code below:
//  - point is read with a fixed stride of 3 and the residuals r[0], r[1], r[2]
//    are passed to compute_error(), so dim is effectively expected to be 3.
//  - every target[k] is read for wd = N + 4 entries.
//    NOTE(review): presumably the last four entries are the zero block of the
//    right-hand side sketched below -- confirm against the caller.
//  - permutation[] and coeff[ch][] are written at indices below S.
//
// Returns the number of selected columns (sparsity <= S) once S - 4 patch
// columns have been chosen or as soon as solve() gives up; -1 if the loop
// runs over all N + 4 columns without reaching that point; 0 if a work buffer
// cannot be allocated (nothing has been written to permutation/coeff then).
int thinplate_match(const tonecurve_t *curve, // tonecurve to apply after this (needed for error estimation)
                    int dim,                  // dimensionality of points
                    int N,                    // number of points
                    const double *point,      // dim-strided points
                    const double **target,    // target values, one pointer per dimension
                    int S,                    // desired sparsity level, actual result will be returned
                    int *permutation, // pointing to original order of points, to identify correct output coeff
                    double **coeff,   // output coefficient arrays for each dimension, ordered according to
                                      // permutation[dim]
                    double *avgerr,           // average error
                    double *maxerr)           // max error
{
  if(avgerr) *avgerr = 0.0;
  if(maxerr) *maxerr = 0.0;

  const int wd = N + 4;
  int result = 0; // returned as-is when allocation fails

  // Grab every work buffer up front and check them in one place, so that all
  // exits can share the single cleanup path at the bottom. The pointer with
  // variably modified type (r) must be declared before the first goto.
  double *A = malloc(sizeof(double) * wd * wd);       // system matrix
  double *norm = malloc(sizeof(double) * wd);         // 1/|column| or 0 if already chosen
  double(*r)[wd] = malloc(sizeof(double) * dim * wd); // residual per channel
  const double **b = malloc(sizeof(double *) * dim);  // right-hand side per channel
  double *w = malloc(sizeof(double) * S);             // singular values
  double *v = malloc(sizeof(double) * S * S);         // v factor of the svd
  double *As = calloc((size_t)wd * S, sizeof(double)); // selected columns, row stride S
  if(A == NULL || norm == NULL || r == NULL || b == NULL || w == NULL || v == NULL || As == NULL)
    goto cleanup;

  // construct system matrix A such that:
  // A c = f
  //
  // | R   P | |c| = |f|
  // | P^t 0 | |d|   |0|
  //
  // to interpolate values f_i with the radial basis function system matrix R and a polynomial term P.
  // P is a 3D linear polynomial a + b x + c y + d z
  //
  // radial basis function part R
  for(int j = 0; j < N; j++)
    for(int i = j; i < N; i++) A[j * wd + i] = A[i * wd + j] = thinplate_kernel(point + 3 * i, point + 3 * j);

  // polynomial part P: constant + 3x linear
  for(int i = 0; i < N; i++) A[i * wd + N + 0] = A[(N + 0) * wd + i] = 1.0f;
  for(int i = 0; i < N; i++) A[i * wd + N + 1] = A[(N + 1) * wd + i] = point[3 * i + 0];
  for(int i = 0; i < N; i++) A[i * wd + N + 2] = A[(N + 2) * wd + i] = point[3 * i + 1];
  for(int i = 0; i < N; i++) A[i * wd + N + 3] = A[(N + 3) * wd + i] = point[3 * i + 2];

  for(int j = N; j < wd; j++)
    for(int i = N; i < wd; i++) A[j * wd + i] = 0.0f;

  // precompute normalisation factors for columns of A
  for(int i = 0; i < wd; i++)
  {
    norm[i] = 0.0;
    for(int j = 0; j < wd; j++) norm[i] += A[j * wd + i] * A[j * wd + i];
    norm[i] = 1.0 / sqrt(norm[i]);
  }

  // XXX do we need these explicitly?
  // residual = target vector
  for(int k = 0; k < dim; k++) b[k] = target[k];
  for(int k = 0; k < dim; k++) memcpy(r[k], b[k], sizeof(double) * wd);

  // for rank from 0 to sparsity level
  int s = 0, patches = 0;
  double olderr = FLT_MAX;
  // in case of replacement, iterate all the way to wd
  for(; s < wd; s++)
  {
    const int sparsity = MIN(s, S);
#ifndef REPLACEMENT
    if(patches >= S - 4)
    {
      // enough patch columns selected, we are done
      result = sparsity;
      goto cleanup;
    }
    assert(sparsity < S + 4);
#endif
    // find (sparsity+1)-th column a_m by m = argmax_t{ a_t^t r . norm_t}
    // by searching over all three residuals
    double maxdot = 0.0;
    int maxcol = 0;
    for(int t = 0; t < wd; t++)
    {
      double dot = 0.0;
      if(norm[t] > 0.0) // norm is zeroed for columns that are already chosen
      {
#ifdef EXACT // use full solve
        permutation[sparsity] = t;
        for(int ch = 0; ch < dim; ch++)
        {
          // re-init columns in As
          // svd will destroy its contents:
          for(int i = 0; i <= sparsity; i++)
            for(int j = 0; j < wd; j++) As[j * S + i] = A[j * wd + permutation[i]];

          if(solve(As, w, v, b[ch], coeff[ch], wd, sparsity, S))
          {
            result = sparsity;
            goto cleanup;
          }

          // compute tentative residual:
          // r = b - As c
          for(int j = 0; j < wd; j++)
          {
            r[ch][j] = b[ch][j];
            for(int i = 0; i <= sparsity; i++) r[ch][j] -= A[j * wd + permutation[i]] * coeff[ch][i];
          }
        }

        // compute error:
        const double err = compute_error(curve, target, r[0], r[1], r[2], wd, 0);
        dot = 1. / err; // searching for smallest error or largest dot
#else                   // use dot product
        for(int ch = 0; ch < dim; ch++)
        {
          double chdot = 0.0;
          for(int j = 0; j < wd; j++) chdot += A[j * wd + t] * r[ch][j];
          dot += fabs(chdot);
        }
        dot *= norm[t];
#endif
      }
      // fprintf(stderr, "dot %d = %g\n", i, dot);
      if(dot > maxdot)
      {
        maxcol = t;
        maxdot = dot;
      }
    }

    if(patches < S - 4)
    {
      // remember which column that was, we'll need it to evaluate later:
      permutation[s] = maxcol;
      if(maxcol < N) patches++; // columns >= N belong to the polynomial part
      // make sure we won't choose it again:
      norm[maxcol] = 0.0;
    }
    else
    { // already have chosen S-4 patches as columns, now do the replacement:
      // (only reachable when REPLACEMENT is defined, see the early exit above)
      int mincol = 0;
      double minerr = FLT_MAX;
      for(int t = 0; t < sparsity; t++)
      {
        // find already chosen column t with min error reduction when replacing
        // XXX do we set perm[t] above, ever? for t=S-1?
        int oldperm = permutation[t];
        permutation[t] = maxcol;
#ifdef EXACT
        for(int ch = 0; ch < dim; ch++)
        {
          // re-init all columns in As
          for(int i = 0; i < sparsity; i++)
            for(int j = 0; j < wd; j++) As[j * S + i] = A[j * wd + permutation[i]];

          if(solve(As, w, v, b[ch], coeff[ch], wd, sparsity-1, S))
          {
            result = s;
            goto cleanup;
          }

          // compute tentative residual:
          // r = b - As c
          for(int j = 0; j < wd; j++)
          {
            r[ch][j] = b[ch][j];
            for(int i = 0; i < sparsity; i++) r[ch][j] -= A[j * wd + permutation[i]] * coeff[ch][i];
          }
        }

        // compute error:
        const double err = compute_error(curve, target, r[0], r[1], r[2], wd, 0);
#else
        // NOTE(review): this indexes A by the slot number t and by mincol
        // rather than by the column stored in permutation[] -- looks
        // unintended, left untouched since the whole replacement path is
        // flagged as experimental at the top of the file.
        double dot = 0.0;
        for(int ch = 0; ch < dim; ch++)
        {
          double chdot = 0.0;
          for(int j = 0; j < wd; j++) chdot += A[j * wd + t] * r[ch][j];
          dot += fabs(chdot);
        }
        double n = 0.0; // recompute column norm
        for(int j = 0; j < wd; j++) n += A[j * wd + mincol] * A[j * wd + mincol];
        dot *= n;
        double err = 1. / dot;
#endif

        if(err < minerr)
        {
          mincol = t;
          minerr = err;
        }
        permutation[t] = oldperm;
        // fprintf(stderr, "perm %d %d\n", t, oldperm);
      }
      // if(minerr >= 1. / maxdot) return sparsity + 1;
      if(minerr < 1. / maxdot)
      {
        fprintf(stderr, "replacing %d <- %d\n", mincol, maxcol);
        // replace column
        permutation[mincol] = maxcol;
        // reset norm[] of discarded column to something > 0
#ifdef EXACT
        norm[mincol] = 1.0;
#else
        norm[mincol] = 0.0;
        for(int j = 0; j < wd; j++) norm[mincol] += A[j * wd + mincol] * A[j * wd + mincol];
        norm[mincol] = 1.0 / sqrt(norm[mincol]);
#endif
        norm[maxcol] = 0.0;
      }
    }

    // Declared for both configurations: the reporting code below uses sp and
    // merr regardless of EXACT. In the EXACT configuration merr stays at 0.
    const int sp = MIN(sparsity, S-1); // need to fix up for replacement
    double merr = 0.0;
#ifdef EXACT
    double err = 1. / maxdot;
#else
    // solve linear least squares for sparse c for every output channel:
    for(int ch = 0; ch < dim; ch++)
    {
      // re-init all of the previous columns in As since
      // svd will destroy its contents:
      for(int i = 0; i <= sp; i++)
        for(int j = 0; j < wd; j++) As[j * S + i] = A[j * wd + permutation[i]];

      // on error, return last valid configuration
      if(solve(As, w, v, b[ch], coeff[ch], wd, sp, S))
      {
        result = sparsity;
        goto cleanup;
      }

      // compute new residual:
      // r = b - As c
      for(int j = 0; j < wd; j++)
      {
        r[ch][j] = b[ch][j];
        for(int i = 0; i <= sp; i++) r[ch][j] -= A[j * wd + permutation[i]] * coeff[ch][i];
      }
    }

    const double err = compute_error(curve, target, r[0], r[1], r[2], wd, &merr);
#endif
    // residual is max CIE76 delta E now
    // everything < 2 is usually considered a very good approximation:
    if(patches == S-4)
    {
      if(avgerr) *avgerr = err;
      if(maxerr) *maxerr = merr;
      fprintf(stderr, "rank %d/%d avg DE %g max DE %g\n", sp + 1, patches, err, merr);
    }
    if(s >= S && err >= olderr)
      fprintf(stderr, "error increased!\n");
      // return sparsity + 1;
    // if(err < 2.0) return sparsity+1;
    olderr = err;
  }

  // ran through all columns without reaching the requested number of patches
  result = -1;

cleanup:
  // single exit path; assumes dt_free() tolerates NULL like free() -- TODO confirm
  dt_free(r);
  dt_free(b);
  dt_free(w);
  dt_free(v);
  dt_free(As);
  dt_free(norm);
  dt_free(A);
  return result;
}


#pragma GCC diagnostic pop


float thinplate_color_pos(float L, float a, float b)

{

  const float pi = 3.14153f; // clearly true.

  const float h = atan2f(b, a) + pi;

  // const float C = sqrtf(a*a + b*b);

  const int sector = 4.0f * h / (2.0f * pi);

  return 256.0 * sector + L; // C;

}


// clang-format off

// modelines: These editor modelines have been set for all relevant files by tools/update_modelines.py

// vim: shiftwidth=2 expandtab tabstop=2 cindent

// kate: tab-indents: off; indent-width 2; replace-tabs on; indent-mode cstyle; remove-trailing-spaces modified;

// clang-format on

assert.h

tonecurve_apply
double tonecurve_apply(const tonecurve_t *c, const double L)
Definition chart/tonecurve.c:73

A
#define A(y, x)
Definition colorspaces.c:186

i
const float i
Definition colorspaces_inline_conversions.h:440

L
const float L
Definition colorspaces_inline_conversions.h:493

f
const dt_aligned_pixel_t f
Definition colorspaces_inline_conversions.h:102

n
const float n
Definition colorspaces_inline_conversions.h:678

S
#define S(V, params)
Definition common/histogram.c:36

darktable.h

__attribute__
float dt_aligned_pixel_simd_t __attribute__((vector_size(16), aligned(16)))
Enable aggressive floating-point arithmetic optimizations, in denormals handling. Set through user pr...
Definition darktable.h:524

dt_free
#define dt_free(ptr)
Definition darktable.h:456

IS_NULL_PTR
#define IS_NULL_PTR(p)
C is way too permissive with !=, == and if(var) checks, which can mean too many things depending on w...
Definition darktable.h:281

dt_colorspaces_deltaE_2000
float dt_colorspaces_deltaE_2000(dt_aligned_pixel_t Lab0, dt_aligned_pixel_t Lab1)
Definition deltaE.c:48

deltaE.h

permutation
static int permutation[]
Definition grain.c:160

x
static const float x
Definition iop_profile.h:235

coeff
const float *const const float coeff[3]
Definition iop_profile.h:240

t
const int t
Definition iop_profile.h:225

v
const float v
Definition iop_profile.h:221

k
float *const restrict const size_t k
Definition luminance_mask.h:78

ch
float *const restrict const size_t const size_t ch
Definition luminance_mask.h:78

N
#define N
Definition noiseprofile.c:158

dt_aligned_pixel_t
float dt_aligned_pixel_t[4]
Definition noiseprofile.c:28

r
const float r
Definition src/develop/noise_generator.h:101

point
Definition ashift_lsd.c:192

tonecurve_t
Definition tonecurve.h:28

svd.h
Singular value decomposition helper shared by chart and color-math code.

dsvd
static int dsvd(double *a, int m, int n, int str, double *w, double *v)
Compute the singular value decomposition of a dense matrix.
Definition svd.h:80

double
typedef double((*spd)(unsigned long int wavelength, double TempK))

MIN
#define MIN(a, b)
Definition thinplate.c:32

thinplate_color_pos
float thinplate_color_pos(float L, float a, float b)
Definition thinplate.c:448

thinplate_kernel
static double thinplate_kernel(const double *x, const double *y)
Definition thinplate.c:58

solve
static int solve(double *As, double *w, double *v, const double *b, double *coeff, int wd, int s, int S)
Definition thinplate.c:123

compute_error
static double compute_error(const tonecurve_t *c, const double **target, const double *residual_L, const double *residual_a, const double *residual_b, const int wd, double *maxerr)
Definition thinplate.c:68

thinplate_match
int thinplate_match(const tonecurve_t *curve, int dim, int N, const double *point, const double **target, int S, int *permutation, double **coeff, double *avgerr, double *maxerr)
Definition thinplate.c:157

MAX
#define MAX(a, b)
Definition thinplate.c:29

thinplate.h