laserIMUCalibration/lmmin_8c_source.html

 #include <stdlib.h>

 #include <stdio.h>

 #include <math.h>

 #include <float.h>

 #include "lmmin.h"


 /* Smaller of two values. Function-like macro: an argument may be evaluated
    twice, so do not pass expressions with side effects. */
 #define MIN(a,b) (((a)<=(b)) ? (a) : (b))

 /* Larger of two values (same double-evaluation caveat as MIN). */
 #define MAX(a,b) (((a)>=(b)) ? (a) : (b))

 /* Square of x. The whole expansion is parenthesized so that it behaves as a
    single operand, e.g. in 1/SQR(x) or -SQR(x); x is evaluated twice. */
 #define SQR(x)   ((x)*(x))


 /* Forward declarations of helper routines defined further down in this file.
    lmmin calls lm_qrfac and lm_lmpar; lm_lmpar in turn calls lm_qrsolv. */

 /* Determine the Levenberg-Marquardt parameter and the corresponding step. */
 void lm_lmpar( int n, double *r, int ldr, int *ipvt, double *diag,
                double *qtb, double delta, double *par, double *x,
                double *sdiag, double *aux, double *xdi );

 /* QR factorization of an m by n matrix with column pivoting. */
 void lm_qrfac( int m, int n, double *a, int *ipvt,
                double *rdiag, double *acnorm, double *wa );

 /* Linear least-squares solve that reuses a QR factorization. */
 void lm_qrsolv( int n, double *r, int ldr, int *ipvt, double *diag,
                 double *qtb, double *x, double *sdiag, double *wa );


 /*****************************************************************************/

 /*  Numeric constants                                                        */

 /*****************************************************************************/


 /* machine-dependent constants from float.h */

 #define LM_MACHEP     DBL_EPSILON   /* resolution of arithmetic */
 #define LM_DWARF      DBL_MIN       /* smallest normalized positive double */
 #define LM_SQRT_DWARF sqrt(DBL_MIN) /* square should not underflow */
 #define LM_SQRT_GIANT sqrt(DBL_MAX) /* square should not overflow */
 /* Recommended user tolerance. Parenthesized so that the macro acts as one
    operand in any expression (e.g. 1/LM_USERTOL). */
 #define LM_USERTOL    (30*LM_MACHEP)


 /* If the above values do not work, the following seem good for an x86:

  LM_MACHEP     .555e-16

  LM_DWARF      9.9e-324

  LM_SQRT_DWARF 1.e-160

  LM_SQRT_GIANT 1.e150

  LM_USERTOL    1.e-14

    The following values should work on any machine:

  LM_MACHEP     1.2e-16

  LM_DWARF      1.0e-38

  LM_SQRT_DWARF 3.834e-20

  LM_SQRT_GIANT 1.304e19

  LM_USERTOL    1.e-14

 */


 /* Default control settings using the double-precision tolerance LM_USERTOL.
    NOTE(review): the initializer is positional; the field order is declared
    in lmmin.h, which is not visible here. Presumably the values are
    ftol, xtol, gtol, epsilon, stepbound, patience, scale_diag, then
    msgfile, verbosity and two print limits (n_maxpri and one more) --
    confirm against the struct declaration. */
 const lm_control_struct lm_control_double = {
     LM_USERTOL, LM_USERTOL, LM_USERTOL, LM_USERTOL, 100., 100, 1,
     NULL, 0, -1, -1
 };

 /* Default control settings with the looser tolerance 1.e-7 in the first four
    slots; the remaining values equal those of lm_control_double.
    NOTE(review): the initializer is positional; confirm the field order
    against the lm_control_struct declaration in lmmin.h. */
 const lm_control_struct lm_control_float = {
     1.e-7,      1.e-7,      1.e-7,      1.e-7,      100., 100, 1,
     NULL, 0, -1, -1
 };


 /*****************************************************************************/

 /*  Message texts (indexed by status.outcome)                                */

 /*****************************************************************************/


 /* Long descriptions of the termination codes; the array index matches the
    value that lmmin stores in S->outcome (0 .. 11). */
 const char *lm_infmsg[] = {
     "found zero (sum of squares below underflow limit)",                      /*  0 */
     "converged  (the relative error in the sum of squares is at most tol)",   /*  1 */
     "converged  (the relative error of the parameter vector is at most tol)", /*  2 */
     "converged  (both errors are at most tol)",                               /*  3 */
     "trapped    (by degeneracy; increasing epsilon might help)",              /*  4 */
     "exhausted  (number of function calls exceeding preset patience)",        /*  5 */
     "failed     (ftol<tol: cannot reduce sum of squares any further)",        /*  6 */
     "failed     (xtol<tol: cannot improve approximate solution any further)", /*  7 */
     "failed     (gtol<tol: cannot improve approximate solution any further)", /*  8 */
     "crashed    (not enough memory)",                                         /*  9 */
     "exploded   (fatal coding error: improper input parameters)",             /* 10 */
     "stopped    (break requested within function evaluation)"                 /* 11 */
 };


 /* Short labels for the termination codes, in the same order as lm_infmsg
    (one entry per outcome value 0 .. 11). */
 const char *lm_shortmsg[] = {
     "found zero",    /*  0 */
     "converged (f)", /*  1 */
     "converged (p)", /*  2 */
     "converged (2)", /*  3 */
     "degenerate",    /*  4 */
     "call limit",    /*  5 */
     "failed (f)",    /*  6 */
     "failed (p)",    /*  7 */
     "failed (o)",    /*  8 */
     "no memory",     /*  9 */
     "invalid input", /* 10 */
     "user break"     /* 11 */
 };


 /*****************************************************************************/

 /*  Monitoring auxiliaries.                                                  */

 /*****************************************************************************/


 /* Write one monitoring line to fout: the first nout entries of par, each as
    " %16.9g", followed by " => ", the norm fnorm, and a newline. */
 void lm_print_pars( int nout, const double *par, double fnorm, FILE* fout )
 {
     const double *cursor = par;
     int remaining;

     for (remaining = nout; remaining > 0; --remaining) {
         fprintf( fout, " %16.9g", *cursor );
         ++cursor;
     }
     fprintf( fout, " => %18.11g\n", fnorm );
 }


 /*****************************************************************************/

 /*  lmmin (main minimization routine)                                        */

 /*****************************************************************************/


 /*
  *  lmmin: minimize the Euclidean norm of an m-vector of residuals with
  *  respect to n parameters by a Levenberg-Marquardt iteration. The Jacobian
  *  is approximated by forward differences.
  *
  *  Parameters:
  *    n         number of parameters; must be positive.
  *    x         array of length n. On input the starting point; it is
  *              overwritten by every accepted step, so on return it holds the
  *              last accepted parameter vector.
  *    m         number of residuals; must not be smaller than n.
  *    data      opaque pointer handed through to evaluate unchanged.
  *    evaluate  callback that must fill fvec[0..m_dat-1] with the residuals
  *              for the parameter vector par. Setting *userbreak to a nonzero
  *              value makes lmmin stop with outcome 11.
  *    C         control settings; the fields read here are ftol, xtol, gtol,
  *              epsilon, stepbound, patience, scale_diag, msgfile, verbosity
  *              and n_maxpri.
  *    S         status output; outcome, userbreak and nfev are always set,
  *              fnorm is set whenever the work space could be allocated and
  *              the input passed validation.
  *
  *  S->outcome indexes lm_infmsg / lm_shortmsg:
  *    0-3  success, 4 degenerate gradient, 5 evaluation limit reached,
  *    6-8  tolerances too stringent, 9 out of memory, 10 invalid input,
  *    11   break requested by evaluate.
  *
  *  All monitoring output goes to C->msgfile (stdout if that is NULL);
  *  input errors are reported on stderr.
  */
 void lmmin( int n, double *x, int m, const void *data,
             void (*evaluate) (const double *par, int m_dat, const void *data,
                               double *fvec, int *userbreak),
             const lm_control_struct *C, lm_status_struct *S )
 {
     /* Work arrays start out NULL so that the common cleanup code can free
        them unconditionally, even after a partial allocation failure. */
     double *fvec = NULL, *diag = NULL, *fjac = NULL, *qtf = NULL,
            *wa1 = NULL, *wa2 = NULL, *wa3 = NULL, *wf = NULL;
     int *ipvt = NULL;
     int j, i;
     double actred, dirder, fnorm, fnorm1, gnorm, pnorm,
            prered, ratio, step, sum, temp, temp1, temp2, temp3;
     static double p0001 = 1.0e-4;

     int maxfev = C->patience * (n + 1);

     int    outer, inner;  /* loop counters, for monitoring */
     int    inner_success; /* flag for loop control */
     double lmpar = 0;     /* Levenberg-Marquardt parameter */
     double delta = 0;
     double xnorm = 0;
     double eps = sqrt(MAX(C->epsilon, LM_MACHEP)); /* for forward differences */

     int nout = C->n_maxpri == -1 ? n : MIN( C->n_maxpri, n );

     /* The workaround msgfile=NULL is needed for default initialization */
     FILE* msgfile = C->msgfile ? C->msgfile : stdout;

     /* Default status info; must be set ahead of first return statements */
     S->outcome = 0;      /* status code */
     S->userbreak = 0;
     S->nfev = 0;      /* function evaluation counter */

     /***  Check input parameters for errors.  ***/

     if ( n <= 0 ) {
         fprintf( stderr, "lmmin: invalid number of parameters %i\n", n );
         S->outcome = 10; /* invalid parameter */
         return;
     }
     if (m < n) {
         fprintf( stderr, "lmmin: number of data points (%i) "
                  "smaller than number of parameters (%i)\n", m, n );
         S->outcome = 10;
         return;
     }
     if (C->ftol < 0. || C->xtol < 0. || C->gtol < 0.) {
         fprintf( stderr,
                  "lmmin: negative tolerance (at least one of %g %g %g)\n",
                  C->ftol, C->xtol, C->gtol );
         S->outcome = 10;
         return;
     }
     if (maxfev <= 0) {
         fprintf( stderr, "lmmin: nonpositive function evaluations limit %i\n",
                  maxfev );
         S->outcome = 10;
         return;
     }
     if (C->stepbound <= 0.) {
         fprintf( stderr, "lmmin: nonpositive stepbound %g\n", C->stepbound );
         S->outcome = 10;
         return;
     }
     if (C->scale_diag != 0 && C->scale_diag != 1) {
         fprintf( stderr, "lmmin: logical variable scale_diag=%i, "
                  "should be 0 or 1\n", C->scale_diag );
         S->outcome = 10;
         return;
     }

     /***  Allocate work space.  ***/

     /* Sizes are computed in size_t so that n*m cannot overflow int. */
     fvec = (double *) malloc((size_t) m * sizeof(double));
     diag = (double *) malloc((size_t) n * sizeof(double));
     qtf  = (double *) malloc((size_t) n * sizeof(double));
     fjac = (double *) malloc((size_t) n * (size_t) m * sizeof(double));
     wa1  = (double *) malloc((size_t) n * sizeof(double));
     wa2  = (double *) malloc((size_t) n * sizeof(double));
     wa3  = (double *) malloc((size_t) n * sizeof(double));
     wf   = (double *) malloc((size_t) m * sizeof(double));
     ipvt = (int *)    malloc((size_t) n * sizeof(int));
     if ( fvec == NULL || diag == NULL || qtf == NULL || fjac == NULL ||
             wa1 == NULL || wa2 == NULL || wa3 == NULL || wf == NULL ||
             ipvt == NULL ) {
         S->outcome = 9;
         goto cleanup; /* releases whatever was obtained */
     }

     if (!C->scale_diag) {
         for (j = 0; j < n; j++)
             diag[j] = 1.;
     }

     /***  Evaluate function at starting point and calculate norm.  ***/

     (*evaluate)( x, m, data, fvec, &(S->userbreak) );
     S->nfev = 1;
     if ( S->userbreak )
         goto terminate;
     fnorm = lm_enorm(m, fvec);
     if ( C->verbosity ) {
         fprintf( msgfile, "lmmin start " );
         lm_print_pars( nout, x, fnorm, msgfile );
     }
     if ( fnorm <= LM_DWARF ) {
         S->outcome = 0; /* sum of squares almost zero, nothing to do */
         goto terminate;
     }

     /***  The outer loop: compute gradient, then descend.  ***/

     for ( outer = 0; ; ++outer ) {

         /***  [outer]  Calculate the Jacobian.  ***/

         /* Forward differences; column j of the Jacobian is stored in
            fjac[j*m .. j*m+m-1]. */
         for (j = 0; j < n; j++) {
             temp = x[j];
             step = MAX(eps * eps, eps * fabs(temp));
             x[j] += step; /* replace temporarily */
             (*evaluate)( x, m, data, wf, &(S->userbreak) );
             x[j] = temp; /* restore at once, so a user break cannot leave
                             the caller's x perturbed */
             ++(S->nfev);
             if ( S->userbreak )
                 goto terminate;
             for (i = 0; i < m; i++)
                 fjac[j * m + i] = (wf[i] - fvec[i]) / step;
         }
         if ( C->verbosity >= 10 ) {
             /* print the entire matrix */
             fprintf( msgfile, "\nlmmin Jacobian\n" );
             for (i = 0; i < m; i++) {
                 fprintf( msgfile, "  " );
                 for (j = 0; j < n; j++)
                     fprintf( msgfile, "%.5e ", fjac[j * m + i] );
                 fprintf( msgfile, "\n" );
             }
         }

         /***  [outer]  Compute the QR factorization of the Jacobian.  ***/

         /*      fjac is an m by n array. The upper n by n submatrix of fjac
          *        is made to contain an upper triangular matrix r with diagonal
          *        elements of nonincreasing magnitude such that
          *
          *              p^T*(jac^T*jac)*p = r^T*r
          *
          *              (NOTE: ^T stands for matrix transposition),
          *
          *        where p is a permutation matrix and jac is the final calculated
          *        Jacobian. Column j of p is column ipvt(j) of the identity matrix.
          *        The lower trapezoidal part of fjac contains information generated
          *        during the computation of r.
          *
          *      ipvt is an integer array of length n. It defines a permutation
          *        matrix p such that jac*p = q*r, where jac is the final calculated
          *        Jacobian, q is orthogonal (not stored), and r is upper triangular
          *        with diagonal elements of nonincreasing magnitude. Column j of p
          *        is column ipvt(j) of the identity matrix.
          */

         lm_qrfac(m, n, fjac, ipvt, wa1, wa2, wa3);
         /* return values are ipvt, wa1=rdiag, wa2=acnorm */

         /***  [outer]  Form q^T * fvec and store first n components in qtf.  ***/

         for (i = 0; i < m; i++)
             wf[i] = fvec[i];

         for (j = 0; j < n; j++) {
             temp3 = fjac[j * m + j];
             if (temp3 != 0.) {
                 sum = 0;
                 for (i = j; i < m; i++)
                     sum += fjac[j * m + i] * wf[i];
                 temp = -sum / temp3;
                 for (i = j; i < m; i++)
                     wf[i] += fjac[j * m + i] * temp;
             }
             fjac[j * m + j] = wa1[j];
             qtf[j] = wf[j];
         }

         /***  [outer]  Compute norm of scaled gradient and detect degeneracy.  ***/

         gnorm = 0;
         for (j = 0; j < n; j++) {
             if (wa2[ipvt[j]] == 0)
                 continue;
             sum = 0.;
             for (i = 0; i <= j; i++)
                 sum += fjac[j * m + i] * qtf[i];
             gnorm = MAX( gnorm, fabs( sum / wa2[ipvt[j]] / fnorm ) );
         }

         if (gnorm <= C->gtol) {
             S->outcome = 4;
             goto terminate;
         }

         /***  [outer]  Initialize / update diag and delta. ***/

         if ( !outer ) {
             /* first iteration only */
             if (C->scale_diag) {
                 /* diag := norms of the columns of the initial Jacobian */
                 for (j = 0; j < n; j++)
                     diag[j] = wa2[j] ? wa2[j] : 1;
                 /* xnorm := || D x || */
                 for (j = 0; j < n; j++)
                     wa3[j] = diag[j] * x[j];
                 xnorm = lm_enorm(n, wa3);
                 if ( C->verbosity >= 2 ) {
                     /* NOTE(review): the line is labelled "diag" but prints
                        x together with xnorm -- confirm this is intended. */
                     fprintf( msgfile, "lmmin diag  " );
                     lm_print_pars( nout, x, xnorm, msgfile );
                 }
                 /* only now print the header for the loop table */
                 if ( C->verbosity >= 3 ) {
                     fprintf( msgfile, "  o  i     lmpar    prered"
                              "          ratio    dirder      delta"
                              "      pnorm                 fnorm" );
                     for (i = 0; i < nout; ++i)
                         fprintf( msgfile, "               p%i", i );
                     fprintf( msgfile, "\n" );
                 }
             } else {
                 xnorm = lm_enorm(n, x);
             }
             /* initialize the step bound delta. */
             if ( xnorm )
                 delta = C->stepbound * xnorm;
             else
                 delta = C->stepbound;
         } else {
             if (C->scale_diag) {
                 for (j = 0; j < n; j++)
                     diag[j] = MAX( diag[j], wa2[j] );
             }
         }

         /***  The inner loop. ***/
         inner = 0;
         do {

             /***  [inner]  Determine the Levenberg-Marquardt parameter.  ***/

             lm_lmpar( n, fjac, m, ipvt, diag, qtf, delta, &lmpar,
                       wa1, wa2, wf, wa3 );
             /* used return values are fjac (partly), lmpar, wa1=x, wa3=diag*x */

             /* predict scaled reduction */
             pnorm = lm_enorm(n, wa3);
             temp2 = lmpar * SQR( pnorm / fnorm );
             for (j = 0; j < n; j++) {
                 wa3[j] = 0;
                 for (i = 0; i <= j; i++)
                     wa3[i] -= fjac[j * m + i] * wa1[ipvt[j]];
             }
             temp1 = SQR( lm_enorm(n, wa3) / fnorm );
             prered = temp1 + 2 * temp2;
             dirder = -temp1 + temp2; /* scaled directional derivative */

             /* at first call, adjust the initial step bound. */
             if ( !outer && pnorm < delta )
                 delta = pnorm;

             /***  [inner]  Evaluate the function at x + p.  ***/

             /* wa1 holds the step with opposite sign, hence the subtraction */
             for (j = 0; j < n; j++)
                 wa2[j] = x[j] - wa1[j];

             (*evaluate)( wa2, m, data, wf, &(S->userbreak) );
             ++(S->nfev);
             if ( S->userbreak )
                 goto terminate;
             fnorm1 = lm_enorm(m, wf);

             /***  [inner]  Evaluate the scaled reduction.  ***/

             /* actual scaled reduction */
             actred = 1 - SQR(fnorm1 / fnorm);

             /* ratio of actual to predicted reduction */
             ratio = prered ? actred / prered : 0;

             if ( C->verbosity == 2 ) {
                 fprintf( msgfile, "lmmin (%i:%i) ", outer, inner );
                 lm_print_pars( nout, wa2, fnorm1, msgfile );
             } else if ( C->verbosity >= 3 ) {
                 /* whole table row goes to msgfile, matching its header */
                 fprintf( msgfile, "%3i %2i %9.2g %9.2g %14.6g"
                          " %9.2g %10.3e %10.3e %21.15e",
                          outer, inner, lmpar, prered, ratio,
                          dirder, delta, pnorm, fnorm1 );
                 for (i = 0; i < nout; ++i)
                     fprintf( msgfile, " %16.9g", wa2[i] );
                 fprintf( msgfile, "\n" );
             }

             /* update the step bound */
             if        ( ratio <= 0.25 ) {
                 if      ( actred >= 0 )
                     temp = 0.5;
                 else if ( actred > -99 ) /* -99 = 1-1/0.1^2 */
                     temp = MAX( dirder / (2 * dirder + actred), 0.1 );
                 else
                     temp = 0.1;
                 delta = temp * MIN(delta, pnorm / 0.1);
                 lmpar /= temp;
             } else if ( ratio >= 0.75 ) {
                 delta = 2 * pnorm;
                 lmpar *= 0.5;
             } else if ( !lmpar ) {
                 delta = 2 * pnorm;
             }

             /***  [inner]  On success, update solution, and test for convergence.  ***/

             inner_success = ratio >= p0001;
             if ( inner_success ) {

                 /* update x, fvec, and their norms */
                 if (C->scale_diag) {
                     for (j = 0; j < n; j++) {
                         x[j] = wa2[j];
                         wa2[j] = diag[j] * x[j];
                     }
                 } else {
                     for (j = 0; j < n; j++)
                         x[j] = wa2[j];
                 }
                 for (i = 0; i < m; i++)
                     fvec[i] = wf[i];
                 xnorm = lm_enorm(n, wa2);
                 fnorm = fnorm1;
             }

             /* convergence tests */
             S->outcome = 0;
             if ( fnorm <= LM_DWARF )
                 goto terminate;  /* success: sum of squares almost zero */
             /* test two criteria (both may be fulfilled) */
             if (fabs(actred) <= C->ftol && prered <= C->ftol && ratio <= 2)
                 S->outcome = 1;  /* success: sum of squares almost stable */
             if (delta <= C->xtol * xnorm)
                 S->outcome += 2; /* success: x almost stable */
             if (S->outcome != 0) {
                 goto terminate;
             }

             /***  [inner]  Tests for termination and stringent tolerances.  ***/

             if ( S->nfev >= maxfev ) {
                 S->outcome = 5;
                 goto terminate;
             }
             if ( fabs(actred) <= LM_MACHEP &&
                     prered <= LM_MACHEP && ratio <= 2 ) {
                 S->outcome = 6;
                 goto terminate;
             }
             if ( delta <= LM_MACHEP * xnorm ) {
                 S->outcome = 7;
                 goto terminate;
             }
             if ( gnorm <= LM_MACHEP ) {
                 S->outcome = 8;
                 goto terminate;
             }

             /***  [inner]  End of the loop. Repeat if iteration unsuccessful.  ***/

             ++inner;
         } while ( !inner_success );

         /***  [outer]  End of the loop. ***/

     }

 terminate:
     S->fnorm = lm_enorm(m, fvec);
     if ( C->verbosity >= 2 )
         fprintf( msgfile, "lmmin outcome (%i) xnorm %g ftol %g xtol %g\n",
                  S->outcome, xnorm, C->ftol, C->xtol );
     if ( C->verbosity & 1 ) {
         fprintf( msgfile, "lmmin final " );
         lm_print_pars( nout, x, S->fnorm, msgfile );
     }
     if ( S->userbreak ) /* user-requested break */
         S->outcome = 11;

 cleanup:
     /***  Deallocate the workspace.  ***/
     /* free(NULL) is a no-op, so this is also safe after a failed malloc. */
     free(fvec);
     free(diag);
     free(qtf);
     free(fjac);
     free(wa1);
     free(wa2);
     free(wa3);
     free(wf);
     free(ipvt);

 } /*** lmmin. ***/


 /*****************************************************************************/

 /*  lm_lmpar (determine Levenberg-Marquardt parameter)                       */

 /*****************************************************************************/


 /* Determine the Levenberg-Marquardt parameter *par for the step bound delta
    and return the corresponding step in x (and diag[j]*x[j] in xdi).
    See the comment at the top of the body for the full contract. */
 void lm_lmpar(int n, double *r, int ldr, int *ipvt, double *diag,
               double *qtb, double delta, double *par, double *x,
               double *sdiag, double *aux, double *xdi)
 {
     /*     Given an m by n matrix a, an n by n nonsingular diagonal
      *     matrix d, an m-vector b, and a positive number delta,
      *     the problem is to determine a value for the parameter
      *     par such that if x solves the system
      *
      *          a*x = b  and  sqrt(par)*d*x = 0
      *
      *     in the least squares sense, and dxnorm is the euclidean
      *     norm of d*x, then either par=0 and (dxnorm-delta) <= 0.1*delta,
      *     or par>0 and abs(dxnorm-delta) <= 0.1*delta.
      *
      *     Using lm_qrsolv, this subroutine completes the solution of the problem
      *     if it is provided with the necessary information from the
      *     qr factorization, with column pivoting, of a. That is, if
      *     a*p = q*r, where p is a permutation matrix, q has orthogonal
      *     columns, and r is an upper triangular matrix with diagonal
      *     elements of nonincreasing magnitude, then lmpar expects
      *     the full upper triangle of r, the permutation matrix p,
      *     and the first n components of q^T*b. On output
      *     lmpar also provides an upper triangular matrix s such that
      *
      *          p^T*(a^T*a + par*d*d)*p = s^T*s.
      *
      *     s is employed within lmpar and may be of separate interest.
      *
      *     Only a few iterations are generally needed for convergence
      *     of the algorithm. If, however, the iteration limit (the loop
      *     stops when its counter reaches 10) is hit, then the output
      *     par will contain the best value obtained so far.
      *
      *     Parameters:
      *
      *      n is a positive integer input variable set to the order of r.
      *
      *      r is an n by n array, addressed here as r[j*ldr + i] for
      *        row i and column j. On input the full upper triangle
      *        must contain the full upper triangle of the matrix r.
      *        On OUTPUT the full upper triangle is unaltered, and the
      *        strict lower triangle contains the strict upper triangle
      *        (transposed) of the upper triangular matrix s.
      *
      *      ldr is a positive integer input variable not less than n
      *        which specifies the leading dimension of the array r.
      *
      *      ipvt is an integer input array of length n which defines the
      *        permutation matrix p such that a*p = q*r. Column j of p
      *        is column ipvt(j) of the identity matrix.
      *
      *      diag is an input array of length n which must contain the
      *        diagonal elements of the matrix d.
      *
      *      qtb is an input array of length n which must contain the first
      *        n elements of the vector (q transpose)*b.
      *
      *      delta is a positive input variable which specifies an upper
      *        bound on the euclidean norm of d*x.
      *
      *      par is a nonnegative variable. On input par contains an
      *        initial estimate of the Levenberg-Marquardt parameter.
      *        On OUTPUT par contains the final estimate.
      *
      *      x is an OUTPUT array of length n which contains the least
      *        squares solution of the system a*x = b, sqrt(par)*d*x = 0,
      *        for the output par.
      *
      *      sdiag is an array of length n needed as workspace; on OUTPUT
      *        it contains the diagonal elements of the upper triangular matrix s.
      *
      *      aux is a multi-purpose work array of length n.
      *
      *      xdi is a work array of length n. On OUTPUT: diag[j] * x[j].
      *
      */
     int i, iter, j, nsing;
     double dxnorm, fp, fp_old, gnorm, parc, parl, paru;
     double sum, temp;
     static double p1 = 0.1;

     /*** lmpar: compute and store in x the Gauss-Newton direction. If the
          Jacobian is rank-deficient, obtain a least squares solution. ***/

     /* nsing becomes the index of the first zero diagonal element of r
        (or stays n); the right-hand side is zeroed from there on. */
     nsing = n;
     for (j = 0; j < n; j++) {
         aux[j] = qtb[j];
         if (r[j * ldr + j] == 0 && nsing == n)
             nsing = j;
         if (nsing < n)
             aux[j] = 0;
     }
     /* back substitution with the leading nsing by nsing block of r */
     for (j = nsing - 1; j >= 0; j--) {
         aux[j] = aux[j] / r[j + ldr * j];
         temp = aux[j];
         for (i = 0; i < j; i++)
             aux[i] -= r[j * ldr + i] * temp;
     }

     /* undo the column permutation */
     for (j = 0; j < n; j++)
         x[ipvt[j]] = aux[j];

     /*** lmpar: initialize the iteration counter, evaluate the function at the
          origin, and test for acceptance of the Gauss-Newton direction. ***/

     for (j = 0; j < n; j++)
         xdi[j] = diag[j] * x[j];
     dxnorm = lm_enorm(n, xdi);
     fp = dxnorm - delta;
     if (fp <= p1 * delta) {
 #ifdef LMFIT_DEBUG_MESSAGES
         printf("debug lmpar nsing %d n %d, terminate (fp<p1*delta)\n",
                nsing, n);
 #endif
         /* the Gauss-Newton step is short enough: accept it with par = 0 */
         *par = 0;
         return;
     }

     /*** lmpar: if the Jacobian is not rank deficient, the Newton
          step provides a lower bound, parl, for the zero of
          the function. Otherwise set this bound to zero. ***/

     parl = 0;
     if (nsing >= n) {
         for (j = 0; j < n; j++)
             aux[j] = diag[ipvt[j]] * xdi[ipvt[j]] / dxnorm;

         /* forward substitution with the transpose of r */
         for (j = 0; j < n; j++) {
             sum = 0.;
             for (i = 0; i < j; i++)
                 sum += r[j * ldr + i] * aux[i];
             aux[j] = (aux[j] - sum) / r[j + ldr * j];
         }
         temp = lm_enorm(n, aux);
         parl = fp / delta / temp / temp;
     }

     /*** lmpar: calculate an upper bound, paru, for the zero of the function. ***/

     for (j = 0; j < n; j++) {
         sum = 0;
         for (i = 0; i <= j; i++)
             sum += r[j * ldr + i] * qtb[i];
         aux[j] = sum / diag[ipvt[j]];
     }
     gnorm = lm_enorm(n, aux);
     paru = gnorm / delta;
     if (paru == 0.)
         paru = LM_DWARF / MIN(delta, p1);

     /*** lmpar: if the input par lies outside of the interval (parl,paru),
          set par to the closer endpoint. ***/

     *par = MAX(*par, parl);
     *par = MIN(*par, paru);
     if (*par == 0.)
         *par = gnorm / dxnorm;

     /*** lmpar: iterate. ***/

     for (iter = 0; ; iter++) {

         /** evaluate the function at the current value of par. **/

         if (*par == 0.)
             *par = MAX(LM_DWARF, 0.001 * paru);
         temp = sqrt(*par);
         for (j = 0; j < n; j++)
             aux[j] = temp * diag[j];

         lm_qrsolv( n, r, ldr, ipvt, aux, qtb, x, sdiag, xdi );
         /* return values are r, x, sdiag */

         for (j = 0; j < n; j++)
             xdi[j] = diag[j] * x[j]; /* used as output */
         dxnorm = lm_enorm(n, xdi);
         fp_old = fp;
         fp = dxnorm - delta;

         /** if the function is small enough, accept the current value
             of par. Also test for the exceptional cases where parl
             is zero or the iteration limit has been reached. **/

         if (fabs(fp) <= p1 * delta
                 || (parl == 0. && fp <= fp_old && fp_old < 0.)
                 || iter == 10) {
 #ifdef LMFIT_DEBUG_MESSAGES
             printf("debug lmpar nsing %d iter %d "
                    "par %.4e [%.4e %.4e] delta %.4e fp %.4e\n",
                    nsing, iter, *par, parl, paru, delta, fp);
 #endif
             break; /* the only exit from the iteration. */
         }

         /** compute the Newton correction parc. **/

         for (j = 0; j < n; j++)
             aux[j] = diag[ipvt[j]] * xdi[ipvt[j]] / dxnorm;

         /* forward substitution using sdiag and the strict lower triangle
            of r, which lm_qrsolv is documented above to fill with s^T */
         for (j = 0; j < n; j++) {
             aux[j] = aux[j] / sdiag[j];
             for (i = j + 1; i < n; i++)
                 aux[i] -= r[j * ldr + i] * aux[j];
         }
         temp = lm_enorm(n, aux);
         parc = fp / delta / temp / temp;

         /** depending on the sign of the function, update parl or paru. **/

         if (fp > 0)
             parl = MAX(parl, *par);
         else if (fp < 0)
             paru = MIN(paru, *par);
         /* the case fp==0 is precluded by the break condition  */

         /** compute an improved estimate for par. **/

         *par = MAX(parl, *par + parc);

     }

 } /*** lm_lmpar. ***/


 /*****************************************************************************/

 /*  lm_qrfac (QR factorization, from lapack)                                 */

 /*****************************************************************************/


 void lm_qrfac(int m, int n, double *a, int *ipvt,
               double *rdiag, double *acnorm, double *wa)
 {
     /*
      *     QR factorization of the m by n matrix a by Householder
      *     transformations with column pivoting: the routine determines
      *     an orthogonal matrix q, a permutation matrix p, and an upper
      *     trapezoidal matrix r whose diagonal elements have
      *     nonincreasing magnitude, such that a*p = q*r. The Householder
      *     transformation for column k, k = 1,2,...,min(m,n), has the form
      *
      *          i - (1/u(k))*u*uT
      *
      *     where u has zeroes in the first k-1 positions.
      *
      *     Parameters:
      *
      *      m      number of rows of a (positive).
      *
      *      n      number of columns of a (positive).
      *
      *      a      m by n array; column j occupies a[j*m .. j*m+m-1].
      *             On input the matrix to be factored. On OUTPUT the strict
      *             upper trapezoidal part holds the strict upper trapezoidal
      *             part of r, and the lower trapezoidal part holds a
      *             factored form of q (the non-trivial elements of the
      *             u vectors described above).
      *
      *      ipvt   integer OUTPUT array of length n defining the
      *             permutation p with a*p = q*r: column j of p is column
      *             ipvt(j) of the identity matrix.
      *
      *      rdiag  OUTPUT array of length n: the diagonal elements of r.
      *
      *      acnorm OUTPUT array of length n: the norms of the columns of
      *             the input matrix a. If not needed, acnorm may coincide
      *             with rdiag.
      *
      *      wa     work array of length n.
      */
     int row, col, other, best, swapped, ncols;
     double colnorm, dot, scratch;
     double *pivot_col, *other_col;

     /*** qrfac: compute initial column norms and initialize several arrays. ***/

     for (col = 0; col < n; col++) {
         colnorm = lm_enorm(m, &a[col * m]);
         acnorm[col] = colnorm;
         rdiag[col] = colnorm;
         wa[col] = colnorm;
         ipvt[col] = col;
     }
 #ifdef LMFIT_DEBUG_MESSAGES
     printf("debug qrfac\n");
 #endif

     /*** qrfac: reduce a to r with Householder transformations. ***/

     ncols = (m <= n) ? m : n;
     for (col = 0; col < ncols; col++) {
         pivot_col = a + col * m;

         /** bring the column of largest norm into the pivot position. **/

         best = col;
         for (other = col + 1; other < n; other++) {
             if (rdiag[other] > rdiag[best])
                 best = other;
         }
         if (best != col) {
             other_col = a + best * m;
             for (row = 0; row < m; row++) {
                 scratch = pivot_col[row];
                 pivot_col[row] = other_col[row];
                 other_col[row] = scratch;
             }
             rdiag[best] = rdiag[col];
             wa[best] = wa[col];
             swapped = ipvt[col];
             ipvt[col] = ipvt[best];
             ipvt[best] = swapped;
         }

         /** compute the Householder transformation that reduces the
             pivot column to a multiple of the col-th unit vector. **/

         colnorm = lm_enorm(m - col, pivot_col + col);
         if (colnorm == 0.) {
             rdiag[col] = 0;
             continue;
         }

         if (pivot_col[col] < 0.)
             colnorm = -colnorm;
         for (row = col; row < m; row++)
             pivot_col[row] /= colnorm;
         pivot_col[col] += 1;

         /** apply the transformation to the remaining columns
             and update their norms. **/

         for (other = col + 1; other < n; other++) {
             other_col = a + other * m;

             dot = 0;
             for (row = col; row < m; row++)
                 dot += pivot_col[row] * other_col[row];

             scratch = dot / pivot_col[col];

             for (row = col; row < m; row++)
                 other_col[row] -= scratch * pivot_col[row];

             if (rdiag[other] == 0.)
                 continue;

             scratch = other_col[col] / rdiag[other];
             scratch = MAX(0., 1 - scratch * scratch);
             rdiag[other] *= sqrt(scratch);
             scratch = rdiag[other] / wa[other];
             /* recompute the norm from scratch once the running update
                has lost too much accuracy */
             if ( 0.05 * SQR(scratch) <= LM_MACHEP ) {
                 rdiag[other] = lm_enorm(m - col - 1, other_col + col + 1);
                 wa[other] = rdiag[other];
             }
         }

         rdiag[col] = -colnorm;
     }
 } /*** lm_qrfac. ***/


 /*****************************************************************************/

 /*  lm_qrsolv (linear least-squares)                                         */

 /*****************************************************************************/


 void lm_qrsolv(int n, double *r, int ldr, int *ipvt, double *diag,
                double *qtb, double *x, double *sdiag, double *wa)
 {
     /*
      *     Solves, in the least squares sense, the combined system
      *
      *          a*x = b  and  d*x = 0
      *
      *     for an m by n matrix a, an n by n diagonal matrix d and an
      *     m-vector b, starting from a column-pivoted qr factorization
      *     a*p = q*r that the caller has already computed (p is a
      *     permutation, q has orthogonal columns, r is upper triangular
      *     with diagonal elements of nonincreasing magnitude).
      *
      *     With x = p*z the problem is equivalent to
      *
      *          r*z = q^T*b,  p^T*d*p*z = 0.
      *
      *     The rows of d are eliminated one by one with Givens rotations.
      *     As a by-product an upper triangular matrix s is obtained with
      *
      *          p^T *(a^T *a + d*d)*p = s^T *s.
      *
      *     If the system is rank deficient, a least squares solution is
      *     returned.
      *
      *     Parameters
      *
      *      n      order of r (positive).
      *
      *      r      n by n array with leading dimension ldr. On input its
      *             full upper triangle holds r. On OUTPUT the upper
      *             triangle is unaltered and the strict lower triangle
      *             holds the strict upper triangle (transposed) of s.
      *
      *      ldr    leading dimension of r, not less than n.
      *
      *      ipvt   input array of length n describing p: column j of p
      *             is column ipvt(j) of the identity matrix.
      *
      *      diag   input array of length n, the diagonal elements of d.
      *
      *      qtb    input array of length n, the first n elements of
      *             (q transpose)*b.
      *
      *      x      OUTPUT array of length n, the least squares solution.
      *
      *      sdiag  OUTPUT array of length n, the diagonal elements of s.
      *
      *      wa     work array of length n.
      */
     int row, col, k, rank;
     double damp, carry, acc, mixed, ratio, rot_s, rot_c;
     double *pivot, *rk;

     /*** qrsolv: mirror the upper triangle of r into the lower one, which
          becomes the workspace for s; keep the diagonal of r in x and a
          working copy of q^T*b in wa. ***/

     for (col = 0; col < n; col++) {
         for (row = col; row < n; row++)
             r[col * ldr + row] = r[row * ldr + col];
         x[col] = r[col * ldr + col];
         wa[col] = qtb[col];
     }

     /*** qrsolv: eliminate d row by row using Givens rotations. ***/

     for (col = 0; col < n; col++) {

         /* the diagonal element of d for this row, located through p. */
         damp = diag[ipvt[col]];

         if (damp != 0.) {

             /* the row of d to eliminate: damp followed by zeros. */
             sdiag[col] = damp;
             for (k = col + 1; k < n; k++)
                 sdiag[k] = 0.;

             /* the rotations touch only one element of q^T*b beyond the
                first n; it starts out as zero. */
             carry = 0.;

             for (k = col; k < n; k++) {

                 /* nothing to rotate away in this position. */
                 if (sdiag[k] != 0.) {

                     pivot = &r[k + ldr * k];

                     /* rotation that annihilates sdiag[k] against the
                        diagonal element; the ratio is always formed with
                        the larger magnitude in the denominator. */
                     if (fabs(*pivot) < fabs(sdiag[k])) {
                         ratio = *pivot / sdiag[k];      /* cotangent */
                         rot_s = 1 / sqrt(1 + SQR(ratio));
                         rot_c = rot_s * ratio;
                     } else {
                         ratio = sdiag[k] / *pivot;      /* tangent */
                         rot_c = 1 / sqrt(1 + SQR(ratio));
                         rot_s = rot_c * ratio;
                     }

                     /* rotate the diagonal element and the matching
                        element of (q^T*b, 0). */
                     *pivot = rot_c * *pivot + rot_s * sdiag[k];
                     mixed = rot_c * wa[k] + rot_s * carry;
                     carry = -rot_s * wa[k] + rot_c * carry;
                     wa[k] = mixed;

                     /* carry the rotation through the rest of the row. */
                     rk = r + k * ldr;
                     for (row = k + 1; row < n; row++) {
                         mixed = rot_c * rk[row] + rot_s * sdiag[row];
                         sdiag[row] = -rot_s * rk[row] + rot_c * sdiag[row];
                         rk[row] = mixed;
                     }
                 }
             }
         }

         /* record the diagonal element of s and put the saved diagonal
            element of r back in place. */
         sdiag[col] = r[col * ldr + col];
         r[col * ldr + col] = x[col];
     }

     /*** qrsolv: the first zero on the diagonal of s marks the numerical
          rank; the components of z from there on are set to zero. ***/

     rank = 0;
     while (rank < n && sdiag[rank] != 0.)
         rank++;
     for (k = rank; k < n; k++)
         wa[k] = 0;

     /*** qrsolv: back substitution on the leading nonsingular block. ***/

     for (col = rank; col-- > 0; ) {
         acc = 0;
         for (row = col + 1; row < rank; row++)
             acc += r[col * ldr + row] * wa[row];
         wa[col] = (wa[col] - acc) / sdiag[col];
     }

     /*** qrsolv: undo the column permutation, x = p*z. ***/

     for (col = 0; col < n; col++)
         x[ipvt[col]] = wa[col];

 } /*** lm_qrsolv. ***/


 /*****************************************************************************/

 /*  lm_enorm (Euclidean norm)                                                */

 /*****************************************************************************/


 double lm_enorm(int n, const double *x)
 {
     /*     Given an n-vector x, this function calculates the
      *     euclidean norm of x.
      *
      *     The euclidean norm is computed by accumulating the sum of
      *     squares in three different sums:
      *
      *       s1  large components (>= LM_SQRT_GIANT / n), scaled by the
      *           largest of them (x1max);
      *       s2  intermediate components, summed unscaled;
      *       s3  small components (<= LM_SQRT_DWARF), scaled by the
      *           largest of them (x3max).
      *
      *     The scaling keeps the large and small sums free of overflow;
      *     non-destructive underflows are permitted. The unscaled sum of
      *     the intermediate components neither overflows nor underflows.
      *     The main restrictions on the two constants are that
      *     LM_SQRT_DWARF**2 not underflow and LM_SQRT_GIANT**2 not
      *     overflow.
      *
      *     Parameters
      *
      *      n is the number of elements of x to use. For n <= 0 the
      *        function returns 0 without reading x.
      *
      *      x is an input array of length n.
      *
      *     Returns the euclidean norm of x[0..n-1].
      */
     int i;
     double agiant, s1, s2, s3, xabs, x1max, x3max, temp;

     /* An empty vector has norm 0. Returning here also keeps the
        computation of agiant below from dividing by zero; callers may
        pass a computed length that turns out to be 0. */
     if (n <= 0)
         return 0;

     s1 = 0;
     s2 = 0;
     s3 = 0;
     x1max = 0;
     x3max = 0;
     agiant = LM_SQRT_GIANT / n;

     /** sum squares, sorting each component into one of the three sums. **/

     for (i = 0; i < n; i++) {
         xabs = fabs(x[i]);
         if (xabs > LM_SQRT_DWARF) {
             if ( xabs < agiant ) {
                 /* intermediate component. */
                 s2 += xabs * xabs;
             } else if ( xabs > x1max ) {
                 /* new largest component: rescale the sum to it. */
                 temp = x1max / xabs;
                 s1 = 1 + s1 * SQR(temp);
                 x1max = xabs;
             } else {
                 /* large component, not bigger than the current scale. */
                 temp = xabs / x1max;
                 s1 += SQR(temp);
             }
         } else if ( xabs > x3max ) {
             /* new largest small component: rescale the sum to it. */
             temp = x3max / xabs;
             s3 = 1 + s3 * SQR(temp);
             x3max = xabs;
         } else if (xabs != 0.) {
             /* small nonzero component; exact zeros contribute nothing. */
             temp = xabs / x3max;
             s3 += SQR(temp);
         }
     }

     /** combine the sums; the largest non-empty class sets the scale. **/

     if (s1 != 0) {
         return x1max * sqrt(s1 + (s2 / x1max) / x1max);
     } else if (s2 != 0) {
         if (s2 >= x3max)
             return sqrt(s2 * (1 + (x3max / s2) * (x3max * s3)));
         else
             return sqrt(x3max * ((s2 / x3max) + (x3max * s3)));
     } else {
         return x3max * sqrt(s3);
     }

 } /*** lm_enorm. ***/

lm_control_struct::epsilon
double epsilon
Step used to calculate the Jacobian.
Definition: lmstruct.h:59

lmmin.h
Declarations for Levenberg-Marquardt minimization.

lm_control_float
const lm_control_struct lm_control_float
Preset (and recommended) control parameter settings.
Definition: lmmin.c:125

lm_control_struct
Collection of input parameters for fit control.
Definition: lmstruct.h:33

lm_qrfac
void lm_qrfac(int m, int n, double *a, int *ipvt, double *rdiag, double *acnorm, double *wa)
[brief description]
Definition: lmmin.c:813

lm_control_struct::n_maxpri
int n_maxpri
Maximum parameters to print.
Definition: lmstruct.h:95

lm_enorm
double lm_enorm(int n, const double *x)
Refined calculation of Euclidean norm.
Definition: lmmin.c:1119

LM_SQRT_DWARF
#define LM_SQRT_DWARF
Definition: lmmin.c:103

LM_DWARF
#define LM_DWARF
Definition: lmmin.c:102

lm_control_struct::patience
int patience
Used to set the maximum number of function evaluations.
Definition: lmstruct.h:73

lm_infmsg
const char * lm_infmsg[]
Preset message texts.
Definition: lmmin.c:135

LM_SQRT_GIANT
#define LM_SQRT_GIANT
Definition: lmmin.c:104

lm_status_struct::userbreak
int userbreak
Set when function evaluation requests termination.
Definition: lmstruct.h:124

lm_control_double
const lm_control_struct lm_control_double
Preset (and recommended) control parameter settings.
Definition: lmmin.c:121

lm_status_struct
Collection of output parameters for status info.
Definition: lmstruct.h:106

lm_control_struct::stepbound
double stepbound
Used in determining the initial step bound.
Definition: lmstruct.h:68

lm_control_struct::verbosity
int verbosity
Controls the output verbosity.
Definition: lmstruct.h:90

SQR
#define SQR(x)
[brief description]
Definition: lmmin.c:42

lm_control_struct::xtol
double xtol
Relative error between last two approximations.
Definition: lmstruct.h:46

lm_shortmsg
const char * lm_shortmsg[]
Preset message texts.
Definition: lmmin.c:150

lm_control_struct::msgfile
FILE * msgfile
Progress messages will be written to this file.
Definition: lmstruct.h:82

lm_print_pars
void lm_print_pars(int nout, const double *par, double fnorm, FILE *fout)
Definition: lmmin.c:170

lm_control_struct::scale_diag
int scale_diag
If 1, the variables will be rescaled internally.
Definition: lmstruct.h:78

lm_lmpar
void lm_lmpar(int n, double *r, int ldr, int *ipvt, double *diag, double *qtb, double delta, double *par, double *x, double *sdiag, double *aux, double *xdi)
[brief description]
Definition: lmmin.c:586

lm_control_struct::gtol
double gtol
Orthogonality desired between fvec and its derivs.
Definition: lmstruct.h:53

lm_qrsolv
void lm_qrsolv(int n, double *r, int ldr, int *ipvt, double *diag, double *qtb, double *x, double *sdiag, double *wa)
[brief description]
Definition: lmmin.c:952

MAX
#define MAX(a, b)
[brief description]
Definition: lmmin.c:35

LM_MACHEP
#define LM_MACHEP
Definition: lmmin.c:101

lmmin
void lmmin(int n, double *x, int m, const void *data, void(*evaluate)(const double *par, int m_dat, const void *data,                                                                                                               double *fvec, int *userbreak), const lm_control_struct *C, lm_status_struct *S)
Levenberg-Marquardt minimization.
Definition: lmmin.c:183

MIN
#define MIN(a, b)
[brief description]
Definition: lmmin.c:28

lm_status_struct::outcome
int outcome
Status indicator.
Definition: lmstruct.h:120

lm_status_struct::nfev
int nfev
actual number of iterations.
Definition: lmstruct.h:114

lm_status_struct::fnorm
double fnorm
norm of the residue vector fvec.
Definition: lmstruct.h:110

lm_control_struct::ftol
double ftol
Relative error desired in the sum of squares.
Definition: lmstruct.h:40

LM_USERTOL
#define LM_USERTOL
Definition: lmmin.c:105