unsupported/Eigen/src/NonLinearOptimization/HybridNonLinearSolver.h - mirror - Git at Google


 template<typename FunctorType, typename Scalar=double>
 class HybridNonLinearSolver
 {
 public:
     HybridNonLinearSolver(FunctorType &_functor)
         : functor(_functor) { nfev=njev=iter = 0;  fnorm= 0.; }

     enum Status {
         Running = -1,
         ImproperInputParameters = 0,
         RelativeErrorTooSmall = 1,
         TooManyFunctionEvaluation = 2,
         TolTooSmall = 3,
         NotMakingProgressJacobian = 4,
         NotMakingProgressIterations = 5,
         UserAksed = 6
     };

     struct Parameters {
         Parameters()
             : factor(Scalar(100.))
             , maxfev(1000)
             , xtol(ei_sqrt(epsilon<Scalar>()))
             , nb_of_subdiagonals(-1)
             , nb_of_superdiagonals(-1)
             , epsfcn(Scalar(0.)) {}
         Scalar factor;
         int maxfev;   // maximum number of function evaluation
         Scalar xtol;
         int nb_of_subdiagonals;
         int nb_of_superdiagonals;
         Scalar epsfcn;
     };

     Status hybrj1(
             Matrix< Scalar, Dynamic, 1 >  &x,
             const Scalar tol = ei_sqrt(epsilon<Scalar>())
             );

     Status solveInit(
             Matrix< Scalar, Dynamic, 1 >  &x,
             const int mode=1
             );
     Status solveOneStep(
             Matrix< Scalar, Dynamic, 1 >  &x,
             const int mode=1
             );
     Status solve(
             Matrix< Scalar, Dynamic, 1 >  &x,
             const int mode=1
             );

     Status hybrd1(
             Matrix< Scalar, Dynamic, 1 >  &x,
             const Scalar tol = ei_sqrt(epsilon<Scalar>())
             );

     Status solveNumericalDiffInit(
             Matrix< Scalar, Dynamic, 1 >  &x,
             const int mode=1
             );
     Status solveNumericalDiffOneStep(
             Matrix< Scalar, Dynamic, 1 >  &x,
             const int mode=1
             );
     Status solveNumericalDiff(
             Matrix< Scalar, Dynamic, 1 >  &x,
             const int mode=1
             );

     void resetParameters(void) { parameters = Parameters(); }
     Parameters parameters;
     Matrix< Scalar, Dynamic, 1 >  fvec;
     Matrix< Scalar, Dynamic, Dynamic > fjac;
     Matrix< Scalar, Dynamic, 1 >  R;
     Matrix< Scalar, Dynamic, 1 >  qtf;
     Matrix< Scalar, Dynamic, 1 >  diag;
     int nfev;
     int njev;
     int iter;
     Scalar fnorm;
 private:
     FunctorType &functor;
     int n;
     Scalar sum;
     bool sing;
     Scalar temp;
     Scalar delta;
     bool jeval;
     int ncsuc;
     Scalar ratio;
     Scalar pnorm, xnorm, fnorm1;
     int nslow1, nslow2;
     int ncfail;
     Scalar actred, prered;
     Matrix< Scalar, Dynamic, 1 > wa1, wa2, wa3, wa4;
 };


 template<typename FunctorType, typename Scalar>
 typename HybridNonLinearSolver<FunctorType,Scalar>::Status
 HybridNonLinearSolver<FunctorType,Scalar>::hybrj1(
         Matrix< Scalar, Dynamic, 1 >  &x,
         const Scalar tol
         )
 {
     n = x.size();

     /* check the input parameters for errors. */
     if (n <= 0 || tol < 0.)
         return ImproperInputParameters;

     resetParameters();
     parameters.maxfev = 100*(n+1);
     parameters.xtol = tol;
     diag.setConstant(n, 1.);
     return solve(
         x,
         2
     );
 }

 template<typename FunctorType, typename Scalar>
 typename HybridNonLinearSolver<FunctorType,Scalar>::Status
 HybridNonLinearSolver<FunctorType,Scalar>::solveInit(
         Matrix< Scalar, Dynamic, 1 >  &x,
         const int mode
         )
 {
     n = x.size();

     wa1.resize(n); wa2.resize(n); wa3.resize(n); wa4.resize(n);
     fvec.resize(n);
     qtf.resize(n);
     R.resize( (n*(n+1))/2);
     fjac.resize(n, n);
     if (mode != 2)
         diag.resize(n);
     assert( (mode!=2 || diag.size()==n) || "When using mode==2, the caller must provide a valid 'diag'");

     /* Function Body */
     nfev = 0;
     njev = 0;

     /*     check the input parameters for errors. */

     if (n <= 0 || parameters.xtol < 0. || parameters.maxfev <= 0 || parameters.factor <= 0. )
         return ImproperInputParameters;
     if (mode == 2)
         for (int j = 0; j < n; ++j)
             if (diag[j] <= 0.)
                 return ImproperInputParameters;

     /*     evaluate the function at the starting point */
     /*     and calculate its norm. */

     nfev = 1;
     if ( functor(x, fvec) < 0)
         return UserAksed;
     fnorm = fvec.stableNorm();

     /*     initialize iteration counter and monitors. */

     iter = 1;
     ncsuc = 0;
     ncfail = 0;
     nslow1 = 0;
     nslow2 = 0;

     return Running;
 }

 template<typename FunctorType, typename Scalar>
 typename HybridNonLinearSolver<FunctorType,Scalar>::Status
 HybridNonLinearSolver<FunctorType,Scalar>::solveOneStep(
         Matrix< Scalar, Dynamic, 1 >  &x,
         const int mode
         )
 {
     int i, j, l, iwa[1];
     jeval = true;

     /* calculate the jacobian matrix. */

     if ( functor.df(x, fjac) < 0)
         return UserAksed;
     ++njev;

     /* compute the qr factorization of the jacobian. */

     ei_qrfac<Scalar>(n, n, fjac.data(), fjac.rows(), false, iwa, wa1.data(), wa2.data());


     if (iter == 1) {

         /* on the first iteration and if mode is 1, scale according */
         /* to the norms of the columns of the initial jacobian. */
         if (mode != 2)
             for (j = 0; j < n; ++j) {
                 diag[j] = wa2[j];
                 if (wa2[j] == 0.)
                     diag[j] = 1.;
             }

         /* on the first iteration, calculate the norm of the scaled x */
         /* and initialize the step bound delta. */
         wa3 = diag.cwise() * x;
         xnorm = wa3.stableNorm();
         delta = parameters.factor * xnorm;
         if (delta == 0.)
             delta = parameters.factor;
     }

     /* form (q transpose)*fvec and store in qtf. */

     qtf = fvec;
     for (j = 0; j < n; ++j)
         if (fjac(j,j) != 0.) {
             sum = 0.;
             for (i = j; i < n; ++i)
                 sum += fjac(i,j) * qtf[i];
             temp = -sum / fjac(j,j);
             for (i = j; i < n; ++i)
                 qtf[i] += fjac(i,j) * temp;
         }

     /* copy the triangular factor of the qr factorization into r. */

     sing = false;
     for (j = 0; j < n; ++j) {
         l = j;
         if (j)
             for (i = 0; i < j; ++i) {
                 R[l] = fjac(i,j);
                 l = l + n - i -1;
             }
         R[l] = wa1[j];
         if (wa1[j] == 0.)
             sing = true;
     }

     /* accumulate the orthogonal factor in fjac. */

     ei_qform<Scalar>(n, n, fjac.data(), fjac.rows(), wa1.data());

     /* rescale if necessary. */

     /* Computing MAX */
     if (mode != 2)
         diag = diag.cwise().max(wa2);

     /* beginning of the inner loop. */

     while (true) {

         /* determine the direction p. */

         ei_dogleg<Scalar>(R, diag, qtf, delta, wa1);

         /* store the direction p and x + p. calculate the norm of p. */

         wa1 = -wa1;
         wa2 = x + wa1;
         wa3 = diag.cwise() * wa1;
         pnorm = wa3.stableNorm();

         /* on the first iteration, adjust the initial step bound. */

         if (iter == 1)
             delta = std::min(delta,pnorm);

         /* evaluate the function at x + p and calculate its norm. */

         if ( functor(wa2, wa4) < 0)
             return UserAksed;
         ++nfev;
         fnorm1 = wa4.stableNorm();

         /* compute the scaled actual reduction. */

         actred = -1.;
         if (fnorm1 < fnorm) /* Computing 2nd power */
             actred = 1. - ei_abs2(fnorm1 / fnorm);

         /* compute the scaled predicted reduction. */

         l = 0;
         for (i = 0; i < n; ++i) {
             sum = 0.;
             for (j = i; j < n; ++j) {
                 sum += R[l] * wa1[j];
                 ++l;
             }
             wa3[i] = qtf[i] + sum;
         }
         temp = wa3.stableNorm();
         prered = 0.;
         if (temp < fnorm) /* Computing 2nd power */
             prered = 1. - ei_abs2(temp / fnorm);

         /* compute the ratio of the actual to the predicted */
         /* reduction. */

         ratio = 0.;
         if (prered > 0.)
             ratio = actred / prered;

         /* update the step bound. */

         if (ratio < Scalar(.1)) {
             ncsuc = 0;
             ++ncfail;
             delta = Scalar(.5) * delta;
         } else {
             ncfail = 0;
             ++ncsuc;
             if (ratio >= Scalar(.5) || ncsuc > 1) /* Computing MAX */
                 delta = std::max(delta, pnorm / Scalar(.5));
             if (ei_abs(ratio - 1.) <= Scalar(.1)) {
                 delta = pnorm / Scalar(.5);
             }
         }

         /* test for successful iteration. */

         if (ratio >= Scalar(1e-4)) {
             /* successful iteration. update x, fvec, and their norms. */
             x = wa2;
             wa2 = diag.cwise() * x;
             fvec = wa4;
             xnorm = wa2.stableNorm();
             fnorm = fnorm1;
             ++iter;
         }

         /* determine the progress of the iteration. */

         ++nslow1;
         if (actred >= Scalar(.001))
             nslow1 = 0;
         if (jeval)
             ++nslow2;
         if (actred >= Scalar(.1))
             nslow2 = 0;

         /* test for convergence. */

         if (delta <= parameters.xtol * xnorm || fnorm == 0.)
             return RelativeErrorTooSmall;

         /* tests for termination and stringent tolerances. */

         if (nfev >= parameters.maxfev)
             return TooManyFunctionEvaluation;
         if (Scalar(.1) * std::max(Scalar(.1) * delta, pnorm) <= epsilon<Scalar>() * xnorm)
             return TolTooSmall;
         if (nslow2 == 5)
             return NotMakingProgressJacobian;
         if (nslow1 == 10)
             return NotMakingProgressIterations;

         /* criterion for recalculating jacobian. */

         if (ncfail == 2)
             break; // leave inner loop and go for the next outer loop iteration

         /* calculate the rank one modification to the jacobian */
         /* and update qtf if necessary. */

         for (j = 0; j < n; ++j) {
             sum = wa4.dot(fjac.col(j));
             wa2[j] = (sum - wa3[j]) / pnorm;
             wa1[j] = diag[j] * (diag[j] * wa1[j] / pnorm);
             if (ratio >= Scalar(1e-4))
                 qtf[j] = sum;
         }

         /* compute the qr factorization of the updated jacobian. */

         ei_r1updt<Scalar>(n, n, R.data(), R.size(), wa1.data(), wa2.data(), wa3.data(), &sing);
         ei_r1mpyq<Scalar>(n, n, fjac.data(), fjac.rows(), wa2.data(), wa3.data());
         ei_r1mpyq<Scalar>(1, n, qtf.data(), 1, wa2.data(), wa3.data());

         /* end of the inner loop. */

         jeval = false;
     }
     /* end of the outer loop. */

     return Running;
 }


 template<typename FunctorType, typename Scalar>
 typename HybridNonLinearSolver<FunctorType,Scalar>::Status
 HybridNonLinearSolver<FunctorType,Scalar>::solve(
         Matrix< Scalar, Dynamic, 1 >  &x,
         const int mode
         )
 {
     Status status = solveInit(x, mode);
     while (status==Running)
         status = solveOneStep(x, mode);
     return status;
 }


 template<typename FunctorType, typename Scalar>
 typename HybridNonLinearSolver<FunctorType,Scalar>::Status
 HybridNonLinearSolver<FunctorType,Scalar>::hybrd1(
         Matrix< Scalar, Dynamic, 1 >  &x,
         const Scalar tol
         )
 {
     n = x.size();

     /* check the input parameters for errors. */
     if (n <= 0 || tol < 0.)
         return ImproperInputParameters;

     resetParameters();
     parameters.maxfev = 200*(n+1);
     parameters.xtol = tol;

     diag.setConstant(n, 1.);
     return solveNumericalDiff(
         x,
         2
     );
 }

 template<typename FunctorType, typename Scalar>
 typename HybridNonLinearSolver<FunctorType,Scalar>::Status
 HybridNonLinearSolver<FunctorType,Scalar>::solveNumericalDiffInit(
         Matrix< Scalar, Dynamic, 1 >  &x,
         const int mode
         )
 {
     n = x.size();

     if (parameters.nb_of_subdiagonals<0) parameters.nb_of_subdiagonals= n-1;
     if (parameters.nb_of_superdiagonals<0) parameters.nb_of_superdiagonals= n-1;

     wa1.resize(n); wa2.resize(n); wa3.resize(n); wa4.resize(n);
     qtf.resize(n);
     R.resize( (n*(n+1))/2);
     fjac.resize(n, n);
     fvec.resize(n);
     if (mode != 2)
         diag.resize(n);
     assert( (mode!=2 || diag.size()==n) || "When using mode==2, the caller must provide a valid 'diag'");


     /* Function Body */

     nfev = 0;
     njev = 0;

     /*     check the input parameters for errors. */

     if (n <= 0 || parameters.xtol < 0. || parameters.maxfev <= 0 || parameters.nb_of_subdiagonals< 0 || parameters.nb_of_superdiagonals< 0 || parameters.factor <= 0. )
         return ImproperInputParameters;
     if (mode == 2)
         for (int j = 0; j < n; ++j)
             if (diag[j] <= 0.)
                 return ImproperInputParameters;

     /*     evaluate the function at the starting point */
     /*     and calculate its norm. */

     nfev = 1;
     if ( functor(x, fvec) < 0)
         return UserAksed;
     fnorm = fvec.stableNorm();

     /*     initialize iteration counter and monitors. */

     iter = 1;
     ncsuc = 0;
     ncfail = 0;
     nslow1 = 0;
     nslow2 = 0;

     return Running;
 }

 template<typename FunctorType, typename Scalar>
 typename HybridNonLinearSolver<FunctorType,Scalar>::Status
 HybridNonLinearSolver<FunctorType,Scalar>::solveNumericalDiffOneStep(
         Matrix< Scalar, Dynamic, 1 >  &x,
         const int mode
         )
 {
     int i, j, l, iwa[1];
     jeval = true;
     if (parameters.nb_of_subdiagonals<0) parameters.nb_of_subdiagonals= n-1;
     if (parameters.nb_of_superdiagonals<0) parameters.nb_of_superdiagonals= n-1;

     /* calculate the jacobian matrix. */

     if (ei_fdjac1(functor, x, fvec, fjac, parameters.nb_of_subdiagonals, parameters.nb_of_superdiagonals, parameters.epsfcn) <0)
         return UserAksed;
     nfev += std::min(parameters.nb_of_subdiagonals+parameters.nb_of_superdiagonals+ 1, n);

     /* compute the qr factorization of the jacobian. */

     ei_qrfac<Scalar>(n, n, fjac.data(), fjac.rows(), false, iwa, wa1.data(), wa2.data());

     /* on the first iteration and if mode is 1, scale according */
     /* to the norms of the columns of the initial jacobian. */

     if (iter == 1) {
         if (mode != 2)
             for (j = 0; j < n; ++j) {
                 diag[j] = wa2[j];
                 if (wa2[j] == 0.)
                     diag[j] = 1.;
             }

         /* on the first iteration, calculate the norm of the scaled x */
         /* and initialize the step bound delta. */

         wa3 = diag.cwise() * x;
         xnorm = wa3.stableNorm();
         delta = parameters.factor * xnorm;
         if (delta == 0.)
             delta = parameters.factor;
     }

     /* form (q transpose)*fvec and store in qtf. */

     qtf = fvec;
     for (j = 0; j < n; ++j)
         if (fjac(j,j) != 0.) {
             sum = 0.;
             for (i = j; i < n; ++i)
                 sum += fjac(i,j) * qtf[i];
             temp = -sum / fjac(j,j);
             for (i = j; i < n; ++i)
                 qtf[i] += fjac(i,j) * temp;
         }

     /* copy the triangular factor of the qr factorization into r. */

     sing = false;
     for (j = 0; j < n; ++j) {
         l = j;
         if (j)
             for (i = 0; i < j; ++i) {
                 R[l] = fjac(i,j);
                 l = l + n - i -1;
             }
         R[l] = wa1[j];
         if (wa1[j] == 0.)
             sing = true;
     }

     /* accumulate the orthogonal factor in fjac. */

     ei_qform<Scalar>(n, n, fjac.data(), fjac.rows(), wa1.data());

     /* rescale if necessary. */

     /* Computing MAX */
     if (mode != 2)
         diag = diag.cwise().max(wa2);

     /* beginning of the inner loop. */

     while (true) {

         /* determine the direction p. */

         ei_dogleg<Scalar>(R, diag, qtf, delta, wa1);

         /* store the direction p and x + p. calculate the norm of p. */

         wa1 = -wa1;
         wa2 = x + wa1;
         wa3 = diag.cwise() * wa1;
         pnorm = wa3.stableNorm();

         /* on the first iteration, adjust the initial step bound. */

         if (iter == 1)
             delta = std::min(delta,pnorm);

         /* evaluate the function at x + p and calculate its norm. */

         if ( functor(wa2, wa4) < 0)
             return UserAksed;
         ++nfev;
         fnorm1 = wa4.stableNorm();

         /* compute the scaled actual reduction. */

         actred = -1.;
         if (fnorm1 < fnorm) /* Computing 2nd power */
             actred = 1. - ei_abs2(fnorm1 / fnorm);

         /* compute the scaled predicted reduction. */

         l = 0;
         for (i = 0; i < n; ++i) {
             sum = 0.;
             for (j = i; j < n; ++j) {
                 sum += R[l] * wa1[j];
                 ++l;
             }
             wa3[i] = qtf[i] + sum;
         }
         temp = wa3.stableNorm();
         prered = 0.;
         if (temp < fnorm) /* Computing 2nd power */
             prered = 1. - ei_abs2(temp / fnorm);

         /* compute the ratio of the actual to the predicted */
         /* reduction. */

         ratio = 0.;
         if (prered > 0.)
             ratio = actred / prered;

         /* update the step bound. */

         if (ratio < Scalar(.1)) {
             ncsuc = 0;
             ++ncfail;
             delta = Scalar(.5) * delta;
         } else {
             ncfail = 0;
             ++ncsuc;
             if (ratio >= Scalar(.5) || ncsuc > 1) /* Computing MAX */
                 delta = std::max(delta, pnorm / Scalar(.5));
             if (ei_abs(ratio - 1.) <= Scalar(.1)) {
                 delta = pnorm / Scalar(.5);
             }
         }

         /* test for successful iteration. */

         if (ratio >= Scalar(1e-4)) {
             /* successful iteration. update x, fvec, and their norms. */
             x = wa2;
             wa2 = diag.cwise() * x;
             fvec = wa4;
             xnorm = wa2.stableNorm();
             fnorm = fnorm1;
             ++iter;
         }

         /* determine the progress of the iteration. */

         ++nslow1;
         if (actred >= Scalar(.001))
             nslow1 = 0;
         if (jeval)
             ++nslow2;
         if (actred >= Scalar(.1))
             nslow2 = 0;

         /* test for convergence. */

         if (delta <= parameters.xtol * xnorm || fnorm == 0.)
             return RelativeErrorTooSmall;

         /* tests for termination and stringent tolerances. */

         if (nfev >= parameters.maxfev)
             return TooManyFunctionEvaluation;
         if (Scalar(.1) * std::max(Scalar(.1) * delta, pnorm) <= epsilon<Scalar>() * xnorm)
             return TolTooSmall;
         if (nslow2 == 5)
             return NotMakingProgressJacobian;
         if (nslow1 == 10)
             return NotMakingProgressIterations;

         /* criterion for recalculating jacobian approximation */
         /* by forward differences. */

         if (ncfail == 2)
             break; // leave inner loop and go for the next outer loop iteration

         /* calculate the rank one modification to the jacobian */
         /* and update qtf if necessary. */

         for (j = 0; j < n; ++j) {
             sum = wa4.dot(fjac.col(j));
             wa2[j] = (sum - wa3[j]) / pnorm;
             wa1[j] = diag[j] * (diag[j] * wa1[j] / pnorm);
             if (ratio >= Scalar(1e-4))
                 qtf[j] = sum;
         }

         /* compute the qr factorization of the updated jacobian. */

         ei_r1updt<Scalar>(n, n, R.data(), R.size(), wa1.data(), wa2.data(), wa3.data(), &sing);
         ei_r1mpyq<Scalar>(n, n, fjac.data(), fjac.rows(), wa2.data(), wa3.data());
         ei_r1mpyq<Scalar>(1, n, qtf.data(), 1, wa2.data(), wa3.data());

         /* end of the inner loop. */

         jeval = false;
     }
     /* end of the outer loop. */

     return Running;
 }

 template<typename FunctorType, typename Scalar>
 typename HybridNonLinearSolver<FunctorType,Scalar>::Status
 HybridNonLinearSolver<FunctorType,Scalar>::solveNumericalDiff(
         Matrix< Scalar, Dynamic, 1 >  &x,
         const int mode
         )
 {
     Status status = solveNumericalDiffInit(x, mode);
     while (status==Running)
         status = solveNumericalDiffOneStep(x, mode);
     return status;
 }

	template<typename FunctorType, typename Scalar=double>
	class HybridNonLinearSolver
	{
	public:
	HybridNonLinearSolver(FunctorType &_functor)
	: functor(_functor) { nfev=njev=iter = 0; fnorm= 0.; }

	enum Status {
	Running = -1,
	ImproperInputParameters = 0,
	RelativeErrorTooSmall = 1,
	TooManyFunctionEvaluation = 2,
	TolTooSmall = 3,
	NotMakingProgressJacobian = 4,
	NotMakingProgressIterations = 5,
	UserAksed = 6
	};

	struct Parameters {
	Parameters()
	: factor(Scalar(100.))
	, maxfev(1000)
	, xtol(ei_sqrt(epsilon<Scalar>()))
	, nb_of_subdiagonals(-1)
	, nb_of_superdiagonals(-1)
	, epsfcn(Scalar(0.)) {}
	Scalar factor;
	int maxfev; // maximum number of function evaluation
	Scalar xtol;
	int nb_of_subdiagonals;
	int nb_of_superdiagonals;
	Scalar epsfcn;
	};

	Status hybrj1(
	Matrix< Scalar, Dynamic, 1 > &x,
	const Scalar tol = ei_sqrt(epsilon<Scalar>())
	);

	Status solveInit(
	Matrix< Scalar, Dynamic, 1 > &x,
	const int mode=1
	);
	Status solveOneStep(
	Matrix< Scalar, Dynamic, 1 > &x,
	const int mode=1
	);
	Status solve(
	Matrix< Scalar, Dynamic, 1 > &x,
	const int mode=1
	);

	Status hybrd1(
	Matrix< Scalar, Dynamic, 1 > &x,
	const Scalar tol = ei_sqrt(epsilon<Scalar>())
	);

	Status solveNumericalDiffInit(
	Matrix< Scalar, Dynamic, 1 > &x,
	const int mode=1
	);
	Status solveNumericalDiffOneStep(
	Matrix< Scalar, Dynamic, 1 > &x,
	const int mode=1
	);
	Status solveNumericalDiff(
	Matrix< Scalar, Dynamic, 1 > &x,
	const int mode=1
	);

	void resetParameters(void) { parameters = Parameters(); }
	Parameters parameters;
	Matrix< Scalar, Dynamic, 1 > fvec;
	Matrix< Scalar, Dynamic, Dynamic > fjac;
	Matrix< Scalar, Dynamic, 1 > R;
	Matrix< Scalar, Dynamic, 1 > qtf;
	Matrix< Scalar, Dynamic, 1 > diag;
	int nfev;
	int njev;
	int iter;
	Scalar fnorm;
	private:
	FunctorType &functor;
	int n;
	Scalar sum;
	bool sing;
	Scalar temp;
	Scalar delta;
	bool jeval;
	int ncsuc;
	Scalar ratio;
	Scalar pnorm, xnorm, fnorm1;
	int nslow1, nslow2;
	int ncfail;
	Scalar actred, prered;
	Matrix< Scalar, Dynamic, 1 > wa1, wa2, wa3, wa4;
	};



	template<typename FunctorType, typename Scalar>
	typename HybridNonLinearSolver<FunctorType,Scalar>::Status
	HybridNonLinearSolver<FunctorType,Scalar>::hybrj1(
	Matrix< Scalar, Dynamic, 1 > &x,
	const Scalar tol
	)
	{
	n = x.size();

	/* check the input parameters for errors. */
	if (n <= 0 \|\| tol < 0.)
	return ImproperInputParameters;

	resetParameters();
	parameters.maxfev = 100*(n+1);
	parameters.xtol = tol;
	diag.setConstant(n, 1.);
	return solve(
	x,
	2
	);
	}

	template<typename FunctorType, typename Scalar>
	typename HybridNonLinearSolver<FunctorType,Scalar>::Status
	HybridNonLinearSolver<FunctorType,Scalar>::solveInit(
	Matrix< Scalar, Dynamic, 1 > &x,
	const int mode
	)
	{
	n = x.size();

	wa1.resize(n); wa2.resize(n); wa3.resize(n); wa4.resize(n);
	fvec.resize(n);
	qtf.resize(n);
	R.resize( (n*(n+1))/2);
	fjac.resize(n, n);
	if (mode != 2)
	diag.resize(n);
	assert( (mode!=2 \|\| diag.size()==n) \|\| "When using mode==2, the caller must provide a valid 'diag'");

	/* Function Body */
	nfev = 0;
	njev = 0;

	/* check the input parameters for errors. */

	if (n <= 0 \|\| parameters.xtol < 0. \|\| parameters.maxfev <= 0 \|\| parameters.factor <= 0. )
	return ImproperInputParameters;
	if (mode == 2)
	for (int j = 0; j < n; ++j)
	if (diag[j] <= 0.)
	return ImproperInputParameters;

	/* evaluate the function at the starting point */
	/* and calculate its norm. */

	nfev = 1;
	if ( functor(x, fvec) < 0)
	return UserAksed;
	fnorm = fvec.stableNorm();

	/* initialize iteration counter and monitors. */

	iter = 1;
	ncsuc = 0;
	ncfail = 0;
	nslow1 = 0;
	nslow2 = 0;

	return Running;
	}

	template<typename FunctorType, typename Scalar>
	typename HybridNonLinearSolver<FunctorType,Scalar>::Status
	HybridNonLinearSolver<FunctorType,Scalar>::solveOneStep(
	Matrix< Scalar, Dynamic, 1 > &x,
	const int mode
	)
	{
	int i, j, l, iwa[1];
	jeval = true;

	/* calculate the jacobian matrix. */

	if ( functor.df(x, fjac) < 0)
	return UserAksed;
	++njev;

	/* compute the qr factorization of the jacobian. */

	ei_qrfac<Scalar>(n, n, fjac.data(), fjac.rows(), false, iwa, wa1.data(), wa2.data());


	if (iter == 1) {

	/* on the first iteration and if mode is 1, scale according */
	/* to the norms of the columns of the initial jacobian. */
	if (mode != 2)
	for (j = 0; j < n; ++j) {
	diag[j] = wa2[j];
	if (wa2[j] == 0.)
	diag[j] = 1.;
	}

	/* on the first iteration, calculate the norm of the scaled x */
	/* and initialize the step bound delta. */
	wa3 = diag.cwise() * x;
	xnorm = wa3.stableNorm();
	delta = parameters.factor * xnorm;
	if (delta == 0.)
	delta = parameters.factor;
	}

	/* form (q transpose)fvec and store in qtf. /

	qtf = fvec;
	for (j = 0; j < n; ++j)
	if (fjac(j,j) != 0.) {
	sum = 0.;
	for (i = j; i < n; ++i)
	sum += fjac(i,j) * qtf[i];
	temp = -sum / fjac(j,j);
	for (i = j; i < n; ++i)
	qtf[i] += fjac(i,j) * temp;
	}

	/* copy the triangular factor of the qr factorization into r. */

	sing = false;
	for (j = 0; j < n; ++j) {
	l = j;
	if (j)
	for (i = 0; i < j; ++i) {
	R[l] = fjac(i,j);
	l = l + n - i -1;
	}
	R[l] = wa1[j];
	if (wa1[j] == 0.)
	sing = true;
	}

	/* accumulate the orthogonal factor in fjac. */

	ei_qform<Scalar>(n, n, fjac.data(), fjac.rows(), wa1.data());

	/* rescale if necessary. */

	/* Computing MAX */
	if (mode != 2)
	diag = diag.cwise().max(wa2);

	/* beginning of the inner loop. */

	while (true) {

	/* determine the direction p. */

	ei_dogleg<Scalar>(R, diag, qtf, delta, wa1);

	/* store the direction p and x + p. calculate the norm of p. */

	wa1 = -wa1;
	wa2 = x + wa1;
	wa3 = diag.cwise() * wa1;
	pnorm = wa3.stableNorm();

	/* on the first iteration, adjust the initial step bound. */

	if (iter == 1)
	delta = std::min(delta,pnorm);

	/* evaluate the function at x + p and calculate its norm. */

	if ( functor(wa2, wa4) < 0)
	return UserAksed;
	++nfev;
	fnorm1 = wa4.stableNorm();

	/* compute the scaled actual reduction. */

	actred = -1.;
	if (fnorm1 < fnorm) /* Computing 2nd power */
	actred = 1. - ei_abs2(fnorm1 / fnorm);

	/* compute the scaled predicted reduction. */

	l = 0;
	for (i = 0; i < n; ++i) {
	sum = 0.;
	for (j = i; j < n; ++j) {
	sum += R[l] * wa1[j];
	++l;
	}
	wa3[i] = qtf[i] + sum;
	}
	temp = wa3.stableNorm();
	prered = 0.;
	if (temp < fnorm) /* Computing 2nd power */
	prered = 1. - ei_abs2(temp / fnorm);

	/* compute the ratio of the actual to the predicted */
	/* reduction. */

	ratio = 0.;
	if (prered > 0.)
	ratio = actred / prered;

	/* update the step bound. */

	if (ratio < Scalar(.1)) {
	ncsuc = 0;
	++ncfail;
	delta = Scalar(.5) * delta;
	} else {
	ncfail = 0;
	++ncsuc;
	if (ratio >= Scalar(.5) \|\| ncsuc > 1) /* Computing MAX */
	delta = std::max(delta, pnorm / Scalar(.5));
	if (ei_abs(ratio - 1.) <= Scalar(.1)) {
	delta = pnorm / Scalar(.5);
	}
	}

	/* test for successful iteration. */

	if (ratio >= Scalar(1e-4)) {
	/* successful iteration. update x, fvec, and their norms. */
	x = wa2;
	wa2 = diag.cwise() * x;
	fvec = wa4;
	xnorm = wa2.stableNorm();
	fnorm = fnorm1;
	++iter;
	}

	/* determine the progress of the iteration. */

	++nslow1;
	if (actred >= Scalar(.001))
	nslow1 = 0;
	if (jeval)
	++nslow2;
	if (actred >= Scalar(.1))
	nslow2 = 0;

	/* test for convergence. */

	if (delta <= parameters.xtol * xnorm \|\| fnorm == 0.)
	return RelativeErrorTooSmall;

	/* tests for termination and stringent tolerances. */

	if (nfev >= parameters.maxfev)
	return TooManyFunctionEvaluation;
	if (Scalar(.1) * std::max(Scalar(.1) * delta, pnorm) <= epsilon<Scalar>() * xnorm)
	return TolTooSmall;
	if (nslow2 == 5)
	return NotMakingProgressJacobian;
	if (nslow1 == 10)
	return NotMakingProgressIterations;

	/* criterion for recalculating jacobian. */

	if (ncfail == 2)
	break; // leave inner loop and go for the next outer loop iteration

	/* calculate the rank one modification to the jacobian */
	/* and update qtf if necessary. */

	for (j = 0; j < n; ++j) {
	sum = wa4.dot(fjac.col(j));
	wa2[j] = (sum - wa3[j]) / pnorm;
	wa1[j] = diag[j] * (diag[j] * wa1[j] / pnorm);
	if (ratio >= Scalar(1e-4))
	qtf[j] = sum;
	}

	/* compute the qr factorization of the updated jacobian. */

	ei_r1updt<Scalar>(n, n, R.data(), R.size(), wa1.data(), wa2.data(), wa3.data(), &sing);
	ei_r1mpyq<Scalar>(n, n, fjac.data(), fjac.rows(), wa2.data(), wa3.data());
	ei_r1mpyq<Scalar>(1, n, qtf.data(), 1, wa2.data(), wa3.data());

	/* end of the inner loop. */

	jeval = false;
	}
	/* end of the outer loop. */

	return Running;
	}


	template<typename FunctorType, typename Scalar>
	typename HybridNonLinearSolver<FunctorType,Scalar>::Status
	HybridNonLinearSolver<FunctorType,Scalar>::solve(
	Matrix< Scalar, Dynamic, 1 > &x,
	const int mode
	)
	{
	Status status = solveInit(x, mode);
	while (status==Running)
	status = solveOneStep(x, mode);
	return status;
	}



	template<typename FunctorType, typename Scalar>
	typename HybridNonLinearSolver<FunctorType,Scalar>::Status
	HybridNonLinearSolver<FunctorType,Scalar>::hybrd1(
	Matrix< Scalar, Dynamic, 1 > &x,
	const Scalar tol
	)
	{
	n = x.size();

	/* check the input parameters for errors. */
	if (n <= 0 \|\| tol < 0.)
	return ImproperInputParameters;

	resetParameters();
	parameters.maxfev = 200*(n+1);
	parameters.xtol = tol;

	diag.setConstant(n, 1.);
	return solveNumericalDiff(
	x,
	2
	);
	}

	template<typename FunctorType, typename Scalar>
	typename HybridNonLinearSolver<FunctorType,Scalar>::Status
	HybridNonLinearSolver<FunctorType,Scalar>::solveNumericalDiffInit(
	Matrix< Scalar, Dynamic, 1 > &x,
	const int mode
	)
	{
	n = x.size();

	if (parameters.nb_of_subdiagonals<0) parameters.nb_of_subdiagonals= n-1;
	if (parameters.nb_of_superdiagonals<0) parameters.nb_of_superdiagonals= n-1;

	wa1.resize(n); wa2.resize(n); wa3.resize(n); wa4.resize(n);
	qtf.resize(n);
	R.resize( (n*(n+1))/2);
	fjac.resize(n, n);
	fvec.resize(n);
	if (mode != 2)
	diag.resize(n);
	assert( (mode!=2 \|\| diag.size()==n) \|\| "When using mode==2, the caller must provide a valid 'diag'");


	/* Function Body */

	nfev = 0;
	njev = 0;

	/* check the input parameters for errors. */

	if (n <= 0 \|\| parameters.xtol < 0. \|\| parameters.maxfev <= 0 \|\| parameters.nb_of_subdiagonals< 0 \|\| parameters.nb_of_superdiagonals< 0 \|\| parameters.factor <= 0. )
	return ImproperInputParameters;
	if (mode == 2)
	for (int j = 0; j < n; ++j)
	if (diag[j] <= 0.)
	return ImproperInputParameters;

	/* evaluate the function at the starting point */
	/* and calculate its norm. */

	nfev = 1;
	if ( functor(x, fvec) < 0)
	return UserAksed;
	fnorm = fvec.stableNorm();

	/* initialize iteration counter and monitors. */

	iter = 1;
	ncsuc = 0;
	ncfail = 0;
	nslow1 = 0;
	nslow2 = 0;

	return Running;
	}

	template<typename FunctorType, typename Scalar>
	typename HybridNonLinearSolver<FunctorType,Scalar>::Status
	HybridNonLinearSolver<FunctorType,Scalar>::solveNumericalDiffOneStep(
	Matrix< Scalar, Dynamic, 1 > &x,
	const int mode
	)
	{
	int i, j, l, iwa[1];
	jeval = true;
	if (parameters.nb_of_subdiagonals<0) parameters.nb_of_subdiagonals= n-1;
	if (parameters.nb_of_superdiagonals<0) parameters.nb_of_superdiagonals= n-1;

	/* calculate the jacobian matrix. */

	if (ei_fdjac1(functor, x, fvec, fjac, parameters.nb_of_subdiagonals, parameters.nb_of_superdiagonals, parameters.epsfcn) <0)
	return UserAksed;
	nfev += std::min(parameters.nb_of_subdiagonals+parameters.nb_of_superdiagonals+ 1, n);

	/* compute the qr factorization of the jacobian. */

	ei_qrfac<Scalar>(n, n, fjac.data(), fjac.rows(), false, iwa, wa1.data(), wa2.data());

	/* on the first iteration and if mode is 1, scale according */
	/* to the norms of the columns of the initial jacobian. */

	if (iter == 1) {
	if (mode != 2)
	for (j = 0; j < n; ++j) {
	diag[j] = wa2[j];
	if (wa2[j] == 0.)
	diag[j] = 1.;
	}

	/* on the first iteration, calculate the norm of the scaled x */
	/* and initialize the step bound delta. */

	wa3 = diag.cwise() * x;
	xnorm = wa3.stableNorm();
	delta = parameters.factor * xnorm;
	if (delta == 0.)
	delta = parameters.factor;
	}

	/* form (q transpose)fvec and store in qtf. /

	qtf = fvec;
	for (j = 0; j < n; ++j)
	if (fjac(j,j) != 0.) {
	sum = 0.;
	for (i = j; i < n; ++i)
	sum += fjac(i,j) * qtf[i];
	temp = -sum / fjac(j,j);
	for (i = j; i < n; ++i)
	qtf[i] += fjac(i,j) * temp;
	}

	/* copy the triangular factor of the qr factorization into r. */

	sing = false;
	for (j = 0; j < n; ++j) {
	l = j;
	if (j)
	for (i = 0; i < j; ++i) {
	R[l] = fjac(i,j);
	l = l + n - i -1;
	}
	R[l] = wa1[j];
	if (wa1[j] == 0.)
	sing = true;
	}

	/* accumulate the orthogonal factor in fjac. */

	ei_qform<Scalar>(n, n, fjac.data(), fjac.rows(), wa1.data());

	/* rescale if necessary. */

	/* Computing MAX */
	if (mode != 2)
	diag = diag.cwise().max(wa2);

	/* beginning of the inner loop. */

	while (true) {

	/* determine the direction p. */

	ei_dogleg<Scalar>(R, diag, qtf, delta, wa1);

	/* store the direction p and x + p. calculate the norm of p. */

	wa1 = -wa1;
	wa2 = x + wa1;
	wa3 = diag.cwise() * wa1;
	pnorm = wa3.stableNorm();

	/* on the first iteration, adjust the initial step bound. */

	if (iter == 1)
	delta = std::min(delta,pnorm);

	/* evaluate the function at x + p and calculate its norm. */

	if ( functor(wa2, wa4) < 0)
	return UserAksed;
	++nfev;
	fnorm1 = wa4.stableNorm();

	/* compute the scaled actual reduction. */

	actred = -1.;
	if (fnorm1 < fnorm) /* Computing 2nd power */
	actred = 1. - ei_abs2(fnorm1 / fnorm);

	/* compute the scaled predicted reduction. */

	l = 0;
	for (i = 0; i < n; ++i) {
	sum = 0.;
	for (j = i; j < n; ++j) {
	sum += R[l] * wa1[j];
	++l;
	}
	wa3[i] = qtf[i] + sum;
	}
	temp = wa3.stableNorm();
	prered = 0.;
	if (temp < fnorm) /* Computing 2nd power */
	prered = 1. - ei_abs2(temp / fnorm);

	/* compute the ratio of the actual to the predicted */
	/* reduction. */

	ratio = 0.;
	if (prered > 0.)
	ratio = actred / prered;

	/* update the step bound. */

	if (ratio < Scalar(.1)) {
	ncsuc = 0;
	++ncfail;
	delta = Scalar(.5) * delta;
	} else {
	ncfail = 0;
	++ncsuc;
	if (ratio >= Scalar(.5) \|\| ncsuc > 1) /* Computing MAX */
	delta = std::max(delta, pnorm / Scalar(.5));
	if (ei_abs(ratio - 1.) <= Scalar(.1)) {
	delta = pnorm / Scalar(.5);
	}
	}

	/* test for successful iteration. */

	if (ratio >= Scalar(1e-4)) {
	/* successful iteration. update x, fvec, and their norms. */
	x = wa2;
	wa2 = diag.cwise() * x;
	fvec = wa4;
	xnorm = wa2.stableNorm();
	fnorm = fnorm1;
	++iter;
	}

	/* determine the progress of the iteration. */

	++nslow1;
	if (actred >= Scalar(.001))
	nslow1 = 0;
	if (jeval)
	++nslow2;
	if (actred >= Scalar(.1))
	nslow2 = 0;

	/* test for convergence. */

	if (delta <= parameters.xtol * xnorm \|\| fnorm == 0.)
	return RelativeErrorTooSmall;

	/* tests for termination and stringent tolerances. */

	if (nfev >= parameters.maxfev)
	return TooManyFunctionEvaluation;
	if (Scalar(.1) * std::max(Scalar(.1) * delta, pnorm) <= epsilon<Scalar>() * xnorm)
	return TolTooSmall;
	if (nslow2 == 5)
	return NotMakingProgressJacobian;
	if (nslow1 == 10)
	return NotMakingProgressIterations;

	/* criterion for recalculating jacobian approximation */
	/* by forward differences. */

	if (ncfail == 2)
	break; // leave inner loop and go for the next outer loop iteration

	/* calculate the rank one modification to the jacobian */
	/* and update qtf if necessary. */

	for (j = 0; j < n; ++j) {
	sum = wa4.dot(fjac.col(j));
	wa2[j] = (sum - wa3[j]) / pnorm;
	wa1[j] = diag[j] * (diag[j] * wa1[j] / pnorm);
	if (ratio >= Scalar(1e-4))
	qtf[j] = sum;
	}

	/* compute the qr factorization of the updated jacobian. */

	ei_r1updt<Scalar>(n, n, R.data(), R.size(), wa1.data(), wa2.data(), wa3.data(), &sing);
	ei_r1mpyq<Scalar>(n, n, fjac.data(), fjac.rows(), wa2.data(), wa3.data());
	ei_r1mpyq<Scalar>(1, n, qtf.data(), 1, wa2.data(), wa3.data());

	/* end of the inner loop. */

	jeval = false;
	}
	/* end of the outer loop. */

	return Running;
	}

	template<typename FunctorType, typename Scalar>
	typename HybridNonLinearSolver<FunctorType,Scalar>::Status
	HybridNonLinearSolver<FunctorType,Scalar>::solveNumericalDiff(
	Matrix< Scalar, Dynamic, 1 > &x,
	const int mode
	)
	{
	Status status = solveNumericalDiffInit(x, mode);
	while (status==Running)
	status = solveNumericalDiffOneStep(x, mode);
	return status;
	}