d4/d94/cp__lbfgs_8F_source.html

!--------------------------------------------------------------------------------------------------!

!   CP2K: A general program to perform molecular dynamics simulations                              !

!   Copyright 2000-2025 CP2K developers group <https://cp2k.org>                                   !

!                                                                                                  !

!   SPDX-License-Identifier: GPL-2.0-or-later                                                      !

!--------------------------------------------------------------------------------------------------!


! **************************************************************************************************

!> \brief LBFGS-B routine (version 3.0, April 25, 2011)

!> \note

!>      L-BFGS-B (version 3.0, April 25, 2011) converted to Fortran 90 module

!> \par History

!>      02.2005 Update to the new version 2.4 and deleting the blas part of

!>              the code (Teodoro Laino)

!>      11.2012 New version 3.0 converted to Fortran 90 (Matthias Krack)

!>      12.2020 Implementation of Space Group Symmetry (Pierre-André Cazade)

!> \author Fawzi Mohamed (first version)

! **************************************************************************************************

MODULE cp_lbfgs

   USE bibliography,                    ONLY: byrd1995,&

                                              cite_reference

   USE cp_files,                        ONLY: open_file

   USE kinds,                           ONLY: dp

   USE machine,                         ONLY: m_walltime

   USE space_groups,                    ONLY: spgr_apply_rotations_coord,&

                                              spgr_apply_rotations_force

   USE space_groups_types,              ONLY: spgr_type

#include "../base/base_uses.f90"


   IMPLICIT NONE


   PRIVATE


   CHARACTER(len=*), PARAMETER, PRIVATE :: moduleN = 'cp_lbfgs'


   PUBLIC :: setulb


CONTAINS


!===========   L-BFGS-B (version 3.0.  April 25, 2011  =================

!

!     This is a modified version of L-BFGS-B.

!

!     Major changes are described in the accompanying paper:

!

!         Jorge Nocedal and Jose Luis Morales, Remark on "Algorithm 778:

!         L-BFGS-B: Fortran Subroutines for Large-Scale Bound Constraine

!         Optimization"  (2011). To appear in  ACM Transactions on

!         Mathematical Software,

!

!     The paper describes an improvement and a correction to Algorithm 7

!     It is shown that the performance of the algorithm can be improved

!     significantly by making a relatively simple modication to the subs

!     minimization phase. The correction concerns an error caused by the

!     of routine dpmeps to estimate machine precision.

!

!     The total work space **wa** required by the new version is

!

!                  2*m*n + 11m*m + 5*n + 8*m

!

!     the old version required

!

!                  2*m*n + 12m*m + 4*n + 12*m

!

!

!            J. Nocedal  Department of Electrical Engineering and

!                        Computer Science.

!                        Northwestern University. Evanston, IL. USA

!

!

!           J.L Morales  Departamento de Matematicas,

!                        Instituto Tecnologico Autonomo de Mexico

!                        Mexico D.F. Mexico.

!

!                        March  2011

!

!=======================================================================

! **************************************************************************************************

!> \brief          This subroutine partitions the working arrays wa and iwa, and

!>                 then uses the limited memory BFGS method to solve the bound

!>                 constrained optimization problem by calling mainlb.

!>                 (The direct method will be used in the subspace minimization.)

!> \param n        n is the dimension of the problem.

!> \param m        m is the maximum number of variable metric corrections

!>                 used to define the limited memory matrix.

!> \param x        On entry x is an approximation to the solution.

!>                 On exit x is the current approximation.

!> \param lower_bound  the lower bound on x.

!> \param upper_bound  the upper bound on x.

!> \param nbd      nbd represents the type of bounds imposed on the

!>                 variables, and must be specified as follows:

!>                 nbd(i)=0 if x(i) is unbounded,

!>                        1 if x(i) has only a lower bound,

!>                        2 if x(i) has both lower and upper bounds, and

!>                        3 if x(i) has only an upper bound.

!> \param f        On first entry f is unspecified.

!>                 On final exit f is the value of the function at x.

!> \param g        On first entry g is unspecified.

!>                 On final exit g is the value of the gradient at x.

!> \param factr    factr >= 0 is specified by the user.  The iteration

!>                 will stop when

!>

!>                 (f^k - f^{k+1})/max{|f^k|,|f^{k+1}|,1} <= factr*epsmch

!>

!>                 where epsmch is the machine precision, which is automatically

!>                 generated by the code. Typical values for factr: 1.d+12 for

!>                 low accuracy; 1.d+7 for moderate accuracy; 1.d+1 for extremely

!>                 high accuracy.

!> \param pgtol    pgtol >= 0 is specified by the user.  The iteration

!>                 will stop when

!>

!>                 max{|proj g_i | i = 1, ..., n} <= pgtol

!>

!>                 where pg_i is the ith component of the projected gradient.

!> \param wa       working array

!> \param iwa      integer working array

!> \param task     is a working string of characters of length 60 indicating

!>                 the current job when entering and quitting this subroutine.

!> \param iprint   iprint is a variable that must be set by the user.

!>                 It controls the frequency and type of output generated:

!>                 iprint<0    no output is generated;

!>                 iprint=0    print only one line at the last iteration;

!>                 0<iprint<99 print also f and |proj g| every iprint iterations;

!>                 iprint=99   print details of every iteration except n-vectors;

!>                 iprint=100  print also the changes of active set and final x;

!>                 iprint>100  print details of every iteration including x and g;

!>                 When iprint > 0, the file iterate.dat will be created to

!>                 summarize the iteration.

!> \param csave    is a working string of characters

!> \param lsave    lsave is a working array

!>                 On exit with 'task' = NEW_X, the following information is available:

!>                 If lsave(1) = .true.  then  the initial X has been replaced by

!>                               its projection in the feasible set

!>                 If lsave(2) = .true.  then  the problem is constrained;

!>                 If lsave(3) = .true.  then  each variable has upper and lower bounds;

!> \param isave    isave is a working array

!>                 On exit with 'task' = NEW_X, the following information is available:

!>                 isave(22) = the total number of intervals explored in the

!>                         search of Cauchy points;

!>                 isave(26) = the total number of skipped BFGS updates before the current iteration;

!>                 isave(30) = the number of current iteration;

!>                 isave(31) = the total number of BFGS updates prior the current iteration;

!>                 isave(33) = the number of intervals explored in the search of

!>                             Cauchy point in the current iteration;

!>                 isave(34) = the total number of function and gradient evaluations;

!>                 isave(36) = the number of function value or gradient

!>                             evaluations in the current iteration;

!>                 if isave(37) = 0  then the subspace argmin is within the box;

!>                 if isave(37) = 1  then the subspace argmin is beyond the box;

!>                 isave(38) = the number of free variables in the current iteration;

!>                 isave(39) = the number of active constraints in the current iteration;

!>                 n + 1 - isave(40) = the number of variables leaving the set of

!>                                     active constraints in the current iteration;

!>                 isave(41) = the number of variables entering the set of active

!>                             constraints in the current iteration.

!> \param dsave    dsave is a working array of dimension 29.

!>                 On exit with 'task' = NEW_X, the following information is available:

!>                 dsave(1) = current 'theta' in the BFGS matrix;

!>                 dsave(2) = f(x) in the previous iteration;

!>                 dsave(3) = factr*epsmch;

!>                 dsave(4) = 2-norm of the line search direction vector;

!>                 dsave(5) = the machine precision epsmch generated by the code;

!>                 dsave(7) = the accumulated time spent on searching for Cauchy points;

!>                 dsave(8) = the accumulated time spent on subspace minimization;

!>                 dsave(9) = the accumulated time spent on line search;

!>                 dsave(11) = the slope of the line search function at the current point of line search;

!>                 dsave(12) = the maximum relative step length imposed in line search;

!>                 dsave(13) = the infinity norm of the projected gradient;

!>                 dsave(14) = the relative step length in the line search;

!>                 dsave(15) = the slope of the line search function at the starting point of the line search;

!>                 dsave(16) = the square of the 2-norm of the line search direction vector.

!> \param trust_radius ...

!> \param spgr ...

!> \par History

!>      12.2020 Implementation of Space Group Symmetry [pcazade]

!> \author         NEOS, November 1994. (Latest revision June 1996.)

!>                 Optimization Technology Center.

!>                 Argonne National Laboratory and Northwestern University.

!>                 Written by

!>                             Ciyou Zhu

!>                 in collaboration with R.H. Byrd, P. Lu-Chen and J. Nocedal.

! **************************************************************************************************


   SUBROUTINE setulb(n, m, x, lower_bound, upper_bound, nbd, f, g, factr, pgtol, wa, iwa, &

                     task, iprint, csave, lsave, isave, dsave, trust_radius, spgr)


      INTEGER, INTENT(in)                                :: n, m

      REAL(kind=dp), INTENT(inout)                       :: x(n)

      REAL(kind=dp)                                      :: lower_bound(n), upper_bound(n)

      INTEGER                                            :: nbd(n)

      REAL(kind=dp)                                      :: f, g(n)

      REAL(kind=dp), INTENT(in)                          :: factr, pgtol

      REAL(kind=dp)                                      :: wa(2*m*n + 5*n + 11*m*m + 8*m)

      INTEGER                                            :: iwa(3*n)

      CHARACTER(LEN=60)                                  :: task

      INTEGER                                            :: iprint

      CHARACTER(LEN=60)                                  :: csave

      LOGICAL                                            :: lsave(4)

      INTEGER                                            :: isave(44)

      REAL(kind=dp)                                      :: dsave(29)

      REAL(kind=dp), INTENT(in)                          :: trust_radius

      TYPE(spgr_type), OPTIONAL, POINTER                 :: spgr


      INTEGER                                            :: i, ld, lr, lsnd, lss, lsy, lt, lwa, lwn, &

                                                            lws, lwt, lwy, lxp, lz


!     References:

!

!       [1] R. H. Byrd, P. Lu, J. Nocedal and C. Zhu, ``A limited

!       memory algorithm for bound constrained optimization'',

!       SIAM J. Scientific Computing 16 (1995), no. 5, pp. 1190--1208.

!

!       [2] C. Zhu, R.H. Byrd, P. Lu, J. Nocedal, ``L-BFGS-B: a

!       limited memory FORTRAN code for solving bound constrained

!       optimization problems'', Tech. Report, NAM-11, EECS Department,

!       Northwestern University, 1994.

!

!       (Postscript files of these papers are available via anonymous

!        ftp to eecs.nwu.edu in the directory pub/lbfgs/lbfgs_bcm.)

!

!                           *  *  *


      IF (task == 'START') THEN

         CALL cite_reference(byrd1995)

         isave(1) = m*n

         isave(2) = m**2

         isave(3) = 4*m**2

         ! ws      m*n

         isave(4) = 1

         ! wy      m*n

         isave(5) = isave(4) + isave(1)

         ! wsy     m**2

         isave(6) = isave(5) + isave(1)

         ! wss     m**2

         isave(7) = isave(6) + isave(2)

         ! wt      m**2

         isave(8) = isave(7) + isave(2)

         ! wn      4*m**2

         isave(9) = isave(8) + isave(2)

         ! wsnd    4*m**2

         isave(10) = isave(9) + isave(3)

         ! wz      n

         isave(11) = isave(10) + isave(3)

         ! wr      n

         isave(12) = isave(11) + n

         ! wd      n

         isave(13) = isave(12) + n

         ! wt      n

         isave(14) = isave(13) + n

         ! wxp     n

         isave(15) = isave(14) + n

         ! wa      8*m

         isave(16) = isave(15) + n

      END IF

      lws = isave(4)

      lwy = isave(5)

      lsy = isave(6)

      lss = isave(7)

      lwt = isave(8)

      lwn = isave(9)

      lsnd = isave(10)

      lz = isave(11)

      lr = isave(12)

      ld = isave(13)

      lt = isave(14)

      lxp = isave(15)

      lwa = isave(16)


      !in case we use a trust radius we set the boundaries to be one times the trust radius away from the current positions

      !the original implementation only allowed for boundaries that remain constant during the optimization.

      !This way of including a trust radius seems to work,

      !but the change of the boundaries during optimization might introduce some not yet discovered problems.

      IF (trust_radius >= 0) THEN

         DO i = 1, n

            lower_bound(i) = x(i) - trust_radius

            upper_bound(i) = x(i) + trust_radius

            nbd(i) = 2

         END DO

      END IF


      ! passes spgr to mainlb

      CALL mainlb(n, m, x, lower_bound, upper_bound, nbd, f, g, factr, pgtol, &

                  wa(lws), wa(lwy), wa(lsy), wa(lss), wa(lwt), &

                  wa(lwn), wa(lsnd), wa(lz), wa(lr), wa(ld), wa(lt), wa(lxp), &

                  wa(lwa), &

                  iwa(1), iwa(n + 1), iwa(2*n + 1), task, iprint, &

                  csave, lsave, isave(22), dsave, spgr=spgr)


      RETURN


   END SUBROUTINE setulb


! **************************************************************************************************

!> \brief        This subroutine solves bound constrained optimization problems by

!>               using the compact formula of the limited memory BFGS updates.

!> \param n      n is the number of variables

!> \param m      m is the maximum number of variable metric

!>               corrections allowed in the limited memory matrix.

!> \param x      On entry x is an approximation to the solution.

!>               On exit x is the current approximation.

!> \param lower_bound  lower_bound is the lower bound of x.

!> \param upper_bound  upper_bound is the upper bound of x.

!> \param nbd    nbd represents the type of bounds imposed on the

!>               variables, and must be specified as follows:

!>               nbd(i)=0 if x(i) is unbounded,

!>               1 if x(i) has only a lower bound,

!>               2 if x(i) has both lower and upper bounds,

!>               3 if x(i) has only an upper bound.

!> \param f      On first entry f is unspecified.

!>               On final exit f is the value of the function at x.

!> \param g      On first entry g is unspecified.

!>               On final exit g is the value of the gradient at x.

!> \param factr  factr >= 0 is specified by the user.  The iteration

!>               will stop when

!>

!>               (f^k - f^{k+1})/max{|f^k|,|f^{k+1}|,1} <= factr*epsmch

!>

!>               where epsmch is the machine precision, which is automatically

!>               generated by the code.

!> \param pgtol  pgtol >= 0 is specified by the user.  The iteration

!>               will stop when

!>

!>                 max{|proj g_i | i = 1, ..., n} <= pgtol

!>

!>               where pg_i is the ith component of the projected gradient.

!> \param ws     ws, wy, sy, and wt are working arrays used to store the following

!>               information defining the limited memory BFGS matrix:

!>               ws stores S, the matrix of s-vectors;

!> \param wy     stores Y, the matrix of y-vectors;

!> \param sy     stores S'Y;

!> \param ss     stores S'S;

!> \param wt     stores the Cholesky factorization of (theta*S'S+LD^(-1)L');

!>               see eq. (2.26) in [3].

!> \param wn     wn is a working array of dimension 2m x 2m

!>               used to store the LEL^T factorization of the indefinite matrix

!>               K = [-D -Y'ZZ'Y/theta     L_a'-R_z'  ]

!>                   [L_a -R_z           theta*S'AA'S ]

!>

!>               where     E = [-I  0]

!>                             [ 0  I]

!> \param snd    is a working array of dimension 2m x 2m

!>               used to store the lower triangular part of

!>               N = [Y' ZZ'Y   L_a'+R_z']

!>                   [L_a +R_z  S'AA'S   ]

!> \param z      z(n),r(n),d(n),t(n), xp(n),wa(8*m) are working arrays

!>               z  is used at different times to store the Cauchy point and

!>               the Newton point.

!> \param r      working array

!> \param d      working array

!> \param t      workign array

!> \param xp     xp is a workng array used to safeguard the projected Newton direction

!> \param wa     working array

!> \param index  In subroutine freev, index is used to store the free and fixed

!>               variables at the Generalized Cauchy Point (GCP).

!> \param iwhere iwhere is an integer working array of dimension n used to record

!>               the status of the vector x for GCP computation.

!>               iwhere(i)=0 or -3 if x(i) is free and has bounds,

!>                         1       if x(i) is fixed at l(i), and l(i) .ne. u(i)

!>                         2       if x(i) is fixed at u(i), and u(i) .ne. l(i)

!>                         3       if x(i) is always fixed, i.e.,  u(i)=x(i)=l(i)

!>                        -1       if x(i) is always free, i.e., no bounds on it.

!> \param indx2  indx2 is a working array. Within subroutine cauchy, indx2 corresponds to the array iorder.

!>               In subroutine freev, a list of variables entering and leaving

!>               the free set is stored in indx2, and it is passed on to

!>               subroutine formk with this information

!> \param task   task is a working string of characters indicating

!>               the current job when entering and leaving this subroutine.

!> \param iprint is an variable that must be set by the user.

!>               It controls the frequency and type of output generated:

!>               iprint<0    no output is generated;

!>               iprint=0    print only one line at the last iteration;

!>               0<iprint<99 print also f and |proj g| every iprint iterations;

!>               iprint=99   print details of every iteration except n-vectors;

!>               iprint=100  print also the changes of active set and final x;

!>               iprint>100  print details of every iteration including x and g;

!>               When iprint > 0, the file iterate.dat will be created to summarize the iteration.

!> \param csave  csave is a working string of characters

!> \param lsave  lsave is a logical working array

!> \param isave  isave is an integer working array

!> \param dsave  is a double precision working array

!> \param spgr ...

!> \par History

!>      12.2020 Implementation of Space Group Symmetry [pcazade]

!> \author       NEOS, November 1994. (Latest revision June 1996.)

!>               Optimization Technology Center.

!>               Argonne National Laboratory and Northwestern University.

!>               Written by

!>                           Ciyou Zhu

!>               in collaboration with R.H. Byrd, P. Lu-Chen and J. Nocedal.

! **************************************************************************************************

   SUBROUTINE mainlb(n, m, x, lower_bound, upper_bound, nbd, f, g, factr, pgtol, ws, wy, &

                     sy, ss, wt, wn, snd, z, r, d, t, xp, wa, &

                     index, iwhere, indx2, task, &

                     iprint, csave, lsave, isave, dsave, spgr)

      INTEGER, INTENT(in)                                :: n, m

      REAL(kind=dp), INTENT(inout)                       :: x(n)

      REAL(kind=dp), INTENT(in)                          :: lower_bound(n), upper_bound(n)

      INTEGER                                            :: nbd(n)

      REAL(kind=dp) :: f, g(n), factr, pgtol, ws(n, m), wy(n, m), sy(m, m), ss(m, m), wt(m, m), &

         wn(2*m, 2*m), snd(2*m, 2*m), z(n), r(n), d(n), t(n), xp(n), wa(8*m)

      INTEGER                                            :: index(n), iwhere(n), indx2(n)

      CHARACTER(LEN=60)                                  :: task

      INTEGER                                            :: iprint

      CHARACTER(LEN=60)                                  :: csave

      LOGICAL                                            :: lsave(4)

      INTEGER                                            :: isave(23)

      REAL(kind=dp)                                      :: dsave(29)

      TYPE(spgr_type), OPTIONAL, POINTER                 :: spgr


      REAL(kind=dp), PARAMETER                           :: one = 1.0_dp, zero = 0.0_dp


      CHARACTER(LEN=3)                                   :: word

      INTEGER                                            :: col, head, i, iback, ifun, ileave, info, &

                                                            itail, iter, itfile, iupdat, iword, k, &

                                                            nact, nenter, nfgv, nfree, nintol, &

                                                            nseg, nskip

      LOGICAL                                            :: boxed, constrained, first, &

                                                            keep_space_group, updatd, wrk, &

                                                            x_projected

      REAL(kind=dp) :: cachyt, cpu1, cpu2, ddot, ddum, dnorm, dr, dtd, epsmch, fold, g_inf_norm, &

         gd, gdold, lnscht, rr, sbtime, step_max, stp, theta, time, time1, time2, tol, xstep


!     References:

!

!       [1] R. H. Byrd, P. Lu, J. Nocedal and C. Zhu, ``A limited

!       memory algorithm for bound constrained optimization'',

!       SIAM J. Scientific Computing 16 (1995), no. 5, pp. 1190--1208.

!

!       [2] C. Zhu, R.H. Byrd, P. Lu, J. Nocedal, ``L-BFGS-B: FORTRAN

!       Subroutines for Large Scale Bound Constrained Optimization''

!       Tech. Report, NAM-11, EECS Department, Northwestern University,

!       1994.

!

!       [3] R. Byrd, J. Nocedal and R. Schnabel "Representations of

!       Quasi-Newton Matrices and their use in Limited Memory Methods'',

!       Mathematical Programming 63 (1994), no. 4, pp. 129-156.

!

!       (Postscript files of these papers are available via anonymous

!        ftp to eecs.nwu.edu in the directory pub/lbfgs/lbfgs_bcm.)

!

!                           *  *  *


      keep_space_group = .false.

      IF (PRESENT(spgr)) THEN

         IF (ASSOCIATED(spgr)) keep_space_group = spgr%keep_space_group

      END IF


      IF (task == 'START') THEN


         epsmch = epsilon(one)


         CALL timer(time1)


!        Initialize counters and scalars when task='START'.


!           for the limited memory BFGS matrices:

         col = 0

         head = 1

         theta = one

         iupdat = 0

         updatd = .false.

         iback = 0

         itail = 0

         iword = 0

         nact = 0

         ileave = 0

         nenter = 0

         fold = zero

         dnorm = zero

         cpu1 = zero

         gd = zero

         step_max = zero

         g_inf_norm = zero

         stp = zero

         gdold = zero

         dtd = zero


!           for operation counts:

         iter = 0

         nfgv = 0

         nseg = 0

         nintol = 0

         nskip = 0

         nfree = n

         ifun = 0

!           for stopping tolerance:

         tol = factr*epsmch


!           for measuring running time:

         cachyt = 0

         sbtime = 0

         lnscht = 0


!           'word' records the status of subspace solutions.

         word = '---'


!           'info' records the termination information.

         info = 0


         itfile = 8

         IF (iprint >= 1) THEN

!                                open a summary file 'iterate.dat'

            CALL open_file(file_name='iterate.dat', unit_number=itfile, file_action='WRITE', file_status='UNKNOWN')

         END IF


!        Check the input arguments for errors.


         CALL errclb(n, m, factr, lower_bound, upper_bound, nbd, task, info, k)

         IF (task(1:5) == 'ERROR') THEN

            CALL prn3lb(n, x, f, task, iprint, info, itfile, &

                        iter, nfgv, nintol, nskip, nact, g_inf_norm, &

                        zero, nseg, word, iback, stp, xstep, k, &

                        cachyt, sbtime, lnscht)

            RETURN

         END IF


         CALL prn1lb(n, m, lower_bound, upper_bound, x, iprint, itfile, epsmch)


!        Initialize iwhere & project x onto the feasible set.


         CALL active(n, lower_bound, upper_bound, nbd, x, iwhere, iprint, x_projected, constrained, boxed)

         ! applies rotation matrices to coordinates

         IF (keep_space_group) THEN

            CALL spgr_apply_rotations_coord(spgr, x)

         END IF


!        The end of the initialization.

         task = 'FG_START'

!        return to the driver to calculate f and g; reenter at 111.

     CALL save_local(lsave, isave, dsave, x_projected, constrained, boxed, updatd, nintol, itfile, iback, nskip, head, col, itail, &

                        iter, iupdat, nseg, nfgv, info, ifun, iword, nfree, nact, ileave, nenter, theta, fold, tol, dnorm, epsmch, &

                         cpu1, cachyt, sbtime, lnscht, time1, gd, step_max, g_inf_norm, stp, gdold, dtd)

         RETURN

      ELSE

         ! applies rotation matrices to coordinates

         IF (keep_space_group) THEN

            CALL spgr_apply_rotations_coord(spgr, x)

            CALL spgr_apply_rotations_force(spgr, g)

         END IF


!          restore local variables.


         x_projected = lsave(1)

         constrained = lsave(2)

         boxed = lsave(3)

         updatd = lsave(4)


         nintol = isave(1)

         itfile = isave(3)

         iback = isave(4)

         nskip = isave(5)

         head = isave(6)

         col = isave(7)

         itail = isave(8)

         iter = isave(9)

         iupdat = isave(10)

         nseg = isave(12)

         nfgv = isave(13)

         info = isave(14)

         ifun = isave(15)

         iword = isave(16)

         nfree = isave(17)

         nact = isave(18)

         ileave = isave(19)

         nenter = isave(20)


         theta = dsave(1)

         fold = dsave(2)

         tol = dsave(3)

         dnorm = dsave(4)

         epsmch = dsave(5)

         cpu1 = dsave(6)

         cachyt = dsave(7)

         sbtime = dsave(8)

         lnscht = dsave(9)

         time1 = dsave(10)

         gd = dsave(11)

         step_max = dsave(12)

         g_inf_norm = dsave(13)

         stp = dsave(14)

         gdold = dsave(15)

         dtd = dsave(16)


!        After returning from the driver go to the point where execution

!        is to resume.


         IF (task(1:4) == 'STOP') THEN

            IF (task(7:9) == 'CPU') THEN

!                                          restore the previous iterate.

               CALL dcopy(n, t, 1, x, 1)

               CALL dcopy(n, r, 1, g, 1)

               f = fold

            END IF

            CALL timer(time2)

            time = time2 - time1

            CALL prn3lb(n, x, f, task, iprint, info, itfile, &

                        iter, nfgv, nintol, nskip, nact, g_inf_norm, &

                        time, nseg, word, iback, stp, xstep, k, &

                        cachyt, sbtime, lnscht)

     CALL save_local(lsave, isave, dsave, x_projected, constrained, boxed, updatd, nintol, itfile, iback, nskip, head, col, itail, &

                        iter, iupdat, nseg, nfgv, info, ifun, iword, nfree, nact, ileave, nenter, theta, fold, tol, dnorm, epsmch, &

                            cpu1, cachyt, sbtime, lnscht, time1, gd, step_max, g_inf_norm, stp, gdold, dtd)

            RETURN

         END IF

      END IF


      IF (.NOT. (task(1:5) == 'FG_LN' .OR. task(1:5) == 'NEW_X')) THEN


!     Compute f0 and g0.

         nfgv = 1


!     Compute the infinity norm of the (-) projected gradient.


         CALL projgr(n, lower_bound, upper_bound, nbd, x, g, g_inf_norm)


         IF (iprint >= 1) THEN

            WRITE (*, 1002) iter, f, g_inf_norm

            WRITE (itfile, 1003) iter, nfgv, g_inf_norm, f

         END IF

         IF (g_inf_norm <= pgtol) THEN

!                                terminate the algorithm.

            task = 'CONVERGENCE: NORM_OF_PROJECTED_GRADIENT_<=_PGTOL'

            CALL timer(time2)

            time = time2 - time1

            CALL prn3lb(n, x, f, task, iprint, info, itfile, &

                        iter, nfgv, nintol, nskip, nact, g_inf_norm, &

                        time, nseg, word, iback, stp, xstep, k, &

                        cachyt, sbtime, lnscht)

     CALL save_local(lsave, isave, dsave, x_projected, constrained, boxed, updatd, nintol, itfile, iback, nskip, head, col, itail, &

                        iter, iupdat, nseg, nfgv, info, ifun, iword, nfree, nact, ileave, nenter, theta, fold, tol, dnorm, epsmch, &

                            cpu1, cachyt, sbtime, lnscht, time1, gd, step_max, g_inf_norm, stp, gdold, dtd)

            RETURN

         END IF

      END IF


      first = .true.

      DO WHILE (.true.)

      IF (.NOT. first .OR. .NOT. (task(1:5) == 'FG_LN' .OR. task(1:5) == 'NEW_X')) THEN

         IF (iprint >= 99) WRITE (*, 1001) iter + 1

         iword = -1

!

         IF (.NOT. constrained .AND. col > 0) THEN

!                                            skip the search for GCP.

            CALL dcopy(n, x, 1, z, 1)

            wrk = updatd

            nseg = 0

         ELSE


!ccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccc

!

!     Compute the Generalized Cauchy Point (GCP).

!

!ccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccc


            CALL timer(cpu1)

            CALL cauchy(n, x, lower_bound, upper_bound, nbd, g, indx2, iwhere, t, d, z, &

                        m, wy, ws, sy, wt, theta, col, head, &

                        wa(1), wa(2*m + 1), wa(4*m + 1), wa(6*m + 1), nseg, &

                        iprint, g_inf_norm, info, epsmch)

            ! applies rotation matrices to coordinates

            IF (keep_space_group) THEN

               CALL spgr_apply_rotations_coord(spgr, z)

            END IF

            IF (info /= 0) THEN

!            singular triangular system detected; refresh the lbfgs memory.

               IF (iprint >= 1) WRITE (*, 1005)

               info = 0

               col = 0

               head = 1

               theta = one

               iupdat = 0

               updatd = .false.

               CALL timer(cpu2)

               cachyt = cachyt + cpu2 - cpu1

               first = .false.

               cycle

            END IF

            CALL timer(cpu2)

            cachyt = cachyt + cpu2 - cpu1

            nintol = nintol + nseg


!        Count the entering and leaving variables for iter > 0;

!        find the index set of free and active variables at the GCP.


            CALL freev(n, nfree, index, nenter, ileave, indx2, &

                       iwhere, wrk, updatd, constrained, iprint, iter)

            nact = n - nfree


         END IF


!     If there are no free variables or B=theta*I, then

!                                        skip the subspace minimization.


         IF (.NOT. (nfree == 0 .OR. col == 0)) THEN


!ccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccc

!

!     Subspace minimization.

!

!ccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccc


            CALL timer(cpu1)


!     Form  the LEL^T factorization of the indefinite

!       matrix    K = [-D -Y'ZZ'Y/theta     L_a'-R_z'  ]

!                     [L_a -R_z           theta*S'AA'S ]

!       where     E = [-I  0]

!                     [ 0  I]


            IF (wrk) CALL formk(n, nfree, index, nenter, ileave, indx2, iupdat, &

                                updatd, wn, snd, m, ws, wy, sy, theta, col, head, info)

            IF (info /= 0) THEN

!          nonpositive definiteness in Cholesky factorization;

!          refresh the lbfgs memory and restart the iteration.

               IF (iprint >= 1) WRITE (*, 1006)

               info = 0

               col = 0

               head = 1

               theta = one

               iupdat = 0

               updatd = .false.

               CALL timer(cpu2)

               sbtime = sbtime + cpu2 - cpu1

               first = .false.

               cycle

            END IF


!        compute r=-Z'B(xcp-xk)-Z'g (using wa(2m+1)=W'(xcp-x)

!                                                   from 'cauchy').

            CALL cmprlb(n, m, x, g, ws, wy, sy, wt, z, r, wa, index, &

                        theta, col, head, nfree, constrained, info)

            ! applies rotation matrices to coordinates

            IF (keep_space_group) THEN

               CALL spgr_apply_rotations_force(spgr, r)

            END IF

            IF (info == 0) THEN


!     call the direct method.


               CALL subsm(n, m, nfree, index, lower_bound, upper_bound, nbd, z, r, xp, ws, wy, &

                          theta, x, g, col, head, iword, wa, wn, iprint, info)

               ! applies rotation matrices to coordinates

               IF (keep_space_group) THEN

                  CALL spgr_apply_rotations_coord(spgr, z)

                  CALL spgr_apply_rotations_force(spgr, r)

               END IF

            END IF

            IF (info /= 0) THEN

!          singular triangular system detected;

!          refresh the lbfgs memory and restart the iteration.

               IF (iprint >= 1) WRITE (*, 1005)

               info = 0

               col = 0

               head = 1

               theta = one

               iupdat = 0

               updatd = .false.

               CALL timer(cpu2)

               sbtime = sbtime + cpu2 - cpu1

               first = .false.

               cycle

            END IF


            CALL timer(cpu2)

            sbtime = sbtime + cpu2 - cpu1

         END IF


!ccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccc

!

!     Line search and optimality tests.

!

!ccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccc


!     Generate the search direction d:=z-x.

         ! applies rotation matrices to coordinates

         IF (keep_space_group) THEN

            CALL spgr_apply_rotations_coord(spgr, x)

            CALL spgr_apply_rotations_coord(spgr, z)

         END IF

         DO i = 1, n

            d(i) = z(i) - x(i)

         END DO

         CALL timer(cpu1)

      END IF

      IF (.NOT. first .OR. .NOT. (task(1:5) == 'NEW_X')) THEN

         ! applies rotation matrices to coordinates

         IF (keep_space_group) THEN

            CALL spgr_apply_rotations_coord(spgr, x)

            CALL spgr_apply_rotations_coord(spgr, z)

            CALL spgr_apply_rotations_force(spgr, d)

            CALL spgr_apply_rotations_force(spgr, g)

            CALL spgr_apply_rotations_force(spgr, r)

         END IF

         CALL lnsrlb(n, lower_bound, upper_bound, nbd, x, f, fold, gd, gdold, g, d, r, t, z, stp, dnorm, &

                     dtd, xstep, step_max, iter, ifun, iback, nfgv, info, task, &

                     boxed, constrained, csave, isave(22), dsave(17))

         ! applies rotation matrices to coordinates

         IF (keep_space_group) THEN

            CALL spgr_apply_rotations_coord(spgr, x)

            CALL spgr_apply_rotations_force(spgr, g)

         END IF

         IF (info /= 0 .OR. iback >= 20) THEN

!          restore the previous iterate.

            CALL dcopy(n, t, 1, x, 1)

            CALL dcopy(n, r, 1, g, 1)

            f = fold

            IF (col == 0) THEN

!             abnormal termination.

               IF (info == 0) THEN

                  info = -9

!                restore the actual number of f and g evaluations etc.

                  nfgv = nfgv - 1

                  ifun = ifun - 1

                  iback = iback - 1

               END IF

               task = 'ABNORMAL_TERMINATION_IN_LNSRCH'

               iter = iter + 1

               CALL timer(time2)

               time = time2 - time1

               CALL prn3lb(n, x, f, task, iprint, info, itfile, &

                           iter, nfgv, nintol, nskip, nact, g_inf_norm, &

                           time, nseg, word, iback, stp, xstep, k, &

                           cachyt, sbtime, lnscht)

     CALL save_local(lsave, isave, dsave, x_projected, constrained, boxed, updatd, nintol, itfile, iback, nskip, head, col, itail, &

                        iter, iupdat, nseg, nfgv, info, ifun, iword, nfree, nact, ileave, nenter, theta, fold, tol, dnorm, epsmch, &

                               cpu1, cachyt, sbtime, lnscht, time1, gd, step_max, g_inf_norm, stp, gdold, dtd)

               RETURN

            ELSE

!             refresh the lbfgs memory and restart the iteration.

               IF (iprint >= 1) WRITE (*, 1008)

               IF (info == 0) nfgv = nfgv - 1

               info = 0

               col = 0

               head = 1

               theta = one

               iupdat = 0

               updatd = .false.

               task = 'RESTART_FROM_LNSRCH'

               CALL timer(cpu2)

               lnscht = lnscht + cpu2 - cpu1

               first = .false.

               cycle

            END IF

         ELSE IF (task(1:5) == 'FG_LN') THEN

!          return to the driver for calculating f and g; reenter at 666.

     CALL save_local(lsave, isave, dsave, x_projected, constrained, boxed, updatd, nintol, itfile, iback, nskip, head, col, itail, &

                        iter, iupdat, nseg, nfgv, info, ifun, iword, nfree, nact, ileave, nenter, theta, fold, tol, dnorm, epsmch, &

                            cpu1, cachyt, sbtime, lnscht, time1, gd, step_max, g_inf_norm, stp, gdold, dtd)

            RETURN

         ELSE

!          calculate and print out the quantities related to the new X.

            CALL timer(cpu2)

            lnscht = lnscht + cpu2 - cpu1

            iter = iter + 1


!        Compute the infinity norm of the projected (-)gradient.


            CALL projgr(n, lower_bound, upper_bound, nbd, x, g, g_inf_norm)


!        Print iteration information.


            CALL prn2lb(n, x, f, g, iprint, itfile, iter, nfgv, nact, &

                        g_inf_norm, nseg, word, iword, iback, stp, xstep)

     CALL save_local(lsave, isave, dsave, x_projected, constrained, boxed, updatd, nintol, itfile, iback, nskip, head, col, itail, &

                        iter, iupdat, nseg, nfgv, info, ifun, iword, nfree, nact, ileave, nenter, theta, fold, tol, dnorm, epsmch, &

                            cpu1, cachyt, sbtime, lnscht, time1, gd, step_max, g_inf_norm, stp, gdold, dtd)

            RETURN

         END IF

      END IF


!     Test for termination.


      IF (g_inf_norm <= pgtol) THEN

!                                terminate the algorithm.

         task = 'CONVERGENCE: NORM_OF_PROJECTED_GRADIENT_<=_PGTOL'

         CALL timer(time2)

         time = time2 - time1

         CALL prn3lb(n, x, f, task, iprint, info, itfile, &

                     iter, nfgv, nintol, nskip, nact, g_inf_norm, &

                     time, nseg, word, iback, stp, xstep, k, &

                     cachyt, sbtime, lnscht)

     CALL save_local(lsave, isave, dsave, x_projected, constrained, boxed, updatd, nintol, itfile, iback, nskip, head, col, itail, &

                        iter, iupdat, nseg, nfgv, info, ifun, iword, nfree, nact, ileave, nenter, theta, fold, tol, dnorm, epsmch, &

                         cpu1, cachyt, sbtime, lnscht, time1, gd, step_max, g_inf_norm, stp, gdold, dtd)

         RETURN

      END IF


      ddum = max(abs(fold), abs(f), one)

      IF ((fold - f) <= tol*ddum) THEN

!                                        terminate the algorithm.

         task = 'CONVERGENCE: REL_REDUCTION_OF_F_<=_FACTR*EPSMCH'

         IF (iback >= 10) info = -5

!           i.e., to issue a warning if iback>10 in the line search.

         CALL timer(time2)

         time = time2 - time1

         CALL prn3lb(n, x, f, task, iprint, info, itfile, &

                     iter, nfgv, nintol, nskip, nact, g_inf_norm, &

                     time, nseg, word, iback, stp, xstep, k, &

                     cachyt, sbtime, lnscht)

     CALL save_local(lsave, isave, dsave, x_projected, constrained, boxed, updatd, nintol, itfile, iback, nskip, head, col, itail, &

                        iter, iupdat, nseg, nfgv, info, ifun, iword, nfree, nact, ileave, nenter, theta, fold, tol, dnorm, epsmch, &

                         cpu1, cachyt, sbtime, lnscht, time1, gd, step_max, g_inf_norm, stp, gdold, dtd)

         RETURN

      END IF


!     Compute d=newx-oldx, r=newg-oldg, rr=y'y and dr=y's.

      IF (keep_space_group) THEN

         CALL spgr_apply_rotations_force(spgr, g)

         CALL spgr_apply_rotations_force(spgr, r)

      END IF

      DO i = 1, n

         r(i) = g(i) - r(i)

      END DO

      rr = ddot(n, r, 1, r, 1)

      IF (stp == one) THEN

         dr = gd - gdold

         ddum = -gdold

      ELSE

         dr = (gd - gdold)*stp

         CALL dscal(n, stp, d, 1)

         ddum = -gdold*stp

      END IF


      IF (dr <= epsmch*ddum) THEN

!                            skip the L-BFGS update.

         nskip = nskip + 1

         updatd = .false.

         IF (iprint >= 1) WRITE (*, 1004) dr, ddum

         first = .false.

         cycle

      END IF


!ccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccc

!

!     Update the L-BFGS matrix.

!

!ccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccccc


      updatd = .true.

      iupdat = iupdat + 1


!     Update matrices WS and WY and form the middle matrix in B.


      CALL matupd(n, m, ws, wy, sy, ss, d, r, itail, &

                  iupdat, col, head, theta, rr, dr, stp, dtd)


!     Form the upper half of the pds T = theta*SS + L*D^(-1)*L';

!        Store T in the upper triangular of the array wt;

!        Cholesky factorize T to J*J' with

!           J' stored in the upper triangular of wt.


      CALL formt(m, wt, sy, ss, col, theta, info)


      IF (info /= 0) THEN

!          nonpositive definiteness in Cholesky factorization;

!          refresh the lbfgs memory and restart the iteration.

         IF (iprint >= 1) WRITE (*, 1007)

         info = 0

         col = 0

         head = 1

         theta = one

         iupdat = 0

         updatd = .false.

      END IF


!     Now the inverse of the middle matrix in B is


!       [  D^(1/2)      O ] [ -D^(1/2)  D^(-1/2)*L' ]

!       [ -L*D^(-1/2)   J ] [  0        J'          ]


      first = .false.

      END DO


1001  FORMAT(//, 'ITERATION ', i5)

1002  FORMAT &

         (/, 'At iterate', i5, 4x, 'f= ', 1p, d12.5, 4x, '|proj g|= ', 1p, d12.5)

1003  FORMAT(2(1x, i4), 5x, '-', 5x, '-', 3x, '-', 5x, '-', 5x, '-', 8x, '-', 3x, &

             1p, 2(1x, d10.3))

1004  FORMAT('  ys=', 1p, e10.3, '  -gs=', 1p, e10.3, ' BFGS update SKIPPED')

1005  FORMAT(/, &

              ' Singular triangular system detected;', /, &

              '   refresh the lbfgs memory and restart the iteration.')

1006  FORMAT(/, &

              ' Nonpositive definiteness in Cholesky factorization in formk;', /, &

              '   refresh the lbfgs memory and restart the iteration.')

1007  FORMAT(/, &

              ' Nonpositive definiteness in Cholesky factorization in formt;', /, &

              '   refresh the lbfgs memory and restart the iteration.')

1008  FORMAT(/, &

              ' Bad direction in the line search;', /, &

              '   refresh the lbfgs memory and restart the iteration.')


      RETURN


   END SUBROUTINE mainlb


! **************************************************************************************************

!> \brief This subroutine initializes iwhere and projects the initial x to the feasible set if necessary.

!> \param n ...

!> \param lower_bound  the lower bound on x.

!> \param upper_bound  the upper bound on x.

!> \param nbd ...

!> \param x ...

!> \param iwhere  iwhere(i)=-1  if x(i) has no bounds

!>                           3   if l(i)=u(i)

!>                           0   otherwise.

!>                In cauchy, iwhere is given finer gradations.

!> \param iprint ...

!> \param x_projected ...

!> \param constrained ...

!> \param boxed ...

!> \author        NEOS, November 1994. (Latest revision June 1996.)

!>                Optimization Technology Center.

!>                Argonne National Laboratory and Northwestern University.

!>                Written by

!>                            Ciyou Zhu

!>                in collaboration with R.H. Byrd, P. Lu-Chen and J. Nocedal.

! **************************************************************************************************

   SUBROUTINE active(n, lower_bound, upper_bound, nbd, x, iwhere, iprint, &

                     x_projected, constrained, boxed)


      INTEGER, INTENT(in)                                :: n

      REAL(kind=dp), INTENT(in)                          :: lower_bound(n), upper_bound(n)

      INTEGER                                            :: nbd(n)

      REAL(kind=dp)                                      :: x(n)

      INTEGER, INTENT(out)                               :: iwhere(n)

      INTEGER                                            :: iprint

      LOGICAL                                            :: x_projected, constrained, boxed


      REAL(kind=dp), PARAMETER                           :: zero = 0.0_dp


      INTEGER                                            :: i, nbdd


!     ************

!     Initialize nbdd, x_projected, constrained and boxed.


      nbdd = 0

      x_projected = .false.

      constrained = .false.

      boxed = .true.


!     Project the initial x to the easible set if necessary.


      DO i = 1, n

         IF (nbd(i) > 0) THEN

            IF (nbd(i) <= 2 .AND. x(i) <= lower_bound(i)) THEN

               IF (x(i) < lower_bound(i)) THEN

                  x_projected = .true.

                  x(i) = lower_bound(i)

               END IF

               nbdd = nbdd + 1

            ELSE IF (nbd(i) >= 2 .AND. x(i) >= upper_bound(i)) THEN

               IF (x(i) > upper_bound(i)) THEN

                  x_projected = .true.

                  x(i) = upper_bound(i)

               END IF

               nbdd = nbdd + 1

            END IF

         END IF

      END DO


!     Initialize iwhere and assign values to constrained and boxed.


      DO i = 1, n

         IF (nbd(i) /= 2) boxed = .false.

         IF (nbd(i) == 0) THEN

!                                this variable is always free

            iwhere(i) = -1


!           otherwise set x(i)=mid(x(i), u(i), l(i)).

         ELSE

            constrained = .true.

            IF (nbd(i) == 2 .AND. upper_bound(i) - lower_bound(i) <= zero) THEN

!                   this variable is always fixed

               iwhere(i) = 3

            ELSE

               iwhere(i) = 0

            END IF

         END IF

      END DO


      IF (iprint >= 0) THEN

         IF (x_projected) WRITE (*, *)                                        &

     &   'The initial X is infeasible.  Restart with its projection.'

         IF (.NOT. constrained) &

            WRITE (*, *) 'This problem is unconstrained.'

      END IF


      IF (iprint > 0) WRITE (*, 1001) nbdd


1001  FORMAT(/, 'At X0 ', i9, ' variables are exactly at the bounds')


      RETURN


   END SUBROUTINE active


! **************************************************************************************************

!> \brief       This subroutine computes the product of the 2m x 2m middle matrix

!>              in the compact L-BFGS formula of B and a 2m vector v;

!>              it returns the product in p.

!> \param m     m is the maximum number of variable metric corrections

!>              used to define the limited memory matrix.

!> \param sy    sy specifies the matrix S'Y.

!> \param wt    wt specifies the upper triangular matrix J' which is

!>              the Cholesky factor of (thetaS'S+LD^(-1)L').

!> \param col   col specifies the number of s-vectors (or y-vectors)

!>              stored in the compact L-BFGS formula.

!> \param v     v specifies vector v.

!> \param p     p is the product Mv.

!> \param info  info = 0 for normal return,

!>                   = nonzero for abnormal return when the system to be solved by dtrsl is singular.

!> \author      NEOS, November 1994. (Latest revision June 1996.)

!>              Optimization Technology Center.

!>              Argonne National Laboratory and Northwestern University.

!>              Written by

!>                          Ciyou Zhu

!>              in collaboration with R.H. Byrd, P. Lu-Chen and J. Nocedal.

! **************************************************************************************************

   SUBROUTINE bmv(m, sy, wt, col, v, p, info)


      INTEGER                                            :: m

      REAL(kind=dp)                                      :: sy(m, m), wt(m, m)

      INTEGER                                            :: col

      REAL(kind=dp), INTENT(in)                          :: v(2*col)

      REAL(kind=dp), INTENT(out)                         :: p(2*col)

      INTEGER, INTENT(out)                               :: info


      INTEGER                                            :: i, i2, k

      REAL(kind=dp)                                      :: sum


      IF (col == 0) RETURN


!     PART I: solve [  D^(1/2)      O ] [ p1 ] = [ v1 ]

!                   [ -L*D^(-1/2)   J ] [ p2 ]   [ v2 ].


!       solve Jp2=v2+LD^(-1)v1.

      p(col + 1) = v(col + 1)

      DO i = 2, col

         i2 = col + i

         sum = 0.0_dp

         DO k = 1, i - 1

            sum = sum + sy(i, k)*v(k)/sy(k, k)

         END DO

         p(i2) = v(i2) + sum

      END DO

!     Solve the triangular system

      CALL dtrsl(wt, m, col, p(col + 1), 11, info)

      IF (info /= 0) RETURN


!       solve D^(1/2)p1=v1.

      DO i = 1, col

         p(i) = v(i)/sqrt(sy(i, i))

      END DO


!     PART II: solve [ -D^(1/2)   D^(-1/2)*L'  ] [ p1 ] = [ p1 ]

!                    [  0         J'           ] [ p2 ]   [ p2 ].


!       solve J^Tp2=p2.

      CALL dtrsl(wt, m, col, p(col + 1), 01, info)

      IF (info /= 0) RETURN


!       compute p1=-D^(-1/2)(p1-D^(-1/2)L'p2)

!                 =-D^(-1/2)p1+D^(-1)L'p2.

      DO i = 1, col

         p(i) = -p(i)/sqrt(sy(i, i))

      END DO

      DO i = 1, col

         sum = 0._dp

         DO k = i + 1, col

            sum = sum + sy(k, i)*p(col + k)/sy(i, i)

         END DO

         p(i) = p(i) + sum

      END DO


      RETURN


   END SUBROUTINE bmv


! **************************************************************************************************

!> \brief        For given x, l, u, g (with g_inf_norm > 0), and a limited memory

!>               BFGS matrix B defined in terms of matrices WY, WS, WT, and

!>               scalars head, col, and theta, this subroutine computes the

!>               generalized Cauchy point (GCP), defined as the first local

!>               minimizer of the quadratic

!>

!>                    Q(x + s) = g's + 1/2 s'Bs

!>

!>               along the projected gradient direction P(x-tg,l,u).

!>               The routine returns the GCP in xcp.

!> \param n      n is the dimension of the problem.

!> \param x      x is the starting point for the GCP computation.

!> \param lower_bound  the lower bound on x.

!> \param upper_bound  the upper bound on x.

!> \param nbd    nbd represents the type of bounds imposed on the

!>               variables, and must be specified as follows:

!>               nbd(i)=0 if x(i) is unbounded,

!>                      1 if x(i) has only a lower bound,

!>                      2 if x(i) has both lower and upper bounds, and

!>                      3 if x(i) has only an upper bound.

!> \param g      g is the gradient of f(x).  g must be a nonzero vector.

!> \param iorder iorder will be used to store the breakpoints in the piecewise

!>               linear path and free variables encountered. On exit,

!>               iorder(1),...,iorder(nleft) are indices of breakpoints

!>                                which have not been encountered;

!>               iorder(nleft+1),...,iorder(nbreak) are indices of

!>                                     encountered breakpoints; and

!>               iorder(nfree),...,iorder(n) are indices of variables which

!>               have no bound constraits along the search direction.

!> \param iwhere On entry iwhere indicates only the permanently fixed (iwhere=3)

!>               or free (iwhere= -1) components of x.

!>               On exit iwhere records the status of the current x variables.

!>               iwhere(i)=-3  if x(i) is free and has bounds, but is not moved

!>                          0   if x(i) is free and has bounds, and is moved

!>                          1   if x(i) is fixed at l(i), and l(i) .ne. u(i)

!>                          2   if x(i) is fixed at u(i), and u(i) .ne. l(i)

!>                          3   if x(i) is always fixed, i.e.,  u(i)=x(i)=l(i)

!>                         -1  if x(i) is always free, i.e., it has no bounds.

!> \param t      t will be used to store the break points.

!> \param d      d is used to store the Cauchy direction P(x-tg)-x.

!> \param xcp    is a double precision array of dimension n used to return the GCP on exit.

!> \param m      m is the maximum number of variable metric corrections used to define the limited memory matrix.

!> \param wy     ws, wy, sy, and wt are double precision arrays.

!>               On entry they store information that defines the limited memory BFGS matrix:

!>               wy(n,m) stores Y, a set of y-vectors;

!> \param ws     ws(n,m) stores S, a set of s-vectors;

!> \param sy     sy(m,m) stores S'Y;

!> \param wt     wt(m,m) stores the Cholesky factorization of (theta*S'S+LD^(-1)L').

!> \param theta  theta is the scaling factor specifying B_0 = theta I.

!> \param col    col is the actual number of variable metric corrections stored so far.

!> \param head   head is the location of the first s-vector (or y-vector in S (or Y)

!> \param p      p will be used to store the vector p = W^(T)d.

!> \param c      c will be used to store the vector c = W^(T)(xcp-x).

!> \param wbp    wbp will be used to store the row of W corresponding to a breakpoint.

!> \param v      v is a double precision working array.

!> \param nseg   On exit nseg records the number of quadratic segments explored in searching for the GCP.

!> \param iprint iprint is an INTEGER variable that must be set by the user.

!>               It controls the frequency and type of output generated:

!>               iprint<0    no output is generated;

!>               iprint=0    print only one line at the last iteration;

!>               0<iprint<99 print also f and |proj g| every iprint iterations;

!>               iprint=99   print details of every iteration except n-vectors;

!>               iprint=100  print also the changes of active set and final x;

!>               iprint>100  print details of every iteration including x and g;

!>               When iprint > 0, the file iterate.dat will be created to summarize the iteration.

!> \param g_inf_norm g_inf_norm is the norm of the projected gradient at x.

!> \param info   On entry info is 0.

!>               On exit info = 0       for normal return,

!>                            = nonzero for abnormal return when the the system

!>                              used in routine bmv is singular.

!> \param epsmch ...

!> \author       NEOS, November 1994. (Latest revision June 1996.)

!>               Optimization Technology Center.

!>               Argonne National Laboratory and Northwestern University.

!>               Written by

!>                           Ciyou Zhu

!>               in collaboration with R.H. Byrd, P. Lu-Chen and J. Nocedal.

! **************************************************************************************************

   SUBROUTINE cauchy(n, x, lower_bound, upper_bound, nbd, g, iorder, iwhere, t, d, xcp, &

                     m, wy, ws, sy, wt, theta, col, head, p, c, wbp, &

                     v, nseg, iprint, g_inf_norm, info, epsmch)

      INTEGER, INTENT(in)                                :: n

      REAL(kind=dp), INTENT(in)                          :: x(n), lower_bound(n), upper_bound(n)

      INTEGER, INTENT(in)                                :: nbd(n)

      REAL(kind=dp), INTENT(in)                          :: g(n)

      INTEGER                                            :: iorder(n)

      INTEGER, INTENT(inout)                             :: iwhere(n)

      REAL(kind=dp)                                      :: t(n), d(n), xcp(n)

      INTEGER, INTENT(in)                                :: m

      REAL(kind=dp), INTENT(in)                          :: sy(m, m), wt(m, m), theta

      INTEGER, INTENT(in)                                :: col

      REAL(kind=dp), INTENT(in)                          :: ws(n, col), wy(n, col)

      INTEGER, INTENT(in)                                :: head

      REAL(kind=dp)                                      :: p(2*m), c(2*m), wbp(2*m), v(2*m)

      INTEGER                                            :: nseg, iprint

      REAL(kind=dp), INTENT(in)                          :: g_inf_norm

      INTEGER, INTENT(inout)                             :: info

      REAL(kind=dp)                                      :: epsmch


      REAL(kind=dp), PARAMETER                           :: one = 1.0_dp, zero = 0.0_dp


      INTEGER                                            :: col2, i, ibkmin, ibp, iter, j, nbreak, &

                                                            nfree, nleft, pointr

      LOGICAL                                            :: bnded, xlower, xupper

      REAL(kind=dp)                                      :: bkmin, ddot, dibp, dibp2, dt, dtm, f1, &

                                                            f2, f2_org, neggi, tj, tj0, tl, tsum, &

                                                            tu, wmc, wmp, wmw, zibp


!     References:

!

!       [1] R. H. Byrd, P. Lu, J. Nocedal and C. Zhu, ``A limited

!       memory algorithm for bound constrained optimization'',

!       SIAM J. Scientific Computing 16 (1995), no. 5, pp. 1190--1208.

!

!       [2] C. Zhu, R.H. Byrd, P. Lu, J. Nocedal, ``L-BFGS-B: FORTRAN

!       Subroutines for Large Scale Bound Constrained Optimization''

!       Tech. Report, NAM-11, EECS Department, Northwestern University,

!       1994.

!

!       (Postscript files of these papers are available via anonymous

!        ftp to eecs.nwu.edu in the directory pub/lbfgs/lbfgs_bcm.)

!

!                           *  *  *

!     Check the status of the variables, reset iwhere(i) if necessary;

!       compute the Cauchy direction d and the breakpoints t; initialize

!       the derivative f1 and the vector p = W'd (for theta = 1).


      IF (g_inf_norm <= zero) THEN

         IF (iprint >= 0) WRITE (*, *) 'Subgnorm = 0.  GCP = X.'

         CALL dcopy(n, x, 1, xcp, 1)

         RETURN

      END IF

      bnded = .true.

      nfree = n + 1

      nbreak = 0

      ibkmin = 0

      bkmin = zero

      col2 = 2*col

      f1 = zero

      IF (iprint >= 99) WRITE (*, 3010)


!     We set p to zero and build it up as we determine d.


      DO i = 1, col2

         p(i) = zero

      END DO


!     In the following loop we determine for each variable its bound

!        status and its breakpoint, and update p accordingly.

!        Smallest breakpoint is identified.


      DO i = 1, n

         neggi = -g(i)

         IF (iwhere(i) /= 3 .AND. iwhere(i) /= -1) THEN

!             if x(i) is not a constant and has bounds,

!             compute the difference between x(i) and its bounds.

            IF (nbd(i) <= 2) tl = x(i) - lower_bound(i)

            IF (nbd(i) >= 2) tu = upper_bound(i) - x(i)


!           If a variable is close enough to a bound

!             we treat it as at bound.

            xlower = nbd(i) <= 2 .AND. tl <= zero

            xupper = nbd(i) >= 2 .AND. tu <= zero


!              reset iwhere(i).

            iwhere(i) = 0

            IF (xlower) THEN

               IF (neggi <= zero) iwhere(i) = 1

            ELSE IF (xupper) THEN

               IF (neggi >= zero) iwhere(i) = 2

            ELSE

               IF (abs(neggi) <= zero) iwhere(i) = -3

            END IF

         END IF

         pointr = head

         IF (iwhere(i) /= 0 .AND. iwhere(i) /= -1) THEN

            d(i) = zero

         ELSE

            d(i) = neggi

            f1 = f1 - neggi*neggi

!             calculate p := p - W'e_i* (g_i).

            DO j = 1, col

               p(j) = p(j) + wy(i, pointr)*neggi

               p(col + j) = p(col + j) + ws(i, pointr)*neggi

               pointr = mod(pointr, m) + 1

            END DO

            IF (nbd(i) <= 2 .AND. nbd(i) /= 0                       &

     &                        .AND. neggi < zero) THEN

!                                 x(i) + d(i) is bounded; compute t(i).

               nbreak = nbreak + 1

               iorder(nbreak) = i

               t(nbreak) = tl/(-neggi)

               IF (nbreak == 1 .OR. t(nbreak) < bkmin) THEN

                  bkmin = t(nbreak)

                  ibkmin = nbreak

               END IF

            ELSE IF (nbd(i) >= 2 .AND. neggi > zero) THEN

!                                 x(i) + d(i) is bounded; compute t(i).

               nbreak = nbreak + 1

               iorder(nbreak) = i

               t(nbreak) = tu/neggi

               IF (nbreak == 1 .OR. t(nbreak) < bkmin) THEN

                  bkmin = t(nbreak)

                  ibkmin = nbreak

               END IF

            ELSE

!                x(i) + d(i) is not bounded.

               nfree = nfree - 1

               iorder(nfree) = i

               IF (abs(neggi) > zero) bnded = .false.

            END IF

         END IF

      END DO


!     The indices of the nonzero components of d are now stored

!       in iorder(1),...,iorder(nbreak) and iorder(nfree),...,iorder(n).

!       The smallest of the nbreak breakpoints is in t(ibkmin)=bkmin.


      IF (theta /= one) THEN

!                   complete the initialization of p for theta not= one.

         CALL dscal(col, theta, p(col + 1), 1)

      END IF


!     Initialize GCP xcp = x.


      CALL dcopy(n, x, 1, xcp, 1)


      IF (nbreak == 0 .AND. nfree == n + 1) THEN

!                  is a zero vector, return with the initial xcp as GCP.

         IF (iprint > 100) WRITE (*, 1010) (xcp(i), i=1, n)

         RETURN

      END IF


!     Initialize c = W'(xcp - x) = 0.


      DO j = 1, col2

         c(j) = zero

      END DO


!     Initialize derivative f2.


      f2 = -theta*f1

      f2_org = f2

      IF (col > 0) THEN

         CALL bmv(m, sy, wt, col, p, v, info)

         IF (info /= 0) RETURN

         f2 = f2 - ddot(col2, v, 1, p, 1)

      END IF

      dtm = -f1/f2

      tsum = zero

      nseg = 1

      IF (iprint >= 99) &

         WRITE (*, *) 'There are ', nbreak, '  breakpoints '


      nleft = nbreak

      iter = 1


      tj = zero


!     If there are no breakpoints, locate the GCP and return.


      IF (nleft == 0) THEN

         IF (iprint >= 99) THEN

            WRITE (*, *)

            WRITE (*, *) 'GCP found in this segment'

            WRITE (*, 4010) nseg, f1, f2

            WRITE (*, 6010) dtm

         END IF

         IF (dtm <= zero) dtm = zero

         tsum = tsum + dtm


!        Move free variables (i.e., the ones w/o breakpoints) and

!          the variables whose breakpoints haven't been reached.


         CALL daxpy(n, tsum, d, 1, xcp, 1)

      END IF


      DO WHILE (nleft > 0)


!     Find the next smallest breakpoint;

!       compute dt = t(nleft) - t(nleft + 1).


         tj0 = tj

         IF (iter == 1) THEN

!         Since we already have the smallest breakpoint we need not do

!         heapsort yet. Often only one breakpoint is used and the

!         cost of heapsort is avoided.

            tj = bkmin

            ibp = iorder(ibkmin)

         ELSE

            IF (iter == 2) THEN

!             Replace the already used smallest breakpoint with the

!             breakpoint numbered nbreak > nlast, before heapsort call.

               IF (ibkmin /= nbreak) THEN

                  t(ibkmin) = t(nbreak)

                  iorder(ibkmin) = iorder(nbreak)

               END IF

!        Update heap structure of breakpoints

!           (if iter=2, initialize heap).

            END IF

            CALL hpsolb(nleft, t, iorder, iter - 2)

            tj = t(nleft)

            ibp = iorder(nleft)

         END IF


         dt = tj - tj0


         IF (dt /= zero .AND. iprint >= 100) THEN

            WRITE (*, 4011) nseg, f1, f2

            WRITE (*, 5010) dt

            WRITE (*, 6010) dtm

         END IF


!     If a minimizer is within this interval, locate the GCP and return.


         IF (dtm < dt) THEN

            IF (iprint >= 99) THEN

               WRITE (*, *)

               WRITE (*, *) 'GCP found in this segment'

               WRITE (*, 4010) nseg, f1, f2

               WRITE (*, 6010) dtm

            END IF

            IF (dtm <= zero) dtm = zero

            tsum = tsum + dtm


!        Move free variables (i.e., the ones w/o breakpoints) and

!          the variables whose breakpoints haven't been reached.


            CALL daxpy(n, tsum, d, 1, xcp, 1)

            EXIT

         END IF


!     Otherwise fix one variable and

!       reset the corresponding component of d to zero.


         tsum = tsum + dt

         nleft = nleft - 1

         iter = iter + 1

         dibp = d(ibp)

         d(ibp) = zero

         IF (dibp > zero) THEN

            zibp = upper_bound(ibp) - x(ibp)

            xcp(ibp) = upper_bound(ibp)

            iwhere(ibp) = 2

         ELSE

            zibp = lower_bound(ibp) - x(ibp)

            xcp(ibp) = lower_bound(ibp)

            iwhere(ibp) = 1

         END IF

         IF (iprint >= 100) WRITE (*, *) 'Variable  ', ibp, '  is fixed.'

         IF (nleft == 0 .AND. nbreak == n) THEN

!                                             all n variables are fixed,

!                                                return with xcp as GCP.

            dtm = dt

            EXIT

         END IF


!     Update the derivative information.


         nseg = nseg + 1

         dibp2 = dibp**2


!     Update f1 and f2.


!        temporarily set f1 and f2 for col=0.

         f1 = f1 + dt*f2 + dibp2 - theta*dibp*zibp

         f2 = f2 - theta*dibp2


         IF (col > 0) THEN

!                          update c = c + dt*p.

            CALL daxpy(col2, dt, p, 1, c, 1)


!           choose wbp,

!           the row of W corresponding to the breakpoint encountered.

            pointr = head

            DO j = 1, col

               wbp(j) = wy(ibp, pointr)

               wbp(col + j) = theta*ws(ibp, pointr)

               pointr = mod(pointr, m) + 1

            END DO


!           compute (wbp)Mc, (wbp)Mp, and (wbp)M(wbp)'.

            CALL bmv(m, sy, wt, col, wbp, v, info)

            IF (info /= 0) RETURN

            wmc = ddot(col2, c, 1, v, 1)

            wmp = ddot(col2, p, 1, v, 1)

            wmw = ddot(col2, wbp, 1, v, 1)


!           update p = p - dibp*wbp.

            CALL daxpy(col2, -dibp, wbp, 1, p, 1)


!           complete updating f1 and f2 while col > 0.

            f1 = f1 + dibp*wmc

            f2 = f2 + 2.0_dp*dibp*wmp - dibp2*wmw

         END IF


         f2 = max(epsmch*f2_org, f2)

         IF (nleft > 0) THEN

            dtm = -f1/f2

            cycle

!                 to repeat the loop for unsearched intervals.

         ELSE

            IF (bnded) THEN

               f1 = zero

               f2 = zero

               dtm = zero

            ELSE

               dtm = -f1/f2

            END IF

            IF (iprint >= 99) THEN

               WRITE (*, *)

               WRITE (*, *) 'GCP found in this segment'

               WRITE (*, 4010) nseg, f1, f2

               WRITE (*, 6010) dtm

            END IF

            IF (dtm <= zero) dtm = zero

            tsum = tsum + dtm


!        Move free variables (i.e., the ones w/o breakpoints) and

!          the variables whose breakpoints haven't been reached.


            CALL daxpy(n, tsum, d, 1, xcp, 1)

            EXIT

         END IF

      END DO


!     Update c = c + dtm*p = W'(x^c - x)

!       which will be used in computing r = Z'(B(x^c - x) + g).


      IF (col > 0) CALL daxpy(col2, dtm, p, 1, c, 1)

      IF (iprint > 100) WRITE (*, 1010) (xcp(i), i=1, n)

      IF (iprint >= 99) WRITE (*, 2010)


1010  FORMAT('Cauchy X =  ', /, (4x, 1p, 6(1x, d11.4)))

2010  FORMAT(/, '---------------- exit CAUCHY----------------------',/)

3010  FORMAT(/, '---------------- CAUCHY entered-------------------')

4010  FORMAT('Piece    ', i3, ' --f1, f2 at start point ', 1p, 2(1x, d11.4))

4011  FORMAT(/, 'Piece    ', i3, ' --f1, f2 at start point ', &

              1p, 2(1x, d11.4))

5010  FORMAT('Distance to the next break point =  ', 1p, d11.4)

6010  FORMAT('Distance to the stationary point =  ', 1p, d11.4)


      RETURN


   END SUBROUTINE cauchy


! **************************************************************************************************

!> \brief        This subroutine computes r=-Z'B(xcp-xk)-Z'g by using

!>               wa(2m+1)=W'(xcp-x) from subroutine cauchy.

!> \param n ...

!> \param m ...

!> \param x ...

!> \param g ...

!> \param ws ...

!> \param wy ...

!> \param sy ...

!> \param wt ...

!> \param z ...

!> \param r ...

!> \param wa ...

!> \param index ...

!> \param theta ...

!> \param col ...

!> \param head ...

!> \param nfree ...

!> \param constrained ...

!> \param info ...

!> \author       NEOS, November 1994. (Latest revision June 1996.)

!>               Optimization Technology Center.

!>               Argonne National Laboratory and Northwestern University.

!>               Written by

!>                           Ciyou Zhu

!>               in collaboration with R.H. Byrd, P. Lu-Chen and J. Nocedal.

! **************************************************************************************************

   SUBROUTINE cmprlb(n, m, x, g, ws, wy, sy, wt, z, r, wa, index, &

                     theta, col, head, nfree, constrained, info)


      INTEGER, INTENT(in)                                :: n, m

      REAL(kind=dp), INTENT(in)                          :: x(n), g(n), ws(n, m), wy(n, m), &

                                                            sy(m, m), wt(m, m), z(n)

      REAL(kind=dp), INTENT(out)                         :: r(n), wa(4*m)

      INTEGER, INTENT(in)                                :: index(n)

      REAL(kind=dp), INTENT(in)                          :: theta

      INTEGER, INTENT(in)                                :: col, head, nfree

      LOGICAL, INTENT(in)                                :: constrained

      INTEGER                                            :: info


      INTEGER                                            :: i, j, k, pointr

      REAL(kind=dp)                                      :: a1, a2


      IF (.NOT. constrained .AND. col > 0) THEN

         DO i = 1, n

            r(i) = -g(i)

         END DO

      ELSE

         DO i = 1, nfree

            k = index(i)

            r(i) = -theta*(z(k) - x(k)) - g(k)

         END DO

         CALL bmv(m, sy, wt, col, wa(2*m + 1), wa(1), info)

         IF (info /= 0) THEN

            info = -8

            RETURN

         END IF

         pointr = head

         DO j = 1, col

            a1 = wa(j)

            a2 = theta*wa(col + j)

            DO i = 1, nfree

               k = index(i)

               r(i) = r(i) + wy(k, pointr)*a1 + ws(k, pointr)*a2

            END DO

            pointr = mod(pointr, m) + 1

         END DO

      END IF


      RETURN


   END SUBROUTINE cmprlb


! **************************************************************************************************

!> \brief       This subroutine checks the validity of the input data.

!> \param n ...

!> \param m ...

!> \param factr ...

!> \param lower_bound  the lower bound on x.

!> \param upper_bound  the upper bound on x.

!> \param nbd ...

!> \param task ...

!> \param info ...

!> \param k ...

!> \author      NEOS, November 1994. (Latest revision June 1996.)

!>              Optimization Technology Center.

!>              Argonne National Laboratory and Northwestern University.

!>              Written by

!>                          Ciyou Zhu

!>              in collaboration with R.H. Byrd, P. Lu-Chen and J. Nocedal.

! **************************************************************************************************

   SUBROUTINE errclb(n, m, factr, lower_bound, upper_bound, nbd, task, info, k)


      INTEGER, INTENT(in)                                :: n, m

      REAL(kind=dp), INTENT(in)                          :: factr, lower_bound(n), upper_bound(n)

      INTEGER                                            :: nbd(n)

      CHARACTER(LEN=60)                                  :: task

      INTEGER                                            :: info, k


      REAL(kind=dp), PARAMETER                           :: zero = 0.0_dp


      INTEGER                                            :: i


!     Check the input arguments for errors.


      IF (n <= 0) task = 'ERROR: N <= 0'

      IF (m <= 0) task = 'ERROR: M <= 0'

      IF (factr < zero) task = 'ERROR: FACTR < 0'


!     Check the validity of the arrays nbd(i), u(i), and l(i).


      DO i = 1, n

         IF (nbd(i) < 0 .OR. nbd(i) > 3) THEN

!                                                   return

            task = 'ERROR: INVALID NBD'

            info = -6

            k = i

         END IF

         IF (nbd(i) == 2) THEN

            IF (lower_bound(i) > upper_bound(i)) THEN

!                                    return

               task = 'ERROR: NO FEASIBLE SOLUTION'

               info = -7

               k = i

            END IF

         END IF

      END DO


      RETURN


   END SUBROUTINE errclb


! **************************************************************************************************

!> \brief        This subroutine forms  the LEL^T factorization of the indefinite

!>               matrix    K = [-D -Y'ZZ'Y/theta     L_a'-R_z'  ]

!>                             [L_a -R_z           theta*S'AA'S ]

!>               where     E = [-I  0]

!>                             [ 0  I]

!>               The matrix K can be shown to be equal to the matrix M^[-1]N

!>               occurring in section 5.1 of [1], as well as to the matrix

!>               Mbar^[-1] Nbar in section 5.3.

!> \param n      n is the dimension of the problem.

!> \param nsub   nsub is the number of subspace variables in free set.

!> \param ind    ind specifies the indices of subspace variables.

!> \param nenter nenter is the number of variables entering the free set.

!> \param ileave indx2(ileave),...,indx2(n) are the variables leaving the free set.

!> \param indx2  indx2(1),...,indx2(nenter) are the variables entering the free set,

!>               while indx2(ileave),...,indx2(n) are the variables leaving the free set.

!> \param iupdat iupdat is the total number of BFGS updates made so far.

!> \param updatd 'updatd' is true if the L-BFGS matrix is updatd.

!> \param wn     the upper triangle of wn stores the LEL^T factorization

!>               of the 2*col x 2*col indefinite matrix

!>                     [-D -Y'ZZ'Y/theta     L_a'-R_z'  ]

!>                     [L_a -R_z           theta*S'AA'S ]

!> \param wn1    On entry wn1 stores the lower triangular part of

!>                     [Y' ZZ'Y   L_a'+R_z']

!>                     [L_a+R_z   S'AA'S   ]

!>               in the previous iteration.

!>               On exit wn1 stores the corresponding updated matrices.

!>               The purpose of wn1 is just to store these inner products

!>               so they can be easily updated and inserted into wn.

!> \param m      m is the maximum number of variable metric corrections

!>               used to define the limited memory matrix.

!> \param ws     ws(n,m) stores S, a set of s-vectors;

!> \param wy     wy(n,m) stores Y, a set of y-vectors;

!> \param sy     sy(m,m) stores S'Y;

!> \param theta  is the scaling factor specifying B_0 = theta I;

!> \param col    is the number of variable metric corrections stored;

!> \param head   is the location of the 1st s- (or y-) vector in S (or Y).

!> \param info   info =  0 for normal return;

!>                    = -1 when the 1st Cholesky factorization failed;

!>                    = -2 when the 2st Cholesky factorization failed.

!> \author       NEOS, November 1994. (Latest revision June 1996.)

!>               Optimization Technology Center.

!>               Argonne National Laboratory and Northwestern University.

!>               Written by

!>                           Ciyou Zhu

!>               in collaboration with R.H. Byrd, P. Lu-Chen and J. Nocedal.

! **************************************************************************************************

   SUBROUTINE formk(n, nsub, ind, nenter, ileave, indx2, iupdat, &

                    updatd, wn, wn1, m, ws, wy, sy, theta, col, &

                    head, info)


      INTEGER, INTENT(in)                                :: n, nsub, ind(n), nenter, ileave, &

                                                            indx2(n), iupdat

      LOGICAL                                            :: updatd

      INTEGER, INTENT(in)                                :: m

      REAL(kind=dp)                                      :: wn1(2*m, 2*m)

      REAL(kind=dp), INTENT(out)                         :: wn(2*m, 2*m)

      REAL(kind=dp), INTENT(in)                          :: ws(n, m), wy(n, m), sy(m, m), theta

      INTEGER, INTENT(in)                                :: col, head

      INTEGER, INTENT(out)                               :: info


      REAL(kind=dp), PARAMETER                           :: zero = 0.0_dp


      INTEGER                                            :: col2, dbegin, dend, i, ipntr, is, is1, &

                                                            iy, jpntr, js, js1, jy, k, k1, m2, &

                                                            pbegin, pend, upcl

      REAL(kind=dp)                                      :: ddot, temp1, temp2, temp3, temp4


!     References:

!       [1] R. H. Byrd, P. Lu, J. Nocedal and C. Zhu, ``A limited

!       memory algorithm for bound constrained optimization'',

!       SIAM J. Scientific Computing 16 (1995), no. 5, pp. 1190--1208.

!

!       [2] C. Zhu, R.H. Byrd, P. Lu, J. Nocedal, ``L-BFGS-B: a

!       limited memory FORTRAN code for solving bound constrained

!       optimization problems'', Tech. Report, NAM-11, EECS Department,

!       Northwestern University, 1994.

!

!       (Postscript files of these papers are available via anonymous

!        ftp to eecs.nwu.edu in the directory pub/lbfgs/lbfgs_bcm.)

!

!                           *  *  *

!     Form the lower triangular part of

!               WN1 = [Y' ZZ'Y   L_a'+R_z']

!                     [L_a+R_z   S'AA'S   ]

!        where L_a is the strictly lower triangular part of S'AA'Y

!              R_z is the upper triangular part of S'ZZ'Y.


      IF (updatd) THEN

         IF (iupdat > m) THEN

!                                 shift old part of WN1.

            DO jy = 1, m - 1

               js = m + jy

               CALL dcopy(m - jy, wn1(jy + 1, jy + 1), 1, wn1(jy, jy), 1)

               CALL dcopy(m - jy, wn1(js + 1, js + 1), 1, wn1(js, js), 1)

               CALL dcopy(m - 1, wn1(m + 2, jy + 1), 1, wn1(m + 1, jy), 1)

            END DO

         END IF


!          put new rows in blocks (1,1), (2,1) and (2,2).

         pbegin = 1

         pend = nsub

         dbegin = nsub + 1

         dend = n

         iy = col

         is = m + col

         ipntr = head + col - 1

         IF (ipntr > m) ipntr = ipntr - m

         jpntr = head

         DO jy = 1, col

            js = m + jy

            temp1 = zero

            temp2 = zero

            temp3 = zero

!             compute element jy of row 'col' of Y'ZZ'Y

            DO k = pbegin, pend

               k1 = ind(k)

               temp1 = temp1 + wy(k1, ipntr)*wy(k1, jpntr)

            END DO

!             compute elements jy of row 'col' of L_a and S'AA'S

            DO k = dbegin, dend

               k1 = ind(k)

               temp2 = temp2 + ws(k1, ipntr)*ws(k1, jpntr)

               temp3 = temp3 + ws(k1, ipntr)*wy(k1, jpntr)

            END DO

            wn1(iy, jy) = temp1

            wn1(is, js) = temp2

            wn1(is, jy) = temp3

            jpntr = mod(jpntr, m) + 1

         END DO


!          put new column in block (2,1).

         jy = col

         jpntr = head + col - 1

         IF (jpntr > m) jpntr = jpntr - m

         ipntr = head

         DO i = 1, col

            is = m + i

            temp3 = zero

!             compute element i of column 'col' of R_z

            DO k = pbegin, pend

               k1 = ind(k)

               temp3 = temp3 + ws(k1, ipntr)*wy(k1, jpntr)

            END DO

            ipntr = mod(ipntr, m) + 1

            wn1(is, jy) = temp3

         END DO

         upcl = col - 1

      ELSE

         upcl = col

      END IF


!       modify the old parts in blocks (1,1) and (2,2) due to changes

!       in the set of free variables.

      ipntr = head

      DO iy = 1, upcl

         is = m + iy

         jpntr = head

         DO jy = 1, iy

            js = m + jy

            temp1 = zero

            temp2 = zero

            temp3 = zero

            temp4 = zero

            DO k = 1, nenter

               k1 = indx2(k)

               temp1 = temp1 + wy(k1, ipntr)*wy(k1, jpntr)

               temp2 = temp2 + ws(k1, ipntr)*ws(k1, jpntr)

            END DO

            DO k = ileave, n

               k1 = indx2(k)

               temp3 = temp3 + wy(k1, ipntr)*wy(k1, jpntr)

               temp4 = temp4 + ws(k1, ipntr)*ws(k1, jpntr)

            END DO

            wn1(iy, jy) = wn1(iy, jy) + temp1 - temp3

            wn1(is, js) = wn1(is, js) - temp2 + temp4

            jpntr = mod(jpntr, m) + 1

         END DO

         ipntr = mod(ipntr, m) + 1

      END DO


!       modify the old parts in block (2,1).

      ipntr = head

      DO is = m + 1, m + upcl

         jpntr = head

         DO jy = 1, upcl

            temp1 = zero

            temp3 = zero

            DO k = 1, nenter

               k1 = indx2(k)

               temp1 = temp1 + ws(k1, ipntr)*wy(k1, jpntr)

            END DO

            DO k = ileave, n

               k1 = indx2(k)

               temp3 = temp3 + ws(k1, ipntr)*wy(k1, jpntr)

            END DO

            IF (is <= jy + m) THEN

               wn1(is, jy) = wn1(is, jy) + temp1 - temp3

            ELSE

               wn1(is, jy) = wn1(is, jy) - temp1 + temp3

            END IF

            jpntr = mod(jpntr, m) + 1

         END DO

         ipntr = mod(ipntr, m) + 1

      END DO


!     Form the upper triangle of WN = [D+Y' ZZ'Y/theta   -L_a'+R_z' ]

!                                     [-L_a +R_z        S'AA'S*theta]


      m2 = 2*m

      DO iy = 1, col

         is = col + iy

         is1 = m + iy

         DO jy = 1, iy

            js = col + jy

            js1 = m + jy

            wn(jy, iy) = wn1(iy, jy)/theta

            wn(js, is) = wn1(is1, js1)*theta

         END DO

         DO jy = 1, iy - 1

            wn(jy, is) = -wn1(is1, jy)

         END DO

         DO jy = iy, col

            wn(jy, is) = wn1(is1, jy)

         END DO

         wn(iy, iy) = wn(iy, iy) + sy(iy, iy)

      END DO


!     Form the upper triangle of WN= [  LL'            L^-1(-L_a'+R_z')]

!                                    [(-L_a +R_z)L'^-1   S'AA'S*theta  ]


!        first Cholesky factor (1,1) block of wn to get LL'

!                          with L' stored in the upper triangle of wn.

      CALL dpofa(wn, m2, col, info)

      IF (info /= 0) THEN

         info = -1

         RETURN

      END IF

!        then form L^-1(-L_a'+R_z') in the (1,2) block.

      col2 = 2*col

      DO js = col + 1, col2

         CALL dtrsl(wn, m2, col, wn(1, js), 11, info)

      END DO


!     Form S'AA'S*theta + (L^-1(-L_a'+R_z'))'L^-1(-L_a'+R_z') in the

!        upper triangle of (2,2) block of wn.


      DO is = col + 1, col2

         DO js = is, col2

            wn(is, js) = wn(is, js) + ddot(col, wn(1, is), 1, wn(1, js), 1)

         END DO

      END DO


!     Cholesky factorization of (2,2) block of wn.


      CALL dpofa(wn(col + 1, col + 1), m2, col, info)

      IF (info /= 0) THEN

         info = -2

         RETURN

      END IF


      RETURN


   END SUBROUTINE formk


! **************************************************************************************************

!> \brief       This subroutine forms the upper half of the pos. def. and symm.

!>              T = theta*SS + L*D^(-1)*L', stores T in the upper triangle

!>              of the array wt, and performs the Cholesky factorization of T

!>              to produce J*J', with J' stored in the upper triangle of wt.

!> \param m ...

!> \param wt ...

!> \param sy ...

!> \param ss ...

!> \param col ...

!> \param theta ...

!> \param info ...

!> \author      NEOS, November 1994. (Latest revision June 1996.)

!>              Optimization Technology Center.

!>              Argonne National Laboratory and Northwestern University.

!>              Written by

!>                          Ciyou Zhu

!>              in collaboration with R.H. Byrd, P. Lu-Chen and J. Nocedal.

! **************************************************************************************************

   SUBROUTINE formt(m, wt, sy, ss, col, theta, info)


      INTEGER                                            :: m

      REAL(kind=dp)                                      :: wt(m, m), sy(m, m), ss(m, m)

      INTEGER                                            :: col

      REAL(kind=dp)                                      :: theta

      INTEGER                                            :: info


      REAL(kind=dp), PARAMETER                           :: zero = 0.0_dp


      INTEGER                                            :: i, j, k, k1

      REAL(kind=dp)                                      :: ddum


!     Form the upper half of  T = theta*SS + L*D^(-1)*L',

!        store T in the upper triangle of the array wt.


      DO j = 1, col

         wt(1, j) = theta*ss(1, j)

      END DO

      DO i = 2, col

         DO j = i, col

            k1 = min(i, j) - 1

            ddum = zero

            DO k = 1, k1

               ddum = ddum + sy(i, k)*sy(j, k)/sy(k, k)

            END DO

            wt(i, j) = ddum + theta*ss(i, j)

         END DO

      END DO


!     Cholesky factorize T to J*J' with

!        J' stored in the upper triangle of wt.


      CALL dpofa(wt, m, col, info)

      IF (info /= 0) THEN

         info = -3

      END IF


      RETURN


   END SUBROUTINE formt


! **************************************************************************************************

!> \brief        This subroutine counts the entering and leaving variables when

!>               iter > 0, and finds the index set of free and active variables

!>               at the GCP.

!> \param n ...

!> \param nfree ...

!> \param index  for i=1,...,nfree, index(i) are the indices of free variables

!>               for i=nfree+1,...,n, index(i) are the indices of bound variables

!>               On entry after the first iteration, index gives

!>               the free variables at the previous iteration.

!>               On exit it gives the free variables based on the determination

!>               in cauchy using the array iwhere.

!> \param nenter ...

!> \param ileave ...

!> \param indx2  On exit with iter>0, indx2 indicates which variables

!>               have changed status since the previous iteration.

!>               For i= 1,...,nenter, indx2(i) have changed from bound to free.

!>               For i= ileave+1,...,n, indx2(i) have changed from free to bound.

!> \param iwhere ...

!> \param wrk ...

!> \param updatd ...

!> \param constrained     A variable indicating whether bounds are present

!> \param iprint ...

!> \param iter ...

!> \author       NEOS, November 1994. (Latest revision June 1996.)

!>               Optimization Technology Center.

!>               Argonne National Laboratory and Northwestern University.

!>               Written by

!>                           Ciyou Zhu

!>               in collaboration with R.H. Byrd, P. Lu-Chen and J. Nocedal.

! **************************************************************************************************

   SUBROUTINE freev(n, nfree, index, nenter, ileave, indx2, &

                    iwhere, wrk, updatd, constrained, iprint, iter)


      INTEGER                                            :: n, nfree

      INTEGER, INTENT(inout)                             :: index(n)

      INTEGER                                            :: nenter, ileave

      INTEGER, INTENT(out)                               :: indx2(n)

      INTEGER                                            :: iwhere(n)

      LOGICAL                                            :: wrk, updatd, constrained

      INTEGER                                            :: iprint, iter


      INTEGER                                            :: i, iact, k


      nenter = 0

      ileave = n + 1

      IF (iter > 0 .AND. constrained) THEN

!                           count the entering and leaving variables.

         DO i = 1, nfree

            k = index(i)


!            write(*,*) ' k  = index(i) ', k

!            write(*,*) ' index = ', i


            IF (iwhere(k) > 0) THEN

               ileave = ileave - 1

               indx2(ileave) = k

               IF (iprint >= 100) WRITE (*, *)                         &

     &             'Variable ', k, ' leaves the set of free variables'

            END IF

         END DO

         DO i = 1 + nfree, n

            k = index(i)

            IF (iwhere(k) <= 0) THEN

               nenter = nenter + 1

               indx2(nenter) = k

               IF (iprint >= 100) WRITE (*, *)                         &

     &             'Variable ', k, ' enters the set of free variables'

            END IF

         END DO

         IF (iprint >= 99) WRITE (*, *) &

            n + 1 - ileave, ' variables leave; ', nenter, ' variables enter'

      END IF

      wrk = (ileave < n + 1) .OR. (nenter > 0) .OR. updatd


!     Find the index set of free and active variables at the GCP.


      nfree = 0

      iact = n + 1

      DO i = 1, n

         IF (iwhere(i) <= 0) THEN

            nfree = nfree + 1

            index(nfree) = i

         ELSE

            iact = iact - 1

            index(iact) = i

         END IF

      END DO

      IF (iprint >= 99) WRITE (*, *) &

         nfree, ' variables are free at GCP ', iter + 1


      RETURN


   END SUBROUTINE freev


! **************************************************************************************************

!> \brief        This subroutine sorts out the least element of t, and puts the

!>               remaining elements of t in a heap.

!> \param n      n is the dimension of the arrays t and iorder.

!> \param t      On entry t stores the elements to be sorted,

!>               On exit t(n) stores the least elements of t, and t(1) to t(n-1)

!>               stores the remaining elements in the form of a heap.

!> \param iorder On entry iorder(i) is the index of t(i).

!>               On exit iorder(i) is still the index of t(i), but iorder may be

!>               permuted in accordance with t.

!> \param iheap  iheap should be set as follows:

!>               iheap .eq. 0 if t(1) to t(n) is not in the form of a heap,

!>               iheap .ne. 0 if otherwise.

!> \author       NEOS, November 1994. (Latest revision June 1996.)

!>               Optimization Technology Center.

!>               Argonne National Laboratory and Northwestern University.

!>               Written by

!>                           Ciyou Zhu

!>               in collaboration with R.H. Byrd, P. Lu-Chen and J. Nocedal.

! **************************************************************************************************

   SUBROUTINE hpsolb(n, t, iorder, iheap)

      INTEGER, INTENT(in)                                :: n

      REAL(kind=dp), INTENT(inout)                       :: t(n)

      INTEGER, INTENT(inout)                             :: iorder(n)

      INTEGER, INTENT(in)                                :: iheap


      INTEGER                                            :: i, indxin, indxou, j, k

      REAL(kind=dp)                                      :: ddum, out


!

!     References:

!       Algorithm 232 of CACM (J. W. J. Williams): HEAPSORT.

!

!                           *  *  *


      IF (iheap == 0) THEN


!        Rearrange the elements t(1) to t(n) to form a heap.


         DO k = 2, n

            ddum = t(k)

            indxin = iorder(k)


!           Add ddum to the heap.

            i = k

            DO WHILE (i > 1)

               j = i/2

               IF (ddum < t(j)) THEN

                  t(i) = t(j)

                  iorder(i) = iorder(j)

                  i = j

               ELSE

                  EXIT

               END IF

            END DO

            t(i) = ddum

            iorder(i) = indxin

         END DO

      END IF


!     Assign to 'out' the value of t(1), the least member of the heap,

!        and rearrange the remaining members to form a heap as

!        elements 1 to n-1 of t.


      IF (n > 1) THEN

         i = 1

         out = t(1)

         indxou = iorder(1)

         ddum = t(n)

         indxin = iorder(n)


!        Restore the heap

         j = 2*i

         DO WHILE (j <= n - 1)

            IF (t(j + 1) < t(j)) j = j + 1

            IF (t(j) < ddum) THEN

               t(i) = t(j)

               iorder(i) = iorder(j)

               i = j

            ELSE

               EXIT

            END IF

            j = 2*i

         END DO

         t(i) = ddum

         iorder(i) = indxin


!     Put the least member in t(n).


         t(n) = out

         iorder(n) = indxou

      END IF


      RETURN


   END SUBROUTINE hpsolb


! **************************************************************************************************

!> \brief        This subroutine calls subroutine dcsrch from the Minpack2 library

!>               to perform the line search.  Subroutine dscrch is safeguarded so

!>               that all trial points lie within the feasible region.

!> \param n ...

!> \param lower_bound  the lower bound on x.

!> \param upper_bound  the upper bound on x.

!> \param nbd ...

!> \param x ...

!> \param f ...

!> \param fold ...

!> \param gd ...

!> \param gdold ...

!> \param g ...

!> \param d ...

!> \param r ...

!> \param t ...

!> \param z ...

!> \param stp ...

!> \param dnorm ...

!> \param dtd ...

!> \param xstep ...

!> \param step_max ...

!> \param iter ...

!> \param ifun ...

!> \param iback ...

!> \param nfgv ...

!> \param info ...

!> \param task ...

!> \param boxed ...

!> \param constrained ...

!> \param csave ...

!> \param isave ...

!> \param dsave ...

!> \author       NEOS, November 1994. (Latest revision June 1996.)

!>               Optimization Technology Center.

!>               Argonne National Laboratory and Northwestern University.

!>               Written by

!>                           Ciyou Zhu

!>               in collaboration with R.H. Byrd, P. Lu-Chen and J. Nocedal.

! **************************************************************************************************

   SUBROUTINE lnsrlb(n, lower_bound, upper_bound, nbd, x, f, fold, gd, gdold, g, d, r, t, &

                     z, stp, dnorm, dtd, xstep, step_max, iter, ifun, &

                     iback, nfgv, info, task, boxed, constrained, csave, &

                     isave, dsave)


      INTEGER, INTENT(in)                                :: n

      REAL(kind=dp), INTENT(in)                          :: lower_bound(n), upper_bound(n)

      INTEGER                                            :: nbd(n)

      REAL(kind=dp)                                      :: x(n), f, fold, gd, gdold, g(n), d(n), &

                                                            r(n), t(n), z(n), stp, dnorm, dtd, &

                                                            xstep, step_max

      INTEGER                                            :: iter, ifun, iback, nfgv, info

      CHARACTER(LEN=60)                                  :: task

      LOGICAL                                            :: boxed, constrained

      CHARACTER(LEN=60)                                  :: csave

      INTEGER                                            :: isave(2)

      REAL(kind=dp)                                      :: dsave(13)


      REAL(kind=dp), PARAMETER                           :: big = 1.0e10_dp, ftol = 1.0e-3_dp, &

                                                            gtol = 0.9_dp, one = 1.0_dp, &

                                                            xtol = 0.1_dp, zero = 0.0_dp


      INTEGER                                            :: i

      REAL(kind=dp)                                      :: a1, a2, ddot


      IF (.NOT. (task(1:5) == 'FG_LN')) THEN


         dtd = ddot(n, d, 1, d, 1)

         dnorm = sqrt(dtd)


!     Determine the maximum step length.


         step_max = big

         IF (constrained) THEN

            IF (iter == 0) THEN

               step_max = one

            ELSE

               DO i = 1, n

                  a1 = d(i)

                  IF (nbd(i) /= 0) THEN

                     IF (a1 < zero .AND. nbd(i) <= 2) THEN

                        a2 = lower_bound(i) - x(i)

                        IF (a2 >= zero) THEN

                           step_max = zero

                        ELSE IF (a1*step_max < a2) THEN

                           step_max = a2/a1

                        END IF

                     ELSE IF (a1 > zero .AND. nbd(i) >= 2) THEN

                        a2 = upper_bound(i) - x(i)

                        IF (a2 <= zero) THEN

                           step_max = zero

                        ELSE IF (a1*step_max > a2) THEN

                           step_max = a2/a1

                        END IF

                     END IF

                  END IF

               END DO

            END IF

         END IF


         IF (iter == 0 .AND. .NOT. boxed) THEN

            stp = min(one/dnorm, step_max)

         ELSE

            stp = one

         END IF


         CALL dcopy(n, x, 1, t, 1)

         CALL dcopy(n, g, 1, r, 1)

         fold = f

         ifun = 0

         iback = 0

         csave = 'START'

      END IF

      gd = ddot(n, g, 1, d, 1)

      IF (ifun == 0) THEN

         gdold = gd

         IF (gd >= zero) THEN

!                               the directional derivative >=0.

!                               Line search is impossible.

            WRITE (*, *) ' ascent direction in projection gd = ', gd

            info = -4

            RETURN

         END IF

      END IF


      CALL dcsrch(f, gd, stp, ftol, gtol, xtol, zero, step_max, csave, isave, dsave)


      xstep = stp*dnorm

      IF (csave(1:4) /= 'CONV' .AND. csave(1:4) /= 'WARN') THEN

         task = 'FG_LNSRCH'

         ifun = ifun + 1

         nfgv = nfgv + 1

         iback = ifun - 1

         IF (stp == one) THEN

            CALL dcopy(n, z, 1, x, 1)

         ELSE

            DO i = 1, n

               x(i) = stp*d(i) + t(i)

            END DO

         END IF

      ELSE

         task = 'NEW_X'

      END IF


      RETURN


   END SUBROUTINE lnsrlb


! **************************************************************************************************

!> \brief        This subroutine updates matrices WS and WY, and forms the middle matrix in B.

!> \param n ...

!> \param m ...

!> \param ws ...

!> \param wy ...

!> \param sy ...

!> \param ss ...

!> \param d ...

!> \param r ...

!> \param itail ...

!> \param iupdat ...

!> \param col ...

!> \param head ...

!> \param theta ...

!> \param rr ...

!> \param dr ...

!> \param stp ...

!> \param dtd ...

!> \author       NEOS, November 1994. (Latest revision June 1996.)

!>               Optimization Technology Center.

!>               Argonne National Laboratory and Northwestern University.

!>               Written by

!>                           Ciyou Zhu

!>               in collaboration with R.H. Byrd, P. Lu-Chen and J. Nocedal.

! **************************************************************************************************

   SUBROUTINE matupd(n, m, ws, wy, sy, ss, d, r, itail, &

                     iupdat, col, head, theta, rr, dr, stp, dtd)


      INTEGER                                            :: n, m

      REAL(kind=dp)                                      :: ws(n, m), wy(n, m), sy(m, m), ss(m, m), &

                                                            d(n), r(n)

      INTEGER                                            :: itail, iupdat, col, head

      REAL(kind=dp)                                      :: theta, rr, dr, stp, dtd


      REAL(kind=dp), PARAMETER                           :: one = 1.0_dp


      INTEGER                                            :: j, pointr

      REAL(kind=dp)                                      :: ddot


!     ************

!     Set pointers for matrices WS and WY.


      IF (iupdat <= m) THEN

         col = iupdat

         itail = mod(head + iupdat - 2, m) + 1

      ELSE

         itail = mod(itail, m) + 1

         head = mod(head, m) + 1

      END IF


!     Update matrices WS and WY.


      CALL dcopy(n, d, 1, ws(1, itail), 1)

      CALL dcopy(n, r, 1, wy(1, itail), 1)


!     Set theta=yy/ys.


      theta = rr/dr


!     Form the middle matrix in B.


!        update the upper triangle of SS,

!                                         and the lower triangle of SY:

      IF (iupdat > m) THEN

!                              move old information

         DO j = 1, col - 1

            CALL dcopy(j, ss(2, j + 1), 1, ss(1, j), 1)

            CALL dcopy(col - j, sy(j + 1, j + 1), 1, sy(j, j), 1)

         END DO

      END IF

!        add new information: the last row of SY

!                                             and the last column of SS:

      pointr = head

      DO j = 1, col - 1

         sy(col, j) = ddot(n, d, 1, wy(1, pointr), 1)

         ss(j, col) = ddot(n, ws(1, pointr), 1, d, 1)

         pointr = mod(pointr, m) + 1

      END DO

      IF (stp == one) THEN

         ss(col, col) = dtd

      ELSE

         ss(col, col) = stp*stp*dtd

      END IF

      sy(col, col) = dr


      RETURN


   END SUBROUTINE matupd


! **************************************************************************************************

!> \brief        This subroutine prints the input data, initial point, upper and

!>               lower bounds of each variable, machine precision, as well as

!>               the headings of the output.

!>

!> \param n ...

!> \param m ...

!> \param lower_bound  the lower bound on x.

!> \param upper_bound  the upper bound on x.

!> \param x ...

!> \param iprint ...

!> \param itfile ...

!> \param epsmch ...

!> \author       NEOS, November 1994. (Latest revision June 1996.)

!>               Optimization Technology Center.

!>               Argonne National Laboratory and Northwestern University.

!>               Written by

!>                           Ciyou Zhu

!>               in collaboration with R.H. Byrd, P. Lu-Chen and J. Nocedal.

! **************************************************************************************************

   SUBROUTINE prn1lb(n, m, lower_bound, upper_bound, x, iprint, itfile, epsmch)


      INTEGER, INTENT(in)                                :: n, m

      REAL(kind=dp), INTENT(in)                          :: lower_bound(n), upper_bound(n), x(n)

      INTEGER                                            :: iprint, itfile

      REAL(kind=dp)                                      :: epsmch


      INTEGER                                            :: i


      IF (iprint >= 0) THEN

         WRITE (*, 7001) epsmch

         WRITE (*, *) 'N = ', n, '    M = ', m

         IF (iprint >= 1) THEN

            WRITE (itfile, 2001) epsmch

            WRITE (itfile, *) 'N = ', n, '    M = ', m

            WRITE (itfile, 9001)

            IF (iprint > 100) THEN

               WRITE (*, 1004) 'L =', (lower_bound(i), i=1, n)

               WRITE (*, 1004) 'X0 =', (x(i), i=1, n)

               WRITE (*, 1004) 'U =', (upper_bound(i), i=1, n)

            END IF

         END IF

      END IF


1004  FORMAT(/, a4, 1p, 6(1x, d11.4), /, (4x, 1p, 6(1x, d11.4)))

2001  FORMAT('RUNNING THE L-BFGS-B CODE', /, /, &

             'it    = iteration number', /, &

             'nf    = number of function evaluations', /, &

             'nseg  = number of segments explored during the Cauchy search', /, &

             'nact  = number of active bounds at the generalized Cauchy point' &

             , /, &

             'sub   = manner in which the subspace minimization terminated:' &

             , /, '        con = converged, bnd = a bound was reached', /, &

             'itls  = number of iterations performed in the line search', /, &

             'stepl = step length used', /, &

             'tstep = norm of the displacement (total step)', /, &

             'projg = norm of the projected gradient', /, &

             'f     = function value', /, /, &

             '           * * *', /, /, &

             'Machine precision =', 1p, d10.3)

7001  FORMAT('RUNNING THE L-BFGS-B CODE', /, /, &

             '           * * *', /, /, &

             'Machine precision =', 1p, d10.3)

9001  FORMAT(/, 3x, 'it', 3x, 'nf', 2x, 'nseg', 2x, 'nact', 2x, 'sub', 2x, 'itls', &

              2x, 'stepl', 4x, 'tstep', 5x, 'projg', 8x, 'f')


      RETURN


   END SUBROUTINE prn1lb


! **************************************************************************************************

!> \brief        This subroutine prints out new information after a successful line search.

!> \param n ...

!> \param x ...

!> \param f ...

!> \param g ...

!> \param iprint ...

!> \param itfile ...

!> \param iter ...

!> \param nfgv ...

!> \param nact ...

!> \param g_inf_norm ...

!> \param nseg ...

!> \param word ...

!> \param iword ...

!> \param iback ...

!> \param stp ...

!> \param xstep ...

!> \author       NEOS, November 1994. (Latest revision June 1996.)

!>               Optimization Technology Center.

!>               Argonne National Laboratory and Northwestern University.

!>               Written by

!>                           Ciyou Zhu

!>               in collaboration with R.H. Byrd, P. Lu-Chen and J. Nocedal.

! **************************************************************************************************

   SUBROUTINE prn2lb(n, x, f, g, iprint, itfile, iter, nfgv, nact, &

                     g_inf_norm, nseg, word, iword, iback, stp, xstep)


      INTEGER, INTENT(in)                                :: n

      REAL(kind=dp), INTENT(in)                          :: x(n), f, g(n)

      INTEGER, INTENT(in)                                :: iprint, itfile, iter, nfgv, nact

      REAL(kind=dp), INTENT(in)                          :: g_inf_norm

      INTEGER, INTENT(in)                                :: nseg

      CHARACTER(LEN=3)                                   :: word

      INTEGER                                            :: iword, iback

      REAL(kind=dp)                                      :: stp, xstep


      INTEGER                                            :: i, imod


!           'word' records the status of subspace solutions.


      IF (iword == 0) THEN

!                            the subspace minimization converged.

         word = 'con'

      ELSE IF (iword == 1) THEN

!                          the subspace minimization stopped at a bound.

         word = 'bnd'

      ELSE IF (iword == 5) THEN

!                             the truncated Newton step has been used.

         word = 'TNT'

      ELSE

         word = '---'

      END IF

      IF (iprint >= 99) THEN

         WRITE (*, *) 'LINE SEARCH', iback, ' times; norm of step = ', xstep

         WRITE (*, 2001) iter, f, g_inf_norm

         IF (iprint > 100) THEN

            WRITE (*, 1004) 'X =', (x(i), i=1, n)

            WRITE (*, 1004) 'G =', (g(i), i=1, n)

         END IF

      ELSE IF (iprint > 0) THEN

         imod = mod(iter, iprint)

         IF (imod == 0) WRITE (*, 2001) iter, f, g_inf_norm

      END IF

      IF (iprint >= 1) WRITE (itfile, 3001) &

         iter, nfgv, nseg, nact, word, iback, stp, xstep, g_inf_norm, f


1004  FORMAT(/, a4, 1p, 6(1x, d11.4), /, (4x, 1p, 6(1x, d11.4)))

2001  FORMAT &

         (/, 'At iterate', i5, 4x, 'f= ', 1p, d12.5, 4x, '|proj g|= ', 1p, d12.5)

3001  FORMAT(2(1x, i4), 2(1x, i5), 2x, a3, 1x, i4, 1p, 2(2x, d7.1), 1p, 2(1x, d10.3))


      RETURN


   END SUBROUTINE prn2lb


! **************************************************************************************************

!> \brief        This subroutine prints out information when either a built-in

!>               convergence test is satisfied or when an error message is

!>               generated.

!> \param n ...

!> \param x ...

!> \param f ...

!> \param task ...

!> \param iprint ...

!> \param info ...

!> \param itfile ...

!> \param iter ...

!> \param nfgv ...

!> \param nintol ...

!> \param nskip ...

!> \param nact ...

!> \param g_inf_norm ...

!> \param time ...

!> \param nseg ...

!> \param word ...

!> \param iback ...

!> \param stp ...

!> \param xstep ...

!> \param k ...

!> \param cachyt ...

!> \param sbtime ...

!> \param lnscht ...

!> \author       NEOS, November 1994. (Latest revision June 1996.)

!>               Optimization Technology Center.

!>               Argonne National Laboratory and Northwestern University.

!>               Written by

!>                           Ciyou Zhu

!>               in collaboration with R.H. Byrd, P. Lu-Chen and J. Nocedal.

! **************************************************************************************************

   SUBROUTINE prn3lb(n, x, f, task, iprint, info, itfile, &

                     iter, nfgv, nintol, nskip, nact, g_inf_norm, &

                     time, nseg, word, iback, stp, xstep, k, &

                     cachyt, sbtime, lnscht)


      INTEGER, INTENT(in)                                :: n

      REAL(kind=dp), INTENT(in)                          :: x(n), f

      CHARACTER(LEN=60), INTENT(in)                      :: task

      INTEGER, INTENT(in)                                :: iprint, info, itfile, iter, nfgv, &

                                                            nintol, nskip, nact

      REAL(kind=dp), INTENT(in)                          :: g_inf_norm, time

      INTEGER, INTENT(in)                                :: nseg

      CHARACTER(LEN=3)                                   :: word

      INTEGER                                            :: iback

      REAL(kind=dp)                                      :: stp, xstep

      INTEGER                                            :: k

      REAL(kind=dp)                                      :: cachyt, sbtime, lnscht


      INTEGER                                            :: i


      IF (iprint >= 0 .AND. .NOT. (task(1:5) == 'ERROR')) THEN

         WRITE (*, 3003)

         WRITE (*, 3004)

         WRITE (*, 3005) n, iter, nfgv, nintol, nskip, nact, g_inf_norm, f

         IF (iprint >= 100) THEN

            WRITE (*, 1004) 'X =', (x(i), i=1, n)

         END IF

         IF (iprint >= 1) WRITE (*, *) ' F =', f

      END IF

      IF (iprint >= 0) THEN

         WRITE (*, 3009) task

         IF (info /= 0) THEN

            IF (info == -1) WRITE (*, 9011)

            IF (info == -2) WRITE (*, 9012)

            IF (info == -3) WRITE (*, 9013)

            IF (info == -4) WRITE (*, 9014)

            IF (info == -5) WRITE (*, 9015)

            IF (info == -6) WRITE (*, *) ' Input nbd(', k, ') is invalid.'

            IF (info == -7) &

               WRITE (*, *) ' l(', k, ') > u(', k, ').  No feasible solution.'

            IF (info == -8) WRITE (*, 9018)

            IF (info == -9) WRITE (*, 9019)

         END IF

         IF (iprint >= 1) WRITE (*, 3007) cachyt, sbtime, lnscht

         WRITE (*, 3008) time

         IF (iprint >= 1) THEN

            IF (info == -4 .OR. info == -9) THEN

               WRITE (itfile, 3002) &

                  iter, nfgv, nseg, nact, word, iback, stp, xstep

            END IF

            WRITE (itfile, 3009) task

            IF (info /= 0) THEN

               IF (info == -1) WRITE (itfile, 9011)

               IF (info == -2) WRITE (itfile, 9012)

               IF (info == -3) WRITE (itfile, 9013)

               IF (info == -4) WRITE (itfile, 9014)

               IF (info == -5) WRITE (itfile, 9015)

               IF (info == -8) WRITE (itfile, 9018)

               IF (info == -9) WRITE (itfile, 9019)

            END IF

            WRITE (itfile, 3008) time

         END IF

      END IF


1004  FORMAT(/, a4, 1p, 6(1x, d11.4), /, (4x, 1p, 6(1x, d11.4)))

3002  FORMAT(2(1x, i4), 2(1x, i5), 2x, a3, 1x, i4, 1p, 2(2x, d7.1), 6x, '-', 10x, '-')

3003  FORMAT(/, &

              '           * * *', /, /, &

              'Tit   = total number of iterations', /, &

              'Tnf   = total number of function evaluations', /, &

              'Tnint = total number of segments explored during', &

              ' Cauchy searches', /, &

              'Skip  = number of BFGS updates skipped', /, &

              'Nact  = number of active bounds at final generalized', &

              ' Cauchy point', /, &

              'Projg = norm of the final projected gradient', /, &

              'F     = final function value', /, /, &

              '           * * *')

3004  FORMAT(/, 3x, 'N', 4x, 'Tit', 5x, 'Tnf', 2x, 'Tnint', 2x, &

              'Skip', 2x, 'Nact', 5x, 'Projg', 8x, 'F')

3005  FORMAT(i5, 2(1x, i6), (1x, i6), (2x, i4), (1x, i5), 1p, 2(2x, d10.3))

3007  FORMAT(/, ' Cauchy                time', 1p, e10.3, ' seconds.', / &

              ' Subspace minimization time', 1p, e10.3, ' seconds.', / &

              ' Line search           time', 1p, e10.3, ' seconds.')

3008  FORMAT(/, ' Total User time', 1p, e10.3, ' seconds.',/)

3009  FORMAT(/, a60)

9011  FORMAT(/, &

              ' Matrix in 1st Cholesky factorization in formk is not Pos. Def.')

9012  FORMAT(/, &

              ' Matrix in 2st Cholesky factorization in formk is not Pos. Def.')

9013  FORMAT(/, &

              ' Matrix in the Cholesky factorization in formt is not Pos. Def.')

9014  FORMAT(/, &

              ' Derivative >= 0, backtracking line search impossible.', /, &

              '   Previous x, f and g restored.', /, &

              ' Possible causes: 1 error in function or gradient evaluation;', /, &

              '                  2 rounding errors dominate computation.')

9015  FORMAT(/, &

              ' Warning:  more than 10 function and gradient', /, &

              '   evaluations in the last line search.  Termination', /, &

              '   may possibly be caused by a bad search direction.')

9018  FORMAT(/, ' The triangular system is singular.')

9019  FORMAT(/, &

              ' Line search cannot locate an adequate point after 20 function', /, &

              '  and gradient evaluations.  Previous x, f and g restored.', /, &

              ' Possible causes: 1 error in function or gradient evaluation;', /, &

              '                  2 rounding error dominate computation.')


      RETURN


   END SUBROUTINE prn3lb


! **************************************************************************************************

!> \brief        This subroutine computes the infinity norm of the projected  gradient.

!> \param n ...

!> \param lower_bound  the lower bound on x.

!> \param upper_bound  the upper bound on x.

!> \param nbd ...

!> \param x ...

!> \param g ...

!> \param g_inf_norm ...

!> \author       NEOS, November 1994. (Latest revision June 1996.)

!>               Optimization Technology Center.

!>               Argonne National Laboratory and Northwestern University.

!>               Written by

!>                           Ciyou Zhu

!>               in collaboration with R.H. Byrd, P. Lu-Chen and J. Nocedal.

! **************************************************************************************************

   SUBROUTINE projgr(n, lower_bound, upper_bound, nbd, x, g, g_inf_norm)


      INTEGER, INTENT(in)                                :: n

      REAL(kind=dp), INTENT(in)                          :: lower_bound(n), upper_bound(n)

      INTEGER, INTENT(in)                                :: nbd(n)

      REAL(kind=dp), INTENT(in)                          :: x(n), g(n)

      REAL(kind=dp)                                      :: g_inf_norm


      REAL(kind=dp), PARAMETER                           :: zero = 0.0_dp


      INTEGER                                            :: i

      REAL(kind=dp)                                      :: gi


      g_inf_norm = zero

      DO i = 1, n

         gi = g(i)

         IF (nbd(i) /= 0) THEN

            IF (gi < zero) THEN

               IF (nbd(i) >= 2) gi = max((x(i) - upper_bound(i)), gi)

            ELSE

               IF (nbd(i) <= 2) gi = min((x(i) - lower_bound(i)), gi)

            END IF

         END IF

         g_inf_norm = max(g_inf_norm, abs(gi))

      END DO


      RETURN


   END SUBROUTINE projgr


! **************************************************************************************************

!> \brief        This routine contains the major changes in the updated version.

!>               The changes are described in the accompanying paper

!>

!>               Jose Luis Morales, Jorge Nocedal

!>               "Remark On Algorithm 788: L-BFGS-B: Fortran Subroutines for Large

!>               Bound Constrained Optimization". Decemmber 27, 2010.

!>

!>               J.L. Morales  Departamento de Matematicas,

!>                             Instituto Tecnologico Autonomo de Mexico

!>                             Mexico D.F.

!>

!>               J, Nocedal    Department of Electrical Engineering and

!>                            Computer Science.

!>                             Northwestern University. Evanston, IL. USA

!>

!>                             January 17, 2011

!>

!>      *****************************************************************

!>

!>               Given xcp, l, u, r, an index set that specifies

!>               the active set at xcp, and an l-BFGS matrix B

!>               (in terms of WY, WS, SY, WT, head, col, and theta),

!>               this subroutine computes an approximate solution

!>               of the subspace problem

!>

!>               (P)   min Q(x) = r'(x-xcp) + 1/2 (x-xcp)' B (x-xcp)

!>

!>               subject to l<=x<=u

!>                       x_i=xcp_i for all i in A(xcp)

!>

!>               along the subspace unconstrained Newton direction

!>

!>               d = -(Z'BZ)^(-1) r.

!>

!>               The formula for the Newton direction, given the L-BFGS matrix

!>               and the Sherman-Morrison formula, is

!>

!>               d = (1/theta)r + (1/theta*2) Z'WK^(-1)W'Z r.

!>

!>               where

!>                 K = [-D -Y'ZZ'Y/theta     L_a'-R_z'  ]

!>                     [L_a -R_z           theta*S'AA'S ]

!>

!>               Note that this procedure for computing d differs

!>               from that described in [1]. One can show that the matrix K is

!>               equal to the matrix M^[-1]N in that paper.

!> \param n      n is the dimension of the problem.

!> \param m      m is the maximum number of variable metric corrections

!>               used to define the limited memory matrix.

!> \param nsub   nsub is the number of free variables.

!> \param ind    ind specifies the coordinate indices of free variables.

!> \param lower_bound  the lower bound on x.

!> \param upper_bound  the upper bound on x.

!> \param nbd    nbd represents the type of bounds imposed on the

!>               variables, and must be specified as follows:

!>               nbd(i)=0 if x(i) is unbounded,

!>                      1 if x(i) has only a lower bound,

!>                      2 if x(i) has both lower and upper bounds, and

!>                      3 if x(i) has only an upper bound.

!> \param x      x is a double precision array of dimension n.

!>               On entry x specifies the Cauchy point xcp.

!>               On exit x(i) is the minimizer of Q over the subspace of free variables.

!> \param d      On entry d is the reduced gradient of Q at xcp.

!>               On exit d is the Newton direction of Q.

!> \param xp     xp is a double precision array of dimension n.

!>               used to safeguard the projected Newton direction

!> \param ws     ws and wy are double precision arrays;

!>               On entry they store the information defining the limited memory BFGS matrix:

!>               ws(n,m) stores S, a set of s-vectors;

!> \param wy     wy(n,m) stores Y, a set of y-vectors;

!> \param theta  theta is the scaling factor specifying B_0 = theta I;

!> \param xx     xx holds the current iterate

!> \param gg     gg holds the gradient at the current iterate

!> \param col    is the number of variable metric corrections stored;

!> \param head   head is the location of the 1st s- (or y-) vector in S (or Y).

!> \param iword  iword specifies the status of the subspace solution.

!>               iword = 0 if the solution is in the box,

!>                       1 if some bound is encountered.

!> \param wv     wv is a working array

!> \param wn     the upper triangle of wn stores the LEL^T factorization

!>               of the indefinite matrix

!>

!>               K = [-D -Y'ZZ'Y/theta     L_a'-R_z'  ]

!>                   [L_a -R_z           theta*S'AA'S ]

!>               where E = [-I  0]

!>                         [ 0  I]

!> \param iprint iprint is an INTEGER variable that must be set by the user.

!>               It controls the frequency and type of output generated:

!>               iprint<0    no output is generated;

!>               iprint=0    print only one line at the last iteration;

!>               0<iprint<99 print also f and |proj g| every iprint iterations;

!>               iprint=99   print details of every iteration except n-vectors;

!>               iprint=100  print also the changes of active set and final x;

!>               iprint>100  print details of every iteration including x and g;

!>               When iprint > 0, the file iterate.dat will be created to summarize the iteration.

!> \param info   info = 0       for normal return,

!>                    = nonzero for abnormal return when the matrix K is ill-conditioned.

!> \author       NEOS, November 1994. (Latest revision June 1996.)

!>               Optimization Technology Center.

!>               Argonne National Laboratory and Northwestern University.

!>               Written by

!>                           Ciyou Zhu

!>               in collaboration with R.H. Byrd, P. Lu-Chen and J. Nocedal.

! **************************************************************************************************

   SUBROUTINE subsm(n, m, nsub, ind, lower_bound, upper_bound, nbd, x, d, xp, ws, wy, &

                    theta, xx, gg, &

                    col, head, iword, wv, wn, iprint, info)

      INTEGER, INTENT(in)                                :: n, m, nsub, ind(nsub)

      REAL(kind=dp), INTENT(in)                          :: lower_bound(n), upper_bound(n)

      INTEGER, INTENT(in)                                :: nbd(n)

      REAL(kind=dp), INTENT(inout)                       :: x(n), d(n)

      REAL(kind=dp)                                      :: xp(n)

      REAL(kind=dp), INTENT(in)                          :: ws(n, m), wy(n, m), theta, xx(n), gg(n)

      INTEGER, INTENT(in)                                :: col, head

      INTEGER, INTENT(out)                               :: iword

      REAL(kind=dp)                                      :: wv(2*m)

      REAL(kind=dp), INTENT(in)                          :: wn(2*m, 2*m)

      INTEGER                                            :: iprint

      INTEGER, INTENT(out)                               :: info


      REAL(kind=dp), PARAMETER                           :: one = 1.0_dp, zero = 0.0_dp


      INTEGER                                            :: col2, i, ibd, j, js, jy, k, m2, pointr

      REAL(kind=dp)                                      :: alpha, dd_p, dk, temp1, temp2, xk


!     References:

!

!       [1] R. H. Byrd, P. Lu, J. Nocedal and C. Zhu, ``A limited

!       memory algorithm for bound constrained optimization'',

!       SIAM J. Scientific Computing 16 (1995), no. 5, pp. 1190--1208.

!

!

!

!                           *  *  *

!


      IF (nsub <= 0) RETURN

      IF (iprint >= 99) WRITE (*, 1001)


!     Compute wv = W'Zd.


      pointr = head

      DO i = 1, col

         temp1 = zero

         temp2 = zero

         DO j = 1, nsub

            k = ind(j)

            temp1 = temp1 + wy(k, pointr)*d(j)

            temp2 = temp2 + ws(k, pointr)*d(j)

         END DO

         wv(i) = temp1

         wv(col + i) = theta*temp2

         pointr = mod(pointr, m) + 1

      END DO


!     Compute wv:=K^(-1)wv.


      m2 = 2*m

      col2 = 2*col

      CALL dtrsl(wn, m2, col2, wv, 11, info)

      IF (info /= 0) RETURN

      DO i = 1, col

         wv(i) = -wv(i)

      END DO

      CALL dtrsl(wn, m2, col2, wv, 01, info)

      IF (info /= 0) RETURN


!     Compute d = (1/theta)d + (1/theta**2)Z'W wv.


      pointr = head

      DO jy = 1, col

         js = col + jy

         DO i = 1, nsub

            k = ind(i)

            d(i) = d(i) + wy(k, pointr)*wv(jy)/theta                     &

     &                  + ws(k, pointr)*wv(js)

         END DO

         pointr = mod(pointr, m) + 1

      END DO


      CALL dscal(nsub, one/theta, d, 1)

!

!-----------------------------------------------------------------

!     Let us try the projection, d is the Newton direction


      iword = 0


      CALL dcopy(n, x, 1, xp, 1)

!

      DO i = 1, nsub

         k = ind(i)

         dk = d(i)

         xk = x(k)

         IF (nbd(k) /= 0) THEN

!

            ! lower bounds only

            IF (nbd(k) .EQ. 1) THEN

               x(k) = max(lower_bound(k), xk + dk)

               IF (x(k) .EQ. lower_bound(k)) iword = 1

            ELSE

!

               ! upper and lower bounds

               IF (nbd(k) .EQ. 2) THEN

                  xk = max(lower_bound(k), xk + dk)

                  x(k) = min(upper_bound(k), xk)

                  IF (x(k) .EQ. lower_bound(k) .OR. x(k) .EQ. upper_bound(k)) iword = 1

               ELSE

!

                  ! upper bounds only

                  IF (nbd(k) .EQ. 3) THEN

                     x(k) = min(upper_bound(k), xk + dk)

                     IF (x(k) .EQ. upper_bound(k)) iword = 1

                  END IF

               END IF

            END IF

!

            ! free variables

         ELSE

            x(k) = xk + dk

         END IF

      END DO

!

      IF (.NOT. (iword .EQ. 0)) THEN

!

!     check sign of the directional derivative

!

         dd_p = zero

         DO i = 1, n

            dd_p = dd_p + (x(i) - xx(i))*gg(i)

         END DO

         IF (dd_p .GT. zero) THEN

            CALL dcopy(n, xp, 1, x, 1)

            IF (iprint > 0) WRITE (*, *) ' Positive dir derivative in projection '

            IF (iprint > 0) WRITE (*, *) ' Using the backtracking step '

            alpha = one

            temp1 = alpha

            ibd = 0

            DO i = 1, nsub

               k = ind(i)

               dk = d(i)

               IF (nbd(k) /= 0) THEN

                  IF (dk < zero .AND. nbd(k) <= 2) THEN

                     temp2 = lower_bound(k) - x(k)

                     IF (temp2 >= zero) THEN

                        temp1 = zero

                     ELSE IF (dk*alpha < temp2) THEN

                        temp1 = temp2/dk

                     END IF

                  ELSE IF (dk > zero .AND. nbd(k) >= 2) THEN

                     temp2 = upper_bound(k) - x(k)

                     IF (temp2 <= zero) THEN

                        temp1 = zero

                     ELSE IF (dk*alpha > temp2) THEN

                        temp1 = temp2/dk

                     END IF

                  END IF

                  IF (temp1 < alpha) THEN

                     alpha = temp1

                     ibd = i

                  END IF

               END IF

            END DO


            IF (alpha < one) THEN

               dk = d(ibd)

               k = ind(ibd)

               IF (dk > zero) THEN

                  x(k) = upper_bound(k)

                  d(ibd) = zero

               ELSE IF (dk < zero) THEN

                  x(k) = lower_bound(k)

                  d(ibd) = zero

               END IF

            END IF

            DO i = 1, nsub

               k = ind(i)

               x(k) = x(k) + alpha*d(i)

            END DO

         END IF

      END IF


      IF (iprint >= 99) WRITE (*, 1004)


1001  FORMAT(/, '----------------SUBSM entered-----------------',/)

1004  FORMAT(/, '----------------exit SUBSM --------------------',/)


      RETURN


   END SUBROUTINE subsm


! **************************************************************************************************

!> \brief         This subroutine finds a step that satisfies a sufficient

!>                decrease condition and a curvature condition.

!>

!>                Each call of the subroutine updates an interval with

!>                endpoints stx and sty. The interval is initially chosen

!>                so that it contains a minimizer of the modified function

!>

!>                      psi(stp) = f(stp) - f(0) - ftol*stp*f'(0).

!>

!>                If psi(stp) <= 0 and f'(stp) >= 0 for some step, then the

!>                interval is chosen so that it contains a minimizer of f.

!>

!>                The algorithm is designed to find a step that satisfies

!>                the sufficient decrease condition

!>

!>                f(stp) <= f(0) + ftol*stp*f'(0),

!>

!>                and the curvature condition

!>

!>                abs(f'(stp)) <= gtol*abs(f'(0)).

!>

!>                If ftol is less than gtol and if, for example, the function

!>                is bounded below, then there is always a step which satisfies

!>                both conditions.

!>

!>                If no step can be found that satisfies both conditions, then

!>                the algorithm stops with a warning. In this case stp only

!>                satisfies the sufficient decrease condition.

!>

!>                A typical invocation of dcsrch has the following outline:

!>

!>                task = 'START'

!>                DO WHILE (.TRUE.)

!>                   call dcsrch( ... )

!>                   if (task .eq. 'FG') then

!>                      Evaluate the function and the gradient at stp

!>                   else

!>                      exit

!>                   end if

!>                END DO

!> \param f       On initial entry f is the value of the function at 0.

!>                On subsequent entries f is the value of the

!>                function at stp.

!>                On exit f is the value of the function at stp.

!> \param g       On initial entry g is the derivative of the function at 0.

!>                On subsequent entries g is the derivative of the

!>                function at stp.

!>                On exit g is the derivative of the function at stp.

!> \param stp     On entry stp is the current estimate of a satisfactory

!>                step. On initial entry, a positive initial estimate

!>                must be provided.

!>                On exit stp is the current estimate of a satisfactory step

!>                if task = 'FG'. If task = 'CONV' then stp satisfies

!>                the sufficient decrease and curvature condition.

!> \param ftol    ftol specifies a nonnegative tolerance for the

!>                sufficient decrease condition.

!> \param gtol    gtol specifies a nonnegative tolerance for the

!>                curvature condition.

!> \param xtol    xtol specifies a nonnegative relative tolerance

!>                for an acceptable step. The subroutine exits with a

!>                warning if the relative difference between sty and stx

!>                is less than xtol.

!> \param stpmin  stpmin is a nonnegative lower bound for the step.

!> \param stpmax  stpmax is a nonnegative upper bound for the step.

!> \param task    task is a character variable of length at least 60.

!>                On initial entry task must be set to 'START'.

!>                On exit task indicates the required action:

!>

!>                If task(1:2) = 'FG' then evaluate the function and

!>                derivative at stp and call dcsrch again.

!>

!>                If task(1:4) = 'CONV' then the search is successful.

!>

!>                If task(1:4) = 'WARN' then the subroutine is not able

!>                to satisfy the convergence conditions. The exit value of

!>                stp contains the best point found during the search.

!>

!>                If task(1:5) = 'ERROR' then there is an error in the

!>                input arguments.

!>

!>                On exit with convergence, a warning or an error, the

!>                variable task contains additional information.

!> \param isave   is work array

!> \param dsave   is a work array

! **************************************************************************************************

   SUBROUTINE dcsrch(f, g, stp, ftol, gtol, xtol, stpmin, stpmax, &

                     task, isave, dsave)

      REAL(kind=dp)                                      :: f, g

      REAL(kind=dp), INTENT(inout)                       :: stp

      REAL(kind=dp)                                      :: ftol, gtol, xtol, stpmin, stpmax

      CHARACTER(LEN=*)                                   :: task

      INTEGER                                            :: isave(2)

      REAL(kind=dp)                                      :: dsave(13)


      REAL(kind=dp), PARAMETER                           :: p5 = 0.5_dp, p66 = 0.66_dp, &

                                                            xtrapl = 1.1_dp, xtrapu = 4.0_dp, &

                                                            zero = 0.0_dp


      INTEGER                                            :: stage

      LOGICAL                                            :: brackt

      REAL(kind=dp)                                      :: finit, fm, ftest, fx, fxm, fy, fym, &

                                                            ginit, gm, gtest, gx, gxm, gy, gym, &

                                                            stmax, stmin, stx, sty, width, width1


!

!     NOTE: The user must no alter work arrays between calls.

!

!

!     MINPACK-1 Project. June 1983.

!     Argonne National Laboratory.

!     Jorge J. More' and David J. Thuente.

!

!     MINPACK-2 Project. October 1993.

!     Argonne National Laboratory and University of Minnesota.

!     Brett M. Averick, Richard G. Carter, and Jorge J. More'.

!

!     **********

!     Initialization block.


      IF (task(1:5) == 'START') THEN


!        Check the input arguments for errors.


         IF (stp < stpmin) task = 'ERROR: STP < STPMIN'

         IF (stp > stpmax) task = 'ERROR: STP > STPMAX'

         IF (g >= zero) task = 'ERROR: INITIAL G >= ZERO'

         IF (ftol < zero) task = 'ERROR: FTOL < ZERO'

         IF (gtol < zero) task = 'ERROR: GTOL < ZERO'

         IF (xtol < zero) task = 'ERROR: XTOL < ZERO'

         IF (stpmin < zero) task = 'ERROR: STPMIN < ZERO'

         IF (stpmax < stpmin) task = 'ERROR: STPMAX < STPMIN'


!        Exit if there are errors on input.


         IF (task(1:5) == 'ERROR') RETURN


!        Initialize local variables.


         brackt = .false.

         stage = 1

         finit = f

         ginit = g

         gtest = ftol*ginit

         width = stpmax - stpmin

         width1 = width/p5


!        The variables stx, fx, gx contain the values of the step,

!        function, and derivative at the best step.

!        The variables sty, fy, gy contain the value of the step,

!        function, and derivative at sty.

!        The variables stp, f, g contain the values of the step,

!        function, and derivative at stp.


         stx = zero

         fx = finit

         gx = ginit

         sty = zero

         fy = finit

         gy = ginit

         stmin = zero

         stmax = stp + xtrapu*stp

         task = 'FG'


      ELSE


!        Restore local variables.


         IF (isave(1) == 1) THEN

            brackt = .true.

         ELSE

            brackt = .false.

         END IF

         stage = isave(2)

         ginit = dsave(1)

         gtest = dsave(2)

         gx = dsave(3)

         gy = dsave(4)

         finit = dsave(5)

         fx = dsave(6)

         fy = dsave(7)

         stx = dsave(8)

         sty = dsave(9)

         stmin = dsave(10)

         stmax = dsave(11)

         width = dsave(12)

         width1 = dsave(13)


!        If psi(stp) <= 0 and f'(stp) >= 0 for some step, then the

!        algorithm enters the second stage.


         ftest = finit + stp*gtest

         IF (stage == 1 .AND. f <= ftest .AND. g >= zero) &

            stage = 2


!        Test for warnings.


         IF (brackt .AND. (stp <= stmin .OR. stp >= stmax)) &

            task = 'WARNING: ROUNDING ERRORS PREVENT PROGRESS'

         IF (brackt .AND. stmax - stmin <= xtol*stmax) &

            task = 'WARNING: XTOL TEST SATISFIED'

         IF (stp == stpmax .AND. f <= ftest .AND. g <= gtest) &

            task = 'WARNING: STP = STPMAX'

         IF (stp == stpmin .AND. (f > ftest .OR. g >= gtest)) &

            task = 'WARNING: STP = STPMIN'


!        Test for convergence.


         IF (f <= ftest .AND. abs(g) <= gtol*(-ginit)) &

            task = 'CONVERGENCE'


!        Test for termination.


         IF (.NOT. (task(1:4) == 'WARN' .OR. task(1:4) == 'CONV')) THEN


!        A modified function is used to predict the step during the

!        first stage if a lower function value has been obtained but

!        the decrease is not sufficient.


            IF (stage == 1 .AND. f <= fx .AND. f > ftest) THEN


!             Define the modified function and derivative values.


               fm = f - stp*gtest

               fxm = fx - stx*gtest

               fym = fy - sty*gtest

               gm = g - gtest

               gxm = gx - gtest

               gym = gy - gtest


!             Call dcstep to update stx, sty, and to compute the new step.


               CALL dcstep(stx, fxm, gxm, sty, fym, gym, stp, fm, gm, &

                           brackt, stmin, stmax)


!             Reset the function and derivative values for f.


               fx = fxm + stx*gtest

               fy = fym + sty*gtest

               gx = gxm + gtest

               gy = gym + gtest


            ELSE


!             Call dcstep to update stx, sty, and to compute the new step.


               CALL dcstep(stx, fx, gx, sty, fy, gy, stp, f, g, &

                           brackt, stmin, stmax)


            END IF


!          Decide if a bisection step is needed.


            IF (brackt) THEN

               IF (abs(sty - stx) >= p66*width1) stp = stx + p5*(sty - stx)

               width1 = width

               width = abs(sty - stx)

            END IF


!          Set the minimum and maximum steps allowed for stp.


            IF (brackt) THEN

               stmin = min(stx, sty)

               stmax = max(stx, sty)

            ELSE

               stmin = stp + xtrapl*(stp - stx)

               stmax = stp + xtrapu*(stp - stx)

            END IF


!          Force the step to be within the bounds stpmax and stpmin.


            stp = max(stp, stpmin)

            stp = min(stp, stpmax)


!          If further progress is not possible, let stp be the best

!          point obtained during the search.


            IF (brackt .AND. (stp <= stmin .OR. stp >= stmax) &

                .OR. (brackt .AND. stmax - stmin <= xtol*stmax)) stp = stx


!          Obtain another function and derivative.


            task = 'FG'


         END IF

      END IF


!     Save local variables.


      IF (brackt) THEN

         isave(1) = 1

      ELSE

         isave(1) = 0

      END IF

      isave(2) = stage

      dsave(1) = ginit

      dsave(2) = gtest

      dsave(3) = gx

      dsave(4) = gy

      dsave(5) = finit

      dsave(6) = fx

      dsave(7) = fy

      dsave(8) = stx

      dsave(9) = sty

      dsave(10) = stmin

      dsave(11) = stmax

      dsave(12) = width

      dsave(13) = width1


      RETURN

   END SUBROUTINE dcsrch


! **************************************************************************************************

!> \brief          This subroutine computes a safeguarded step for a search

!>                 procedure and updates an interval that contains a step that

!>                 satisfies a sufficient decrease and a curvature condition.

!>

!>                 The parameter stx contains the step with the least function

!>                 value. If brackt is set to .true. then a minimizer has

!>                 been bracketed in an interval with endpoints stx and sty.

!>                 The parameter stp contains the current step.

!>                 The subroutine assumes that if brackt is set to .true. then

!>

!>                    min(stx,sty) < stp < max(stx,sty),

!>

!>                 and that the derivative at stx is negative in the direction

!>                 of the step.

!> \param stx      On entry stx is the best step obtained so far and is an

!>                 endpoint of the interval that contains the minimizer.

!>                 On exit stx is the updated best step.

!> \param fx       fx is the function at stx.

!> \param dx       On entry dx is the derivative of the function at

!>                 stx. The derivative must be negative in the direction of

!>                 the step, that is, dx and stp - stx must have opposite

!>                 signs.

!>                 On exit dx is the derivative of the function at stx.

!> \param sty      On entry sty is the second endpoint of the interval that

!>                 contains the minimizer.

!>                 On exit sty is the updated endpoint of the interval that

!>                 contains the minimizer.

!> \param fy       fy is the function at sty.

!> \param dy       On entry dy is the derivative of the function at sty.

!>                 On exit dy is the derivative of the function at the exit sty.

!> \param stp      On entry stp is the current step. If brackt is set to .true.

!>                 then on input stp must be between stx and sty.

!>                 On exit stp is a new trial step.

!> \param fp       fp is the function at stp

!> \param dp_loc   dp_loc is the the derivative of the function at stp.

!> \param brackt   On entry brackt specifies if a minimizer has been bracketed.

!>                 Initially brackt must be set to .false.

!>                 On exit brackt specifies if a minimizer has been bracketed.

!>                 When a minimizer is bracketed brackt is set to .true.

!> \param stpmin   stpmin is a lower bound for the step.

!> \param stpmax   stpmax is an upper bound for the step.

! **************************************************************************************************

   SUBROUTINE dcstep(stx, fx, dx, sty, fy, dy, stp, fp, dp_loc, brackt, &

                     stpmin, stpmax)

      REAL(kind=dp), INTENT(inout)                       :: stx, fx, dx, sty, fy, dy, stp

      REAL(kind=dp), INTENT(in)                          :: fp, dp_loc

      LOGICAL, INTENT(inout)                             :: brackt

      REAL(kind=dp), INTENT(in)                          :: stpmin, stpmax


      REAL(kind=dp), PARAMETER                           :: p66 = 0.66_dp, three = 3.0_dp, &

                                                            two = 2.0_dp, zero = 0.0_dp


      REAL(kind=dp)                                      :: gamma, p, q, r, s, sgnd, stpc, stpf, &

                                                            stpq, theta


!

!     MINPACK-1 Project. June 1983

!     Argonne National Laboratory.

!     Jorge J. More' and David J. Thuente.

!

!     MINPACK-2 Project. October 1993.

!     Argonne National Laboratory and University of Minnesota.

!     Brett M. Averick and Jorge J. More'.

!

!     **********


      sgnd = dp_loc*sign(1.0_dp, dx)


!     First case: A higher function value. The minimum is bracketed.

!     If the cubic step is closer to stx than the quadratic step, the

!     cubic step is taken, otherwise the average of the cubic and

!     quadratic steps is taken.


      IF (fp > fx) THEN

         theta = three*(fx - fp)/(stp - stx) + dx + dp_loc

         s = max(abs(theta), abs(dx), abs(dp_loc))

         gamma = s*sqrt((theta/s)**2 - (dx/s)*(dp_loc/s))

         IF (stp < stx) gamma = -gamma

         p = (gamma - dx) + theta

         q = ((gamma - dx) + gamma) + dp_loc

         r = p/q

         stpc = stx + r*(stp - stx)

         stpq = stx + ((dx/((fx - fp)/(stp - stx) + dx))/two)*          &

     &                                                       (stp - stx)

         IF (abs(stpc - stx) < abs(stpq - stx)) THEN

            stpf = stpc

         ELSE

            stpf = stpc + (stpq - stpc)/two

         END IF

         brackt = .true.


!     Second case: A lower function value and derivatives of opposite

!     sign. The minimum is bracketed. If the cubic step is farther from

!     stp than the secant step, the cubic step is taken, otherwise the

!     secant step is taken.


      ELSE IF (sgnd < zero) THEN

         theta = three*(fx - fp)/(stp - stx) + dx + dp_loc

         s = max(abs(theta), abs(dx), abs(dp_loc))

         gamma = s*sqrt((theta/s)**2 - (dx/s)*(dp_loc/s))

         IF (stp > stx) gamma = -gamma

         p = (gamma - dp_loc) + theta

         q = ((gamma - dp_loc) + gamma) + dx

         r = p/q

         stpc = stp + r*(stx - stp)

         stpq = stp + (dp_loc/(dp_loc - dx))*(stx - stp)

         IF (abs(stpc - stp) > abs(stpq - stp)) THEN

            stpf = stpc

         ELSE

            stpf = stpq

         END IF

         brackt = .true.


!     Third case: A lower function value, derivatives of the same sign,

!     and the magnitude of the derivative decreases.


      ELSE IF (abs(dp_loc) < abs(dx)) THEN


!        The cubic step is computed only if the cubic tends to infinity

!        in the direction of the step or if the minimum of the cubic

!        is beyond stp. Otherwise the cubic step is defined to be the

!        secant step.


         theta = three*(fx - fp)/(stp - stx) + dx + dp_loc

         s = max(abs(theta), abs(dx), abs(dp_loc))


!        The case gamma = 0 only arises if the cubic does not tend

!        to infinity in the direction of the step.


         gamma = s*sqrt(max(zero, (theta/s)**2 - (dx/s)*(dp_loc/s)))

         IF (stp > stx) gamma = -gamma

         p = (gamma - dp_loc) + theta

         q = (gamma + (dx - dp_loc)) + gamma

         r = p/q

         IF (r < zero .AND. gamma /= zero) THEN

            stpc = stp + r*(stx - stp)

         ELSE IF (stp > stx) THEN

            stpc = stpmax

         ELSE

            stpc = stpmin

         END IF

         stpq = stp + (dp_loc/(dp_loc - dx))*(stx - stp)


         IF (brackt) THEN


!           A minimizer has been bracketed. If the cubic step is

!           closer to stp than the secant step, the cubic step is

!           taken, otherwise the secant step is taken.


            IF (abs(stpc - stp) < abs(stpq - stp)) THEN

               stpf = stpc

            ELSE

               stpf = stpq

            END IF

            IF (stp > stx) THEN

               stpf = min(stp + p66*(sty - stp), stpf)

            ELSE

               stpf = max(stp + p66*(sty - stp), stpf)

            END IF

         ELSE


!           A minimizer has not been bracketed. If the cubic step is

!           farther from stp than the secant step, the cubic step is

!           taken, otherwise the secant step is taken.


            IF (abs(stpc - stp) > abs(stpq - stp)) THEN

               stpf = stpc

            ELSE

               stpf = stpq

            END IF

            stpf = min(stpmax, stpf)

            stpf = max(stpmin, stpf)

         END IF


!     Fourth case: A lower function value, derivatives of the same sign,

!     and the magnitude of the derivative does not decrease. If the

!     minimum is not bracketed, the step is either stpmin or stpmax,

!     otherwise the cubic step is taken.


      ELSE

         IF (brackt) THEN

            theta = three*(fp - fy)/(sty - stp) + dy + dp_loc

            s = max(abs(theta), abs(dy), abs(dp_loc))

            gamma = s*sqrt((theta/s)**2 - (dy/s)*(dp_loc/s))

            IF (stp > sty) gamma = -gamma

            p = (gamma - dp_loc) + theta

            q = ((gamma - dp_loc) + gamma) + dy

            r = p/q

            stpc = stp + r*(sty - stp)

            stpf = stpc

         ELSE IF (stp > stx) THEN

            stpf = stpmax

         ELSE

            stpf = stpmin

         END IF

      END IF


!     Update the interval which contains a minimizer.


      IF (fp > fx) THEN

         sty = stp

         fy = fp

         dy = dp_loc

      ELSE

         IF (sgnd < zero) THEN

            sty = stx

            fy = fx

            dy = dx

         END IF

         stx = stp

         fx = fp

         dx = dp_loc

      END IF


!     Compute the new step.


      stp = stpf


      RETURN

   END SUBROUTINE dcstep


!MK LINPACK


! **************************************************************************************************

!> \brief         factors a double precision symmetric positive definite

!>                matrix.

!>

!>                dpofa is usually called by dpoco, but it can be called

!>                directly with a saving in time if  rcond  is not needed.

!>                (time for dpoco) = (1 + 18/n)*(time for dpofa) .

!> \param a       the symmetric matrix to be factored.  only the

!>                diagonal and upper triangle are used.

!>                on return

!>                an upper triangular matrix  r  so that  a = trans(r)*r

!>                where  trans(r)  is the transpose.

!>                the strict lower triangle is unaltered.

!>                if  info .ne. 0 , the factorization is not complete.

!> \param lda     the leading dimension of the array  a .

!> \param n       the order of the matrix  a .

!> \param info    = 0  for normal return.

!>                = k  signals an error condition.  the leading minor

!>                     of order  k  is not positive definite.

! **************************************************************************************************

   SUBROUTINE dpofa(a, lda, n, info)

      INTEGER, INTENT(in)                                :: lda

      REAL(kind=dp)                                      :: a(lda, *)

      INTEGER, INTENT(in)                                :: n

      INTEGER                                            :: info


      INTEGER                                            :: j, jm1, k

      REAL(kind=dp)                                      :: ddot, s, t


!

!     linpack.  this version dated 08/14/78 .

!     cleve moler, university of new mexico, argonne national lab.

!

!     begin block with ...exits to 40

!

!


      DO j = 1, n

         info = j

         s = 0.0_dp

         jm1 = j - 1

         IF (.NOT. (jm1 < 1)) THEN

            DO k = 1, jm1

               t = a(k, j) - ddot(k - 1, a(1, k), 1, a(1, j), 1)

               t = t/a(k, k)

               a(k, j) = t

               s = s + t*t

            END DO

         END IF

         s = a(j, j) - s

!     ......exit

         IF (s <= 0.0_dp) EXIT

         a(j, j) = sqrt(s)

         info = 0

      END DO

      RETURN

   END SUBROUTINE dpofa


! **************************************************************************************************

!> \brief           dtrsl solves systems of the form

!>

!>                  t * x = b

!>                  or

!>                  trans(t) * x = b

!>

!>                  where t is a triangular matrix of order n. here trans(t)

!>                  denotes the transpose of the matrix t.

!> \param t         t contains the matrix of the system. the zero

!>                  elements of the matrix are not referenced, and

!>                  the corresponding elements of the array can be

!>                  used to store other information.

!> \param ldt       ldt is the leading dimension of the array t.

!> \param n         n is the order of the system.

!> \param b         contains the right hand side of the system.

!>                  on return

!>                  b contains the solution, if info .eq. 0.

!>                  otherwise b is unaltered.

!> \param job       job specifies what kind of system is to be solved.

!>                   if job is

!>                       00   solve t*x=b, t lower triangular,

!>                       01   solve t*x=b, t upper triangular,

!>                       10   solve trans(t)*x=b, t lower triangular,

!>                       11   solve trans(t)*x=b, t upper triangular.

!> \param info      on return

!>                  info contains zero if the system is nonsingular.

!>                  otherwise info contains the index of

!>                  the first zero diagonal element of t.

! **************************************************************************************************

   SUBROUTINE dtrsl(t, ldt, n, b, job, info)

      INTEGER, INTENT(in)                                :: ldt

      REAL(kind=dp), INTENT(in)                          :: t(ldt, *)

      INTEGER, INTENT(in)                                :: n

      REAL(kind=dp), INTENT(inout)                       :: b(*)

      INTEGER, INTENT(in)                                :: job

      INTEGER, INTENT(out)                               :: info


      INTEGER                                            :: case, j, jj

      REAL(kind=dp)                                      :: ddot, temp


!     linpack. this version dated 08/14/78 .

!     g. w. stewart, university of maryland, argonne national lab.

!

!     begin block permitting ...exits to 150

!

!        check for zero diagonal elements.

!


      DO info = 1, n

!     ......exit

         IF (t(info, info) == 0.0_dp) RETURN

      END DO

      info = 0

!

!        determine the task and go to it.

!

      CASE = 1

      IF (mod(job, 10) /= 0) CASE = 2

      IF (mod(job, 100)/10 /= 0) CASE = CASE + 2


      SELECT CASE (case)

      CASE (1)

!

!        solve t*x=b for t lower triangular

!

         b(1) = b(1)/t(1, 1)

         IF (n > 1) THEN

            DO j = 2, n

               temp = -b(j - 1)

               CALL daxpy(n - j + 1, temp, t(j, j - 1), 1, b(j), 1)

               b(j) = b(j)/t(j, j)

            END DO

         END IF

      CASE (2)

!

!        solve t*x=b for t upper triangular.

!

         b(n) = b(n)/t(n, n)

         IF (n > 1) THEN

            DO jj = 2, n

               j = n - jj + 1

               temp = -b(j + 1)

               CALL daxpy(j, temp, t(1, j + 1), 1, b(1), 1)

               b(j) = b(j)/t(j, j)

            END DO

         END IF

      CASE (3)

!

!        solve trans(t)*x=b for t lower triangular.

!

         b(n) = b(n)/t(n, n)

         IF (n > 1) THEN

            DO jj = 2, n

               j = n - jj + 1

               b(j) = b(j) - ddot(jj - 1, t(j + 1, j), 1, b(j + 1), 1)

               b(j) = b(j)/t(j, j)

            END DO

         END IF

      CASE (4)

!

!        solve trans(t)*x=b for t upper triangular.

!

         b(1) = b(1)/t(1, 1)

         IF (.NOT. (n < 2)) THEN

            DO j = 2, n

               b(j) = b(j) - ddot(j - 1, t(1, j), 1, b(1), 1)

               b(j) = b(j)/t(j, j)

            END DO

         END IF

      CASE DEFAULT

         cpabort("unexpected case")

      END SELECT


      RETURN

   END SUBROUTINE dtrsl


!MK Timer


! **************************************************************************************************

!> \brief This routine computes cpu time in double precision; it makes use o

!>        the intrinsic f90 cpu_time therefore a conversion type is

!>        needed.

!> \param ttime ...

! **************************************************************************************************

   SUBROUTINE timer(ttime)

      REAL(kind=dp)                                      :: ttime


!

!     REAL temp

!

!           J.L Morales  Departamento de Matematicas,

!                        Instituto Tecnologico Autonomo de Mexico

!                        Mexico D.F.

!

!           J.L Nocedal  Department of Electrical Engineering and

!                        Computer Science.

!                        Northwestern University. Evanston, IL. USA

!

!                        January 21, 2011

!

!MK      temp = sngl(ttime)

!MK      CALL cpu_time(temp)

!MK      ttime = REAL(temp, KIND=dp)


      ttime = m_walltime()


   END SUBROUTINE timer


! **************************************************************************************************

!> \brief  Saves the lcoal variables, long term this should be replaces by a lbfgs type

!> \param lsave    lsave is a working array

!>                 On exit with 'task' = NEW_X, the following information is available:

!>                 If lsave(1) = .true.  then  the initial X has been replaced by

!>                               its projection in the feasible set

!>                 If lsave(2) = .true.  then  the problem is constrained;

!>                 If lsave(3) = .true.  then  each variable has upper and lower bounds;

!> \param isave    isave is a working array

!>                 On exit with 'task' = NEW_X, the following information is available:

!>                 isave(22) = the total number of intervals explored in the

!>                         search of Cauchy points;

!>                 isave(26) = the total number of skipped BFGS updates before the current iteration;

!>                 isave(30) = the number of current iteration;

!>                 isave(31) = the total number of BFGS updates prior the current iteration;

!>                 isave(33) = the number of intervals explored in the search of

!>                             Cauchy point in the current iteration;

!>                 isave(34) = the total number of function and gradient evaluations;

!>                 isave(36) = the number of function value or gradient

!>                             evaluations in the current iteration;

!>                 if isave(37) = 0  then the subspace argmin is within the box;

!>                 if isave(37) = 1  then the subspace argmin is beyond the box;

!>                 isave(38) = the number of free variables in the current iteration;

!>                 isave(39) = the number of active constraints in the current iteration;

!>                 n + 1 - isave(40) = the number of variables leaving the set of

!>                                     active constraints in the current iteration;

!>                 isave(41) = the number of variables entering the set of active

!>                             constraints in the current iteration.

!> \param dsave    dsave is a working array of dimension 29.

!>                 On exit with 'task' = NEW_X, the following information is available:

!>                 dsave(1) = current 'theta' in the BFGS matrix;

!>                 dsave(2) = f(x) in the previous iteration;

!>                 dsave(3) = factr*epsmch;

!>                 dsave(4) = 2-norm of the line search direction vector;

!>                 dsave(5) = the machine precision epsmch generated by the code;

!>                 dsave(7) = the accumulated time spent on searching for Cauchy points;

!>                 dsave(8) = the accumulated time spent on subspace minimization;

!>                 dsave(9) = the accumulated time spent on line search;

!>                 dsave(11) = the slope of the line search function at the current point of line search;

!>                 dsave(12) = the maximum relative step length imposed in line search;

!>                 dsave(13) = the infinity norm of the projected gradient;

!>                 dsave(14) = the relative step length in the line search;

!>                 dsave(15) = the slope of the line search function at the starting point of the line search;

!>                 dsave(16) = the square of the 2-norm of the line search direction vector.

!> \param x_projected ...

!> \param constrained ...

!> \param boxed ...

!> \param updatd ...

!> \param nintol ...

!> \param itfile ...

!> \param iback ...

!> \param nskip ...

!> \param head ...

!> \param col ...

!> \param itail ...

!> \param iter ...

!> \param iupdat ...

!> \param nseg ...

!> \param nfgv ...

!> \param info ...

!> \param ifun ...

!> \param iword ...

!> \param nfree ...

!> \param nact ...

!> \param ileave ...

!> \param nenter ...

!> \param theta ...

!> \param fold ...

!> \param tol ...

!> \param dnorm ...

!> \param epsmch ...

!> \param cpu1 ...

!> \param cachyt ...

!> \param sbtime ...

!> \param lnscht ...

!> \param time1 ...

!> \param gd ...

!> \param step_max ...

!> \param g_inf_norm ...

!> \param stp ...

!> \param gdold ...

!> \param dtd ...

!> \author Samuel Andermatt (01.15)

! **************************************************************************************************


   SUBROUTINE save_local(lsave,isave,dsave,x_projected,constrained,boxed,updatd,nintol,itfile,iback,nskip,head,col,itail,&

                  iter, iupdat, nseg, nfgv, info, ifun, iword, nfree, nact, ileave, nenter, theta, fold, tol, dnorm, epsmch, cpu1, &

                         cachyt, sbtime, lnscht, time1, gd, step_max, g_inf_norm, stp, gdold, dtd)

      LOGICAL, INTENT(out)                               :: lsave(4)

      INTEGER, INTENT(out)                               :: isave(23)

      REAL(kind=dp), INTENT(out)                         :: dsave(29)

      LOGICAL, INTENT(in)                                :: x_projected, constrained, boxed, updatd

      INTEGER, INTENT(in)                                :: nintol, itfile, iback, nskip, head, col, &

                                                            itail, iter, iupdat, nseg, nfgv, info, &

                                                            ifun, iword, nfree, nact, ileave, &

                                                            nenter

      REAL(kind=dp), INTENT(in)                          :: theta, fold, tol, dnorm, epsmch, cpu1, &

                                                            cachyt, sbtime, lnscht, time1, gd, &

                                                            step_max, g_inf_norm, stp, gdold, dtd


      lsave(1) = x_projected

      lsave(2) = constrained

      lsave(3) = boxed

      lsave(4) = updatd


      isave(1) = nintol

      isave(3) = itfile

      isave(4) = iback

      isave(5) = nskip

      isave(6) = head

      isave(7) = col

      isave(8) = itail

      isave(9) = iter

      isave(10) = iupdat

      isave(12) = nseg

      isave(13) = nfgv

      isave(14) = info

      isave(15) = ifun

      isave(16) = iword

      isave(17) = nfree

      isave(18) = nact

      isave(19) = ileave

      isave(20) = nenter


      dsave(1) = theta

      dsave(2) = fold

      dsave(3) = tol

      dsave(4) = dnorm

      dsave(5) = epsmch

      dsave(6) = cpu1

      dsave(7) = cachyt

      dsave(8) = sbtime

      dsave(9) = lnscht

      dsave(10) = time1

      dsave(11) = gd

      dsave(12) = step_max

      dsave(13) = g_inf_norm

      dsave(14) = stp

      dsave(15) = gdold

      dsave(16) = dtd


   END SUBROUTINE save_local


END MODULE cp_lbfgs

bibliography
collects all references to literature in CP2K as new algorithms / method are included from literature...
Definition bibliography.F:21

bibliography::byrd1995
integer, save, public byrd1995
Definition bibliography.F:36

cp_files
Utility routines to open and close files. Tracking of preconnections.
Definition cp_files.F:16

cp_files::open_file
subroutine, public open_file(file_name, file_status, file_form, file_action, file_position, file_pad, unit_number, debug, skip_get_unit_number, file_access)
Opens the requested file using a free unit number.
Definition cp_files.F:308

cp_lbfgs
LBFGS-B routine (version 3.0, April 25, 2011)
Definition cp_lbfgs.F:19

cp_lbfgs::setulb
subroutine, public setulb(n, m, x, lower_bound, upper_bound, nbd, f, g, factr, pgtol, wa, iwa, task, iprint, csave, lsave, isave, dsave, trust_radius, spgr)
This subroutine partitions the working arrays wa and iwa, and then uses the limited memory BFGS metho...
Definition cp_lbfgs.F:185

gamma
Calculation of the incomplete Gamma function F_n(t) for multi-center integrals over Cartesian Gaussia...
Definition gamma.F:15

kinds
Defines the basic variable types.
Definition kinds.F:23

kinds::dp
integer, parameter, public dp
Definition kinds.F:34

machine
Machine interface based on Fortran 2003 and POSIX.
Definition machine.F:17

machine::m_walltime
real(kind=dp) function, public m_walltime()
returns time from a real-time clock, protected against rolling early/easily
Definition machine.F:147

space_groups_types
Space Group Symmetry Type Module (version 1.0, Ferbruary 12, 2021)
Definition space_groups_types.F:14

space_groups
Space Group Symmetry Module (version 1.0, January 16, 2020)
Definition space_groups.F:14

space_groups::spgr_apply_rotations_coord
subroutine, public spgr_apply_rotations_coord(spgr, coord)
routine applies the rotation matrices to the coordinates.
Definition space_groups.F:618

space_groups::spgr_apply_rotations_force
subroutine, public spgr_apply_rotations_force(spgr, force)
routine applies the rotation matrices to the forces.
Definition space_groups.F:679

space_groups_types::spgr_type
Definition space_groups_types.F:27