! d7/dc2/matrix__exp_8F_source.html

!--------------------------------------------------------------------------------------------------!

!   CP2K: A general program to perform molecular dynamics simulations                              !

!   Copyright 2000-2025 CP2K developers group <https://cp2k.org>                                   !

!                                                                                                  !

!   SPDX-License-Identifier: GPL-2.0-or-later                                                      !

!--------------------------------------------------------------------------------------------------!


! **************************************************************************************************

!> \brief Routines for calculating a complex matrix exponential.

!> \author Florian Schiffmann (02.09)

! **************************************************************************************************


MODULE matrix_exp


   USE cp_cfm_basic_linalg,             ONLY: cp_cfm_scale_and_add,&

                                              cp_cfm_solve

   USE cp_cfm_types,                    ONLY: cp_cfm_create,&

                                              cp_cfm_release,&

                                              cp_cfm_set_all,&

                                              cp_cfm_to_cfm,&

                                              cp_cfm_type

   USE cp_fm_basic_linalg,              ONLY: cp_complex_fm_gemm,&

                                              cp_fm_scale_and_add,&

                                              cp_fm_solve

   USE cp_fm_struct,                    ONLY: cp_fm_struct_double,&

                                              cp_fm_struct_release,&

                                              cp_fm_struct_type

   USE cp_fm_types,                     ONLY: cp_fm_create,&

                                              cp_fm_get_info,&

                                              cp_fm_release,&

                                              cp_fm_set_all,&

                                              cp_fm_to_fm,&

                                              cp_fm_type

   USE cp_log_handling,                 ONLY: cp_to_string

   USE kinds,                           ONLY: dp

   USE mathconstants,                   ONLY: fac,&

                                              z_one,&

                                              z_zero

   USE message_passing,                 ONLY: mp_comm_type,&

                                              mp_para_env_type

   USE parallel_gemm_api,               ONLY: parallel_gemm

#include "./base/base_uses.f90"


   IMPLICIT NONE


   PRIVATE


   CHARACTER(len=*), PARAMETER, PRIVATE :: moduleN = 'matrix_exp'


   PUBLIC :: taylor_only_imaginary, &

             taylor_full_complex, &

             exp_pade_full_complex, &

             exp_pade_only_imaginary, &

             get_nsquare_norder, &

             arnoldi, exp_pade_real


CONTAINS


! **************************************************************************************************
!> \brief Exponential exp(i*A) of a purely imaginary matrix i*A, evaluated with a truncated
!>        Taylor series combined with scaling and squaring. Since A is real, the odd powers
!>        only feed the imaginary part and the even powers only the real part of the result,
!>        so the series itself needs real matrix products only.
!> \param exp_H result: exp_H(1) receives the real part, exp_H(2) the imaginary part
!> \param im_matrix real matrix A, i.e. the imaginary part of the exponent (not modified)
!> \param nsquare number of squaring steps; the series is evaluated for A/2**nsquare
!> \param ntaylor Taylor order; CEILING(ntaylor/2) pairs of (odd, even) terms are summed,
!>        so the series runs up to order 2*CEILING(ntaylor/2)
!> \author Florian Schiffmann (02.09)
! **************************************************************************************************
   SUBROUTINE taylor_only_imaginary(exp_H, im_matrix, nsquare, ntaylor)
      TYPE(cp_fm_type), DIMENSION(2)                     :: exp_H
      TYPE(cp_fm_type), INTENT(IN)                       :: im_matrix
      INTEGER, INTENT(IN)                                :: nsquare, ntaylor

      CHARACTER(len=*), PARAMETER :: routineN = 'taylor_only_imaginary'
      REAL(KIND=dp), PARAMETER                           :: one = 1.0_dp, zero = 0.0_dp

      INTEGER                                            :: handle, ipair, isq, ndim, npair
      REAL(KIND=dp)                                      :: coeff, factorial, scale_fac
      REAL(KIND=dp), CONTIGUOUS, DIMENSION(:, :), &
         POINTER                                         :: local_data_im
      TYPE(cp_fm_type)                                   :: pow_even, pow_odd, sum_im, sum_re

      CALL timeset(routineN, handle)

      ! the local data pointer is queried as in the original routine, but not used further
      CALL cp_fm_get_info(im_matrix, local_data=local_data_im)
      ndim = im_matrix%matrix_struct%nrow_global

      ! the scaling is applied as the alpha prefactor of every product with im_matrix,
      ! so the (INTENT(IN)) input matrix never has to be scaled in place
      scale_fac = 1.0_dp/(2.0_dp**REAL(nsquare, dp))

      CALL cp_fm_create(pow_even, matrix_struct=im_matrix%matrix_struct, name="T1")
      CALL cp_fm_create(pow_odd, matrix_struct=pow_even%matrix_struct, name="T2")
      CALL cp_fm_create(sum_im, matrix_struct=pow_even%matrix_struct, name="T3")
      CALL cp_fm_create(sum_re, matrix_struct=pow_even%matrix_struct, name="Tres")

      ! zeroth order: real part and running even power start from cp_fm_set_all(.., zero, one),
      ! the imaginary part starts from zero
      CALL cp_fm_set_all(sum_re, zero, one)
      CALL cp_fm_set_all(sum_im, zero, zero)
      CALL cp_fm_set_all(pow_even, zero, one)

      factorial = 1.0_dp
      npair = CEILING(REAL(ntaylor, dp)/2.0_dp)

      DO ipair = 1, npair
         ! odd order 2*ipair-1 -> imaginary part, signs +,-,+,... (sine series)
         factorial = factorial*REAL(2*ipair - 1, dp)
         CALL parallel_gemm("N", "N", ndim, ndim, ndim, scale_fac, im_matrix, pow_even, zero, &
                            pow_odd)
         IF (MOD(ipair, 2) == 0) THEN
            coeff = -1.0_dp/factorial
         ELSE
            coeff = 1.0_dp/factorial
         END IF
         CALL cp_fm_scale_and_add(one, sum_im, coeff, pow_odd)

         ! even order 2*ipair -> real part, signs -,+,-,... (cosine series)
         factorial = factorial*REAL(2*ipair, dp)
         CALL parallel_gemm("N", "N", ndim, ndim, ndim, scale_fac, im_matrix, pow_odd, zero, &
                            pow_even)
         IF (MOD(ipair, 2) == 1) THEN
            coeff = -1.0_dp/factorial
         ELSE
            coeff = 1.0_dp/factorial
         END IF
         CALL cp_fm_scale_and_add(one, sum_re, coeff, pow_even)
      END DO

      IF (nsquare <= 0) THEN
         ! nothing to square: the series is already the result
         CALL cp_fm_to_fm(sum_re, exp_H(1))
         CALL cp_fm_to_fm(sum_im, exp_H(2))
      ELSE
         ! undo the scaling: square the complex matrix nsquare times; exp_H is the target of
         ! every product and is copied back so that it holds the result after the last step
         DO isq = 1, nsquare
            CALL cp_complex_fm_gemm("N", "N", ndim, ndim, ndim, one, sum_re, sum_im, &
                                    sum_re, sum_im, zero, exp_H(1), exp_H(2))
            CALL cp_fm_to_fm(exp_H(1), sum_re)
            CALL cp_fm_to_fm(exp_H(2), sum_im)
         END DO
      END IF

      CALL cp_fm_release(pow_even)
      CALL cp_fm_release(pow_odd)
      CALL cp_fm_release(sum_re)
      CALL cp_fm_release(sum_im)

      CALL timestop(handle)

   END SUBROUTINE taylor_only_imaginary


! **************************************************************************************************
!> \brief Exponential of a general complex matrix H = re_part + i*im_part, evaluated with a
!>        truncated Taylor series in complex arithmetic plus scaling and squaring.
!> \param exp_H result: the local data of exp_H(1) receives the real part, that of exp_H(2)
!>        the imaginary part of the exponential
!> \param re_part real part of the exponent (not modified)
!> \param im_part imaginary part of the exponent (not modified)
!> \param nsquare number of squaring steps; the series is evaluated for H/2**nsquare
!> \param ntaylor highest order kept in the Taylor series
!> \author Florian Schiffmann (02.09)
! **************************************************************************************************
   SUBROUTINE taylor_full_complex(exp_H, re_part, im_part, nsquare, ntaylor)
      TYPE(cp_fm_type), DIMENSION(2)                     :: exp_H
      TYPE(cp_fm_type), INTENT(IN)                       :: re_part, im_part
      INTEGER, INTENT(IN)                                :: nsquare, ntaylor

      CHARACTER(len=*), PARAMETER :: routineN = 'taylor_full_complex'

      COMPLEX(KIND=dp)                                   :: inv_factorial
      INTEGER                                            :: handle, iorder, isq, ndim
      REAL(KIND=dp)                                      :: factorial, scale_div
      REAL(KIND=dp), CONTIGUOUS, DIMENSION(:, :), &
         POINTER                                         :: local_data_im, local_data_re
      TYPE(cp_cfm_type)                                  :: next_power, power, scaled_h, series

      CALL timeset(routineN, handle)

      CALL cp_fm_get_info(re_part, local_data=local_data_re)
      CALL cp_fm_get_info(im_part, local_data=local_data_im)
      ndim = re_part%matrix_struct%nrow_global
      scale_div = 2.0_dp**REAL(nsquare, dp)

      CALL cp_cfm_create(scaled_h, matrix_struct=re_part%matrix_struct, name="T1")
      CALL cp_cfm_create(power, matrix_struct=scaled_h%matrix_struct, name="T2")
      CALL cp_cfm_create(next_power, matrix_struct=scaled_h%matrix_struct, name="T3")
      CALL cp_cfm_create(series, matrix_struct=scaled_h%matrix_struct, name="Tres")

      ! complex, scaled copy of the exponent: H/2**nsquare
      scaled_h%local_data = CMPLX(local_data_re/scale_div, local_data_im/scale_div, KIND=dp)

      ! zeroth order term and zeroth power of the scaled matrix
      CALL cp_cfm_set_all(series, z_zero, z_one)
      CALL cp_cfm_set_all(power, z_zero, z_one)

      factorial = 1.0_dp
      DO iorder = 1, ntaylor
         factorial = factorial*REAL(iorder, dp)
         ! next_power = scaled_h**iorder, added to the series with weight 1/iorder!
         CALL parallel_gemm("N", "N", ndim, ndim, ndim, z_one, scaled_h, power, z_zero, &
                            next_power)
         inv_factorial = CMPLX(1._dp/factorial, 0.0_dp, KIND=dp)
         CALL cp_cfm_scale_and_add(z_one, series, inv_factorial, next_power)
         CALL cp_cfm_to_cfm(next_power, power)
      END DO

      ! repeated squaring undoes the scaling (zero-trip loop for nsquare <= 0);
      ! power is free again at this point and serves as product buffer
      DO isq = 1, nsquare
         CALL parallel_gemm("N", "N", ndim, ndim, ndim, z_one, series, series, z_zero, &
                            power)
         CALL cp_cfm_to_cfm(power, series)
      END DO

      ! split the complex result into the two real output matrices
      exp_H(1)%local_data = REAL(series%local_data, KIND=dp)
      exp_H(2)%local_data = AIMAG(series%local_data)

      CALL cp_cfm_release(scaled_h)
      CALL cp_cfm_release(power)
      CALL cp_cfm_release(next_power)
      CALL cp_cfm_release(series)

      CALL timestop(handle)

   END SUBROUTINE taylor_full_complex


! **************************************************************************************************
!> \brief Chooses the number of squaring steps and the expansion order for a scaled-and-squared
!>        Pade (method == 2) or Taylor (method == 1) exponential. The scalar exp(norm) is
!>        approximated the same way the matrix would be, and a (scaling, order) pair is
!>        accepted once the relative error drops to eps_exp or below. Among the accepted
!>        pairs the one with the lowest cost estimate is returned.
!> \param norm scalar the approximation is tested on (a norm of the matrix to exponentiate)
!> \param nsquare on exit: selected number of squaring steps
!> \param norder on exit: selected expansion order
!> \param eps_exp accepted error, relative to MAX(1, EXP(norm))
!> \param method 2: Pade approximant (scalings 0..12, orders 1..12);
!>        1: Taylor series (scalings 0..6, orders 1..20)
!> \param do_emd selects the cost estimate: nsquare + norder if .TRUE.,
!>        nsquare + CEILING(norder/3) otherwise
!> \note  If no tested pair reaches eps_exp, or method is neither 1 nor 2, the initial
!>        values nsquare = 12 and norder = 12 are returned.
!> \author Florian Schiffmann (02.09)
! **************************************************************************************************
   SUBROUTINE get_nsquare_norder(norm, nsquare, norder, eps_exp, method, do_emd)

      REAL(dp), INTENT(IN)                               :: norm
      INTEGER, INTENT(OUT)                               :: nsquare, norder
      REAL(dp), INTENT(IN)                               :: eps_exp
      INTEGER, INTENT(IN)                                :: method
      LOGICAL, INTENT(IN)                                :: do_emd

      INTEGER                                            :: best(3), iscale, k, p, q
      LOGICAL                                            :: found
      REAL(dp)                                           :: coef_d, coef_n, denom, exp_norm, &
                                                            numer, ref_scale, x

      ! best = (/squaring steps, order, numerator degree/) of the cheapest accepted pair
      best(:) = (/12, 12, 12/)

      SELECT CASE (method)
      CASE (2)
         exp_norm = EXP(norm)
         ref_scale = MAX(1.0_dp, exp_norm)
         pade_scale: DO iscale = 0, 12
            found = .FALSE.
            x = norm/(2.0_dp**REAL(iscale, dp))
            pade_order: DO q = 1, 12
               DO p = MAX(1, q - 1), q
                  ! scalar [p/q] Pade approximant numer/denom evaluated at x
                  denom = 1.0_dp
                  numer = 1.0_dp
                  DO k = 1, q
                     coef_d = (-1.0)**k*fac(p + q - k)*fac(q)/(fac(p + q)*fac(k)*fac(q - k))
                     denom = denom + coef_d*x**k
                     IF (k > p) CYCLE
                     coef_n = fac(p + q - k)*fac(p)/(fac(p + q)*fac(k)*fac(p - k))
                     numer = numer + coef_n*x**k
                  END DO
                  IF (ABS((exp_norm - (numer/denom)**(2.0_dp**iscale))/ref_scale) <= eps_exp) THEN
                     IF (step_cost(iscale, q) < step_cost(best(1), best(2))) THEN
                        best(:) = (/iscale, q, p/)
                     END IF
                     found = .TRUE.
                     ! lowest sufficient order for this scaling found: try the next scaling
                     EXIT pade_order
                  END IF
               END DO
            END DO pade_order
            ! stop once this scaling converged and the scaling count alone has reached
            ! the stored steps + order
            IF (found .AND. iscale >= best(1) + best(2)) EXIT pade_scale
         END DO pade_scale

      CASE (1)
         exp_norm = EXP(norm)
         ref_scale = MAX(1.0_dp, exp_norm)
         taylor_scale: DO iscale = 0, 6
            found = .FALSE.
            x = norm/(2.0_dp**REAL(iscale, dp))
            DO p = 1, 20
               ! scalar Taylor polynomial of degree p evaluated at x
               numer = 1.0_dp
               DO k = 1, p
                  coef_n = 1.0_dp/fac(k)
                  numer = numer + coef_n*(x**REAL(k, dp))
               END DO
               IF (ABS((exp_norm - numer**(2.0_dp**REAL(iscale, dp)))/ref_scale) <= eps_exp) THEN
                  IF (step_cost(iscale, p) < step_cost(best(1), best(2))) THEN
                     best(:) = (/iscale, p, 0/)
                  END IF
                  found = .TRUE.
                  EXIT
               END IF
            END DO
            IF (found .AND. iscale >= best(1) + best(2)) EXIT taylor_scale
         END DO taylor_scale

      END SELECT

      nsquare = best(1)
      norder = best(2)

   CONTAINS

! **************************************************************************************************
!> \brief Cost estimate of a (squaring steps, order) pair; the model is picked by do_emd
!> \param nsq number of squaring steps
!> \param nord expansion order
!> \return estimated cost
! **************************************************************************************************
      PURE FUNCTION step_cost(nsq, nord) RESULT(cost)
         INTEGER, INTENT(IN)                             :: nsq, nord
         INTEGER                                         :: cost

         IF (do_emd) THEN
            cost = nsq + nord
         ELSE
            cost = nsq + CEILING(REAL(nord, dp)/3.0_dp)
         END IF
      END FUNCTION step_cost

   END SUBROUTINE get_nsquare_norder


! **************************************************************************************************
!> \brief Exponential of a complex matrix H = re_part + i*im_part, calculated with a diagonal
!>        [npade/npade] Pade approximant together with scaling and squaring:
!>        X = H/2**nsquare, R = Dpq(X)^-1 Npq(X), exp(H) ~ R**(2**nsquare).
!> \param exp_H result: the local data of exp_H(1) receives the real part, that of exp_H(2)
!>        the imaginary part of the exponential
!> \param re_part real part of the exponent (not modified)
!> \param im_part imaginary part of the exponent (not modified)
!> \param nsquare number of squaring steps
!> \param npade order of the Pade approximant (numerator and denominator degree)
!> \note  The first order term is always included. All terms of order 2..npade are added by
!>        the loop below; this includes npade == 2, for which the second order term used to be
!>        skipped by an "npade > 2" guard, silently degrading the approximant to [1/1].
!> \author Florian Schiffmann (02.09)
! **************************************************************************************************
   SUBROUTINE exp_pade_full_complex(exp_H, re_part, im_part, nsquare, npade)
      TYPE(cp_fm_type), DIMENSION(2)                     :: exp_H
      TYPE(cp_fm_type), INTENT(IN)                       :: re_part, im_part
      INTEGER, INTENT(IN)                                :: nsquare, npade

      CHARACTER(len=*), PARAMETER :: routineN = 'exp_pade_full_complex'

      COMPLEX(KIND=dp)                                   :: scaleD, scaleN
      INTEGER                                            :: handle, i, idst, isrc, ldim, ndim, p, q
      REAL(KIND=dp)                                      :: square_fac
      REAL(KIND=dp), CONTIGUOUS, DIMENSION(:, :), &
         POINTER                                         :: local_data_im, local_data_re
      TYPE(cp_cfm_type)                                  :: Dpq, fin_p, T1
      TYPE(cp_cfm_type), DIMENSION(2)                    :: mult_p
      TYPE(cp_cfm_type), TARGET                          :: Npq, T2, Tres

      CALL timeset(routineN, handle)

      ! the coefficient formulas are written for general p, q, but the hard-coded first
      ! order coefficient 1/2 below is only correct for the diagonal case p == q
      p = npade
      q = npade

      CALL cp_fm_get_info(re_part, local_data=local_data_re, ncol_local=ldim, &
                          nrow_global=ndim)
      CALL cp_fm_get_info(im_part, local_data=local_data_im)

      square_fac = 2.0_dp**REAL(nsquare, dp)

      CALL cp_cfm_create(Dpq, &
                         matrix_struct=re_part%matrix_struct, &
                         name="Dpq")
      CALL cp_cfm_create(T1, &
                         matrix_struct=Dpq%matrix_struct, &
                         name="T1")
      CALL cp_cfm_create(T2, &
                         matrix_struct=T1%matrix_struct, &
                         name="T2")
      CALL cp_cfm_create(Npq, &
                         matrix_struct=T1%matrix_struct, &
                         name="Npq")
      CALL cp_cfm_create(Tres, &
                         matrix_struct=T1%matrix_struct, &
                         name="Tres")

      ! X = H/2**nsquare; T1 keeps X, T2/Tres alternate as buffers for the powers of X
      DO i = 1, ldim
         T2%local_data(:, i) = CMPLX(local_data_re(:, i)/square_fac, local_data_im(:, i)/square_fac, KIND=dp)
      END DO
      CALL cp_cfm_to_cfm(T2, T1)
      ! mult_p holds copies of the matrix handles, which are used to address the two buffers
      mult_p(1) = T2
      mult_p(2) = Tres

      ! zeroth and first order terms: Npq = 1 + X/2, Dpq = 1 - X/2
      CALL cp_cfm_set_all(Npq, z_zero, z_one)
      CALL cp_cfm_set_all(Dpq, z_zero, z_one)
      CALL cp_cfm_scale_and_add(z_one, Npq, z_one*0.5_dp, T2)
      CALL cp_cfm_scale_and_add(z_one, Dpq, -z_one*0.5_dp, T2)

      ! higher order terms; zero-trip loop for npade < 2
      DO i = 2, npade
         scaleN = CMPLX(fac(p + q - i)*fac(p)/(fac(p + q)*fac(i)*fac(p - i)), 0.0_dp, KIND=dp)
         scaleD = CMPLX((-1.0_dp)**i*fac(p + q - i)*fac(q)/(fac(p + q)*fac(i)*fac(q - i)), 0.0_dp, KIND=dp)
         ! X**i = X * X**(i-1): read from one buffer, write to the other
         isrc = MOD(i, 2) + 1
         idst = MOD(i + 1, 2) + 1
         CALL parallel_gemm("N", "N", ndim, ndim, ndim, z_one, T1, mult_p(isrc), z_zero, &
                            mult_p(idst))
         CALL cp_cfm_scale_and_add(z_one, Npq, scaleN, mult_p(idst))
         CALL cp_cfm_scale_and_add(z_one, Dpq, scaleD, mult_p(idst))
      END DO

      ! Npq is used as the approximant R = Dpq^-1 Npq from here on (presumably cp_cfm_solve
      ! overwrites its second argument with the solution)
      CALL cp_cfm_solve(Dpq, Npq)

      ! repeated squaring, alternating between Npq and Tres as source and target
      mult_p(2) = Npq
      mult_p(1) = Tres
      IF (nsquare .GT. 0) THEN
         DO i = 1, nsquare
            isrc = MOD(i, 2) + 1
            idst = MOD(i + 1, 2) + 1
            CALL parallel_gemm("N", "N", ndim, ndim, ndim, z_one, mult_p(isrc), mult_p(isrc), z_zero, &
                               mult_p(idst))
         END DO
         ! target buffer of the last squaring step
         fin_p = mult_p(MOD(nsquare + 1, 2) + 1)
      ELSE
         fin_p = Npq
      END IF

      ! split the complex result into the two real output matrices
      DO i = 1, ldim
         exp_H(1)%local_data(:, i) = REAL(fin_p%local_data(:, i), KIND=dp)
         exp_H(2)%local_data(:, i) = AIMAG(fin_p%local_data(:, i))
      END DO

      ! fin_p and mult_p are only handle copies, so only the created matrices are released
      CALL cp_cfm_release(Npq)
      CALL cp_cfm_release(Dpq)
      CALL cp_cfm_release(T1)
      CALL cp_cfm_release(T2)
      CALL cp_cfm_release(Tres)
      CALL timestop(handle)

   END SUBROUTINE exp_pade_full_complex


! **************************************************************************************************
!> \brief Exponential exp(i*A) of a purely imaginary matrix i*A, calculated with a diagonal
!>        [npade/npade] Pade approximant together with scaling and squaring. With
!>        s = 2**(-nsquare) and X = i*s*A the powers of X are built from real products of
!>        s*A only: even powers X**(2j) = (-1)**j (s*A)**(2j) are real, odd powers
!>        X**(2j+1) = i*(-1)**j (s*A)**(2j+1) are purely imaginary.
!> \param exp_H result: the local data of exp_H(1) receives the real part, that of exp_H(2)
!>        the imaginary part of the exponential
!> \param im_part real matrix A, i.e. the imaginary part of the exponent (not modified)
!> \param nsquare number of squaring steps
!> \param npade order of the Pade approximant (numerator and denominator degree)
!> \note  The work matrix carrying the powers is seeded with s*A (not A): every product
!>        below contributes exactly one further factor s, so only then does the k-th
!>        product equal (s*A)**k. Seeding it with the unscaled matrix left all terms of
!>        order >= 2 too large by a factor 2**nsquare whenever nsquare > 0.
!> \note  All terms of order 2..npade are included, also for npade == 2 (an "npade > 2"
!>        guard used to drop the second order term in that case).
!> \author Florian Schiffmann (02.09)
! **************************************************************************************************
   SUBROUTINE exp_pade_only_imaginary(exp_H, im_part, nsquare, npade)
      TYPE(cp_fm_type), DIMENSION(2)                     :: exp_H
      TYPE(cp_fm_type), INTENT(IN)                       :: im_part
      INTEGER, INTENT(IN)                                :: nsquare, npade

      CHARACTER(len=*), PARAMETER :: routineN = 'exp_pade_only_imaginary'
      REAL(KIND=dp), PARAMETER                           :: rone = 1.0_dp, rzero = 0.0_dp

      COMPLEX(KIND=dp)                                   :: scaleD, scaleN
      INTEGER                                            :: handle, i, j, k, ldim, ndim, p, q
      REAL(KIND=dp)                                      :: my_fac, square_fac
      REAL(KIND=dp), CONTIGUOUS, DIMENSION(:, :), &
         POINTER                                         :: local_data_im
      TYPE(cp_cfm_type)                                  :: Dpq, fin_p
      TYPE(cp_cfm_type), DIMENSION(2)                    :: cmult_p
      TYPE(cp_cfm_type), TARGET                          :: Npq, T1
      TYPE(cp_fm_type)                                   :: T2, Tres

      CALL timeset(routineN, handle)
      p = npade
      q = npade !p==q seems to be necessary for the rest of the code

      CALL cp_fm_get_info(im_part, local_data=local_data_im, ncol_local=ldim, nrow_global=ndim)
      square_fac = 1.0_dp/(2.0_dp**REAL(nsquare, dp))

      CALL cp_cfm_create(Dpq, &
                         matrix_struct=im_part%matrix_struct, &
                         name="Dpq")
      CALL cp_cfm_create(Npq, &
                         matrix_struct=Dpq%matrix_struct, &
                         name="Npq")
      CALL cp_cfm_create(T1, &
                         matrix_struct=Dpq%matrix_struct, &
                         name="T1")
      CALL cp_fm_create(T2, &
                        matrix_struct=T1%matrix_struct, &
                        name="T2")
      CALL cp_fm_create(Tres, &
                        matrix_struct=T1%matrix_struct, &
                        name="Tres")

      ! T2 = s*A: scaled first power, seed of the power recursion (see the note in the header)
      DO k = 1, ldim
         T2%local_data(:, k) = square_fac*local_data_im(:, k)
      END DO

      ! zeroth and first order terms: Npq = 1 + X/2, Dpq = 1 - X/2 with X = i*s*A
      CALL cp_cfm_set_all(Npq, z_zero, z_one)
      CALL cp_cfm_set_all(Dpq, z_zero, z_one)
      DO k = 1, ldim
         Npq%local_data(:, k) = Npq%local_data(:, k) + CMPLX(rzero, 0.5_dp*T2%local_data(:, k), dp)
         Dpq%local_data(:, k) = Dpq%local_data(:, k) - CMPLX(rzero, 0.5_dp*T2%local_data(:, k), dp)
      END DO

      ! higher orders are handled in (even, odd) pairs; zero-trip loop for npade < 2
      DO j = 1, npade/2
         ! even order i = 2*j: X**i = (-1)**j (s*A)**i is real; the sign is kept in my_fac
         i = 2*j
         my_fac = (-rone)**j
         scaleN = CMPLX(my_fac*fac(p + q - i)*fac(p)/(fac(p + q)*fac(i)*fac(p - i)), rzero, dp)
         scaleD = CMPLX(my_fac*fac(p + q - i)*fac(q)/(fac(p + q)*fac(i)*fac(q - i)), rzero, dp)
         ! Tres = (s*A) * (s*A)**(i-1)
         CALL parallel_gemm("N", "N", ndim, ndim, ndim, square_fac, im_part, T2, rzero, Tres)

         DO k = 1, ldim
            Npq%local_data(:, k) = Npq%local_data(:, k) + scaleN*Tres%local_data(:, k)
            Dpq%local_data(:, k) = Dpq%local_data(:, k) + scaleD*Tres%local_data(:, k)
         END DO

         IF (2*j + 1 .LE. q) THEN
            ! odd order i = 2*j+1: X**i = i*(-1)**j (s*A)**i is purely imaginary; the
            ! denominator coefficient carries the extra sign (-1)**i = -1
            i = 2*j + 1
            scaleN = CMPLX(my_fac*fac(p + q - i)*fac(p)/(fac(p + q)*fac(i)*fac(p - i)), rzero, dp)
            scaleD = CMPLX(-my_fac*fac(p + q - i)*fac(q)/(fac(p + q)*fac(i)*fac(q - i)), rzero, dp)
            ! T2 = (s*A) * (s*A)**(i-1)
            CALL parallel_gemm("N", "N", ndim, ndim, ndim, square_fac, im_part, Tres, rzero, T2)

            DO k = 1, ldim
               Npq%local_data(:, k) = Npq%local_data(:, k) + scaleN*CMPLX(rzero, T2%local_data(:, k), dp)
               Dpq%local_data(:, k) = Dpq%local_data(:, k) + scaleD*CMPLX(rzero, T2%local_data(:, k), dp)
            END DO
         END IF
      END DO

      ! Npq is used as the approximant R = Dpq^-1 Npq from here on (presumably cp_cfm_solve
      ! overwrites its second argument with the solution)
      CALL cp_cfm_solve(Dpq, Npq)

      ! repeated squaring, alternating between Npq and T1 as source and target;
      ! cmult_p holds copies of the matrix handles used to address the two buffers
      cmult_p(2) = Npq
      cmult_p(1) = T1
      IF (nsquare .GT. 0) THEN
         DO i = 1, nsquare
            CALL parallel_gemm("N", "N", ndim, ndim, ndim, z_one, cmult_p(MOD(i, 2) + 1), cmult_p(MOD(i, 2) + 1), z_zero, &
                               cmult_p(MOD(i + 1, 2) + 1))
         END DO
         ! target buffer of the last squaring step
         fin_p = cmult_p(MOD(nsquare + 1, 2) + 1)
      ELSE
         fin_p = Npq
      END IF

      ! split the complex result into the two real output matrices
      DO k = 1, ldim
         exp_H(1)%local_data(:, k) = REAL(fin_p%local_data(:, k), KIND=dp)
         exp_H(2)%local_data(:, k) = AIMAG(fin_p%local_data(:, k))
      END DO

      ! fin_p and cmult_p are only handle copies, so only the created matrices are released
      CALL cp_cfm_release(Npq)
      CALL cp_cfm_release(Dpq)
      CALL cp_cfm_release(T1)
      CALL cp_fm_release(T2)
      CALL cp_fm_release(Tres)
      CALL timestop(handle)

   END SUBROUTINE exp_pade_only_imaginary


! **************************************************************************************************
!> \brief Exponential of a real matrix, calculated with a diagonal [npade/npade] Pade
!>        approximant together with scaling and squaring:
!>        X = matrix/2**nsquare, R = Dpq(X)^-1 Npq(X), exp(matrix) ~ R**(2**nsquare).
!> \param exp_H result matrix; the handle is declared INTENT(IN), the exponential is stored
!>        through its local_data component
!> \param matrix real matrix to exponentiate (not modified)
!> \param nsquare number of squaring steps
!> \param npade order of the Pade approximant (numerator and denominator degree)
!> \note  Every term of Npq and Dpq, including the first order one, is built from the scaled
!>        matrix X. Taking the first order term from the unscaled input instead (while the
!>        higher orders use X) gives a wrong approximant whenever nsquare > 0.
!> \author Florian Schiffmann (02.09)
! **************************************************************************************************
   SUBROUTINE exp_pade_real(exp_H, matrix, nsquare, npade)
      TYPE(cp_fm_type), INTENT(IN)                       :: exp_H, matrix
      INTEGER, INTENT(IN)                                :: nsquare, npade

      CHARACTER(len=*), PARAMETER                        :: routineN = 'exp_pade_real'
      REAL(KIND=dp), PARAMETER                           :: one = 1.0_dp, zero = 0.0_dp

      INTEGER                                            :: handle, i, idst, isrc, j, k, ldim, &
                                                            ndim, p, q
      REAL(KIND=dp)                                      :: my_fac, scaleD, scaleN, square_fac
      REAL(KIND=dp), CONTIGUOUS, DIMENSION(:, :), &
         POINTER                                         :: local_data
      TYPE(cp_fm_type)                                   :: Dpq, fin_p
      TYPE(cp_fm_type), DIMENSION(2)                     :: mult_p
      TYPE(cp_fm_type), TARGET                           :: Npq, T1, T2, Tres

      CALL timeset(routineN, handle)
      p = npade
      q = npade !p==q seems to be necessary for the rest of the code

      CALL cp_fm_get_info(matrix, local_data=local_data, ncol_local=ldim, nrow_global=ndim)
      square_fac = 2.0_dp**REAL(nsquare, dp)

      CALL cp_fm_create(Dpq, &
                        matrix_struct=matrix%matrix_struct, &
                        name="Dpq")
      CALL cp_fm_create(Npq, &
                        matrix_struct=Dpq%matrix_struct, &
                        name="Npq")
      CALL cp_fm_create(T1, &
                        matrix_struct=Dpq%matrix_struct, &
                        name="T1")
      CALL cp_fm_create(T2, &
                        matrix_struct=T1%matrix_struct, &
                        name="T2")
      CALL cp_fm_create(Tres, &
                        matrix_struct=T1%matrix_struct, &
                        name="Tres")

      ! X = matrix/2**nsquare; T1 keeps X, T2/Tres alternate as buffers for the powers of X
      DO i = 1, ldim
         T2%local_data(:, i) = local_data(:, i)/square_fac
      END DO
      CALL cp_fm_to_fm(T2, T1)

      ! zeroth and first order terms: Npq = 1 + X/2, Dpq = 1 - X/2 (scaled matrix X!)
      CALL cp_fm_set_all(Npq, zero, one)
      CALL cp_fm_set_all(Dpq, zero, one)
      DO i = 1, ldim
         Npq%local_data(:, i) = Npq%local_data(:, i) + 0.5_dp*T1%local_data(:, i)
         Dpq%local_data(:, i) = Dpq%local_data(:, i) - 0.5_dp*T1%local_data(:, i)
      END DO

      ! mult_p holds copies of the matrix handles, which are used to address the two buffers
      mult_p(1) = T2
      mult_p(2) = Tres

      ! higher order terms; zero-trip loop for npade < 2
      DO j = 2, npade
         my_fac = (-1.0_dp)**j
         scaleN = fac(p + q - j)*fac(p)/(fac(p + q)*fac(j)*fac(p - j))
         scaleD = my_fac*fac(p + q - j)*fac(q)/(fac(p + q)*fac(j)*fac(q - j))
         ! X**j = X**(j-1) * X: read from one buffer, write to the other
         isrc = MOD(j, 2) + 1
         idst = MOD(j + 1, 2) + 1
         CALL parallel_gemm("N", "N", ndim, ndim, ndim, one, mult_p(isrc), T1, &
                            zero, mult_p(idst))

         DO k = 1, ldim
            Npq%local_data(:, k) = Npq%local_data(:, k) + scaleN*mult_p(idst)%local_data(:, k)
            Dpq%local_data(:, k) = Dpq%local_data(:, k) + scaleD*mult_p(idst)%local_data(:, k)
         END DO
      END DO

      ! Npq is used as the approximant R = Dpq^-1 Npq from here on (presumably cp_fm_solve
      ! overwrites its second argument with the solution)
      CALL cp_fm_solve(Dpq, Npq)

      ! repeated squaring, alternating between Npq and T1 (X is no longer needed)
      mult_p(2) = Npq
      mult_p(1) = T1
      IF (nsquare .GT. 0) THEN
         DO i = 1, nsquare
            isrc = MOD(i, 2) + 1
            idst = MOD(i + 1, 2) + 1
            CALL parallel_gemm("N", "N", ndim, ndim, ndim, one, mult_p(isrc), mult_p(isrc), zero, &
                               mult_p(idst))
         END DO
         ! target buffer of the last squaring step
         fin_p = mult_p(MOD(nsquare + 1, 2) + 1)
      ELSE
         fin_p = Npq
      END IF

      DO k = 1, ldim
         exp_H%local_data(:, k) = fin_p%local_data(:, k)
      END DO

      ! fin_p and mult_p are only handle copies, so only the created matrices are released
      CALL cp_fm_release(Npq)
      CALL cp_fm_release(Dpq)
      CALL cp_fm_release(T1)
      CALL cp_fm_release(T2)
      CALL cp_fm_release(Tres)
      CALL timestop(handle)

   END SUBROUTINE exp_pade_real


! ***************************************************************************************************

!> \brief exponential of a complex matrix,

!>        calculated using arnoldi subspace method (directly applies to the MOs)

!> \param mos_old ...

!> \param mos_new ...

!> \param eps_exp ...

!> \param Hre ...

!> \param Him ...

!> \param mos_next ...

!> \param narn_old ...

!> \author Florian Schiffmann (02.09)

! **************************************************************************************************


   SUBROUTINE arnoldi(mos_old, mos_new, eps_exp, Hre, Him, mos_next, narn_old)


      TYPE(cp_fm_type), DIMENSION(2)                     :: mos_old, mos_new

      REAL(kind=dp), INTENT(in)                          :: eps_exp

      TYPE(cp_fm_type), INTENT(IN), OPTIONAL             :: hre

      TYPE(cp_fm_type), INTENT(IN)                       :: him

      TYPE(cp_fm_type), DIMENSION(2), OPTIONAL           :: mos_next

      INTEGER, INTENT(inout)                             :: narn_old


      CHARACTER(len=*), PARAMETER                        :: routinen = 'arnoldi'

      REAL(kind=dp), PARAMETER                           :: rone = 1.0_dp, rzero = 0.0_dp


      INTEGER                                            :: handle, i, icol_local, idim, info, j, l, &

                                                            mydim, nao, narnoldi, ncol_local, &

                                                            newdim, nmo, npade, pade_step

      INTEGER, ALLOCATABLE, DIMENSION(:)                 :: ipivot

      INTEGER, DIMENSION(:), POINTER                     :: col_indices, col_procs

      LOGICAL                                            :: convergence, double_col, double_row

      REAL(dp), ALLOCATABLE, DIMENSION(:)                :: last_norm, norm1, results

      REAL(dp), ALLOCATABLE, DIMENSION(:, :)             :: d, mat1, mat2, mat3, n

      REAL(dp), ALLOCATABLE, DIMENSION(:, :, :)          :: h_approx, h_approx_save

      REAL(kind=dp)                                      :: conv_norm, prefac, scaled, scalen

      TYPE(cp_fm_struct_type), POINTER                   :: mo_struct, newstruct

      TYPE(cp_fm_type), ALLOCATABLE, DIMENSION(:)        :: v_mats

      TYPE(mp_comm_type)                                 :: col_group

      TYPE(mp_para_env_type), POINTER                    :: para_env


      CALL timeset(routinen, handle)

      para_env => mos_new(1)%matrix_struct%para_env


      CALL cp_fm_get_info(mos_old(1), ncol_local=ncol_local, col_indices=col_indices, &

                          nrow_global=nao, ncol_global=nmo, matrix_struct=mo_struct)

      narnoldi = min(18, nao)


      ALLOCATE (results(ncol_local))

      ALLOCATE (norm1(ncol_local))

      ALLOCATE (v_mats(narnoldi + 1))

      ALLOCATE (last_norm(ncol_local))

      ALLOCATE (h_approx(narnoldi, narnoldi, ncol_local))

      ALLOCATE (h_approx_save(narnoldi, narnoldi, ncol_local))

      col_procs => mo_struct%context%blacs2mpi(:, mo_struct%context%mepos(2))

      CALL col_group%from_reordering(para_env, col_procs)


      double_col = .true.

      double_row = .false.

      CALL cp_fm_struct_double(newstruct, mo_struct, mo_struct%context, double_col, double_row)

      h_approx_save = rzero


      DO i = 1, narnoldi + 1

         CALL cp_fm_create(v_mats(i), matrix_struct=newstruct, &

                           name="V_mat"//cp_to_string(i))

      END DO

      CALL cp_fm_get_info(v_mats(1), ncol_global=newdim)


      norm1 = 0.0_dp

!$OMP PARALLEL DO PRIVATE(icol_local) DEFAULT(NONE) SHARED(V_mats,norm1,mos_old,ncol_local)

      DO icol_local = 1, ncol_local

         v_mats(1)%local_data(:, icol_local) = mos_old(1)%local_data(:, icol_local)

         v_mats(1)%local_data(:, icol_local + ncol_local) = mos_old(2)%local_data(:, icol_local)

         norm1(icol_local) = sum(v_mats(1)%local_data(:, icol_local)**2) &

                             + sum(v_mats(1)%local_data(:, icol_local + ncol_local)**2)

      END DO


      CALL col_group%sum(norm1)

      !!! normalize the mo vectors

      norm1(:) = sqrt(norm1(:))


!$OMP PARALLEL DO PRIVATE(icol_local) DEFAULT(NONE) SHARED(V_mats,norm1,ncol_local)

      DO icol_local = 1, ncol_local

         v_mats(1)%local_data(:, icol_local) = v_mats(1)%local_data(:, icol_local)/norm1(icol_local)

         v_mats(1)%local_data(:, icol_local + ncol_local) = &

            v_mats(1)%local_data(:, icol_local + ncol_local)/norm1(icol_local)

      END DO


      ! arnoldi subspace procedure to get H_approx

      DO i = 2, narnoldi + 1

         !Be careful, imaginary matrix multiplied with complex. Unfortunately requires a swap of arrays afterwards

         CALL parallel_gemm("N", "N", nao, newdim, nao, 1.0_dp, him, v_mats(i - 1), 0.0_dp, v_mats(i))


!$OMP PARALLEL DO PRIVATE(icol_local) DEFAULT(NONE) SHARED(mos_new,V_mats,ncol_local,i)

         DO icol_local = 1, ncol_local

            mos_new(1)%local_data(:, icol_local) = v_mats(i)%local_data(:, icol_local)

            v_mats(i)%local_data(:, icol_local) = -v_mats(i)%local_data(:, icol_local + ncol_local)

            v_mats(i)%local_data(:, icol_local + ncol_local) = mos_new(1)%local_data(:, icol_local)

         END DO


         IF (PRESENT(hre)) THEN

            CALL parallel_gemm("N", "N", nao, newdim, nao, 1.0_dp, hre, v_mats(i - 1), 1.0_dp, v_mats(i))

         END IF


         DO l = 1, i - 1

!$OMP PARALLEL DO DEFAULT(NONE) SHARED(results,V_mats,ncol_local,l,i)

            DO icol_local = 1, ncol_local

               results(icol_local) = sum(v_mats(l)%local_data(:, icol_local)*v_mats(i)%local_data(:, icol_local)) + &

                                     sum(v_mats(l)%local_data(:, icol_local + ncol_local)* &

                                         v_mats(i)%local_data(:, icol_local + ncol_local))

            END DO


            CALL col_group%sum(results)


!$OMP PARALLEL DO DEFAULT(NONE) SHARED(H_approx_save,V_mats,ncol_local,l,i,results)

            DO icol_local = 1, ncol_local

               h_approx_save(l, i - 1, icol_local) = results(icol_local)

               v_mats(i)%local_data(:, icol_local) = v_mats(i)%local_data(:, icol_local) - &

                                                     results(icol_local)*v_mats(l)%local_data(:, icol_local)

               v_mats(i)%local_data(:, icol_local + ncol_local) = &

                  v_mats(i)%local_data(:, icol_local + ncol_local) - &

                  results(icol_local)*v_mats(l)%local_data(:, icol_local + ncol_local)

            END DO

         END DO


!$OMP PARALLEL DO DEFAULT(NONE) SHARED(ncol_local,V_mats,results,i)

         DO icol_local = 1, ncol_local

            results(icol_local) = sum(v_mats(i)%local_data(:, icol_local)**2) + &

                                  sum(v_mats(i)%local_data(:, icol_local + ncol_local)**2)

         END DO


         CALL col_group%sum(results)


         IF (i .LE. narnoldi) THEN


!$OMP PARALLEL DO DEFAULT(NONE) SHARED(H_approx_save,last_norm,V_mats,ncol_local,i,results)

            DO icol_local = 1, ncol_local

               h_approx_save(i, i - 1, icol_local) = sqrt(results(icol_local))

               last_norm(icol_local) = sqrt(results(icol_local))

               v_mats(i)%local_data(:, icol_local) = v_mats(i)%local_data(:, icol_local)/sqrt(results(icol_local))

               v_mats(i)%local_data(:, icol_local + ncol_local) = &

                  v_mats(i)%local_data(:, icol_local + ncol_local)/sqrt(results(icol_local))

            END DO

         ELSE

!$OMP PARALLEL DO DEFAULT(NONE) SHARED(ncol_local,last_norm,results)

            DO icol_local = 1, ncol_local

               last_norm(icol_local) = sqrt(results(icol_local))

            END DO

         END IF


         h_approx(:, :, :) = h_approx_save


         ! PADE approximation for exp(H_approx), everything is done locally


         convergence = .false.

         IF (i .GE. narn_old) THEN

            npade = 9

            mydim = min(i, narnoldi)

            ALLOCATE (ipivot(mydim))

            ALLOCATE (mat1(mydim, mydim))

            ALLOCATE (mat2(mydim, mydim))

            ALLOCATE (mat3(mydim, mydim))

            ALLOCATE (n(mydim, mydim))

            ALLOCATE (d(mydim, mydim))

            DO icol_local = 1, ncol_local

               DO idim = 1, mydim

                  DO j = 1, mydim

                     mat1(idim, j) = h_approx(idim, j, icol_local)/16.0_dp

                     mat3(idim, j) = mat1(idim, j)

                  END DO

               END DO

               n = 0.0_dp

               d = 0.0_dp

               DO idim = 1, mydim

                  n(idim, idim) = rone

                  d(idim, idim) = rone

               END DO

               n(:, :) = n + 0.5_dp*mat1

               d(:, :) = d - 0.5_dp*mat1

               pade_step = 1

               DO idim = 1, 4

                  pade_step = pade_step + 1

                  CALL dgemm("N", 'N', mydim, mydim, mydim, rone, mat1(1, 1), &

                             mydim, mat3(1, 1), mydim, rzero, mat2(1, 1), mydim)

                  scalen = real(fac(2*npade - pade_step)*fac(npade)/ &

                                (fac(2*npade)*fac(pade_step)*fac(npade - pade_step)), dp)

                  scaled = real((-1.0_dp)**pade_step*fac(2*npade - pade_step)*fac(npade)/ &

                                (fac(2*npade)*fac(pade_step)*fac(npade - pade_step)), dp)

                  n(:, :) = n + scalen*mat2

                  d(:, :) = d + scaled*mat2

                  pade_step = pade_step + 1

                  CALL dgemm("N", 'N', mydim, mydim, mydim, rone, mat2(1, 1), &

                             mydim, mat1(1, 1), mydim, rzero, mat3(1, 1), mydim)

                  scalen = real(fac(2*npade - pade_step)*fac(npade)/ &

                                (fac(2*npade)*fac(pade_step)*fac(npade - pade_step)), dp)

                  scaled = real((-1.0_dp)**pade_step*fac(2*npade - pade_step)*fac(npade)/ &

                                (fac(2*npade)*fac(pade_step)*fac(npade - pade_step)), dp)

                  n(:, :) = n + scalen*mat3

                  d(:, :) = d + scaled*mat3

               END DO


               CALL dgetrf(mydim, mydim, d(1, 1), mydim, ipivot, info)

               CALL dgetrs("N", mydim, mydim, d(1, 1), mydim, ipivot, n, mydim, info)

               CALL dgemm("N", 'N', mydim, mydim, mydim, rone, n(1, 1), mydim, n(1, 1), mydim, rzero, mat1(1, 1), mydim)

               CALL dgemm("N", 'N', mydim, mydim, mydim, rone, mat1(1, 1), mydim, mat1(1, 1), mydim, rzero, n(1, 1), mydim)

               CALL dgemm("N", 'N', mydim, mydim, mydim, rone, n(1, 1), mydim, n(1, 1), mydim, rzero, mat1(1, 1), mydim)

               CALL dgemm("N", 'N', mydim, mydim, mydim, rone, mat1(1, 1), mydim, mat1(1, 1), mydim, rzero, n(1, 1), mydim)

               DO idim = 1, mydim

                  DO j = 1, mydim

                     h_approx(idim, j, icol_local) = n(idim, j)

                  END DO

               END DO

            END DO

            ! H_approx is exp(H_approx) right now, calculate new MOs and check for convergence

            conv_norm = 0.0_dp

            results = 0.0_dp

            DO icol_local = 1, ncol_local

               results(icol_local) = last_norm(icol_local)*h_approx(i - 1, 1, icol_local)

               conv_norm = max(conv_norm, abs(results(icol_local)))

            END DO


            CALL para_env%max(conv_norm)


            IF (conv_norm .LT. eps_exp .OR. i .GT. narnoldi) THEN


               mos_new(1)%local_data = rzero

               mos_new(2)%local_data = rzero

               DO icol_local = 1, ncol_local

                  DO idim = 1, mydim

                     prefac = h_approx(idim, 1, icol_local)*norm1(icol_local)

                     mos_new(1)%local_data(:, icol_local) = mos_new(1)%local_data(:, icol_local) + &

                                                            v_mats(idim)%local_data(:, icol_local)*prefac

                     mos_new(2)%local_data(:, icol_local) = mos_new(2)%local_data(:, icol_local) + &

                                                            v_mats(idim)%local_data(:, icol_local + ncol_local)*prefac

                  END DO

               END DO


               IF (PRESENT(mos_next)) THEN

                  DO icol_local = 1, ncol_local

                     DO idim = 1, mydim

                        DO j = 1, mydim

                           n(idim, j) = h_approx(idim, j, icol_local)

                        END DO

                     END DO

                     CALL dgemm("N", 'N', mydim, mydim, mydim, rone, n(1, 1), mydim, n(1, 1), mydim, rzero, mat1(1, 1), mydim)

                     DO idim = 1, mydim

                        DO j = 1, mydim

                           h_approx(idim, j, icol_local) = mat1(idim, j)

                        END DO

                     END DO

                  END DO

                  mos_next(1)%local_data = rzero

                  mos_next(2)%local_data = rzero

                  DO icol_local = 1, ncol_local

                     DO idim = 1, mydim

                        prefac = h_approx(idim, 1, icol_local)*norm1(icol_local)

                        mos_next(1)%local_data(:, icol_local) = &

                           mos_next(1)%local_data(:, icol_local) + &

                           v_mats(idim)%local_data(:, icol_local)*prefac

                        mos_next(2)%local_data(:, icol_local) = &

                           mos_next(2)%local_data(:, icol_local) + &

                           v_mats(idim)%local_data(:, icol_local + ncol_local)*prefac

                     END DO

                  END DO

               END IF

               IF (conv_norm .LT. eps_exp) THEN

                  convergence = .true.

                  narn_old = i - 1

               END IF

            END IF


            DEALLOCATE (ipivot)

            DEALLOCATE (mat1)

            DEALLOCATE (mat2)

            DEALLOCATE (mat3)

            DEALLOCATE (n)

            DEALLOCATE (d)

         END IF

         IF (convergence) EXIT


      END DO

      cpwarn_if(.NOT. convergence, "ARNOLDI method did not converge")

      !deallocate all work matrices


      CALL cp_fm_release(v_mats)

      CALL cp_fm_struct_release(newstruct)

      CALL col_group%free()


      DEALLOCATE (h_approx)

      DEALLOCATE (h_approx_save)

      DEALLOCATE (results)

      DEALLOCATE (norm1)

      DEALLOCATE (last_norm)

      CALL timestop(handle)


   END SUBROUTINE arnoldi


END MODULE matrix_exp

dgemm
static void dgemm(const char transa, const char transb, const int m, const int n, const int k, const double alpha, const double *a, const int lda, const double *b, const int ldb, const double beta, double *c, const int ldc)
Convenient wrapper to hide Fortran nature of dgemm_, swapping a and b.
Definition grid_cpu_task_list.c:206

cp_cfm_types::cp_cfm_to_cfm
Definition cp_cfm_types.F:55

cp_fm_types::cp_fm_release
Definition cp_fm_types.F:87

cp_fm_types::cp_fm_to_fm
Definition cp_fm_types.F:82

cp_log_handling::cp_to_string
Definition cp_log_handling.F:90

parallel_gemm_api::parallel_gemm
Definition parallel_gemm_api.F:38

cp_cfm_basic_linalg
Basic linear algebra operations for complex full matrices.
Definition cp_cfm_basic_linalg.F:16

cp_cfm_basic_linalg::cp_cfm_scale_and_add
subroutine, public cp_cfm_scale_and_add(alpha, matrix_a, beta, matrix_b)
Scale and add two BLACS matrices (a = alpha*a + beta*b).
Definition cp_cfm_basic_linalg.F:240

cp_cfm_basic_linalg::cp_cfm_solve
subroutine, public cp_cfm_solve(matrix_a, general_a, determinant)
Solve the system of linear equations A*b=A_general using LU decomposition. Pay attention that both ma...
Definition cp_cfm_basic_linalg.F:732

cp_cfm_types
Represents a complex full matrix distributed on many processors.
Definition cp_cfm_types.F:12

cp_cfm_types::cp_cfm_create
subroutine, public cp_cfm_create(matrix, matrix_struct, name)
Creates a new full matrix with the given structure.
Definition cp_cfm_types.F:121

cp_cfm_types::cp_cfm_release
subroutine, public cp_cfm_release(matrix)
Releases a full matrix.
Definition cp_cfm_types.F:155

cp_cfm_types::cp_cfm_set_all
subroutine, public cp_cfm_set_all(matrix, alpha, beta)
Set all elements of the full matrix to alpha. Besides, set all diagonal matrix elements to beta (if g...
Definition cp_cfm_types.F:175

cp_fm_basic_linalg
Basic linear algebra operations for full matrices.
Definition cp_fm_basic_linalg.F:14

cp_fm_basic_linalg::cp_fm_solve
subroutine, public cp_fm_solve(matrix_a, general_a)
computes the solution to A*b=A_general using LU decomposition
Definition cp_fm_basic_linalg.F:2338

cp_fm_basic_linalg::cp_fm_scale_and_add
subroutine, public cp_fm_scale_and_add(alpha, matrix_a, beta, matrix_b)
calc A <- alpha*A + beta*B optimized for alpha == 1.0 (just add beta*B) and beta == 0....
Definition cp_fm_basic_linalg.F:167

cp_fm_basic_linalg::cp_complex_fm_gemm
subroutine, public cp_complex_fm_gemm(transa, transb, m, n, k, alpha, a_re, a_im, b_re, b_im, beta, c_re, c_im, a_first_col, a_first_row, b_first_col, b_first_row, c_first_col, c_first_row)
Convenience function. Computes the matrix multiplications needed for the multiplication of complex ma...
Definition cp_fm_basic_linalg.F:2410

cp_fm_struct
represent the structure of a full matrix
Definition cp_fm_struct.F:14

cp_fm_struct::cp_fm_struct_double
subroutine, public cp_fm_struct_double(fmstruct, struct, context, col, row)
creates a struct with twice the number of blocks on each core. If matrix A has to be multiplied with ...
Definition cp_fm_struct.F:523

cp_fm_struct::cp_fm_struct_release
subroutine, public cp_fm_struct_release(fmstruct)
releases a full matrix structure
Definition cp_fm_struct.F:351

cp_fm_types
represent a full matrix distributed on many processors
Definition cp_fm_types.F:15

cp_fm_types::cp_fm_get_info
subroutine, public cp_fm_get_info(matrix, name, nrow_global, ncol_global, nrow_block, ncol_block, nrow_local, ncol_local, row_indices, col_indices, local_data, context, nrow_locals, ncol_locals, matrix_struct, para_env)
returns all kinds of information about the full matrix
Definition cp_fm_types.F:1009

cp_fm_types::cp_fm_set_all
subroutine, public cp_fm_set_all(matrix, alpha, beta)
set all elements of a matrix to the same value, and optionally the diagonal to a different one
Definition cp_fm_types.F:528

cp_fm_types::cp_fm_create
subroutine, public cp_fm_create(matrix, matrix_struct, name, use_sp)
creates a new full matrix with the given structure
Definition cp_fm_types.F:164

cp_log_handling
various routines to log and control the output. The idea is that decisions about where to log should ...
Definition cp_log_handling.F:41

kinds
Defines the basic variable types.
Definition kinds.F:23

kinds::dp
integer, parameter, public dp
Definition kinds.F:34

mathconstants
Definition of mathematical constants and functions.
Definition mathconstants.F:16

mathconstants::z_one
complex(kind=dp), parameter, public z_one
Definition mathconstants.F:143

mathconstants::one
real(kind=dp), parameter, public one
Definition mathconstants.F:123

mathconstants::zero
real(kind=dp), parameter, public zero
Definition mathconstants.F:123

mathconstants::fac
real(kind=dp), dimension(0:maxfac), parameter, public fac
Definition mathconstants.F:37

mathconstants::z_zero
complex(kind=dp), parameter, public z_zero
Definition mathconstants.F:143

matrix_exp
Routines for calculating a complex matrix exponential.
Definition matrix_exp.F:13

matrix_exp::exp_pade_real
subroutine, public exp_pade_real(exp_h, matrix, nsquare, npade)
exponential of a real matrix, calculated using pade approximation together with scaling and squaring
Definition matrix_exp.F:570

matrix_exp::get_nsquare_norder
subroutine, public get_nsquare_norder(norm, nsquare, norder, eps_exp, method, do_emd)
optimization function for pade/taylor order and number of squaring steps
Definition matrix_exp.F:244

matrix_exp::taylor_full_complex
subroutine, public taylor_full_complex(exp_h, re_part, im_part, nsquare, ntaylor)
subroutine for general complex matrix exponentials on input a separate cp_fm_type for real and comple...
Definition matrix_exp.F:165

matrix_exp::arnoldi
subroutine, public arnoldi(mos_old, mos_new, eps_exp, hre, him, mos_next, narn_old)
exponential of a complex matrix, calculated using arnoldi subspace method (directly applies to the MO...
Definition matrix_exp.F:683

matrix_exp::exp_pade_only_imaginary
subroutine, public exp_pade_only_imaginary(exp_h, im_part, nsquare, npade)
exponential of a complex matrix, calculated using pade approximation together with scaling and squari...
Definition matrix_exp.F:447

matrix_exp::taylor_only_imaginary
subroutine, public taylor_only_imaginary(exp_h, im_matrix, nsquare, ntaylor)
specialized subroutine for purely imaginary matrix exponentials
Definition matrix_exp.F:69

matrix_exp::exp_pade_full_complex
subroutine, public exp_pade_full_complex(exp_h, re_part, im_part, nsquare, npade)
exponential of a complex matrix, calculated using pade approximation together with scaling and squari...
Definition matrix_exp.F:342

message_passing
Interface to the message passing library MPI.
Definition message_passing.F:23

parallel_gemm_api
basic linear algebra operations for full matrices
Definition parallel_gemm_api.F:14

cp_cfm_types::cp_cfm_type
Represent a complex full matrix.
Definition cp_cfm_types.F:68

cp_fm_struct::cp_fm_struct_type
keeps the information about the structure of a full matrix
Definition cp_fm_struct.F:82

cp_fm_types::cp_fm_type
represent a full matrix
Definition cp_fm_types.F:113

message_passing::mp_comm_type
Definition message_passing.F:189

message_passing::mp_para_env_type
stores all the information relevant to an MPI environment
Definition message_passing.F:763