d4/d7a/library__tests_8F_source.html

!--------------------------------------------------------------------------------------------------!

!   CP2K: A general program to perform molecular dynamics simulations                              !

!   Copyright 2000-2025 CP2K developers group <https://cp2k.org>                                   !

!                                                                                                  !

!   SPDX-License-Identifier: GPL-2.0-or-later                                                      !

!--------------------------------------------------------------------------------------------------!


! **************************************************************************************************

!> \brief Performance tests for basic tasks like matrix multiplies, copy, fft.

!> \par History

!>      30-Nov-2000 (JGH) added input

!>      02-Jan-2001 (JGH) Parallel FFT

!>      28-Feb-2002 (JGH) Clebsch-Gordon Coefficients

!>      06-Jun-2003 (JGH) Real space grid test

!>      Eigensolver test (29.08.05,MK)

!> \author JGH  6-NOV-2000

! **************************************************************************************************

MODULE library_tests


   USE ai_coulomb_test,                 ONLY: eri_test

   USE cell_methods,                    ONLY: cell_create,&

                                              init_cell

   USE cell_types,                      ONLY: cell_release,&

                                              cell_type

   USE cg_test,                         ONLY: clebsch_gordon_test

   USE cp_blacs_env,                    ONLY: cp_blacs_env_create,&

                                              cp_blacs_env_release,&

                                              cp_blacs_env_type

   USE cp_dbcsr_api,                    ONLY: dbcsr_reset_randmat_seed,&

                                              dbcsr_run_tests

   USE cp_eri_mme_interface,            ONLY: cp_eri_mme_perf_acc_test

   USE cp_files,                        ONLY: close_file,&

                                              open_file

   USE cp_fm_basic_linalg,              ONLY: cp_fm_gemm

   USE cp_fm_diag,                      ONLY: cp_fm_syevd,&

                                              cp_fm_syevx

   USE cp_fm_struct,                    ONLY: cp_fm_struct_create,&

                                              cp_fm_struct_get,&

                                              cp_fm_struct_release,&

                                              cp_fm_struct_type

   USE cp_fm_types,                     ONLY: cp_fm_create,&

                                              cp_fm_pilaenv,&

                                              cp_fm_release,&

                                              cp_fm_set_all,&

                                              cp_fm_set_submatrix,&

                                              cp_fm_to_fm,&

                                              cp_fm_type

   USE cp_log_handling,                 ONLY: cp_get_default_logger,&

                                              cp_logger_type

   USE cp_output_handling,              ONLY: cp_print_key_finished_output,&

                                              cp_print_key_unit_nr

   USE cp_realspace_grid_init,          ONLY: init_input_type

   USE dbm_tests,                       ONLY: dbm_run_tests

   USE fft_tools,                       ONLY: bwfft,&

                                              fft_radix_closest,&

                                              fwfft,&

                                              fft3d,&

                                              fft_radix_operations,&

                                              finalize_fft,&

                                              init_fft

   USE global_types,                    ONLY: global_environment_type

   USE input_constants,                 ONLY: do_diag_syevd,&

                                              do_diag_syevx,&

                                              do_mat_random,&

                                              do_mat_read,&

                                              do_pwgrid_ns_fullspace,&

                                              do_pwgrid_ns_halfspace,&

                                              do_pwgrid_spherical

   USE input_section_types,             ONLY: section_vals_get,&

                                              section_vals_get_subs_vals,&

                                              section_vals_type,&

                                              section_vals_val_get

   USE kinds,                           ONLY: dp

   USE machine,                         ONLY: m_flush,&

                                              m_walltime

   USE message_passing,                 ONLY: mp_para_env_type

   USE minimax_exp,                     ONLY: validate_exp_minimax

   USE mp2_grids,                       ONLY: test_least_square_ft

   USE mp_perf_test,                    ONLY: mpi_perf_test

   USE parallel_gemm_api,               ONLY: parallel_gemm

   USE parallel_rng_types,              ONLY: uniform,&

                                              rng_stream_type

   USE pw_grid_types,                   ONLY: fullspace,&

                                              halfspace,&

                                              pw_grid_type

   USE pw_grids,                        ONLY: pw_grid_create,&

                                              pw_grid_release

   USE pw_methods,                      ONLY: pw_transfer,&

                                              pw_zero

   USE pw_types,                        ONLY: pw_c1d_gs_type,&

                                              pw_c3d_rs_type,&

                                              pw_r3d_rs_type

   USE realspace_grid_types,            ONLY: &

        realspace_grid_desc_type, realspace_grid_input_type, realspace_grid_type, rs_grid_create, &

        rs_grid_create_descriptor, rs_grid_print, rs_grid_release, rs_grid_release_descriptor, &

        rs_grid_zero, transfer_pw2rs, transfer_rs2pw

   USE shg_integrals_test,              ONLY: shg_integrals_perf_acc_test

#include "./base/base_uses.f90"


   IMPLICIT NONE


   PRIVATE

   PUBLIC :: lib_test


   INTEGER                  :: runtest(100)

   REAL(KIND=dp)           :: max_memory

   REAL(KIND=dp), PARAMETER :: threshold = 1.0e-8_dp

   CHARACTER(len=*), PARAMETER, PRIVATE :: moduleN = 'library_tests'


CONTAINS


! **************************************************************************************************

!> \brief Master routine for tests

!> \param root_section ...

!> \param para_env ...

!> \param globenv ...

!> \par History

!>      none

!> \author JGH  6-NOV-2000

! **************************************************************************************************


   SUBROUTINE lib_test(root_section, para_env, globenv)


      TYPE(section_vals_type), POINTER                   :: root_section

      TYPE(mp_para_env_type), POINTER                    :: para_env

      TYPE(global_environment_type), POINTER             :: globenv


      CHARACTER(LEN=*), PARAMETER                        :: routinen = 'lib_test'


      INTEGER                                            :: handle, iw

      LOGICAL                                            :: explicit

      TYPE(cp_logger_type), POINTER                      :: logger

      TYPE(section_vals_type), POINTER :: cp_dbcsr_test_section, cp_fm_gemm_test_section, &

         dbm_test_section, eigensolver_section, eri_mme_test_section, pw_transfer_section, &

         rs_pw_transfer_section, shg_integrals_test_section


      CALL timeset(routinen, handle)


      logger => cp_get_default_logger()

      iw = cp_print_key_unit_nr(logger, root_section, "TEST%PROGRAM_RUN_INFO", extension=".log")


      IF (iw > 0) THEN

         WRITE (iw, '(T2,79("*"))')

         WRITE (iw, '(A,T31,A,T80,A)') ' *', ' PERFORMANCE TESTS ', '*'

         WRITE (iw, '(T2,79("*"))')

      END IF

      !

      CALL test_input(root_section, para_env)

      !

      IF (runtest(1) /= 0) CALL copy_test(para_env, iw)

      !

      IF (runtest(2) /= 0) CALL matmul_test(para_env, test_matmul=.true., test_dgemm=.false., iw=iw)

      IF (runtest(5) /= 0) CALL matmul_test(para_env, test_matmul=.false., test_dgemm=.true., iw=iw)

      !

      IF (runtest(3) /= 0) CALL fft_test(para_env, iw, globenv%fftw_plan_type, &

                                         globenv%fftw_wisdom_file_name)

      !

      IF (runtest(4) /= 0) CALL eri_test(iw)

      !

      IF (runtest(6) /= 0) CALL clebsch_gordon_test()

      !

      ! runtest 7 has been deleted and can be recycled

      !

      IF (runtest(8) /= 0) CALL mpi_perf_test(para_env, runtest(8), iw)

      !

      IF (runtest(10) /= 0) CALL validate_exp_minimax(runtest(10), iw)

      !

      IF (runtest(11) /= 0) CALL test_least_square_ft(runtest(11), iw)

      !


      rs_pw_transfer_section => section_vals_get_subs_vals(root_section, "TEST%RS_PW_TRANSFER")

      CALL section_vals_get(rs_pw_transfer_section, explicit=explicit)

      IF (explicit) THEN

         CALL rs_pw_transfer_test(para_env, iw, globenv, rs_pw_transfer_section)

      END IF


      pw_transfer_section => section_vals_get_subs_vals(root_section, "TEST%PW_TRANSFER")

      CALL section_vals_get(pw_transfer_section, explicit=explicit)

      IF (explicit) THEN

         CALL pw_fft_test(para_env, iw, globenv, pw_transfer_section)

      END IF


      cp_fm_gemm_test_section => section_vals_get_subs_vals(root_section, "TEST%CP_FM_GEMM")

      CALL section_vals_get(cp_fm_gemm_test_section, explicit=explicit)

      IF (explicit) THEN

         CALL cp_fm_gemm_test(para_env, iw, cp_fm_gemm_test_section)

      END IF


      eigensolver_section => section_vals_get_subs_vals(root_section, "TEST%EIGENSOLVER")

      CALL section_vals_get(eigensolver_section, explicit=explicit)

      IF (explicit) THEN

         CALL eigensolver_test(para_env, iw, eigensolver_section)

      END IF


      eri_mme_test_section => section_vals_get_subs_vals(root_section, "TEST%ERI_MME_TEST")

      CALL section_vals_get(eri_mme_test_section, explicit=explicit)

      IF (explicit) THEN

         CALL cp_eri_mme_perf_acc_test(para_env, iw, eri_mme_test_section)

      END IF


      shg_integrals_test_section => section_vals_get_subs_vals(root_section, "TEST%SHG_INTEGRALS_TEST")

      CALL section_vals_get(shg_integrals_test_section, explicit=explicit)

      IF (explicit) THEN

         CALL shg_integrals_perf_acc_test(iw, shg_integrals_test_section)

      END IF


      ! DBCSR tests

      cp_dbcsr_test_section => section_vals_get_subs_vals(root_section, "TEST%CP_DBCSR")

      CALL section_vals_get(cp_dbcsr_test_section, explicit=explicit)

      IF (explicit) THEN

         CALL cp_dbcsr_tests(para_env, iw, cp_dbcsr_test_section)

      END IF


      ! DBM tests

      dbm_test_section => section_vals_get_subs_vals(root_section, "TEST%DBM")

      CALL section_vals_get(dbm_test_section, explicit=explicit)

      IF (explicit) THEN

         CALL run_dbm_tests(para_env, iw, dbm_test_section)

      END IF


      CALL cp_print_key_finished_output(iw, logger, root_section, "TEST%PROGRAM_RUN_INFO")


      CALL timestop(handle)


   END SUBROUTINE lib_test


! **************************************************************************************************

!> \brief Reads input section &TEST ... &END

!> \param root_section ...

!> \param para_env ...

!> \author JGH 30-NOV-2000

!> \note

!> I---------------------------------------------------------------------------I

!> I SECTION: &TEST ... &END                                                   I

!> I                                                                           I

!> I    MEMORY   max_memory                                                    I

!> I    COPY     n                                                             I

!> I    MATMUL   n                                                             I

!> I    FFT      n                                                             I

!> I    ERI      n                                                             I

!> I    PW_FFT   n                                                             I

!> I    Clebsch-Gordon n                                                       I

!> I    RS_GRIDS n                                                             I

!> I    MPI      n                                                             I

!> I    RNG      n             -> Parallel random number generator             I

!> I---------------------------------------------------------------------------I

! **************************************************************************************************

   SUBROUTINE test_input(root_section, para_env)

      TYPE(section_vals_type), POINTER                   :: root_section

      TYPE(mp_para_env_type), POINTER                    :: para_env


      TYPE(section_vals_type), POINTER                   :: test_section


!

!..defaults

! using this style is not recommended, introduce sections instead (see e.g. cp_fm_gemm)


      runtest = 0

      test_section => section_vals_get_subs_vals(root_section, "TEST")

      CALL section_vals_val_get(test_section, "MEMORY", r_val=max_memory)

      CALL section_vals_val_get(test_section, 'COPY', i_val=runtest(1))

      CALL section_vals_val_get(test_section, 'MATMUL', i_val=runtest(2))

      CALL section_vals_val_get(test_section, 'DGEMM', i_val=runtest(5))

      CALL section_vals_val_get(test_section, 'FFT', i_val=runtest(3))

      CALL section_vals_val_get(test_section, 'ERI', i_val=runtest(4))

      CALL section_vals_val_get(test_section, 'CLEBSCH_GORDON', i_val=runtest(6))

      CALL section_vals_val_get(test_section, 'MPI', i_val=runtest(8))

      CALL section_vals_val_get(test_section, 'MINIMAX', i_val=runtest(10))

      CALL section_vals_val_get(test_section, 'LEAST_SQ_FT', i_val=runtest(11))


      CALL para_env%sync()

   END SUBROUTINE test_input


! **************************************************************************************************

!> \brief Tests the performance to copy two vectors.

!> \param para_env ...

!> \param iw ...

!> \par History

!>      none

!> \author JGH  6-NOV-2000

!> \note

!>      The results of these tests allow to determine the size of the cache

!>      of the CPU. This can be used to optimize the performance of the

!>      FFTSG library.

! **************************************************************************************************

   SUBROUTINE copy_test(para_env, iw)

      TYPE(mp_para_env_type), POINTER                    :: para_env

      INTEGER                                            :: iw


      INTEGER                                            :: i, ierr, j, len, ntim, siz

      REAL(kind=dp)                                      :: perf, t, tend, tstart

      REAL(kind=dp), ALLOCATABLE, DIMENSION(:)           :: ca, cb


! test for copy --> Cache size


      siz = abs(runtest(1))

      IF (para_env%is_source()) WRITE (iw, '(//,A,/)') " Test of copy ( F95 ) "

      DO i = 6, 24

         len = 2**i

         IF (8.0_dp*real(len, kind=dp) > max_memory*0.5_dp) EXIT

         ALLOCATE (ca(len), stat=ierr)

         IF (ierr /= 0) EXIT

         ALLOCATE (cb(len), stat=ierr)

         IF (ierr /= 0) EXIT


         CALL random_number(ca)

         ntim = nint(1.e7_dp/real(len, kind=dp))

         ntim = max(ntim, 1)

         ntim = min(ntim, siz*10000)


         tstart = m_walltime()

         DO j = 1, ntim

            cb(:) = ca(:)

            ca(1) = real(j, kind=dp)

         END DO

         tend = m_walltime()

         t = tend - tstart + threshold

         IF (t > 0.0_dp) THEN

            perf = real(ntim, kind=dp)*real(len, kind=dp)*1.e-6_dp/t

         ELSE

            perf = 0.0_dp

         END IF


         IF (para_env%is_source()) THEN

            WRITE (iw, '(A,i2,i10,A,T59,F14.4,A)') " Copy test:   Size = 2^", i, &

               len/1024, " Kwords", perf, " Mcopy/s"

         END IF


         DEALLOCATE (ca)

         DEALLOCATE (cb)

      END DO

      CALL para_env%sync()

   END SUBROUTINE copy_test


! **************************************************************************************************

!> \brief Tests the performance of different kinds of matrix matrix multiply

!>      kernels for the BLAS and F95 intrinsic matmul.

!> \param para_env ...

!> \param test_matmul ...

!> \param test_dgemm ...

!> \param iw ...

!> \par History

!>      none

!> \author JGH  6-NOV-2000

! **************************************************************************************************

   SUBROUTINE matmul_test(para_env, test_matmul, test_dgemm, iw)

      TYPE(mp_para_env_type), POINTER                    :: para_env

      LOGICAL                                            :: test_matmul, test_dgemm

      INTEGER                                            :: iw


      INTEGER                                            :: i, ierr, j, len, ntim, siz

      REAL(kind=dp)                                      :: perf, t, tend, tstart, xdum

      REAL(kind=dp), ALLOCATABLE, DIMENSION(:, :)        :: ma, mb, mc


! test for matrix multpies


      IF (test_matmul) THEN

         siz = abs(runtest(2))

         IF (para_env%is_source()) WRITE (iw, '(//,A,/)') " Test of matmul ( F95 ) "

         DO i = 5, siz, 2

            len = 2**i + 1

            IF (8.0_dp*real(len*len, kind=dp) > max_memory*0.3_dp) EXIT

            ALLOCATE (ma(len, len), stat=ierr)

            IF (ierr /= 0) EXIT

            ALLOCATE (mb(len, len), stat=ierr)

            IF (ierr /= 0) EXIT

            ALLOCATE (mc(len, len), stat=ierr)

            IF (ierr /= 0) EXIT

            mc = 0.0_dp


            CALL random_number(xdum)

            ma = xdum

            CALL random_number(xdum)

            mb = xdum

            ntim = nint(1.e8_dp/(2.0_dp*real(len, kind=dp)**3))

            ntim = max(ntim, 1)

            ntim = min(ntim, siz*200)

            tstart = m_walltime()

            DO j = 1, ntim

               mc(:, :) = matmul(ma, mb)

               ma(1, 1) = real(j, kind=dp)

            END DO

            tend = m_walltime()

            t = tend - tstart + threshold

            perf = real(ntim, kind=dp)*2.0_dp*real(len, kind=dp)**3*1.e-6_dp/t

            IF (para_env%is_source()) THEN

               WRITE (iw, '(A,i6,T59,F14.4,A)') &

                  " Matrix multiply test: c = a * b         Size = ", len, perf, " Mflop/s"

            END IF

            tstart = m_walltime()

            DO j = 1, ntim

               mc(:, :) = mc + matmul(ma, mb)

               ma(1, 1) = real(j, kind=dp)

            END DO

            tend = m_walltime()

            t = tend - tstart + threshold

            IF (t > 0.0_dp) THEN

               perf = real(ntim, kind=dp)*2.0_dp*real(len, kind=dp)**3*1.e-6_dp/t

            ELSE

               perf = 0.0_dp

            END IF


            IF (para_env%is_source()) THEN

               WRITE (iw, '(A,i6,T59,F14.4,A)') &

                  " Matrix multiply test: a = a * b         Size = ", len, perf, " Mflop/s"

            END IF


            tstart = m_walltime()

            DO j = 1, ntim

               mc(:, :) = mc + matmul(ma, transpose(mb))

               ma(1, 1) = real(j, kind=dp)

            END DO

            tend = m_walltime()

            t = tend - tstart + threshold

            IF (t > 0.0_dp) THEN

               perf = real(ntim, kind=dp)*2.0_dp*real(len, kind=dp)**3*1.e-6_dp/t

            ELSE

               perf = 0.0_dp

            END IF


            IF (para_env%is_source()) THEN

               WRITE (iw, '(A,i6,T59,F14.4,A)') &

                  " Matrix multiply test: c = a * b(T)      Size = ", len, perf, " Mflop/s"

            END IF


            tstart = m_walltime()

            DO j = 1, ntim

               mc(:, :) = mc + matmul(transpose(ma), mb)

               ma(1, 1) = real(j, kind=dp)

            END DO

            tend = m_walltime()

            t = tend - tstart + threshold

            IF (t > 0.0_dp) THEN

               perf = real(ntim, kind=dp)*2.0_dp*real(len, kind=dp)**3*1.e-6_dp/t

            ELSE

               perf = 0.0_dp

            END IF


            IF (para_env%is_source()) THEN

               WRITE (iw, '(A,i6,T59,F14.4,A)') &

                  " Matrix multiply test: c = a(T) * b      Size = ", len, perf, " Mflop/s"

            END IF


            DEALLOCATE (ma)

            DEALLOCATE (mb)

            DEALLOCATE (mc)

         END DO

      END IF


      ! test for matrix multpies

      IF (test_dgemm) THEN

         siz = abs(runtest(5))

         IF (para_env%is_source()) WRITE (iw, '(//,A,/)') " Test of matmul ( BLAS ) "

         DO i = 5, siz, 2

            len = 2**i + 1

            IF (8.0_dp*real(len*len, kind=dp) > max_memory*0.3_dp) EXIT

            ALLOCATE (ma(len, len), stat=ierr)

            IF (ierr /= 0) EXIT

            ALLOCATE (mb(len, len), stat=ierr)

            IF (ierr /= 0) EXIT

            ALLOCATE (mc(len, len), stat=ierr)

            IF (ierr /= 0) EXIT

            mc = 0.0_dp


            CALL random_number(xdum)

            ma = xdum

            CALL random_number(xdum)

            mb = xdum

            ntim = nint(1.e8_dp/(2.0_dp*real(len, kind=dp)**3))

            ntim = max(ntim, 1)

            ntim = min(ntim, 1000)


            tstart = m_walltime()

            DO j = 1, ntim

               CALL dgemm("N", "N", len, len, len, 1.0_dp, ma, len, mb, len, 1.0_dp, mc, len)

            END DO

            tend = m_walltime()

            t = tend - tstart + threshold

            IF (t > 0.0_dp) THEN

               perf = real(ntim, kind=dp)*2.0_dp*real(len, kind=dp)**3*1.e-6_dp/t

            ELSE

               perf = 0.0_dp

            END IF


            IF (para_env%is_source()) THEN

               WRITE (iw, '(A,i6,T59,F14.4,A)') &

                  " Matrix multiply test: c = a * b         Size = ", len, perf, " Mflop/s"

            END IF


            tstart = m_walltime()

            DO j = 1, ntim

               CALL dgemm("N", "N", len, len, len, 1.0_dp, ma, len, mb, len, 1.0_dp, mc, len)

            END DO

            tend = m_walltime()

            t = tend - tstart + threshold

            IF (t > 0.0_dp) THEN

               perf = real(ntim, kind=dp)*2.0_dp*real(len, kind=dp)**3*1.e-6_dp/t

            ELSE

               perf = 0.0_dp

            END IF


            IF (para_env%is_source()) THEN

               WRITE (iw, '(A,i6,T59,F14.4,A)') &

                  " Matrix multiply test: a = a * b         Size = ", len, perf, " Mflop/s"

            END IF


            tstart = m_walltime()

            DO j = 1, ntim

               CALL dgemm("N", "T", len, len, len, 1.0_dp, ma, len, mb, len, 1.0_dp, mc, len)

            END DO

            tend = m_walltime()

            t = tend - tstart + threshold

            IF (t > 0.0_dp) THEN

               perf = real(ntim, kind=dp)*2.0_dp*real(len, kind=dp)**3*1.e-6_dp/t

            ELSE

               perf = 0.0_dp

            END IF


            IF (para_env%is_source()) THEN

               WRITE (iw, '(A,i6,T59,F14.4,A)') &

                  " Matrix multiply test: c = a * b(T)      Size = ", len, perf, " Mflop/s"

            END IF


            tstart = m_walltime()

            DO j = 1, ntim

               CALL dgemm("T", "N", len, len, len, 1.0_dp, ma, len, mb, len, 1.0_dp, mc, len)

            END DO

            tend = m_walltime()

            t = tend - tstart + threshold

            IF (t > 0.0_dp) THEN

               perf = real(ntim, kind=dp)*2.0_dp*real(len, kind=dp)**3*1.e-6_dp/t

            ELSE

               perf = 0.0_dp

            END IF


            IF (para_env%is_source()) THEN

               WRITE (iw, '(A,i6,T59,F14.4,A)') &

                  " Matrix multiply test: c = a(T) * b      Size = ", len, perf, " Mflop/s"

            END IF


            DEALLOCATE (ma)

            DEALLOCATE (mb)

            DEALLOCATE (mc)

         END DO

      END IF


      CALL para_env%sync()


   END SUBROUTINE matmul_test


! **************************************************************************************************

!> \brief Tests the performance of all available FFT libraries for 3D FFTs

!> \param para_env ...

!> \param iw ...

!> \param fftw_plan_type ...

!> \param wisdom_file where FFTW3 should look to save/load wisdom

!> \par History

!>      none

!> \author JGH  6-NOV-2000

! **************************************************************************************************

   SUBROUTINE fft_test(para_env, iw, fftw_plan_type, wisdom_file)


      TYPE(mp_para_env_type), POINTER                    :: para_env

      INTEGER                                            :: iw, fftw_plan_type

      CHARACTER(LEN=*), INTENT(IN)                       :: wisdom_file


      INTEGER, PARAMETER                                 :: ndate(3) = (/12, 48, 96/)


      INTEGER                                            :: iall, ierr, it, j, len, n(3), ntim, &

                                                            radix_in, radix_out, siz, stat

      COMPLEX(KIND=dp), DIMENSION(4, 4, 4)               :: zz

      COMPLEX(KIND=dp), ALLOCATABLE, DIMENSION(:, :, :)  :: ca, cb, cc

      CHARACTER(LEN=7)                                   :: method

      REAL(kind=dp)                                      :: flops, perf, scale, t, tdiff, tend, &

                                                            tstart

      REAL(kind=dp), ALLOCATABLE, DIMENSION(:, :, :)     :: ra


! test for 3d FFT


      IF (para_env%is_source()) WRITE (iw, '(//,A,/)') " Test of 3D-FFT "

      siz = abs(runtest(3))


      DO iall = 1, 100

         SELECT CASE (iall)

         CASE DEFAULT

            EXIT

         CASE (1)

            CALL init_fft("FFTSG", alltoall=.false., fftsg_sizes=.true., wisdom_file=wisdom_file, &

                          pool_limit=10, plan_style=fftw_plan_type)

            method = "FFTSG  "

         CASE (2)

            cycle

         CASE (3)

            CALL init_fft("FFTW3", alltoall=.false., fftsg_sizes=.true., wisdom_file=wisdom_file, &

                          pool_limit=10, plan_style=fftw_plan_type)

            method = "FFTW3  "

         END SELECT

         n = 4

         zz = 0.0_dp

         CALL fft3d(fwfft, n, zz, status=stat)

         IF (stat == 0) THEN

            DO it = 1, 3

               radix_in = ndate(it)

               CALL fft_radix_operations(radix_in, radix_out, fft_radix_closest)

               len = radix_out

               n = len

               IF (16.0_dp*real(len*len*len, kind=dp) > max_memory*0.5_dp) EXIT

               ALLOCATE (ra(len, len, len), stat=ierr)

               ALLOCATE (ca(len, len, len), stat=ierr)

               CALL random_number(ra)

               ca(:, :, :) = ra

               CALL random_number(ra)

               ca(:, :, :) = ca + cmplx(0.0_dp, 1.0_dp, kind=dp)*ra

               flops = real(len**3, kind=dp)*15.0_dp*log(real(len, kind=dp))

               ntim = nint(siz*1.e7_dp/flops)

               ntim = max(ntim, 1)

               ntim = min(ntim, 200)

               scale = 1.0_dp/real(len**3, kind=dp)

               tstart = m_walltime()

               DO j = 1, ntim

                  CALL fft3d(fwfft, n, ca)

                  CALL fft3d(bwfft, n, ca)

               END DO

               tend = m_walltime()

               t = tend - tstart + threshold

               IF (t > 0.0_dp) THEN

                  perf = real(ntim, kind=dp)*2.0_dp*flops*1.e-6_dp/t

               ELSE

                  perf = 0.0_dp

               END IF


               IF (para_env%is_source()) THEN

                  WRITE (iw, '(T2,A,A,i6,T59,F14.4,A)') &

                     adjustr(method), " test (in-place)    Size = ", len, perf, " Mflop/s"

               END IF

               DEALLOCATE (ca)

               DEALLOCATE (ra)

            END DO

            IF (para_env%is_source()) WRITE (iw, *)

            ! test if input data is preserved

            len = 24

            n = len

            ALLOCATE (ra(len, len, len))

            ALLOCATE (ca(len, len, len))

            ALLOCATE (cb(len, len, len))

            ALLOCATE (cc(len, len, len))

            CALL random_number(ra)

            ca(:, :, :) = ra

            CALL random_number(ra)

            ca(:, :, :) = ca + cmplx(0.0_dp, 1.0_dp, kind=dp)*ra

            cc(:, :, :) = ca

            CALL fft3d(fwfft, n, ca, cb)

            tdiff = maxval(abs(ca - cc))

            IF (tdiff > 1.0e-12_dp) THEN

               IF (para_env%is_source()) &

                  WRITE (iw, '(T2,A,A,A)') adjustr(method), "         FWFFT ", &

                  "             Input array is changed in out-of-place FFT !"

            ELSE

               IF (para_env%is_source()) &

                  WRITE (iw, '(T2,A,A,A)') adjustr(method), "         FWFFT ", &

                  "         Input array is not changed in out-of-place FFT !"

            END IF

            ca(:, :, :) = cc

            CALL fft3d(bwfft, n, ca, cb)

            tdiff = maxval(abs(ca - cc))

            IF (tdiff > 1.0e-12_dp) THEN

               IF (para_env%is_source()) &

                  WRITE (iw, '(T2,A,A,A)') adjustr(method), "         BWFFT ", &

                  "             Input array is changed in out-of-place FFT !"

            ELSE

               IF (para_env%is_source()) &

                  WRITE (iw, '(T2,A,A,A)') adjustr(method), "         BWFFT ", &

                  "         Input array is not changed in out-of-place FFT !"

            END IF

            IF (para_env%is_source()) WRITE (iw, *)


            DEALLOCATE (ra)

            DEALLOCATE (ca)

            DEALLOCATE (cb)

            DEALLOCATE (cc)

         END IF

         CALL finalize_fft(para_env, wisdom_file=wisdom_file)

      END DO


   END SUBROUTINE fft_test


! **************************************************************************************************

!> \brief   test rs_pw_transfer performance

!> \param para_env ...

!> \param iw ...

!> \param globenv ...

!> \param rs_pw_transfer_section ...

!> \author  Joost VandeVondele

!>      9.2008 Randomise rs grid [Iain Bethune]

!>      (c) The Numerical Algorithms Group (NAG) Ltd, 2008 on behalf of the HECToR project

! **************************************************************************************************

   SUBROUTINE rs_pw_transfer_test(para_env, iw, globenv, rs_pw_transfer_section)


      TYPE(mp_para_env_type), POINTER                    :: para_env

      INTEGER                                            :: iw

      TYPE(global_environment_type), POINTER             :: globenv

      TYPE(section_vals_type), POINTER                   :: rs_pw_transfer_section


      CHARACTER(LEN=*), PARAMETER :: routinen = 'rs_pw_transfer_test'


      INTEGER                                            :: halo_size, handle, i_loop, n_loop, ns_max

      INTEGER, DIMENSION(3)                              :: no, np

      INTEGER, DIMENSION(:), POINTER                     :: i_vals

      LOGICAL                                            :: do_rs2pw

      REAL(kind=dp)                                      :: tend, tstart

      TYPE(cell_type), POINTER                           :: box

      TYPE(pw_grid_type), POINTER                        :: grid

      TYPE(pw_r3d_rs_type)                               :: ca

      TYPE(realspace_grid_desc_type), POINTER            :: rs_desc

      TYPE(realspace_grid_input_type)                    :: input_settings

      TYPE(realspace_grid_type)                          :: rs_grid

      TYPE(section_vals_type), POINTER                   :: rs_grid_section


      CALL timeset(routinen, handle)


      !..set fft lib

      CALL init_fft(globenv%default_fft_library, alltoall=.false., fftsg_sizes=.true., &

                    pool_limit=globenv%fft_pool_scratch_limit, &

                    wisdom_file=globenv%fftw_wisdom_file_name, &

                    plan_style=globenv%fftw_plan_type)


      ! .. set cell (should otherwise be irrelevant)

      NULLIFY (box)

      CALL cell_create(box)

      box%hmat = reshape((/20.0_dp, 0.0_dp, 0.0_dp, 0.0_dp, 20.0_dp, 0.0_dp, &

                           0.0_dp, 0.0_dp, 20.0_dp/), (/3, 3/))

      CALL init_cell(box)


      ! .. grid type and pw_grid

      NULLIFY (grid)

      CALL section_vals_val_get(rs_pw_transfer_section, "GRID", i_vals=i_vals)

      np = i_vals

      CALL pw_grid_create(grid, para_env, box%hmat, grid_span=fullspace, npts=np, fft_usage=.true., iounit=iw)

      no = grid%npts


      CALL ca%create(grid)

      CALL pw_zero(ca)


      ! .. rs input setting type

      CALL section_vals_val_get(rs_pw_transfer_section, "HALO_SIZE", i_val=halo_size)

      rs_grid_section => section_vals_get_subs_vals(rs_pw_transfer_section, "RS_GRID")

      ns_max = 2*halo_size + 1

      CALL init_input_type(input_settings, ns_max, rs_grid_section, 1, (/-1, -1, -1/))


      ! .. rs type

      NULLIFY (rs_desc)

      CALL rs_grid_create_descriptor(rs_desc, pw_grid=grid, input_settings=input_settings)

      CALL rs_grid_create(rs_grid, rs_desc)

      CALL rs_grid_print(rs_grid, iw)

      CALL rs_grid_zero(rs_grid)


      ! Put random values on the grid, so summation check will pick up errors

      CALL random_number(rs_grid%r)


      CALL section_vals_val_get(rs_pw_transfer_section, "N_loop", i_val=n_loop)

      CALL section_vals_val_get(rs_pw_transfer_section, "RS2PW", l_val=do_rs2pw)


      ! go for the real loops, sync to get max timings

      IF (para_env%is_source()) THEN

         WRITE (iw, '(T2,A)') ""

         WRITE (iw, '(T2,A)') "Timing rs_pw_transfer routine"

         WRITE (iw, '(T2,A)') ""

         WRITE (iw, '(T2,A)') "iteration      time[s]"

      END IF

      DO i_loop = 1, n_loop

         CALL para_env%sync()

         tstart = m_walltime()

         IF (do_rs2pw) THEN

            CALL transfer_rs2pw(rs_grid, ca)

         ELSE

            CALL transfer_pw2rs(rs_grid, ca)

         END IF

         CALL para_env%sync()

         tend = m_walltime()

         IF (para_env%is_source()) THEN

            WRITE (iw, '(T2,I9,1X,F12.6)') i_loop, tend - tstart

         END IF

      END DO


      !cleanup

      CALL rs_grid_release(rs_grid)

      CALL rs_grid_release_descriptor(rs_desc)

      CALL ca%release()

      CALL pw_grid_release(grid)

      CALL cell_release(box)

      CALL finalize_fft(para_env, wisdom_file=globenv%fftw_wisdom_file_name)


      CALL timestop(handle)


   END SUBROUTINE rs_pw_transfer_test


! **************************************************************************************************

!> \brief Tests the performance of PW calls to FFT routines

!> \param para_env ...

!> \param iw ...

!> \param globenv ...

!> \param pw_transfer_section ...

!> \par History

!>      JGH  6-Feb-2001 : Test and performance code

!>      Made input sensitive [Joost VandeVondele]

!> \author JGH  1-JAN-2001

! **************************************************************************************************

   SUBROUTINE pw_fft_test(para_env, iw, globenv, pw_transfer_section)


      TYPE(mp_para_env_type), POINTER                    :: para_env

      INTEGER                                            :: iw

      TYPE(global_environment_type), POINTER             :: globenv

      TYPE(section_vals_type), POINTER                   :: pw_transfer_section


      REAL(kind=dp), PARAMETER                           :: toler = 1.e-11_dp


      INTEGER                                            :: blocked_id, grid_span, i_layout, i_rep, &

                                                            ig, ip, itmp, n_loop, n_rep, nn, p, q

      INTEGER, ALLOCATABLE, DIMENSION(:, :)              :: layouts

      INTEGER, DIMENSION(2)                              :: distribution_layout

      INTEGER, DIMENSION(3)                              :: no, np

      INTEGER, DIMENSION(:), POINTER                     :: i_vals

      LOGICAL                                            :: debug, is_fullspace, odd, &

                                                            pw_grid_layout_all, spherical

      REAL(kind=dp)                                      :: em, et, flops, gsq, perf, t, t_max, &

                                                            t_min, tend, tstart

      REAL(kind=dp), ALLOCATABLE, DIMENSION(:)           :: t_end, t_start

      TYPE(cell_type), POINTER                           :: box

      TYPE(pw_c1d_gs_type)                               :: ca, cc

      TYPE(pw_c3d_rs_type)                               :: cb

      TYPE(pw_grid_type), POINTER                        :: grid


!..set fft lib


      CALL init_fft(globenv%default_fft_library, alltoall=.false., fftsg_sizes=.true., &

                    pool_limit=globenv%fft_pool_scratch_limit, &

                    wisdom_file=globenv%fftw_wisdom_file_name, &

                    plan_style=globenv%fftw_plan_type)


      !..the unit cell (should not really matter, the number of grid points do)

      NULLIFY (box, grid)

      CALL cell_create(box)

      box%hmat = reshape((/10.0_dp, 0.0_dp, 0.0_dp, 0.0_dp, 8.0_dp, 0.0_dp, &

                           0.0_dp, 0.0_dp, 7.0_dp/), (/3, 3/))

      CALL init_cell(box)


      CALL section_vals_get(pw_transfer_section, n_repetition=n_rep)

      DO i_rep = 1, n_rep


         ! how often should we do the transfer

         CALL section_vals_val_get(pw_transfer_section, "N_loop", i_rep_section=i_rep, i_val=n_loop)

         ALLOCATE (t_start(n_loop))

         ALLOCATE (t_end(n_loop))


         ! setup of the grids

         CALL section_vals_val_get(pw_transfer_section, "GRID", i_rep_section=i_rep, i_vals=i_vals)

         np = i_vals


         CALL section_vals_val_get(pw_transfer_section, "PW_GRID_BLOCKED", i_rep_section=i_rep, i_val=blocked_id)

         CALL section_vals_val_get(pw_transfer_section, "DEBUG", i_rep_section=i_rep, l_val=debug)


         CALL section_vals_val_get(pw_transfer_section, "PW_GRID_LAYOUT_ALL", i_rep_section=i_rep, &

                                   l_val=pw_grid_layout_all)


         ! prepare to loop over all or a specific layout

         IF (pw_grid_layout_all) THEN

            ! count layouts that fit

            itmp = 0

            ! start from 2, (/1,para_env%num_pe/) is not supported

            DO p = 2, para_env%num_pe

               q = para_env%num_pe/p

               IF (p*q == para_env%num_pe) THEN

                  itmp = itmp + 1

               END IF

            END DO

            ! build list

            ALLOCATE (layouts(2, itmp))

            itmp = 0

            DO p = 2, para_env%num_pe

               q = para_env%num_pe/p

               IF (p*q == para_env%num_pe) THEN

                  itmp = itmp + 1

                  layouts(:, itmp) = (/p, q/)

               END IF

            END DO

         ELSE

            CALL section_vals_val_get(pw_transfer_section, "PW_GRID_LAYOUT", i_rep_section=i_rep, i_vals=i_vals)

            ALLOCATE (layouts(2, 1))

            layouts(:, 1) = i_vals

         END IF


         DO i_layout = 1, SIZE(layouts, 2)


            distribution_layout = layouts(:, i_layout)


            CALL section_vals_val_get(pw_transfer_section, "PW_GRID", i_rep_section=i_rep, i_val=itmp)


            ! from cp_control_utils

            SELECT CASE (itmp)

            CASE (do_pwgrid_spherical)

               spherical = .true.

               is_fullspace = .false.

            CASE (do_pwgrid_ns_fullspace)

               spherical = .false.

               is_fullspace = .true.

            CASE (do_pwgrid_ns_halfspace)

               spherical = .false.

               is_fullspace = .false.

            END SELECT


            ! from pw_env_methods

            IF (spherical) THEN

               grid_span = halfspace

               spherical = .true.

               odd = .true.

            ELSE IF (is_fullspace) THEN

               grid_span = fullspace

               spherical = .false.

               odd = .false.

            ELSE

               grid_span = halfspace

               spherical = .false.

               odd = .true.

            END IF


            ! actual setup

            CALL pw_grid_create(grid, para_env, box%hmat, grid_span=grid_span, odd=odd, spherical=spherical, &

                                blocked=blocked_id, npts=np, fft_usage=.true., &

                                rs_dims=distribution_layout, iounit=iw)


            IF (iw > 0) CALL m_flush(iw)


            ! note that the number of grid points might be different from what the user requested (fft-able needed)

            no = grid%npts


            CALL ca%create(grid)

            CALL cb%create(grid)

            CALL cc%create(grid)


            ! initialize data

            CALL pw_zero(ca)

            CALL pw_zero(cb)

            CALL pw_zero(cc)

            nn = SIZE(ca%array)

            DO ig = 1, nn

               gsq = grid%gsq(ig)

               ca%array(ig) = exp(-gsq)

            END DO


            flops = product(no)*30.0_dp*log(real(maxval(no), kind=dp))

            tstart = m_walltime()

            DO ip = 1, n_loop

               CALL para_env%sync()

               t_start(ip) = m_walltime()

               CALL pw_transfer(ca, cb, debug)

               CALL pw_transfer(cb, cc, debug)

               CALL para_env%sync()

               t_end(ip) = m_walltime()

            END DO

            tend = m_walltime()

            t = tend - tstart + threshold

            IF (t > 0.0_dp) THEN

               perf = real(n_loop, kind=dp)*2.0_dp*flops*1.e-6_dp/t

            ELSE

               perf = 0.0_dp

            END IF


            em = maxval(abs(ca%array(:) - cc%array(:)))

            CALL para_env%max(em)

            et = sum(abs(ca%array(:) - cc%array(:)))

            CALL para_env%sum(et)

            t_min = minval(t_end - t_start)

            t_max = maxval(t_end - t_start)


            IF (para_env%is_source()) THEN

               WRITE (iw, *)

               WRITE (iw, '(A,T67,E14.6)') " Parallel FFT Tests: Maximal Error ", em

               WRITE (iw, '(A,T67,E14.6)') " Parallel FFT Tests: Total Error ", et

               WRITE (iw, '(A,T67,F14.0)') &

                  " Parallel FFT Tests: Performance [Mflops] ", perf

               WRITE (iw, '(A,T67,F14.6)') " Best time : ", t_min

               WRITE (iw, '(A,T67,F14.6)') " Worst time: ", t_max

               IF (iw > 0) CALL m_flush(iw)

            END IF


            ! need debugging ???

            IF (em > toler .OR. et > toler) THEN

               cpwarn("The FFT results are not accurate ... starting debug pw_transfer")

               CALL pw_transfer(ca, cb, .true.)

               CALL pw_transfer(cb, cc, .true.)

            END IF


            ! done with these grids

            CALL ca%release()

            CALL cb%release()

            CALL cc%release()

            CALL pw_grid_release(grid)


         END DO


         ! local arrays

         DEALLOCATE (layouts)

         DEALLOCATE (t_start)

         DEALLOCATE (t_end)


      END DO


      ! cleanup

      CALL cell_release(box)

      CALL finalize_fft(para_env, wisdom_file=globenv%fftw_wisdom_file_name)


   END SUBROUTINE pw_fft_test


! **************************************************************************************************

!> \brief Tests the eigensolver library routines

!> \param para_env ...

!> \param iw ...

!> \param eigensolver_section ...

!> \par History

!>      JGH  6-Feb-2001 : Test and performance code

!> \author JGH  1-JAN-2001

! **************************************************************************************************

   SUBROUTINE eigensolver_test(para_env, iw, eigensolver_section)


      TYPE(mp_para_env_type), POINTER                    :: para_env

      INTEGER                                            :: iw

      TYPE(section_vals_type), POINTER                   :: eigensolver_section


      INTEGER                                            :: diag_method, i, i_loop, i_rep, &

                                                            init_method, j, n, n_loop, n_rep, &

                                                            neig, unit_number

      REAL(kind=dp)                                      :: t1, t2

      REAL(kind=dp), ALLOCATABLE, DIMENSION(:)           :: eigenvalues

      REAL(kind=dp), ALLOCATABLE, DIMENSION(:, :)        :: buffer

      TYPE(cp_blacs_env_type), POINTER                   :: blacs_env

      TYPE(cp_fm_struct_type), POINTER                   :: fmstruct

      TYPE(cp_fm_type)                                   :: eigenvectors, matrix, work

      TYPE(rng_stream_type), ALLOCATABLE                 :: rng_stream


      IF (iw > 0) THEN

         WRITE (unit=iw, fmt="(/,/,T2,A,/)") "EIGENSOLVER TEST"

      END IF


      ! create blacs env corresponding to para_env

      NULLIFY (blacs_env)

      CALL cp_blacs_env_create(blacs_env=blacs_env, &

                               para_env=para_env)


      ! loop over all tests

      CALL section_vals_get(eigensolver_section, n_repetition=n_rep)

      DO i_rep = 1, n_rep


         ! parse section

         CALL section_vals_val_get(eigensolver_section, "N", i_rep_section=i_rep, i_val=n)

         CALL section_vals_val_get(eigensolver_section, "EIGENVALUES", i_rep_section=i_rep, i_val=neig)

         CALL section_vals_val_get(eigensolver_section, "DIAG_METHOD", i_rep_section=i_rep, i_val=diag_method)

         CALL section_vals_val_get(eigensolver_section, "INIT_METHOD", i_rep_section=i_rep, i_val=init_method)

         CALL section_vals_val_get(eigensolver_section, "N_loop", i_rep_section=i_rep, i_val=n_loop)


         ! proper number of eigs

         IF (neig < 0) neig = n

         neig = min(neig, n)


         ! report

         IF (iw > 0) THEN

            WRITE (iw, *) "Matrix size", n

            WRITE (iw, *) "Number of eigenvalues", neig

            WRITE (iw, *) "Timing loops", n_loop

            SELECT CASE (diag_method)

            CASE (do_diag_syevd)

               WRITE (iw, *) "Diag using syevd"

            CASE (do_diag_syevx)

               WRITE (iw, *) "Diag using syevx"

            CASE DEFAULT

               ! stop

            END SELECT


            SELECT CASE (init_method)

            CASE (do_mat_random)

               WRITE (iw, *) "using random matrix"

            CASE (do_mat_read)

               WRITE (iw, *) "reading from file"

            CASE DEFAULT

               ! stop

            END SELECT

         END IF


         ! create matrix struct type

         NULLIFY (fmstruct)

         CALL cp_fm_struct_create(fmstruct=fmstruct, &

                                  para_env=para_env, &

                                  context=blacs_env, &

                                  nrow_global=n, &

                                  ncol_global=n)


         ! create all needed matrices, and buffers for the eigenvalues

         CALL cp_fm_create(matrix=matrix, &

                           matrix_struct=fmstruct, &

                           name="MATRIX")

         CALL cp_fm_set_all(matrix, 0.0_dp)


         CALL cp_fm_create(matrix=eigenvectors, &

                           matrix_struct=fmstruct, &

                           name="EIGENVECTORS")

         CALL cp_fm_set_all(eigenvectors, 0.0_dp)


         CALL cp_fm_create(matrix=work, &

                           matrix_struct=fmstruct, &

                           name="WORK")

         CALL cp_fm_set_all(matrix, 0.0_dp)


         ALLOCATE (eigenvalues(n))

         eigenvalues = 0.0_dp

         ALLOCATE (buffer(1, n))


         ! generate initial matrix, either by reading a file, or using random numbers

         IF (para_env%is_source()) THEN

            SELECT CASE (init_method)

            CASE (do_mat_random)

               rng_stream = rng_stream_type( &

                            name="rng_stream", &

                            distribution_type=uniform, &

                            extended_precision=.true.)

            CASE (do_mat_read)

               CALL open_file(file_name="MATRIX", &

                              file_action="READ", &

                              file_form="FORMATTED", &

                              file_status="OLD", &

                              unit_number=unit_number)

            END SELECT

         END IF


         DO i = 1, n

            IF (para_env%is_source()) THEN

               SELECT CASE (init_method)

               CASE (do_mat_random)

                  DO j = i, n

                     buffer(1, j) = rng_stream%next() - 0.5_dp

                  END DO

                  !MK activate/modify for a diagonal dominant symmetric matrix:

                  !MK buffer(1,i) = 10.0_dp*buffer(1,i)

               CASE (do_mat_read)

                  READ (unit=unit_number, fmt=*) buffer(1, 1:n)

               END SELECT

            END IF

            CALL para_env%bcast(buffer)

            SELECT CASE (init_method)

            CASE (do_mat_random)

               CALL cp_fm_set_submatrix(fm=matrix, &

                                        new_values=buffer, &

                                        start_row=i, &

                                        start_col=i, &

                                        n_rows=1, &

                                        n_cols=n - i + 1, &

                                        alpha=1.0_dp, &

                                        beta=0.0_dp, &

                                        transpose=.false.)

               CALL cp_fm_set_submatrix(fm=matrix, &

                                        new_values=buffer, &

                                        start_row=i, &

                                        start_col=i, &

                                        n_rows=n - i + 1, &

                                        n_cols=1, &

                                        alpha=1.0_dp, &

                                        beta=0.0_dp, &

                                        transpose=.true.)

            CASE (do_mat_read)

               CALL cp_fm_set_submatrix(fm=matrix, &

                                        new_values=buffer, &

                                        start_row=i, &

                                        start_col=1, &

                                        n_rows=1, &

                                        n_cols=n, &

                                        alpha=1.0_dp, &

                                        beta=0.0_dp, &

                                        transpose=.false.)

            END SELECT

         END DO


         DEALLOCATE (buffer)


         IF (para_env%is_source()) THEN

            SELECT CASE (init_method)

            CASE (do_mat_read)

               CALL close_file(unit_number=unit_number)

            END SELECT

         END IF


         DO i_loop = 1, n_loop

            eigenvalues = 0.0_dp

            CALL cp_fm_set_all(eigenvectors, 0.0_dp)

            CALL cp_fm_to_fm(source=matrix, &

                             destination=work)


            ! DONE, now testing

            t1 = m_walltime()

            SELECT CASE (diag_method)

            CASE (do_diag_syevd)

               CALL cp_fm_syevd(matrix=work, &

                                eigenvectors=eigenvectors, &

                                eigenvalues=eigenvalues)

            CASE (do_diag_syevx)

               CALL cp_fm_syevx(matrix=work, &

                                eigenvectors=eigenvectors, &

                                eigenvalues=eigenvalues, &

                                neig=neig, &

                                work_syevx=1.0_dp)

            END SELECT

            t2 = m_walltime()

            IF (iw > 0) WRITE (iw, *) "Timing for loop ", i_loop, " : ", t2 - t1

         END DO


         IF (iw > 0) THEN

            WRITE (iw, *) "Eigenvalues: "

            WRITE (unit=iw, fmt="(T3,5F14.6)") eigenvalues(1:neig)

            WRITE (unit=iw, fmt="(T3,A4,F16.6)") "Sum:", sum(eigenvalues(1:neig))

            WRITE (iw, *) ""

         END IF


         ! Clean up

         DEALLOCATE (eigenvalues)

         CALL cp_fm_release(matrix=work)

         CALL cp_fm_release(matrix=eigenvectors)

         CALL cp_fm_release(matrix=matrix)

         CALL cp_fm_struct_release(fmstruct=fmstruct)


      END DO


      CALL cp_blacs_env_release(blacs_env=blacs_env)


   END SUBROUTINE eigensolver_test


! **************************************************************************************************

!> \brief Tests the parallel matrix multiply

!> \param para_env ...

!> \param iw ...

!> \param cp_fm_gemm_test_section ...

! **************************************************************************************************

   SUBROUTINE cp_fm_gemm_test(para_env, iw, cp_fm_gemm_test_section)


      TYPE(mp_para_env_type), POINTER                    :: para_env

      INTEGER                                            :: iw

      TYPE(section_vals_type), POINTER                   :: cp_fm_gemm_test_section


      CHARACTER(LEN=1)                                   :: transa, transb

      INTEGER :: i_loop, i_rep, k, m, n, n_loop, n_rep, ncol_block, ncol_block_actual, &

         ncol_global, np, nrow_block, nrow_block_actual, nrow_global

      INTEGER, DIMENSION(:), POINTER                     :: grid_2d

      LOGICAL                                            :: force_blocksize, row_major, transa_p, &

                                                            transb_p

      REAL(kind=dp)                                      :: t1, t2, t3, t4

      TYPE(cp_blacs_env_type), POINTER                   :: blacs_env

      TYPE(cp_fm_struct_type), POINTER                   :: fmstruct_a, fmstruct_b, fmstruct_c

      TYPE(cp_fm_type)                                   :: matrix_a, matrix_b, matrix_c


      CALL section_vals_get(cp_fm_gemm_test_section, n_repetition=n_rep)

      DO i_rep = 1, n_rep


         ! how often should we do the multiply

         CALL section_vals_val_get(cp_fm_gemm_test_section, "N_loop", i_rep_section=i_rep, i_val=n_loop)


         ! matrices def.

         CALL section_vals_val_get(cp_fm_gemm_test_section, "K", i_rep_section=i_rep, i_val=k)

         CALL section_vals_val_get(cp_fm_gemm_test_section, "N", i_rep_section=i_rep, i_val=n)

         CALL section_vals_val_get(cp_fm_gemm_test_section, "M", i_rep_section=i_rep, i_val=m)

         CALL section_vals_val_get(cp_fm_gemm_test_section, "transa", i_rep_section=i_rep, l_val=transa_p)

         CALL section_vals_val_get(cp_fm_gemm_test_section, "transb", i_rep_section=i_rep, l_val=transb_p)

         CALL section_vals_val_get(cp_fm_gemm_test_section, "nrow_block", i_rep_section=i_rep, i_val=nrow_block)

         CALL section_vals_val_get(cp_fm_gemm_test_section, "ncol_block", i_rep_section=i_rep, i_val=ncol_block)

         CALL section_vals_val_get(cp_fm_gemm_test_section, "ROW_MAJOR", i_rep_section=i_rep, l_val=row_major)

         CALL section_vals_val_get(cp_fm_gemm_test_section, "GRID_2D", i_rep_section=i_rep, i_vals=grid_2d)

         CALL section_vals_val_get(cp_fm_gemm_test_section, "FORCE_BLOCKSIZE", i_rep_section=i_rep, l_val=force_blocksize)

         transa = "N"

         transb = "N"

         IF (transa_p) transa = "T"

         IF (transb_p) transb = "T"


         IF (iw > 0) THEN

            WRITE (iw, '(T2,A)') "----------- TESTING PARALLEL MATRIX MULTIPLY -------------"

            WRITE (iw, '(T2,A)', advance="NO") "C = "

            IF (transa_p) THEN

               WRITE (iw, '(A)', advance="NO") "TRANSPOSE(A) x"

            ELSE

               WRITE (iw, '(A)', advance="NO") "A x "

            END IF

            IF (transb_p) THEN

               WRITE (iw, '(A)') "TRANSPOSE(B) "

            ELSE

               WRITE (iw, '(A)') "B "

            END IF

            WRITE (iw, '(T2,A,T50,I5,A,I5)') 'requested block size', nrow_block, ' by ', ncol_block

            WRITE (iw, '(T2,A,T50,I5)') 'number of repetitions of cp_fm_gemm ', n_loop

            WRITE (iw, '(T2,A,T50,L5)') 'Row Major', row_major

            WRITE (iw, '(T2,A,T50,2I7)') 'GRID_2D ', grid_2d

            WRITE (iw, '(T2,A,T50,L5)') 'Force blocksize ', force_blocksize

            ! check the return value of pilaenv, too small values limit the performance (assuming pdgemm is the vanilla variant)

            np = cp_fm_pilaenv(0, 'D')

            IF (np > 0) THEN

               WRITE (iw, '(T2,A,T50,I5)') 'PILAENV blocksize', np

            END IF

         END IF


         NULLIFY (blacs_env)

         CALL cp_blacs_env_create(blacs_env=blacs_env, &

                                  para_env=para_env, &

                                  row_major=row_major, &

                                  grid_2d=grid_2d)


         NULLIFY (fmstruct_a)

         IF (transa_p) THEN

            nrow_global = m; ncol_global = k

         ELSE

            nrow_global = k; ncol_global = m

         END IF

         CALL cp_fm_struct_create(fmstruct=fmstruct_a, para_env=para_env, context=blacs_env, &

                                  nrow_global=nrow_global, ncol_global=ncol_global, &

                                  nrow_block=nrow_block, ncol_block=ncol_block, force_block=force_blocksize)

         CALL cp_fm_struct_get(fmstruct_a, nrow_block=nrow_block_actual, ncol_block=ncol_block_actual)

         IF (iw > 0) WRITE (iw, '(T2,A,I9,A,I9,A,I5,A,I5)') 'matrix A ', nrow_global, " by ", ncol_global, &

            ' using blocks of ', nrow_block_actual, ' by ', ncol_block_actual


         IF (transb_p) THEN

            nrow_global = n; ncol_global = m

         ELSE

            nrow_global = m; ncol_global = n

         END IF

         NULLIFY (fmstruct_b)

         CALL cp_fm_struct_create(fmstruct=fmstruct_b, para_env=para_env, context=blacs_env, &

                                  nrow_global=nrow_global, ncol_global=ncol_global, &

                                  nrow_block=nrow_block, ncol_block=ncol_block, force_block=force_blocksize)

         CALL cp_fm_struct_get(fmstruct_b, nrow_block=nrow_block_actual, ncol_block=ncol_block_actual)

         IF (iw > 0) WRITE (iw, '(T2,A,I9,A,I9,A,I5,A,I5)') 'matrix B ', nrow_global, " by ", ncol_global, &

            ' using blocks of ', nrow_block_actual, ' by ', ncol_block_actual


         NULLIFY (fmstruct_c)

         nrow_global = k

         ncol_global = n

         CALL cp_fm_struct_create(fmstruct=fmstruct_c, para_env=para_env, context=blacs_env, &

                                  nrow_global=nrow_global, ncol_global=ncol_global, &

                                  nrow_block=nrow_block, ncol_block=ncol_block, force_block=force_blocksize)

         CALL cp_fm_struct_get(fmstruct_c, nrow_block=nrow_block_actual, ncol_block=ncol_block_actual)

         IF (iw > 0) WRITE (iw, '(T2,A,I9,A,I9,A,I5,A,I5)') 'matrix C ', nrow_global, " by ", ncol_global, &

            ' using blocks of ', nrow_block_actual, ' by ', ncol_block_actual


         CALL cp_fm_create(matrix=matrix_a, matrix_struct=fmstruct_a, name="MATRIX A")

         CALL cp_fm_create(matrix=matrix_b, matrix_struct=fmstruct_b, name="MATRIX B")

         CALL cp_fm_create(matrix=matrix_c, matrix_struct=fmstruct_c, name="MATRIX C")


         CALL random_number(matrix_a%local_data)

         CALL random_number(matrix_b%local_data)

         CALL random_number(matrix_c%local_data)


         IF (iw > 0) CALL m_flush(iw)


         t1 = m_walltime()

         DO i_loop = 1, n_loop

            t3 = m_walltime()

            CALL parallel_gemm(transa, transb, k, n, m, 1.0_dp, matrix_a, matrix_b, 0.0_dp, matrix_c)

            t4 = m_walltime()

            IF (iw > 0) THEN

               WRITE (iw, '(T2,A,T50,F12.6)') "cp_fm_gemm timing: ", (t4 - t3)

               CALL m_flush(iw)

            END IF

         END DO

         t2 = m_walltime()


         IF (iw > 0) THEN

            WRITE (iw, '(T2,A,T50,F12.6)') "average cp_fm_gemm timing: ", (t2 - t1)/n_loop

            IF (t2 > t1) THEN

               WRITE (iw, '(T2,A,T50,F12.6)') "cp_fm_gemm Gflops per MPI task: ", &

                  2*real(m, kind=dp)*real(n, kind=dp)*real(k, kind=dp)*n_loop/max(0.001_dp, t2 - t1)/1.0e9_dp/para_env%num_pe

            END IF

         END IF


         CALL cp_fm_release(matrix=matrix_a)

         CALL cp_fm_release(matrix=matrix_b)

         CALL cp_fm_release(matrix=matrix_c)

         CALL cp_fm_struct_release(fmstruct=fmstruct_a)

         CALL cp_fm_struct_release(fmstruct=fmstruct_b)

         CALL cp_fm_struct_release(fmstruct=fmstruct_c)

         CALL cp_blacs_env_release(blacs_env=blacs_env)


      END DO


   END SUBROUTINE cp_fm_gemm_test


! **************************************************************************************************

!> \brief Tests the DBCSR interface.

!> \param para_env ...

!> \param iw ...

!> \param input_section ...

! **************************************************************************************************

   SUBROUTINE cp_dbcsr_tests(para_env, iw, input_section)


      TYPE(mp_para_env_type), POINTER                    :: para_env

      INTEGER                                            :: iw

      TYPE(section_vals_type), POINTER                   :: input_section


      CHARACTER, DIMENSION(3)                            :: types

      INTEGER                                            :: data_type, i_rep, k, m, n, n_loop, &

                                                            n_rep, test_type

      INTEGER, DIMENSION(:), POINTER                     :: bs_k, bs_m, bs_n, nproc

      LOGICAL                                            :: always_checksum, retain_sparsity, &

                                                            transa_p, transb_p

      REAL(kind=dp)                                      :: alpha, beta, filter_eps, s_a, s_b, s_c


!   ---------------------------------------------------------------------------


      NULLIFY (bs_m, bs_n, bs_k)

      CALL section_vals_get(input_section, n_repetition=n_rep)

      CALL dbcsr_reset_randmat_seed()

      DO i_rep = 1, n_rep

         ! how often should we do the multiply

         CALL section_vals_val_get(input_section, "N_loop", i_rep_section=i_rep, i_val=n_loop)


         ! matrices def.

         CALL section_vals_val_get(input_section, "TEST_TYPE", i_rep_section=i_rep, i_val=test_type)

         CALL section_vals_val_get(input_section, "DATA_TYPE", i_rep_section=i_rep, i_val=data_type)

         CALL section_vals_val_get(input_section, "K", i_rep_section=i_rep, i_val=k)

         CALL section_vals_val_get(input_section, "N", i_rep_section=i_rep, i_val=n)

         CALL section_vals_val_get(input_section, "M", i_rep_section=i_rep, i_val=m)

         CALL section_vals_val_get(input_section, "transa", i_rep_section=i_rep, l_val=transa_p)

         CALL section_vals_val_get(input_section, "transb", i_rep_section=i_rep, l_val=transb_p)

         CALL section_vals_val_get(input_section, "bs_m", i_rep_section=i_rep, &

                                   i_vals=bs_m)

         CALL section_vals_val_get(input_section, "bs_n", i_rep_section=i_rep, &

                                   i_vals=bs_n)

         CALL section_vals_val_get(input_section, "bs_k", i_rep_section=i_rep, &

                                   i_vals=bs_k)

         CALL section_vals_val_get(input_section, "keepsparse", i_rep_section=i_rep, l_val=retain_sparsity)

         CALL section_vals_val_get(input_section, "asparsity", i_rep_section=i_rep, r_val=s_a)

         CALL section_vals_val_get(input_section, "bsparsity", i_rep_section=i_rep, r_val=s_b)

         CALL section_vals_val_get(input_section, "csparsity", i_rep_section=i_rep, r_val=s_c)

         CALL section_vals_val_get(input_section, "alpha", i_rep_section=i_rep, r_val=alpha)

         CALL section_vals_val_get(input_section, "beta", i_rep_section=i_rep, r_val=beta)

         CALL section_vals_val_get(input_section, "nproc", i_rep_section=i_rep, &

                                   i_vals=nproc)

         CALL section_vals_val_get(input_section, "atype", i_rep_section=i_rep, &

                                   c_val=types(1))

         CALL section_vals_val_get(input_section, "btype", i_rep_section=i_rep, &

                                   c_val=types(2))

         CALL section_vals_val_get(input_section, "ctype", i_rep_section=i_rep, &

                                   c_val=types(3))

         CALL section_vals_val_get(input_section, "filter_eps", &

                                   i_rep_section=i_rep, r_val=filter_eps)

         CALL section_vals_val_get(input_section, "ALWAYS_CHECKSUM", i_rep_section=i_rep, l_val=always_checksum)


         CALL dbcsr_run_tests(para_env%get_handle(), iw, nproc, &

                              (/m, n, k/), &

                              (/transa_p, transb_p/), &

                              bs_m, bs_n, bs_k, &

                              (/s_a, s_b, s_c/), &

                              alpha, beta, &

                              data_type=data_type, &

                              test_type=test_type, &

                              n_loops=n_loop, eps=filter_eps, retain_sparsity=retain_sparsity, &

                              always_checksum=always_checksum)

      END DO

   END SUBROUTINE cp_dbcsr_tests


! **************************************************************************************************

!> \brief Tests the DBM library.

!> \param para_env ...

!> \param iw ...

!> \param input_section ...

! **************************************************************************************************

   SUBROUTINE run_dbm_tests(para_env, iw, input_section)


      TYPE(mp_para_env_type), POINTER                    :: para_env

      INTEGER                                            :: iw

      TYPE(section_vals_type), POINTER                   :: input_section


      INTEGER                                            :: i_rep, k, m, n, n_loop, n_rep

      INTEGER, DIMENSION(:), POINTER                     :: bs_k, bs_m, bs_n

      LOGICAL                                            :: always_checksum, retain_sparsity, &

                                                            transa_p, transb_p

      REAL(kind=dp)                                      :: alpha, beta, filter_eps, s_a, s_b, s_c


!   ---------------------------------------------------------------------------


      NULLIFY (bs_m, bs_n, bs_k)

      CALL section_vals_get(input_section, n_repetition=n_rep)

      CALL dbcsr_reset_randmat_seed()

      DO i_rep = 1, n_rep

         CALL section_vals_val_get(input_section, "N_loop", i_rep_section=i_rep, i_val=n_loop)

         CALL section_vals_val_get(input_section, "K", i_rep_section=i_rep, i_val=k)

         CALL section_vals_val_get(input_section, "N", i_rep_section=i_rep, i_val=n)

         CALL section_vals_val_get(input_section, "M", i_rep_section=i_rep, i_val=m)

         CALL section_vals_val_get(input_section, "transa", i_rep_section=i_rep, l_val=transa_p)

         CALL section_vals_val_get(input_section, "transb", i_rep_section=i_rep, l_val=transb_p)

         CALL section_vals_val_get(input_section, "bs_m", i_rep_section=i_rep, i_vals=bs_m)

         CALL section_vals_val_get(input_section, "bs_n", i_rep_section=i_rep, i_vals=bs_n)

         CALL section_vals_val_get(input_section, "bs_k", i_rep_section=i_rep, i_vals=bs_k)

         CALL section_vals_val_get(input_section, "keepsparse", i_rep_section=i_rep, l_val=retain_sparsity)

         CALL section_vals_val_get(input_section, "asparsity", i_rep_section=i_rep, r_val=s_a)

         CALL section_vals_val_get(input_section, "bsparsity", i_rep_section=i_rep, r_val=s_b)

         CALL section_vals_val_get(input_section, "csparsity", i_rep_section=i_rep, r_val=s_c)

         CALL section_vals_val_get(input_section, "alpha", i_rep_section=i_rep, r_val=alpha)

         CALL section_vals_val_get(input_section, "beta", i_rep_section=i_rep, r_val=beta)

         CALL section_vals_val_get(input_section, "filter_eps", i_rep_section=i_rep, r_val=filter_eps)

         CALL section_vals_val_get(input_section, "ALWAYS_CHECKSUM", i_rep_section=i_rep, l_val=always_checksum)


         CALL dbm_run_tests(mp_group=para_env, &

                            io_unit=iw, &

                            matrix_sizes=(/m, n, k/), &

                            trs=(/transa_p, transb_p/), &

                            bs_m=bs_m, &

                            bs_n=bs_n, &

                            bs_k=bs_k, &

                            sparsities=(/s_a, s_b, s_c/), &

                            alpha=alpha, &

                            beta=beta, &

                            n_loops=n_loop, &

                            eps=filter_eps, &

                            retain_sparsity=retain_sparsity, &

                            always_checksum=always_checksum)

      END DO

   END SUBROUTINE run_dbm_tests


END MODULE library_tests

dgemm
static void dgemm(const char transa, const char transb, const int m, const int n, const int k, const double alpha, const double *a, const int lda, const double *b, const int ldb, const double beta, double *c, const int ldc)
Convenient wrapper to hide Fortran nature of dgemm_, swapping a and b.
Definition grid_cpu_task_list.c:214

cp_fm_types::cp_fm_release
Definition cp_fm_types.F:87

cp_fm_types::cp_fm_to_fm
Definition cp_fm_types.F:82

fft_tools::fft3d
Definition fft_tools.F:166

parallel_gemm_api::parallel_gemm
Definition parallel_gemm_api.F:38

pw_grids::pw_grid_create
Definition pw_grids.F:81

pw_methods::pw_transfer
Definition pw_methods.F:303

pw_methods::pw_zero
Definition pw_methods.F:82

ai_coulomb_test
Test of Electron Repulsion Routines (ERI)
Definition ai_coulomb_test.F:14

ai_coulomb_test::threshold
real(kind=dp), parameter threshold
Definition ai_coulomb_test.F:29

ai_coulomb_test::eri_test
subroutine, public eri_test(iw)
...
Definition ai_coulomb_test.F:43

cell_methods
Handles all functions related to the CELL.
Definition cell_methods.F:15

cell_methods::init_cell
subroutine, public init_cell(cell, hmat, periodic)
Initialise/readjust a simulation cell after hmat has been changed.
Definition cell_methods.F:117

cell_methods::cell_create
subroutine, public cell_create(cell, hmat, periodic, tag)
allocates and initializes a cell
Definition cell_methods.F:85

cell_types
Handles all functions related to the CELL.
Definition cell_types.F:15

cell_types::cell_release
subroutine, public cell_release(cell)
releases the given cell (see doc/ReferenceCounting.html)
Definition cell_types.F:559

cg_test
Test of Clebsch-Gordon Coefficients.
Definition cg_test.F:14

cg_test::clebsch_gordon_test
subroutine, public clebsch_gordon_test()
...
Definition cg_test.F:42

cp_blacs_env
methods related to the blacs parallel environment
Definition cp_blacs_env.F:15

cp_blacs_env::cp_blacs_env_release
subroutine, public cp_blacs_env_release(blacs_env)
releases the given blacs_env
Definition cp_blacs_env.F:274

cp_blacs_env::cp_blacs_env_create
subroutine, public cp_blacs_env_create(blacs_env, para_env, blacs_grid_layout, blacs_repeatable, row_major, grid_2d)
allocates and initializes a type that represent a blacs context
Definition cp_blacs_env.F:123

cp_dbcsr_api
Definition cp_dbcsr_api.F:8

cp_eri_mme_interface
Interface to Minimax-Ewald method for periodic ERI's to be used in CP2K.
Definition cp_eri_mme_interface.F:12

cp_eri_mme_interface::cp_eri_mme_perf_acc_test
subroutine, public cp_eri_mme_perf_acc_test(para_env, iw, eri_mme_test_section)
...
Definition cp_eri_mme_interface.F:753

cp_files
Utility routines to open and close files. Tracking of preconnections.
Definition cp_files.F:16

cp_files::open_file
subroutine, public open_file(file_name, file_status, file_form, file_action, file_position, file_pad, unit_number, debug, skip_get_unit_number, file_access)
Opens the requested file using a free unit number.
Definition cp_files.F:308

cp_files::close_file
subroutine, public close_file(unit_number, file_status, keep_preconnection)
Close an open file given by its logical unit number. Optionally, keep the file and unit preconnected.
Definition cp_files.F:119

cp_fm_basic_linalg
Basic linear algebra operations for full matrices.
Definition cp_fm_basic_linalg.F:14

cp_fm_basic_linalg::cp_fm_gemm
subroutine, public cp_fm_gemm(transa, transb, m, n, k, alpha, matrix_a, matrix_b, beta, matrix_c, a_first_col, a_first_row, b_first_col, b_first_row, c_first_col, c_first_row)
computes matrix_c = beta * matrix_c + alpha * ( matrix_a ** transa ) * ( matrix_b ** transb )
Definition cp_fm_basic_linalg.F:440

cp_fm_diag
used for collecting some of the diagonalization schemes available for cp_fm_type. cp_fm_power also mo...
Definition cp_fm_diag.F:17

cp_fm_diag::cp_fm_syevd
subroutine, public cp_fm_syevd(matrix, eigenvectors, eigenvalues, info)
Computes all eigenvalues and vectors of a real symmetric matrix significantly faster than syevx,...
Definition cp_fm_diag.F:443

cp_fm_diag::cp_fm_syevx
subroutine, public cp_fm_syevx(matrix, eigenvectors, eigenvalues, neig, work_syevx)
compute eigenvalues and optionally eigenvectors of a real symmetric matrix using scalapack....
Definition cp_fm_diag.F:687

cp_fm_struct
represent the structure of a full matrix
Definition cp_fm_struct.F:14

cp_fm_struct::cp_fm_struct_create
subroutine, public cp_fm_struct_create(fmstruct, para_env, context, nrow_global, ncol_global, nrow_block, ncol_block, descriptor, first_p_pos, local_leading_dimension, template_fmstruct, square_blocks, force_block)
allocates and initializes a full matrix structure
Definition cp_fm_struct.F:132

cp_fm_struct::cp_fm_struct_get
subroutine, public cp_fm_struct_get(fmstruct, para_env, context, descriptor, ncol_block, nrow_block, nrow_global, ncol_global, first_p_pos, row_indices, col_indices, nrow_local, ncol_local, nrow_locals, ncol_locals, local_leading_dimension)
returns the values of various attributes of the matrix structure
Definition cp_fm_struct.F:440

cp_fm_struct::cp_fm_struct_release
subroutine, public cp_fm_struct_release(fmstruct)
releases a full matrix structure
Definition cp_fm_struct.F:351

cp_fm_types
represent a full matrix distributed on many processors
Definition cp_fm_types.F:15

cp_fm_types::cp_fm_set_submatrix
subroutine, public cp_fm_set_submatrix(fm, new_values, start_row, start_col, n_rows, n_cols, alpha, beta, transpose)
sets a submatrix of a full matrix fm(start_row:start_row+n_rows,start_col:start_col+n_cols) = alpha*o...
Definition cp_fm_types.F:761

cp_fm_types::cp_fm_set_all
subroutine, public cp_fm_set_all(matrix, alpha, beta)
set all elements of a matrix to the same value, and optionally the diagonal to a different one
Definition cp_fm_types.F:528

cp_fm_types::cp_fm_pilaenv
integer function, public cp_fm_pilaenv(ictxt, prec)
...
Definition cp_fm_types.F:2455

cp_fm_types::cp_fm_create
subroutine, public cp_fm_create(matrix, matrix_struct, name, use_sp)
creates a new full matrix with the given structure
Definition cp_fm_types.F:164

cp_log_handling
various routines to log and control the output. The idea is that decisions about where to log should ...
Definition cp_log_handling.F:41

cp_log_handling::cp_get_default_logger
type(cp_logger_type) function, pointer, public cp_get_default_logger()
returns the default logger
Definition cp_log_handling.F:234

cp_output_handling
routines to handle the output, The idea is to remove the decision of wheter to output and what to out...
Definition cp_output_handling.F:25

cp_output_handling::cp_print_key_unit_nr
integer function, public cp_print_key_unit_nr(logger, basis_section, print_key_path, extension, middle_name, local, log_filename, ignore_should_output, file_form, file_position, file_action, file_status, do_backup, on_file, is_new_file, mpi_io, fout)
...
Definition cp_output_handling.F:853

cp_output_handling::cp_print_key_finished_output
subroutine, public cp_print_key_finished_output(unit_nr, logger, basis_section, print_key_path, local, ignore_should_output, on_file, mpi_io)
should be called after you finish working with a unit obtained with cp_print_key_unit_nr,...
Definition cp_output_handling.F:1063

cp_realspace_grid_init
Definition cp_realspace_grid_init.F:15

cp_realspace_grid_init::init_input_type
subroutine, public init_input_type(input_settings, nsmax, rs_grid_section, ilevel, higher_grid_layout)
parses an input section to assign the proper values to the input type
Definition cp_realspace_grid_init.F:48

dbm_tests
Definition dbm_tests.F:8

dbm_tests::dbm_run_tests
subroutine, public dbm_run_tests(mp_group, io_unit, matrix_sizes, trs, bs_m, bs_n, bs_k, sparsities, alpha, beta, n_loops, eps, retain_sparsity, always_checksum)
Tests the DBM library.
Definition dbm_tests.F:54

fft_tools
Definition fft_tools.F:29

fft_tools::fft_radix_operations
subroutine, public fft_radix_operations(radix_in, radix_out, operation)
Determine the allowed lengths of FFT's '''.
Definition fft_tools.F:239

fft_tools::bwfft
integer, parameter, public bwfft
Definition fft_tools.F:146

fft_tools::fft_radix_closest
integer, parameter, public fft_radix_closest
Definition fft_tools.F:147

fft_tools::init_fft
subroutine, public init_fft(fftlib, alltoall, fftsg_sizes, pool_limit, wisdom_file, plan_style)
...
Definition fft_tools.F:186

fft_tools::fwfft
integer, parameter, public fwfft
Definition fft_tools.F:146

fft_tools::finalize_fft
subroutine, public finalize_fft(para_env, wisdom_file)
does whatever is needed to finalize the current fft setup
Definition fft_tools.F:216

global_types
Define type storing the global information of a run. Keep the amount of stored data small....
Definition global_types.F:21

input_constants
collects all constants needed in input so that they can be used without circular dependencies
Definition input_constants.F:17

input_constants::do_diag_syevd
integer, parameter, public do_diag_syevd
Definition input_constants.F:74

input_constants::do_mat_read
integer, parameter, public do_mat_read
Definition input_constants.F:77

input_constants::do_pwgrid_ns_fullspace
integer, parameter, public do_pwgrid_ns_fullspace
Definition input_constants.F:236

input_constants::do_diag_syevx
integer, parameter, public do_diag_syevx
Definition input_constants.F:74

input_constants::do_pwgrid_spherical
integer, parameter, public do_pwgrid_spherical
Definition input_constants.F:236

input_constants::do_mat_random
integer, parameter, public do_mat_random
Definition input_constants.F:77

input_constants::do_pwgrid_ns_halfspace
integer, parameter, public do_pwgrid_ns_halfspace
Definition input_constants.F:236

input_section_types
objects that represent the structure of input sections and the data contained in an input section
Definition input_section_types.F:15

input_section_types::section_vals_get_subs_vals
recursive type(section_vals_type) function, pointer, public section_vals_get_subs_vals(section_vals, subsection_name, i_rep_section, can_return_null)
returns the values of the requested subsection
Definition input_section_types.F:731

input_section_types::section_vals_get
subroutine, public section_vals_get(section_vals, ref_count, n_repetition, n_subs_vals_rep, section, explicit)
returns various attributes about the section_vals
Definition input_section_types.F:704

input_section_types::section_vals_val_get
subroutine, public section_vals_val_get(section_vals, keyword_name, i_rep_section, i_rep_val, n_rep_val, val, l_val, i_val, r_val, c_val, l_vals, i_vals, r_vals, c_vals, explicit)
returns the requested value
Definition input_section_types.F:1047

kinds
Defines the basic variable types.
Definition kinds.F:23

kinds::dp
integer, parameter, public dp
Definition kinds.F:34

library_tests
Performance tests for basic tasks like matrix multiplies, copy, fft.
Definition library_tests.F:18

library_tests::lib_test
subroutine, public lib_test(root_section, para_env, globenv)
Master routine for tests.
Definition library_tests.F:122

machine
Machine interface based on Fortran 2003 and POSIX.
Definition machine.F:17

machine::m_flush
subroutine, public m_flush(lunit)
flushes units if the &GLOBAL flag is set accordingly
Definition machine.F:130

machine::m_walltime
real(kind=dp) function, public m_walltime()
returns time from a real-time clock, protected against rolling early/easily
Definition machine.F:147

message_passing
Interface to the message passing library MPI.
Definition message_passing.F:23

minimax_exp
Routines to calculate the minimax coefficients in order to approximate 1/x as a sum over exponential ...
Definition minimax_exp.F:29

minimax_exp::validate_exp_minimax
subroutine, public validate_exp_minimax(n_r, iw)
Unit test checking that numerical error of minimax approximations generated using any k15 or k53 coef...
Definition minimax_exp.F:246

mp2_grids
Routines to calculate frequency and time grids (integration points and weights) for correlation metho...
Definition mp2_grids.F:14

mp2_grids::test_least_square_ft
subroutine, public test_least_square_ft(nr, iw)
test the singular value decomposition for the computation of integration weights for the Fourier tran...
Definition mp2_grids.F:1167

mp_perf_test
Interface to the message passing library MPI.
Definition mp_perf_test.F:23

mp_perf_test::mpi_perf_test
subroutine, public mpi_perf_test(comm, npow, output_unit)
Tests the MPI library.
Definition mp_perf_test.F:55

parallel_gemm_api
basic linear algebra operations for full matrixes
Definition parallel_gemm_api.F:14

parallel_rng_types
Parallel (pseudo)random number generator (RNG) for multiple streams and substreams of random numbers.
Definition parallel_rng_types.F:51

parallel_rng_types::advance
subroutine advance(self, e, c)
Advance the state by n steps, i.e. jump n steps forward, if n > 0, or backward if n < 0.
Definition parallel_rng_types.F:228

parallel_rng_types::uniform
integer, parameter, public uniform
Definition parallel_rng_types.F:73

pw_grid_types
Definition pw_grid_types.F:13

pw_grid_types::halfspace
integer, parameter, public halfspace
Definition pw_grid_types.F:26

pw_grid_types::fullspace
integer, parameter, public fullspace
Definition pw_grid_types.F:26

pw_grids
This module defines the grid data type and some basic operations on it.
Definition pw_grids.F:36

pw_grids::pw_grid_release
subroutine, public pw_grid_release(pw_grid)
releases the given pw grid
Definition pw_grids.F:2163

pw_methods
Definition pw_methods.F:25

pw_types
Definition pw_types.F:24

realspace_grid_types
Definition realspace_grid_types.F:18

realspace_grid_types::rs_grid_print
subroutine, public rs_grid_print(rs, iounit)
Print information on grids to output.
Definition realspace_grid_types.F:579

realspace_grid_types::rs_grid_create
subroutine, public rs_grid_create(rs, desc)
...
Definition realspace_grid_types.F:478

realspace_grid_types::rs_grid_create_descriptor
subroutine, public rs_grid_create_descriptor(desc, pw_grid, input_settings, border_points)
Determine the setup of real space grids - this is divided up into the creation of a descriptor and th...
Definition realspace_grid_types.F:202

realspace_grid_types::transfer_pw2rs
subroutine, public transfer_pw2rs(rs, pw)
...
Definition realspace_grid_types.F:694

realspace_grid_types::rs_grid_release_descriptor
subroutine, public rs_grid_release_descriptor(rs_desc)
releases the given rs grid descriptor (see doc/ReferenceCounting.html)
Definition realspace_grid_types.F:2032

realspace_grid_types::transfer_rs2pw
subroutine, public transfer_rs2pw(rs, pw)
...
Definition realspace_grid_types.F:652

realspace_grid_types::rs_grid_release
subroutine, public rs_grid_release(rs_grid)
releases the given rs grid (see doc/ReferenceCounting.html)
Definition realspace_grid_types.F:2012

realspace_grid_types::rs_grid_zero
subroutine, public rs_grid_zero(rs)
Initialize grid to zero.
Definition realspace_grid_types.F:1905

shg_integrals_test
Calculates 2-center integrals for different r12 operators comparing the Solid harmonic Gaussian integ...
Definition shg_integrals_test.F:13

shg_integrals_test::shg_integrals_perf_acc_test
subroutine, public shg_integrals_perf_acc_test(iw, shg_integrals_test_section)
Unit test for performance and accuracy of the SHG integrals.
Definition shg_integrals_test.F:205

cell_types::cell_type
Type defining parameters related to the simulation cell.
Definition cell_types.F:55

cp_blacs_env::cp_blacs_env_type
represent a blacs multidimensional parallel environment (for the mpi corrispective see cp_paratypes/m...
Definition cp_blacs_env.F:53

cp_fm_struct::cp_fm_struct_type
keeps the information about the structure of a full matrix
Definition cp_fm_struct.F:82

cp_fm_types::cp_fm_type
represent a full matrix
Definition cp_fm_types.F:113

cp_log_handling::cp_logger_type
type of a logger, at the moment it contains just a print level starting at which level it should be l...
Definition cp_log_handling.F:140

global_types::global_environment_type
contains the initially parsed file and the initial parallel environment
Definition global_types.F:66

input_section_types::section_vals_type
stores the values of a section
Definition input_section_types.F:127

message_passing::mp_para_env_type
stores all the informations relevant to an mpi environment
Definition message_passing.F:763

parallel_rng_types::rng_stream_type
Definition parallel_rng_types.F:157

pw_grid_types::pw_grid_type
Definition pw_grid_types.F:52

pw_types::pw_c1d_gs_type
Definition pw_types.F:127

pw_types::pw_c3d_rs_type
Definition pw_types.F:88

pw_types::pw_r3d_rs_type
Definition pw_types.F:62

realspace_grid_types::realspace_grid_desc_type
Definition realspace_grid_types.F:90

realspace_grid_types::realspace_grid_input_type
Definition realspace_grid_types.F:80

realspace_grid_types::realspace_grid_type
Definition realspace_grid_types.F:136