! d6/d59/gw__utils_8F_source.html

!--------------------------------------------------------------------------------------------------!

!   CP2K: A general program to perform molecular dynamics simulations                              !

!   Copyright 2000-2025 CP2K developers group <https://cp2k.org>                                   !

!                                                                                                  !

!   SPDX-License-Identifier: GPL-2.0-or-later                                                      !

!--------------------------------------------------------------------------------------------------!


! **************************************************************************************************

!> \brief

!> \author Jan Wilhelm

!> \date 07.2023

! **************************************************************************************************

MODULE gw_utils

   USE atomic_kind_types,               ONLY: atomic_kind_type,&

                                              get_atomic_kind_set

   USE basis_set_types,                 ONLY: get_gto_basis_set,&

                                              gto_basis_set_type

   USE bibliography,                    ONLY: graml2024,&

                                              cite_reference

   USE cell_types,                      ONLY: cell_type,&

                                              pbc,&

                                              scaled_to_real

   USE cp_blacs_env,                    ONLY: cp_blacs_env_create,&

                                              cp_blacs_env_release,&

                                              cp_blacs_env_type

   USE cp_cfm_types,                    ONLY: cp_cfm_create,&

                                              cp_cfm_release,&

                                              cp_cfm_to_cfm,&

                                              cp_cfm_to_fm,&

                                              cp_cfm_type

   USE cp_control_types,                ONLY: dft_control_type

   USE cp_dbcsr_api,                    ONLY: &

        dbcsr_create, dbcsr_distribution_release, dbcsr_distribution_type, dbcsr_p_type, &

        dbcsr_release, dbcsr_set, dbcsr_type, dbcsr_type_no_symmetry, dbcsr_type_symmetric

   USE cp_dbcsr_operations,             ONLY: copy_dbcsr_to_fm,&

                                              copy_fm_to_dbcsr,&

                                              cp_dbcsr_dist2d_to_dist,&

                                              dbcsr_allocate_matrix_set,&

                                              dbcsr_deallocate_matrix_set

   USE cp_files,                        ONLY: close_file,&

                                              open_file

   USE cp_fm_basic_linalg,              ONLY: cp_fm_scale_and_add

   USE cp_fm_struct,                    ONLY: cp_fm_struct_create,&

                                              cp_fm_struct_release,&

                                              cp_fm_struct_type

   USE cp_fm_types,                     ONLY: cp_fm_create,&

                                              cp_fm_get_diag,&

                                              cp_fm_release,&

                                              cp_fm_set_all,&

                                              cp_fm_type

   USE cp_log_handling,                 ONLY: cp_get_default_logger,&

                                              cp_logger_type

   USE cp_output_handling,              ONLY: cp_print_key_generate_filename

   USE dbt_api,                         ONLY: &

        dbt_clear, dbt_create, dbt_destroy, dbt_filter, dbt_iterator_blocks_left, &

        dbt_iterator_next_block, dbt_iterator_start, dbt_iterator_stop, dbt_iterator_type, &

        dbt_mp_environ_pgrid, dbt_pgrid_create, dbt_pgrid_destroy, dbt_pgrid_type, dbt_type

   USE distribution_2d_types,           ONLY: distribution_2d_type

   USE gw_communication,                ONLY: fm_to_local_array

   USE gw_integrals,                    ONLY: build_3c_integral_block

   USE gw_kp_to_real_space_and_back,    ONLY: trafo_rs_to_ikp

   USE input_constants,                 ONLY: do_potential_truncated,&

                                              large_cell_gamma,&

                                              ri_rpa_g0w0_crossing_newton,&

                                              rtp_method_bse,&

                                              small_cell_full_kp,&

                                              xc_none

   USE input_section_types,             ONLY: section_vals_get,&

                                              section_vals_get_subs_vals,&

                                              section_vals_type,&

                                              section_vals_val_get,&

                                              section_vals_val_set

   USE kinds,                           ONLY: default_string_length,&

                                              dp,&

                                              int_8

   USE kpoint_methods,                  ONLY: kpoint_init_cell_index

   USE kpoint_types,                    ONLY: get_kpoint_info,&

                                              kpoint_create,&

                                              kpoint_type

   USE libint_2c_3c,                    ONLY: libint_potential_type

   USE libint_wrapper,                  ONLY: cp_libint_static_cleanup,&

                                              cp_libint_static_init

   USE machine,                         ONLY: m_memory,&

                                              m_walltime

   USE mathconstants,                   ONLY: gaussi,&

                                              z_one,&

                                              z_zero

   USE mathlib,                         ONLY: diag_complex,&

                                              gcd

   USE message_passing,                 ONLY: mp_cart_type,&

                                              mp_para_env_type

   USE minimax_exp,                     ONLY: get_exp_minimax_coeff

   USE minimax_exp_gw,                  ONLY: get_exp_minimax_coeff_gw

   USE minimax_rpa,                     ONLY: get_rpa_minimax_coeff,&

                                              get_rpa_minimax_coeff_larger_grid

   USE mp2_gpw,                         ONLY: create_mat_munu

   USE mp2_grids,                       ONLY: get_l_sq_wghts_cos_tf_t_to_w,&

                                              get_l_sq_wghts_cos_tf_w_to_t,&

                                              get_l_sq_wghts_sin_tf_t_to_w

   USE mp2_ri_2c,                       ONLY: trunc_coulomb_for_exchange

   USE parallel_gemm_api,               ONLY: parallel_gemm

   USE particle_methods,                ONLY: get_particle_set

   USE particle_types,                  ONLY: particle_type

   USE physcon,                         ONLY: angstrom,&

                                              evolt

   USE post_scf_bandstructure_types,    ONLY: post_scf_bandstructure_type

   USE post_scf_bandstructure_utils,    ONLY: rsmat_to_kp

   USE qs_energy_types,                 ONLY: qs_energy_type

   USE qs_environment_types,            ONLY: get_qs_env,&

                                              qs_env_part_release,&

                                              qs_environment_type

   USE qs_integral_utils,               ONLY: basis_set_list_setup

   USE qs_interactions,                 ONLY: init_interaction_radii_orb_basis

   USE qs_kind_types,                   ONLY: get_qs_kind,&

                                              qs_kind_type

   USE qs_ks_methods,                   ONLY: qs_ks_build_kohn_sham_matrix

   USE qs_neighbor_list_types,          ONLY: neighbor_list_set_p_type,&

                                              release_neighbor_list_sets

   USE qs_tensors,                      ONLY: build_2c_integrals,&

                                              build_2c_neighbor_lists,&

                                              build_3c_integrals,&

                                              build_3c_neighbor_lists,&

                                              get_tensor_occupancy,&

                                              neighbor_list_3c_destroy

   USE qs_tensors_types,                ONLY: create_2c_tensor,&

                                              create_3c_tensor,&

                                              distribution_3d_create,&

                                              distribution_3d_type,&

                                              neighbor_list_3c_type

   USE rpa_gw,                          ONLY: continuation_pade

#include "base/base_uses.f90"


   IMPLICIT NONE


   PRIVATE


   PUBLIC :: create_and_init_bs_env_for_gw, de_init_bs_env, get_i_j_atoms, &

             kpoint_init_cell_index_simple, compute_xkp, time_to_freq, analyt_conti_and_print, &

             add_r, is_cell_in_index_to_cell, get_v_tr_r, power


   CHARACTER(len=*), PARAMETER, PRIVATE :: moduleN = 'gw_utils'


CONTAINS


! **************************************************************************************************

!> \brief ...

!> \param qs_env ...

!> \param bs_env ...

!> \param bs_sec ...

! **************************************************************************************************


   SUBROUTINE create_and_init_bs_env_for_gw(qs_env, bs_env, bs_sec)
      ! Driver for the GW setup of bs_env. It only sequences the private helper routines of
      ! this module; the order of the calls below is significant and must not be changed.
      !   qs_env : Quickstep environment handed on to the helpers
      !   bs_env : band-structure environment that is filled by the helpers
      !   bs_sec : input section from which the "GW" subsection is read
      TYPE(qs_environment_type), POINTER                 :: qs_env
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env
      TYPE(section_vals_type), POINTER                   :: bs_sec

      CHARACTER(LEN=*), PARAMETER :: routineN = 'create_and_init_bs_env_for_gw'

      INTEGER                                            :: timer_handle

      CALL timeset(routineN, timer_handle)

      CALL cite_reference(graml2024)

      ! --- input, basis sets and heuristics -----------------------------------------------------
      CALL read_gw_input_parameters(bs_env, bs_sec)
      CALL print_header_and_input_parameters(bs_env)
      CALL setup_ao_and_ri_basis_set(qs_env, bs_env)
      CALL get_ri_basis_and_basis_function_indices(qs_env, bs_env)
      CALL set_heuristic_parameters(bs_env, qs_env)

      ! libint is initialized here; the matching cleanup call is in de_init_bs_env
      CALL cp_libint_static_init()

      ! --- k-points, cells and parallelization --------------------------------------------------
      CALL setup_kpoints_chi_eps_w(bs_env, bs_env%kpoints_chi_eps_W)

      IF (bs_env%small_cell_full_kp_or_large_cell_Gamma == small_cell_full_kp) THEN
         CALL setup_cells_3c(qs_env, bs_env)
      END IF

      CALL set_parallelization_parameters(qs_env, bs_env)

      ! --- matrices and tensors -----------------------------------------------------------------
      CALL allocate_matrices(qs_env, bs_env)
      CALL compute_v_xc(qs_env, bs_env)
      CALL create_tensors(qs_env, bs_env)

      ! --- steps that depend on the selected GW algorithm ---------------------------------------
      IF (bs_env%small_cell_full_kp_or_large_cell_Gamma == large_cell_gamma) THEN

         CALL allocate_gw_eigenvalues(bs_env)
         CALL check_sparsity_3c(qs_env, bs_env)
         CALL set_sparsity_parallelization_parameters(bs_env)
         CALL check_for_restart_files(qs_env, bs_env)

      ELSE IF (bs_env%small_cell_full_kp_or_large_cell_Gamma == small_cell_full_kp) THEN

         CALL compute_3c_integrals(qs_env, bs_env)
         CALL setup_cells_delta_r(bs_env)
         CALL setup_parallelization_delta_r(bs_env)
         CALL allocate_matrices_small_cell_full_kp(qs_env, bs_env)
         CALL trafo_v_xc_r_to_kp(qs_env, bs_env)
         CALL heuristic_ri_regularization(qs_env, bs_env)

      END IF

      CALL setup_time_and_frequency_minimax_grid(bs_env)

      ! Free memory held in qs_env, but only when no LDOS is requested: the LDOS needs the
      ! real-space grid operations in pw_env and the task_list.
      ! Recommendation in case of memory issues: first run the GW calculation without the LDOS
      ! (to save memory), then use the GW restart files in a subsequent calculation to compute
      ! the LDOS.
      ! Marek : TODO - boolean that does not interfere with RTP init but sets this to correct value
      ! NOTE: the literal .FALSE. below currently disables this release unconditionally.
      IF (.NOT. bs_env%do_ldos .AND. .FALSE.) THEN
         CALL qs_env_part_release(qs_env)
      END IF

      CALL timestop(timer_handle)

   END SUBROUTINE create_and_init_bs_env_for_gw


! **************************************************************************************************

!> \brief ...

!> \param bs_env ...

! **************************************************************************************************


   SUBROUTINE de_init_bs_env(bs_env)
      ! Releases quantities of bs_env that
      !   1. cannot be deallocated in bs_env_release because of circular dependencies, or
      !   2. consume a lot of memory and should not live until bs_env_release is called.
      ! It also performs the static libint cleanup.
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER                        :: routineN = 'de_init_bs_env'

      INTEGER                                            :: timer_handle
      LOGICAL                                            :: retain_nl_3c

      CALL timeset(routineN, timer_handle)

      ! the 3c neighbor list is kept only if it exists and the RTP method is BSE
      retain_nl_3c = ASSOCIATED(bs_env%nl_3c%ij_list) .AND. (bs_env%rtp_method == rtp_method_bse)

      IF (.NOT. retain_nl_3c) THEN
         CALL neighbor_list_3c_destroy(bs_env%nl_3c)
      ELSE IF (bs_env%unit_nr > 0) THEN
         WRITE (bs_env%unit_nr, *) "Retaining nl_3c for RTBSE"
      END IF

      CALL cp_libint_static_cleanup()

      CALL timestop(timer_handle)

   END SUBROUTINE de_init_bs_env


! **************************************************************************************************

!> \brief ...

!> \param bs_env ...

!> \param bs_sec ...

! **************************************************************************************************

   SUBROUTINE read_gw_input_parameters(bs_env, bs_sec)
      ! Copies the keyword values of the "GW" subsection of bs_sec into bs_env.
      ! The reads are independent of each other and are grouped by value type.
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env
      TYPE(section_vals_type), POINTER                   :: bs_sec

      CHARACTER(LEN=*), PARAMETER :: routineN = 'read_gw_input_parameters'

      INTEGER                                            :: timer_handle
      TYPE(section_vals_type), POINTER                   :: gw_section

      CALL timeset(routineN, timer_handle)

      gw_section => section_vals_get_subs_vals(bs_sec, "GW")

      ! integer keywords
      CALL section_vals_val_get(gw_section, "NUM_TIME_FREQ_POINTS", &
                                i_val=bs_env%num_time_freq_points)
      CALL section_vals_val_get(gw_section, "SIZE_LATTICE_SUM", &
                                i_val=bs_env%size_lattice_sum_V)
      CALL section_vals_val_get(gw_section, "KPOINTS_W", &
                                i_vals=bs_env%nkp_grid_chi_eps_W_input)

      ! real keywords
      CALL section_vals_val_get(gw_section, "EPS_FILTER", &
                                r_val=bs_env%eps_filter)
      CALL section_vals_val_get(gw_section, "REGULARIZATION_RI", &
                                r_val=bs_env%input_regularization_RI)
      CALL section_vals_val_get(gw_section, "REGULARIZATION_MINIMAX", &
                                r_val=bs_env%input_regularization_minimax)
      CALL section_vals_val_get(gw_section, "CUTOFF_RADIUS_RI", &
                                r_val=bs_env%ri_metric%cutoff_radius)
      CALL section_vals_val_get(gw_section, "MEMORY_PER_PROC", &
                                r_val=bs_env%input_memory_per_proc_GB)
      CALL section_vals_val_get(gw_section, "FREQ_MAX_FIT", &
                                r_val=bs_env%freq_max_fit)

      ! logical keywords
      CALL section_vals_val_get(gw_section, "APPROX_KP_EXTRAPOL", &
                                l_val=bs_env%approx_kp_extrapol)
      CALL section_vals_val_get(gw_section, "HEDIN_SHIFT", &
                                l_val=bs_env%do_hedin_shift)

      CALL timestop(timer_handle)

   END SUBROUTINE read_gw_input_parameters


! **************************************************************************************************

!> \brief ...

!> \param qs_env ...

!> \param bs_env ...

! **************************************************************************************************

   SUBROUTINE setup_ao_and_ri_basis_set(qs_env, bs_env)
      ! Allocates and fills the per-kind basis set lists (basis types "RI_AUX" and "ORB") and the
      ! per-atom nsgf arrays bs_env%sizes_RI / bs_env%sizes_AO.
      TYPE(qs_environment_type), POINTER                 :: qs_env
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER :: routineN = 'setup_AO_and_RI_basis_set'

      INTEGER                                            :: n_atoms, n_kinds, timer_handle
      TYPE(particle_type), DIMENSION(:), POINTER         :: particles
      TYPE(qs_kind_type), DIMENSION(:), POINTER          :: kinds

      CALL timeset(routineN, timer_handle)

      CALL get_qs_env(qs_env, qs_kind_set=kinds, particle_set=particles, &
                      natom=n_atoms, nkind=n_kinds)

      ! storage: one entry per atom for the sizes, one entry per kind for the basis sets
      ALLOCATE (bs_env%sizes_RI(n_atoms))
      ALLOCATE (bs_env%sizes_AO(n_atoms))
      ALLOCATE (bs_env%basis_set_RI(n_kinds))
      ALLOCATE (bs_env%basis_set_AO(n_kinds))

      ! auxiliary (RI) basis
      CALL basis_set_list_setup(bs_env%basis_set_RI, "RI_AUX", kinds)
      CALL get_particle_set(particles, kinds, nsgf=bs_env%sizes_RI, &
                            basis=bs_env%basis_set_RI)

      ! orbital (AO) basis
      CALL basis_set_list_setup(bs_env%basis_set_AO, "ORB", kinds)
      CALL get_particle_set(particles, kinds, nsgf=bs_env%sizes_AO, &
                            basis=bs_env%basis_set_AO)

      CALL timestop(timer_handle)

   END SUBROUTINE setup_ao_and_ri_basis_set


! **************************************************************************************************

!> \brief ...

!> \param qs_env ...

!> \param bs_env ...

! **************************************************************************************************

   SUBROUTINE get_ri_basis_and_basis_function_indices(qs_env, bs_env)
      ! Determines, for every atom, the first and last global index of its RI ("RI_AUX") and
      ! AO ("ORB") basis functions and stores them in bs_env. Additionally sets
      !   bs_env%n_RI               : total number of RI basis functions
      !   bs_env%max_AO_bf_per_atom : largest number of AO basis functions on a single atom
      !   bs_env%l_RI               : angular momentum of every RI basis function
      ! Aborts if a kind has no RI_AUX basis set, and asserts that the AO count matches
      ! bs_env%n_ao and that every RI set contains a single angular momentum (lmin == lmax).
      TYPE(qs_environment_type), POINTER                 :: qs_env
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER :: routineN = 'get_RI_basis_and_basis_function_indices'

      INTEGER                                            :: handle, i_ri, iatom, ikind, iset, &
                                                            max_ao_bf_per_atom, n_ao_test, n_atom, &
                                                            n_kind, n_ri, nset, nsgf, u
      INTEGER, ALLOCATABLE, DIMENSION(:)                 :: kind_of
      INTEGER, DIMENSION(:), POINTER                     :: l_max, l_min, nsgf_set
      TYPE(atomic_kind_type), DIMENSION(:), POINTER      :: atomic_kind_set
      TYPE(gto_basis_set_type), POINTER                  :: basis_set_a
      TYPE(qs_kind_type), DIMENSION(:), POINTER          :: qs_kind_set

      CALL timeset(routineN, handle)

      ! determine RI basis set size
      CALL get_qs_env(qs_env, atomic_kind_set=atomic_kind_set, qs_kind_set=qs_kind_set)

      n_kind = SIZE(qs_kind_set)
      n_atom = bs_env%n_atom

      CALL get_atomic_kind_set(atomic_kind_set, kind_of=kind_of)

      ! every kind must carry an RI_AUX basis set
      DO ikind = 1, n_kind
         CALL get_qs_kind(qs_kind=qs_kind_set(ikind), basis_set=basis_set_a, &
                          basis_type="RI_AUX")
         IF (.NOT. ASSOCIATED(basis_set_a)) THEN
            CALL cp_abort(__LOCATION__, &
                          "At least one RI_AUX basis set was not explicitly invoked in &KIND-section.")
         END IF
      END DO

      ALLOCATE (bs_env%i_RI_start_from_atom(n_atom))
      ALLOCATE (bs_env%i_RI_end_from_atom(n_atom))
      ALLOCATE (bs_env%i_ao_start_from_atom(n_atom))
      ALLOCATE (bs_env%i_ao_end_from_atom(n_atom))

      ! running count over atoms gives the first/last RI index of each atom
      n_ri = 0
      DO iatom = 1, n_atom
         bs_env%i_RI_start_from_atom(iatom) = n_ri + 1
         ikind = kind_of(iatom)
         CALL get_qs_kind(qs_kind=qs_kind_set(ikind), nsgf=nsgf, basis_type="RI_AUX")
         n_ri = n_ri + nsgf
         bs_env%i_RI_end_from_atom(iatom) = n_ri
      END DO
      bs_env%n_RI = n_ri

      ! same for the AO basis; also track the largest per-atom AO block
      max_ao_bf_per_atom = 0
      n_ao_test = 0
      DO iatom = 1, n_atom
         bs_env%i_ao_start_from_atom(iatom) = n_ao_test + 1
         ikind = kind_of(iatom)
         CALL get_qs_kind(qs_kind=qs_kind_set(ikind), nsgf=nsgf, basis_type="ORB")
         n_ao_test = n_ao_test + nsgf
         bs_env%i_ao_end_from_atom(iatom) = n_ao_test
         max_ao_bf_per_atom = MAX(max_ao_bf_per_atom, nsgf)
      END DO
      CPASSERT(n_ao_test == bs_env%n_ao)
      bs_env%max_AO_bf_per_atom = max_ao_bf_per_atom

      ! angular momentum of every RI basis function, set by set
      ALLOCATE (bs_env%l_RI(n_ri))
      i_ri = 0
      DO iatom = 1, n_atom
         ikind = kind_of(iatom)

         nset = bs_env%basis_set_RI(ikind)%gto_basis_set%nset
         l_max => bs_env%basis_set_RI(ikind)%gto_basis_set%lmax
         l_min => bs_env%basis_set_RI(ikind)%gto_basis_set%lmin
         nsgf_set => bs_env%basis_set_RI(ikind)%gto_basis_set%nsgf_set

         DO iset = 1, nset
            ! a single l per set is required, otherwise l_RI could not be filled per set
            CPASSERT(l_max(iset) == l_min(iset))
            bs_env%l_RI(i_ri + 1:i_ri + nsgf_set(iset)) = l_max(iset)
            i_ri = i_ri + nsgf_set(iset)
         END DO

      END DO
      CPASSERT(i_ri == n_ri)

      u = bs_env%unit_nr

      IF (u > 0) THEN
         WRITE (u, FMT="(T2,A)") " "
         WRITE (u, FMT="(T2,2A,T75,I8)") "Number of auxiliary Gaussian basis functions ", &
            "for χ, ε, W", n_ri
      END IF

      CALL timestop(handle)

   END SUBROUTINE get_ri_basis_and_basis_function_indices


! **************************************************************************************************

!> \brief ...

!> \param bs_env ...

!> \param kpoints ...

! **************************************************************************************************

   SUBROUTINE setup_kpoints_chi_eps_w(bs_env, kpoints)
      ! Creates the k-point object used for χ, ε and W. Two meshes are stored back to back in
      ! kpoints%xkp: the "original" mesh (first nkp_orig points) and an "extra" mesh (following
      ! nkp_extra points); the weights kpoints%wkp are built by compute_wkp from the sizes of
      ! both meshes so that the two meshes are extrapolated against each other.
      !   bs_env  : provides periodicity, input mesh and GW algorithm; receives mesh sizes,
      !             weights (wkp_no_extra, wkp_s_p, wkp_orig) and the k-point batch settings
      !   kpoints : nullified and newly created here
      ! Mesh selection:
      !   all three KPOINTS_W entries > 0   : mesh from input, extra mesh is twice as dense
      !   all three KPOINTS_W entries == -1 : automatic mesh depending on the GW algorithm
      !   anything else                     : abort
      ! Non-periodic directions always get a single k-point.

      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env
      TYPE(kpoint_type), POINTER                         :: kpoints

      CHARACTER(LEN=*), PARAMETER :: routineN = 'setup_kpoints_chi_eps_W'

      INTEGER                                            :: handle, i_dim, n_dim, nkp, nkp_extra, &
                                                            nkp_orig, u
      INTEGER, DIMENSION(3)                              :: nkp_grid, nkp_grid_extra, periodic
      REAL(KIND=dp)                                      :: exp_s_p, n_dim_inv

      CALL timeset(routineN, handle)

      ! routine adapted from mp2_integrals.F
      NULLIFY (kpoints)
      CALL kpoint_create(kpoints)

      kpoints%kp_scheme = "GENERAL"

      periodic(1:3) = bs_env%periodic(1:3)

      CPASSERT(SIZE(bs_env%nkp_grid_chi_eps_W_input) == 3)

      IF (bs_env%nkp_grid_chi_eps_W_input(1) > 0 .AND. &
          bs_env%nkp_grid_chi_eps_W_input(2) > 0 .AND. &
          bs_env%nkp_grid_chi_eps_W_input(3) > 0) THEN
         ! 1. k-point mesh for χ, ε, W from input
         DO i_dim = 1, 3
            SELECT CASE (periodic(i_dim))
            CASE (0)
               nkp_grid(i_dim) = 1
               nkp_grid_extra(i_dim) = 1
            CASE (1)
               nkp_grid(i_dim) = bs_env%nkp_grid_chi_eps_W_input(i_dim)
               nkp_grid_extra(i_dim) = nkp_grid(i_dim)*2
            CASE DEFAULT
               CPABORT("Error in periodicity.")
            END SELECT
         END DO

      ELSE IF (bs_env%nkp_grid_chi_eps_W_input(1) == -1 .AND. &
               bs_env%nkp_grid_chi_eps_W_input(2) == -1 .AND. &
               bs_env%nkp_grid_chi_eps_W_input(3) == -1) THEN
         ! 2. automatic k-point mesh for χ, ε, W

         DO i_dim = 1, 3

            CPASSERT(periodic(i_dim) == 0 .OR. periodic(i_dim) == 1)

            SELECT CASE (periodic(i_dim))
            CASE (0)
               nkp_grid(i_dim) = 1
               nkp_grid_extra(i_dim) = 1
            CASE (1)
               SELECT CASE (bs_env%small_cell_full_kp_or_large_cell_Gamma)
               CASE (large_cell_gamma)
                  nkp_grid(i_dim) = 4
                  nkp_grid_extra(i_dim) = 6
               CASE (small_cell_full_kp)
                  ! multiples of the SCF k-point mesh
                  nkp_grid(i_dim) = bs_env%kpoints_scf_desymm%nkp_grid(i_dim)*4
                  nkp_grid_extra(i_dim) = bs_env%kpoints_scf_desymm%nkp_grid(i_dim)*8
               END SELECT
            CASE DEFAULT
               CPABORT("Error in periodicity.")
            END SELECT

         END DO

      ELSE

         CPABORT("An error occured when setting up the k-mesh for W.")

      END IF

      ! only half of each mesh is stored (integer division by 2); at least one point is kept
      ! for the original mesh, the extra mesh is empty (0 points) for a 1x1x1 grid
      nkp_orig = MAX(nkp_grid(1)*nkp_grid(2)*nkp_grid(3)/2, 1)

      nkp_extra = nkp_grid_extra(1)*nkp_grid_extra(2)*nkp_grid_extra(3)/2

      nkp = nkp_orig + nkp_extra

      kpoints%nkp_grid(1:3) = nkp_grid(1:3)
      kpoints%nkp = nkp

      bs_env%nkp_grid_chi_eps_W_orig(1:3) = nkp_grid(1:3)
      bs_env%nkp_grid_chi_eps_W_extra(1:3) = nkp_grid_extra(1:3)
      bs_env%nkp_chi_eps_W_orig = nkp_orig
      bs_env%nkp_chi_eps_W_extra = nkp_extra
      bs_env%nkp_chi_eps_W_orig_plus_extra = nkp

      ALLOCATE (kpoints%xkp(3, nkp), kpoints%wkp(nkp))
      ALLOCATE (bs_env%wkp_no_extra(nkp), bs_env%wkp_s_p(nkp))

      ! original mesh in columns 1..nkp_orig, extra mesh in columns nkp_orig+1..nkp
      CALL compute_xkp(kpoints%xkp, 1, nkp_orig, nkp_grid)
      CALL compute_xkp(kpoints%xkp, nkp_orig + 1, nkp, nkp_grid_extra)

      ! number of periodic directions
      n_dim = SUM(periodic)
      IF (n_dim == 0) THEN
         ! molecules
         kpoints%wkp(1) = 1.0_dp
         bs_env%wkp_s_p(1) = 1.0_dp
         bs_env%wkp_no_extra(1) = 1.0_dp
      ELSE

         n_dim_inv = 1.0_dp/REAL(n_dim, KIND=dp)

         ! k-point weights are chosen to automatically extrapolate the k-point mesh
         CALL compute_wkp(kpoints%wkp(1:nkp_orig), nkp_orig, nkp_extra, n_dim_inv)
         CALL compute_wkp(kpoints%wkp(nkp_orig + 1:nkp), nkp_extra, nkp_orig, n_dim_inv)

         ! weights without extrapolation: only the extra mesh contributes, uniformly
         bs_env%wkp_no_extra(1:nkp_orig) = 0.0_dp
         bs_env%wkp_no_extra(nkp_orig + 1:nkp) = 1.0_dp/REAL(nkp_extra, KIND=dp)

         IF (n_dim == 3) THEN
            ! W_PQ(k) for an s-function P and a p-function Q diverges as 1/k at k=0
            ! (instead of 1/k^2 for P and Q both being s-functions).
            exp_s_p = 2.0_dp*n_dim_inv
            CALL compute_wkp(bs_env%wkp_s_p(1:nkp_orig), nkp_orig, nkp_extra, exp_s_p)
            CALL compute_wkp(bs_env%wkp_s_p(nkp_orig + 1:nkp), nkp_extra, nkp_orig, exp_s_p)
         ELSE
            bs_env%wkp_s_p(1:nkp) = bs_env%wkp_no_extra(1:nkp)
         END IF

      END IF

      IF (bs_env%approx_kp_extrapol) THEN
         bs_env%wkp_orig = 1.0_dp/REAL(nkp_orig, KIND=dp)
      END IF

      ! heuristic parameter: how many k-points for χ, ε, and W are used simultaneously
      ! (less simultaneous k-points: less memory, but more computational effort because of
      !  recomputation of V(k))
      bs_env%nkp_chi_eps_W_batch = 4

      ! number of batches = ceiling(nkp / batch size), written with integer arithmetic
      bs_env%num_chi_eps_W_batches = (bs_env%nkp_chi_eps_W_orig_plus_extra - 1)/ &
                                     bs_env%nkp_chi_eps_W_batch + 1

      u = bs_env%unit_nr

      IF (u > 0) THEN
         WRITE (u, FMT="(T2,A)") " "
         WRITE (u, FMT="(T2,1A,T71,3I4)") "K-point mesh 1 for χ, ε, W", nkp_grid(1:3)
         WRITE (u, FMT="(T2,2A,T71,3I4)") "K-point mesh 2 for χ, ε, W ", &
            "(for k-point extrapolation of W)", nkp_grid_extra(1:3)
         WRITE (u, FMT="(T2,A,T80,L)") "Approximate the k-point extrapolation", &
            bs_env%approx_kp_extrapol
      END IF

      CALL timestop(handle)

   END SUBROUTINE setup_kpoints_chi_eps_w


! **************************************************************************************************

!> \brief ...

!> \param kpoints ...

!> \param qs_env ...

! **************************************************************************************************


   SUBROUTINE kpoint_init_cell_index_simple(kpoints, qs_env)
      ! Convenience wrapper around kpoint_init_cell_index: fetches para_env, dft_control and
      ! sab_orb from qs_env and forwards them together with kpoints.

      TYPE(kpoint_type), POINTER                         :: kpoints
      TYPE(qs_environment_type), POINTER                 :: qs_env

      CHARACTER(LEN=*), PARAMETER :: routineN = 'kpoint_init_cell_index_simple'

      INTEGER                                            :: timer_handle
      TYPE(dft_control_type), POINTER                    :: control
      TYPE(mp_para_env_type), POINTER                    :: parallel_env
      TYPE(neighbor_list_set_p_type), DIMENSION(:), &
         POINTER                                         :: orb_neighbor_lists

      CALL timeset(routineN, timer_handle)

      NULLIFY (control)
      NULLIFY (parallel_env)
      NULLIFY (orb_neighbor_lists)

      CALL get_qs_env(qs_env=qs_env, &
                      para_env=parallel_env, &
                      dft_control=control, &
                      sab_orb=orb_neighbor_lists)

      CALL kpoint_init_cell_index(kpoints, orb_neighbor_lists, parallel_env, control)

      CALL timestop(timer_handle)

   END SUBROUTINE kpoint_init_cell_index_simple


! **************************************************************************************************

!> \brief ...

!> \param xkp ...

!> \param ikp_start ...

!> \param ikp_end ...

!> \param grid ...

! **************************************************************************************************


   SUBROUTINE compute_xkp(xkp, ikp_start, ikp_end, grid)
      ! Writes points of a regular mesh with grid(1:3) points per direction into the columns
      ! ikp_start..ikp_end of xkp. Along direction d the coordinate of mesh index j (1..grid(d))
      ! is (2*j - grid(d) - 1)/(2*grid(d)). The mesh is traversed with the third index running
      ! fastest; as soon as column ikp_end has been written, the remaining mesh points are
      ! skipped, so only the first (ikp_end - ikp_start + 1) points of the mesh are stored.

      REAL(KIND=dp), DIMENSION(:, :), POINTER            :: xkp
      INTEGER                                            :: ikp_start, ikp_end
      INTEGER, DIMENSION(3)                              :: grid

      CHARACTER(LEN=*), PARAMETER                        :: routineN = 'compute_xkp'

      INTEGER                                            :: ikp, jx, jy, jz, timer_handle
      REAL(KIND=dp)                                      :: x_coord, y_coord
      REAL(KIND=dp), DIMENSION(3)                        :: twice_grid

      CALL timeset(routineN, timer_handle)

      ! common denominators 2*grid(d)
      twice_grid(1:3) = 2._dp*REAL(grid(1:3), KIND=dp)

      ikp = ikp_start
      DO jx = 1, grid(1)
         x_coord = REAL(2*jx - grid(1) - 1, KIND=dp)/twice_grid(1)
         DO jy = 1, grid(2)
            y_coord = REAL(2*jy - grid(2) - 1, KIND=dp)/twice_grid(2)
            DO jz = 1, grid(3)

               ! nothing is stored once the requested column range is full
               IF (ikp <= ikp_end) THEN
                  xkp(1, ikp) = x_coord
                  xkp(2, ikp) = y_coord
                  xkp(3, ikp) = REAL(2*jz - grid(3) - 1, KIND=dp)/twice_grid(3)
                  ikp = ikp + 1
               END IF

            END DO
         END DO
      END DO

      CALL timestop(timer_handle)

   END SUBROUTINE compute_xkp


! **************************************************************************************************

!> \brief ...

!> \param wkp ...

!> \param nkp_1 ...

!> \param nkp_2 ...

!> \param exponent ...

! **************************************************************************************************

   SUBROUTINE compute_wkp(wkp, nkp_1, nkp_2, exponent)
      ! Sets every element of wkp to the same weight
      !    1/nkp_1 / (1 - (nkp_2/nkp_1)**exponent)
      !   wkp      : weights to be filled (all elements get the same value)
      !   nkp_1    : number of k-points of the mesh the weights belong to
      !   nkp_2    : number of k-points of the other mesh
      !   exponent : exponent applied to the ratio nkp_2/nkp_1
      REAL(KIND=dp), DIMENSION(:)                        :: wkp
      INTEGER                                            :: nkp_1, nkp_2
      REAL(KIND=dp)                                      :: exponent

      CHARACTER(LEN=*), PARAMETER                        :: routineN = 'compute_wkp'

      INTEGER                                            :: timer_handle
      REAL(KIND=dp)                                      :: mesh_ratio, weight

      CALL timeset(routineN, timer_handle)

      mesh_ratio = REAL(nkp_2, KIND=dp)/REAL(nkp_1, KIND=dp)

      ! evaluated once and broadcast to the whole array
      weight = 1.0_dp/REAL(nkp_1, KIND=dp)/(1.0_dp - mesh_ratio**exponent)
      wkp(:) = weight

      CALL timestop(timer_handle)

   END SUBROUTINE compute_wkp


! **************************************************************************************************

!> \brief ...

!> \param qs_env ...

!> \param bs_env ...

! **************************************************************************************************

   SUBROUTINE allocate_matrices(qs_env, bs_env)
      ! Creates the full matrices and dbcsr matrices of bs_env that are needed afterwards:
      !   - fm_Gocc, fm_Gvir with the matrix structure of bs_env%fm_ks_Gamma(1)
      !   - fm_RI_RI, fm_chi_Gamma_freq, fm_W_MIC_freq (n_RI x n_RI); if approx_kp_extrapol is
      !     set, also fm_W_MIC_freq_1_extra / fm_W_MIC_freq_1_no_extra, initialized to zero
      !   - mat_ao_ao_tensor, mat_RI_RI_tensor (blacs env of para_env_tensor) and mat_RI_RI
      !   - mat_chi_Gamma_tau: one matrix per time/frequency point, templated on mat_RI_RI
      TYPE(qs_environment_type), POINTER                 :: qs_env
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER                        :: routineN = 'allocate_matrices'

      INTEGER                                            :: i_point, timer_handle
      TYPE(cp_blacs_env_type), POINTER                   :: blacs_global, blacs_tensor_group
      TYPE(cp_fm_struct_type), POINTER                   :: struct_ks, struct_ri
      TYPE(mp_para_env_type), POINTER                    :: parallel_env

      CALL timeset(routineN, timer_handle)

      CALL get_qs_env(qs_env, para_env=parallel_env, blacs_env=blacs_global)

      ! --- full matrices sharing the structure of the Gamma-point KS matrix ---------------------
      struct_ks => bs_env%fm_ks_Gamma(1)%matrix_struct
      CALL cp_fm_create(bs_env%fm_Gocc, struct_ks)
      CALL cp_fm_create(bs_env%fm_Gvir, struct_ks)

      ! --- full n_RI x n_RI matrices ------------------------------------------------------------
      NULLIFY (struct_ri)
      CALL cp_fm_struct_create(struct_ri, context=blacs_global, &
                               nrow_global=bs_env%n_RI, ncol_global=bs_env%n_RI, &
                               para_env=parallel_env)

      CALL cp_fm_create(bs_env%fm_RI_RI, struct_ri)
      CALL cp_fm_create(bs_env%fm_chi_Gamma_freq, struct_ri)
      CALL cp_fm_create(bs_env%fm_W_MIC_freq, struct_ri)

      IF (bs_env%approx_kp_extrapol) THEN
         CALL cp_fm_create(bs_env%fm_W_MIC_freq_1_extra, struct_ri)
         CALL cp_fm_create(bs_env%fm_W_MIC_freq_1_no_extra, struct_ri)
         CALL cp_fm_set_all(bs_env%fm_W_MIC_freq_1_extra, 0.0_dp)
         CALL cp_fm_set_all(bs_env%fm_W_MIC_freq_1_no_extra, 0.0_dp)
      END IF

      CALL cp_fm_struct_release(struct_ri)

      ! --- dbcsr matrices -----------------------------------------------------------------------
      ! blacs environment for the subgroups used in tensor operations
      NULLIFY (blacs_tensor_group)
      CALL cp_blacs_env_create(blacs_env=blacs_tensor_group, para_env=bs_env%para_env_tensor)

      ! The dbcsr matrices in the tensor subgroup are allocated with all atomic blocks although
      ! only a small subset of the blocks is actually needed there. One might think of creating
      ! a dbcsr matrix that holds only the required blocks.
      CALL create_mat_munu(bs_env%mat_ao_ao_tensor, qs_env, bs_env%eps_atom_grid_2d_mat, &
                           blacs_tensor_group, do_ri_aux_basis=.FALSE.)

      CALL create_mat_munu(bs_env%mat_RI_RI_tensor, qs_env, bs_env%eps_atom_grid_2d_mat, &
                           blacs_tensor_group, do_ri_aux_basis=.TRUE.)

      CALL create_mat_munu(bs_env%mat_RI_RI, qs_env, bs_env%eps_atom_grid_2d_mat, &
                           blacs_global, do_ri_aux_basis=.TRUE.)

      CALL cp_blacs_env_release(blacs_tensor_group)

      ! one matrix per time/frequency point, each created from the mat_RI_RI template
      NULLIFY (bs_env%mat_chi_Gamma_tau)
      CALL dbcsr_allocate_matrix_set(bs_env%mat_chi_Gamma_tau, bs_env%num_time_freq_points)

      DO i_point = 1, bs_env%num_time_freq_points
         ALLOCATE (bs_env%mat_chi_Gamma_tau(i_point)%matrix)
         CALL dbcsr_create(bs_env%mat_chi_Gamma_tau(i_point)%matrix, &
                           template=bs_env%mat_RI_RI%matrix)
      END DO

      CALL timestop(timer_handle)

   END SUBROUTINE allocate_matrices


! **************************************************************************************************
!> \brief Allocates the arrays bs_env%eigenval_G0W0 and bs_env%eigenval_HF, both with shape
!>        (n_ao, nkp_bs_and_DOS, n_spin); the arrays are not initialized here
!> \param bs_env provides the three extents and receives the allocated arrays
! **************************************************************************************************
   SUBROUTINE allocate_gw_eigenvalues(bs_env)
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER :: routineN = 'allocate_GW_eigenvalues'

      INTEGER                                            :: handle

      CALL timeset(routineN, handle)

      ! both arrays share the same extents
      ASSOCIATE (n_level => bs_env%n_ao, n_kp => bs_env%nkp_bs_and_DOS, n_spin => bs_env%n_spin)
         ALLOCATE (bs_env%eigenval_G0W0(n_level, n_kp, n_spin))
         ALLOCATE (bs_env%eigenval_HF(n_level, n_kp, n_spin))
      END ASSOCIATE

      CALL timestop(handle)

   END SUBROUTINE allocate_gw_eigenvalues


! **************************************************************************************************
!> \brief Initializes the interaction radii of the basis sets and creates the 3-index tensors
!>        t_RI_AO__AO and t_RI__AO_AO as well as the 2-index tensors (via create_2c_t) in the
!>        tensor subgroup; the 3c neighbor list bs_env%nl_3c is built along with t_RI_AO__AO
!> \param qs_env passed on to create_3c_t for building the neighbor list
!> \param bs_env provides block sizes and para_env_tensor; receives tensors and nl_3c
! **************************************************************************************************
   SUBROUTINE create_tensors(qs_env, bs_env)
      TYPE(qs_environment_type), POINTER                 :: qs_env
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER                        :: routineN = 'create_tensors'

      INTEGER                                            :: handle

      CALL timeset(routineN, handle)

      CALL init_interaction_radii(bs_env)

      ! standard atomic blocks are used: splitting blocks does not improve the load
      ! balancing/efficiency of the tensor contractions

      ! tensor "(RI AO | AO)" with index mapping [1, 2] | [3]; the neighbor list is requested here
      CALL create_3c_t(tensor=bs_env%t_RI_AO__AO, &
                       para_env=bs_env%para_env_tensor, &
                       tensor_name="(RI AO | AO)", &
                       map1=[1, 2], map2=[3], &
                       sizes_RI=bs_env%sizes_RI, sizes_AO=bs_env%sizes_AO, &
                       create_nl_3c=.TRUE., nl_3c=bs_env%nl_3c, qs_env=qs_env)

      ! tensor "(RI | AO AO)" with index mapping [1] | [2, 3]; no neighbor list
      CALL create_3c_t(tensor=bs_env%t_RI__AO_AO, &
                       para_env=bs_env%para_env_tensor, &
                       tensor_name="(RI | AO AO)", &
                       map1=[1], map2=[2, 3], &
                       sizes_RI=bs_env%sizes_RI, sizes_AO=bs_env%sizes_AO)

      CALL create_2c_t(bs_env, bs_env%sizes_RI, bs_env%sizes_AO)

      CALL timestop(handle)

   END SUBROUTINE create_tensors


! **************************************************************************************************
!> \brief Measures the sparsity of the 3-center integral tensor (µν|P): the integrals are built
!>        in slabs of RI atoms on bs_env%para_env, filtered with bs_env%eps_filter, and for each
!>        slab the number of non-zero elements, the occupation and the largest distance between
!>        the two AO atoms of a remaining block are accumulated. The summed occupation and the
!>        maximum distance are stored in bs_env and a summary is printed on bs_env%unit_nr.
!> \param qs_env passed to the neighbor list, integral and distance routines
!> \param bs_env provides basis sets, thresholds and para_env; receives occupation_3c_int and
!>        max_dist_AO_atoms
! **************************************************************************************************
   SUBROUTINE check_sparsity_3c(qs_env, bs_env)
      TYPE(qs_environment_type), POINTER                 :: qs_env
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER                        :: routineN = 'check_sparsity_3c'

      INTEGER                                            :: handle, n_atom_step, RI_atom
      INTEGER(int_8)                                     :: mem, non_zero_elements_sum, nze
      REAL(dp)                                           :: max_dist_AO_atoms, occ, occupation_sum
      REAL(KIND=dp)                                      :: t1, t2
      TYPE(dbt_type)                                     :: t_3c_global
      TYPE(dbt_type), ALLOCATABLE, DIMENSION(:, :)       :: t_3c_global_array
      TYPE(neighbor_list_3c_type)                        :: nl_3c_global

      CALL timeset(routineN, handle)

      ! check the sparsity of 3c integral tensor (µν|P); calculate maximum distance between
      ! AO atoms µ, ν where at least a single integral (µν|P) is larger than the filter threshold
      CALL create_3c_t(t_3c_global, bs_env%para_env, "(RI AO | AO)", [1, 2], [3], &
                       bs_env%sizes_RI, bs_env%sizes_AO, &
                       create_nl_3c=.TRUE., nl_3c=nl_3c_global, qs_env=qs_env)

      ! NOTE(review): mem is not used afterwards in this routine
      CALL m_memory(mem)
      CALL bs_env%para_env%max(mem)

      ! build_3c_integrals takes a 2d array of tensors; a single element is sufficient here
      ALLOCATE (t_3c_global_array(1, 1))
      CALL dbt_create(t_3c_global, t_3c_global_array(1, 1))

      CALL bs_env%para_env%sync()
      t1 = m_walltime()

      occupation_sum = 0.0_dp
      non_zero_elements_sum = 0
      max_dist_AO_atoms = 0.0_dp

      ! slab width in RI atoms; at least 1 because a DO stride of zero is not allowed
      n_atom_step = MAX(1, INT(SQRT(REAL(bs_env%n_atom, KIND=dp))))

      ! do not compute full 3c integrals at once because it may cause out of memory
      DO RI_atom = 1, bs_env%n_atom, n_atom_step

         CALL build_3c_integrals(t_3c_global_array, &
                                 bs_env%eps_filter, &
                                 qs_env, &
                                 nl_3c_global, &
                                 int_eps=bs_env%eps_filter, &
                                 basis_i=bs_env%basis_set_RI, &
                                 basis_j=bs_env%basis_set_AO, &
                                 basis_k=bs_env%basis_set_AO, &
                                 bounds_i=[RI_atom, MIN(RI_atom + n_atom_step - 1, bs_env%n_atom)], &
                                 potential_parameter=bs_env%ri_metric, &
                                 desymmetrize=.FALSE.)

         CALL dbt_filter(t_3c_global_array(1, 1), bs_env%eps_filter)

         CALL bs_env%para_env%sync()

         ! accumulate the statistics of this slab
         CALL get_tensor_occupancy(t_3c_global_array(1, 1), nze, occ)
         non_zero_elements_sum = non_zero_elements_sum + nze
         occupation_sum = occupation_sum + occ

         CALL get_max_dist_AO_atoms(t_3c_global_array(1, 1), max_dist_AO_atoms, qs_env)

         ! drop the integrals of this slab before the next one is computed
         CALL dbt_clear(t_3c_global_array(1, 1))

      END DO

      t2 = m_walltime()

      bs_env%occupation_3c_int = occupation_sum
      bs_env%max_dist_AO_atoms = max_dist_AO_atoms

      CALL dbt_destroy(t_3c_global)
      CALL dbt_destroy(t_3c_global_array(1, 1))
      DEALLOCATE (t_3c_global_array)

      CALL neighbor_list_3c_destroy(nl_3c_global)

      IF (bs_env%unit_nr > 0) THEN
         WRITE (bs_env%unit_nr, '(T2,A)') ''
         WRITE (bs_env%unit_nr, '(T2,A,F27.1,A)') &
            'Computed 3-center integrals (µν|P), execution time', t2 - t1, ' s'
         WRITE (bs_env%unit_nr, '(T2,A,F48.3,A)') 'Percentage of non-zero (µν|P)', &
            occupation_sum*100, ' %'
         WRITE (bs_env%unit_nr, '(T2,A,F33.1,A)') 'Max. distance between µ,ν in non-zero (µν|P)', &
            max_dist_AO_atoms*angstrom, ' A'
         ! 8 bytes per stored element, converted to GB
         WRITE (bs_env%unit_nr, '(T2,2A,I20,A)') 'Required memory if storing all 3-center ', &
            'integrals (µν|P)', INT(REAL(non_zero_elements_sum, KIND=dp)*8.0E-9_dp), ' GB'
      END IF

      CALL timestop(handle)

   END SUBROUTINE check_sparsity_3c


! **************************************************************************************************
!> \brief Creates the three 2-index tensors bs_env%t_G ("(AO | AO)"), bs_env%t_chi and
!>        bs_env%t_W (both "(RI | RI)") on a 2d process grid built from bs_env%para_env_tensor
!> \param bs_env provides para_env_tensor and receives the tensors
!> \param sizes_RI block sizes used for both dimensions of t_chi and t_W
!> \param sizes_AO block sizes used for both dimensions of t_G
! **************************************************************************************************
   SUBROUTINE create_2c_t(bs_env, sizes_RI, sizes_AO)
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env
      INTEGER, ALLOCATABLE, DIMENSION(:)                 :: sizes_RI, sizes_AO

      CHARACTER(LEN=*), PARAMETER                        :: routineN = 'create_2c_t'

      INTEGER                                            :: handle
      INTEGER, ALLOCATABLE, DIMENSION(:)                 :: blk_dist_col, blk_dist_row
      INTEGER, DIMENSION(2)                              :: grid_dims
      TYPE(dbt_pgrid_type)                               :: pgrid

      CALL timeset(routineN, handle)

      ! inspired from rpa_im_time.F / hfx_types.F

      ! grid dimensions are passed as zeros (presumably the grid shape is then chosen by
      ! dbt_pgrid_create - TODO confirm)
      grid_dims(:) = 0
      CALL dbt_pgrid_create(bs_env%para_env_tensor, grid_dims, pgrid)

      ! the distribution arrays returned by create_2c_tensor are not needed afterwards and
      ! are freed after every call

      ! AO x AO tensor
      CALL create_2c_tensor(bs_env%t_G, blk_dist_row, blk_dist_col, pgrid, &
                            sizes_AO, sizes_AO, name="(AO | AO)")
      DEALLOCATE (blk_dist_row, blk_dist_col)

      ! RI x RI tensors
      CALL create_2c_tensor(bs_env%t_chi, blk_dist_row, blk_dist_col, pgrid, &
                            sizes_RI, sizes_RI, name="(RI | RI)")
      DEALLOCATE (blk_dist_row, blk_dist_col)

      CALL create_2c_tensor(bs_env%t_W, blk_dist_row, blk_dist_col, pgrid, &
                            sizes_RI, sizes_RI, name="(RI | RI)")
      DEALLOCATE (blk_dist_row, blk_dist_col)

      CALL dbt_pgrid_destroy(pgrid)

      CALL timestop(handle)

   END SUBROUTINE create_2c_t


! **************************************************************************************************
!> \brief Creates a 3-index tensor with block sizes (sizes_RI, sizes_AO, sizes_AO) on a 3d
!>        process grid built from para_env and, on request, the matching 3-center neighbor list
!> \param tensor the tensor to be created
!> \param para_env parallel environment the process grid is created from
!> \param tensor_name name given to the tensor (exactly 12 characters)
!> \param map1 index mapping forwarded to create_3c_tensor
!> \param map2 index mapping forwarded to create_3c_tensor
!> \param sizes_RI block sizes of the first tensor dimension
!> \param sizes_AO block sizes of the second and third tensor dimension
!> \param create_nl_3c if present and .TRUE., nl_3c is built; nl_3c and qs_env are then accessed
!>        and have to be passed as well
!> \param nl_3c 3-center neighbor list, built from the basis sets and ri_metric of qs_env%bs_env
!> \param qs_env provides nkind, particle_set and bs_env for the neighbor list
! **************************************************************************************************
   SUBROUTINE create_3c_t(tensor, para_env, tensor_name, map1, map2, sizes_RI, sizes_AO, &
                          create_nl_3c, nl_3c, qs_env)
      TYPE(dbt_type)                                     :: tensor
      TYPE(mp_para_env_type), POINTER                    :: para_env
      CHARACTER(LEN=12)                                  :: tensor_name
      INTEGER, DIMENSION(:)                              :: map1, map2
      INTEGER, ALLOCATABLE, DIMENSION(:)                 :: sizes_RI, sizes_AO
      LOGICAL, OPTIONAL                                  :: create_nl_3c
      TYPE(neighbor_list_3c_type), OPTIONAL              :: nl_3c
      TYPE(qs_environment_type), OPTIONAL, POINTER       :: qs_env

      CHARACTER(LEN=*), PARAMETER                        :: routineN = 'create_3c_t'

      INTEGER                                            :: handle, n_kind
      INTEGER, ALLOCATABLE, DIMENSION(:)                 :: blk_dist_1, blk_dist_2, blk_dist_3
      INTEGER, DIMENSION(3)                              :: cart_coord, cart_dims, grid_dims
      LOGICAL                                            :: build_nl
      TYPE(dbt_pgrid_type)                               :: pgrid
      TYPE(distribution_3d_type)                         :: dist_3d
      TYPE(mp_cart_type)                                 :: comm_3d
      TYPE(particle_type), DIMENSION(:), POINTER         :: particles

      CALL timeset(routineN, handle)

      ! the neighbor list is only built when explicitly requested
      build_nl = .FALSE.
      IF (PRESENT(create_nl_3c)) build_nl = create_nl_3c

      grid_dims(:) = 0
      CALL dbt_pgrid_create(para_env, grid_dims, pgrid)

      ! besides the tensor, this returns the block distributions along the three dimensions
      CALL create_3c_tensor(tensor, blk_dist_1, blk_dist_2, blk_dist_3, &
                            pgrid, sizes_RI, sizes_AO, sizes_AO, &
                            map1=map1, map2=map2, name=tensor_name)

      IF (build_nl) THEN

         CALL get_qs_env(qs_env, nkind=n_kind, particle_set=particles)

         ! 3d cartesian communicator with the dimensions of the tensor process grid
         CALL dbt_mp_environ_pgrid(pgrid, cart_dims, cart_coord)
         CALL comm_3d%create(pgrid%mp_comm_2d, 3, cart_dims)

         ! own_comm / own_dist are set to .TRUE. and neither comm_3d nor dist_3d is released
         ! in this routine
         CALL distribution_3d_create(dist_3d, blk_dist_1, blk_dist_2, blk_dist_3, &
                                     n_kind, particles, comm_3d, own_comm=.TRUE.)

         CALL build_3c_neighbor_lists(nl_3c, &
                                      qs_env%bs_env%basis_set_RI, &
                                      qs_env%bs_env%basis_set_AO, &
                                      qs_env%bs_env%basis_set_AO, &
                                      dist_3d, qs_env%bs_env%ri_metric, &
                                      "GW_3c_nl", qs_env, own_dist=.TRUE.)

      END IF

      DEALLOCATE (blk_dist_1, blk_dist_2, blk_dist_3)
      CALL dbt_pgrid_destroy(pgrid)

      CALL timestop(handle)

   END SUBROUTINE create_3c_t


! **************************************************************************************************
!> \brief Calls init_interaction_radii_orb_basis with threshold bs_env%eps_filter for every
!>        entry of bs_env%basis_set_AO and the entry of bs_env%basis_set_RI with the same index
!> \param bs_env provides the two basis set arrays and eps_filter
! **************************************************************************************************
   SUBROUTINE init_interaction_radii(bs_env)
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER :: routineN = 'init_interaction_radii'

      INTEGER                                            :: handle, i_set, n_set
      TYPE(gto_basis_set_type), POINTER                  :: basis_AO, basis_RI

      CALL timeset(routineN, handle)

      ! the AO array sets the loop length; the RI array is accessed with the same index
      n_set = SIZE(bs_env%basis_set_AO)

      DO i_set = 1, n_set
         basis_AO => bs_env%basis_set_AO(i_set)%gto_basis_set
         CALL init_interaction_radii_orb_basis(basis_AO, bs_env%eps_filter)

         basis_RI => bs_env%basis_set_RI(i_set)%gto_basis_set
         CALL init_interaction_radii_orb_basis(basis_RI, bs_env%eps_filter)
      END DO

      CALL timestop(handle)

   END SUBROUTINE init_interaction_radii


! **************************************************************************************************
!> \brief Raises max_dist_AO_atoms to the largest distance (via pbc) between the atoms
!>        belonging to the second and third block index of any block stored in t_3c_int;
!>        the result is maximized over all ranks of the para_env of qs_env
!> \param t_3c_int 3-index tensor whose stored blocks are scanned
!> \param max_dist_AO_atoms on input the maximum found so far, on output
!>        MAX(input value, largest distance found in t_3c_int on any rank)
!> \param qs_env provides cell, particle_set and para_env
! **************************************************************************************************
   SUBROUTINE get_max_dist_ao_atoms(t_3c_int, max_dist_AO_atoms, qs_env)
      TYPE(dbt_type)                                     :: t_3c_int
      REAL(KIND=dp)                                      :: max_dist_AO_atoms
      TYPE(qs_environment_type), POINTER                 :: qs_env

      CHARACTER(LEN=*), PARAMETER :: routineN = 'get_max_dist_AO_atoms'

      INTEGER                                            :: atom_1, atom_2, handle
      INTEGER, DIMENSION(3)                              :: atom_ind
      REAL(KIND=dp)                                      :: abs_rab
      REAL(KIND=dp), DIMENSION(3)                        :: rab
      TYPE(cell_type), POINTER                           :: cell
      TYPE(dbt_iterator_type)                            :: iter
      TYPE(mp_para_env_type), POINTER                    :: para_env
      TYPE(particle_type), DIMENSION(:), POINTER         :: particle_set

      CALL timeset(routineN, handle)

      NULLIFY (cell, particle_set, para_env)
      CALL get_qs_env(qs_env, cell=cell, particle_set=particle_set, para_env=para_env)

      ! The running maximum is a MAX reduction variable: every thread works on a private copy
      ! and the copies are combined with the incoming value at the end of the region. Updating
      ! a shared variable from all threads without synchronization would be a data race.
!$OMP PARALLEL DEFAULT(NONE) &
!$OMP SHARED(t_3c_int, particle_set, cell) &
!$OMP PRIVATE(iter, atom_ind, rab, abs_rab, atom_1, atom_2) &
!$OMP REDUCTION(MAX:max_dist_AO_atoms)
      CALL dbt_iterator_start(iter, t_3c_int)
      DO WHILE (dbt_iterator_blocks_left(iter))
         CALL dbt_iterator_next_block(iter, atom_ind)

         ! block indices 2 and 3 identify the two atoms whose distance is measured
         atom_1 = atom_ind(2)
         atom_2 = atom_ind(3)

         rab = pbc(particle_set(atom_1)%r(1:3), particle_set(atom_2)%r(1:3), cell)

         abs_rab = SQRT(rab(1)**2 + rab(2)**2 + rab(3)**2)

         max_dist_AO_atoms = MAX(max_dist_AO_atoms, abs_rab)

      END DO
      CALL dbt_iterator_stop(iter)
!$OMP END PARALLEL

      ! every rank has only scanned the blocks returned by its own iterator
      CALL para_env%max(max_dist_AO_atoms)

      CALL timestop(handle)

   END SUBROUTINE get_max_dist_ao_atoms


! **************************************************************************************************
!> \brief Chooses, from the memory per process given in the input and the occupation of the
!>        3c integrals, how many atoms are treated at once: splits the i and j atom ranges
!>        of this tensor group and the inner-loop atom range 1..n_atom into intervals,
!>        allocates the skip_Sigma_occ/skip_Sigma_vir flags (set to .FALSE.) and prints the
!>        chosen interval sizes
!> \param bs_env provides input_memory_per_proc_GB, group_size_tensor, n_RI, n_atom,
!>        occupation_3c_int, max_AO_bf_per_atom, atoms_i/j, n_atom_i/j; receives the interval
!>        sizes, counts and boundaries
! **************************************************************************************************
   SUBROUTINE set_sparsity_parallelization_parameters(bs_env)
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER :: routineN = 'set_sparsity_parallelization_parameters'

      INTEGER :: handle, i_ivl, IL_ivl, j_ivl, n_atom_per_IL_ivl, n_atom_per_ivl, n_intervals_i, &
         n_intervals_inner_loop_atoms, n_intervals_j, u
      INTEGER(KIND=int_8)                                :: input_memory_per_proc

      CALL timeset(routineN, handle)

      ! heuristic parameter to prevent out of memory
      bs_env%safety_factor_memory = 0.10_dp

      ! input value is given in GB, converted to bytes here
      input_memory_per_proc = INT(bs_env%input_memory_per_proc_GB*1.0E9_dp, KIND=int_8)

      ! choose atomic range for λ ("i_atom"), ν ("j_atom") in
      ! M_λνP(iτ) = sum_µ (µν|P) G^occ_µλ(i|τ|,k=0)
      ! N_νλQ(iτ) = sum_σ (σλ|Q) G^vir_σν(i|τ|,k=0)
      ! such that M and N fit into the memory
      n_atom_per_ivl = INT(SQRT(bs_env%safety_factor_memory*input_memory_per_proc &
                                *bs_env%group_size_tensor/24/bs_env%n_RI &
                                /SQRT(bs_env%occupation_3c_int)))/bs_env%max_AO_bf_per_atom
      ! with little memory the estimate is 0, which is used as a divisor below; one atom per
      ! interval is the smallest possible choice
      n_atom_per_ivl = MAX(1, n_atom_per_ivl)

      ! number of intervals = ceiling(number of atoms/atoms per interval)
      n_intervals_i = (bs_env%n_atom_i - 1)/n_atom_per_ivl + 1
      n_intervals_j = (bs_env%n_atom_j - 1)/n_atom_per_ivl + 1

      bs_env%n_atom_per_interval_ij = n_atom_per_ivl
      bs_env%n_intervals_i = n_intervals_i
      bs_env%n_intervals_j = n_intervals_j

      ! row 1: first atom of the interval, row 2: last atom of the interval
      ALLOCATE (bs_env%i_atom_intervals(2, n_intervals_i))
      ALLOCATE (bs_env%j_atom_intervals(2, n_intervals_j))

      DO i_ivl = 1, n_intervals_i
         bs_env%i_atom_intervals(1, i_ivl) = (i_ivl - 1)*n_atom_per_ivl + bs_env%atoms_i(1)
         bs_env%i_atom_intervals(2, i_ivl) = MIN(i_ivl*n_atom_per_ivl + bs_env%atoms_i(1) - 1, &
                                                 bs_env%atoms_i(2))
      END DO

      DO j_ivl = 1, n_intervals_j
         bs_env%j_atom_intervals(1, j_ivl) = (j_ivl - 1)*n_atom_per_ivl + bs_env%atoms_j(1)
         bs_env%j_atom_intervals(2, j_ivl) = MIN(j_ivl*n_atom_per_ivl + bs_env%atoms_j(1) - 1, &
                                                 bs_env%atoms_j(2))
      END DO

      ALLOCATE (bs_env%skip_Sigma_occ(n_intervals_i, n_intervals_j))
      ALLOCATE (bs_env%skip_Sigma_vir(n_intervals_i, n_intervals_j))
      bs_env%skip_Sigma_occ(:, :) = .FALSE.
      bs_env%skip_Sigma_vir(:, :) = .FALSE.

      ! choose atomic range for µ and σ ("inner loop (IL) atom") in
      ! M_λνP(iτ) = sum_µ (µν|P) G^occ_µλ(i|τ|,k=0)
      ! N_νλQ(iτ) = sum_σ (σλ|Q) G^vir_σν(i|τ|,k=0)
      n_atom_per_IL_ivl = MIN(INT(bs_env%safety_factor_memory*input_memory_per_proc &
                                  *bs_env%group_size_tensor/n_atom_per_ivl &
                                  /bs_env%max_AO_bf_per_atom &
                                  /bs_env%n_RI/8/SQRT(bs_env%occupation_3c_int) &
                                  /bs_env%max_AO_bf_per_atom), bs_env%n_atom)
      ! same guard as above: the value is a divisor in the next statement
      n_atom_per_IL_ivl = MAX(1, n_atom_per_IL_ivl)

      n_intervals_inner_loop_atoms = (bs_env%n_atom - 1)/n_atom_per_IL_ivl + 1

      bs_env%n_atom_per_IL_interval = n_atom_per_IL_ivl
      bs_env%n_intervals_inner_loop_atoms = n_intervals_inner_loop_atoms

      ALLOCATE (bs_env%inner_loop_atom_intervals(2, n_intervals_inner_loop_atoms))
      DO IL_ivl = 1, n_intervals_inner_loop_atoms
         bs_env%inner_loop_atom_intervals(1, IL_ivl) = (IL_ivl - 1)*n_atom_per_IL_ivl + 1
         bs_env%inner_loop_atom_intervals(2, IL_ivl) = MIN(IL_ivl*n_atom_per_IL_ivl, bs_env%n_atom)
      END DO

      u = bs_env%unit_nr
      IF (u > 0) THEN
         WRITE (u, '(T2,A)') ''
         WRITE (u, '(T2,A,I33)') 'Number of i and j atoms in M_λνP(τ), N_νλQ(τ):', n_atom_per_ivl
         WRITE (u, '(T2,A,I18)') 'Number of inner loop atoms for µ in M_λνP = sum_µ (µν|P) G_µλ', &
            n_atom_per_IL_ivl
      END IF

      CALL timestop(handle)

   END SUBROUTINE set_sparsity_parallelization_parameters


! **************************************************************************************************
!> \brief Checks with INQUIRE which GW restart files exist and stores the outcome in bs_env:
!>        read_chi/calc_chi per time/frequency point, all_W_exist, Sigma_c_exists per point
!>        and spin, and Sigma_x_exists. File names have the form
!>        <prefix><matrix name>_<two-digit index>.matrix, where <prefix> is the file name
!>        generated for the print key PROPERTIES%BANDSTRUCTURE%GW%PRINT%RESTART followed by
!>        "-RESTART_". A warning is issued if restart files were found and the SCF iteration
!>        count differs from 1.
!> \param qs_env provides the input section and scf_env%iter_count
!> \param bs_env provides the numbers of points and spins and the matrix names; receives the
!>        existence flags and the prefix
! **************************************************************************************************
   SUBROUTINE check_for_restart_files(qs_env, bs_env)
      TYPE(qs_environment_type), POINTER                 :: qs_env
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER :: routineN = 'check_for_restart_files'
      INTEGER, PARAMETER                                 :: max_file_index = 99

      CHARACTER(LEN=default_string_length)               :: f_chi, f_S_n, f_S_p, f_S_x, f_W_t, &
                                                            prefix, project_name
      INTEGER                                            :: handle, i_spin, i_t_or_w, ind, n_spin, &
                                                            num_time_freq_points
      LOGICAL                                            :: chi_exists, Sigma_neg_time_exists, &
                                                            Sigma_pos_time_exists, &
                                                            Sigma_x_spin_exists, W_time_exists
      TYPE(cp_logger_type), POINTER                      :: logger
      TYPE(section_vals_type), POINTER                   :: input, print_key

      CALL timeset(routineN, handle)

      num_time_freq_points = bs_env%num_time_freq_points
      n_spin = bs_env%n_spin

      ! the index in the file names has two digits only
      IF (num_time_freq_points > max_file_index) THEN
         CPABORT('Please implement more than 99 time/frequency points.')
      END IF

      ALLOCATE (bs_env%read_chi(num_time_freq_points))
      ALLOCATE (bs_env%calc_chi(num_time_freq_points))
      ALLOCATE (bs_env%Sigma_c_exists(num_time_freq_points, n_spin))

      CALL get_qs_env(qs_env, input=input)

      logger => cp_get_default_logger()
      print_key => section_vals_get_subs_vals(input, 'PROPERTIES%BANDSTRUCTURE%GW%PRINT%RESTART')
      project_name = cp_print_key_generate_filename(logger, print_key, extension="", &
                                                    my_local=.FALSE.)
      WRITE (prefix, '(2A)') TRIM(project_name), "-RESTART_"
      bs_env%prefix = prefix

      bs_env%all_W_exist = .TRUE.

      DO i_t_or_w = 1, num_time_freq_points

         f_chi = restart_file_name(bs_env%chi_name, i_t_or_w)
         f_W_t = restart_file_name(bs_env%W_time_name, i_t_or_w)

         INQUIRE (file=TRIM(f_chi), exist=chi_exists)
         INQUIRE (file=TRIM(f_W_t), exist=W_time_exists)

         ! chi is read when its file exists and computed otherwise
         bs_env%read_chi(i_t_or_w) = chi_exists
         bs_env%calc_chi(i_t_or_w) = .NOT. chi_exists

         bs_env%all_W_exist = bs_env%all_W_exist .AND. W_time_exists

         ! the self-energy is spin-dependent
         DO i_spin = 1, n_spin

            ! the files of the second spin are numbered after those of the first spin
            ind = i_t_or_w + (i_spin - 1)*num_time_freq_points

            ! no two-digit file name can be formed for this index, so no file is searched
            IF (ind > max_file_index) THEN
               bs_env%Sigma_c_exists(i_t_or_w, i_spin) = .FALSE.
               CYCLE
            END IF

            f_S_p = restart_file_name(bs_env%Sigma_p_name, ind)
            f_S_n = restart_file_name(bs_env%Sigma_n_name, ind)

            INQUIRE (file=TRIM(f_S_p), exist=Sigma_pos_time_exists)
            INQUIRE (file=TRIM(f_S_n), exist=Sigma_neg_time_exists)

            ! both files are needed
            bs_env%Sigma_c_exists(i_t_or_w, i_spin) = Sigma_pos_time_exists .AND. &
                                                      Sigma_neg_time_exists

         END DO

      END DO

      ! Marek : In the RTBSE run, check also for zero frequency W
      IF (bs_env%rtp_method == rtp_method_bse) THEN
         f_W_t = restart_file_name("W_freq_rtp", 0)
         INQUIRE (file=TRIM(f_W_t), exist=W_time_exists)
         bs_env%all_W_exist = bs_env%all_W_exist .AND. W_time_exists
      END IF

      ! with all W files available, chi is neither read nor computed
      IF (bs_env%all_W_exist) THEN
         bs_env%read_chi(:) = .FALSE.
         bs_env%calc_chi(:) = .FALSE.
      END IF

      ! Sigma_x requires one file per spin
      bs_env%Sigma_x_exists = .TRUE.
      DO i_spin = 1, n_spin
         f_S_x = restart_file_name(bs_env%Sigma_x_name, i_spin)
         INQUIRE (file=TRIM(f_S_x), exist=Sigma_x_spin_exists)
         bs_env%Sigma_x_exists = bs_env%Sigma_x_exists .AND. Sigma_x_spin_exists
      END DO

      ! If any restart files are read, check if the SCF converged in 1 step.
      ! This is important because a re-iterated SCF can lead to spurious GW results
      IF (ANY(bs_env%read_chi(:)) &
          .OR. ANY(bs_env%Sigma_c_exists) &
          .OR. bs_env%all_W_exist &
          .OR. bs_env%Sigma_x_exists &
          ) THEN

         IF (qs_env%scf_env%iter_count /= 1) THEN
            CALL cp_warn(__LOCATION__, "SCF needed more than 1 step, "// &
                         "which might lead to spurious GW results when using GW restart files. ")
         END IF
      END IF

      CALL timestop(handle)

   CONTAINS

! **************************************************************************************************
!> \brief Builds <prefix><matrix_name>_<matrix_index with two digits>.matrix
!> \param matrix_name name inserted after the prefix, used as passed (no trimming)
!> \param matrix_index index in the range 0..99, written with a leading zero if below 10
!> \return the file name
! **************************************************************************************************
      FUNCTION restart_file_name(matrix_name, matrix_index) RESULT(file_name)
         CHARACTER(LEN=*), INTENT(IN)                       :: matrix_name
         INTEGER, INTENT(IN)                                :: matrix_index
         CHARACTER(LEN=default_string_length)               :: file_name

         WRITE (file_name, '(3A,I2.2,A)') TRIM(prefix), matrix_name, "_", matrix_index, ".matrix"

      END FUNCTION restart_file_name

   END SUBROUTINE check_for_restart_files


! **************************************************************************************************
!> \brief Fixes the size of the tensor subgroups, splits the para_env of qs_env into these
!>        subgroups (bs_env%para_env_tensor) and assigns i and j atom ranges to every
!>        subgroup; prints the group size
!> \param qs_env provides the para_env that is split
!> \param bs_env provides the requested group_size_tensor, n_atom and unit_nr; receives the
!>        final group_size_tensor, tensor_group_color, para_env_tensor, num_tensor_groups and
!>        the atom ranges of this group and of all groups
! **************************************************************************************************
   SUBROUTINE set_parallelization_parameters(qs_env, bs_env)
      TYPE(qs_environment_type), POINTER                 :: qs_env
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER :: routineN = 'set_parallelization_parameters'

      INTEGER                                            :: color_sub, dummy_1, dummy_2, handle, &
                                                            num_pe, num_t_groups, u
      INTEGER(KIND=int_8)                                :: mem
      TYPE(mp_para_env_type), POINTER                    :: para_env

      CALL timeset(routineN, handle)

      CALL get_qs_env(qs_env, para_env=para_env)

      num_pe = para_env%num_pe
      ! if not already set, use all processors for the group (for large-cell GW, performance
      ! seems to be best for a single group with all MPI processes per group);
      ! a group size of 0 is treated as "not set" as well because it is used as divisor below
      IF (bs_env%group_size_tensor < 1 .OR. bs_env%group_size_tensor > num_pe) &
         bs_env%group_size_tensor = num_pe

      ! group_size_tensor must divide num_pe without rest; otherwise everything will be complicated
      IF (MODULO(num_pe, bs_env%group_size_tensor) .NE. 0) THEN
         CALL find_good_group_size(num_pe, bs_env%group_size_tensor)
      END IF

      ! para_env_tensor for tensor subgroups: consecutive ranks get the same color
      color_sub = para_env%mepos/bs_env%group_size_tensor
      bs_env%tensor_group_color = color_sub

      ALLOCATE (bs_env%para_env_tensor)
      CALL bs_env%para_env_tensor%from_split(para_env, color_sub)

      num_t_groups = para_env%num_pe/bs_env%group_size_tensor
      bs_env%num_tensor_groups = num_t_groups

      ! atom ranges of the tensor group this rank belongs to
      CALL get_i_j_atoms(bs_env%atoms_i, bs_env%atoms_j, bs_env%n_atom_i, bs_env%n_atom_j, &
                         color_sub, bs_env)

      ! atom ranges of all tensor groups; the atom counts are not stored (dummies)
      ALLOCATE (bs_env%atoms_i_t_group(2, num_t_groups))
      ALLOCATE (bs_env%atoms_j_t_group(2, num_t_groups))
      DO color_sub = 0, num_t_groups - 1
         CALL get_i_j_atoms(bs_env%atoms_i_t_group(1:2, color_sub + 1), &
                            bs_env%atoms_j_t_group(1:2, color_sub + 1), &
                            dummy_1, dummy_2, color_sub, bs_env)
      END DO

      ! NOTE(review): mem is not used afterwards in this routine
      CALL m_memory(mem)
      CALL bs_env%para_env%max(mem)

      u = bs_env%unit_nr
      IF (u > 0) THEN
         WRITE (u, '(T2,A,I47)') 'Group size for tensor operations', bs_env%group_size_tensor
         IF (bs_env%group_size_tensor > 1 .AND. bs_env%n_atom < 5) THEN
            WRITE (u, '(T2,A)') 'The requested group size is > 1 which can lead to bad performance.'
            WRITE (u, '(T2,A)') 'Using more memory per MPI process might improve performance.'
            WRITE (u, '(T2,A)') '(Also increase MEMORY_PER_PROC when using more memory per process.)'
         END IF
      END IF

      CALL timestop(handle)

   END SUBROUTINE set_parallelization_parameters


! **************************************************************************************************
!> \brief Replaces group_size by the nearest value in 1..num_pe that divides num_pe; at equal
!>        distance the smaller value is taken. Aborts if group_size is unchanged afterwards,
!>        so the routine is meant to be called only if group_size does not divide num_pe.
!> \param num_pe number of processes that has to be divisible by the group size
!> \param group_size on input the requested group size, on output the adjusted one
! **************************************************************************************************
   SUBROUTINE find_good_group_size(num_pe, group_size)

      INTEGER                                            :: num_pe, group_size

      CHARACTER(LEN=*), PARAMETER :: routineN = 'find_good_group_size'

      INTEGER                                            :: group_size_minus, group_size_orig, &
                                                            group_size_plus, handle, i_diff

      CALL timeset(routineN, handle)

      group_size_orig = group_size

      ! search in growing distance i_diff below and above the requested size
      DO i_diff = 1, num_pe

         group_size_minus = group_size - i_diff

         ! range check first and in a separate IF: .AND. does not guarantee short-circuit
         ! evaluation and MODULO with a zero divisor must not be evaluated
         IF (group_size_minus > 0) THEN
            IF (MODULO(num_pe, group_size_minus) == 0) THEN
               group_size = group_size_minus
               EXIT
            END IF
         END IF

         group_size_plus = group_size + i_diff

         IF (group_size_plus > 0 .AND. group_size_plus <= num_pe) THEN
            IF (MODULO(num_pe, group_size_plus) == 0) THEN
               group_size = group_size_plus
               EXIT
            END IF
         END IF

      END DO

      IF (group_size_orig == group_size) CPABORT("Group size error")

      CALL timestop(handle)

   END SUBROUTINE find_good_group_size


! **************************************************************************************************
!> \brief Returns the i and j atom ranges of tensor group color_sub: the tensor groups are
!>        arranged on the nprow x npcol mesh returned by square_mesh, numbered column by
!>        column starting from 0; the n_atom atoms are split into nprow chunks (i atoms, by
!>        mesh row) and npcol chunks (j atoms, by mesh column) of size ceiling(n_atom/nprow)
!>        and ceiling(n_atom/npcol)
!> \param atoms_i first and last i atom of the group
!> \param atoms_j first and last j atom of the group
!> \param n_atom_i atoms_i(2) - atoms_i(1) + 1
!> \param n_atom_j atoms_j(2) - atoms_j(1) + 1
!> \param color_sub number of the tensor group, 0 <= color_sub < bs_env%num_tensor_groups
!> \param bs_env provides num_tensor_groups and n_atom
! **************************************************************************************************

   SUBROUTINE get_i_j_atoms(atoms_i, atoms_j, n_atom_i, n_atom_j, color_sub, bs_env)

      INTEGER, DIMENSION(2)                              :: atoms_i, atoms_j
      INTEGER                                            :: n_atom_i, n_atom_j, color_sub
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER                        :: routineN = 'get_i_j_atoms'

      INTEGER                                            :: handle, i_atoms_per_group, ipcol, &
                                                            iprow, j_atoms_per_group, npcol, nprow

      CALL timeset(routineN, handle)

      ! create a square mesh of tensor groups for iatom and jatom; code from blacs_env_create
      CALL square_mesh(nprow, npcol, bs_env%num_tensor_groups)

      ! position of group color_sub on the mesh; the groups are numbered with the row index
      ! running fastest, i.e. color_sub = ipcol*nprow + iprow. The closed form leaves iprow
      ! and ipcol defined for every color_sub.
      iprow = MODULO(color_sub, nprow)
      ipcol = color_sub/nprow

      ! chunk sizes: ceiling(n_atom/nprow) and ceiling(n_atom/npcol)
      i_atoms_per_group = (bs_env%n_atom + nprow - 1)/nprow
      j_atoms_per_group = (bs_env%n_atom + npcol - 1)/npcol

      ! the last chunk is cut at n_atom
      atoms_i(1) = iprow*i_atoms_per_group + 1
      atoms_i(2) = MIN((iprow + 1)*i_atoms_per_group, bs_env%n_atom)
      n_atom_i = atoms_i(2) - atoms_i(1) + 1

      atoms_j(1) = ipcol*j_atoms_per_group + 1
      atoms_j(2) = MIN((ipcol + 1)*j_atoms_per_group, bs_env%n_atom)
      n_atom_j = atoms_j(2) - atoms_j(1) + 1

      CALL timestop(handle)

   END SUBROUTINE get_i_j_atoms


! **************************************************************************************************
!> \brief Factorizes nproc into nprow*npcol. Among all exact factor pairs with
!>        nprow <= ceiling(sqrt(nproc)), the pair with the largest gcd(nprow, npcol) is chosen;
!>        for equal gcd values the pair with the larger nprow is taken.
!> \param nprow number of mesh rows (output)
!> \param npcol number of mesh columns (output)
!> \param nproc number of entities to be arranged on the mesh (input)
! **************************************************************************************************
   SUBROUTINE square_mesh(nprow, npcol, nproc)
      INTEGER                                            :: nprow, npcol, nproc

      CHARACTER(LEN=*), PARAMETER                        :: routinen = 'square_mesh'

      INTEGER                                            :: best_gcd, handle, n_cols, n_rows, &
                                                            n_rows_max, this_gcd

      CALL timeset(routinen, handle)

      n_rows_max = ceiling(sqrt(real(nproc, dp)))
      best_gcd = -1

      DO n_rows = 1, n_rows_max

         n_cols = nproc/n_rows

         ! only exact factorizations nproc = n_rows*n_cols are candidates
         IF (n_rows*n_cols == nproc) THEN

            this_gcd = gcd(n_rows, n_cols)

            ! ">=" (not ">"): a later candidate with the same gcd replaces the earlier one
            IF (this_gcd >= best_gcd) THEN
               nprow = n_rows
               npcol = n_cols
               best_gcd = this_gcd
            END IF

         END IF

      END DO

      CALL timestop(handle)

   END SUBROUTINE square_mesh


! **************************************************************************************************
!> \brief Sets hard-coded (heuristic) parameters of the GW run in bs_env: minimax grid
!>        generation and regularization, Pade fit size, RI metric and RI regularization,
!>        truncated Coulomb operator for the exchange self-energy, filter factor; prints a
!>        summary to bs_env%unit_nr.
!> \param bs_env environment receiving the parameters; the input_regularization_* members
!>        override the defaults when they are larger than -1.0e-12
!> \param qs_env passed on to trunc_coulomb_for_exchange
! **************************************************************************************************
   SUBROUTINE set_heuristic_parameters(bs_env, qs_env)
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env
      TYPE(qs_environment_type), OPTIONAL, POINTER       :: qs_env

      CHARACTER(LEN=*), PARAMETER :: routinen = 'set_heuristic_parameters'

      INTEGER                                            :: handle, u
      LOGICAL                                            :: do_bvk_cell

      CALL timeset(routinen, handle)

      ! for generating numerically stable minimax Fourier integration weights
      bs_env%num_points_per_magnitude = 200

      IF (bs_env%input_regularization_minimax > -1.0e-12_dp) THEN
         ! value from the input takes precedence
         bs_env%regularization_minimax = bs_env%input_regularization_minimax
      ELSE
         ! for periodic systems and for 20 or more minimax points, we use a regularized minimax
         ! mesh (from experience: regularized minimax meshes converge faster in these cases)
         IF (sum(bs_env%periodic) .NE. 0 .OR. bs_env%num_time_freq_points >= 20) THEN
            bs_env%regularization_minimax = 1.0e-6_dp
         ELSE
            bs_env%regularization_minimax = 0.0_dp
         END IF
      END IF

      bs_env%stabilize_exp = 70.0_dp
      bs_env%eps_atom_grid_2d_mat = 1.0e-50_dp

      ! use a 16-parameter Padé fit
      bs_env%nparam_pade = 16

      ! resolution of the identity with the truncated Coulomb metric;
      ! the cutoff radius is not assigned here, it is specified in the input
      bs_env%ri_metric%potential_type = do_potential_truncated
      bs_env%ri_metric%omega = 0.0_dp
      bs_env%ri_metric%filename = "t_c_g.dat"

      bs_env%eps_eigval_mat_RI = 0.0_dp

      IF (bs_env%input_regularization_RI > -1.0e-12_dp) THEN
         ! value from the input takes precedence
         bs_env%regularization_RI = bs_env%input_regularization_RI
      ELSE
         ! default case:

         ! 1. for periodic systems, we use the regularized resolution of the identity per default
         bs_env%regularization_RI = 1.0e-2_dp

         ! 2. for molecules, no regularization is necessary
         IF (sum(bs_env%periodic) == 0) bs_env%regularization_RI = 0.0_dp

      END IF

      ! truncated Coulomb operator for exchange self-energy
      ! (see details in Guidon, VandeVondele, Hutter, JCTC 5, 3010 (2009) and references therein)
      ! NOTE(review): qs_env is declared OPTIONAL but is forwarded unconditionally;
      ! presumably all callers provide it -- confirm
      do_bvk_cell = bs_env%small_cell_full_kp_or_large_cell_Gamma == small_cell_full_kp
      CALL trunc_coulomb_for_exchange(qs_env, bs_env%trunc_coulomb, &
                                      rel_cutoff_trunc_coulomb_ri_x=0.5_dp, &
                                      cell_grid=bs_env%cell_grid_scf_desymm, &
                                      do_bvk_cell=do_bvk_cell)

      ! for small-cell GW, we need more cells than normally used by the filter bs_env%eps_filter
      ! (in particular for computing the self-energy because of higher number of cells needed)
      ! NOTE(review): default-kind literal, unlike the _dp literals above; kept unchanged so
      ! that the numerical value stays exactly as before -- confirm whether _dp is intended
      bs_env%heuristic_filter_factor = 1.0e-4

      u = bs_env%unit_nr
      IF (u > 0) THEN
         WRITE (u, fmt="(T2,2A,F21.1,A)") "Cutoff radius for the truncated Coulomb ", &
            "operator in Σ^x:", bs_env%trunc_coulomb%cutoff_radius*angstrom, " Å"
         WRITE (u, fmt="(T2,2A,F15.1,A)") "Cutoff radius for the truncated Coulomb ", &
            "operator in RI metric:", bs_env%ri_metric%cutoff_radius*angstrom, " Å"
         WRITE (u, fmt="(T2,A,ES48.1)") "Regularization parameter of RI ", bs_env%regularization_RI
         WRITE (u, fmt="(T2,A,ES38.1)") "Regularization parameter of minimax grids", &
            bs_env%regularization_minimax
         WRITE (u, fmt="(T2,A,I53)") "Lattice sum size for V(k):", bs_env%size_lattice_sum_V
      END IF

      CALL timestop(handle)

   END SUBROUTINE set_heuristic_parameters


! **************************************************************************************************
!> \brief Prints the "GW CALCULATION" banner and the GW input parameters (number of time/freq.
!>        points, ω_max for the fit, filter threshold, Hedin shift flag) to bs_env%unit_nr.
!>        Nothing is printed when the unit number is not positive.
!> \param bs_env environment holding the output unit and the input parameters
! **************************************************************************************************
   SUBROUTINE print_header_and_input_parameters(bs_env)

      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER :: routinen = 'print_header_and_input_parameters'

      INTEGER                                            :: handle, u

      CALL timeset(routinen, handle)

      u = bs_env%unit_nr

      IF (u > 0) THEN
         ! banner
         WRITE (u, '(T2,A)') ' '
         WRITE (u, '(T2,A)') repeat('-', 79)
         WRITE (u, '(T2,A,A78)') '-', '-'
         WRITE (u, '(T2,A,A46,A32)') '-', 'GW CALCULATION', '-'
         WRITE (u, '(T2,A,A78)') '-', '-'
         WRITE (u, '(T2,A)') repeat('-', 79)
         WRITE (u, '(T2,A)') ' '
         ! input parameters; freq_max_fit is multiplied by evolt for the printout in eV
         WRITE (u, '(T2,A,I45)') 'Input: Number of time/freq. points', bs_env%num_time_freq_points
         WRITE (u, "(T2,A,F44.1,A)") 'Input: ω_max for fitting Σ(iω) (eV)', bs_env%freq_max_fit*evolt
         WRITE (u, '(T2,A,ES27.1)') 'Input: Filter threshold for sparse tensor operations', &
            bs_env%eps_filter
         WRITE (u, "(T2,A,L55)") 'Input: Apply Hedin shift', bs_env%do_hedin_shift
      END IF

      CALL timestop(handle)

   END SUBROUTINE print_header_and_input_parameters


! **************************************************************************************************
!> \brief Computes the exchange-correlation contribution to the Kohn-Sham matrix as the
!>        difference v_xc = h_ks - h_ks(v_xc = 0). For this, the KS matrix is rebuilt with the
!>        XC functional set to xc_none (and HF%FRACTION set to zero if an explicit HF section is
!>        present). The XC input, the energies and dft_control%nimages are restored afterwards.
!>        The result is stored in bs_env%fm_V_xc_Gamma (large_cell_gamma) or in
!>        bs_env%fm_V_xc_R (small_cell_full_kp).
!> \param qs_env provides input, energy, dft_control and (small cell) matrix_ks_kp
!> \param bs_env receives v_xc
! **************************************************************************************************
   SUBROUTINE compute_v_xc(qs_env, bs_env)
      TYPE(qs_environment_type), POINTER                 :: qs_env
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER                        :: routinen = 'compute_V_xc'

      INTEGER                                            :: handle, i_img, i_spin, &
                                                            n_img_saved, xc_fun_saved
      LOGICAL                                            :: has_hf
      REAL(kind=dp)                                      :: e_ex_saved, e_exc_saved, &
                                                            e_total_saved, hf_fraction_saved
      TYPE(dbcsr_p_type), DIMENSION(:), POINTER          :: ks_no_xc
      TYPE(dbcsr_p_type), DIMENSION(:, :), POINTER       :: matrix_ks_kp
      TYPE(dft_control_type), POINTER                    :: dft_control
      TYPE(qs_energy_type), POINTER                      :: energy
      TYPE(section_vals_type), POINTER                   :: hf_section, input, xc_section

      CALL timeset(routinen, handle)

      CALL get_qs_env(qs_env, input=input, energy=energy, dft_control=dft_control)

      ! previously, dft_control%nimages set to # neighbor cells, revert for Γ-only KS matrix
      n_img_saved = dft_control%nimages
      dft_control%nimages = bs_env%nimages_scf

      ! switch the XC functional off, remembering the functional from the input
      xc_section => section_vals_get_subs_vals(input, "DFT%XC")
      CALL section_vals_val_get(xc_section, "XC_FUNCTIONAL%_SECTION_PARAMETERS_", &
                                i_val=xc_fun_saved)
      CALL section_vals_val_set(xc_section, "XC_FUNCTIONAL%_SECTION_PARAMETERS_", i_val=xc_none)

      ! an HF section only counts when it exists and is given explicitly
      has_hf = .false.
      hf_section => section_vals_get_subs_vals(input, "DFT%XC%HF", can_return_null=.true.)
      IF (ASSOCIATED(hf_section)) CALL section_vals_get(hf_section, explicit=has_hf)

      ! special case for handling hfx: switch the HF fraction off, remembering the input value
      IF (has_hf) THEN
         CALL section_vals_val_get(xc_section, "HF%FRACTION", r_val=hf_fraction_saved)
         CALL section_vals_val_set(xc_section, "HF%FRACTION", r_val=0.0_dp)
      END IF

      ! save the energy before the energy gets updated
      e_total_saved = energy%total
      e_exc_saved = energy%exc
      e_ex_saved = energy%ex

      IF (bs_env%small_cell_full_kp_or_large_cell_Gamma == large_cell_gamma) THEN

         NULLIFY (ks_no_xc)
         CALL dbcsr_allocate_matrix_set(ks_no_xc, bs_env%n_spin)

         DO i_spin = 1, bs_env%n_spin
            ALLOCATE (ks_no_xc(i_spin)%matrix)
            IF (has_hf) THEN
               CALL dbcsr_create(ks_no_xc(i_spin)%matrix, template=bs_env%mat_ao_ao%matrix, &
                                 matrix_type=dbcsr_type_symmetric)
            ELSE
               CALL dbcsr_create(ks_no_xc(i_spin)%matrix, template=bs_env%mat_ao_ao%matrix)
            END IF
         END DO

         ! calculate KS-matrix without XC, written to the external matrix set
         CALL qs_ks_build_kohn_sham_matrix(qs_env, calculate_forces=.false., just_energy=.false., &
                                           ext_ks_matrix=ks_no_xc)

         DO i_spin = 1, bs_env%n_spin
            ! transfer dbcsr matrix to fm
            CALL cp_fm_create(bs_env%fm_V_xc_Gamma(i_spin), bs_env%fm_s_Gamma%matrix_struct)
            CALL copy_dbcsr_to_fm(ks_no_xc(i_spin)%matrix, bs_env%fm_V_xc_Gamma(i_spin))

            ! v_xc = h_ks - h_ks(v_xc = 0)
            CALL cp_fm_scale_and_add(alpha=-1.0_dp, matrix_a=bs_env%fm_V_xc_Gamma(i_spin), &
                                     beta=1.0_dp, matrix_b=bs_env%fm_ks_Gamma(i_spin))
         END DO

         CALL dbcsr_deallocate_matrix_set(ks_no_xc)

      ELSE IF (bs_env%small_cell_full_kp_or_large_cell_Gamma == small_cell_full_kp) THEN

         ! calculate KS-matrix without XC
         CALL qs_ks_build_kohn_sham_matrix(qs_env, calculate_forces=.false., just_energy=.false.)
         CALL get_qs_env(qs_env=qs_env, matrix_ks_kp=matrix_ks_kp)

         ALLOCATE (bs_env%fm_V_xc_R(dft_control%nimages, bs_env%n_spin))

         DO i_spin = 1, bs_env%n_spin
            DO i_img = 1, dft_control%nimages
               ! v_xc is kept in fm matrices because saving in dbcsr matrices caused trouble
               CALL copy_dbcsr_to_fm(matrix_ks_kp(i_spin, i_img)%matrix, bs_env%fm_work_mo(1))
               CALL cp_fm_create(bs_env%fm_V_xc_R(i_img, i_spin), &
                                 bs_env%fm_work_mo(1)%matrix_struct)
               ! store h_ks(v_xc = 0) in fm_V_xc_R
               ! NOTE(review): adding onto the freshly created matrix presumably relies on
               ! cp_fm_create returning a zero-filled matrix -- confirm
               CALL cp_fm_scale_and_add(alpha=1.0_dp, matrix_a=bs_env%fm_V_xc_R(i_img, i_spin), &
                                        beta=1.0_dp, matrix_b=bs_env%fm_work_mo(1))
            END DO
         END DO

      END IF

      ! set back the energy
      energy%total = e_total_saved
      energy%exc = e_exc_saved
      energy%ex = e_ex_saved

      ! set back nimages
      dft_control%nimages = n_img_saved

      ! set the DFT functional and HF fraction back
      CALL section_vals_val_set(xc_section, "XC_FUNCTIONAL%_SECTION_PARAMETERS_", &
                                i_val=xc_fun_saved)
      IF (has_hf) CALL section_vals_val_set(xc_section, "HF%FRACTION", r_val=hf_fraction_saved)

      IF (bs_env%small_cell_full_kp_or_large_cell_Gamma == small_cell_full_kp) THEN

         ! calculate KS-matrix again with XC
         CALL qs_ks_build_kohn_sham_matrix(qs_env, calculate_forces=.false., just_energy=.false.)

         ! NOTE(review): the image loop runs over the restored dft_control%nimages, whereas
         ! fm_V_xc_R was allocated while nimages was bs_env%nimages_scf; presumably both
         ! values agree in this mode -- confirm
         DO i_spin = 1, bs_env%n_spin
            DO i_img = 1, dft_control%nimages
               ! store h_ks in fm_work_mo
               CALL copy_dbcsr_to_fm(matrix_ks_kp(i_spin, i_img)%matrix, bs_env%fm_work_mo(1))
               ! v_xc = h_ks - h_ks(v_xc = 0)
               CALL cp_fm_scale_and_add(alpha=-1.0_dp, matrix_a=bs_env%fm_V_xc_R(i_img, i_spin), &
                                        beta=1.0_dp, matrix_b=bs_env%fm_work_mo(1))
            END DO
         END DO

      END IF

      CALL timestop(handle)

   END SUBROUTINE compute_v_xc


! **************************************************************************************************
!> \brief Allocates and fills the imaginary-time and imaginary-frequency minimax grids in bs_env
!>        together with the cosine/sine transform weights between them. The grids are generated
!>        for the ratio e_max/e_min of the largest and smallest SCF eigenvalue differences and
!>        scaled with e_min. Also selects the frequency points below freq_max_fit for the
!>        analytic continuation and limits the number of Padé parameters accordingly.
!> \param bs_env environment holding the SCF eigenvalues and receiving grids and weights
! **************************************************************************************************
   SUBROUTINE setup_time_and_frequency_minimax_grid(bs_env)
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER :: routinen = 'setup_time_and_frequency_minimax_grid'

      INTEGER                                            :: handle, homo, ierr, ispin, n_mo, &
                                                            num_time_freq_points, u
      REAL(kind=dp)                                      :: e_max, e_max_ispin, e_min, e_min_ispin, &
                                                            e_range, max_error_min
      REAL(kind=dp), ALLOCATABLE, DIMENSION(:)           :: points_and_weights

      CALL timeset(routinen, handle)

      n_mo = bs_env%n_ao
      num_time_freq_points = bs_env%num_time_freq_points

      ALLOCATE (bs_env%imag_freq_points(num_time_freq_points))
      ALLOCATE (bs_env%imag_time_points(num_time_freq_points))
      ALLOCATE (bs_env%imag_time_weights_freq_zero(num_time_freq_points))
      ALLOCATE (bs_env%weights_cos_t_to_w(num_time_freq_points, num_time_freq_points))
      ALLOCATE (bs_env%weights_cos_w_to_t(num_time_freq_points, num_time_freq_points))
      ALLOCATE (bs_env%weights_sin_t_to_w(num_time_freq_points, num_time_freq_points))

      ! minimum and maximum difference between eigenvalues of unoccupied and an occupied MOs
      e_min = 1000.0_dp
      e_max = -1000.0_dp
      DO ispin = 1, bs_env%n_spin
         homo = bs_env%n_occ(ispin)
         SELECT CASE (bs_env%small_cell_full_kp_or_large_cell_Gamma)
         CASE (large_cell_gamma)
            e_min_ispin = bs_env%eigenval_scf_Gamma(homo + 1, ispin) - &
                          bs_env%eigenval_scf_Gamma(homo, ispin)
            e_max_ispin = bs_env%eigenval_scf_Gamma(n_mo, ispin) - &
                          bs_env%eigenval_scf_Gamma(1, ispin)
         CASE (small_cell_full_kp)
            ! extrema are taken over the second index of eigenval_scf
            e_min_ispin = minval(bs_env%eigenval_scf(homo + 1, :, ispin)) - &
                          maxval(bs_env%eigenval_scf(homo, :, ispin))
            e_max_ispin = maxval(bs_env%eigenval_scf(n_mo, :, ispin)) - &
                          minval(bs_env%eigenval_scf(1, :, ispin))
         END SELECT
         e_min = min(e_min, e_min_ispin)
         e_max = max(e_max, e_max_ispin)
      END DO

      e_range = e_max/e_min

      ! first half: points, second half: weights
      ALLOCATE (points_and_weights(2*num_time_freq_points))

      ! frequency points (ierr returned by get_rpa_minimax_coeff is not inspected here)
      IF (num_time_freq_points .LE. 20) THEN
         CALL get_rpa_minimax_coeff(num_time_freq_points, e_range, points_and_weights, ierr, .false.)
      ELSE
         CALL get_rpa_minimax_coeff_larger_grid(num_time_freq_points, e_range, points_and_weights)
      END IF

      ! one needs to scale the minimax grids, see Azizi, Wilhelm, Golze, Panades-Barrueta,
      ! Giantomassi, Rinke, Draxl, Gonze et al., 2 publications
      bs_env%imag_freq_points(:) = points_and_weights(1:num_time_freq_points)*e_min

      ! determine number of fit points in the interval [0,ω_max] for virt, or [-ω_max,0] for occ
      bs_env%num_freq_points_fit = count(bs_env%imag_freq_points(:) < bs_env%freq_max_fit)

      ! iω values for the analytic continuation Σ^c_n(iω,k) -> Σ^c_n(ϵ,k);
      ! pack keeps the selected points in their original order
      ALLOCATE (bs_env%imag_freq_points_fit(bs_env%num_freq_points_fit))
      bs_env%imag_freq_points_fit(:) = pack(bs_env%imag_freq_points(:), &
                                            bs_env%imag_freq_points(:) < bs_env%freq_max_fit)

      ! the number of Padé parameters must not exceed the number of
      ! imaginary-frequency points for the fit
      bs_env%nparam_pade = min(bs_env%nparam_pade, bs_env%num_freq_points_fit)

      ! time points
      IF (num_time_freq_points .LE. 20) THEN
         CALL get_exp_minimax_coeff(num_time_freq_points, e_range, points_and_weights)
      ELSE
         CALL get_exp_minimax_coeff_gw(num_time_freq_points, e_range, points_and_weights)
      END IF

      bs_env%imag_time_points(:) = points_and_weights(1:num_time_freq_points)/(2.0_dp*e_min)
      bs_env%imag_time_weights_freq_zero(:) = points_and_weights(num_time_freq_points + 1:)/(e_min)

      DEALLOCATE (points_and_weights)

      u = bs_env%unit_nr
      IF (u > 0) THEN
         WRITE (u, '(T2,A)') ''
         WRITE (u, '(T2,A,F55.2)') 'SCF direct band gap (eV)', e_min*evolt
         WRITE (u, '(T2,A,F53.2)') 'Max. SCF eigval diff. (eV)', e_max*evolt
         WRITE (u, '(T2,A,F55.2)') 'E-Range for minimax grid', e_range
         WRITE (u, '(T2,A,I27)') 'Number of Padé parameters for analytic continuation:', &
            bs_env%nparam_pade
         WRITE (u, '(T2,A)') ''
      END IF

      ! in minimax grids, Fourier transforms t -> w and w -> t are split using
      ! e^(iwt) = cos(wt) + i sin(wt); we thus calculate weights for trafos with a cos and
      ! sine prefactor; details in Azizi, Wilhelm, Golze, Giantomassi, Panades-Barrueta,
      ! Rinke, Draxl, Gonze et al., 2 publications

      ! cosine transform weights imaginary time to imaginary frequency
      CALL get_l_sq_wghts_cos_tf_t_to_w(num_time_freq_points, &
                                        bs_env%imag_time_points, &
                                        bs_env%weights_cos_t_to_w, &
                                        bs_env%imag_freq_points, &
                                        e_min, e_max, max_error_min, &
                                        bs_env%num_points_per_magnitude, &
                                        bs_env%regularization_minimax)

      ! cosine transform weights imaginary frequency to imaginary time
      CALL get_l_sq_wghts_cos_tf_w_to_t(num_time_freq_points, &
                                        bs_env%imag_time_points, &
                                        bs_env%weights_cos_w_to_t, &
                                        bs_env%imag_freq_points, &
                                        e_min, e_max, max_error_min, &
                                        bs_env%num_points_per_magnitude, &
                                        bs_env%regularization_minimax)

      ! sine transform weights imaginary time to imaginary frequency
      CALL get_l_sq_wghts_sin_tf_t_to_w(num_time_freq_points, &
                                        bs_env%imag_time_points, &
                                        bs_env%weights_sin_t_to_w, &
                                        bs_env%imag_freq_points, &
                                        e_min, e_max, max_error_min, &
                                        bs_env%num_points_per_magnitude, &
                                        bs_env%regularization_minimax)

      CALL timestop(handle)

   END SUBROUTINE setup_time_and_frequency_minimax_grid


! **************************************************************************************************

!> \brief ...

!> \param qs_env ...

!> \param bs_env ...

! **************************************************************************************************

   SUBROUTINE setup_cells_3c(qs_env, bs_env)


      TYPE(qs_environment_type), POINTER                 :: qs_env

      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env


      CHARACTER(LEN=*), PARAMETER                        :: routinen = 'setup_cells_3c'


      INTEGER :: atom_i, atom_j, atom_k, block_count, handle, i, i_cell_x, i_cell_x_max, &

         i_cell_x_min, i_size, ikind, img, j, j_cell, j_cell_max, j_cell_y, j_cell_y_max, &

         j_cell_y_min, j_size, k_cell, k_cell_max, k_cell_z, k_cell_z_max, k_cell_z_min, k_size, &

         nimage_pairs_3c, nimages_3c, nimages_3c_max, nkind, u

      INTEGER(KIND=int_8)                                :: mem_occ_per_proc

      INTEGER, ALLOCATABLE, DIMENSION(:)                 :: kind_of, n_other_3c_images_max

      INTEGER, ALLOCATABLE, DIMENSION(:, :)              :: index_to_cell_3c_max, nblocks_3c_max

      INTEGER, DIMENSION(3)                              :: cell_index, n_max

      REAL(kind=dp) :: avail_mem_per_proc_gb, cell_dist, cell_radius_3c, dij, dik, djk, eps, &

         exp_min_ao, exp_min_ri, frobenius_norm, mem_3c_gb, mem_occ_per_proc_gb, radius_ao, &

         radius_ao_product, radius_ri

      REAL(kind=dp), ALLOCATABLE, DIMENSION(:)           :: exp_ao_kind, exp_ri_kind, &

                                                            radius_ao_kind, &

                                                            radius_ao_product_kind, radius_ri_kind

      REAL(kind=dp), ALLOCATABLE, DIMENSION(:, :, :)     :: int_3c

      REAL(kind=dp), DIMENSION(3)                        :: rij, rik, rjk, vec_cell_j, vec_cell_k

      REAL(kind=dp), DIMENSION(:, :), POINTER            :: exp_ao, exp_ri

      TYPE(atomic_kind_type), DIMENSION(:), POINTER      :: atomic_kind_set

      TYPE(cell_type), POINTER                           :: cell

      TYPE(particle_type), DIMENSION(:), POINTER         :: particle_set


      CALL timeset(routinen, handle)


      CALL get_qs_env(qs_env, nkind=nkind, atomic_kind_set=atomic_kind_set, particle_set=particle_set, cell=cell)


      ALLOCATE (exp_ao_kind(nkind), exp_ri_kind(nkind), radius_ao_kind(nkind), &

                radius_ao_product_kind(nkind), radius_ri_kind(nkind))


      exp_min_ri = 10.0_dp

      exp_min_ao = 10.0_dp

      exp_ri_kind = 10.0_dp

      exp_ao_kind = 10.0_dp


      eps = bs_env%eps_filter*bs_env%heuristic_filter_factor


      DO ikind = 1, nkind


         CALL get_gto_basis_set(bs_env%basis_set_RI(ikind)%gto_basis_set, zet=exp_ri)

         CALL get_gto_basis_set(bs_env%basis_set_ao(ikind)%gto_basis_set, zet=exp_ao)


         ! we need to remove all exponents lower than a lower bound, e.g. 1E-3, because

         ! for contracted basis sets, there might be exponents = 0 in zet

         DO i = 1, SIZE(exp_ri, 1)

            DO j = 1, SIZE(exp_ri, 2)

               IF (exp_ri(i, j) < exp_min_ri .AND. exp_ri(i, j) > 1e-3_dp) exp_min_ri = exp_ri(i, j)

               IF (exp_ri(i, j) < exp_ri_kind(ikind) .AND. exp_ri(i, j) > 1e-3_dp) &

                  exp_ri_kind(ikind) = exp_ri(i, j)

            END DO

         END DO

         DO i = 1, SIZE(exp_ao, 1)

            DO j = 1, SIZE(exp_ao, 2)

               IF (exp_ao(i, j) < exp_min_ao .AND. exp_ao(i, j) > 1e-3_dp) exp_min_ao = exp_ao(i, j)

               IF (exp_ao(i, j) < exp_ao_kind(ikind) .AND. exp_ao(i, j) > 1e-3_dp) &

                  exp_ao_kind(ikind) = exp_ao(i, j)

            END DO

         END DO

         radius_ao_kind(ikind) = sqrt(-log(eps)/exp_ao_kind(ikind))

         radius_ao_product_kind(ikind) = sqrt(-log(eps)/(2.0_dp*exp_ao_kind(ikind)))

         radius_ri_kind(ikind) = sqrt(-log(eps)/exp_ri_kind(ikind))

      END DO


      radius_ao = sqrt(-log(eps)/exp_min_ao)

      radius_ao_product = sqrt(-log(eps)/(2.0_dp*exp_min_ao))

      radius_ri = sqrt(-log(eps)/exp_min_ri)


      CALL get_atomic_kind_set(atomic_kind_set=atomic_kind_set, kind_of=kind_of)


      ! For a 3c integral (μR υS | P0) we have that cell R and cell S need to be within radius_3c

      cell_radius_3c = radius_ao_product + radius_ri + bs_env%ri_metric%cutoff_radius


      n_max(1:3) = bs_env%periodic(1:3)*30


      nimages_3c_max = 0


      i_cell_x_min = 0

      i_cell_x_max = 0

      j_cell_y_min = 0

      j_cell_y_max = 0

      k_cell_z_min = 0

      k_cell_z_max = 0


      DO i_cell_x = -n_max(1), n_max(1)

         DO j_cell_y = -n_max(2), n_max(2)

            DO k_cell_z = -n_max(3), n_max(3)


               cell_index(1:3) = (/i_cell_x, j_cell_y, k_cell_z/)


               CALL get_cell_dist(cell_index, bs_env%hmat, cell_dist)


               IF (cell_dist < cell_radius_3c) THEN

                  nimages_3c_max = nimages_3c_max + 1

                  i_cell_x_min = min(i_cell_x_min, i_cell_x)

                  i_cell_x_max = max(i_cell_x_max, i_cell_x)

                  j_cell_y_min = min(j_cell_y_min, j_cell_y)

                  j_cell_y_max = max(j_cell_y_max, j_cell_y)

                  k_cell_z_min = min(k_cell_z_min, k_cell_z)

                  k_cell_z_max = max(k_cell_z_max, k_cell_z)

               END IF


            END DO

         END DO

      END DO


      ! get index_to_cell_3c_max for the maximum possible cell range;

      ! compute 3c integrals later in this routine and check really which cell is needed

      ALLOCATE (index_to_cell_3c_max(nimages_3c_max, 3))


      img = 0

      DO i_cell_x = -n_max(1), n_max(1)

         DO j_cell_y = -n_max(2), n_max(2)

            DO k_cell_z = -n_max(3), n_max(3)


               cell_index(1:3) = (/i_cell_x, j_cell_y, k_cell_z/)


               CALL get_cell_dist(cell_index, bs_env%hmat, cell_dist)


               IF (cell_dist < cell_radius_3c) THEN

                  img = img + 1

                  index_to_cell_3c_max(img, 1:3) = cell_index(1:3)

               END IF


            END DO

         END DO

      END DO


      ! get pairs of R and S which have non-zero 3c integral (μR υS | P0)

      ALLOCATE (nblocks_3c_max(nimages_3c_max, nimages_3c_max))

      nblocks_3c_max(:, :) = 0


      block_count = 0

      DO j_cell = 1, nimages_3c_max

         DO k_cell = 1, nimages_3c_max


            DO atom_j = 1, bs_env%n_atom

            DO atom_k = 1, bs_env%n_atom

            DO atom_i = 1, bs_env%n_atom


               block_count = block_count + 1

               IF (modulo(block_count, bs_env%para_env%num_pe) .NE. bs_env%para_env%mepos) cycle


               CALL scaled_to_real(vec_cell_j, real(index_to_cell_3c_max(j_cell, 1:3), kind=dp), cell)

               CALL scaled_to_real(vec_cell_k, real(index_to_cell_3c_max(k_cell, 1:3), kind=dp), cell)


               rij = pbc(particle_set(atom_j)%r(:), cell) - pbc(particle_set(atom_i)%r(:), cell) + vec_cell_j(:)

               rjk = pbc(particle_set(atom_k)%r(:), cell) - pbc(particle_set(atom_j)%r(:), cell) &

                     + vec_cell_k(:) - vec_cell_j(:)

               rik(:) = rij(:) + rjk(:)

               dij = norm2(rij)

               dik = norm2(rik)

               djk = norm2(rjk)

               IF (djk > radius_ao_kind(kind_of(atom_j)) + radius_ao_kind(kind_of(atom_k))) cycle

               IF (dij > radius_ao_kind(kind_of(atom_j)) + radius_ri_kind(kind_of(atom_i)) &

                   + bs_env%ri_metric%cutoff_radius) cycle

               IF (dik > radius_ri_kind(kind_of(atom_i)) + radius_ao_kind(kind_of(atom_k)) &

                   + bs_env%ri_metric%cutoff_radius) cycle


               j_size = bs_env%i_ao_end_from_atom(atom_j) - bs_env%i_ao_start_from_atom(atom_j) + 1

               k_size = bs_env%i_ao_end_from_atom(atom_k) - bs_env%i_ao_start_from_atom(atom_k) + 1

               i_size = bs_env%i_RI_end_from_atom(atom_i) - bs_env%i_RI_start_from_atom(atom_i) + 1


               ALLOCATE (int_3c(j_size, k_size, i_size))


               ! compute 3-c int. ( μ(atom j) R , ν (atom k) S | P (atom i) 0 )

               ! ("|": truncated Coulomb operator), inside build_3c_integrals: (j k | i)

               CALL build_3c_integral_block(int_3c, qs_env, bs_env%ri_metric, &

                                            basis_j=bs_env%basis_set_AO, &

                                            basis_k=bs_env%basis_set_AO, &

                                            basis_i=bs_env%basis_set_RI, &

                                            cell_j=index_to_cell_3c_max(j_cell, 1:3), &

                                            cell_k=index_to_cell_3c_max(k_cell, 1:3), &

                                            atom_k=atom_k, atom_j=atom_j, atom_i=atom_i)


               frobenius_norm = sqrt(sum(int_3c(:, :, :)**2))


               DEALLOCATE (int_3c)


               ! we use a higher threshold here to safe memory when storing the 3c integrals

               ! in every tensor group

               IF (frobenius_norm > eps) THEN

                  nblocks_3c_max(j_cell, k_cell) = nblocks_3c_max(j_cell, k_cell) + 1

               END IF


            END DO

            END DO

            END DO


         END DO

      END DO


      CALL bs_env%para_env%sum(nblocks_3c_max)


      ALLOCATE (n_other_3c_images_max(nimages_3c_max))

      n_other_3c_images_max(:) = 0


      nimages_3c = 0

      nimage_pairs_3c = 0


      DO j_cell = 1, nimages_3c_max

         DO k_cell = 1, nimages_3c_max

            IF (nblocks_3c_max(j_cell, k_cell) > 0) THEN

               n_other_3c_images_max(j_cell) = n_other_3c_images_max(j_cell) + 1

               nimage_pairs_3c = nimage_pairs_3c + 1

            END IF

         END DO


         IF (n_other_3c_images_max(j_cell) > 0) nimages_3c = nimages_3c + 1


      END DO


      bs_env%nimages_3c = nimages_3c

      ALLOCATE (bs_env%index_to_cell_3c(nimages_3c, 3))

      ALLOCATE (bs_env%cell_to_index_3c(i_cell_x_min:i_cell_x_max, &

                                        j_cell_y_min:j_cell_y_max, &

                                        k_cell_z_min:k_cell_z_max))

      bs_env%cell_to_index_3c(:, :, :) = -1


      ALLOCATE (bs_env%nblocks_3c(nimages_3c, nimages_3c))

      bs_env%nblocks_3c(nimages_3c, nimages_3c) = 0


      j_cell = 0

      DO j_cell_max = 1, nimages_3c_max

         IF (n_other_3c_images_max(j_cell_max) == 0) cycle

         j_cell = j_cell + 1

         cell_index(1:3) = index_to_cell_3c_max(j_cell_max, 1:3)

         bs_env%index_to_cell_3c(j_cell, 1:3) = cell_index(1:3)

         bs_env%cell_to_index_3c(cell_index(1), cell_index(2), cell_index(3)) = j_cell


         k_cell = 0

         DO k_cell_max = 1, nimages_3c_max

            IF (n_other_3c_images_max(k_cell_max) == 0) cycle

            k_cell = k_cell + 1


            bs_env%nblocks_3c(j_cell, k_cell) = nblocks_3c_max(j_cell_max, k_cell_max)

         END DO


      END DO


      ! we use: 8*10^-9 GB / double precision number

      mem_3c_gb = real(bs_env%n_RI, kind=dp)*real(bs_env%n_ao, kind=dp)**2 &

                  *real(nimage_pairs_3c, kind=dp)*8e-9_dp


      CALL m_memory(mem_occ_per_proc)

      CALL bs_env%para_env%max(mem_occ_per_proc)


      mem_occ_per_proc_gb = real(mem_occ_per_proc, kind=dp)/1.0e9_dp


      ! number of processors per group that entirely stores the 3c integrals and does tensor ops

      avail_mem_per_proc_gb = bs_env%input_memory_per_proc_GB - mem_occ_per_proc_gb


      ! careful: converting real to integer truncates (1.9 -> 1); thus add 1.0 to round up (1.9 -> 2)

      bs_env%group_size_tensor = max(int(mem_3c_gb/avail_mem_per_proc_gb + 1.0_dp), 1)


      u = bs_env%unit_nr


      IF (u > 0) THEN

         WRITE (u, fmt="(T2,A,F52.1,A)") "Radius of atomic orbitals", radius_ao*angstrom, Å" "

         WRITE (u, fmt="(T2,A,F55.1,A)") "Radius of RI functions", radius_ri*angstrom, Å" "

         WRITE (u, fmt="(T2,A,I47)") "Number of cells for 3c integrals", nimages_3c

         WRITE (u, fmt="(T2,A,I42)") "Number of cell pairs for 3c integrals", nimage_pairs_3c

         WRITE (u, '(T2,A)') ''

         WRITE (u, '(T2,A,F37.1,A)') 'Input: Available memory per MPI process', &

            bs_env%input_memory_per_proc_GB, ' GB'

         WRITE (u, '(T2,A,F35.1,A)') 'Used memory per MPI process before GW run', &

            mem_occ_per_proc_gb, ' GB'

         WRITE (u, '(T2,A,F44.1,A)') 'Memory of three-center integrals', mem_3c_gb, ' GB'

      END IF


      CALL timestop(handle)


   END SUBROUTINE setup_cells_3c


! **************************************************************************************************

!> \brief ...

!> \param index_to_cell_1 ...

!> \param index_to_cell_2 ...

!> \param nimages_1 ...

!> \param nimages_2 ...

!> \param index_to_cell ...

!> \param cell_to_index ...

!> \param nimages ...

! **************************************************************************************************

   SUBROUTINE sum_two_r_grids(index_to_cell_1, index_to_cell_2, nimages_1, nimages_2, &
                              index_to_cell, cell_to_index, nimages)

      ! Build the set of distinct cell vectors R = R_1 + R_2, with R_1 taken from the first
      ! nimages_1 rows of index_to_cell_1 and R_2 from the first nimages_2 rows of
      ! index_to_cell_2.
      !
      !   index_to_cell_1/2 : cell vectors, one per row (columns 1:3 are used)
      !   nimages_1/2       : number of rows to combine from each list
      !   index_to_cell     : allocated here as (nimages, 3); row i is the i-th distinct sum
      !   cell_to_index     : allocated here over the bounding box of all possible sums;
      !                       holds the row index of a sum, or -1 if that cell never occurs
      !   nimages           : number of distinct sums found

      INTEGER, DIMENSION(:, :)                           :: index_to_cell_1, index_to_cell_2
      INTEGER                                            :: nimages_1, nimages_2
      INTEGER, ALLOCATABLE, DIMENSION(:, :)              :: index_to_cell
      INTEGER, DIMENSION(:, :, :), POINTER               :: cell_to_index
      INTEGER                                            :: nimages

      CHARACTER(LEN=*), PARAMETER                        :: routineN = 'sum_two_R_grids'

      INTEGER                                            :: handle, i_1, i_2, n_box
      INTEGER, ALLOCATABLE, DIMENSION(:, :)              :: cells_found
      INTEGER, DIMENSION(3)                              :: r_hi, r_lo, r_sum

      CALL timeset(routineN, handle)

      ! bounding box of R_1 + R_2 along x, y, z
      r_lo(1:3) = MINVAL(index_to_cell_1(:, 1:3), DIM=1) + MINVAL(index_to_cell_2(:, 1:3), DIM=1)
      r_hi(1:3) = MAXVAL(index_to_cell_1(:, 1:3), DIM=1) + MAXVAL(index_to_cell_2(:, 1:3), DIM=1)

      ! upper bound for the number of distinct sums: every cell inside the box
      n_box = PRODUCT(r_hi(1:3) - r_lo(1:3) + 1)

      ALLOCATE (cells_found(n_box, 3))
      cells_found(:, :) = -1

      ALLOCATE (cell_to_index(r_lo(1):r_hi(1), r_lo(2):r_hi(2), r_lo(3):r_hi(3)))
      cell_to_index(:, :, :) = -1

      nimages = 0

      DO i_1 = 1, nimages_1
         DO i_2 = 1, nimages_2

            r_sum(1:3) = index_to_cell_1(i_1, 1:3) + index_to_cell_2(i_2, 1:3)

            ! -1 marks a cell that has not been registered yet
            IF (cell_to_index(r_sum(1), r_sum(2), r_sum(3)) /= -1) CYCLE

            nimages = nimages + 1
            cell_to_index(r_sum(1), r_sum(2), r_sum(3)) = nimages
            cells_found(nimages, 1:3) = r_sum(1:3)

         END DO
      END DO

      ! hand back only the rows that were actually filled
      ALLOCATE (index_to_cell(nimages, 3))
      index_to_cell(:, :) = cells_found(1:nimages, 1:3)

      CALL timestop(handle)

   END SUBROUTINE sum_two_r_grids


! **************************************************************************************************

!> \brief ...

!> \param qs_env ...

!> \param bs_env ...

! **************************************************************************************************

   SUBROUTINE compute_3c_integrals(qs_env, bs_env)

      ! Allocate one tensor per pair of 3c image cells in bs_env%t_3c_int (each created from
      ! the template bs_env%t_RI_AO__AO) and fill them via build_3c_integrals, using the RI
      ! basis for index i and the AO basis for indices j and k.
      !
      !   qs_env : Quickstep environment, passed on to build_3c_integrals
      !   bs_env : band-structure environment; t_3c_int is allocated and filled here

      TYPE(qs_environment_type), POINTER                 :: qs_env
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER :: routineN = 'compute_3c_integrals'

      INTEGER                                            :: handle, i_img_j, i_img_k, n_img

      CALL timeset(routineN, handle)

      n_img = bs_env%nimages_3c

      ALLOCATE (bs_env%t_3c_int(n_img, n_img))
      DO i_img_j = 1, n_img
         DO i_img_k = 1, n_img
            CALL dbt_create(bs_env%t_RI_AO__AO, bs_env%t_3c_int(i_img_j, i_img_k))
         END DO
      END DO

      ! the integral screening threshold is 5% of the tensor filter threshold
      CALL build_3c_integrals(bs_env%t_3c_int, &
                              bs_env%eps_filter, &
                              qs_env, &
                              bs_env%nl_3c, &
                              int_eps=bs_env%eps_filter*0.05_dp, &
                              basis_i=bs_env%basis_set_RI, &
                              basis_j=bs_env%basis_set_AO, &
                              basis_k=bs_env%basis_set_AO, &
                              potential_parameter=bs_env%ri_metric, &
                              desymmetrize=.FALSE., do_kpoints=.TRUE., cell_sym=.TRUE., &
                              cell_to_index_ext=bs_env%cell_to_index_3c)

      CALL bs_env%para_env%sync()

      CALL timestop(handle)

   END SUBROUTINE compute_3c_integrals


! **************************************************************************************************

!> \brief ...

!> \param cell_index ...

!> \param hmat ...

!> \param cell_dist ...

! **************************************************************************************************

   SUBROUTINE get_cell_dist(cell_index, hmat, cell_dist)

      ! Distance associated with a cell index, measured to the adjacent face of the cell
      ! rather than between cell centers.
      !
      !   cell_index : integer cell vector
      !   hmat       : 3x3 matrix applied to the (adjusted) cell vector
      !   cell_dist  : on return, Euclidean norm of hmat * adjusted cell vector

      INTEGER, DIMENSION(3)                              :: cell_index
      REAL(kind=dp)                                      :: hmat(3, 3), cell_dist

      CHARACTER(LEN=*), PARAMETER                        :: routineN = 'get_cell_dist'

      INTEGER                                            :: handle
      INTEGER, DIMENSION(3)                              :: cell_index_adj
      REAL(kind=dp)                                      :: shift(3)

      CALL timeset(routineN, handle)

      ! move every non-zero component one step towards zero (2 -> 1, -3 -> -2, 0 -> 0):
      ! the distance is taken to the neighboring cell boundary, not between cell centers
      cell_index_adj(1:3) = cell_index(1:3) - SIGN(MIN(ABS(cell_index(1:3)), 1), cell_index(1:3))

      shift(1:3) = MATMUL(hmat, REAL(cell_index_adj, kind=dp))

      cell_dist = SQRT(SUM(shift(1:3)**2))

      CALL timestop(handle)

   END SUBROUTINE get_cell_dist


! **************************************************************************************************

!> \brief ...

!> \param qs_env ...

!> \param bs_env ...

!> \param kpoints ...

!> \param do_print ...

! **************************************************************************************************

   SUBROUTINE setup_kpoints_scf_desymm(qs_env, bs_env, kpoints, do_print)

      ! Create a k-point object that covers the full SCF k-point grid with equal weights
      ! (scheme "GENERAL"), together with the matching symmetric grid of real-space cells.
      !
      !   qs_env   : Quickstep environment; the SCF k-point grid is read from it
      !   bs_env   : band-structure environment; nkp_scf_desymm and nimages_scf_desymm are set
      !   kpoints  : nullified and newly created here; xkp, wkp, cell_to_index and
      !              index_to_cell are allocated and filled
      !   do_print : if true, the number of cells is written to bs_env%unit_nr (when > 0)

      TYPE(qs_environment_type), POINTER                 :: qs_env
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env
      TYPE(kpoint_type), POINTER                         :: kpoints
      LOGICAL                                            :: do_print

      CHARACTER(LEN=*), PARAMETER :: routinen = 'setup_kpoints_scf_desymm'

      INTEGER                                            :: handle, i_cell_x, i_dim, img, j_cell_y, &
                                                            k_cell_z, nimages, nkp, u
      INTEGER, DIMENSION(3)                              :: cell_grid, cixd, nkp_grid
      TYPE(kpoint_type), POINTER                         :: kpoints_scf

      CALL timeset(routinen, handle)

      NULLIFY (kpoints)
      CALL kpoint_create(kpoints)

      CALL get_qs_env(qs_env=qs_env, kpoints=kpoints_scf)

      nkp_grid(1:3) = kpoints_scf%nkp_grid(1:3)
      nkp = nkp_grid(1)*nkp_grid(2)*nkp_grid(3)

      ! we need in periodic directions at least 2 k-points in the SCF
      DO i_dim = 1, 3
         IF (bs_env%periodic(i_dim) == 1) THEN
            cpassert(nkp_grid(i_dim) > 1)
         END IF
      END DO

      kpoints%kp_scheme = "GENERAL"
      kpoints%nkp_grid(1:3) = nkp_grid(1:3)
      kpoints%nkp = nkp
      bs_env%nkp_scf_desymm = nkp

      ALLOCATE (kpoints%xkp(1:3, nkp))
      CALL compute_xkp(kpoints%xkp, 1, nkp, nkp_grid)

      ! every k-point carries the same weight
      ALLOCATE (kpoints%wkp(nkp))
      kpoints%wkp(:) = 1.0_dp/REAL(nkp, kind=dp)

      ! for example 4x3x6 kpoint grid -> 3x3x5 cell grid because we need the same number of
      ! neighbor cells on both sides of the unit cell (even grid sizes are reduced by one)
      cell_grid(1:3) = nkp_grid(1:3) - MODULO(nkp_grid(1:3) + 1, 2)

      ! cell index: for example for x: from -n_x/2 to +n_x/2, n_x: number of cells in x direction
      cixd(1:3) = cell_grid(1:3)/2

      nimages = cell_grid(1)*cell_grid(2)*cell_grid(3)

      bs_env%nimages_scf_desymm = nimages

      ALLOCATE (kpoints%cell_to_index(-cixd(1):cixd(1), -cixd(2):cixd(2), -cixd(3):cixd(3)))
      ALLOCATE (kpoints%index_to_cell(nimages, 3))

      ! enumerate the cells; z runs fastest, x slowest
      img = 0
      DO i_cell_x = -cixd(1), cixd(1)
         DO j_cell_y = -cixd(2), cixd(2)
            DO k_cell_z = -cixd(3), cixd(3)
               img = img + 1
               kpoints%cell_to_index(i_cell_x, j_cell_y, k_cell_z) = img
               kpoints%index_to_cell(img, 1:3) = (/i_cell_x, j_cell_y, k_cell_z/)
            END DO
         END DO
      END DO

      u = bs_env%unit_nr
      IF (u > 0 .AND. do_print) THEN
         ! label (30 characters) + I49 fills the 80-column output line
         WRITE (u, fmt="(T2,A,I49)") "Number of cells for G, χ, W, Σ", nimages
      END IF

      CALL timestop(handle)

   END SUBROUTINE setup_kpoints_scf_desymm


! **************************************************************************************************

!> \brief ...

!> \param bs_env ...

! **************************************************************************************************

   SUBROUTINE setup_cells_delta_r(bs_env)

      ! Set up the grid of cell differences ΔR by combining the 3c cell list with itself
      ! (see sum_two_r_grids). Fills bs_env%index_to_cell_Delta_R,
      ! bs_env%cell_to_index_Delta_R and bs_env%nimages_Delta_R and reports the number of
      ! ΔR cells on bs_env%unit_nr (when > 0).
      !
      !   bs_env : band-structure environment (3c cell list is read, ΔR grid is written)

      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER :: routinen = 'setup_cells_Delta_R'

      INTEGER                                            :: handle

      CALL timeset(routinen, handle)

      ! cell sums batch wise for fixed ΔR = S_1 - R_1; for example:
      ! Σ_λσ^R = sum_PR1νS1 M^G_λ0,νS1,PR1 M^W_σR,νS1,PR1

      CALL sum_two_r_grids(bs_env%index_to_cell_3c, &
                           bs_env%index_to_cell_3c, &
                           bs_env%nimages_3c, bs_env%nimages_3c, &
                           bs_env%index_to_cell_Delta_R, &
                           bs_env%cell_to_index_Delta_R, &
                           bs_env%nimages_Delta_R)

      IF (bs_env%unit_nr > 0) THEN
         ! label (18 characters) + I61 fills the 80-column output line
         WRITE (bs_env%unit_nr, fmt="(T2,A,I61)") "Number of cells ΔR", bs_env%nimages_Delta_R
      END IF

      CALL timestop(handle)

   END SUBROUTINE setup_cells_delta_r


! **************************************************************************************************

!> \brief ...

!> \param bs_env ...

! **************************************************************************************************

   SUBROUTINE setup_parallelization_delta_r(bs_env)

      ! Distribute the ΔR cells over the tensor groups and store the cells owned by the
      ! local tensor group in bs_env%task_Delta_R. Also allocates the "skip" flag arrays of
      ! bs_env, all initialised to .FALSE.
      !
      !   bs_env : band-structure environment (n_tasks_Delta_R_local, task_Delta_R and the
      !            skip_DR_* arrays are set here)

      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER :: routineN = 'setup_parallelization_Delta_R'

      INTEGER                                            :: handle, i_dr, i_task, n_tasks_local
      INTEGER, ALLOCATABLE, DIMENSION(:)                 :: group_of_dr, n_ops_per_dr

      CALL timeset(routineN, handle)

      ! cost estimate per ΔR cell, then assignment of every cell to a tensor group
      CALL compute_n_tensor_ops_delta_r(bs_env, n_ops_per_dr)
      CALL compute_delta_r_dist(bs_env, n_ops_per_dr, group_of_dr, n_tasks_local)

      bs_env%n_tasks_Delta_R_local = n_tasks_local

      ALLOCATE (bs_env%task_Delta_R(n_tasks_local))

      ! collect, in ascending order, the ΔR cells assigned to the local tensor group
      i_task = 0
      DO i_dr = 1, bs_env%nimages_Delta_R
         IF (group_of_dr(i_dr) == bs_env%tensor_group_color) THEN
            i_task = i_task + 1
            bs_env%task_Delta_R(i_task) = i_dr
         END IF
      END DO

      ALLOCATE (bs_env%skip_DR_chi(n_tasks_local))
      bs_env%skip_DR_chi(:) = .FALSE.
      ALLOCATE (bs_env%skip_DR_Sigma(n_tasks_local))
      bs_env%skip_DR_Sigma(:) = .FALSE.

      ! skip flags for the chi tensor operations
      CALL allocate_skip_3xr(bs_env%skip_DR_R12_S_Goccx3c_chi, bs_env)
      CALL allocate_skip_3xr(bs_env%skip_DR_R12_S_Gvirx3c_chi, bs_env)
      CALL allocate_skip_3xr(bs_env%skip_DR_R_R2_MxM_chi, bs_env)

      ! skip flags for the Sigma tensor operations
      CALL allocate_skip_3xr(bs_env%skip_DR_R1_S2_Gx3c_Sigma, bs_env)
      CALL allocate_skip_3xr(bs_env%skip_DR_R1_R_MxM_Sigma, bs_env)

      CALL timestop(handle)

   END SUBROUTINE setup_parallelization_delta_r


! **************************************************************************************************

!> \brief ...

!> \param skip ...

!> \param bs_env ...

! **************************************************************************************************

   SUBROUTINE allocate_skip_3xr(skip, bs_env)

      ! Allocate a logical flag array of shape
      ! (n_tasks_Delta_R_local, nimages_3c, nimages_scf_desymm) with every entry .FALSE.
      !
      !   skip   : array to allocate
      !   bs_env : band-structure environment providing the three extents

      LOGICAL, ALLOCATABLE, DIMENSION(:, :, :)           :: skip
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER                        :: routineN = 'allocate_skip_3xR'

      INTEGER                                            :: handle

      CALL timeset(routineN, handle)

      ALLOCATE (skip(bs_env%n_tasks_Delta_R_local, &
                     bs_env%nimages_3c, &
                     bs_env%nimages_scf_desymm), SOURCE=.FALSE.)

      CALL timestop(handle)

   END SUBROUTINE allocate_skip_3xr


! **************************************************************************************************

!> \brief ...

!> \param bs_env ...

!> \param n_tensor_ops_Delta_R ...

!> \param i_cell_Delta_R_group ...

!> \param n_tasks_local ...

! **************************************************************************************************

   SUBROUTINE compute_delta_r_dist(bs_env, n_tensor_ops_Delta_R, i_cell_Delta_R_group, n_tasks_local)

      ! Greedy load balancing: repeatedly hand the ΔR cell with the largest remaining
      ! operation count to the tensor group that currently carries the smallest load.
      !
      !   bs_env               : band-structure environment (nimages_Delta_R,
      !                          num_tensor_groups, tensor_group_color, unit_nr are read)
      !   n_tensor_ops_Delta_R : operation count per ΔR cell; NOTE: consumed here, every
      !                          entry is zero on return
      !   i_cell_Delta_R_group : allocated here; 0-based tensor group of every ΔR cell, or
      !                          -1 for cells whose operation count was zero on entry
      !   n_tasks_local        : number of ΔR cells assigned to the local tensor group

      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env
      INTEGER, ALLOCATABLE, DIMENSION(:)                 :: n_tensor_ops_delta_r, &
                                                            i_cell_delta_r_group
      INTEGER                                            :: n_tasks_local

      CHARACTER(LEN=*), PARAMETER :: routineN = 'compute_Delta_R_dist'

      INTEGER                                            :: handle, i_heaviest, i_lightest, n_dr, u
      INTEGER, ALLOCATABLE, DIMENSION(:)                 :: load_per_group

      CALL timeset(routineN, handle)

      n_dr = bs_env%nimages_Delta_R
      u = bs_env%unit_nr

      ! with fewer cells than groups some groups necessarily stay idle
      IF (u > 0 .AND. n_dr < bs_env%num_tensor_groups) THEN
         WRITE (u, fmt="(T2,A,I5,A,I5,A)") "There are only ", n_dr, &
            " tasks to work on but there are ", bs_env%num_tensor_groups, " groups."
         WRITE (u, fmt="(T2,A)") "Please reduce the number of MPI processes."
         WRITE (u, '(T2,A)') ''
      END IF

      ALLOCATE (load_per_group(bs_env%num_tensor_groups))
      load_per_group(:) = 0

      ALLOCATE (i_cell_delta_r_group(n_dr))
      i_cell_delta_r_group(:) = -1

      n_tasks_local = 0

      DO
         ! done once every cell with work has been handed out
         IF (ALL(n_tensor_ops_delta_r(:) == 0)) EXIT

         ! most expensive cell still unassigned / least loaded group so far
         i_heaviest = MAXLOC(n_tensor_ops_delta_r, 1)
         i_lightest = MINLOC(load_per_group, 1)

         ! the tensor groups are 0-index based; but i_lightest is 1-index based
         i_cell_delta_r_group(i_heaviest) = i_lightest - 1
         load_per_group(i_lightest) = load_per_group(i_lightest) + n_tensor_ops_delta_r(i_heaviest)

         ! mark the cell as distributed
         n_tensor_ops_delta_r(i_heaviest) = 0

         IF (bs_env%tensor_group_color == i_lightest - 1) n_tasks_local = n_tasks_local + 1
      END DO

      CALL timestop(handle)

   END SUBROUTINE compute_delta_r_dist


! **************************************************************************************************

!> \brief ...

!> \param bs_env ...

!> \param n_tensor_ops_Delta_R ...

! **************************************************************************************************

   SUBROUTINE compute_n_tensor_ops_delta_r(bs_env, n_tensor_ops_Delta_R)

      ! Count, for every ΔR cell, the (R_1, R_2) combinations for which all required cells
      ! are contained in the 3c cell list. The ΔR cells are spread over the tensor groups by
      ! their index modulo num_tensor_groups and the counts are summed over bs_env%para_env.
      !
      !   bs_env               : band-structure environment (cell lists are read)
      !   n_tensor_ops_Delta_R : allocated here with one counter per ΔR cell

      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env
      INTEGER, ALLOCATABLE, DIMENSION(:)                 :: n_tensor_ops_delta_r

      CHARACTER(LEN=*), PARAMETER :: routineN = 'compute_n_tensor_ops_Delta_R'

      INTEGER :: handle, i_cell_delta_r, i_cell_r, i_cell_r1, i_cell_r1_minus_r, i_cell_r2, &
         i_cell_r2_m_r1, i_cell_s1, i_cell_s1_m_r1_p_r2, i_cell_s1_minus_r, i_cell_s2, &
         n_img_3c, n_img_scf, nimages_delta_r
      INTEGER, DIMENSION(3) :: cell_dr, cell_m_r1, cell_r, cell_r1, cell_r1_minus_r, cell_r2, &
         cell_r2_m_r1, cell_s1, cell_s1_m_r2_p_r1, cell_s1_minus_r, cell_s1_p_s2_m_r1, cell_s2
      LOGICAL                                            :: cell_found

      CALL timeset(routineN, handle)

      nimages_delta_r = bs_env%nimages_Delta_R
      n_img_3c = bs_env%nimages_3c
      n_img_scf = bs_env%nimages_scf_desymm

      ALLOCATE (n_tensor_ops_delta_r(nimages_delta_r))
      n_tensor_ops_delta_r(:) = 0

      ! compute number of tensor operations for specific Delta_R
      DO i_cell_delta_r = 1, nimages_delta_r

         ! round-robin split of the ΔR cells over the tensor groups
         IF (MODULO(i_cell_delta_r, bs_env%num_tensor_groups) /= bs_env%tensor_group_color) CYCLE

         cell_dr(1:3) = bs_env%index_to_cell_Delta_R(i_cell_delta_r, 1:3)

         DO i_cell_r1 = 1, n_img_3c

            cell_r1(1:3) = bs_env%index_to_cell_3c(i_cell_r1, 1:3)

            ! S_1 = R_1 + ΔR (from ΔR = S_1 - R_1)
            CALL add_r(cell_r1, cell_dr, bs_env%index_to_cell_3c, cell_s1, &
                       cell_found, bs_env%cell_to_index_3c, i_cell_s1)
            IF (.NOT. cell_found) CYCLE

            ! this loop is the only one that increments the counter
            DO i_cell_r2 = 1, n_img_scf

               cell_r2(1:3) = bs_env%kpoints_scf_desymm%index_to_cell(i_cell_r2, 1:3)

               ! R_2 - R_1
               CALL add_r(cell_r2, -cell_r1, bs_env%index_to_cell_3c, cell_r2_m_r1, &
                          cell_found, bs_env%cell_to_index_3c, i_cell_r2_m_r1)
               IF (.NOT. cell_found) CYCLE

               ! S_1 - R_1 + R_2
               CALL add_r(cell_s1, cell_r2_m_r1, bs_env%index_to_cell_3c, cell_s1_m_r2_p_r1, &
                          cell_found, bs_env%cell_to_index_3c, i_cell_s1_m_r1_p_r2)
               IF (.NOT. cell_found) CYCLE

               n_tensor_ops_delta_r(i_cell_delta_r) = n_tensor_ops_delta_r(i_cell_delta_r) + 1

            END DO ! i_cell_R2

            ! NOTE(review): the following two loops only test whether cells exist; they never
            ! change n_tensor_ops_Delta_R. Confirm whether a counter increment is intended
            ! here or whether the loops can be removed.
            DO i_cell_s2 = 1, n_img_scf

               cell_s2(1:3) = bs_env%kpoints_scf_desymm%index_to_cell(i_cell_s2, 1:3)
               cell_m_r1(1:3) = -cell_r1(1:3)
               cell_s1_p_s2_m_r1(1:3) = cell_s1(1:3) + cell_s2(1:3) - cell_r1(1:3)

               ! -R_1
               CALL is_cell_in_index_to_cell(cell_m_r1, bs_env%index_to_cell_3c, cell_found)
               IF (.NOT. cell_found) CYCLE

               ! S_1 + S_2 - R_1
               CALL is_cell_in_index_to_cell(cell_s1_p_s2_m_r1, bs_env%index_to_cell_3c, cell_found)
               IF (.NOT. cell_found) CYCLE

            END DO ! i_cell_S2

            DO i_cell_r = 1, n_img_scf

               cell_r = bs_env%kpoints_scf_desymm%index_to_cell(i_cell_r, 1:3)

               ! R_1 - R
               CALL add_r(cell_r1, -cell_r, bs_env%index_to_cell_3c, cell_r1_minus_r, &
                          cell_found, bs_env%cell_to_index_3c, i_cell_r1_minus_r)
               IF (.NOT. cell_found) CYCLE

               ! S_1 - R
               CALL add_r(cell_s1, -cell_r, bs_env%index_to_cell_3c, cell_s1_minus_r, &
                          cell_found, bs_env%cell_to_index_3c, i_cell_s1_minus_r)
               IF (.NOT. cell_found) CYCLE

            END DO ! i_cell_R

         END DO ! i_cell_R1

      END DO ! i_cell_Delta_R

      ! combine the partial counts of all processes
      CALL bs_env%para_env%sum(n_tensor_ops_delta_r)

      CALL timestop(handle)

   END SUBROUTINE compute_n_tensor_ops_delta_r


! **************************************************************************************************

!> \brief ...

!> \param cell_1 ...

!> \param cell_2 ...

!> \param index_to_cell ...

!> \param cell_1_plus_2 ...

!> \param cell_found ...

!> \param cell_to_index ...

!> \param i_cell_1_plus_2 ...

! **************************************************************************************************


   SUBROUTINE add_r(cell_1, cell_2, index_to_cell, cell_1_plus_2, cell_found, &
                    cell_to_index, i_cell_1_plus_2)

      ! Add two cell vectors and look the result up in a cell list.
      !
      !   cell_1, cell_2  : cell vectors to add
      !   index_to_cell   : list of known cells, one per row
      !   cell_1_plus_2   : on return, cell_1 + cell_2
      !   cell_found      : on return, whether the sum is a row of index_to_cell
      !   cell_to_index   : (optional) map from cell vector to list index; has to be present
      !                     when i_cell_1_plus_2 is requested and the sum was found
      !   i_cell_1_plus_2 : (optional) index of the sum taken from cell_to_index,
      !                     or -1000 if the sum is not in the list

      INTEGER, DIMENSION(3)                              :: cell_1, cell_2
      INTEGER, DIMENSION(:, :)                           :: index_to_cell
      INTEGER, DIMENSION(3)                              :: cell_1_plus_2
      LOGICAL                                            :: cell_found
      INTEGER, DIMENSION(:, :, :), INTENT(IN), &
         OPTIONAL, POINTER                               :: cell_to_index
      INTEGER, INTENT(OUT), OPTIONAL                     :: i_cell_1_plus_2

      CHARACTER(LEN=*), PARAMETER                        :: routineN = 'add_R'

      INTEGER                                            :: handle

      CALL timeset(routineN, handle)

      cell_1_plus_2(1:3) = cell_1(1:3) + cell_2(1:3)

      CALL is_cell_in_index_to_cell(cell_1_plus_2, index_to_cell, cell_found)

      IF (PRESENT(i_cell_1_plus_2)) THEN
         ! sentinel for "not in the list"; replaced below if the cell exists
         i_cell_1_plus_2 = -1000
         IF (cell_found) THEN
            cpassert(PRESENT(cell_to_index))
            i_cell_1_plus_2 = cell_to_index(cell_1_plus_2(1), cell_1_plus_2(2), cell_1_plus_2(3))
         END IF
      END IF

      CALL timestop(handle)

   END SUBROUTINE add_r


! **************************************************************************************************

!> \brief ...

!> \param cell ...

!> \param index_to_cell ...

!> \param cell_found ...

! **************************************************************************************************


   SUBROUTINE is_cell_in_index_to_cell(cell, index_to_cell, cell_found)

      ! Linear search for a cell vector in a cell list.
      !
      !   cell          : cell vector to look for
      !   index_to_cell : list of cells, one per row (columns 1:3 are compared)
      !   cell_found    : on return, .TRUE. if some row of index_to_cell equals cell

      INTEGER, DIMENSION(3)                              :: cell
      INTEGER, DIMENSION(:, :)                           :: index_to_cell
      LOGICAL                                            :: cell_found

      CHARACTER(LEN=*), PARAMETER :: routinen = 'is_cell_in_index_to_cell'

      INTEGER                                            :: handle, i_cell

      CALL timeset(routinen, handle)

      cell_found = .FALSE.

      DO i_cell = 1, SIZE(index_to_cell, 1)

         IF (ALL(index_to_cell(i_cell, 1:3) == cell(1:3))) THEN
            cell_found = .TRUE.
            ! the answer cannot change any more, so stop scanning at the first match
            EXIT
         END IF

      END DO

      CALL timestop(handle)

   END SUBROUTINE is_cell_in_index_to_cell


! **************************************************************************************************

!> \brief ...

!> \param qs_env ...

!> \param bs_env ...

! **************************************************************************************************

   SUBROUTINE allocate_matrices_small_cell_full_kp(qs_env, bs_env)

      ! Allocate and create the real-space full matrices of bs_env, one per SCF image cell
      ! (and per time/frequency point and spin where applicable):
      !   fm_G_S, fm_Sigma_x_R                       : layout of bs_env%fm_work_mo(1)
      !   fm_chi_R_t, fm_MWM_R_t                     : layout of bs_env%fm_RI_RI
      !   fm_Sigma_c_R_neg_tau, fm_Sigma_c_R_pos_tau : layout of bs_env%fm_work_mo(1)
      ! fm_MWM_R_t and both fm_Sigma_c_R_* arrays are set to zero; the other matrices are
      ! only created.
      !
      !   qs_env : Quickstep environment
      !   bs_env : band-structure environment holding the matrices

      TYPE(qs_environment_type), POINTER                 :: qs_env
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER :: routineN = 'allocate_matrices_small_cell_full_kp'

      INTEGER                                            :: handle, i_img, i_spin, i_time, n_img, &
                                                            n_spin, n_times
      TYPE(cp_blacs_env_type), POINTER                   :: blacs_env
      TYPE(mp_para_env_type), POINTER                    :: para_env

      CALL timeset(routineN, handle)

      n_img = bs_env%nimages_scf_desymm
      n_times = bs_env%num_time_freq_points
      n_spin = bs_env%n_spin

      CALL get_qs_env(qs_env, para_env=para_env, blacs_env=blacs_env)

      ALLOCATE (bs_env%fm_G_S(n_img))
      ALLOCATE (bs_env%fm_Sigma_x_R(n_img))
      ALLOCATE (bs_env%fm_chi_R_t(n_img, n_times))
      ALLOCATE (bs_env%fm_MWM_R_t(n_img, n_times))
      ALLOCATE (bs_env%fm_Sigma_c_R_neg_tau(n_img, n_times, n_spin))
      ALLOCATE (bs_env%fm_Sigma_c_R_pos_tau(n_img, n_times, n_spin))

      DO i_img = 1, n_img

         ! quantities that depend on the image cell only
         CALL cp_fm_create(bs_env%fm_G_S(i_img), bs_env%fm_work_mo(1)%matrix_struct)
         CALL cp_fm_create(bs_env%fm_Sigma_x_R(i_img), bs_env%fm_work_mo(1)%matrix_struct)

         DO i_time = 1, n_times

            ! RI x RI quantities per image cell and time point
            CALL cp_fm_create(bs_env%fm_chi_R_t(i_img, i_time), bs_env%fm_RI_RI%matrix_struct)
            CALL cp_fm_create(bs_env%fm_MWM_R_t(i_img, i_time), bs_env%fm_RI_RI%matrix_struct)
            CALL cp_fm_set_all(bs_env%fm_MWM_R_t(i_img, i_time), 0.0_dp)

            DO i_spin = 1, n_spin

               ! correlation self-energy for negative and positive times, zero-initialised
               CALL cp_fm_create(bs_env%fm_Sigma_c_R_neg_tau(i_img, i_time, i_spin), &
                                 bs_env%fm_work_mo(1)%matrix_struct)
               CALL cp_fm_create(bs_env%fm_Sigma_c_R_pos_tau(i_img, i_time, i_spin), &
                                 bs_env%fm_work_mo(1)%matrix_struct)
               CALL cp_fm_set_all(bs_env%fm_Sigma_c_R_neg_tau(i_img, i_time, i_spin), 0.0_dp)
               CALL cp_fm_set_all(bs_env%fm_Sigma_c_R_pos_tau(i_img, i_time, i_spin), 0.0_dp)

            END DO

         END DO

      END DO

      CALL timestop(handle)

   END SUBROUTINE allocate_matrices_small_cell_full_kp


! **************************************************************************************************

!> \brief ...

!> \param qs_env ...

!> \param bs_env ...

! **************************************************************************************************

   SUBROUTINE trafo_v_xc_r_to_kp(qs_env, bs_env)

      ! Compute the diagonal matrix elements v^xc_nn(k) at every k-point of
      ! bs_env%kpoints_DOS and store them in bs_env%v_xc_n(n, k, spin).
      ! The real-space matrices bs_env%fm_V_xc_R are temporarily copied into the Kohn-Sham
      ! matrices of qs_env, which are rebuilt at the end of the routine.
      !
      !   qs_env : Quickstep environment (matrix_ks_kp is overwritten and rebuilt)
      !   bs_env : band-structure environment (v_xc_n is allocated and filled)

      TYPE(qs_environment_type), POINTER                 :: qs_env
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER :: routineN = 'trafo_V_xc_R_to_kp'

      INTEGER                                            :: handle, ikp, img, ispin, n_ao
      INTEGER, DIMENSION(:, :, :), POINTER               :: cell_to_index_scf
      TYPE(cp_cfm_type)                                  :: cfm_mo_coeff, cfm_v_xc, cfm_work
      TYPE(cp_fm_type)                                   :: fm_v_xc_re
      TYPE(dbcsr_p_type), DIMENSION(:, :), POINTER       :: matrix_ks
      TYPE(kpoint_type), POINTER                         :: kpoints_scf
      TYPE(neighbor_list_set_p_type), DIMENSION(:), &
         POINTER                                         :: sab_nl

      CALL timeset(routineN, handle)

      n_ao = bs_env%n_ao

      CALL get_qs_env(qs_env, matrix_ks_kp=matrix_ks, kpoints=kpoints_scf)

      NULLIFY (sab_nl)
      CALL get_kpoint_info(kpoints_scf, sab_nl=sab_nl, cell_to_index=cell_to_index_scf)

      ! work matrices, all with the layout of bs_env%cfm_work_mo
      CALL cp_cfm_create(cfm_v_xc, bs_env%cfm_work_mo%matrix_struct)
      CALL cp_cfm_create(cfm_mo_coeff, bs_env%cfm_work_mo%matrix_struct)
      CALL cp_cfm_create(cfm_work, bs_env%cfm_work_mo%matrix_struct)
      CALL cp_fm_create(fm_v_xc_re, bs_env%cfm_work_mo%matrix_struct)

      ! JW kind of hack because the format of matrix_ks remains dubious...
      ! (the KS matrices are used as containers for v^xc^R)
      DO img = 1, bs_env%nimages_scf
         DO ispin = 1, bs_env%n_spin
            CALL dbcsr_set(matrix_ks(ispin, img)%matrix, 0.0_dp)
            CALL copy_fm_to_dbcsr(bs_env%fm_V_xc_R(img, ispin), matrix_ks(ispin, img)%matrix)
         END DO
      END DO

      ALLOCATE (bs_env%v_xc_n(n_ao, bs_env%nkp_bs_and_DOS, bs_env%n_spin))

      DO ispin = 1, bs_env%n_spin
         DO ikp = 1, bs_env%nkp_bs_and_DOS

            ! v^xc^R -> v^xc(k)  (matrix_ks stores v^xc^R, see SUBROUTINE compute_V_xc)
            CALL rsmat_to_kp(matrix_ks, ispin, bs_env%kpoints_DOS%xkp(1:3, ikp), &
                             cell_to_index_scf, sab_nl, bs_env, cfm_v_xc)

            ! get C_µn(k)
            CALL cp_cfm_to_cfm(bs_env%cfm_mo_coeff_kp(ikp, ispin), cfm_mo_coeff)

            ! v^xc_nm(k_i) = sum_µν C^*_µn(k_i) v^xc_µν(k_i) C_νn(k_i)
            ! step 1: work = v^xc(k) C(k);  step 2: v^xc(k) <- C^H(k) work
            CALL parallel_gemm('N', 'N', n_ao, n_ao, n_ao, z_one, cfm_v_xc, cfm_mo_coeff, &
                               z_zero, cfm_work)
            CALL parallel_gemm('C', 'N', n_ao, n_ao, n_ao, z_one, cfm_mo_coeff, cfm_work, &
                               z_zero, cfm_v_xc)

            ! get v^xc_nn(k_i) which is a real quantity as v^xc is Hermitian
            CALL cp_cfm_to_fm(cfm_v_xc, fm_v_xc_re)
            CALL cp_fm_get_diag(fm_v_xc_re, bs_env%v_xc_n(:, ikp, ispin))

         END DO
      END DO

      ! just rebuild the overwritten KS matrix again
      CALL qs_ks_build_kohn_sham_matrix(qs_env, calculate_forces=.FALSE., just_energy=.FALSE.)

      CALL cp_cfm_release(cfm_v_xc)
      CALL cp_cfm_release(cfm_mo_coeff)
      CALL cp_cfm_release(cfm_work)
      CALL cp_fm_release(fm_v_xc_re)

      CALL timestop(handle)

   END SUBROUTINE trafo_v_xc_r_to_kp


! **************************************************************************************************
!> \brief Builds the RI metric matrix M(k) = sum_R e^ikR M^R at the k-points assigned to this rank,
!>        diagonalizes it and prints the smallest/largest absolute eigenvalue and the largest
!>        condition number found over all k-points (reduced over all ranks of bs_env%para_env).
!> \param qs_env QS environment, handed on to get_v_tr_r
!> \param bs_env bandstructure environment; provides the RI metric, the k-point mesh, the parallel
!>               environment and the output unit
! **************************************************************************************************
   SUBROUTINE heuristic_ri_regularization(qs_env, bs_env)
      TYPE(qs_environment_type), POINTER                 :: qs_env
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER :: routinen = 'heuristic_RI_regularization'

      COMPLEX(KIND=dp), ALLOCATABLE, DIMENSION(:, :, :)  :: m
      INTEGER                                            :: handle, ikp, ikp_local, n_ri, nkp, &
                                                            nkp_local, u
      REAL(kind=dp)                                      :: cond_nr, cond_nr_max, max_ev, &
                                                            max_ev_ikp, min_ev, min_ev_ikp
      REAL(kind=dp), ALLOCATABLE, DIMENSION(:, :, :)     :: m_r

      CALL timeset(routinen, handle)

      ! compute M^R_PQ = <phi_P,0|V^tr(rc)|phi_Q,R> for RI metric
      CALL get_v_tr_r(m_r, bs_env%ri_metric, 0.0_dp, bs_env, qs_env)

      nkp = bs_env%nkp_chi_eps_W_orig_plus_extra
      n_ri = bs_env%n_RI

      ! count the k-points handled by this rank (same selection rule as in the loop below)
      nkp_local = 0
      DO ikp = 1, nkp
         ! trivial parallelization over k-points
         IF (MODULO(ikp, bs_env%para_env%num_pe) .NE. bs_env%para_env%mepos) CYCLE
         nkp_local = nkp_local + 1
      END DO

      ALLOCATE (m(n_ri, n_ri, nkp_local))

      ikp_local = 0
      cond_nr_max = 0.0_dp
      ! neutral elements for the min/max search over absolute eigenvalues; a rank without any
      ! k-point keeps these values and therefore does not influence the reductions below
      min_ev = HUGE(0.0_dp)
      max_ev = 0.0_dp

      DO ikp = 1, nkp

         ! trivial parallelization
         IF (MODULO(ikp, bs_env%para_env%num_pe) .NE. bs_env%para_env%mepos) CYCLE

         ikp_local = ikp_local + 1

         ! M(k) = sum_R e^ikR M^R
         CALL trafo_rs_to_ikp(m_r, m(:, :, ikp_local), &
                              bs_env%kpoints_scf_desymm%index_to_cell, &
                              bs_env%kpoints_chi_eps_W%xkp(1:3, ikp))

         ! compute condition number of M_PQ(k)
         CALL power(m(:, :, ikp_local), 1.0_dp, 0.0_dp, cond_nr, min_ev_ikp, max_ev_ikp)

         IF (cond_nr > cond_nr_max) cond_nr_max = cond_nr
         IF (max_ev_ikp > max_ev) max_ev = max_ev_ikp
         IF (min_ev_ikp < min_ev) min_ev = min_ev_ikp

      END DO ! ikp

      ! every rank has only seen its own k-points: reduce all three printed quantities,
      ! otherwise the output rank would report extremal eigenvalues of its local subset only
      CALL bs_env%para_env%max(cond_nr_max)
      CALL bs_env%para_env%min(min_ev)
      CALL bs_env%para_env%max(max_ev)

      u = bs_env%unit_nr
      IF (u > 0) THEN
         WRITE (u, fmt="(T2,A,ES34.1)") "Min. abs. eigenvalue of RI metric matrix M(k)", min_ev
         WRITE (u, fmt="(T2,A,ES34.1)") "Max. abs. eigenvalue of RI metric matrix M(k)", max_ev
         WRITE (u, fmt="(T2,A,ES50.1)") "Max. condition number of M(k)", cond_nr_max
      END IF

      CALL timestop(handle)

   END SUBROUTINE heuristic_ri_regularization


! **************************************************************************************************
!> \brief Computes the two-center RI integrals of the given potential for all
!>        bs_env%nimages_scf_desymm cell images and returns them as a replicated local array.
!> \param V_tr_R result array; allocated here as (n_RI, n_RI, nimages_scf_desymm) if the caller
!>               passes it unallocated
!> \param pot_type potential used for the neighbor lists and the two-center integrals
!> \param regularization_RI regularization parameter handed on to build_2c_integrals
!> \param bs_env bandstructure environment (RI basis, number of images, k-points, fm structure)
!> \param qs_env QS environment
! **************************************************************************************************

   SUBROUTINE get_v_tr_r(V_tr_R, pot_type, regularization_RI, bs_env, qs_env)
      REAL(kind=dp), ALLOCATABLE, DIMENSION(:, :, :)     :: v_tr_r
      TYPE(libint_potential_type)                        :: pot_type
      REAL(kind=dp)                                      :: regularization_ri
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env
      TYPE(qs_environment_type), POINTER                 :: qs_env

      CHARACTER(LEN=*), PARAMETER                        :: routinen = 'get_V_tr_R'

      INTEGER                                            :: handle, i_img, n_img
      INTEGER, ALLOCATABLE, DIMENSION(:)                 :: nsgf_ri
      INTEGER, DIMENSION(:), POINTER                     :: blk_col, blk_row
      TYPE(cp_blacs_env_type), POINTER                   :: blacs_env
      TYPE(cp_fm_type), ALLOCATABLE, DIMENSION(:)        :: fm_img
      TYPE(dbcsr_distribution_type)                      :: dbcsr_dist
      TYPE(dbcsr_type), ALLOCATABLE, DIMENSION(:)        :: mat_img
      TYPE(distribution_2d_type), POINTER                :: dist_2d
      TYPE(neighbor_list_set_p_type), DIMENSION(:), &
         POINTER                                         :: sab_ri
      TYPE(particle_type), DIMENSION(:), POINTER         :: particle_set
      TYPE(qs_kind_type), DIMENSION(:), POINTER          :: qs_kind_set

      CALL timeset(routinen, handle)

      NULLIFY (sab_ri, dist_2d)

      n_img = bs_env%nimages_scf_desymm

      CALL get_qs_env(qs_env=qs_env, &
                      blacs_env=blacs_env, &
                      distribution_2d=dist_2d, &
                      qs_kind_set=qs_kind_set, &
                      particle_set=particle_set)

      ! number of RI basis functions per atom, used as DBCSR block sizes
      ALLOCATE (nsgf_ri(bs_env%n_atom))
      CALL get_particle_set(particle_set, qs_kind_set, nsgf=nsgf_ri, basis=bs_env%basis_set_RI)

      ! neighbor list RI <-> RI for the requested potential
      CALL build_2c_neighbor_lists(sab_ri, bs_env%basis_set_RI, bs_env%basis_set_RI, &
                                   pot_type, "2c_nl_RI", qs_env, sym_ij=.false., &
                                   dist_2d=dist_2d)

      CALL cp_dbcsr_dist2d_to_dist(dist_2d, dbcsr_dist)

      ! one non-symmetric DBCSR matrix per image; the first one serves as template for the rest
      ALLOCATE (blk_row(SIZE(nsgf_ri)), blk_col(SIZE(nsgf_ri)))
      blk_row(:) = nsgf_ri
      blk_col(:) = nsgf_ri

      ALLOCATE (mat_img(n_img))
      CALL dbcsr_create(mat_img(1), "(RI|RI)", dbcsr_dist, dbcsr_type_no_symmetry, &
                        blk_row, blk_col)
      DEALLOCATE (blk_row, blk_col)

      DO i_img = 2, n_img
         CALL dbcsr_create(mat_img(i_img), template=mat_img(1))
      END DO

      CALL build_2c_integrals(mat_img, 0.0_dp, qs_env, sab_ri, bs_env%basis_set_RI, &
                              bs_env%basis_set_RI, pot_type, do_kpoints=.true., &
                              ext_kpoints=bs_env%kpoints_scf_desymm, &
                              regularization_ri=regularization_ri)

      ! DBCSR -> full matrix, image by image; the DBCSR copy is released right away
      ALLOCATE (fm_img(n_img))
      DO i_img = 1, n_img
         CALL cp_fm_create(fm_img(i_img), bs_env%fm_RI_RI%matrix_struct)
         CALL copy_dbcsr_to_fm(mat_img(i_img), fm_img(i_img))
         CALL dbcsr_release(mat_img(i_img))
      END DO

      ! full matrices -> local array (allocated on first use)
      IF (.NOT. ALLOCATED(v_tr_r)) ALLOCATE (v_tr_r(bs_env%n_RI, bs_env%n_RI, n_img))
      CALL fm_to_local_array(fm_img, v_tr_r)

      CALL cp_fm_release(fm_img)
      CALL dbcsr_distribution_release(dbcsr_dist)
      CALL release_neighbor_list_sets(sab_ri)

      CALL timestop(handle)

   END SUBROUTINE get_v_tr_r


! **************************************************************************************************
!> \brief Replaces a complex matrix by its power: the matrix is hermitized, diagonalized and
!>        rebuilt as sum_i v_i lambda_i^exponent v_i^H, where only eigenvalues lambda_i > eps
!>        contribute. Optionally returns spectral information of the hermitized input.
!> \param matrix on input the matrix, on output its power
!> \param exponent exponent applied to the eigenvalues
!> \param eps eigenvalues that are not larger than eps are discarded
!> \param cond_nr (optional) ratio of largest to smallest absolute eigenvalue
!> \param min_ev (optional) smallest absolute eigenvalue
!> \param max_ev (optional) largest absolute eigenvalue
! **************************************************************************************************

   SUBROUTINE power(matrix, exponent, eps, cond_nr, min_ev, max_ev)
      COMPLEX(KIND=dp), DIMENSION(:, :)                  :: matrix
      REAL(kind=dp)                                      :: exponent, eps
      REAL(kind=dp), OPTIONAL                            :: cond_nr, min_ev, max_ev

      CHARACTER(len=*), PARAMETER                        :: routinen = 'power'

      COMPLEX(KIND=dp), ALLOCATABLE, DIMENSION(:, :)     :: evecs
      INTEGER                                            :: handle, i_ev, n_dim
      REAL(kind=dp)                                      :: abs_ev_max, abs_ev_min, scale_ev
      REAL(kind=dp), ALLOCATABLE, DIMENSION(:)           :: evals

      CALL timeset(routinen, handle)

      n_dim = SIZE(matrix, 1)
      ALLOCATE (evals(n_dim), evecs(n_dim, n_dim))

      ! remove any anti-Hermitian part before diagonalizing
      matrix(:, :) = 0.5_dp*(matrix(:, :) + CONJG(TRANSPOSE(matrix(:, :))))

      CALL diag_complex(matrix, evecs, evals)

      ! spectral information requested by the caller
      abs_ev_min = MINVAL(ABS(evals))
      abs_ev_max = MAXVAL(ABS(evals))
      IF (PRESENT(cond_nr)) cond_nr = abs_ev_max/abs_ev_min
      IF (PRESENT(min_ev)) min_ev = abs_ev_min
      IF (PRESENT(max_ev)) max_ev = abs_ev_max

      ! scale every eigenvector by lambda^(exponent/2), so that V*V^H below carries lambda^exponent;
      ! eigenvectors of eigenvalues <= eps are zeroed
      DO i_ev = 1, n_dim
         scale_ev = 0.0_dp
         IF (evals(i_ev) > eps) scale_ev = (evals(i_ev))**(0.5_dp*exponent)
         evecs(:, i_ev) = scale_ev*evecs(:, i_ev)
      END DO

      CALL zgemm("N", "C", n_dim, n_dim, n_dim, z_one, evecs, n_dim, evecs, n_dim, &
                 z_zero, matrix, n_dim)

      DEALLOCATE (evals, evecs)

      CALL timestop(handle)

   END SUBROUTINE power


! **************************************************************************************************
!> \brief Transforms the diagonal correlation self-energy from imaginary time to imaginary
!>        frequency with the cosine/sine weights stored in bs_env.
!> \param bs_env bandstructure environment (time/frequency grids, transformation weights, n_occ)
!> \param Sigma_c_n_time self-energy on the time grid; half the sum of the slices 1 and 2 of the
!>                       third index enters the cosine transform, half their difference the
!>                       sine transform
!> \param Sigma_c_n_freq result on the frequency grid; third index: 1 = real part,
!>                       2 = imaginary part
!> \param ispin spin index, selects the number of occupied levels
! **************************************************************************************************

   SUBROUTINE time_to_freq(bs_env, Sigma_c_n_time, Sigma_c_n_freq, ispin)
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env
      REAL(kind=dp), DIMENSION(:, :, :)                  :: sigma_c_n_time, sigma_c_n_freq
      INTEGER                                            :: ispin

      CHARACTER(LEN=*), PARAMETER                        :: routinen = 'time_to_freq'

      INTEGER                                            :: handle, homo, i_t, j_w, n_tw
      REAL(kind=dp)                                      :: omega, tau, wt_cos, wt_sin
      REAL(kind=dp), ALLOCATABLE, DIMENSION(:, :)        :: sigma_cos_part, sigma_sin_part

      CALL timeset(routinen, handle)

      n_tw = bs_env%num_time_freq_points

      ALLOCATE (sigma_cos_part(bs_env%n_ao, n_tw))
      ALLOCATE (sigma_sin_part(bs_env%n_ao, n_tw))

      ! combinations of the two time slices that enter the cosine and the sine transform
      sigma_cos_part(:, :) = 0.5_dp*(sigma_c_n_time(:, :, 1) + sigma_c_n_time(:, :, 2))
      sigma_sin_part(:, :) = 0.5_dp*(sigma_c_n_time(:, :, 1) - sigma_c_n_time(:, :, 2))

      sigma_c_n_freq(:, :, :) = 0.0_dp

      ! for every frequency point, accumulate the contributions of all time points
      ! (in ascending order of the time index)
      DO j_w = 1, n_tw

         omega = bs_env%imag_freq_points(j_w)

         DO i_t = 1, n_tw

            tau = bs_env%imag_time_points(i_t)

            ! integration weights for cosine and sine transform
            wt_cos = bs_env%weights_cos_t_to_w(j_w, i_t)*COS(omega*tau)
            wt_sin = bs_env%weights_sin_t_to_w(j_w, i_t)*SIN(omega*tau)

            ! 1. Re(Σ^c_nn(k_i,iω)) from cosine transform
            sigma_c_n_freq(:, j_w, 1) = sigma_c_n_freq(:, j_w, 1) + &
                                        wt_cos*sigma_cos_part(:, i_t)

            ! 2. Im(Σ^c_nn(k_i,iω)) from sine transform
            sigma_c_n_freq(:, j_w, 2) = sigma_c_n_freq(:, j_w, 2) + &
                                        wt_sin*sigma_sin_part(:, i_t)

         END DO

      END DO

      ! occupied levels need the correlation self-energy at negative omega; evaluating the
      ! sine weights at -omega flips the sign of the imaginary part
      homo = bs_env%n_occ(ispin)
      sigma_c_n_freq(1:homo, :, 2) = -sigma_c_n_freq(1:homo, :, 2)

      CALL timestop(handle)

   END SUBROUTINE time_to_freq


! **************************************************************************************************
!> \brief Continues the correlation self-energy of one k-point analytically (Pade) to obtain the
!>        quasiparticle self-energy of every level, stores the resulting G0W0 and HF eigenvalues
!>        in bs_env and appends a table for this k-point to the file "bandstructure_SCF_and_G0W0".
!> \param bs_env bandstructure environment; eigenval_G0W0(:, ikp, ispin) and
!>               eigenval_HF(:, ikp, ispin) are written
!> \param Sigma_c_ikp_n_freq correlation self-energy on the imaginary-frequency grid;
!>                           third index: 1 = real part, 2 = imaginary part
!> \param Sigma_x_ikp_n exchange self-energy per level
!> \param V_xc_ikp_n xc potential matrix element per level
!> \param eigenval_scf SCF eigenvalues per level
!> \param ikp k-point index (index into bs_env%kpoints_DOS)
!> \param ispin spin index
! **************************************************************************************************

   SUBROUTINE analyt_conti_and_print(bs_env, Sigma_c_ikp_n_freq, Sigma_x_ikp_n, V_xc_ikp_n, &
                                     eigenval_scf, ikp, ispin)

      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env
      REAL(kind=dp), DIMENSION(:, :, :)                  :: sigma_c_ikp_n_freq
      REAL(kind=dp), DIMENSION(:)                        :: sigma_x_ikp_n, v_xc_ikp_n, eigenval_scf
      INTEGER                                            :: ikp, ispin

      CHARACTER(LEN=*), PARAMETER :: routinen = 'analyt_conti_and_print'

      CHARACTER(len=3)                                   :: occ_vir
      CHARACTER(len=default_string_length)               :: fname
      INTEGER                                            :: handle, i_mo, ikp_for_print, iunit, &
                                                            n_mo, nkp
      LOGICAL                                            :: is_bandstruc_kpoint, print_dos_kpoints, &
                                                            print_ikp
      REAL(kind=dp), ALLOCATABLE, DIMENSION(:)           :: dummy, sigma_c_ikp_n_qp

      CALL timeset(routinen, handle)

      n_mo = bs_env%n_ao
      ALLOCATE (dummy(n_mo), sigma_c_ikp_n_qp(n_mo))
      ! zero-initialized because every rank fills only its own levels and the array is
      ! summed over all ranks afterwards
      sigma_c_ikp_n_qp(:) = 0.0_dp

      DO i_mo = 1, n_mo

         ! parallelization
         IF (MODULO(i_mo, bs_env%para_env%num_pe) /= bs_env%para_env%mepos) CYCLE

         CALL continuation_pade(sigma_c_ikp_n_qp, &
                                bs_env%imag_freq_points_fit, dummy, dummy, &
                                sigma_c_ikp_n_freq(:, 1:bs_env%num_freq_points_fit, 1)*z_one + &
                                sigma_c_ikp_n_freq(:, 1:bs_env%num_freq_points_fit, 2)*gaussi, &
                                sigma_x_ikp_n(:) - v_xc_ikp_n(:), &
                                eigenval_scf(:), eigenval_scf(:), &
                                bs_env%do_hedin_shift, &
                                i_mo, bs_env%n_occ(ispin), bs_env%n_vir(ispin), &
                                bs_env%nparam_pade, bs_env%num_freq_points_fit, &
                                ri_rpa_g0w0_crossing_newton, bs_env%n_occ(ispin), &
                                0.0_dp, .true., .false., 1, e_fermi_ext=bs_env%e_fermi(ispin))
      END DO

      CALL bs_env%para_env%sum(sigma_c_ikp_n_qp)

      CALL correct_obvious_fitting_fails(sigma_c_ikp_n_qp, ispin, bs_env)

      bs_env%eigenval_G0W0(:, ikp, ispin) = eigenval_scf(:) + &
                                            sigma_c_ikp_n_qp(:) + &
                                            sigma_x_ikp_n(:) - &
                                            v_xc_ikp_n(:)

      bs_env%eigenval_HF(:, ikp, ispin) = eigenval_scf(:) + sigma_x_ikp_n(:) - v_xc_ikp_n(:)

      ! only print eigenvalues of DOS k-points in case no bandstructure path has been given
      print_dos_kpoints = (bs_env%nkp_only_bs .LE. 0)
      ! in kpoints_DOS, the last nkp_only_bs are bandstructure k-points
      is_bandstruc_kpoint = (ikp > bs_env%nkp_only_DOS)
      print_ikp = print_dos_kpoints .OR. is_bandstruc_kpoint

      IF (bs_env%para_env%is_source() .AND. print_ikp) THEN

         IF (print_dos_kpoints) THEN
            nkp = bs_env%nkp_only_DOS
            ikp_for_print = ikp
         ELSE
            nkp = bs_env%nkp_only_bs
            ikp_for_print = ikp - bs_env%nkp_only_DOS
         END IF

         fname = "bandstructure_SCF_and_G0W0"

         ! the first printed k-point starts a fresh file, all later ones append to it
         IF (ikp_for_print == 1) THEN
            CALL open_file(TRIM(fname), unit_number=iunit, file_status="REPLACE", &
                           file_action="WRITE")
         ELSE
            CALL open_file(TRIM(fname), unit_number=iunit, file_status="OLD", &
                           file_action="WRITE", file_position="APPEND")
         END IF

         WRITE (iunit, "(A)") " "
         WRITE (iunit, "(A10,I7,A25,3F10.4)") "kpoint: ", ikp_for_print, "coordinate: ", &
            bs_env%kpoints_DOS%xkp(:, ikp)
         WRITE (iunit, "(A)") " "
         ! column titles: the Greek letters belong inside the string literals
         WRITE (iunit, "(A5,A12,3A17,A16,A18)") "n", "k", "ϵ_nk^DFT (eV)", "Σ^c_nk (eV)", &
            "Σ^x_nk (eV)", "v_nk^xc (eV)", "ϵ_nk^G0W0 (eV)"
         WRITE (iunit, "(A)") " "

         ! one line per level; all energies are multiplied by evolt for printing in eV
         DO i_mo = 1, n_mo
            IF (i_mo .LE. bs_env%n_occ(ispin)) THEN
               occ_vir = 'occ'
            ELSE
               occ_vir = 'vir'
            END IF
            WRITE (iunit, "(I5,3A,I5,4F16.3,F17.3)") i_mo, ' (', occ_vir, ') ', ikp_for_print, &
               eigenval_scf(i_mo)*evolt, &
               sigma_c_ikp_n_qp(i_mo)*evolt, &
               sigma_x_ikp_n(i_mo)*evolt, &
               v_xc_ikp_n(i_mo)*evolt, &
               bs_env%eigenval_G0W0(i_mo, ikp, ispin)*evolt
         END DO

         WRITE (iunit, "(A)") " "

         CALL close_file(iunit)

      END IF

      CALL timestop(handle)

   END SUBROUTINE analyt_conti_and_print


! **************************************************************************************************
!> \brief Replaces quasiparticle correlation self-energies with an implausibly large magnitude
!>        (> 13 eV) by a scissor shift, i.e. the average self-energy of the neighbouring levels
!>        of the same kind (occupied or virtual) that are at most 10 level indices away.
!>        If a level has no such neighbour, its value is left unchanged.
!> \param Sigma_c_ikp_n_qp quasiparticle correlation self-energy per level, corrected in place
!> \param ispin spin index, selects the number of occupied levels
!> \param bs_env bandstructure environment (n_ao, n_occ)
! **************************************************************************************************
   SUBROUTINE correct_obvious_fitting_fails(Sigma_c_ikp_n_qp, ispin, bs_env)
      REAL(kind=dp), ALLOCATABLE, DIMENSION(:)           :: sigma_c_ikp_n_qp
      INTEGER                                            :: ispin
      TYPE(post_scf_bandstructure_type), POINTER         :: bs_env

      CHARACTER(LEN=*), PARAMETER :: routinen = 'correct_obvious_fitting_fails'

      ! levels further away than this (in level index) do not enter the scissor shift
      INTEGER, PARAMETER                                 :: max_level_distance = 10
      ! |Σ^c| above this value (in eV) is regarded as a failed fit
      REAL(kind=dp), PARAMETER                           :: max_abs_sigma_c_ev = 13.0_dp

      INTEGER                                            :: handle, homo, i_mo, j_mo, &
                                                            n_levels_scissor, n_mo
      LOGICAL                                            :: is_occ, is_vir
      REAL(kind=dp)                                      :: sum_sigma_c

      CALL timeset(routinen, handle)

      n_mo = bs_env%n_ao
      homo = bs_env%n_occ(ispin)

      DO i_mo = 1, n_mo

         ! if |Σ^c| > 13 eV, we use a scissors shift
         IF (ABS(sigma_c_ikp_n_qp(i_mo)) > max_abs_sigma_c_ev/evolt) THEN

            is_occ = (i_mo .LE. homo)
            is_vir = (i_mo > homo)

            n_levels_scissor = 0
            sum_sigma_c = 0.0_dp

            ! compute scissor
            DO j_mo = 1, n_mo

               ! only compute scissor from other GW levels close in energy
               IF (is_occ .AND. j_mo > homo) CYCLE
               IF (is_vir .AND. j_mo .LE. homo) CYCLE
               IF (ABS(i_mo - j_mo) > max_level_distance) CYCLE
               IF (i_mo == j_mo) CYCLE

               n_levels_scissor = n_levels_scissor + 1
               sum_sigma_c = sum_sigma_c + sigma_c_ikp_n_qp(j_mo)

            END DO

            ! overwrite the self-energy with scissor shift; without any neighbouring level
            ! (e.g. a single occupied or a single virtual level) the average would be 0/0,
            ! so the fitted value is kept in that case
            IF (n_levels_scissor > 0) THEN
               sigma_c_ikp_n_qp(i_mo) = sum_sigma_c/REAL(n_levels_scissor, kind=dp)
            END IF

         END IF

      END DO ! i_mo

      CALL timestop(handle)

   END SUBROUTINE correct_obvious_fitting_fails


END MODULE gw_utils

modulo
static GRID_HOST_DEVICE int modulo(int a, int m)
Equivalent of Fortran's MODULO, which always returns a non-negative number. https://gcc....
Definition grid_common.h:120

tensor
struct tensor_ tensor

cell_types::pbc
Definition cell_types.F:92

cp_cfm_types::cp_cfm_to_cfm
Definition cp_cfm_types.F:55

cp_dbcsr_api::dbcsr_create
Definition cp_dbcsr_api.F:192

cp_dbcsr_operations::dbcsr_allocate_matrix_set
Definition cp_dbcsr_operations.F:77

cp_dbcsr_operations::dbcsr_deallocate_matrix_set
Definition cp_dbcsr_operations.F:85

cp_fm_types::cp_fm_release
Definition cp_fm_types.F:87

parallel_gemm_api::parallel_gemm
Definition parallel_gemm_api.F:38

atomic_kind_types
Define the atomic kind types and their sub types.
Definition atomic_kind_types.F:23

atomic_kind_types::get_atomic_kind_set
subroutine, public get_atomic_kind_set(atomic_kind_set, atom_of_kind, kind_of, natom_of_kind, maxatom, natom, nshell, fist_potential_present, shell_present, shell_adiabatic, shell_check_distance, damping_present)
Get attributes of an atomic kind set.
Definition atomic_kind_types.F:223

basis_set_types
Definition basis_set_types.F:15

basis_set_types::get_gto_basis_set
subroutine, public get_gto_basis_set(gto_basis_set, name, aliases, norm_type, kind_radius, ncgf, nset, nsgf, cgf_symbol, sgf_symbol, norm_cgf, set_radius, lmax, lmin, lx, ly, lz, m, ncgf_set, npgf, nsgf_set, nshell, cphi, pgf_radius, sphi, scon, zet, first_cgf, first_sgf, l, last_cgf, last_sgf, n, gcc, maxco, maxl, maxpgf, maxsgf_set, maxshell, maxso, nco_sum, npgf_sum, nshell_sum, maxder, short_kind_radius, npgf_seg_sum)
...
Definition basis_set_types.F:624

bibliography
collects all references to literature in CP2K as new algorithms / methods are included from literature...
Definition bibliography.F:21

bibliography::graml2024
integer, save, public graml2024
Definition bibliography.F:36

cell_types
Handles all functions related to the CELL.
Definition cell_types.F:15

cell_types::scaled_to_real
subroutine, public scaled_to_real(r, s, cell)
Transform scaled cell coordinates to real coordinates: r = h*s.
Definition cell_types.F:516

cp_blacs_env
methods related to the blacs parallel environment
Definition cp_blacs_env.F:15

cp_blacs_env::cp_blacs_env_release
subroutine, public cp_blacs_env_release(blacs_env)
releases the given blacs_env
Definition cp_blacs_env.F:274

cp_blacs_env::cp_blacs_env_create
subroutine, public cp_blacs_env_create(blacs_env, para_env, blacs_grid_layout, blacs_repeatable, row_major, grid_2d)
allocates and initializes a type that represent a blacs context
Definition cp_blacs_env.F:123

cp_cfm_types
Represents a complex full matrix distributed on many processors.
Definition cp_cfm_types.F:12

cp_cfm_types::cp_cfm_create
subroutine, public cp_cfm_create(matrix, matrix_struct, name)
Creates a new full matrix with the given structure.
Definition cp_cfm_types.F:121

cp_cfm_types::cp_cfm_release
subroutine, public cp_cfm_release(matrix)
Releases a full matrix.
Definition cp_cfm_types.F:155

cp_cfm_types::cp_cfm_to_fm
subroutine, public cp_cfm_to_fm(msource, mtargetr, mtargeti)
Copy real and imaginary parts of a complex full matrix into separate real-value full matrices.
Definition cp_cfm_types.F:761

cp_control_types
Defines control structures, which contain the parameters and the settings for the DFT-based calculati...
Definition cp_control_types.F:12

cp_dbcsr_api
Definition cp_dbcsr_api.F:8

cp_dbcsr_api::dbcsr_distribution_release
subroutine, public dbcsr_distribution_release(dist)
...
Definition cp_dbcsr_api.F:629

cp_dbcsr_api::dbcsr_set
subroutine, public dbcsr_set(matrix, alpha)
...
Definition cp_dbcsr_api.F:1181

cp_dbcsr_api::dbcsr_release
subroutine, public dbcsr_release(matrix)
...
Definition cp_dbcsr_api.F:1119

cp_dbcsr_operations
DBCSR operations in CP2K.
Definition cp_dbcsr_operations.F:18

cp_dbcsr_operations::cp_dbcsr_dist2d_to_dist
subroutine, public cp_dbcsr_dist2d_to_dist(dist2d, dist)
Creates a DBCSR distribution from a distribution_2d.
Definition cp_dbcsr_operations.F:419

cp_dbcsr_operations::copy_dbcsr_to_fm
subroutine, public copy_dbcsr_to_fm(matrix, fm)
Copy a DBCSR matrix to a BLACS matrix.
Definition cp_dbcsr_operations.F:214

cp_dbcsr_operations::copy_fm_to_dbcsr
subroutine, public copy_fm_to_dbcsr(fm, matrix, keep_sparsity)
Copy a BLACS matrix to a dbcsr matrix.
Definition cp_dbcsr_operations.F:111

cp_files
Utility routines to open and close files. Tracking of preconnections.
Definition cp_files.F:16

cp_files::open_file
subroutine, public open_file(file_name, file_status, file_form, file_action, file_position, file_pad, unit_number, debug, skip_get_unit_number, file_access)
Opens the requested file using a free unit number.
Definition cp_files.F:308

cp_files::close_file
subroutine, public close_file(unit_number, file_status, keep_preconnection)
Close an open file given by its logical unit number. Optionally, keep the file and unit preconnected.
Definition cp_files.F:119

cp_fm_basic_linalg
Basic linear algebra operations for full matrices.
Definition cp_fm_basic_linalg.F:14

cp_fm_basic_linalg::cp_fm_scale_and_add
subroutine, public cp_fm_scale_and_add(alpha, matrix_a, beta, matrix_b)
calc A <- alpha*A + beta*B optimized for alpha == 1.0 (just add beta*B) and beta == 0....
Definition cp_fm_basic_linalg.F:167

cp_fm_struct
represent the structure of a full matrix
Definition cp_fm_struct.F:14

cp_fm_struct::cp_fm_struct_create
subroutine, public cp_fm_struct_create(fmstruct, para_env, context, nrow_global, ncol_global, nrow_block, ncol_block, descriptor, first_p_pos, local_leading_dimension, template_fmstruct, square_blocks, force_block)
allocates and initializes a full matrix structure
Definition cp_fm_struct.F:132

cp_fm_struct::cp_fm_struct_release
subroutine, public cp_fm_struct_release(fmstruct)
releases a full matrix structure
Definition cp_fm_struct.F:351

cp_fm_types
represent a full matrix distributed on many processors
Definition cp_fm_types.F:15

cp_fm_types::cp_fm_get_diag
subroutine, public cp_fm_get_diag(matrix, diag)
returns the diagonal elements of a fm
Definition cp_fm_types.F:563

cp_fm_types::cp_fm_set_all
subroutine, public cp_fm_set_all(matrix, alpha, beta)
set all elements of a matrix to the same value, and optionally the diagonal to a different one
Definition cp_fm_types.F:528

cp_fm_types::cp_fm_create
subroutine, public cp_fm_create(matrix, matrix_struct, name, use_sp)
creates a new full matrix with the given structure
Definition cp_fm_types.F:164

cp_log_handling
various routines to log and control the output. The idea is that decisions about where to log should ...
Definition cp_log_handling.F:41

cp_log_handling::cp_get_default_logger
type(cp_logger_type) function, pointer, public cp_get_default_logger()
returns the default logger
Definition cp_log_handling.F:234

cp_output_handling
routines to handle the output. The idea is to remove the decision of whether to output and what to out...
Definition cp_output_handling.F:25

cp_output_handling::cp_print_key_generate_filename
character(len=default_path_length) function, public cp_print_key_generate_filename(logger, print_key, middle_name, extension, my_local)
Utility function that returns a unit number to write the print key. Might open a file with a unique f...
Definition cp_output_handling.F:754

dbt_api
This is the start of a dbt_api, all publicly needed functions are exported here....
Definition dbt_api.F:17

distribution_2d_types
stores a mapping of 2D info (e.g. matrix) on a 2D processor distribution (i.e. blacs grid) where cpus...
Definition distribution_2d_types.F:15

gw_communication
Definition gw_communication.F:13

gw_communication::fm_to_local_array
subroutine, public fm_to_local_array(fm_s, array_s, weight, add)
...
Definition gw_communication.F:764

gw_integrals
Utility method to build 3-center integrals for small cell GW.
Definition gw_integrals.F:11

gw_integrals::build_3c_integral_block
subroutine, public build_3c_integral_block(int_3c, qs_env, potential_parameter, basis_j, basis_k, basis_i, cell_j, cell_k, cell_i, atom_j, atom_k, atom_i, j_bf_start_from_atom, k_bf_start_from_atom, i_bf_start_from_atom)
...
Definition gw_integrals.F:84

gw_kp_to_real_space_and_back
Definition gw_kp_to_real_space_and_back.F:13

gw_kp_to_real_space_and_back::trafo_rs_to_ikp
subroutine, public trafo_rs_to_ikp(array_rs, array_kp, index_to_cell, xkp)
...
Definition gw_kp_to_real_space_and_back.F:80

gw_utils
Definition gw_utils.F:13

gw_utils::get_v_tr_r
subroutine, public get_v_tr_r(v_tr_r, pot_type, regularization_ri, bs_env, qs_env)
...
Definition gw_utils.F:2987

gw_utils::time_to_freq
subroutine, public time_to_freq(bs_env, sigma_c_n_time, sigma_c_n_freq, ispin)
...
Definition gw_utils.F:3124

gw_utils::de_init_bs_env
subroutine, public de_init_bs_env(bs_env)
...
Definition gw_utils.F:238

gw_utils::compute_xkp
subroutine, public compute_xkp(xkp, ikp_start, ikp_end, grid)
...
Definition gw_utils.F:626

gw_utils::analyt_conti_and_print
subroutine, public analyt_conti_and_print(bs_env, sigma_c_ikp_n_freq, sigma_x_ikp_n, v_xc_ikp_n, eigenval_scf, ikp, ispin)
...
Definition gw_utils.F:3188

gw_utils::create_and_init_bs_env_for_gw
subroutine, public create_and_init_bs_env_for_gw(qs_env, bs_env, bs_sec)
...
Definition gw_utils.F:152

gw_utils::add_r
subroutine, public add_r(cell_1, cell_2, index_to_cell, cell_1_plus_2, cell_found, cell_to_index, i_cell_1_plus_2)
...
Definition gw_utils.F:2704

gw_utils::kpoint_init_cell_index_simple
subroutine, public kpoint_init_cell_index_simple(kpoints, qs_env)
...
Definition gw_utils.F:596

gw_utils::get_i_j_atoms
subroutine, public get_i_j_atoms(atoms_i, atoms_j, n_atom_i, n_atom_j, color_sub, bs_env)
...
Definition gw_utils.F:1427

gw_utils::power
subroutine, public power(matrix, exponent, eps, cond_nr, min_ev, max_ev)
...
Definition gw_utils.F:3075

gw_utils::is_cell_in_index_to_cell
subroutine, public is_cell_in_index_to_cell(cell, index_to_cell, cell_found)
...
Definition gw_utils.F:2743

input_constants
collects all constants needed in input so that they can be used without circular dependencies
Definition input_constants.F:17

input_constants::do_potential_truncated
integer, parameter, public do_potential_truncated
Definition input_constants.F:808

input_constants::rtp_method_bse
integer, parameter, public rtp_method_bse
Definition input_constants.F:944

input_constants::small_cell_full_kp
integer, parameter, public small_cell_full_kp
Definition input_constants.F:1081

input_constants::large_cell_gamma
integer, parameter, public large_cell_gamma
Definition input_constants.F:1081

input_constants::xc_none
integer, parameter, public xc_none
Definition input_constants.F:553

input_constants::ri_rpa_g0w0_crossing_newton
integer, parameter, public ri_rpa_g0w0_crossing_newton
Definition input_constants.F:1081

input_section_types
objects that represent the structure of input sections and the data contained in an input section
Definition input_section_types.F:15

input_section_types::section_vals_val_set
subroutine, public section_vals_val_set(section_vals, keyword_name, i_rep_section, i_rep_val, val, l_val, i_val, r_val, c_val, l_vals_ptr, i_vals_ptr, r_vals_ptr, c_vals_ptr)
sets the requested value
Definition input_section_types.F:1223

input_section_types::section_vals_get_subs_vals
recursive type(section_vals_type) function, pointer, public section_vals_get_subs_vals(section_vals, subsection_name, i_rep_section, can_return_null)
returns the values of the requested subsection
Definition input_section_types.F:731

input_section_types::section_vals_get
subroutine, public section_vals_get(section_vals, ref_count, n_repetition, n_subs_vals_rep, section, explicit)
returns various attributes about the section_vals
Definition input_section_types.F:704

input_section_types::section_vals_val_get
subroutine, public section_vals_val_get(section_vals, keyword_name, i_rep_section, i_rep_val, n_rep_val, val, l_val, i_val, r_val, c_val, l_vals, i_vals, r_vals, c_vals, explicit)
returns the requested value
Definition input_section_types.F:1047

kinds
Defines the basic variable types.
Definition kinds.F:23

kinds::int_8
integer, parameter, public int_8
Definition kinds.F:54

kinds::dp
integer, parameter, public dp
Definition kinds.F:34

kinds::default_string_length
integer, parameter, public default_string_length
Definition kinds.F:57

kpoint_methods
Routines needed for kpoint calculation.
Definition kpoint_methods.F:15

kpoint_methods::kpoint_init_cell_index
subroutine, public kpoint_init_cell_index(kpoint, sab_nl, para_env, dft_control)
Generates the mapping of cell indices and linear RS index CELL (0,0,0) is always mapped to index 1.
Definition kpoint_methods.F:679

kpoint_types
Types and basic routines needed for a kpoint calculation.
Definition kpoint_types.F:15

kpoint_types::kpoint_create
subroutine, public kpoint_create(kpoint)
Create a kpoint environment.
Definition kpoint_types.F:206

kpoint_types::get_kpoint_info
subroutine, public get_kpoint_info(kpoint, kp_scheme, nkp_grid, kp_shift, symmetry, verbose, full_grid, use_real_wfn, eps_geo, parallel_group_size, kp_range, nkp, xkp, wkp, para_env, blacs_env_all, para_env_kp, para_env_inter_kp, blacs_env, kp_env, kp_aux_env, mpools, iogrp, nkp_groups, kp_dist, cell_to_index, index_to_cell, sab_nl, sab_nl_nosym)
Retrieve information from a kpoint environment.
Definition kpoint_types.F:365

libint_2c_3c
2- and 3-center electron repulsion integral routines based on libint2 Currently available operators: ...
Definition libint_2c_3c.F:14

libint_wrapper
Interface to the Libint-Library or a c++ wrapper.
Definition libint_wrapper.F:15

libint_wrapper::cp_libint_static_cleanup
subroutine, public cp_libint_static_cleanup()
Definition libint_wrapper.F:1244

libint_wrapper::cp_libint_static_init
subroutine, public cp_libint_static_init()
Definition libint_wrapper.F:1236

machine
Machine interface based on Fortran 2003 and POSIX.
Definition machine.F:17

machine::m_memory
subroutine, public m_memory(mem)
Returns the total amount of memory [bytes] in use, if known, zero otherwise.
Definition machine.F:440

machine::m_walltime
real(kind=dp) function, public m_walltime()
returns time from a real-time clock, protected against rolling early/easily
Definition machine.F:147

mathconstants
Definition of mathematical constants and functions.
Definition mathconstants.F:16

mathconstants::z_one
complex(kind=dp), parameter, public z_one
Definition mathconstants.F:143

mathconstants::gaussi
complex(kind=dp), parameter, public gaussi
Definition mathconstants.F:142

mathconstants::z_zero
complex(kind=dp), parameter, public z_zero
Definition mathconstants.F:143

mathlib
Collection of simple mathematical functions and subroutines.
Definition mathlib.F:15

mathlib::diag_complex
subroutine, public diag_complex(matrix, eigenvectors, eigenvalues)
Diagonalizes a local complex Hermitian matrix using LAPACK. Based on cp_cfm_heevd.
Definition mathlib.F:1743

mathlib::gcd
elemental integer function, public gcd(a, b)
computes the greatest common divisor of two numbers
Definition mathlib.F:1280

message_passing
Interface to the message passing library MPI.
Definition message_passing.F:23

minimax_exp_gw
Routines to calculate the minimax coefficients in order to approximate 1/x as a sum over exponential ...
Definition minimax_exp_gw.F:17

minimax_exp_gw::get_exp_minimax_coeff_gw
subroutine, public get_exp_minimax_coeff_gw(k, e_range, aw)
...
Definition minimax_exp_gw.F:38

minimax_exp
Routines to calculate the minimax coefficients in order to approximate 1/x as a sum over exponential ...
Definition minimax_exp.F:29

minimax_exp::get_exp_minimax_coeff
subroutine, public get_exp_minimax_coeff(k, rc, aw, mm_error, which_coeffs)
Get best minimax approximation for given input parameters. Automatically chooses the most exact set o...
Definition minimax_exp.F:127

minimax_rpa
Routines to calculate the minimax coefficients for approximating 1/x as 1/x ~ 1/pi SUM_{i}^{K} w_i x^...
Definition minimax_rpa.F:14

minimax_rpa::get_rpa_minimax_coeff_larger_grid
subroutine, public get_rpa_minimax_coeff_larger_grid(k, e_range, aw)
...
Definition minimax_rpa.F:10122

minimax_rpa::get_rpa_minimax_coeff
subroutine, public get_rpa_minimax_coeff(k, e_range, aw, ierr, print_warning)
The a_i and w_i coefficients are stored in aw such that the first 1:K elements correspond to a_i and t...
Definition minimax_rpa.F:41

mp2_gpw
Calls routines to get RI integrals and calculate total energies.
Definition mp2_gpw.F:14

mp2_gpw::create_mat_munu
subroutine, public create_mat_munu(mat_munu, qs_env, eps_grid, blacs_env_sub, do_ri_aux_basis, do_mixed_basis, group_size_prim, do_alloc_blocks_from_nbl, do_kpoints, sab_orb_sub, dbcsr_sym_type)
Encapsulate the building of dbcsr_matrix mat_munu.
Definition mp2_gpw.F:990

mp2_grids
Routines to calculate frequency and time grids (integration points and weights) for correlation metho...
Definition mp2_grids.F:14

mp2_grids::get_l_sq_wghts_cos_tf_w_to_t
subroutine, public get_l_sq_wghts_cos_tf_w_to_t(num_integ_points, tau_tj, weights_cos_tf_w_to_t, omega_tj, e_min, e_max, max_error, num_points_per_magnitude, regularization)
...
Definition mp2_grids.F:1244

mp2_grids::get_l_sq_wghts_cos_tf_t_to_w
subroutine, public get_l_sq_wghts_cos_tf_t_to_w(num_integ_points, tau_tj, weights_cos_tf_t_to_w, omega_tj, e_min, e_max, max_error, num_points_per_magnitude, regularization)
Calculate integration weights for the tau grid (in dependency of the omega node)
Definition mp2_grids.F:745

mp2_grids::get_l_sq_wghts_sin_tf_t_to_w
subroutine, public get_l_sq_wghts_sin_tf_t_to_w(num_integ_points, tau_tj, weights_sin_tf_t_to_w, omega_tj, e_min, e_max, max_error, num_points_per_magnitude, regularization)
Calculate integration weights for the tau grid (in dependency of the omega node)
Definition mp2_grids.F:881

mp2_ri_2c
Framework for 2c-integrals for RI.
Definition mp2_ri_2c.F:14

mp2_ri_2c::trunc_coulomb_for_exchange
subroutine, public trunc_coulomb_for_exchange(qs_env, trunc_coulomb, rel_cutoff_trunc_coulomb_ri_x, cell_grid, do_bvk_cell)
...
Definition mp2_ri_2c.F:1600

parallel_gemm_api
basic linear algebra operations for full matrices
Definition parallel_gemm_api.F:14

particle_methods
Define methods related to particle_type.
Definition particle_methods.F:14

particle_methods::get_particle_set
subroutine, public get_particle_set(particle_set, qs_kind_set, first_sgf, last_sgf, nsgf, nmao, basis)
Get the components of a particle set.
Definition particle_methods.F:98

particle_types
Define the data structure for the particle information.
Definition particle_types.F:19

physcon
Definition of physical constants:
Definition physcon.F:68

physcon::evolt
real(kind=dp), parameter, public evolt
Definition physcon.F:183

physcon::angstrom
real(kind=dp), parameter, public angstrom
Definition physcon.F:144

post_scf_bandstructure_types
Definition post_scf_bandstructure_types.F:13

post_scf_bandstructure_utils
Definition post_scf_bandstructure_utils.F:13

post_scf_bandstructure_utils::rsmat_to_kp
subroutine, public rsmat_to_kp(mat_rs, ispin, xkp, cell_to_index_scf, sab_nl, bs_env, cfm_kp, imag_rs_mat)
...
Definition post_scf_bandstructure_utils.F:659

qs_energy_types
Definition qs_energy_types.F:14

qs_environment_types
Definition qs_environment_types.F:14

qs_environment_types::get_qs_env
subroutine, public get_qs_env(qs_env, atomic_kind_set, qs_kind_set, cell, super_cell, cell_ref, use_ref_cell, kpoints, dft_control, mos, sab_orb, sab_all, qmmm, qmmm_periodic, sac_ae, sac_ppl, sac_lri, sap_ppnl, sab_vdw, sab_scp, sap_oce, sab_lrc, sab_se, sab_xtbe, sab_tbe, sab_core, sab_xb, sab_xtb_pp, sab_xtb_nonbond, sab_almo, sab_kp, sab_kp_nosym, particle_set, energy, force, matrix_h, matrix_h_im, matrix_ks, matrix_ks_im, matrix_vxc, run_rtp, rtp, matrix_h_kp, matrix_h_im_kp, matrix_ks_kp, matrix_ks_im_kp, matrix_vxc_kp, kinetic_kp, matrix_s_kp, matrix_w_kp, matrix_s_ri_aux_kp, matrix_s, matrix_s_ri_aux, matrix_w, matrix_p_mp2, matrix_p_mp2_admm, rho, rho_xc, pw_env, ewald_env, ewald_pw, active_space, mpools, input, para_env, blacs_env, scf_control, rel_control, kinetic, qs_charges, vppl, rho_core, rho_nlcc, rho_nlcc_g, ks_env, ks_qmmm_env, wf_history, scf_env, local_particles, local_molecules, distribution_2d, dbcsr_dist, molecule_kind_set, molecule_set, subsys, cp_subsys, oce, local_rho_set, rho_atom_set, task_list, task_list_soft, rho0_atom_set, rho0_mpole, rhoz_set, ecoul_1c, rho0_s_rs, rho0_s_gs, do_kpoints, has_unit_metric, requires_mo_derivs, mo_derivs, mo_loc_history, nkind, natom, nelectron_total, nelectron_spin, efield, neighbor_list_id, linres_control, xas_env, virial, cp_ddapc_env, cp_ddapc_ewald, outer_scf_history, outer_scf_ihistory, x_data, et_coupling, dftb_potential, results, se_taper, se_store_int_env, se_nddo_mpole, se_nonbond_env, admm_env, lri_env, lri_density, exstate_env, ec_env, harris_env, dispersion_env, gcp_env, vee, rho_external, external_vxc, mask, mp2_env, bs_env, kg_env, wanniercentres, atprop, ls_scf_env, do_transport, transport_env, v_hartree_rspace, s_mstruct_changed, rho_changed, potential_changed, forces_up_to_date, mscfg_env, almo_scf_env, gradient_history, variable_history, embed_pot, spin_embed_pot, polar_env, mos_last_converged, eeq, rhs, tb_tblite)
Get the QUICKSTEP environment.
Definition qs_environment_types.F:518

qs_environment_types::qs_env_part_release
subroutine, public qs_env_part_release(qs_env)
releases part of the given qs_env in order to save memory
Definition qs_environment_types.F:1643

qs_integral_utils
Some utility functions for the calculation of integrals.
Definition qs_integral_utils.F:14

qs_integral_utils::basis_set_list_setup
subroutine, public basis_set_list_setup(basis_set_list, basis_type, qs_kind_set)
Set up an easy accessible list of the basis sets for all kinds.
Definition qs_integral_utils.F:149

qs_interactions
Calculate the interaction radii for the operator matrix calculation.
Definition qs_interactions.F:17

qs_interactions::init_interaction_radii_orb_basis
subroutine, public init_interaction_radii_orb_basis(orb_basis_set, eps_pgf_orb, eps_pgf_short)
...
Definition qs_interactions.F:426

qs_kind_types
Define the quickstep kind type and their sub types.
Definition qs_kind_types.F:23

qs_kind_types::get_qs_kind
subroutine, public get_qs_kind(qs_kind, basis_set, basis_type, ncgf, nsgf, all_potential, tnadd_potential, gth_potential, sgp_potential, upf_potential, se_parameter, dftb_parameter, xtb_parameter, dftb3_param, zatom, zeff, elec_conf, mao, lmax_dftb, alpha_core_charge, ccore_charge, core_charge, core_charge_radius, paw_proj_set, paw_atom, hard_radius, hard0_radius, max_rad_local, covalent_radius, vdw_radius, gpw_type_forced, harmonics, max_iso_not0, max_s_harm, grid_atom, ngrid_ang, ngrid_rad, lmax_rho0, dft_plus_u_atom, l_of_dft_plus_u, n_of_dft_plus_u, u_minus_j, u_of_dft_plus_u, j_of_dft_plus_u, alpha_of_dft_plus_u, beta_of_dft_plus_u, j0_of_dft_plus_u, occupation_of_dft_plus_u, dispersion, bs_occupation, magnetization, no_optimize, addel, laddel, naddel, orbitals, max_scf, eps_scf, smear, u_ramping, u_minus_j_target, eps_u_ramping, init_u_ramping_each_scf, reltmat, ghost, floating, name, element_symbol, pao_basis_size, pao_model_file, pao_potentials, pao_descriptors, nelec)
Get attributes of an atomic kind.
Definition qs_kind_types.F:454

qs_ks_methods
routines that build the Kohn-Sham matrix (i.e. calculate the Coulomb and xc parts)
Definition qs_ks_methods.F:22

qs_ks_methods::qs_ks_build_kohn_sham_matrix
subroutine, public qs_ks_build_kohn_sham_matrix(qs_env, calculate_forces, just_energy, print_active, ext_ks_matrix)
routine where the real calculations are made: the KS matrix is calculated
Definition qs_ks_methods.F:179

qs_neighbor_list_types
Define the neighbor list data types and the corresponding functionality.
Definition qs_neighbor_list_types.F:17

qs_neighbor_list_types::release_neighbor_list_sets
subroutine, public release_neighbor_list_sets(nlists)
releases an array of neighbor_list_sets
Definition qs_neighbor_list_types.F:1097

qs_tensors_types
Utility methods to build 3-center integral tensors of various types.
Definition qs_tensors_types.F:12

qs_tensors_types::distribution_3d_create
subroutine, public distribution_3d_create(dist_3d, dist1, dist2, dist3, nkind, particle_set, mp_comm_3d, own_comm)
Create a 3d distribution.
Definition qs_tensors_types.F:91

qs_tensors_types::create_2c_tensor
subroutine, public create_2c_tensor(t2c, dist_1, dist_2, pgrid, sizes_1, sizes_2, order, name)
...
Definition qs_tensors_types.F:382

qs_tensors_types::create_3c_tensor
subroutine, public create_3c_tensor(t3c, dist_1, dist_2, dist_3, pgrid, sizes_1, sizes_2, sizes_3, map1, map2, name)
...
Definition qs_tensors_types.F:335

qs_tensors
Utility methods to build 3-center integral tensors of various types.
Definition qs_tensors.F:11

qs_tensors::build_2c_integrals
subroutine, public build_2c_integrals(t2c, filter_eps, qs_env, nl_2c, basis_i, basis_j, potential_parameter, do_kpoints, do_hfx_kpoints, ext_kpoints, regularization_ri)
...
Definition qs_tensors.F:3156

qs_tensors::build_2c_neighbor_lists
subroutine, public build_2c_neighbor_lists(ij_list, basis_i, basis_j, potential_parameter, name, qs_env, sym_ij, molecular, dist_2d, pot_to_rad)
Build 2-center neighbor lists adapted to different operators. This mainly wraps build_neighbor_lists fo...
Definition qs_tensors.F:143

qs_tensors::build_3c_integrals
subroutine, public build_3c_integrals(t3c, filter_eps, qs_env, nl_3c, basis_i, basis_j, basis_k, potential_parameter, int_eps, op_pos, do_kpoints, do_hfx_kpoints, desymmetrize, cell_sym, bounds_i, bounds_j, bounds_k, ri_range, img_to_ri_cell, cell_to_index_ext)
Build 3-center integral tensor.
Definition qs_tensors.F:2123

qs_tensors::neighbor_list_3c_destroy
subroutine, public neighbor_list_3c_destroy(ijk_list)
Destroy 3c neighborlist.
Definition qs_tensors.F:383

qs_tensors::get_tensor_occupancy
subroutine, public get_tensor_occupancy(tensor, nze, occ)
...
Definition qs_tensors.F:3627

qs_tensors::build_3c_neighbor_lists
subroutine, public build_3c_neighbor_lists(ijk_list, basis_i, basis_j, basis_k, dist_3d, potential_parameter, name, qs_env, sym_ij, sym_jk, sym_ik, molecular, op_pos, own_dist)
Build a 3-center neighbor list.
Definition qs_tensors.F:282

rpa_gw
Routines for GW, continuous development [Jan Wilhelm].
Definition rpa_gw.F:14

rpa_gw::continuation_pade
subroutine, public continuation_pade(vec_gw_energ, vec_omega_fit_gw, z_value, m_value, vec_sigma_c_gw, vec_sigma_x_minus_vxc_gw, eigenval, eigenval_scf, do_hedin_shift, n_level_gw, gw_corr_lev_occ, gw_corr_lev_vir, nparam_pade, num_fit_points, crossing_search, homo, fermi_level_offset, do_gw_im_time, print_self_energy, count_ev_sc_gw, vec_gw_dos, dos_lower_bound, dos_precision, ndos, min_level_self_energy, max_level_self_energy, dos_eta, dos_min, dos_max, e_fermi_ext)
perform analytic continuation with pade approximation
Definition rpa_gw.F:4314

atomic_kind_types::atomic_kind_type
Provides all information about an atomic kind.
Definition atomic_kind_types.F:45

basis_set_types::gto_basis_set_type
Definition basis_set_types.F:72

cell_types::cell_type
Type defining parameters related to the simulation cell.
Definition cell_types.F:55

cp_blacs_env::cp_blacs_env_type
represent a BLACS multidimensional parallel environment (for the MPI counterpart see cp_paratypes/m...
Definition cp_blacs_env.F:53

cp_cfm_types::cp_cfm_type
Represent a complex full matrix.
Definition cp_cfm_types.F:68

cp_control_types::dft_control_type
Definition cp_control_types.F:586

cp_dbcsr_api::dbcsr_distribution_type
Definition cp_dbcsr_api.F:180

cp_dbcsr_api::dbcsr_p_type
Definition cp_dbcsr_api.F:170

cp_dbcsr_api::dbcsr_type
Definition cp_dbcsr_api.F:174

cp_fm_struct::cp_fm_struct_type
keeps the information about the structure of a full matrix
Definition cp_fm_struct.F:82

cp_fm_types::cp_fm_type
represent a full matrix
Definition cp_fm_types.F:113

cp_log_handling::cp_logger_type
type of a logger, at the moment it contains just a print level starting at which level it should be l...
Definition cp_log_handling.F:140

distribution_2d_types::distribution_2d_type
distributes pairs on a 2d grid of processors
Definition distribution_2d_types.F:62

input_section_types::section_vals_type
stores the values of a section
Definition input_section_types.F:127

kpoint_types::kpoint_type
Contains information about kpoints.
Definition kpoint_types.F:150

libint_2c_3c::libint_potential_type
Definition libint_2c_3c.F:66

message_passing::mp_cart_type
Definition message_passing.F:740

message_passing::mp_para_env_type
stores all the information relevant to an MPI environment
Definition message_passing.F:763

particle_types::particle_type
Definition particle_types.F:35

post_scf_bandstructure_types::post_scf_bandstructure_type
Definition post_scf_bandstructure_types.F:58

qs_energy_types::qs_energy_type
Definition qs_energy_types.F:25

qs_environment_types::qs_environment_type
Definition qs_environment_types.F:219

qs_kind_types::qs_kind_type
Provides all information about a quickstep kind.
Definition qs_kind_types.F:171

qs_neighbor_list_types::neighbor_list_set_p_type
Definition qs_neighbor_list_types.F:67

qs_tensors_types::distribution_3d_type
Definition qs_tensors_types.F:57

qs_tensors_types::neighbor_list_3c_type
Definition qs_tensors_types.F:63