d3/d90/pao__ml__neuralnet_8F_source.html

!--------------------------------------------------------------------------------------------------!

!   CP2K: A general program to perform molecular dynamics simulations                              !

!   Copyright 2000-2025 CP2K developers group <https://cp2k.org>                                   !

!                                                                                                  !

!   SPDX-License-Identifier: GPL-2.0-or-later                                                      !

!--------------------------------------------------------------------------------------------------!


! **************************************************************************************************

!> \brief Neural Network implementation

!> \author Ole Schuett

! **************************************************************************************************

MODULE pao_ml_neuralnet

   USE kinds,                           ONLY: dp

   USE pao_types,                       ONLY: pao_env_type,&

                                              training_matrix_type

   USE parallel_rng_types,              ONLY: rng_stream_type

#include "./base/base_uses.f90"


   IMPLICIT NONE


   PRIVATE


   CHARACTER(len=*), PARAMETER, PRIVATE :: moduleN = 'pao_ml_neuralnet'


   PUBLIC ::pao_ml_nn_train, pao_ml_nn_predict, pao_ml_nn_gradient


   ! TODO turn these into input parameters

   REAL(dp), PARAMETER   :: step_size = 0.001_dp

   INTEGER, PARAMETER    :: nlayers = 3

   REAL(dp), PARAMETER   :: convergence_eps = 1e-7_dp

   INTEGER, PARAMETER    :: max_training_cycles = 50000


CONTAINS


! **************************************************************************************************

!> \brief Uses neural network to make a prediction

!> \param pao ...

!> \param ikind ...

!> \param descriptor ...

!> \param output ...

!> \param variance ...

! **************************************************************************************************


   SUBROUTINE pao_ml_nn_predict(pao, ikind, descriptor, output, variance)

      TYPE(pao_env_type), POINTER                        :: pao

      INTEGER, INTENT(IN)                                :: ikind

      REAL(dp), DIMENSION(:), INTENT(IN)                 :: descriptor

      REAL(dp), DIMENSION(:), INTENT(OUT)                :: output

      REAL(dp), INTENT(OUT)                              :: variance


      TYPE(training_matrix_type), POINTER                :: training_matrix


      training_matrix => pao%ml_training_matrices(ikind)


      CALL nn_eval(training_matrix%NN, input=descriptor, prediction=output)


      variance = 0.0_dp ! Neural Networks don't provide a variance


   END SUBROUTINE pao_ml_nn_predict


! **************************************************************************************************

!> \brief Calculate gradient of neural network

!> \param pao ...

!> \param ikind ...

!> \param descriptor ...

!> \param outer_deriv ...

!> \param gradient ...

! **************************************************************************************************


   SUBROUTINE pao_ml_nn_gradient(pao, ikind, descriptor, outer_deriv, gradient)

      TYPE(pao_env_type), POINTER                        :: pao

      INTEGER, INTENT(IN)                                :: ikind

      REAL(dp), DIMENSION(:), INTENT(IN), TARGET         :: descriptor

      REAL(dp), DIMENSION(:), INTENT(IN)                 :: outer_deriv

      REAL(dp), DIMENSION(:), INTENT(OUT)                :: gradient


      INTEGER                                            :: i, ilayer, j, nlayers, width, width_in, &

                                                            width_out

      REAL(dp), ALLOCATABLE, DIMENSION(:, :)             :: backward, forward

      REAL(dp), DIMENSION(:, :, :), POINTER              :: a


      a => pao%ml_training_matrices(ikind)%NN


      nlayers = SIZE(a, 1)

      width = SIZE(a, 2); cpassert(SIZE(a, 2) == SIZE(a, 3))

      width_in = SIZE(descriptor)

      width_out = SIZE(outer_deriv)


      ALLOCATE (forward(0:nlayers, width), backward(0:nlayers, width))


      forward = 0.0_dp

      forward(0, 1:width_in) = descriptor


      DO ilayer = 1, nlayers

      DO i = 1, width

      DO j = 1, width

         forward(ilayer, i) = forward(ilayer, i) + a(ilayer, i, j)*tanh(forward(ilayer - 1, j))

      END DO

      END DO

      END DO


      ! Turning Point ------------------------------------------------------------------------------

      backward = 0.0_dp

      backward(nlayers, 1:width_out) = outer_deriv(:)


      DO ilayer = nlayers, 1, -1

      DO i = 1, width

      DO j = 1, width

  backward(ilayer - 1, j) = backward(ilayer - 1, j) + backward(ilayer, i)*a(ilayer, i, j)*(1.0_dp - tanh(forward(ilayer - 1, j))**2)

      END DO

      END DO

      END DO


      gradient(:) = backward(0, 1:width_in)


      DEALLOCATE (forward, backward)


   END SUBROUTINE pao_ml_nn_gradient


! **************************************************************************************************

!> \brief Trains the neural network on given training points

!> \param pao ...

! **************************************************************************************************


   SUBROUTINE pao_ml_nn_train(pao)

      TYPE(pao_env_type), POINTER                        :: pao


      INTEGER                                            :: i, icycle, ikind, ilayer, ipoint, j, &

                                                            npoints, width, width_in, width_out

      REAL(dp)                                           :: bak, eps, error, error1, error2, num_grad

      REAL(dp), ALLOCATABLE, DIMENSION(:)                :: prediction

      REAL(dp), ALLOCATABLE, DIMENSION(:, :, :)          :: gradient

      TYPE(rng_stream_type)                              :: rng_stream

      TYPE(training_matrix_type), POINTER                :: training_matrix


      ! TODO this could be parallelized over ranks

      DO ikind = 1, SIZE(pao%ml_training_matrices)

         training_matrix => pao%ml_training_matrices(ikind)


         npoints = SIZE(training_matrix%inputs, 2) ! number of points

         cpassert(SIZE(training_matrix%outputs, 2) == npoints)

         IF (npoints == 0) cycle


         !TODO proper output

         IF (pao%iw > 0) WRITE (pao%iw, *) "PAO|ML| Training neural network for kind: ", &

            trim(training_matrix%kindname), " from ", npoints, "training points."


         ! determine network width and allocate it

         width_in = SIZE(training_matrix%inputs, 1)

         width_out = SIZE(training_matrix%outputs, 1)

         width = max(width_in, width_out)

         ALLOCATE (training_matrix%NN(nlayers, width, width))


         ! initialize network with random numbers from -1.0 ... +1.0

         rng_stream = rng_stream_type(name="pao_nn")

         DO ilayer = 1, nlayers

         DO i = 1, width

         DO j = 1, width

            training_matrix%NN(ilayer, i, j) = -1.0_dp + 2.0_dp*rng_stream%next()

         END DO

         END DO

         END DO


         ! train the network using backpropagation

         ALLOCATE (gradient(nlayers, width, width))

         DO icycle = 1, max_training_cycles

            error = 0.0_dp

            gradient = 0.0_dp

            DO ipoint = 1, npoints

               CALL nn_backpropagate(training_matrix%NN, &

                                     input=training_matrix%inputs(:, ipoint), &

                                     goal=training_matrix%outputs(:, ipoint), &

                                     gradient=gradient, &

                                     error=error)

            END DO

            training_matrix%NN(:, :, :) = training_matrix%NN - step_size*gradient


            IF (pao%iw > 0 .AND. mod(icycle, 100) == 0) WRITE (pao%iw, *) &

               "PAO|ML| ", trim(training_matrix%kindname), &

               " training-cycle:", icycle, "SQRT(error):", sqrt(error), "grad:", sum(gradient**2)


            IF (sum(gradient**2) < convergence_eps) EXIT

         END DO


         ! numeric gradient for debugging ----------------------------------------------------------

         IF (.false.) THEN

            eps = 1e-4_dp

            ilayer = 1

            ipoint = 1

            error = 0.0_dp

            gradient = 0.0_dp

            CALL nn_backpropagate(training_matrix%NN, &

                                  input=training_matrix%inputs(:, ipoint), &

                                  goal=training_matrix%outputs(:, ipoint), &

                                  gradient=gradient, &

                                  error=error)


            ALLOCATE (prediction(width_out))

            DO i = 1, width

            DO j = 1, width

               bak = training_matrix%NN(ilayer, i, j)


               training_matrix%NN(ilayer, i, j) = bak + eps

               CALL nn_eval(training_matrix%NN, &

                            input=training_matrix%inputs(:, ipoint), &

                            prediction=prediction)

               error1 = sum((training_matrix%outputs(:, ipoint) - prediction)**2)


               training_matrix%NN(ilayer, i, j) = bak - eps

               CALL nn_eval(training_matrix%NN, &

                            input=training_matrix%inputs(:, ipoint), &

                            prediction=prediction)

               error2 = sum((training_matrix%outputs(:, ipoint) - prediction)**2)


               training_matrix%NN(ilayer, i, j) = bak

               num_grad = (error1 - error2)/(2.0_dp*eps)

               IF (pao%iw > 0) WRITE (pao%iw, *) "PAO|ML| Numeric gradient:", i, j, gradient(ilayer, i, j), num_grad


            END DO

            END DO

            DEALLOCATE (prediction)

         END IF

         !------------------------------------------------------------------------------------------


         DEALLOCATE (gradient)


         ! test training points individually

         ALLOCATE (prediction(width_out))

         DO ipoint = 1, npoints

            CALL nn_eval(training_matrix%NN, &

                         input=training_matrix%inputs(:, ipoint), &

                         prediction=prediction)

            error = maxval(abs(training_matrix%outputs(:, ipoint) - prediction))

            IF (pao%iw > 0) WRITE (pao%iw, *) "PAO|ML| ", trim(training_matrix%kindname), &

               " verify training-point:", ipoint, "SQRT(error):", sqrt(error)

         END DO

         DEALLOCATE (prediction)


      END DO


   END SUBROUTINE pao_ml_nn_train


! **************************************************************************************************

!> \brief Evaluates the neural network for a given input

!> \param A ...

!> \param input ...

!> \param prediction ...

! **************************************************************************************************

   SUBROUTINE nn_eval(A, input, prediction)

      REAL(dp), DIMENSION(:, :, :), INTENT(IN)           :: a

      REAL(dp), DIMENSION(:), INTENT(IN)                 :: input

      REAL(dp), DIMENSION(:), INTENT(OUT)                :: prediction


      INTEGER                                            :: i, ilayer, j, nlayers, width, width_in, &

                                                            width_out

      REAL(dp), ALLOCATABLE, DIMENSION(:, :)             :: forward


      nlayers = SIZE(a, 1)

      width = SIZE(a, 2); cpassert(SIZE(a, 2) == SIZE(a, 3))

      width_in = SIZE(input)

      width_out = SIZE(prediction)


      ALLOCATE (forward(0:nlayers, width))


      forward = 0.0_dp

      forward(0, 1:width_in) = input(:)


      DO ilayer = 1, nlayers

      DO i = 1, width

      DO j = 1, width

         forward(ilayer, i) = forward(ilayer, i) + a(ilayer, i, j)*tanh(forward(ilayer - 1, j))

      END DO

      END DO

      END DO


      prediction(:) = forward(nlayers, 1:width_out)


   END SUBROUTINE nn_eval


! **************************************************************************************************

!> \brief Uses backpropagation to calculate the gradient for a given training point

!> \param A ...

!> \param input ...

!> \param goal ...

!> \param error ...

!> \param gradient ...

! **************************************************************************************************

   SUBROUTINE nn_backpropagate(A, input, goal, error, gradient)

      REAL(dp), DIMENSION(:, :, :), INTENT(IN)           :: a

      REAL(dp), DIMENSION(:), INTENT(IN)                 :: input, goal

      REAL(dp), INTENT(INOUT)                            :: error

      REAL(dp), DIMENSION(:, :, :), INTENT(INOUT)        :: gradient


      INTEGER                                            :: i, ilayer, j, nlayers, width, width_in, &

                                                            width_out

      REAL(dp), ALLOCATABLE, DIMENSION(:)                :: prediction

      REAL(dp), ALLOCATABLE, DIMENSION(:, :)             :: backward, forward


      nlayers = SIZE(a, 1)

      width = SIZE(a, 2); cpassert(SIZE(a, 2) == SIZE(a, 3))

      width_in = SIZE(input)

      width_out = SIZE(goal)


      ALLOCATE (forward(0:nlayers, width), prediction(width_out), backward(0:nlayers, width))


      forward = 0.0_dp

      forward(0, 1:width_in) = input


      DO ilayer = 1, nlayers

      DO i = 1, width

      DO j = 1, width

         forward(ilayer, i) = forward(ilayer, i) + a(ilayer, i, j)*tanh(forward(ilayer - 1, j))

      END DO

      END DO

      END DO


      prediction(:) = forward(nlayers, 1:width_out)


      error = error + sum((prediction - goal)**2)


      ! Turning Point ------------------------------------------------------------------------------

      backward = 0.0_dp

      backward(nlayers, 1:width_out) = prediction - goal


      DO ilayer = nlayers, 1, -1

      DO i = 1, width

      DO j = 1, width

         gradient(ilayer, i, j) = gradient(ilayer, i, j) + 2.0_dp*backward(ilayer, i)*tanh(forward(ilayer - 1, j))

  backward(ilayer - 1, j) = backward(ilayer - 1, j) + backward(ilayer, i)*a(ilayer, i, j)*(1.0_dp - tanh(forward(ilayer - 1, j))**2)

      END DO

      END DO

      END DO


      DEALLOCATE (forward, backward, prediction)

   END SUBROUTINE nn_backpropagate


END MODULE pao_ml_neuralnet

kinds
Defines the basic variable types.
Definition kinds.F:23

kinds::dp
integer, parameter, public dp
Definition kinds.F:34

pao_ml_neuralnet
Neural Network implementation.
Definition pao_ml_neuralnet.F:12

pao_ml_neuralnet::pao_ml_nn_gradient
subroutine, public pao_ml_nn_gradient(pao, ikind, descriptor, outer_deriv, gradient)
Calculate gradient of neural network.
Definition pao_ml_neuralnet.F:68

pao_ml_neuralnet::pao_ml_nn_train
subroutine, public pao_ml_nn_train(pao)
Trains the neural network on given training points.
Definition pao_ml_neuralnet.F:121

pao_ml_neuralnet::pao_ml_nn_predict
subroutine, public pao_ml_nn_predict(pao, ikind, descriptor, output, variance)
Uses neural network to make a prediction.
Definition pao_ml_neuralnet.F:44

pao_types
Types used by the PAO machinery.
Definition pao_types.F:12

parallel_rng_types
Parallel (pseudo)random number generator (RNG) for multiple streams and substreams of random numbers.
Definition parallel_rng_types.F:51

pao_types::pao_env_type
Definition pao_types.F:147

pao_types::training_matrix_type
Definition pao_types.F:48

parallel_rng_types::rng_stream_type
Definition parallel_rng_types.F:157