330 COMPLEX(kind=dp),
DIMENSION(:, :),
INTENT(out) :: target_m
331 INTEGER,
INTENT(in),
OPTIONAL :: start_row, start_col, n_rows, n_cols
332 LOGICAL,
INTENT(in),
OPTIONAL :: transpose
334 CHARACTER(len=*),
PARAMETER :: routinen =
'cp_cfm_get_submatrix'
336 COMPLEX(kind=dp),
DIMENSION(:, :),
POINTER :: local_data
337 INTEGER :: end_col_global, end_col_local, end_row_global, end_row_local, handle, i, j, &
338 ncol_global, ncol_local, nrow_global, nrow_local, start_col_global, start_col_local, &
339 start_row_global, start_row_local, this_col
340 INTEGER,
DIMENSION(:),
POINTER :: col_indices, row_indices
341 LOGICAL :: do_zero, tr_a
344 CALL timeset(routinen, handle)
346 IF (
SIZE(target_m) /= 0)
THEN
347#if defined(__parallel)
354 IF (
PRESENT(transpose)) tr_a = transpose
359 IF (
PRESENT(start_row)) start_row_global = start_row
360 IF (
PRESENT(start_col)) start_col_global = start_col
363 end_row_global =
SIZE(target_m, 2)
364 end_col_global =
SIZE(target_m, 1)
366 end_row_global =
SIZE(target_m, 1)
367 end_col_global =
SIZE(target_m, 2)
369 IF (
PRESENT(n_rows)) end_row_global = n_rows
370 IF (
PRESENT(n_cols)) end_col_global = n_cols
372 end_row_global = end_row_global + start_row_global - 1
373 end_col_global = end_col_global + start_col_global - 1
376 nrow_global=nrow_global, ncol_global=ncol_global, &
377 nrow_local=nrow_local, ncol_local=ncol_local, &
378 row_indices=row_indices, col_indices=col_indices)
379 IF (end_row_global > nrow_global)
THEN
380 end_row_global = nrow_global
383 IF (end_col_global > ncol_global)
THEN
384 end_col_global = ncol_global
390 DO start_row_local = 1, nrow_local
391 IF (row_indices(start_row_local) >= start_row_global)
EXIT
394 DO end_row_local = start_row_local, nrow_local
395 IF (row_indices(end_row_local) > end_row_global)
EXIT
397 end_row_local = end_row_local - 1
399 DO start_col_local = 1, ncol_local
400 IF (col_indices(start_col_local) >= start_col_global)
EXIT
403 DO end_col_local = start_col_local, ncol_local
404 IF (col_indices(end_col_local) > end_col_global)
EXIT
406 end_col_local = end_col_local - 1
408 para_env => fm%matrix_struct%para_env
409 local_data => fm%local_data
416 CALL zcopy(
SIZE(target_m),
z_zero, 0, target_m(1, 1), 1)
419 DO j = start_col_local, end_col_local
420 this_col = col_indices(j) - start_col_global + 1
421 DO i = start_row_local, end_row_local
422 target_m(this_col, row_indices(i) - start_row_global + 1) = local_data(i, j)
426 DO j = start_col_local, end_col_local
427 this_col = col_indices(j) - start_col_global + 1
428 DO i = start_row_local, end_row_local
429 target_m(row_indices(i) - start_row_global + 1, this_col) = local_data(i, j)
434 CALL para_env%sum(target_m)
437 CALL timestop(handle)
465 start_col, n_rows, n_cols, alpha, beta, transpose)
467 COMPLEX(kind=dp),
DIMENSION(:, :),
INTENT(in) :: new_values
468 INTEGER,
INTENT(in),
OPTIONAL :: start_row, start_col, n_rows, n_cols
469 COMPLEX(kind=dp),
INTENT(in),
OPTIONAL :: alpha, beta
470 LOGICAL,
INTENT(in),
OPTIONAL :: transpose
472 CHARACTER(len=*),
PARAMETER :: routinen =
'cp_cfm_set_submatrix'
474 COMPLEX(kind=dp) :: al, be
475 COMPLEX(kind=dp),
DIMENSION(:, :),
POINTER :: local_data
476 INTEGER :: end_col_global, end_col_local, end_row_global, end_row_local, handle, i, j, &
477 ncol_global, ncol_local, nrow_global, nrow_local, start_col_global, start_col_local, &
478 start_row_global, start_row_local, this_col
479 INTEGER,
DIMENSION(:),
POINTER :: col_indices, row_indices
482 CALL timeset(routinen, handle)
486 IF (
PRESENT(alpha)) al = alpha
487 IF (
PRESENT(beta)) be = beta
492 IF (
PRESENT(start_row)) start_row_global = start_row
493 IF (
PRESENT(start_col)) start_col_global = start_col
496 IF (
PRESENT(transpose)) tr_a = transpose
499 end_row_global =
SIZE(new_values, 2)
500 end_col_global =
SIZE(new_values, 1)
502 end_row_global =
SIZE(new_values, 1)
503 end_col_global =
SIZE(new_values, 2)
505 IF (
PRESENT(n_rows)) end_row_global = n_rows
506 IF (
PRESENT(n_cols)) end_col_global = n_cols
508 end_row_global = end_row_global + start_row_global - 1
509 end_col_global = end_col_global + start_col_global - 1
512 nrow_global=nrow_global, ncol_global=ncol_global, &
513 nrow_local=nrow_local, ncol_local=ncol_local, &
514 row_indices=row_indices, col_indices=col_indices)
515 IF (end_row_global > nrow_global) end_row_global = nrow_global
516 IF (end_col_global > ncol_global) end_col_global = ncol_global
520 DO start_row_local = 1, nrow_local
521 IF (row_indices(start_row_local) >= start_row_global)
EXIT
524 DO end_row_local = start_row_local, nrow_local
525 IF (row_indices(end_row_local) > end_row_global)
EXIT
527 end_row_local = end_row_local - 1
529 DO start_col_local = 1, ncol_local
530 IF (col_indices(start_col_local) >= start_col_global)
EXIT
533 DO end_col_local = start_col_local, ncol_local
534 IF (col_indices(end_col_local) > end_col_global)
EXIT
536 end_col_local = end_col_local - 1
538 local_data => matrix%local_data
542 DO j = start_col_local, end_col_local
543 this_col = col_indices(j) - start_col_global + 1
544 DO i = start_row_local, end_row_local
545 local_data(i, j) = new_values(this_col, row_indices(i) - start_row_global + 1)
549 DO j = start_col_local, end_col_local
550 this_col = col_indices(j) - start_col_global + 1
551 DO i = start_row_local, end_row_local
552 local_data(i, j) = new_values(row_indices(i) - start_row_global + 1, this_col)
558 DO j = start_col_local, end_col_local
559 this_col = col_indices(j) - start_col_global + 1
560 DO i = start_row_local, end_row_local
561 local_data(i, j) = al*new_values(this_col, row_indices(i) - start_row_global + 1) + &
566 DO j = start_col_local, end_col_local
567 this_col = col_indices(j) - start_col_global + 1
568 DO i = start_row_local, end_row_local
569 local_data(i, j) = al*new_values(row_indices(i) - start_row_global + 1, this_col) + &
576 CALL timestop(handle)
875 TYPE(
cp_cfm_type),
INTENT(IN) :: source, destination
879 CHARACTER(len=*),
PARAMETER :: routinen =
'cp_cfm_start_copy_general'
881 INTEGER :: dest_p_i, dest_q_j, global_rank, global_size, handle, i, j, k, mpi_rank, &
882 ncol_block_dest, ncol_block_src, ncol_local_recv, ncol_local_send, ncols, &
883 nrow_block_dest, nrow_block_src, nrow_local_recv, nrow_local_send, nrows, p, q, &
884 recv_rank, recv_size, send_rank, send_size
885 INTEGER,
ALLOCATABLE,
DIMENSION(:) :: all_ranks, dest2global, dest_p, dest_q, &
886 recv_count, send_count, send_disp, &
887 source2global, src_p, src_q
888 INTEGER,
ALLOCATABLE,
DIMENSION(:, :) :: dest_blacs2mpi
889 INTEGER,
DIMENSION(2) :: dest_block, dest_block_tmp, dest_num_pe, &
890 src_block, src_block_tmp, src_num_pe
891 INTEGER,
DIMENSION(:),
POINTER :: recv_col_indices, recv_row_indices, &
892 send_col_indices, send_row_indices
896 CALL timeset(routinen, handle)
900 nrow_local_send =
SIZE(source%local_data, 1)
901 ncol_local_send =
SIZE(source%local_data, 2)
902 ALLOCATE (info%send_buf(nrow_local_send*ncol_local_send))
904 DO j = 1, ncol_local_send
905 DO i = 1, nrow_local_send
907 info%send_buf(k) = source%local_data(i, j)
911 NULLIFY (recv_dist, send_dist)
912 NULLIFY (recv_col_indices, recv_row_indices, send_col_indices, send_row_indices)
915 global_size = para_env%num_pe
916 global_rank = para_env%mepos
922 IF (
ASSOCIATED(destination%matrix_struct))
THEN
923 recv_dist => destination%matrix_struct
924 recv_rank = recv_dist%para_env%mepos
929 IF (
ASSOCIATED(source%matrix_struct))
THEN
930 send_dist => source%matrix_struct
931 send_rank = send_dist%para_env%mepos
937 ALLOCATE (all_ranks(0:global_size - 1))
939 CALL para_env%allgather(send_rank, all_ranks)
940 IF (
ASSOCIATED(destination%matrix_struct))
THEN
941 ALLOCATE (source2global(0:count(all_ranks .NE.
mp_proc_null) - 1))
942 DO i = 0, global_size - 1
944 source2global(all_ranks(i)) = i
949 CALL para_env%allgather(recv_rank, all_ranks)
950 IF (
ASSOCIATED(source%matrix_struct))
THEN
951 ALLOCATE (dest2global(0:count(all_ranks .NE.
mp_proc_null) - 1))
952 DO i = 0, global_size - 1
954 dest2global(all_ranks(i)) = i
958 DEALLOCATE (all_ranks)
965 IF (global_rank == 0)
THEN
967 CALL para_env%irecv(src_block,
mp_any_source, recv_req(1), tag=src_tag)
968 CALL para_env%irecv(dest_block,
mp_any_source, recv_req(2), tag=dest_tag)
969 CALL para_env%irecv(src_num_pe,
mp_any_source, recv_req(3), tag=src_tag)
970 CALL para_env%irecv(dest_num_pe,
mp_any_source, recv_req(4), tag=dest_tag)
973 IF (
ASSOCIATED(source%matrix_struct))
THEN
974 IF ((send_rank == 0))
THEN
976 src_block_tmp = (/send_dist%nrow_block, send_dist%ncol_block/)
977 CALL para_env%isend(src_block_tmp, 0, send_req(1), tag=src_tag)
978 CALL para_env%isend(send_dist%context%num_pe, 0, send_req(2), tag=src_tag)
982 IF (
ASSOCIATED(destination%matrix_struct))
THEN
983 IF ((recv_rank == 0))
THEN
984 dest_block_tmp = (/recv_dist%nrow_block, recv_dist%ncol_block/)
985 CALL para_env%isend(dest_block_tmp, 0, send_req(3), tag=dest_tag)
986 CALL para_env%isend(recv_dist%context%num_pe, 0, send_req(4), tag=dest_tag)
990 IF (global_rank == 0)
THEN
993 ALLOCATE (info%src_blacs2mpi(0:src_num_pe(1) - 1, 0:src_num_pe(2) - 1), &
994 dest_blacs2mpi(0:dest_num_pe(1) - 1, 0:dest_num_pe(2) - 1))
995 CALL para_env%irecv(info%src_blacs2mpi,
mp_any_source, recv_req(5), tag=src_tag)
996 CALL para_env%irecv(dest_blacs2mpi,
mp_any_source, recv_req(6), tag=dest_tag)
999 IF (
ASSOCIATED(source%matrix_struct))
THEN
1000 IF ((send_rank == 0))
THEN
1001 CALL para_env%isend(send_dist%context%blacs2mpi(:, :), 0, send_req(5), tag=src_tag)
1005 IF (
ASSOCIATED(destination%matrix_struct))
THEN
1006 IF ((recv_rank == 0))
THEN
1007 CALL para_env%isend(recv_dist%context%blacs2mpi(:, :), 0, send_req(6), tag=dest_tag)
1011 IF (global_rank == 0)
THEN
1016 CALL para_env%bcast(src_block, 0)
1017 CALL para_env%bcast(dest_block, 0)
1018 CALL para_env%bcast(src_num_pe, 0)
1019 CALL para_env%bcast(dest_num_pe, 0)
1020 info%src_num_pe(1:2) = src_num_pe(1:2)
1021 info%nblock_src(1:2) = src_block(1:2)
1022 IF (global_rank /= 0)
THEN
1023 ALLOCATE (info%src_blacs2mpi(0:src_num_pe(1) - 1, 0:src_num_pe(2) - 1), &
1024 dest_blacs2mpi(0:dest_num_pe(1) - 1, 0:dest_num_pe(2) - 1))
1026 CALL para_env%bcast(info%src_blacs2mpi, 0)
1027 CALL para_env%bcast(dest_blacs2mpi, 0)
1029 recv_size = dest_num_pe(1)*dest_num_pe(2)
1030 send_size = src_num_pe(1)*src_num_pe(2)
1031 info%send_size = send_size
1049 IF (
ASSOCIATED(destination%matrix_struct))
THEN
1051 col_indices=recv_col_indices)
1052 info%recv_col_indices => recv_col_indices
1053 info%recv_row_indices => recv_row_indices
1054 nrow_block_src = src_block(1)
1055 ncol_block_src = src_block(2)
1056 ALLOCATE (recv_count(0:send_size - 1), info%recv_disp(0:send_size - 1), info%recv_request(0:send_size - 1))
1059 nrow_local_recv = recv_dist%nrow_locals(recv_dist%context%mepos(1))
1060 ncol_local_recv = recv_dist%ncol_locals(recv_dist%context%mepos(2))
1061 info%nlocal_recv(1) = nrow_local_recv
1062 info%nlocal_recv(2) = ncol_local_recv
1064 ALLOCATE (src_p(nrow_local_recv), src_q(ncol_local_recv))
1065 DO i = 1, nrow_local_recv
1068 src_p(i) = mod(((recv_row_indices(i) - 1)/nrow_block_src), src_num_pe(1))
1070 DO j = 1, ncol_local_recv
1072 src_q(j) = mod(((recv_col_indices(j) - 1)/ncol_block_src), src_num_pe(2))
1076 DO q = 0, src_num_pe(2) - 1
1077 ncols = count(src_q .EQ. q)
1078 DO p = 0, src_num_pe(1) - 1
1079 nrows = count(src_p .EQ. p)
1081 recv_count(info%src_blacs2mpi(p, q)) = nrows*ncols
1084 DEALLOCATE (src_p, src_q)
1088 ALLOCATE (info%recv_buf(sum(recv_count(:))))
1089 info%recv_disp(0) = 0
1090 DO i = 1, send_size - 1
1091 info%recv_disp(i) = info%recv_disp(i - 1) + recv_count(i - 1)
1095 DO k = 0, send_size - 1
1096 IF (recv_count(k) .GT. 0)
THEN
1097 CALL para_env%irecv(info%recv_buf(info%recv_disp(k) + 1:info%recv_disp(k) + recv_count(k)), &
1098 source2global(k), info%recv_request(k))
1103 DEALLOCATE (source2global)
1107 IF (
ASSOCIATED(source%matrix_struct))
THEN
1109 col_indices=send_col_indices)
1110 nrow_block_dest = dest_block(1)
1111 ncol_block_dest = dest_block(2)
1112 ALLOCATE (send_count(0:recv_size - 1), send_disp(0:recv_size - 1), info%send_request(0:recv_size - 1))
1115 nrow_local_send = send_dist%nrow_locals(send_dist%context%mepos(1))
1116 ncol_local_send = send_dist%ncol_locals(send_dist%context%mepos(2))
1120 ALLOCATE (dest_p(nrow_local_send), dest_q(ncol_local_send))
1122 DO i = 1, nrow_local_send
1124 dest_p(i) = mod(((send_row_indices(i) - 1)/nrow_block_dest), dest_num_pe(1))
1126 DO j = 1, ncol_local_send
1127 dest_q(j) = mod(((send_col_indices(j) - 1)/ncol_block_dest), dest_num_pe(2))
1131 DO q = 0, dest_num_pe(2) - 1
1132 ncols = count(dest_q .EQ. q)
1133 DO p = 0, dest_num_pe(1) - 1
1134 nrows = count(dest_p .EQ. p)
1135 send_count(dest_blacs2mpi(p, q)) = nrows*ncols
1138 DEALLOCATE (dest_p, dest_q)
1141 ALLOCATE (info%send_buf(sum(send_count(:))))
1143 DO k = 1, recv_size - 1
1144 send_disp(k) = send_disp(k - 1) + send_count(k - 1)
1149 DO j = 1, ncol_local_send
1151 dest_q_j = mod(((send_col_indices(j) - 1)/ncol_block_dest), dest_num_pe(2))
1152 DO i = 1, nrow_local_send
1153 dest_p_i = mod(((send_row_indices(i) - 1)/nrow_block_dest), dest_num_pe(1))
1154 mpi_rank = dest_blacs2mpi(dest_p_i, dest_q_j)
1155 send_count(mpi_rank) = send_count(mpi_rank) + 1
1156 info%send_buf(send_disp(mpi_rank) + send_count(mpi_rank)) = source%local_data(i, j)
1161 DO k = 0, recv_size - 1
1162 IF (send_count(k) .GT. 0)
THEN
1163 CALL para_env%isend(info%send_buf(send_disp(k) + 1:send_disp(k) + send_count(k)), &
1164 dest2global(k), info%send_request(k))
1169 DEALLOCATE (send_count, send_disp, dest2global)
1171 DEALLOCATE (dest_blacs2mpi)
1175 CALL timestop(handle)