446 INTEGER,
INTENT(IN),
OPTIONAL :: ncol, start_col
448 CHARACTER(LEN=*),
PARAMETER :: routinen =
'cp_fm_init_random'
450 INTEGER :: handle, icol_global, icol_local, irow_local, my_ncol, my_start_col, ncol_global, &
451 ncol_local, nrow_global, nrow_local
452 INTEGER,
DIMENSION(:),
POINTER :: col_indices, row_indices
453 REAL(kind=
dp),
ALLOCATABLE,
DIMENSION(:) :: buff
454 REAL(kind=
dp),
CONTIGUOUS,
DIMENSION(:, :), &
455 POINTER :: local_data
456 REAL(kind=
dp),
DIMENSION(3, 2),
SAVE :: &
457 seed = reshape((/1.0_dp, 2.0_dp, 3.0_dp, 4.0_dp, 5.0_dp, 6.0_dp/), (/3, 2/))
460 CALL timeset(routinen, handle)
463 CALL matrix%matrix_struct%para_env%bcast(seed, 0)
466 extended_precision=.true., seed=seed)
468 cpassert(.NOT. matrix%use_sp)
470 CALL cp_fm_get_info(matrix, nrow_global=nrow_global, ncol_global=ncol_global, &
471 nrow_local=nrow_local, ncol_local=ncol_local, &
472 local_data=local_data, &
473 row_indices=row_indices, col_indices=col_indices)
476 IF (
PRESENT(start_col)) my_start_col = start_col
477 my_ncol = matrix%matrix_struct%ncol_global
478 IF (
PRESENT(ncol)) my_ncol = ncol
480 IF (ncol_global < (my_start_col + my_ncol - 1)) &
481 cpabort(
"ncol_global>=(my_start_col+my_ncol-1)")
483 ALLOCATE (buff(nrow_global))
489 DO icol_local = 1, ncol_local
490 cpassert(col_indices(icol_local) > icol_global)
492 CALL rng%reset_to_next_substream()
493 icol_global = icol_global + 1
494 IF (icol_global == col_indices(icol_local))
EXIT
497 DO irow_local = 1, nrow_local
498 local_data(irow_local, icol_local) = buff(row_indices(irow_local))
511 CALL rng%get(ig=seed)
513 CALL timestop(handle)
760 start_col, n_rows, n_cols, alpha, beta, transpose)
762 REAL(kind=
dp),
DIMENSION(:, :),
INTENT(in) :: new_values
763 INTEGER,
INTENT(in),
OPTIONAL :: start_row, start_col, n_rows, n_cols
764 REAL(kind=
dp),
INTENT(in),
OPTIONAL :: alpha, beta
765 LOGICAL,
INTENT(in),
OPTIONAL :: transpose
767 INTEGER :: i, i0, j, j0, ncol, ncol_block, &
768 ncol_global, ncol_local, nrow, &
769 nrow_block, nrow_global, nrow_local, &
771 INTEGER,
DIMENSION(:),
POINTER :: col_indices, row_indices
773 REAL(kind=
dp) :: al, be
774 REAL(kind=
dp),
DIMENSION(:, :),
POINTER :: full_block
776 al = 1.0_dp; be = 0.0_dp; i0 = 1; j0 = 1; tr_a = .false.
780 cpassert(.NOT. fm%use_sp)
782 IF (
PRESENT(alpha)) al = alpha
783 IF (
PRESENT(beta)) be = beta
784 IF (
PRESENT(start_row)) i0 = start_row
785 IF (
PRESENT(start_col)) j0 = start_col
786 IF (
PRESENT(transpose)) tr_a = transpose
788 nrow =
SIZE(new_values, 2)
789 ncol =
SIZE(new_values, 1)
791 nrow =
SIZE(new_values, 1)
792 ncol =
SIZE(new_values, 2)
794 IF (
PRESENT(n_rows)) nrow = n_rows
795 IF (
PRESENT(n_cols)) ncol = n_cols
797 full_block => fm%local_data
800 nrow_global=nrow_global, ncol_global=ncol_global, &
801 nrow_block=nrow_block, ncol_block=ncol_block, &
802 nrow_local=nrow_local, ncol_local=ncol_local, &
803 row_indices=row_indices, col_indices=col_indices)
805 IF (al == 1.0 .AND. be == 0.0)
THEN
807 this_col = col_indices(j) - j0 + 1
808 IF (this_col .GE. 1 .AND. this_col .LE. ncol)
THEN
810 IF (i0 == 1 .AND. nrow_global == nrow)
THEN
812 full_block(i, j) = new_values(this_col, row_indices(i))
816 this_row = row_indices(i) - i0 + 1
817 IF (this_row >= 1 .AND. this_row <= nrow)
THEN
818 full_block(i, j) = new_values(this_col, this_row)
823 IF (i0 == 1 .AND. nrow_global == nrow)
THEN
825 full_block(i, j) = new_values(row_indices(i), this_col)
829 this_row = row_indices(i) - i0 + 1
830 IF (this_row >= 1 .AND. this_row <= nrow)
THEN
831 full_block(i, j) = new_values(this_row, this_col)
840 this_col = col_indices(j) - j0 + 1
841 IF (this_col .GE. 1 .AND. this_col .LE. ncol)
THEN
844 this_row = row_indices(i) - i0 + 1
845 IF (this_row >= 1 .AND. this_row <= nrow)
THEN
846 full_block(i, j) = al*new_values(this_col, this_row) + &
852 this_row = row_indices(i) - i0 + 1
853 IF (this_row >= 1 .AND. this_row <= nrow)
THEN
854 full_block(i, j) = al*new_values(this_row, this_col) + &
893 start_col, n_rows, n_cols, transpose)
895 REAL(kind=
dp),
DIMENSION(:, :),
INTENT(out) :: target_m
896 INTEGER,
INTENT(in),
OPTIONAL :: start_row, start_col, n_rows, n_cols
897 LOGICAL,
INTENT(in),
OPTIONAL :: transpose
899 CHARACTER(LEN=*),
PARAMETER :: routinen =
'cp_fm_get_submatrix'
901 INTEGER :: handle, i, i0, j, j0, ncol, ncol_global, &
902 ncol_local, nrow, nrow_global, &
903 nrow_local, this_col, this_row
904 INTEGER,
DIMENSION(:),
POINTER :: col_indices, row_indices
906 REAL(kind=
dp),
DIMENSION(:, :),
POINTER :: full_block
909 CALL timeset(routinen, handle)
911 i0 = 1; j0 = 1; tr_a = .false.
913 cpassert(.NOT. fm%use_sp)
915 IF (
PRESENT(start_row)) i0 = start_row
916 IF (
PRESENT(start_col)) j0 = start_col
917 IF (
PRESENT(transpose)) tr_a = transpose
919 nrow =
SIZE(target_m, 2)
920 ncol =
SIZE(target_m, 1)
922 nrow =
SIZE(target_m, 1)
923 ncol =
SIZE(target_m, 2)
925 IF (
PRESENT(n_rows)) nrow = n_rows
926 IF (
PRESENT(n_cols)) ncol = n_cols
928 para_env => fm%matrix_struct%para_env
930 full_block => fm%local_data
931#if defined(__parallel)
933 IF (
SIZE(target_m, 1)*
SIZE(target_m, 2) /= 0)
THEN
934 CALL dcopy(
SIZE(target_m, 1)*
SIZE(target_m, 2), [0.0_dp], 0, target_m, 1)
939 nrow_global=nrow_global, ncol_global=ncol_global, &
940 nrow_local=nrow_local, ncol_local=ncol_local, &
941 row_indices=row_indices, col_indices=col_indices)
944 this_col = col_indices(j) - j0 + 1
945 IF (this_col .GE. 1 .AND. this_col .LE. ncol)
THEN
947 IF (i0 == 1 .AND. nrow_global == nrow)
THEN
949 target_m(this_col, row_indices(i)) = full_block(i, j)
953 this_row = row_indices(i) - i0 + 1
954 IF (this_row >= 1 .AND. this_row <= nrow)
THEN
955 target_m(this_col, this_row) = full_block(i, j)
960 IF (i0 == 1 .AND. nrow_global == nrow)
THEN
962 target_m(row_indices(i), this_col) = full_block(i, j)
966 this_row = row_indices(i) - i0 + 1
967 IF (this_row >= 1 .AND. this_row <= nrow)
THEN
968 target_m(this_row, this_col) = full_block(i, j)
976 CALL para_env%sum(target_m)
978 CALL timestop(handle)
1058 REAL(kind=
dp),
INTENT(OUT) :: a_max
1059 INTEGER,
INTENT(OUT),
OPTIONAL :: ir_max, ic_max
1061 CHARACTER(LEN=*),
PARAMETER :: routinen =
'cp_fm_maxabsval'
1063 INTEGER :: handle, i, ic_max_local, ir_max_local, &
1064 j, mepos, ncol_local, nrow_local, &
1066 INTEGER,
ALLOCATABLE,
DIMENSION(:) :: ic_max_vec, ir_max_vec
1067 INTEGER,
DIMENSION(:),
POINTER :: col_indices, row_indices
1069 REAL(
dp),
ALLOCATABLE,
DIMENSION(:) :: a_max_vec
1070 REAL(kind=
dp),
DIMENSION(:, :),
POINTER :: my_block
1071 REAL(kind=
sp),
DIMENSION(:, :),
POINTER :: my_block_sp
1073 CALL timeset(routinen, handle)
1075 my_block => matrix%local_data
1076 my_block_sp => matrix%local_data_sp
1078 CALL cp_fm_get_info(matrix, nrow_local=nrow_local, ncol_local=ncol_local, &
1079 row_indices=row_indices, col_indices=col_indices)
1081 IF (matrix%use_sp)
THEN
1082 a_max = real(maxval(abs(my_block_sp(1:nrow_local, 1:ncol_local))),
dp)
1084 a_max = maxval(abs(my_block(1:nrow_local, 1:ncol_local)))
1087 IF (
PRESENT(ir_max))
THEN
1088 num_pe = matrix%matrix_struct%para_env%num_pe
1089 mepos = matrix%matrix_struct%para_env%mepos
1090 ALLOCATE (ir_max_vec(0:num_pe - 1))
1091 ir_max_vec(0:num_pe - 1) = 0
1092 ALLOCATE (ic_max_vec(0:num_pe - 1))
1093 ic_max_vec(0:num_pe - 1) = 0
1094 ALLOCATE (a_max_vec(0:num_pe - 1))
1095 a_max_vec(0:num_pe - 1) = 0.0_dp
1098 IF ((ncol_local > 0) .AND. (nrow_local > 0))
THEN
1099 DO i = 1, ncol_local
1100 DO j = 1, nrow_local
1101 IF (matrix%use_sp)
THEN
1102 IF (abs(my_block_sp(j, i)) > my_max)
THEN
1103 my_max = real(my_block_sp(j, i),
dp)
1108 IF (abs(my_block(j, i)) > my_max)
THEN
1109 my_max = my_block(j, i)
1117 a_max_vec(mepos) = my_max
1118 ir_max_vec(mepos) = row_indices(ir_max_local)
1119 ic_max_vec(mepos) = col_indices(ic_max_local)
1123 CALL matrix%matrix_struct%para_env%sum(a_max_vec)
1124 CALL matrix%matrix_struct%para_env%sum(ir_max_vec)
1125 CALL matrix%matrix_struct%para_env%sum(ic_max_vec)
1128 DO i = 0, num_pe - 1
1129 IF (a_max_vec(i) > my_max)
THEN
1130 ir_max = ir_max_vec(i)
1131 ic_max = ic_max_vec(i)
1135 DEALLOCATE (ir_max_vec, ic_max_vec, a_max_vec)
1136 cpassert(ic_max > 0)
1137 cpassert(ir_max > 0)
1141 CALL matrix%matrix_struct%para_env%max(a_max)
1143 CALL timestop(handle)
1304 SUBROUTINE cp_fm_to_fm_matrix(source, destination)
1306 TYPE(
cp_fm_type),
INTENT(IN) :: source, destination
1308 CHARACTER(LEN=*),
PARAMETER :: routinen =
'cp_fm_to_fm_matrix'
1310 INTEGER :: handle, npcol, nprow
1312 CALL timeset(routinen, handle)
1314 nprow = source%matrix_struct%context%num_pe(1)
1315 npcol = source%matrix_struct%context%num_pe(2)
1319 destination%matrix_struct))
THEN
1320 IF (source%use_sp .AND. destination%use_sp)
THEN
1321 IF (
SIZE(source%local_data_sp, 1) /=
SIZE(destination%local_data_sp, 1) .OR. &
1322 SIZE(source%local_data_sp, 2) /=
SIZE(destination%local_data_sp, 2)) &
1323 CALL cp_abort(__location__, &
1324 "Cannot copy full matrix <"//trim(source%name)// &
1325 "> to full matrix <"//trim(destination%name)// &
1326 ">. The local_data blocks have different sizes.")
1327 CALL scopy(
SIZE(source%local_data_sp, 1)*
SIZE(source%local_data_sp, 2), &
1328 source%local_data_sp, 1, destination%local_data_sp, 1)
1329 ELSE IF (source%use_sp .AND. .NOT. destination%use_sp)
THEN
1330 IF (
SIZE(source%local_data_sp, 1) /=
SIZE(destination%local_data, 1) .OR. &
1331 SIZE(source%local_data_sp, 2) /=
SIZE(destination%local_data, 2)) &
1332 CALL cp_abort(__location__, &
1333 "Cannot copy full matrix <"//trim(source%name)// &
1334 "> to full matrix <"//trim(destination%name)// &
1335 ">. The local_data blocks have different sizes.")
1336 destination%local_data = real(source%local_data_sp,
dp)
1337 ELSE IF (.NOT. source%use_sp .AND. destination%use_sp)
THEN
1338 IF (
SIZE(source%local_data, 1) /=
SIZE(destination%local_data_sp, 1) .OR. &
1339 SIZE(source%local_data, 2) /=
SIZE(destination%local_data_sp, 2)) &
1340 CALL cp_abort(__location__, &
1341 "Cannot copy full matrix <"//trim(source%name)// &
1342 "> to full matrix <"//trim(destination%name)// &
1343 ">. The local_data blocks have different sizes.")
1344 destination%local_data_sp = real(source%local_data,
sp)
1346 IF (
SIZE(source%local_data, 1) /=
SIZE(destination%local_data, 1) .OR. &
1347 SIZE(source%local_data, 2) /=
SIZE(destination%local_data, 2)) &
1348 CALL cp_abort(__location__, &
1349 "Cannot copy full matrix <"//trim(source%name)// &
1350 "> to full matrix <"//trim(destination%name)// &
1351 ">. The local_data blocks have different sizes.")
1352 CALL dcopy(
SIZE(source%local_data, 1)*
SIZE(source%local_data, 2), &
1353 source%local_data, 1, destination%local_data, 1)
1356 cpabort(
"Data structures of source and target full matrix are not equivalent")
1359 CALL timestop(handle)
1567 TYPE(
cp_fm_type),
INTENT(IN) :: source, destination
1571 CHARACTER(LEN=*),
PARAMETER :: routinen =
'cp_fm_start_copy_general'
1573 INTEGER :: dest_p_i, dest_q_j, global_rank, global_size, handle, i, j, k, mpi_rank, &
1574 ncol_block_dest, ncol_block_src, ncol_local_recv, ncol_local_send, ncols, &
1575 nrow_block_dest, nrow_block_src, nrow_local_recv, nrow_local_send, nrows, p, q, &
1576 recv_rank, recv_size, send_rank, send_size
1577 INTEGER,
ALLOCATABLE,
DIMENSION(:) :: all_ranks, dest2global, dest_p, dest_q, &
1578 recv_count, send_count, send_disp, &
1579 source2global, src_p, src_q
1580 INTEGER,
ALLOCATABLE,
DIMENSION(:, :) :: dest_blacs2mpi
1581 INTEGER,
DIMENSION(2) :: dest_block, dest_block_tmp, dest_num_pe, &
1582 src_block, src_block_tmp, src_num_pe
1583 INTEGER,
DIMENSION(:),
POINTER :: recv_col_indices, recv_row_indices, &
1584 send_col_indices, send_row_indices
1588 CALL timeset(routinen, handle)
1592 nrow_local_send =
SIZE(source%local_data, 1)
1593 ncol_local_send =
SIZE(source%local_data, 2)
1594 ALLOCATE (info%send_buf(nrow_local_send*ncol_local_send))
1596 DO j = 1, ncol_local_send
1597 DO i = 1, nrow_local_send
1599 info%send_buf(k) = source%local_data(i, j)
1604 IF (source%use_sp) cpabort(
"only DP kind implemented")
1605 IF (destination%use_sp) cpabort(
"only DP kind implemented")
1607 NULLIFY (recv_dist, send_dist)
1608 NULLIFY (recv_col_indices, recv_row_indices, send_col_indices, send_row_indices)
1611 global_size = para_env%num_pe
1612 global_rank = para_env%mepos
1618 IF (
ASSOCIATED(destination%matrix_struct))
THEN
1619 recv_dist => destination%matrix_struct
1620 recv_rank = recv_dist%para_env%mepos
1625 IF (
ASSOCIATED(source%matrix_struct))
THEN
1626 send_dist => source%matrix_struct
1627 send_rank = send_dist%para_env%mepos
1633 ALLOCATE (all_ranks(0:global_size - 1))
1635 CALL para_env%allgather(send_rank, all_ranks)
1636 IF (
ASSOCIATED(recv_dist))
THEN
1637 ALLOCATE (source2global(0:count(all_ranks .NE.
mp_proc_null) - 1))
1638 DO i = 0, global_size - 1
1640 source2global(all_ranks(i)) = i
1645 CALL para_env%allgather(recv_rank, all_ranks)
1646 IF (
ASSOCIATED(send_dist))
THEN
1647 ALLOCATE (dest2global(0:count(all_ranks .NE.
mp_proc_null) - 1))
1648 DO i = 0, global_size - 1
1650 dest2global(all_ranks(i)) = i
1654 DEALLOCATE (all_ranks)
1661 IF (global_rank == 0)
THEN
1663 CALL para_env%irecv(src_block,
mp_any_source, recv_req(1), tag=src_tag)
1664 CALL para_env%irecv(dest_block,
mp_any_source, recv_req(2), tag=dest_tag)
1665 CALL para_env%irecv(src_num_pe,
mp_any_source, recv_req(3), tag=src_tag)
1666 CALL para_env%irecv(dest_num_pe,
mp_any_source, recv_req(4), tag=dest_tag)
1669 IF (
ASSOCIATED(send_dist))
THEN
1670 IF ((send_rank .EQ. 0))
THEN
1672 src_block_tmp = (/send_dist%nrow_block, send_dist%ncol_block/)
1673 CALL para_env%isend(src_block_tmp, 0, send_req(1), tag=src_tag)
1674 CALL para_env%isend(send_dist%context%num_pe, 0, send_req(2), tag=src_tag)
1678 IF (
ASSOCIATED(recv_dist))
THEN
1679 IF ((recv_rank .EQ. 0))
THEN
1680 dest_block_tmp = (/recv_dist%nrow_block, recv_dist%ncol_block/)
1681 CALL para_env%isend(dest_block_tmp, 0, send_req(3), tag=dest_tag)
1682 CALL para_env%isend(recv_dist%context%num_pe, 0, send_req(4), tag=dest_tag)
1686 IF (global_rank == 0)
THEN
1689 ALLOCATE (info%src_blacs2mpi(0:src_num_pe(1) - 1, 0:src_num_pe(2) - 1), &
1690 dest_blacs2mpi(0:dest_num_pe(1) - 1, 0:dest_num_pe(2) - 1) &
1692 CALL para_env%irecv(info%src_blacs2mpi,
mp_any_source, recv_req(5), tag=src_tag)
1693 CALL para_env%irecv(dest_blacs2mpi,
mp_any_source, recv_req(6), tag=dest_tag)
1696 IF (
ASSOCIATED(send_dist))
THEN
1697 IF ((send_rank .EQ. 0))
THEN
1698 CALL para_env%isend(send_dist%context%blacs2mpi(:, :), 0, send_req(5), tag=src_tag)
1702 IF (
ASSOCIATED(recv_dist))
THEN
1703 IF ((recv_rank .EQ. 0))
THEN
1704 CALL para_env%isend(recv_dist%context%blacs2mpi(:, :), 0, send_req(6), tag=dest_tag)
1708 IF (global_rank == 0)
THEN
1713 CALL para_env%bcast(src_block, 0)
1714 CALL para_env%bcast(dest_block, 0)
1715 CALL para_env%bcast(src_num_pe, 0)
1716 CALL para_env%bcast(dest_num_pe, 0)
1717 info%src_num_pe(1:2) = src_num_pe(1:2)
1718 info%nblock_src(1:2) = src_block(1:2)
1719 IF (global_rank .NE. 0)
THEN
1720 ALLOCATE (info%src_blacs2mpi(0:src_num_pe(1) - 1, 0:src_num_pe(2) - 1), &
1721 dest_blacs2mpi(0:dest_num_pe(1) - 1, 0:dest_num_pe(2) - 1) &
1724 CALL para_env%bcast(info%src_blacs2mpi, 0)
1725 CALL para_env%bcast(dest_blacs2mpi, 0)
1727 recv_size = dest_num_pe(1)*dest_num_pe(2)
1728 send_size = src_num_pe(1)*src_num_pe(2)
1729 info%send_size = send_size
1747 IF (
ASSOCIATED(recv_dist))
THEN
1749 col_indices=recv_col_indices &
1751 info%recv_col_indices => recv_col_indices
1752 info%recv_row_indices => recv_row_indices
1753 nrow_block_src = src_block(1)
1754 ncol_block_src = src_block(2)
1755 ALLOCATE (recv_count(0:send_size - 1), info%recv_disp(0:send_size - 1), info%recv_request(0:send_size - 1))
1758 nrow_local_recv = recv_dist%nrow_locals(recv_dist%context%mepos(1))
1759 ncol_local_recv = recv_dist%ncol_locals(recv_dist%context%mepos(2))
1760 info%nlocal_recv(1) = nrow_local_recv
1761 info%nlocal_recv(2) = ncol_local_recv
1763 ALLOCATE (src_p(nrow_local_recv), src_q(ncol_local_recv))
1764 DO i = 1, nrow_local_recv
1767 src_p(i) = mod(((recv_row_indices(i) - 1)/nrow_block_src), src_num_pe(1))
1769 DO j = 1, ncol_local_recv
1771 src_q(j) = mod(((recv_col_indices(j) - 1)/ncol_block_src), src_num_pe(2))
1775 DO q = 0, src_num_pe(2) - 1
1776 ncols = count(src_q .EQ. q)
1777 DO p = 0, src_num_pe(1) - 1
1778 nrows = count(src_p .EQ. p)
1780 recv_count(info%src_blacs2mpi(p, q)) = nrows*ncols
1783 DEALLOCATE (src_p, src_q)
1787 ALLOCATE (info%recv_buf(sum(recv_count(:))))
1788 info%recv_disp(0) = 0
1789 DO i = 1, send_size - 1
1790 info%recv_disp(i) = info%recv_disp(i - 1) + recv_count(i - 1)
1794 DO k = 0, send_size - 1
1795 IF (recv_count(k) .GT. 0)
THEN
1796 CALL para_env%irecv(info%recv_buf(info%recv_disp(k) + 1:info%recv_disp(k) + recv_count(k)), &
1797 source2global(k), info%recv_request(k))
1800 DEALLOCATE (source2global)
1804 IF (
ASSOCIATED(send_dist))
THEN
1806 col_indices=send_col_indices &
1808 nrow_block_dest = dest_block(1)
1809 ncol_block_dest = dest_block(2)
1810 ALLOCATE (send_count(0:recv_size - 1), send_disp(0:recv_size - 1), info%send_request(0:recv_size - 1))
1813 nrow_local_send = send_dist%nrow_locals(send_dist%context%mepos(1))
1814 ncol_local_send = send_dist%ncol_locals(send_dist%context%mepos(2))
1818 ALLOCATE (dest_p(nrow_local_send), dest_q(ncol_local_send))
1820 DO i = 1, nrow_local_send
1822 dest_p(i) = mod(((send_row_indices(i) - 1)/nrow_block_dest), dest_num_pe(1))
1824 DO j = 1, ncol_local_send
1825 dest_q(j) = mod(((send_col_indices(j) - 1)/ncol_block_dest), dest_num_pe(2))
1829 DO q = 0, dest_num_pe(2) - 1
1830 ncols = count(dest_q .EQ. q)
1831 DO p = 0, dest_num_pe(1) - 1
1832 nrows = count(dest_p .EQ. p)
1833 send_count(dest_blacs2mpi(p, q)) = nrows*ncols
1836 DEALLOCATE (dest_p, dest_q)
1839 ALLOCATE (info%send_buf(sum(send_count(:))))
1841 DO k = 1, recv_size - 1
1842 send_disp(k) = send_disp(k - 1) + send_count(k - 1)
1847 DO j = 1, ncol_local_send
1849 dest_q_j = mod(((send_col_indices(j) - 1)/ncol_block_dest), dest_num_pe(2))
1850 DO i = 1, nrow_local_send
1851 dest_p_i = mod(((send_row_indices(i) - 1)/nrow_block_dest), dest_num_pe(1))
1852 mpi_rank = dest_blacs2mpi(dest_p_i, dest_q_j)
1853 send_count(mpi_rank) = send_count(mpi_rank) + 1
1854 info%send_buf(send_disp(mpi_rank) + send_count(mpi_rank)) = source%local_data(i, j)
1859 DO k = 0, recv_size - 1
1860 IF (send_count(k) .GT. 0)
THEN
1861 CALL para_env%isend(info%send_buf(send_disp(k) + 1:send_disp(k) + send_count(k)), &
1862 dest2global(k), info%send_request(k))
1865 DEALLOCATE (send_count, send_disp, dest2global)
1867 DEALLOCATE (dest_blacs2mpi)
1871 CALL timestop(handle)
2147 INTEGER,
INTENT(IN) :: unit
2149 CHARACTER(LEN=*),
PARAMETER :: routinen =
'cp_fm_write_unformatted'
2151 INTEGER :: handle, j, max_block, &
2152 ncol_global, nrow_global
2154#if defined(__parallel)
2155 INTEGER :: i, i_block, icol_local, &
2157 iprow, irow_local, &
2160 INTEGER,
DIMENSION(9) :: desc
2161 REAL(kind=
dp),
DIMENSION(:),
POINTER :: vecbuf
2162 REAL(kind=
dp),
DIMENSION(:, :),
POINTER :: newdat
2164 INTEGER,
EXTERNAL :: numroc
2167 CALL timeset(routinen, handle)
2168 CALL cp_fm_get_info(fm, nrow_global=nrow_global, ncol_global=ncol_global, ncol_block=max_block, &
2171#if defined(__parallel)
2172 num_pe = para_env%num_pe
2173 mepos = para_env%mepos
2177 CALL ictxt_loc%gridinit(para_env,
'R', 1, num_pe)
2178 CALL descinit(desc, nrow_global, ncol_global, rb, max_block, 0, 0, ictxt_loc%get_handle(), nrow_global, info)
2180 associate(nprow => ictxt_loc%num_pe(1), npcol => ictxt_loc%num_pe(2), &
2181 myprow => ictxt_loc%mepos(1), mypcol => ictxt_loc%mepos(2))
2182 in = numroc(ncol_global, max_block, mypcol, 0, npcol)
2184 ALLOCATE (newdat(nrow_global, max(1, in)))
2187 CALL pdgemr2d(nrow_global, ncol_global, fm%local_data, 1, 1, &
2188 fm%matrix_struct%descriptor, &
2189 newdat, 1, 1, desc, ictxt_loc%get_handle())
2191 ALLOCATE (vecbuf(nrow_global*max_block))
2192 vecbuf = huge(1.0_dp)
2194 DO i = 1, ncol_global, max(max_block, 1)
2195 i_block = min(max_block, ncol_global - i + 1)
2196 CALL infog2l(1, i, desc, nprow, npcol, myprow, mypcol, &
2197 irow_local, icol_local, iprow, ipcol)
2198 IF (ipcol == mypcol)
THEN
2200 vecbuf((j - 1)*nrow_global + 1:nrow_global*j) = newdat(:, icol_local + j - 1)
2204 IF (ipcol == 0)
THEN
2207 IF (ipcol == mypcol)
THEN
2208 CALL para_env%send(vecbuf(:), 0, tag)
2210 IF (mypcol == 0)
THEN
2211 CALL para_env%recv(vecbuf(:), ipcol, tag)
2217 WRITE (unit) vecbuf((j - 1)*nrow_global + 1:nrow_global*j)
2225 CALL ictxt_loc%gridexit()
2232 DO j = 1, ncol_global
2233 WRITE (unit) fm%local_data(:, j)
2238 CALL timestop(handle)
2251 INTEGER,
INTENT(IN) :: unit
2252 CHARACTER(LEN=*),
INTENT(IN),
OPTIONAL ::
header, value_format
2254 CHARACTER(LEN=*),
PARAMETER :: routinen =
'cp_fm_write_formatted'
2256 CHARACTER(LEN=21) :: my_value_format
2257 INTEGER :: handle, i, j, max_block, &
2258 ncol_global, nrow_global
2259 TYPE(mp_para_env_type),
POINTER :: para_env
2260#if defined(__parallel)
2261 INTEGER :: i_block, icol_local, &
2263 iprow, irow_local, &
2264 mepos, num_pe, rb, tag, k, &
2266 INTEGER,
DIMENSION(9) :: desc
2267 REAL(kind=dp),
DIMENSION(:),
POINTER :: vecbuf
2268 REAL(kind=dp),
DIMENSION(:, :),
POINTER :: newdat
2269 TYPE(cp_blacs_type) :: ictxt_loc
2270 INTEGER,
EXTERNAL :: numroc
2273 CALL timeset(routinen, handle)
2274 CALL cp_fm_get_info(fm, nrow_global=nrow_global, ncol_global=ncol_global, ncol_block=max_block, &
2277 IF (
PRESENT(value_format))
THEN
2278 cpassert(len_trim(adjustl(value_format)) < 11)
2279 my_value_format =
"(I10, I10, "//trim(adjustl(value_format))//
")"
2281 my_value_format =
"(I10, I10, ES24.12)"
2286 WRITE (unit,
"(A2, A8, A10, A24)")
"#",
"Row",
"Column", adjustl(
"Value")
2289#if defined(__parallel)
2290 num_pe = para_env%num_pe
2291 mepos = para_env%mepos
2295 CALL ictxt_loc%gridinit(para_env,
'R', 1, num_pe)
2296 CALL descinit(desc, nrow_global, ncol_global, rb, max_block, 0, 0, ictxt_loc%get_handle(), nrow_global, info)
2298 associate(nprow => ictxt_loc%num_pe(1), npcol => ictxt_loc%num_pe(2), &
2299 myprow => ictxt_loc%mepos(1), mypcol => ictxt_loc%mepos(2))
2300 in = numroc(ncol_global, max_block, mypcol, 0, npcol)
2302 ALLOCATE (newdat(nrow_global, max(1, in)))
2305 CALL pdgemr2d(nrow_global, ncol_global, fm%local_data, 1, 1, &
2306 fm%matrix_struct%descriptor, &
2307 newdat, 1, 1, desc, ictxt_loc%get_handle())
2309 ALLOCATE (vecbuf(nrow_global*max_block))
2310 vecbuf = huge(1.0_dp)
2314 DO i = 1, ncol_global, max(max_block, 1)
2315 i_block = min(max_block, ncol_global - i + 1)
2316 CALL infog2l(1, i, desc, nprow, npcol, myprow, mypcol, &
2317 irow_local, icol_local, iprow, ipcol)
2318 IF (ipcol == mypcol)
THEN
2320 vecbuf((j - 1)*nrow_global + 1:nrow_global*j) = newdat(:, icol_local + j - 1)
2324 IF (ipcol == 0)
THEN
2327 IF (ipcol == mypcol)
THEN
2328 CALL para_env%send(vecbuf(:), 0, tag)
2330 IF (mypcol == 0)
THEN
2331 CALL para_env%recv(vecbuf(:), ipcol, tag)
2337 DO k = (j - 1)*nrow_global + 1, nrow_global*j
2338 WRITE (unit=unit, fmt=my_value_format) irow, icol, vecbuf(k)
2340 IF (irow > nrow_global)
THEN
2352 CALL ictxt_loc%gridexit()
2359 DO j = 1, ncol_global
2360 DO i = 1, nrow_global
2361 WRITE (unit=unit, fmt=my_value_format) i, j, fm%local_data(i, j)
2367 CALL timestop(handle)