453 INTEGER,
INTENT(IN),
OPTIONAL :: ncol, start_col
455 CHARACTER(LEN=*),
PARAMETER :: routinen =
'cp_fm_init_random'
457 INTEGER :: handle, icol_global, icol_local, irow_local, my_ncol, my_start_col, ncol_global, &
458 ncol_local, nrow_global, nrow_local
459 INTEGER,
DIMENSION(:),
POINTER :: col_indices, row_indices
460 REAL(kind=
dp),
ALLOCATABLE,
DIMENSION(:) :: buff
461 REAL(kind=
dp),
CONTIGUOUS,
DIMENSION(:, :), &
462 POINTER :: local_data
463 REAL(kind=
dp),
DIMENSION(3, 2),
SAVE :: &
464 seed = reshape([1.0_dp, 2.0_dp, 3.0_dp, 4.0_dp, 5.0_dp, 6.0_dp], [3, 2])
467 CALL timeset(routinen, handle)
470 CALL matrix%matrix_struct%para_env%bcast(seed, 0)
473 extended_precision=.true., seed=seed)
475 CALL cp_fm_get_info(matrix, nrow_global=nrow_global, ncol_global=ncol_global, &
476 nrow_local=nrow_local, ncol_local=ncol_local, &
477 local_data=local_data, &
478 row_indices=row_indices, col_indices=col_indices)
481 IF (
PRESENT(start_col)) my_start_col = start_col
482 my_ncol = matrix%matrix_struct%ncol_global
483 IF (
PRESENT(ncol)) my_ncol = ncol
485 IF (ncol_global < (my_start_col + my_ncol - 1)) &
486 cpabort(
"ncol_global>=(my_start_col+my_ncol-1)")
488 ALLOCATE (buff(nrow_global))
494 DO icol_local = 1, ncol_local
495 cpassert(col_indices(icol_local) > icol_global)
497 CALL rng%reset_to_next_substream()
498 icol_global = icol_global + 1
499 IF (icol_global == col_indices(icol_local))
EXIT
502 DO irow_local = 1, nrow_local
503 local_data(irow_local, icol_local) = buff(row_indices(irow_local))
516 CALL rng%get(ig=seed)
518 CALL timestop(handle)
748 start_col, n_rows, n_cols, alpha, beta, transpose)
750 REAL(kind=
dp),
DIMENSION(:, :),
INTENT(in) :: new_values
751 INTEGER,
INTENT(in),
OPTIONAL :: start_row, start_col, n_rows, n_cols
752 REAL(kind=
dp),
INTENT(in),
OPTIONAL :: alpha, beta
753 LOGICAL,
INTENT(in),
OPTIONAL :: transpose
755 INTEGER :: i, i0, j, j0, ncol, ncol_block, &
756 ncol_global, ncol_local, nrow, &
757 nrow_block, nrow_global, nrow_local, &
759 INTEGER,
DIMENSION(:),
POINTER :: col_indices, row_indices
761 REAL(kind=
dp) :: al, be
762 REAL(kind=
dp),
DIMENSION(:, :),
POINTER :: full_block
764 al = 1.0_dp; be = 0.0_dp; i0 = 1; j0 = 1; tr_a = .false.
766 IF (
PRESENT(alpha)) al = alpha
767 IF (
PRESENT(beta)) be = beta
768 IF (
PRESENT(start_row)) i0 = start_row
769 IF (
PRESENT(start_col)) j0 = start_col
770 IF (
PRESENT(transpose)) tr_a = transpose
772 nrow =
SIZE(new_values, 2)
773 ncol =
SIZE(new_values, 1)
775 nrow =
SIZE(new_values, 1)
776 ncol =
SIZE(new_values, 2)
778 IF (
PRESENT(n_rows)) nrow = n_rows
779 IF (
PRESENT(n_cols)) ncol = n_cols
781 full_block => fm%local_data
784 nrow_global=nrow_global, ncol_global=ncol_global, &
785 nrow_block=nrow_block, ncol_block=ncol_block, &
786 nrow_local=nrow_local, ncol_local=ncol_local, &
787 row_indices=row_indices, col_indices=col_indices)
789 IF (al == 1.0 .AND. be == 0.0)
THEN
791 this_col = col_indices(j) - j0 + 1
792 IF (this_col >= 1 .AND. this_col <= ncol)
THEN
794 IF (i0 == 1 .AND. nrow_global == nrow)
THEN
796 full_block(i, j) = new_values(this_col, row_indices(i))
800 this_row = row_indices(i) - i0 + 1
801 IF (this_row >= 1 .AND. this_row <= nrow)
THEN
802 full_block(i, j) = new_values(this_col, this_row)
807 IF (i0 == 1 .AND. nrow_global == nrow)
THEN
809 full_block(i, j) = new_values(row_indices(i), this_col)
813 this_row = row_indices(i) - i0 + 1
814 IF (this_row >= 1 .AND. this_row <= nrow)
THEN
815 full_block(i, j) = new_values(this_row, this_col)
824 this_col = col_indices(j) - j0 + 1
825 IF (this_col >= 1 .AND. this_col <= ncol)
THEN
828 this_row = row_indices(i) - i0 + 1
829 IF (this_row >= 1 .AND. this_row <= nrow)
THEN
830 full_block(i, j) = al*new_values(this_col, this_row) + &
836 this_row = row_indices(i) - i0 + 1
837 IF (this_row >= 1 .AND. this_row <= nrow)
THEN
838 full_block(i, j) = al*new_values(this_row, this_col) + &
923 start_col, n_rows, n_cols, transpose)
925 REAL(kind=
dp),
DIMENSION(:, :),
INTENT(out) :: target_m
926 INTEGER,
INTENT(in),
OPTIONAL :: start_row, start_col, n_rows, n_cols
927 LOGICAL,
INTENT(in),
OPTIONAL :: transpose
929 CHARACTER(LEN=*),
PARAMETER :: routinen =
'cp_fm_get_submatrix'
931 INTEGER :: handle, i, i0, j, j0, ncol, ncol_global, &
932 ncol_local, nrow, nrow_global, &
933 nrow_local, this_col, this_row
934 INTEGER,
DIMENSION(:),
POINTER :: col_indices, row_indices
936 REAL(kind=
dp),
DIMENSION(:, :),
POINTER :: full_block
939 CALL timeset(routinen, handle)
941 i0 = 1; j0 = 1; tr_a = .false.
943 IF (
PRESENT(start_row)) i0 = start_row
944 IF (
PRESENT(start_col)) j0 = start_col
945 IF (
PRESENT(transpose)) tr_a = transpose
947 nrow =
SIZE(target_m, 2)
948 ncol =
SIZE(target_m, 1)
950 nrow =
SIZE(target_m, 1)
951 ncol =
SIZE(target_m, 2)
953 IF (
PRESENT(n_rows)) nrow = n_rows
954 IF (
PRESENT(n_cols)) ncol = n_cols
956 para_env => fm%matrix_struct%para_env
958 full_block => fm%local_data
959#if defined(__parallel)
961 IF (
SIZE(target_m, 1)*
SIZE(target_m, 2) /= 0)
THEN
962 CALL dcopy(
SIZE(target_m, 1)*
SIZE(target_m, 2), [0.0_dp], 0, target_m, 1)
967 nrow_global=nrow_global, ncol_global=ncol_global, &
968 nrow_local=nrow_local, ncol_local=ncol_local, &
969 row_indices=row_indices, col_indices=col_indices)
972 this_col = col_indices(j) - j0 + 1
973 IF (this_col >= 1 .AND. this_col <= ncol)
THEN
975 IF (i0 == 1 .AND. nrow_global == nrow)
THEN
977 target_m(this_col, row_indices(i)) = full_block(i, j)
981 this_row = row_indices(i) - i0 + 1
982 IF (this_row >= 1 .AND. this_row <= nrow)
THEN
983 target_m(this_col, this_row) = full_block(i, j)
988 IF (i0 == 1 .AND. nrow_global == nrow)
THEN
990 target_m(row_indices(i), this_col) = full_block(i, j)
994 this_row = row_indices(i) - i0 + 1
995 IF (this_row >= 1 .AND. this_row <= nrow)
THEN
996 target_m(this_row, this_col) = full_block(i, j)
1004 CALL para_env%sum(target_m)
1006 CALL timestop(handle)
1034 nrow_block, ncol_block, nrow_local, ncol_local, &
1035 row_indices, col_indices, local_data, context, &
1036 nrow_locals, ncol_locals, matrix_struct, para_env)
1039 CHARACTER(LEN=*),
INTENT(OUT),
OPTIONAL :: name
1040 INTEGER,
INTENT(OUT),
OPTIONAL :: nrow_global, ncol_global, nrow_block, &
1041 ncol_block, nrow_local, ncol_local
1042 INTEGER,
DIMENSION(:),
OPTIONAL,
POINTER :: row_indices, col_indices
1043 REAL(kind=
dp),
CONTIGUOUS,
DIMENSION(:, :), &
1044 OPTIONAL,
POINTER :: local_data
1046 INTEGER,
DIMENSION(:),
OPTIONAL,
POINTER :: nrow_locals, ncol_locals
1050 IF (
PRESENT(name)) name = matrix%name
1051 IF (
PRESENT(matrix_struct)) matrix_struct => matrix%matrix_struct
1052 IF (
PRESENT(local_data)) local_data => matrix%local_data
1055 ncol_local=ncol_local, nrow_global=nrow_global, &
1056 ncol_global=ncol_global, nrow_block=nrow_block, &
1057 ncol_block=ncol_block, row_indices=row_indices, &
1058 col_indices=col_indices, nrow_locals=nrow_locals, &
1059 ncol_locals=ncol_locals, context=context, para_env=para_env)
1086 REAL(kind=
dp),
INTENT(OUT) :: a_max
1087 INTEGER,
INTENT(OUT),
OPTIONAL :: ir_max, ic_max
1089 CHARACTER(LEN=*),
PARAMETER :: routinen =
'cp_fm_maxabsval'
1091 INTEGER :: handle, i, ic_max_local, ir_max_local, &
1092 j, mepos, ncol_local, nrow_local, &
1094 INTEGER,
ALLOCATABLE,
DIMENSION(:) :: ic_max_vec, ir_max_vec
1095 INTEGER,
DIMENSION(:),
POINTER :: col_indices, row_indices
1097 REAL(
dp),
ALLOCATABLE,
DIMENSION(:) :: a_max_vec
1098 REAL(kind=
dp),
DIMENSION(:, :),
POINTER :: my_block
1100 CALL timeset(routinen, handle)
1102 my_block => matrix%local_data
1104 CALL cp_fm_get_info(matrix, nrow_local=nrow_local, ncol_local=ncol_local, &
1105 row_indices=row_indices, col_indices=col_indices)
1107 a_max = maxval(abs(my_block(1:nrow_local, 1:ncol_local)))
1109 IF (
PRESENT(ir_max))
THEN
1110 num_pe = matrix%matrix_struct%para_env%num_pe
1111 mepos = matrix%matrix_struct%para_env%mepos
1112 ALLOCATE (ir_max_vec(0:num_pe - 1))
1113 ir_max_vec(0:num_pe - 1) = 0
1114 ALLOCATE (ic_max_vec(0:num_pe - 1))
1115 ic_max_vec(0:num_pe - 1) = 0
1116 ALLOCATE (a_max_vec(0:num_pe - 1))
1117 a_max_vec(0:num_pe - 1) = 0.0_dp
1120 IF ((ncol_local > 0) .AND. (nrow_local > 0))
THEN
1121 DO i = 1, ncol_local
1122 DO j = 1, nrow_local
1123 IF (abs(my_block(j, i)) > my_max)
THEN
1124 my_max = my_block(j, i)
1131 a_max_vec(mepos) = my_max
1132 ir_max_vec(mepos) = row_indices(ir_max_local)
1133 ic_max_vec(mepos) = col_indices(ic_max_local)
1137 CALL matrix%matrix_struct%para_env%sum(a_max_vec)
1138 CALL matrix%matrix_struct%para_env%sum(ir_max_vec)
1139 CALL matrix%matrix_struct%para_env%sum(ic_max_vec)
1142 DO i = 0, num_pe - 1
1143 IF (a_max_vec(i) > my_max)
THEN
1144 ir_max = ir_max_vec(i)
1145 ic_max = ic_max_vec(i)
1149 DEALLOCATE (ir_max_vec, ic_max_vec, a_max_vec)
1150 cpassert(ic_max > 0)
1151 cpassert(ir_max > 0)
1155 CALL matrix%matrix_struct%para_env%max(a_max)
1157 CALL timestop(handle)
1548 TYPE(
cp_fm_type),
INTENT(IN) :: source, destination
1552 CHARACTER(LEN=*),
PARAMETER :: routinen =
'cp_fm_start_copy_general'
1554 INTEGER :: dest_p_i, dest_q_j, global_rank, global_size, handle, i, j, k, mpi_rank, &
1555 ncol_block_dest, ncol_block_src, ncol_local_recv, ncol_local_send, ncols, &
1556 nrow_block_dest, nrow_block_src, nrow_local_recv, nrow_local_send, nrows, p, q, &
1557 recv_rank, recv_size, send_rank, send_size
1558 INTEGER,
ALLOCATABLE,
DIMENSION(:) :: all_ranks, dest2global, dest_p, dest_q, &
1559 recv_count, send_count, send_disp, &
1560 source2global, src_p, src_q
1561 INTEGER,
ALLOCATABLE,
DIMENSION(:, :) :: dest_blacs2mpi
1562 INTEGER,
DIMENSION(2) :: dest_block, dest_block_tmp, dest_num_pe, &
1563 src_block, src_block_tmp, src_num_pe
1564 INTEGER,
DIMENSION(:),
POINTER :: recv_col_indices, recv_row_indices, &
1565 send_col_indices, send_row_indices
1569 CALL timeset(routinen, handle)
1573 nrow_local_send =
SIZE(source%local_data, 1)
1574 ncol_local_send =
SIZE(source%local_data, 2)
1575 ALLOCATE (info%send_buf(nrow_local_send*ncol_local_send))
1577 DO j = 1, ncol_local_send
1578 DO i = 1, nrow_local_send
1580 info%send_buf(k) = source%local_data(i, j)
1584 NULLIFY (recv_dist, send_dist)
1585 NULLIFY (recv_col_indices, recv_row_indices, send_col_indices, send_row_indices)
1588 global_size = para_env%num_pe
1589 global_rank = para_env%mepos
1595 IF (
ASSOCIATED(destination%matrix_struct))
THEN
1596 recv_dist => destination%matrix_struct
1597 recv_rank = recv_dist%para_env%mepos
1602 IF (
ASSOCIATED(source%matrix_struct))
THEN
1603 send_dist => source%matrix_struct
1604 send_rank = send_dist%para_env%mepos
1610 ALLOCATE (all_ranks(0:global_size - 1))
1612 CALL para_env%allgather(send_rank, all_ranks)
1613 IF (
ASSOCIATED(recv_dist))
THEN
1614 ALLOCATE (source2global(0:count(all_ranks /=
mp_proc_null) - 1))
1615 DO i = 0, global_size - 1
1617 source2global(all_ranks(i)) = i
1622 CALL para_env%allgather(recv_rank, all_ranks)
1623 IF (
ASSOCIATED(send_dist))
THEN
1624 ALLOCATE (dest2global(0:count(all_ranks /=
mp_proc_null) - 1))
1625 DO i = 0, global_size - 1
1627 dest2global(all_ranks(i)) = i
1631 DEALLOCATE (all_ranks)
1638 IF (global_rank == 0)
THEN
1640 CALL para_env%irecv(src_block,
mp_any_source, recv_req(1), tag=src_tag)
1641 CALL para_env%irecv(dest_block,
mp_any_source, recv_req(2), tag=dest_tag)
1642 CALL para_env%irecv(src_num_pe,
mp_any_source, recv_req(3), tag=src_tag)
1643 CALL para_env%irecv(dest_num_pe,
mp_any_source, recv_req(4), tag=dest_tag)
1646 IF (
ASSOCIATED(send_dist))
THEN
1647 IF ((send_rank == 0))
THEN
1649 src_block_tmp = [send_dist%nrow_block, send_dist%ncol_block]
1650 CALL para_env%isend(src_block_tmp, 0, send_req(1), tag=src_tag)
1651 CALL para_env%isend(send_dist%context%num_pe, 0, send_req(2), tag=src_tag)
1655 IF (
ASSOCIATED(recv_dist))
THEN
1656 IF ((recv_rank == 0))
THEN
1657 dest_block_tmp = [recv_dist%nrow_block, recv_dist%ncol_block]
1658 CALL para_env%isend(dest_block_tmp, 0, send_req(3), tag=dest_tag)
1659 CALL para_env%isend(recv_dist%context%num_pe, 0, send_req(4), tag=dest_tag)
1663 IF (global_rank == 0)
THEN
1666 ALLOCATE (info%src_blacs2mpi(0:src_num_pe(1) - 1, 0:src_num_pe(2) - 1), &
1667 dest_blacs2mpi(0:dest_num_pe(1) - 1, 0:dest_num_pe(2) - 1) &
1669 CALL para_env%irecv(info%src_blacs2mpi,
mp_any_source, recv_req(5), tag=src_tag)
1670 CALL para_env%irecv(dest_blacs2mpi,
mp_any_source, recv_req(6), tag=dest_tag)
1673 IF (
ASSOCIATED(send_dist))
THEN
1674 IF ((send_rank == 0))
THEN
1675 CALL para_env%isend(send_dist%context%blacs2mpi(:, :), 0, send_req(5), tag=src_tag)
1679 IF (
ASSOCIATED(recv_dist))
THEN
1680 IF ((recv_rank == 0))
THEN
1681 CALL para_env%isend(recv_dist%context%blacs2mpi(:, :), 0, send_req(6), tag=dest_tag)
1685 IF (global_rank == 0)
THEN
1690 CALL para_env%bcast(src_block, 0)
1691 CALL para_env%bcast(dest_block, 0)
1692 CALL para_env%bcast(src_num_pe, 0)
1693 CALL para_env%bcast(dest_num_pe, 0)
1694 info%src_num_pe(1:2) = src_num_pe(1:2)
1695 info%nblock_src(1:2) = src_block(1:2)
1696 IF (global_rank /= 0)
THEN
1697 ALLOCATE (info%src_blacs2mpi(0:src_num_pe(1) - 1, 0:src_num_pe(2) - 1), &
1698 dest_blacs2mpi(0:dest_num_pe(1) - 1, 0:dest_num_pe(2) - 1) &
1701 CALL para_env%bcast(info%src_blacs2mpi, 0)
1702 CALL para_env%bcast(dest_blacs2mpi, 0)
1704 recv_size = dest_num_pe(1)*dest_num_pe(2)
1705 send_size = src_num_pe(1)*src_num_pe(2)
1706 info%send_size = send_size
1724 IF (
ASSOCIATED(recv_dist))
THEN
1726 col_indices=recv_col_indices &
1728 info%recv_col_indices => recv_col_indices
1729 info%recv_row_indices => recv_row_indices
1730 nrow_block_src = src_block(1)
1731 ncol_block_src = src_block(2)
1732 ALLOCATE (recv_count(0:send_size - 1), info%recv_disp(0:send_size - 1), info%recv_request(0:send_size - 1))
1735 nrow_local_recv = recv_dist%nrow_locals(recv_dist%context%mepos(1))
1736 ncol_local_recv = recv_dist%ncol_locals(recv_dist%context%mepos(2))
1737 info%nlocal_recv(1) = nrow_local_recv
1738 info%nlocal_recv(2) = ncol_local_recv
1740 ALLOCATE (src_p(nrow_local_recv), src_q(ncol_local_recv))
1741 DO i = 1, nrow_local_recv
1744 src_p(i) = mod(((recv_row_indices(i) - 1)/nrow_block_src), src_num_pe(1))
1746 DO j = 1, ncol_local_recv
1748 src_q(j) = mod(((recv_col_indices(j) - 1)/ncol_block_src), src_num_pe(2))
1752 DO q = 0, src_num_pe(2) - 1
1753 ncols = count(src_q == q)
1754 DO p = 0, src_num_pe(1) - 1
1755 nrows = count(src_p == p)
1757 recv_count(info%src_blacs2mpi(p, q)) = nrows*ncols
1760 DEALLOCATE (src_p, src_q)
1764 ALLOCATE (info%recv_buf(sum(recv_count(:))))
1765 info%recv_disp(0) = 0
1766 DO i = 1, send_size - 1
1767 info%recv_disp(i) = info%recv_disp(i - 1) + recv_count(i - 1)
1771 DO k = 0, send_size - 1
1772 IF (recv_count(k) > 0)
THEN
1773 CALL para_env%irecv(info%recv_buf(info%recv_disp(k) + 1:info%recv_disp(k) + recv_count(k)), &
1774 source2global(k), info%recv_request(k))
1777 DEALLOCATE (source2global)
1781 IF (
ASSOCIATED(send_dist))
THEN
1783 col_indices=send_col_indices &
1785 nrow_block_dest = dest_block(1)
1786 ncol_block_dest = dest_block(2)
1787 ALLOCATE (send_count(0:recv_size - 1), send_disp(0:recv_size - 1), info%send_request(0:recv_size - 1))
1790 nrow_local_send = send_dist%nrow_locals(send_dist%context%mepos(1))
1791 ncol_local_send = send_dist%ncol_locals(send_dist%context%mepos(2))
1795 ALLOCATE (dest_p(nrow_local_send), dest_q(ncol_local_send))
1797 DO i = 1, nrow_local_send
1799 dest_p(i) = mod(((send_row_indices(i) - 1)/nrow_block_dest), dest_num_pe(1))
1801 DO j = 1, ncol_local_send
1802 dest_q(j) = mod(((send_col_indices(j) - 1)/ncol_block_dest), dest_num_pe(2))
1806 DO q = 0, dest_num_pe(2) - 1
1807 ncols = count(dest_q == q)
1808 DO p = 0, dest_num_pe(1) - 1
1809 nrows = count(dest_p == p)
1810 send_count(dest_blacs2mpi(p, q)) = nrows*ncols
1813 DEALLOCATE (dest_p, dest_q)
1816 ALLOCATE (info%send_buf(sum(send_count(:))))
1818 DO k = 1, recv_size - 1
1819 send_disp(k) = send_disp(k - 1) + send_count(k - 1)
1824 DO j = 1, ncol_local_send
1826 dest_q_j = mod(((send_col_indices(j) - 1)/ncol_block_dest), dest_num_pe(2))
1827 DO i = 1, nrow_local_send
1828 dest_p_i = mod(((send_row_indices(i) - 1)/nrow_block_dest), dest_num_pe(1))
1829 mpi_rank = dest_blacs2mpi(dest_p_i, dest_q_j)
1830 send_count(mpi_rank) = send_count(mpi_rank) + 1
1831 info%send_buf(send_disp(mpi_rank) + send_count(mpi_rank)) = source%local_data(i, j)
1836 DO k = 0, recv_size - 1
1837 IF (send_count(k) > 0)
THEN
1838 CALL para_env%isend(info%send_buf(send_disp(k) + 1:send_disp(k) + send_count(k)), &
1839 dest2global(k), info%send_request(k))
1842 DEALLOCATE (send_count, send_disp, dest2global)
1844 DEALLOCATE (dest_blacs2mpi)
1848 CALL timestop(handle)
1861 CHARACTER(LEN=*),
PARAMETER :: routinen =
'cp_fm_finish_copy_general'
1863 INTEGER :: handle, i, j, k, mpi_rank, send_size, &
1865 INTEGER,
ALLOCATABLE,
DIMENSION(:) :: recv_count
1866 INTEGER,
DIMENSION(2) :: nblock_src, nlocal_recv, src_num_pe
1867 INTEGER,
DIMENSION(:),
POINTER :: recv_col_indices, recv_row_indices
1869 CALL timeset(routinen, handle)
1874 DO j = 1,
SIZE(destination%local_data, 2)
1875 DO i = 1,
SIZE(destination%local_data, 1)
1877 destination%local_data(i, j) = info%send_buf(k)
1880 DEALLOCATE (info%send_buf)
1883 send_size = info%send_size
1884 nlocal_recv(1:2) = info%nlocal_recv(:)
1885 nblock_src(1:2) = info%nblock_src(:)
1886 src_num_pe(1:2) = info%src_num_pe(:)
1887 recv_col_indices => info%recv_col_indices
1888 recv_row_indices => info%recv_row_indices
1893 ALLOCATE (recv_count(0:send_size - 1))
1897 DO j = 1, nlocal_recv(2)
1898 src_q_j = mod(((recv_col_indices(j) - 1)/nblock_src(2)), src_num_pe(2))
1899 DO i = 1, nlocal_recv(1)
1900 src_p_i = mod(((recv_row_indices(i) - 1)/nblock_src(1)), src_num_pe(1))
1901 mpi_rank = info%src_blacs2mpi(src_p_i, src_q_j)
1902 recv_count(mpi_rank) = recv_count(mpi_rank) + 1
1903 destination%local_data(i, j) = info%recv_buf(info%recv_disp(mpi_rank) + recv_count(mpi_rank))
1906 DEALLOCATE (recv_count, info%recv_disp, info%recv_request, info%recv_buf, info%src_blacs2mpi)
1908 NULLIFY (info%recv_col_indices, &
1909 info%recv_row_indices)
1913 CALL timestop(handle)
2122 INTEGER,
INTENT(IN) :: unit
2124 CHARACTER(LEN=*),
PARAMETER :: routinen =
'cp_fm_write_unformatted'
2126 INTEGER :: handle, j, max_block, &
2127 ncol_global, nrow_global
2129#if defined(__parallel)
2130 INTEGER :: i, i_block, icol_local, &
2132 iprow, irow_local, &
2135 INTEGER,
DIMENSION(9) :: desc
2136 REAL(kind=
dp),
DIMENSION(:),
POINTER :: vecbuf
2137 REAL(kind=
dp),
DIMENSION(:, :),
POINTER :: newdat
2139 INTEGER,
EXTERNAL :: numroc
2142 CALL timeset(routinen, handle)
2143 CALL cp_fm_get_info(fm, nrow_global=nrow_global, ncol_global=ncol_global, ncol_block=max_block, &
2146#if defined(__parallel)
2147 num_pe = para_env%num_pe
2148 mepos = para_env%mepos
2152 CALL ictxt_loc%gridinit(para_env,
'R', 1, num_pe)
2153 CALL descinit(desc, nrow_global, ncol_global, rb, max_block, 0, 0, ictxt_loc%get_handle(), nrow_global, info)
2155 associate(nprow => ictxt_loc%num_pe(1), npcol => ictxt_loc%num_pe(2), &
2156 myprow => ictxt_loc%mepos(1), mypcol => ictxt_loc%mepos(2))
2157 in = numroc(ncol_global, max_block, mypcol, 0, npcol)
2159 ALLOCATE (newdat(nrow_global, max(1, in)))
2162 CALL pdgemr2d(nrow_global, ncol_global, fm%local_data, 1, 1, &
2163 fm%matrix_struct%descriptor, &
2164 newdat, 1, 1, desc, ictxt_loc%get_handle())
2166 ALLOCATE (vecbuf(nrow_global*max_block))
2167 vecbuf = huge(1.0_dp)
2169 DO i = 1, ncol_global, max(max_block, 1)
2170 i_block = min(max_block, ncol_global - i + 1)
2171 CALL infog2l(1, i, desc, nprow, npcol, myprow, mypcol, &
2172 irow_local, icol_local, iprow, ipcol)
2173 IF (ipcol == mypcol)
THEN
2175 vecbuf((j - 1)*nrow_global + 1:nrow_global*j) = newdat(:, icol_local + j - 1)
2179 IF (ipcol == 0)
THEN
2182 IF (ipcol == mypcol)
THEN
2183 CALL para_env%send(vecbuf(:), 0, tag)
2185 IF (mypcol == 0)
THEN
2186 CALL para_env%recv(vecbuf(:), ipcol, tag)
2192 WRITE (unit) vecbuf((j - 1)*nrow_global + 1:nrow_global*j)
2200 CALL ictxt_loc%gridexit()
2207 DO j = 1, ncol_global
2208 WRITE (unit) fm%local_data(:, j)
2213 CALL timestop(handle)
2226 INTEGER,
INTENT(IN) :: unit
2227 CHARACTER(LEN=*),
INTENT(IN),
OPTIONAL ::
header, value_format
2229 CHARACTER(LEN=*),
PARAMETER :: routinen =
'cp_fm_write_formatted'
2231 CHARACTER(LEN=21) :: my_value_format
2232 INTEGER :: handle, i, j, max_block, &
2233 ncol_global, nrow_global
2234 TYPE(mp_para_env_type),
POINTER :: para_env
2235#if defined(__parallel)
2236 INTEGER :: i_block, icol_local, &
2238 iprow, irow_local, &
2239 mepos, num_pe, rb, tag, k, &
2241 INTEGER,
DIMENSION(9) :: desc
2242 REAL(kind=dp),
DIMENSION(:),
POINTER :: vecbuf
2243 REAL(kind=dp),
DIMENSION(:, :),
POINTER :: newdat
2244 TYPE(cp_blacs_type) :: ictxt_loc
2245 INTEGER,
EXTERNAL :: numroc
2248 CALL timeset(routinen, handle)
2249 CALL cp_fm_get_info(fm, nrow_global=nrow_global, ncol_global=ncol_global, ncol_block=max_block, &
2252 IF (
PRESENT(value_format))
THEN
2253 cpassert(len_trim(adjustl(value_format)) < 11)
2254 my_value_format =
"(I10, I10, "//trim(adjustl(value_format))//
")"
2256 my_value_format =
"(I10, I10, ES24.12)"
2261 WRITE (unit,
"(A2, A8, A10, A24)")
"#",
"Row",
"Column", adjustl(
"Value")
2264#if defined(__parallel)
2265 num_pe = para_env%num_pe
2266 mepos = para_env%mepos
2270 CALL ictxt_loc%gridinit(para_env,
'R', 1, num_pe)
2271 CALL descinit(desc, nrow_global, ncol_global, rb, max_block, 0, 0, ictxt_loc%get_handle(), nrow_global, info)
2273 associate(nprow => ictxt_loc%num_pe(1), npcol => ictxt_loc%num_pe(2), &
2274 myprow => ictxt_loc%mepos(1), mypcol => ictxt_loc%mepos(2))
2275 in = numroc(ncol_global, max_block, mypcol, 0, npcol)
2277 ALLOCATE (newdat(nrow_global, max(1, in)))
2280 CALL pdgemr2d(nrow_global, ncol_global, fm%local_data, 1, 1, &
2281 fm%matrix_struct%descriptor, &
2282 newdat, 1, 1, desc, ictxt_loc%get_handle())
2284 ALLOCATE (vecbuf(nrow_global*max_block))
2285 vecbuf = huge(1.0_dp)
2289 DO i = 1, ncol_global, max(max_block, 1)
2290 i_block = min(max_block, ncol_global - i + 1)
2291 CALL infog2l(1, i, desc, nprow, npcol, myprow, mypcol, &
2292 irow_local, icol_local, iprow, ipcol)
2293 IF (ipcol == mypcol)
THEN
2295 vecbuf((j - 1)*nrow_global + 1:nrow_global*j) = newdat(:, icol_local + j - 1)
2299 IF (ipcol == 0)
THEN
2302 IF (ipcol == mypcol)
THEN
2303 CALL para_env%send(vecbuf(:), 0, tag)
2305 IF (mypcol == 0)
THEN
2306 CALL para_env%recv(vecbuf(:), ipcol, tag)
2312 DO k = (j - 1)*nrow_global + 1, nrow_global*j
2313 WRITE (unit=unit, fmt=my_value_format) irow, icol, vecbuf(k)
2315 IF (irow > nrow_global)
THEN
2327 CALL ictxt_loc%gridexit()
2334 DO j = 1, ncol_global
2335 DO i = 1, nrow_global
2336 WRITE (unit=unit, fmt=my_value_format) i, j, fm%local_data(i, j)
2342 CALL timestop(handle)