357 COMPLEX(kind=dp),
DIMENSION(:, :),
INTENT(out) :: target_m
358 INTEGER,
INTENT(in),
OPTIONAL :: start_row, start_col, n_rows, n_cols
359 LOGICAL,
INTENT(in),
OPTIONAL :: transpose
361 CHARACTER(len=*),
PARAMETER :: routinen =
'cp_cfm_get_submatrix'
363 COMPLEX(kind=dp),
DIMENSION(:, :),
POINTER :: local_data
364 INTEGER :: end_col_global, end_col_local, end_row_global, end_row_local, handle, i, j, &
365 ncol_global, ncol_local, nrow_global, nrow_local, start_col_global, start_col_local, &
366 start_row_global, start_row_local, this_col
367 INTEGER,
DIMENSION(:),
POINTER :: col_indices, row_indices
368 LOGICAL :: do_zero, tr_a
371 CALL timeset(routinen, handle)
373 IF (
SIZE(target_m) /= 0)
THEN
374#if defined(__parallel)
381 IF (
PRESENT(transpose)) tr_a = transpose
386 IF (
PRESENT(start_row)) start_row_global = start_row
387 IF (
PRESENT(start_col)) start_col_global = start_col
390 end_row_global =
SIZE(target_m, 2)
391 end_col_global =
SIZE(target_m, 1)
393 end_row_global =
SIZE(target_m, 1)
394 end_col_global =
SIZE(target_m, 2)
396 IF (
PRESENT(n_rows)) end_row_global = n_rows
397 IF (
PRESENT(n_cols)) end_col_global = n_cols
399 end_row_global = end_row_global + start_row_global - 1
400 end_col_global = end_col_global + start_col_global - 1
403 nrow_global=nrow_global, ncol_global=ncol_global, &
404 nrow_local=nrow_local, ncol_local=ncol_local, &
405 row_indices=row_indices, col_indices=col_indices)
406 IF (end_row_global > nrow_global)
THEN
407 end_row_global = nrow_global
410 IF (end_col_global > ncol_global)
THEN
411 end_col_global = ncol_global
417 DO start_row_local = 1, nrow_local
418 IF (row_indices(start_row_local) >= start_row_global)
EXIT
421 DO end_row_local = start_row_local, nrow_local
422 IF (row_indices(end_row_local) > end_row_global)
EXIT
424 end_row_local = end_row_local - 1
426 DO start_col_local = 1, ncol_local
427 IF (col_indices(start_col_local) >= start_col_global)
EXIT
430 DO end_col_local = start_col_local, ncol_local
431 IF (col_indices(end_col_local) > end_col_global)
EXIT
433 end_col_local = end_col_local - 1
435 para_env => fm%matrix_struct%para_env
436 local_data => fm%local_data
443 CALL zcopy(
SIZE(target_m),
z_zero, 0, target_m(1, 1), 1)
446 DO j = start_col_local, end_col_local
447 this_col = col_indices(j) - start_col_global + 1
448 DO i = start_row_local, end_row_local
449 target_m(this_col, row_indices(i) - start_row_global + 1) = local_data(i, j)
453 DO j = start_col_local, end_col_local
454 this_col = col_indices(j) - start_col_global + 1
455 DO i = start_row_local, end_row_local
456 target_m(row_indices(i) - start_row_global + 1, this_col) = local_data(i, j)
461 CALL para_env%sum(target_m)
464 CALL timestop(handle)
492 start_col, n_rows, n_cols, alpha, beta, transpose)
494 COMPLEX(kind=dp),
DIMENSION(:, :),
INTENT(in) :: new_values
495 INTEGER,
INTENT(in),
OPTIONAL :: start_row, start_col, n_rows, n_cols
496 COMPLEX(kind=dp),
INTENT(in),
OPTIONAL :: alpha, beta
497 LOGICAL,
INTENT(in),
OPTIONAL :: transpose
499 CHARACTER(len=*),
PARAMETER :: routinen =
'cp_cfm_set_submatrix'
501 COMPLEX(kind=dp) :: al, be
502 COMPLEX(kind=dp),
DIMENSION(:, :),
POINTER :: local_data
503 INTEGER :: end_col_global, end_col_local, end_row_global, end_row_local, handle, i, j, &
504 ncol_global, ncol_local, nrow_global, nrow_local, start_col_global, start_col_local, &
505 start_row_global, start_row_local, this_col
506 INTEGER,
DIMENSION(:),
POINTER :: col_indices, row_indices
509 CALL timeset(routinen, handle)
513 IF (
PRESENT(alpha)) al = alpha
514 IF (
PRESENT(beta)) be = beta
519 IF (
PRESENT(start_row)) start_row_global = start_row
520 IF (
PRESENT(start_col)) start_col_global = start_col
523 IF (
PRESENT(transpose)) tr_a = transpose
526 end_row_global =
SIZE(new_values, 2)
527 end_col_global =
SIZE(new_values, 1)
529 end_row_global =
SIZE(new_values, 1)
530 end_col_global =
SIZE(new_values, 2)
532 IF (
PRESENT(n_rows)) end_row_global = n_rows
533 IF (
PRESENT(n_cols)) end_col_global = n_cols
535 end_row_global = end_row_global + start_row_global - 1
536 end_col_global = end_col_global + start_col_global - 1
539 nrow_global=nrow_global, ncol_global=ncol_global, &
540 nrow_local=nrow_local, ncol_local=ncol_local, &
541 row_indices=row_indices, col_indices=col_indices)
542 IF (end_row_global > nrow_global) end_row_global = nrow_global
543 IF (end_col_global > ncol_global) end_col_global = ncol_global
547 DO start_row_local = 1, nrow_local
548 IF (row_indices(start_row_local) >= start_row_global)
EXIT
551 DO end_row_local = start_row_local, nrow_local
552 IF (row_indices(end_row_local) > end_row_global)
EXIT
554 end_row_local = end_row_local - 1
556 DO start_col_local = 1, ncol_local
557 IF (col_indices(start_col_local) >= start_col_global)
EXIT
560 DO end_col_local = start_col_local, ncol_local
561 IF (col_indices(end_col_local) > end_col_global)
EXIT
563 end_col_local = end_col_local - 1
565 local_data => matrix%local_data
569 DO j = start_col_local, end_col_local
570 this_col = col_indices(j) - start_col_global + 1
571 DO i = start_row_local, end_row_local
572 local_data(i, j) = new_values(this_col, row_indices(i) - start_row_global + 1)
576 DO j = start_col_local, end_col_local
577 this_col = col_indices(j) - start_col_global + 1
578 DO i = start_row_local, end_row_local
579 local_data(i, j) = new_values(row_indices(i) - start_row_global + 1, this_col)
585 DO j = start_col_local, end_col_local
586 this_col = col_indices(j) - start_col_global + 1
587 DO i = start_row_local, end_row_local
588 local_data(i, j) = al*new_values(this_col, row_indices(i) - start_row_global + 1) + &
593 DO j = start_col_local, end_col_local
594 this_col = col_indices(j) - start_col_global + 1
595 DO i = start_row_local, end_row_local
596 local_data(i, j) = al*new_values(row_indices(i) - start_row_global + 1, this_col) + &
603 CALL timestop(handle)
902 TYPE(
cp_cfm_type),
INTENT(IN) :: source, destination
906 CHARACTER(len=*),
PARAMETER :: routinen =
'cp_cfm_start_copy_general'
908 INTEGER :: dest_p_i, dest_q_j, global_rank, global_size, handle, i, j, k, mpi_rank, &
909 ncol_block_dest, ncol_block_src, ncol_local_recv, ncol_local_send, ncols, &
910 nrow_block_dest, nrow_block_src, nrow_local_recv, nrow_local_send, nrows, p, q, &
911 recv_rank, recv_size, send_rank, send_size
912 INTEGER,
ALLOCATABLE,
DIMENSION(:) :: all_ranks, dest2global, dest_p, dest_q, &
913 recv_count, send_count, send_disp, &
914 source2global, src_p, src_q
915 INTEGER,
ALLOCATABLE,
DIMENSION(:, :) :: dest_blacs2mpi
916 INTEGER,
DIMENSION(2) :: dest_block, dest_block_tmp, dest_num_pe, &
917 src_block, src_block_tmp, src_num_pe
918 INTEGER,
DIMENSION(:),
POINTER :: recv_col_indices, recv_row_indices, &
919 send_col_indices, send_row_indices
923 CALL timeset(routinen, handle)
927 nrow_local_send =
SIZE(source%local_data, 1)
928 ncol_local_send =
SIZE(source%local_data, 2)
929 ALLOCATE (info%send_buf(nrow_local_send*ncol_local_send))
931 DO j = 1, ncol_local_send
932 DO i = 1, nrow_local_send
934 info%send_buf(k) = source%local_data(i, j)
938 NULLIFY (recv_dist, send_dist)
939 NULLIFY (recv_col_indices, recv_row_indices, send_col_indices, send_row_indices)
942 global_size = para_env%num_pe
943 global_rank = para_env%mepos
949 IF (
ASSOCIATED(destination%matrix_struct))
THEN
950 recv_dist => destination%matrix_struct
951 recv_rank = recv_dist%para_env%mepos
956 IF (
ASSOCIATED(source%matrix_struct))
THEN
957 send_dist => source%matrix_struct
958 send_rank = send_dist%para_env%mepos
964 ALLOCATE (all_ranks(0:global_size - 1))
966 CALL para_env%allgather(send_rank, all_ranks)
967 IF (
ASSOCIATED(destination%matrix_struct))
THEN
968 ALLOCATE (source2global(0:count(all_ranks /=
mp_proc_null) - 1))
969 DO i = 0, global_size - 1
971 source2global(all_ranks(i)) = i
976 CALL para_env%allgather(recv_rank, all_ranks)
977 IF (
ASSOCIATED(source%matrix_struct))
THEN
978 ALLOCATE (dest2global(0:count(all_ranks /=
mp_proc_null) - 1))
979 DO i = 0, global_size - 1
981 dest2global(all_ranks(i)) = i
985 DEALLOCATE (all_ranks)
992 IF (global_rank == 0)
THEN
994 CALL para_env%irecv(src_block,
mp_any_source, recv_req(1), tag=src_tag)
995 CALL para_env%irecv(dest_block,
mp_any_source, recv_req(2), tag=dest_tag)
996 CALL para_env%irecv(src_num_pe,
mp_any_source, recv_req(3), tag=src_tag)
997 CALL para_env%irecv(dest_num_pe,
mp_any_source, recv_req(4), tag=dest_tag)
1000 IF (
ASSOCIATED(source%matrix_struct))
THEN
1001 IF ((send_rank == 0))
THEN
1003 src_block_tmp = [send_dist%nrow_block, send_dist%ncol_block]
1004 CALL para_env%isend(src_block_tmp, 0, send_req(1), tag=src_tag)
1005 CALL para_env%isend(send_dist%context%num_pe, 0, send_req(2), tag=src_tag)
1009 IF (
ASSOCIATED(destination%matrix_struct))
THEN
1010 IF ((recv_rank == 0))
THEN
1011 dest_block_tmp = [recv_dist%nrow_block, recv_dist%ncol_block]
1012 CALL para_env%isend(dest_block_tmp, 0, send_req(3), tag=dest_tag)
1013 CALL para_env%isend(recv_dist%context%num_pe, 0, send_req(4), tag=dest_tag)
1017 IF (global_rank == 0)
THEN
1020 ALLOCATE (info%src_blacs2mpi(0:src_num_pe(1) - 1, 0:src_num_pe(2) - 1), &
1021 dest_blacs2mpi(0:dest_num_pe(1) - 1, 0:dest_num_pe(2) - 1))
1022 CALL para_env%irecv(info%src_blacs2mpi,
mp_any_source, recv_req(5), tag=src_tag)
1023 CALL para_env%irecv(dest_blacs2mpi,
mp_any_source, recv_req(6), tag=dest_tag)
1026 IF (
ASSOCIATED(source%matrix_struct))
THEN
1027 IF ((send_rank == 0))
THEN
1028 CALL para_env%isend(send_dist%context%blacs2mpi(:, :), 0, send_req(5), tag=src_tag)
1032 IF (
ASSOCIATED(destination%matrix_struct))
THEN
1033 IF ((recv_rank == 0))
THEN
1034 CALL para_env%isend(recv_dist%context%blacs2mpi(:, :), 0, send_req(6), tag=dest_tag)
1038 IF (global_rank == 0)
THEN
1043 CALL para_env%bcast(src_block, 0)
1044 CALL para_env%bcast(dest_block, 0)
1045 CALL para_env%bcast(src_num_pe, 0)
1046 CALL para_env%bcast(dest_num_pe, 0)
1047 info%src_num_pe(1:2) = src_num_pe(1:2)
1048 info%nblock_src(1:2) = src_block(1:2)
1049 IF (global_rank /= 0)
THEN
1050 ALLOCATE (info%src_blacs2mpi(0:src_num_pe(1) - 1, 0:src_num_pe(2) - 1), &
1051 dest_blacs2mpi(0:dest_num_pe(1) - 1, 0:dest_num_pe(2) - 1))
1053 CALL para_env%bcast(info%src_blacs2mpi, 0)
1054 CALL para_env%bcast(dest_blacs2mpi, 0)
1056 recv_size = dest_num_pe(1)*dest_num_pe(2)
1057 send_size = src_num_pe(1)*src_num_pe(2)
1058 info%send_size = send_size
1076 IF (
ASSOCIATED(destination%matrix_struct))
THEN
1078 col_indices=recv_col_indices)
1079 info%recv_col_indices => recv_col_indices
1080 info%recv_row_indices => recv_row_indices
1081 nrow_block_src = src_block(1)
1082 ncol_block_src = src_block(2)
1083 ALLOCATE (recv_count(0:send_size - 1), info%recv_disp(0:send_size - 1), info%recv_request(0:send_size - 1))
1086 nrow_local_recv = recv_dist%nrow_locals(recv_dist%context%mepos(1))
1087 ncol_local_recv = recv_dist%ncol_locals(recv_dist%context%mepos(2))
1088 info%nlocal_recv(1) = nrow_local_recv
1089 info%nlocal_recv(2) = ncol_local_recv
1091 ALLOCATE (src_p(nrow_local_recv), src_q(ncol_local_recv))
1092 DO i = 1, nrow_local_recv
1095 src_p(i) = mod(((recv_row_indices(i) - 1)/nrow_block_src), src_num_pe(1))
1097 DO j = 1, ncol_local_recv
1099 src_q(j) = mod(((recv_col_indices(j) - 1)/ncol_block_src), src_num_pe(2))
1103 DO q = 0, src_num_pe(2) - 1
1104 ncols = count(src_q == q)
1105 DO p = 0, src_num_pe(1) - 1
1106 nrows = count(src_p == p)
1108 recv_count(info%src_blacs2mpi(p, q)) = nrows*ncols
1111 DEALLOCATE (src_p, src_q)
1115 ALLOCATE (info%recv_buf(sum(recv_count(:))))
1116 info%recv_disp(0) = 0
1117 DO i = 1, send_size - 1
1118 info%recv_disp(i) = info%recv_disp(i - 1) + recv_count(i - 1)
1122 DO k = 0, send_size - 1
1123 IF (recv_count(k) > 0)
THEN
1124 CALL para_env%irecv(info%recv_buf(info%recv_disp(k) + 1:info%recv_disp(k) + recv_count(k)), &
1125 source2global(k), info%recv_request(k))
1130 DEALLOCATE (source2global)
1134 IF (
ASSOCIATED(source%matrix_struct))
THEN
1136 col_indices=send_col_indices)
1137 nrow_block_dest = dest_block(1)
1138 ncol_block_dest = dest_block(2)
1139 ALLOCATE (send_count(0:recv_size - 1), send_disp(0:recv_size - 1), info%send_request(0:recv_size - 1))
1142 nrow_local_send = send_dist%nrow_locals(send_dist%context%mepos(1))
1143 ncol_local_send = send_dist%ncol_locals(send_dist%context%mepos(2))
1147 ALLOCATE (dest_p(nrow_local_send), dest_q(ncol_local_send))
1149 DO i = 1, nrow_local_send
1151 dest_p(i) = mod(((send_row_indices(i) - 1)/nrow_block_dest), dest_num_pe(1))
1153 DO j = 1, ncol_local_send
1154 dest_q(j) = mod(((send_col_indices(j) - 1)/ncol_block_dest), dest_num_pe(2))
1158 DO q = 0, dest_num_pe(2) - 1
1159 ncols = count(dest_q == q)
1160 DO p = 0, dest_num_pe(1) - 1
1161 nrows = count(dest_p == p)
1162 send_count(dest_blacs2mpi(p, q)) = nrows*ncols
1165 DEALLOCATE (dest_p, dest_q)
1168 ALLOCATE (info%send_buf(sum(send_count(:))))
1170 DO k = 1, recv_size - 1
1171 send_disp(k) = send_disp(k - 1) + send_count(k - 1)
1176 DO j = 1, ncol_local_send
1178 dest_q_j = mod(((send_col_indices(j) - 1)/ncol_block_dest), dest_num_pe(2))
1179 DO i = 1, nrow_local_send
1180 dest_p_i = mod(((send_row_indices(i) - 1)/nrow_block_dest), dest_num_pe(1))
1181 mpi_rank = dest_blacs2mpi(dest_p_i, dest_q_j)
1182 send_count(mpi_rank) = send_count(mpi_rank) + 1
1183 info%send_buf(send_disp(mpi_rank) + send_count(mpi_rank)) = source%local_data(i, j)
1188 DO k = 0, recv_size - 1
1189 IF (send_count(k) > 0)
THEN
1190 CALL para_env%isend(info%send_buf(send_disp(k) + 1:send_disp(k) + send_count(k)), &
1191 dest2global(k), info%send_request(k))
1196 DEALLOCATE (send_count, send_disp, dest2global)
1198 DEALLOCATE (dest_blacs2mpi)
1202 CALL timestop(handle)