/* -*- Mode: C; c-basic-offset:4 ; indent-tabs-mode:nil ; -*- */
/*
 *
 *  (C) 2014 by Argonne National Laboratory.
 *      See COPYRIGHT in top-level directory.
 */

#include <stdio.h>
#include <stdlib.h>
#include <mpi.h>
#include "mpitest.h"

/* Number of put/flush/get rounds performed by the origin process. */
#define ITER 100
/* Number of doubles in each process's window segment and in each buffer. */
#define BUF_CNT 4

/* local_buf holds the values the origin puts; check_buf receives the values
 * the origin reads back with MPI_Get for comparison against local_buf. */
double local_buf[BUF_CNT], check_buf[BUF_CNT];

/* Set to a non-zero value to enable diagnostic printf output. */
const int verbose = 0;

int main(int argc, char *argv[])
|
|
Packit |
0848f5 |
{
|
|
Packit |
0848f5 |
int rank, nproc, i, x;
|
|
Packit |
0848f5 |
int errors = 0, all_errors = 0;
|
|
Packit |
0848f5 |
MPI_Win win = MPI_WIN_NULL;
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
MPI_Comm shm_comm = MPI_COMM_NULL;
|
|
Packit |
0848f5 |
int shm_nproc, shm_rank;
|
|
Packit |
0848f5 |
double **shm_bases = NULL, *my_base;
|
|
Packit |
0848f5 |
MPI_Win shm_win = MPI_WIN_NULL;
|
|
Packit |
0848f5 |
MPI_Group shm_group = MPI_GROUP_NULL, world_group = MPI_GROUP_NULL;
|
|
Packit |
0848f5 |
int *shm_ranks = NULL, *shm_ranks_in_world = NULL;
|
|
Packit |
0848f5 |
MPI_Aint get_target_base_offsets = 0;
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
int win_size = sizeof(double) * BUF_CNT;
|
|
Packit |
0848f5 |
int new_win_size = win_size;
|
|
Packit |
0848f5 |
int win_unit = sizeof(double);
|
|
Packit |
0848f5 |
int shm_root_rank_in_world;
|
|
Packit |
0848f5 |
int origin = -1, put_target, get_target;
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
MPI_Init(&argc, &argv);
|
|
Packit |
0848f5 |
MPI_Comm_rank(MPI_COMM_WORLD, &rank;;
|
|
Packit |
0848f5 |
MPI_Comm_size(MPI_COMM_WORLD, &nproc);
|
|
Packit |
0848f5 |
MPI_Comm_group(MPI_COMM_WORLD, &world_group);
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
if (nproc != 4) {
|
|
Packit |
0848f5 |
if (rank == 0)
|
|
Packit |
0848f5 |
printf("Error: must be run with four processes\n");
|
|
Packit |
0848f5 |
MPI_Abort(MPI_COMM_WORLD, 1);
|
|
Packit |
0848f5 |
}
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
MPI_Comm_split_type(MPI_COMM_WORLD, MPI_COMM_TYPE_SHARED, rank, MPI_INFO_NULL, &shm_comm);
|
|
Packit |
0848f5 |
MPI_Comm_rank(shm_comm, &shm_rank);
|
|
Packit |
0848f5 |
MPI_Comm_size(shm_comm, &shm_nproc);
|
|
Packit |
0848f5 |
MPI_Comm_group(shm_comm, &shm_group);
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
/* Platform does not support shared memory or wrong host file, just return. */
|
|
Packit |
0848f5 |
if (shm_nproc != 2) {
|
|
Packit |
0848f5 |
goto exit;
|
|
Packit |
0848f5 |
}
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
shm_bases = (double **) calloc(shm_nproc, sizeof(double *));
|
|
Packit |
0848f5 |
shm_ranks = (int *) calloc(shm_nproc, sizeof(int));
|
|
Packit |
0848f5 |
shm_ranks_in_world = (int *) calloc(shm_nproc, sizeof(int));
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
if (shm_rank == 0)
|
|
Packit |
0848f5 |
shm_root_rank_in_world = rank;
|
|
Packit |
0848f5 |
MPI_Bcast(&shm_root_rank_in_world, 1, MPI_INT, 0, shm_comm);
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
/* Identify ranks of target processes which are located on node 0 */
|
|
Packit |
0848f5 |
if (rank == 0) {
|
|
Packit |
0848f5 |
for (i = 0; i < shm_nproc; i++) {
|
|
Packit |
0848f5 |
shm_ranks[i] = i;
|
|
Packit |
0848f5 |
}
|
|
Packit |
0848f5 |
MPI_Group_translate_ranks(shm_group, shm_nproc, shm_ranks, world_group, shm_ranks_in_world);
|
|
Packit |
0848f5 |
}
|
|
Packit |
0848f5 |
MPI_Bcast(shm_ranks_in_world, shm_nproc, MPI_INT, 0, MPI_COMM_WORLD);
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
put_target = shm_ranks_in_world[shm_nproc - 1];
|
|
Packit |
0848f5 |
get_target = shm_ranks_in_world[0];
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
/* Identify the rank of origin process which are located on node 1 */
|
|
Packit |
0848f5 |
if (shm_root_rank_in_world == 1 && shm_rank == 0) {
|
|
Packit |
0848f5 |
origin = rank;
|
|
Packit |
0848f5 |
if (verbose) {
|
|
Packit |
0848f5 |
printf("---- I am origin = %d, get_target = %d, put_target = %d\n",
|
|
Packit |
0848f5 |
origin, get_target, put_target);
|
|
Packit |
0848f5 |
}
|
|
Packit |
0848f5 |
}
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
/* Allocate shared memory among local processes */
|
|
Packit |
0848f5 |
MPI_Win_allocate_shared(win_size, win_unit, MPI_INFO_NULL, shm_comm, &my_base, &shm_win);
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
if (shm_root_rank_in_world == 0 && verbose) {
|
|
Packit |
0848f5 |
MPI_Aint size;
|
|
Packit |
0848f5 |
int disp_unit;
|
|
Packit |
0848f5 |
for (i = 0; i < shm_nproc; i++) {
|
|
Packit |
0848f5 |
MPI_Win_shared_query(shm_win, i, &size, &disp_unit, &shm_bases[i]);
|
|
Packit |
0848f5 |
printf("%d -- shared query: base[%d]=%p, size %ld, "
|
|
Packit |
0848f5 |
"unit %d\n", rank, i, shm_bases[i], size, disp_unit);
|
|
Packit |
0848f5 |
}
|
|
Packit |
0848f5 |
}
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
/* Get offset of put target(1) on get target(0) */
|
|
Packit |
0848f5 |
get_target_base_offsets = (shm_nproc - 1) * win_size / win_unit;
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
if (origin == rank && verbose)
|
|
Packit |
0848f5 |
printf("%d -- base_offset of put_target %d on get_target %d: %ld\n",
|
|
Packit |
0848f5 |
rank, put_target, get_target, get_target_base_offsets);
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
/* Create using MPI_Win_create(). Note that new window size of get_target(0)
|
|
Packit |
0848f5 |
* is equal to the total size of shm segments on this node, thus get_target
|
|
Packit |
0848f5 |
* process can read the byte located on put_target process.*/
|
|
Packit |
0848f5 |
for (i = 0; i < BUF_CNT; i++) {
|
|
Packit |
0848f5 |
local_buf[i] = (i + 1) * 1.0;
|
|
Packit |
0848f5 |
my_base[i] = 0.0;
|
|
Packit |
0848f5 |
}
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
if (get_target == rank)
|
|
Packit |
0848f5 |
new_win_size = win_size * shm_nproc;
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
MPI_Win_create(my_base, new_win_size, win_unit, MPI_INFO_NULL, MPI_COMM_WORLD, &win);
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
if (verbose)
|
|
Packit |
0848f5 |
printf("%d -- new window my_base %p, size %d\n", rank, my_base, new_win_size);
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
MPI_Barrier(MPI_COMM_WORLD);
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
/* Check if flush guarantees the completion of put operations on target side.
|
|
Packit |
0848f5 |
*
|
|
Packit |
0848f5 |
* P exclusively locks 2 processes whose windows are shared with each other.
|
|
Packit |
0848f5 |
* P first put and flush to a process, then get the updated data from another process.
|
|
Packit |
0848f5 |
* If flush returns before operations are done on the target side, the data may be
|
|
Packit |
0848f5 |
* incorrect.*/
|
|
Packit |
0848f5 |
for (x = 0; x < ITER; x++) {
|
|
Packit |
0848f5 |
for (i = 0; i < BUF_CNT; i++) {
|
|
Packit |
0848f5 |
local_buf[i] += x;
|
|
Packit |
0848f5 |
check_buf[i] = 0;
|
|
Packit |
0848f5 |
}
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
if (rank == origin) {
|
|
Packit |
0848f5 |
MPI_Win_lock(MPI_LOCK_EXCLUSIVE, put_target, 0, win);
|
|
Packit |
0848f5 |
MPI_Win_lock(MPI_LOCK_EXCLUSIVE, get_target, 0, win);
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
for (i = 0; i < BUF_CNT; i++) {
|
|
Packit |
0848f5 |
MPI_Put(&local_buf[i], 1, MPI_DOUBLE, put_target, i, 1, MPI_DOUBLE, win);
|
|
Packit |
0848f5 |
}
|
|
Packit |
0848f5 |
MPI_Win_flush(put_target, win);
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
MPI_Get(check_buf, BUF_CNT, MPI_DOUBLE, get_target,
|
|
Packit |
0848f5 |
get_target_base_offsets, BUF_CNT, MPI_DOUBLE, win);
|
|
Packit |
0848f5 |
MPI_Win_flush(get_target, win);
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
for (i = 0; i < BUF_CNT; i++) {
|
|
Packit |
0848f5 |
if (check_buf[i] != local_buf[i]) {
|
|
Packit |
0848f5 |
printf("%d(iter %d) - Got check_buf[%d] = %.1lf, expected %.1lf\n",
|
|
Packit |
0848f5 |
rank, x, i, check_buf[i], local_buf[i]);
|
|
Packit |
0848f5 |
errors++;
|
|
Packit |
0848f5 |
}
|
|
Packit |
0848f5 |
}
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
MPI_Win_unlock(put_target, win);
|
|
Packit |
0848f5 |
MPI_Win_unlock(get_target, win);
|
|
Packit |
0848f5 |
}
|
|
Packit |
0848f5 |
}
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
MPI_Barrier(MPI_COMM_WORLD);
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
MPI_Reduce(&errors, &all_errors, 1, MPI_INT, MPI_SUM, 0, MPI_COMM_WORLD);
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
exit:
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
if (rank == 0 && all_errors == 0)
|
|
Packit |
0848f5 |
printf(" No Errors\n");
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
if (shm_bases)
|
|
Packit |
0848f5 |
free(shm_bases);
|
|
Packit |
0848f5 |
if (shm_ranks)
|
|
Packit |
0848f5 |
free(shm_ranks);
|
|
Packit |
0848f5 |
if (shm_ranks_in_world)
|
|
Packit |
0848f5 |
free(shm_ranks_in_world);
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
if (shm_win != MPI_WIN_NULL)
|
|
Packit |
0848f5 |
MPI_Win_free(&shm_win);
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
if (win != MPI_WIN_NULL)
|
|
Packit |
0848f5 |
MPI_Win_free(&win);
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
if (shm_comm != MPI_COMM_NULL)
|
|
Packit |
0848f5 |
MPI_Comm_free(&shm_comm);
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
if (shm_group != MPI_GROUP_NULL)
|
|
Packit |
0848f5 |
MPI_Group_free(&shm_group);
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
if (world_group != MPI_GROUP_NULL)
|
|
Packit |
0848f5 |
MPI_Group_free(&world_group);
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
MPI_Finalize();
|
|
Packit |
0848f5 |
|
|
Packit |
0848f5 |
return 0;
|
|
Packit |
0848f5 |
}
|