|
Packit Service |
c5cf8c |
/* -*- Mode: C; c-basic-offset:4 ; indent-tabs-mode:nil ; -*- */
/*
 *
 *  (C) 2014 by Argonne National Laboratory.
 *      See COPYRIGHT in top-level directory.
 */
|
|
Packit Service |
c5cf8c |
#include <mpi.h>
|
|
Packit Service |
c5cf8c |
#include <stdio.h>
|
|
Packit Service |
c5cf8c |
#include <stdlib.h>
|
|
Packit Service |
c5cf8c |
|
|
Packit Service |
c5cf8c |
/*
 * This test makes sure that after a failure, the correct group of failed
 * processes is returned from MPIX_Comm_failure_ack/get_acked.
 */
|
|
Packit Service |
c5cf8c |
int main(int argc, char **argv)
|
|
Packit Service |
c5cf8c |
{
|
|
Packit Service |
c5cf8c |
int rank, size, err, result, i;
|
|
Packit Service |
c5cf8c |
char buf[10] = " No errors";
|
|
Packit Service |
c5cf8c |
char error[MPI_MAX_ERROR_STRING];
|
|
Packit Service |
c5cf8c |
MPI_Group failed_grp, one_grp, world_grp;
|
|
Packit Service |
c5cf8c |
int one[] = { 1 };
|
|
Packit Service |
c5cf8c |
int world_ranks[] = { 0, 1, 2 };
|
|
Packit Service |
c5cf8c |
int failed_ranks[3];
|
|
Packit Service |
c5cf8c |
|
|
Packit Service |
c5cf8c |
MPI_Init(&argc, &argv);
|
|
Packit Service |
c5cf8c |
MPI_Comm_rank(MPI_COMM_WORLD, &rank;;
|
|
Packit Service |
c5cf8c |
MPI_Comm_size(MPI_COMM_WORLD, &size);
|
|
Packit Service |
c5cf8c |
if (size < 3) {
|
|
Packit Service |
c5cf8c |
fprintf(stderr, "Must run with at least 3 processes\n");
|
|
Packit Service |
c5cf8c |
MPI_Abort(MPI_COMM_WORLD, 1);
|
|
Packit Service |
c5cf8c |
}
|
|
Packit Service |
c5cf8c |
|
|
Packit Service |
c5cf8c |
MPI_Comm_set_errhandler(MPI_COMM_WORLD, MPI_ERRORS_RETURN);
|
|
Packit Service |
c5cf8c |
|
|
Packit Service |
c5cf8c |
if (rank == 1) {
|
|
Packit Service |
c5cf8c |
exit(EXIT_FAILURE);
|
|
Packit Service |
c5cf8c |
}
|
|
Packit Service |
c5cf8c |
|
|
Packit Service |
c5cf8c |
if (rank == 0) {
|
|
Packit Service |
c5cf8c |
err = MPI_Recv(buf, 10, MPI_CHAR, 1, 0, MPI_COMM_WORLD, MPI_STATUS_IGNORE);
|
|
Packit Service |
c5cf8c |
if (MPI_SUCCESS == err) {
|
|
Packit Service |
c5cf8c |
fprintf(stderr, "Expected a failure for receive from rank 1\n");
|
|
Packit Service |
c5cf8c |
MPI_Abort(MPI_COMM_WORLD, 1);
|
|
Packit Service |
c5cf8c |
}
|
|
Packit Service |
c5cf8c |
|
|
Packit Service |
c5cf8c |
err = MPIX_Comm_failure_ack(MPI_COMM_WORLD);
|
|
Packit Service |
c5cf8c |
if (MPI_SUCCESS != err) {
|
|
Packit Service |
c5cf8c |
int ec;
|
|
Packit Service |
c5cf8c |
MPI_Error_class(err, &ec);
|
|
Packit Service |
c5cf8c |
MPI_Error_string(err, error, &size);
|
|
Packit Service |
c5cf8c |
fprintf(stderr, "MPIX_Comm_failure_ack returned an error: %d\n%s", ec, error);
|
|
Packit Service |
c5cf8c |
MPI_Abort(MPI_COMM_WORLD, 1);
|
|
Packit Service |
c5cf8c |
}
|
|
Packit Service |
c5cf8c |
err = MPIX_Comm_failure_get_acked(MPI_COMM_WORLD, &failed_grp);
|
|
Packit Service |
c5cf8c |
if (MPI_SUCCESS != err) {
|
|
Packit Service |
c5cf8c |
int ec;
|
|
Packit Service |
c5cf8c |
MPI_Error_class(err, &ec);
|
|
Packit Service |
c5cf8c |
MPI_Error_string(err, error, &size);
|
|
Packit Service |
c5cf8c |
fprintf(stderr, "MPIX_Comm_failure_get_acked returned an error: %d\n%s", ec, error);
|
|
Packit Service |
c5cf8c |
MPI_Abort(MPI_COMM_WORLD, 1);
|
|
Packit Service |
c5cf8c |
}
|
|
Packit Service |
c5cf8c |
|
|
Packit Service |
c5cf8c |
MPI_Comm_group(MPI_COMM_WORLD, &world_grp);
|
|
Packit Service |
c5cf8c |
MPI_Group_incl(world_grp, 1, one, &one_grp);
|
|
Packit Service |
c5cf8c |
MPI_Group_compare(one_grp, failed_grp, &result);
|
|
Packit Service |
c5cf8c |
if (MPI_IDENT != result) {
|
|
Packit Service |
c5cf8c |
fprintf(stderr, "First failed group contains incorrect processes\n");
|
|
Packit Service |
c5cf8c |
MPI_Group_size(failed_grp, &size);
|
|
Packit Service |
c5cf8c |
MPI_Group_translate_ranks(failed_grp, size, world_ranks, world_grp, failed_ranks);
|
|
Packit Service |
c5cf8c |
for (i = 0; i < size; i++)
|
|
Packit Service |
c5cf8c |
fprintf(stderr, "DEAD: %d\n", failed_ranks[i]);
|
|
Packit Service |
c5cf8c |
MPI_Abort(MPI_COMM_WORLD, 1);
|
|
Packit Service |
c5cf8c |
}
|
|
Packit Service |
c5cf8c |
MPI_Group_free(&failed_grp);
|
|
Packit Service |
c5cf8c |
|
|
Packit Service |
c5cf8c |
err = MPI_Recv(buf, 10, MPI_CHAR, 2, 0, MPI_COMM_WORLD, MPI_STATUS_IGNORE);
|
|
Packit Service |
c5cf8c |
if (MPI_SUCCESS != err) {
|
|
Packit Service |
c5cf8c |
fprintf(stderr, "First receive failed\n");
|
|
Packit Service |
c5cf8c |
MPI_Abort(MPI_COMM_WORLD, 1);
|
|
Packit Service |
c5cf8c |
}
|
|
Packit Service |
c5cf8c |
err = MPI_Recv(buf, 10, MPI_CHAR, 2, 0, MPI_COMM_WORLD, MPI_STATUS_IGNORE);
|
|
Packit Service |
c5cf8c |
if (MPI_SUCCESS == err) {
|
|
Packit Service |
c5cf8c |
fprintf(stderr, "Expected a failure for receive from rank 2\n");
|
|
Packit Service |
c5cf8c |
MPI_Abort(MPI_COMM_WORLD, 1);
|
|
Packit Service |
c5cf8c |
}
|
|
Packit Service |
c5cf8c |
|
|
Packit Service |
c5cf8c |
err = MPIX_Comm_failure_get_acked(MPI_COMM_WORLD, &failed_grp);
|
|
Packit Service |
c5cf8c |
if (MPI_SUCCESS != err) {
|
|
Packit Service |
c5cf8c |
int ec;
|
|
Packit Service |
c5cf8c |
MPI_Error_class(err, &ec);
|
|
Packit Service |
c5cf8c |
MPI_Error_string(err, error, &size);
|
|
Packit Service |
c5cf8c |
fprintf(stderr, "MPIX_Comm_failure_get_acked returned an error: %d\n%s", ec, error);
|
|
Packit Service |
c5cf8c |
MPI_Abort(MPI_COMM_WORLD, 1);
|
|
Packit Service |
c5cf8c |
}
|
|
Packit Service |
c5cf8c |
|
|
Packit Service |
c5cf8c |
MPI_Group_compare(one_grp, failed_grp, &result);
|
|
Packit Service |
c5cf8c |
if (MPI_IDENT != result) {
|
|
Packit Service |
c5cf8c |
fprintf(stderr, "Second failed group contains incorrect processes\n");
|
|
Packit Service |
c5cf8c |
MPI_Group_size(failed_grp, &size);
|
|
Packit Service |
c5cf8c |
MPI_Group_translate_ranks(failed_grp, size, world_ranks, world_grp, failed_ranks);
|
|
Packit Service |
c5cf8c |
for (i = 0; i < size; i++)
|
|
Packit Service |
c5cf8c |
fprintf(stderr, "DEAD: %d\n", failed_ranks[i]);
|
|
Packit Service |
c5cf8c |
MPI_Abort(MPI_COMM_WORLD, 1);
|
|
Packit Service |
c5cf8c |
}
|
|
Packit Service |
c5cf8c |
|
|
Packit Service |
c5cf8c |
fprintf(stdout, " No errors\n");
|
|
Packit Service |
c5cf8c |
} else if (rank == 2) {
|
|
Packit Service |
c5cf8c |
MPI_Ssend(buf, 10, MPI_CHAR, 0, 0, MPI_COMM_WORLD);
|
|
Packit Service |
c5cf8c |
|
|
Packit Service |
c5cf8c |
exit(EXIT_FAILURE);
|
|
Packit Service |
c5cf8c |
}
|
|
Packit Service |
c5cf8c |
|
|
Packit Service |
c5cf8c |
MPI_Group_free(&failed_grp);
|
|
Packit Service |
c5cf8c |
MPI_Group_free(&one_grp);
|
|
Packit Service |
c5cf8c |
MPI_Group_free(&world_grp);
|
|
Packit Service |
c5cf8c |
MPI_Finalize();
|
|
Packit Service |
c5cf8c |
}
|