Blob Blame History Raw
/* -*- Mode: C; c-basic-offset:4 ; indent-tabs-mode:nil ; -*- */
/*
 *  (C) 2001 by Argonne National Laboratory.
 *      See COPYRIGHT in top-level directory.
 */
#include "mpi.h"
#include <stdio.h>
#include <string.h>
#include <stdlib.h>

/* A simple performance test. The file name is taken as a
   command-line argument. */

#define SIZE (1048576*4)        /* read/write size per node in bytes */

static void handle_error(int errcode, const char *str)
{
    char msg[MPI_MAX_ERROR_STRING];
    int resultlen;
    MPI_Error_string(errcode, msg, &resultlen);
    fprintf(stderr, "%s: %s\n", str, msg);
    MPI_Abort(MPI_COMM_WORLD, 1);
}

#define MPI_CHECK(fn) { int errcode; errcode = (fn); if (errcode != MPI_SUCCESS) handle_error(errcode, #fn); }



int main(int argc, char **argv)
{
    int *buf, i, j, mynod, nprocs, ntimes = 5, len, err, flag;
    double stim, read_tim, write_tim, new_read_tim, new_write_tim;
    double min_read_tim = 10000000.0, min_write_tim = 10000000.0, read_bw, write_bw;
    MPI_File fh;
    MPI_Status status;
    char *filename;

    MPI_Init(&argc, &argv);
    MPI_Comm_size(MPI_COMM_WORLD, &nprocs);
    MPI_Comm_rank(MPI_COMM_WORLD, &mynod);

/* process 0 takes the file name as a command-line argument and
   broadcasts it to other processes */
    if (!mynod) {
        i = 1;
        while ((i < argc) && strcmp("-fname", *argv)) {
            i++;
            argv++;
        }
        if (i >= argc) {
            fprintf(stderr, "\n*#  Usage: perf -fname filename\n\n");
            MPI_Abort(MPI_COMM_WORLD, 1);
        }
        argv++;
        len = strlen(*argv);
        filename = (char *) malloc(len + 1);
        strcpy(filename, *argv);
        MPI_Bcast(&len, 1, MPI_INT, 0, MPI_COMM_WORLD);
        MPI_Bcast(filename, len + 1, MPI_CHAR, 0, MPI_COMM_WORLD);
        fprintf(stderr, "Access size per process = %d bytes, ntimes = %d\n", SIZE, ntimes);
    } else {
        MPI_Bcast(&len, 1, MPI_INT, 0, MPI_COMM_WORLD);
        filename = (char *) malloc(len + 1);
        MPI_Bcast(filename, len + 1, MPI_CHAR, 0, MPI_COMM_WORLD);
    }


    buf = (int *) malloc(SIZE);

    for (j = 0; j < ntimes; j++) {
        MPI_CHECK(MPI_File_open(MPI_COMM_WORLD, filename,
                                MPI_MODE_CREATE | MPI_MODE_RDWR, MPI_INFO_NULL, &fh));
        MPI_CHECK(MPI_File_seek(fh, mynod * SIZE, MPI_SEEK_SET));

        MPI_Barrier(MPI_COMM_WORLD);
        stim = MPI_Wtime();
        MPI_CHECK(MPI_File_write(fh, buf, SIZE, MPI_BYTE, &status));
        write_tim = MPI_Wtime() - stim;

        MPI_CHECK(MPI_File_close(&fh));

        MPI_Barrier(MPI_COMM_WORLD);

        MPI_CHECK(MPI_File_open(MPI_COMM_WORLD, filename, MPI_MODE_CREATE |
                                MPI_MODE_RDWR, MPI_INFO_NULL, &fh));
        MPI_CHECK(MPI_File_seek(fh, mynod * SIZE, MPI_SEEK_SET));

        MPI_Barrier(MPI_COMM_WORLD);
        stim = MPI_Wtime();
        MPI_CHECK(MPI_File_read(fh, buf, SIZE, MPI_BYTE, &status));
        read_tim = MPI_Wtime() - stim;

        MPI_CHECK(MPI_File_close(&fh));

        MPI_Allreduce(&write_tim, &new_write_tim, 1, MPI_DOUBLE, MPI_MAX, MPI_COMM_WORLD);
        MPI_Allreduce(&read_tim, &new_read_tim, 1, MPI_DOUBLE, MPI_MAX, MPI_COMM_WORLD);

        min_read_tim = (new_read_tim < min_read_tim) ? new_read_tim : min_read_tim;
        min_write_tim = (new_write_tim < min_write_tim) ? new_write_tim : min_write_tim;
    }

    if (mynod == 0) {
        read_bw = (SIZE * nprocs) / (min_read_tim * 1024.0 * 1024.0);
        write_bw = (SIZE * nprocs) / (min_write_tim * 1024.0 * 1024.0);
        fprintf(stderr, "Write bandwidth without file sync = %f Mbytes/sec\n", write_bw);
        fprintf(stderr, "Read bandwidth without prior file sync = %f Mbytes/sec\n", read_bw);
    }

    min_write_tim = 10000000.0;
    min_read_tim = 10000000.0;

    flag = 0;
    for (j = 0; j < ntimes; j++) {
        MPI_CHECK(MPI_File_open(MPI_COMM_WORLD, filename, MPI_MODE_CREATE |
                                MPI_MODE_RDWR, MPI_INFO_NULL, &fh));
        MPI_CHECK(MPI_File_seek(fh, mynod * SIZE, MPI_SEEK_SET));

        MPI_Barrier(MPI_COMM_WORLD);
        stim = MPI_Wtime();
        MPI_CHECK(MPI_File_write(fh, buf, SIZE, MPI_BYTE, &status));
        err = MPI_File_sync(fh);
        write_tim = MPI_Wtime() - stim;
        if (err == MPI_ERR_UNKNOWN) {
            flag = 1;
            break;
        }

        MPI_CHECK(MPI_File_close(&fh));

        MPI_Barrier(MPI_COMM_WORLD);

        MPI_CHECK(MPI_File_open(MPI_COMM_WORLD, filename, MPI_MODE_CREATE |
                                MPI_MODE_RDWR, MPI_INFO_NULL, &fh));
        MPI_CHECK(MPI_File_seek(fh, mynod * SIZE, MPI_SEEK_SET));

        MPI_Barrier(MPI_COMM_WORLD);
        stim = MPI_Wtime();
        MPI_CHECK(MPI_File_read(fh, buf, SIZE, MPI_BYTE, &status));
        read_tim = MPI_Wtime() - stim;

        MPI_CHECK(MPI_File_close(&fh));

        MPI_Allreduce(&write_tim, &new_write_tim, 1, MPI_DOUBLE, MPI_MAX, MPI_COMM_WORLD);
        MPI_Allreduce(&read_tim, &new_read_tim, 1, MPI_DOUBLE, MPI_MAX, MPI_COMM_WORLD);

        min_read_tim = (new_read_tim < min_read_tim) ? new_read_tim : min_read_tim;
        min_write_tim = (new_write_tim < min_write_tim) ? new_write_tim : min_write_tim;
    }

    if (mynod == 0) {
        if (flag)
            fprintf(stderr, "MPI_File_sync returns error.\n");
        else {
            read_bw = (SIZE * nprocs) / (min_read_tim * 1024.0 * 1024.0);
            write_bw = (SIZE * nprocs) / (min_write_tim * 1024.0 * 1024.0);
            fprintf(stderr, "Write bandwidth including file sync = %f Mbytes/sec\n", write_bw);
            fprintf(stderr, "Read bandwidth after file sync = %f Mbytes/sec\n", read_bw);
        }
    }

    free(buf);
    free(filename);
    MPI_Finalize();
    return 0;
}