Skip to content

Commit

Permalink
ncint performance test
Browse files Browse the repository at this point in the history
  • Loading branch information
edwardhartnett committed Dec 2, 2019
1 parent 751ff3d commit a8ea44c
Show file tree
Hide file tree
Showing 4 changed files with 225 additions and 3 deletions.
8 changes: 5 additions & 3 deletions tests/ncint/Makefile.am
Original file line number Diff line number Diff line change
Expand Up @@ -8,19 +8,21 @@ AM_CPPFLAGS = -I$(top_srcdir)/src/clib
LDADD = ${top_builddir}/src/clib/libpioc.la

# Build the test for make check.
check_PROGRAMS = tst_pio_udf tst_pio_async tst_async_multi
check_PROGRAMS = tst_pio_udf tst_pio_async tst_async_multi \
tst_ncint_perf

tst_pio_udf_SOURCES = tst_pio_udf.c pio_err_macros.h
tst_pio_async_SOURCES = tst_pio_async.c pio_err_macros.h
tst_async_multi_SOURCES = tst_async_multi.c pio_err_macros.h
tst_ncint_perf_SOURCES = tst_ncint_perf.c pio_err_macros.h

if RUN_TESTS
# Tests will run from a bash script.
TESTS = run_tests.sh
TESTS = run_tests.sh run_perf.sh
endif # RUN_TESTS

# Distribute the test script.
EXTRA_DIST = run_tests.sh
EXTRA_DIST = run_tests.sh run_perf.sh

# Clean up files produced during testing.
CLEANFILES = *.nc *.log
2 changes: 2 additions & 0 deletions tests/ncint/pio_err_macros.h
Original file line number Diff line number Diff line change
Expand Up @@ -61,4 +61,6 @@ static int total_err = 0, err = 0;
return 0; \
} while (0)

#define ERR_WRONG 99

#endif /* _PIO_ERR_MACROS_H */
33 changes: 33 additions & 0 deletions tests/ncint/run_perf.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,33 @@
#!/bin/sh

# Driver script for the PIO performance tests of the netCDF
# integration layer. Each program listed in PIO_TESTS is launched
# under mpiexec with 4 MPI tasks; the first failing program ends the
# loop and makes the script exit with status 1.

# Ed Hartnett

# Abort the script when an unguarded command returns an error.
set -e

# Leave the script (and therefore the loop) on ctrl-c or TERM.
trap exit INT TERM

printf 'running PIO performance tests...\n'

PIO_TESTS='tst_ncint_perf'

# Remains true only while every program run so far has succeeded.
success1=true
for TEST in $PIO_TESTS
do
    echo "running ${TEST}"
    if mpiexec -n 4 ./${TEST}; then
        success1=true
    else
        success1=false
        break
    fi
done

# Report the overall result through the exit status.
if test x$success1 = xtrue; then
    exit 0
fi
exit 1
185 changes: 185 additions & 0 deletions tests/ncint/tst_ncint_perf.c
Original file line number Diff line number Diff line change
@@ -0,0 +1,185 @@
/* Test netcdf integration layer.
This is a performance test of async mode in PIO, using the netCDF
integration layer.
Ed Hartnett
12/2/19
*/

#include "config.h"
#include <pio.h>
#include <sys/time.h>
#include "pio_err_macros.h"

/* Name of the file this test creates and re-reads. It is specific to
 * this test so the output cannot collide with a file written by
 * another test running in the same directory. */
#define FILE_NAME "tst_ncint_perf.nc"

/* Name of the single data variable defined in the file. */
#define VAR_NAME "data_var"

/* Names of the unlimited (record) dimension and the two fixed
 * dimensions of the variable. */
#define DIM_NAME_UNLIMITED "dim_unlimited"
#define DIM_NAME_X "dim_x"
#define DIM_NAME_Y "dim_y"

/* Lengths of the two fixed dimensions. */
#define DIM_LEN_X 3
#define DIM_LEN_Y 4

/* Number of dimensions covered by the decomposition (the fixed
 * dimensions only). */
#define NDIM2 2

/* Number of dimensions of the variable, including the record
 * dimension. */
#define NDIM3 3

/* Number of timesteps; the elapsed time is divided by this value when
 * the result is reported. */
#define NUM_TIMESTEPS 1

/* Dispatch table declared as an external symbol; main() below does
 * not refer to it directly. NOTE(review): presumably defined by the
 * netCDF integration layer of PIO - confirm. */
extern NC_Dispatch NCINT_dispatcher;

/* Number of computational components to create. It sizes the
 * num_procs2[] array and is passed as the component count to
 * nc_def_async() in main(). */
#define COMPONENT_COUNT 1

/**
 * Performance test of async mode through the netCDF integration layer.
 *
 * After MPI start-up, all tasks call nc_def_async() with one I/O task
 * and one computational component of three tasks. Every task with a
 * non-zero rank then runs the timed section: it creates FILE_NAME with
 * one 3D record variable, writes its share of one record with
 * nc_put_vard_int(), reopens the file, checks the metadata, reads the
 * record back and compares it with what was written. Finally it prints
 * one tab-separated result line with the elapsed time, the size of the
 * data set in megabytes and the resulting throughput.
 *
 * @param argc argument count, passed on to MPI_Init().
 * @param argv argument vector, passed on to MPI_Init().
 * @return whatever the PERR / PFINAL_RESULTS macros from
 * pio_err_macros.h return (their definitions are not part of this
 * file).
 */
int
main(int argc, char **argv)
{
    int my_rank;
    int ntasks;

    /* Initialize MPI. */
    if (MPI_Init(&argc, &argv)) PERR;

    /* Learn my rank and the total number of processors. */
    if (MPI_Comm_rank(MPI_COMM_WORLD, &my_rank)) PERR;
    if (MPI_Comm_size(MPI_COMM_WORLD, &ntasks)) PERR;

    if (!my_rank)
        printf("\n*** Testing netCDF integration PIO performance.\n");
    if (!my_rank)
        printf("*** testing simple async use of netCDF integration layer...");
    {
        int ncid, ioid;
        int dimid[NDIM3], varid;
        int dimlen[NDIM3] = {NC_UNLIMITED, DIM_LEN_X, DIM_LEN_Y};
        int iosysid;
        size_t elements_per_pe;
        size_t *compdof; /* The decomposition mapping. */
        int *my_data;
        int *data_in;
        int num_procs2[COMPONENT_COUNT] = {3};
        int num_io_procs = 1;
        size_t i;

        /* Turn on logging for PIO library. */
        /* PIOc_set_log_level(4); */
        /* if (!my_rank) */
        /*     nc_set_log_level(3); */

        /* Initialize the async IO system. The IO task will not return
         * from this call until the PIOc_finalize() is called by the
         * compute tasks. */
        if (nc_def_async(MPI_COMM_WORLD, num_io_procs, NULL, COMPONENT_COUNT,
                         num_procs2, NULL, NULL, NULL, PIO_REARR_BOX, &iosysid))
            PERR;

        /* Only tasks with a non-zero rank run the timed section. */
        if (my_rank)
        {
            struct timeval starttime, endtime;
            long long startt, endt;
            long long delta;
            float num_megabytes;
            float delta_in_sec;
            float mb_per_sec;

            /* Start the clock. */
            gettimeofday(&starttime, NULL);

            /* Create a file with a 3D record var. */
            if (nc_create(FILE_NAME, NC_PIO|NC_NETCDF4, &ncid)) PERR;
            if (nc_def_dim(ncid, DIM_NAME_UNLIMITED, dimlen[0], &dimid[0])) PERR;
            if (nc_def_dim(ncid, DIM_NAME_X, dimlen[1], &dimid[1])) PERR;
            if (nc_def_dim(ncid, DIM_NAME_Y, dimlen[2], &dimid[2])) PERR;
            if (nc_def_var(ncid, VAR_NAME, NC_INT, NDIM3, dimid, &varid)) PERR;
            if (nc_enddef(ncid)) PERR;

            /* Calculate a decomposition for distributed arrays: one
             * record is split evenly over the non-IO tasks. The
             * divisor cannot be zero here because my_rank > 0 implies
             * ntasks > num_io_procs. */
            elements_per_pe = DIM_LEN_X * DIM_LEN_Y / (ntasks - num_io_procs);
            if (!(compdof = malloc(elements_per_pe * sizeof(size_t))))
                PERR;
            for (i = 0; i < elements_per_pe; i++)
                compdof[i] = (my_rank - num_io_procs) * elements_per_pe + i;

            /* Create the PIO decomposition for this test. It covers
             * the two fixed dimensions only, hence &dimlen[1]. */
            if (nc_def_decomp(iosysid, PIO_INT, NDIM2, &dimlen[1], elements_per_pe,
                              compdof, &ioid, 1, NULL, NULL)) PERR;
            free(compdof);

            /* Create some data on this processor. */
            if (!(my_data = malloc(elements_per_pe * sizeof(int)))) PERR;
            for (i = 0; i < elements_per_pe; i++)
                my_data[i] = my_rank * 10 + (int)i;

            /* Write some data with distributed arrays. */
            if (nc_put_vard_int(ncid, varid, ioid, 0, my_data)) PERR;
            if (nc_close(ncid)) PERR;

            /* Reopen the file using netCDF integration. */
            {
                int ndims, nvars, ngatts, unlimdimid;
                nc_type xtype_in;
                char var_name_in[NC_MAX_NAME + 1];
                char dim_name_in[NC_MAX_NAME + 1];
                int natts_in;
                int dimids_in[NDIM3];
                size_t dim_len_in;

                /* Open the file. */
                if (nc_open(FILE_NAME, NC_PIO, &ncid)) PERR;

                /* Check the file. */
                if (nc_inq(ncid, &ndims, &nvars, &ngatts, &unlimdimid)) PERR;
                if (ndims != 3 || nvars != 1 || ngatts != 0 ||
                    unlimdimid != 0) PERR;
                if (nc_inq_var(ncid, 0, var_name_in, &xtype_in, &ndims,
                               dimids_in, &natts_in)) PERR;
                if (strcmp(var_name_in, VAR_NAME) || xtype_in != NC_INT || ndims != NDIM3
                    || dimids_in[0] != 0 || dimids_in[1] != 1 || dimids_in[2] != 2 ||
                    natts_in != 0) PERR;
                if (nc_inq_dim(ncid, 0, dim_name_in, &dim_len_in)) PERR;
                if (strcmp(dim_name_in, DIM_NAME_UNLIMITED) || dim_len_in != 1) PERR;
                if (nc_inq_dim(ncid, 1, dim_name_in, &dim_len_in)) PERR;
                if (strcmp(dim_name_in, DIM_NAME_X) || dim_len_in != DIM_LEN_X) PERR;
                if (nc_inq_dim(ncid, 2, dim_name_in, &dim_len_in)) PERR;
                if (strcmp(dim_name_in, DIM_NAME_Y) || dim_len_in != DIM_LEN_Y) PERR;

                /* Read distributed arrays. */
                if (!(data_in = malloc(elements_per_pe * sizeof(int)))) PERR;
                if (nc_get_vard_int(ncid, varid, ioid, 0, data_in)) PERR;

                /* Check results. */
                for (i = 0; i < elements_per_pe; i++)
                    if (data_in[i] != my_data[i]) PERR;

                /* Close file. */
                if (nc_close(ncid)) PERR;

                /* Free resources. */
                free(data_in);
            }

            /* Stop the clock. */
            gettimeofday(&endtime, NULL);

            /* Compute the time delta in microseconds. The seconds are
             * widened to long long before the multiplication so the
             * product cannot overflow where tv_sec is a 32-bit type. */
            startt = 1000000LL * (long long)starttime.tv_sec + starttime.tv_usec;
            endt = 1000000LL * (long long)endtime.tv_sec + endtime.tv_usec;
            delta = (endt - startt) / NUM_TIMESTEPS;
            delta_in_sec = (float)delta / 1000000;

            /* Size of the data set written by all compute tasks
             * together. The timed section also includes the read-back
             * and verification of the same data. */
            num_megabytes = (float)(DIM_LEN_X * DIM_LEN_Y * NUM_TIMESTEPS *
                                    sizeof(int)) / (1024 * 1024);

            /* Do not divide by zero if the clock did not advance. */
            mb_per_sec = delta_in_sec > 0 ? num_megabytes / delta_in_sec : 0;
            printf("\n%d\t%d\t%d\t%d\t%d\t%8.3f\t%8.1f\t%8.3f\n", ntasks, num_io_procs,
                   1, 0, 1, delta_in_sec, num_megabytes, mb_per_sec);

            free(my_data);
            if (nc_free_decomp(ioid)) PERR;
            if (nc_free_iosystem(iosysid)) PERR;
        }
    }
    if (!my_rank)
        PSUMMARIZE_ERR;

    /* Finalize MPI. */
    MPI_Finalize();
    PFINAL_RESULTS;
}

0 comments on commit a8ea44c

Please sign in to comment.