mirror of
https://github.com/Unidata/netcdf-c.git
synced 2025-01-06 15:34:44 +08:00
3ffe7be446
re: Discussion https://github.com/Unidata/netcdf-c/discussions/2214 The primary change is to support so-called "standard filters". A standard filter is one that is defined by the following netcdf-c API: ```` int nc_def_var_XXX(int ncid, int varid, size_t nparams, unsigned* params); int nc_inq_var_XXXX(int ncid, int varid, int* usefilterp, unsigned* params); ```` So for example, zstandard would be a standard filter by defining the functions *nc_def_var_zstandard* and *nc_inq_var_zstandard*. In order to define these functions, we need a new dispatch function: ```` int nc_inq_filter_avail(int ncid, unsigned filterid); ```` This function, combined with the existing filter API can be used to implement arbitrary standard filters using a simple code pattern. Note that I would have preferred that this function return a list of all available filters, but HDF5 does not support that functionality. So this PR implements the dispatch function and implements the following standard functions: + bzip2 + zstandard + blosc Specific test cases are also provided for HDF5 and NCZarr. Over time, other specific standard filters will be defined. ## Primary Changes * Add nc_inq_filter_avail() to netcdf-c API. * Add standard filter implementations to test use of *nc_inq_filter_avail*. * Bump the dispatch table version number and add to all the relevant dispatch tables (libsrc, libsrcp, etc). * Create a program to invoke nc_inq_filter_avail so that it is accessible to shell scripts. * Cleanup szip support to properly support szip when HDF5 is disabled. This involves detecting libsz separately from testing if HDF5 supports szip. * Integrate shuffle and fletcher32 into the existing filter API. This means that, for example, nc_def_var_fletcher32 is now a wrapper around nc_def_var_filter. * Extend the Codec defaulting to allow multiple default shared libraries. ## Misc. Changes * Modify configure.ac/CMakeLists.txt to look for the relevant libraries implementing standard filters. * Modify libnetcdf.settings to list available standard filters (including deflate and szip). * Add CMake test modules to locate libbz2 and libzstd. * Cleanup the HDF5 memory manager function use in the plugins. * remove unused file include//ncfilter.h * remove tests for the HDF5 memory operations e.g. H5allocate_memory. * Add flag to ncdump to force use of _Filter instead of _Deflate or _Shuffle or _Fletcher32. Used for testing.
212 lines
6.0 KiB
C
212 lines
6.0 KiB
C
/* This is part of the netCDF package. Copyright 2020 University
|
|
Corporation for Atmospheric Research/Unidata See COPYRIGHT file for
|
|
conditions of use.
|
|
|
|
Test HDF5 file code. These are not intended to be exhaustive tests,
|
|
but they use HDF5 the same way that netCDF-4 does, so if these
|
|
tests don't work, than netCDF-4 won't work either.
|
|
|
|
This files tests parallel I/O using compression filters. This
|
|
functionality is only available in HDF5-1.10.3 and later versions.
|
|
|
|
Ed Hartnett
|
|
*/
|
|
#include <nc_tests.h>
|
|
#include "err_macros.h"
|
|
#include <hdf5.h>
|
|
|
|
#define FILE_NAME "tst_h_par_compress.h5"
|
|
#define VAR_NAME "HALs_memory"
|
|
#define NDIMS 1
|
|
#define MILLION 1000000
|
|
#define DIM2_LEN 16000000
|
|
#define SC1 100000 /* slice count. */
|
|
|
|
/* The following code, when uncommented, adds szip testing for
|
|
* parallel I/O. However, this currently fails. I have a support
|
|
* request in to HDF5 about this. Ed 7/8/20 */
|
|
/* #ifdef HAVE_H5Z_SZIP */
|
|
/* #define NUM_COMPRESS_FILTERS 2 */
|
|
/* #else */
|
|
/* #define NUM_COMPRESS_FILTERS 1 */
|
|
/* #endif /\* HAVE_H5Z_SZIP *\/ */
|
|
#define NUM_COMPRESS_FILTERS 1
|
|
|
|
int
|
|
main(int argc, char **argv)
|
|
{
|
|
int cf;
|
|
int p, my_rank;
|
|
|
|
MPI_Init(&argc, &argv);
|
|
MPI_Comm_rank(MPI_COMM_WORLD, &my_rank);
|
|
MPI_Comm_size(MPI_COMM_WORLD, &p);
|
|
|
|
/* For builds with HDF5 prior to 1.10.3, just return success. */
|
|
#ifdef HDF5_SUPPORTS_PAR_FILTERS
|
|
for (cf = 0; cf < NUM_COMPRESS_FILTERS; cf++)
|
|
{
|
|
if (!my_rank)
|
|
printf("*** Testing parallel I/O with %s compression...", cf ? "szip" : "zlib");
|
|
{
|
|
hid_t fapl_id, fileid, whole_spaceid, dsid, slice_spaceid, whole_spaceid1, xferid;
|
|
hid_t plistid;
|
|
hsize_t start[NDIMS], count[NDIMS];
|
|
hsize_t dims[1], chunksize = SC1;
|
|
int data[SC1], data_in[SC1];
|
|
int num_steps;
|
|
int deflate_level = 4;
|
|
int i, s;
|
|
|
|
/* We will write the same slice of random data over and over to
|
|
* fill the file. */
|
|
for (i = 0; i < SC1; i++)
|
|
data[i] = rand();
|
|
|
|
/* Create file. */
|
|
if ((fapl_id = H5Pcreate(H5P_FILE_ACCESS)) < 0) ERR;
|
|
if (H5Pset_fapl_mpio(fapl_id, MPI_COMM_WORLD, MPI_INFO_NULL) < 0) ERR;
|
|
if ((fileid = H5Fcreate(FILE_NAME, H5F_ACC_TRUNC, H5P_DEFAULT,
|
|
fapl_id)) < 0) ERR;
|
|
|
|
/* Create a space to deal with one slice in memory. */
|
|
dims[0] = SC1;
|
|
if ((slice_spaceid = H5Screate_simple(NDIMS, dims, NULL)) < 0) ERR;
|
|
|
|
/* Create a space to write all slices. */
|
|
dims[0] = DIM2_LEN;
|
|
if ((whole_spaceid = H5Screate_simple(NDIMS, dims, NULL)) < 0) ERR;
|
|
|
|
/* Create property list for dataset. */
|
|
if ((plistid = H5Pcreate(H5P_DATASET_CREATE)) < 0) ERR;
|
|
|
|
/* Turn off object tracking times in HDF5 (as is done in nc4hdf.c). */
|
|
if (H5Pset_obj_track_times(plistid, 0) < 0) ERR;
|
|
|
|
/* Required to truly turn HDF5 fill values off */
|
|
if (H5Pset_fill_time(plistid, H5D_FILL_TIME_NEVER) < 0) ERR;
|
|
|
|
/* Set compression, either deflate or szip. */
|
|
if (cf == 0)
|
|
{
|
|
if (H5Pset_deflate(plistid, deflate_level) < 0) ERR;
|
|
}
|
|
else
|
|
{
|
|
int options_mask = 32;
|
|
int bits_per_pixel = 32;
|
|
if (H5Pset_szip(plistid, options_mask, bits_per_pixel)) ERR;
|
|
}
|
|
|
|
/* Set chunking. */
|
|
if (H5Pset_chunk(plistid, NDIMS, &chunksize) < 0) ERR;
|
|
|
|
/* Turn on creation order tracking. */
|
|
if (H5Pset_attr_creation_order(plistid, H5P_CRT_ORDER_TRACKED|
|
|
H5P_CRT_ORDER_INDEXED) < 0) ERR;
|
|
|
|
/* Create dataset. */
|
|
if ((dsid = H5Dcreate2(fileid, VAR_NAME, H5T_NATIVE_INT,
|
|
whole_spaceid, H5P_DEFAULT, plistid, H5P_DEFAULT)) < 0) ERR;
|
|
|
|
/* Use collective write operations. */
|
|
if ((xferid = H5Pcreate(H5P_DATASET_XFER)) < 0) ERR;
|
|
if (H5Pset_dxpl_mpio(xferid, H5FD_MPIO_COLLECTIVE) < 0) ERR;
|
|
|
|
/* Write the data in num_step steps. */
|
|
num_steps = (DIM2_LEN/SC1) / p;
|
|
for (s = 0; s < num_steps; s++)
|
|
{
|
|
/* Select hyperslab for write of one slice. */
|
|
start[0] = s * SC1 * p + my_rank * SC1;
|
|
count[0] = SC1;
|
|
if (H5Sselect_hyperslab(whole_spaceid, H5S_SELECT_SET,
|
|
start, NULL, count, NULL) < 0) ERR;
|
|
|
|
if (H5Dwrite(dsid, H5T_NATIVE_INT, slice_spaceid, whole_spaceid,
|
|
xferid, data) < 0) ERR;
|
|
|
|
}
|
|
|
|
/* Close. These collective operations will allow every process
|
|
* to catch up. */
|
|
if (H5Dclose(dsid) < 0 ||
|
|
H5Sclose(whole_spaceid) < 0 ||
|
|
H5Sclose(slice_spaceid) < 0 ||
|
|
H5Pclose(fapl_id) < 0 ||
|
|
H5Pclose(plistid) < 0 ||
|
|
H5Fclose(fileid) < 0)
|
|
ERR;
|
|
|
|
/* Open the file. */
|
|
if ((fapl_id = H5Pcreate(H5P_FILE_ACCESS)) < 0) ERR;
|
|
if (H5Pset_fapl_mpio(fapl_id, MPI_COMM_WORLD, MPI_INFO_NULL) < 0) ERR;
|
|
|
|
|
|
if (H5Pset_libver_bounds(fapl_id, H5F_LIBVER_LATEST, H5F_LIBVER_LATEST) < 0) ERR;
|
|
if ((fileid = H5Fopen(FILE_NAME, H5F_ACC_RDONLY, fapl_id)) < 0) ERR;
|
|
|
|
/* Create a space to deal with one slice in memory. */
|
|
dims[0] = SC1;
|
|
if ((slice_spaceid = H5Screate_simple(NDIMS, dims, NULL)) < 0) ERR;
|
|
|
|
/* Open the dataset. */
|
|
if ((dsid = H5Dopen1(fileid, VAR_NAME)) < 0) ERR;
|
|
if ((whole_spaceid1 = H5Dget_space(dsid)) < 0) ERR;
|
|
|
|
/* Read the data, a slice at a time. */
|
|
for (s = 0; s < num_steps; s++)
|
|
{
|
|
/* Select hyperslab for read of one slice. */
|
|
start[0] = s * SC1 * p + my_rank * SC1;
|
|
count[0] = SC1;
|
|
if (H5Sselect_hyperslab(whole_spaceid1, H5S_SELECT_SET,
|
|
start, NULL, count, NULL) < 0)
|
|
{
|
|
ERR;
|
|
return 2;
|
|
}
|
|
|
|
if (H5Dread(dsid, H5T_NATIVE_INT, slice_spaceid, whole_spaceid1,
|
|
H5P_DEFAULT, data_in) < 0)
|
|
{
|
|
ERR;
|
|
return 2;
|
|
}
|
|
|
|
/* Check the slice of data. */
|
|
for (i = 0; i < SC1; i++)
|
|
if (data[i] != data_in[i])
|
|
{
|
|
ERR;
|
|
return 2;
|
|
}
|
|
}
|
|
|
|
/* Close down. */
|
|
if (H5Dclose(dsid) < 0 ||
|
|
H5Sclose(slice_spaceid) < 0 ||
|
|
H5Sclose(whole_spaceid1) < 0 ||
|
|
H5Pclose(fapl_id) < 0 ||
|
|
H5Fclose(fileid) < 0)
|
|
ERR;
|
|
}
|
|
if (!my_rank)
|
|
SUMMARIZE_ERR;
|
|
|
|
} /* next cf */
|
|
#else
|
|
{
|
|
if (!my_rank)
|
|
printf("*** HDF5 1.10.3 or greater required for this test.\n");
|
|
}
|
|
|
|
#endif /* HDF5_SUPPORTS_PAR_FILTERS */
|
|
|
|
MPI_Finalize();
|
|
|
|
if (!my_rank)
|
|
FINAL_RESULTS;
|
|
return 0;
|
|
}
|