/* Copyright 2003-2018, University Corporation for Atmospheric * Research. See the COPYRIGHT file for copying and redistribution * conditions. */ /** * @file @internal Internal netcdf-4 functions. * * This file contains functions internal to the netcdf4 library. None of * the functions in this file are exposed in the exetnal API. These * functions all relate to the manipulation of netcdf-4's in-memory * buffer of metadata information, i.e. the linked list of NC * structs. * * @author Ed Hartnett */ #include "config.h" #include "hdf5internal.h" #undef DEBUGH5 #ifdef DEBUGH5 /** * @internal Provide a catchable error reporting function * * @param ignored Ignored. * * @return 0 for success. */ static herr_t h5catch(void* ignored) { H5Eprint(NULL); return 0; } #endif /* These are the default chunk cache sizes for HDF5 files created or * opened with netCDF-4. */ extern size_t nc4_chunk_cache_size; extern size_t nc4_chunk_cache_nelems; extern float nc4_chunk_cache_preemption; #ifdef LOGGING /* This is the severity level of messages which will be logged. Use severity 0 for errors, 1 for important log messages, 2 for less important, etc. */ extern int nc_log_level; #endif /* LOGGING */ int nc4_hdf5_initialized = 0; /**< True if initialization has happened. */ /** * @internal Provide a wrapper for H5Eset_auto * @param func Pointer to func. * @param client_data Client data. * * @return 0 for success */ static herr_t set_auto(void* func, void *client_data) { #ifdef DEBUGH5 return H5Eset_auto2(H5E_DEFAULT,(H5E_auto2_t)h5catch,client_data); #else return H5Eset_auto2(H5E_DEFAULT,(H5E_auto2_t)func,client_data); #endif } /** * @internal Provide a function to do any necessary initialization of * the HDF5 library. */ void nc4_hdf5_initialize(void) { if (set_auto(NULL, NULL) < 0) LOG((0, "Couldn't turn off HDF5 error messages!")); LOG((1, "HDF5 error messages have been turned off.")); nc4_hdf5_initialized = 1; } /** * @internal Provide a function to do any necessary finalization of * the HDF5 library. */ void nc4_hdf5_finalize(void) { /* Reclaim global resources */ NC4_provenance_finalize(); nc4_hdf5_initialized = 0; } /** * @internal Given a varid, return the maximum length of a dimension * using dimid. * * @param grp Pointer to group info struct. * @param varid Variable ID. * @param dimid Dimension ID. * @param maxlen Pointer that gets the max length. * * @return ::NC_NOERR No error. * @author Ed Hartnett */ static int find_var_dim_max_length(NC_GRP_INFO_T *grp, int varid, int dimid, size_t *maxlen) { hid_t datasetid = 0, spaceid = 0; NC_VAR_INFO_T *var; hsize_t *h5dimlen = NULL, *h5dimlenmax = NULL; int d, dataset_ndims = 0; int retval = NC_NOERR; *maxlen = 0; /* Find this var. */ var = (NC_VAR_INFO_T*)ncindexith(grp->vars,varid); if (!var) return NC_ENOTVAR; assert(var->hdr.id == varid); /* If the var hasn't been created yet, its size is 0. */ if (!var->created) { *maxlen = 0; } else { /* Get the number of records in the dataset. */ if ((retval = nc4_open_var_grp2(grp, var->hdr.id, &datasetid))) BAIL(retval); if ((spaceid = H5Dget_space(datasetid)) < 0) BAIL(NC_EHDFERR); /* If it's a scalar dataset, it has length one. */ if (H5Sget_simple_extent_type(spaceid) == H5S_SCALAR) { *maxlen = (var->dimids && var->dimids[0] == dimid) ? 1 : 0; } else { /* Check to make sure ndims is right, then get the len of each dim in the space. */ if ((dataset_ndims = H5Sget_simple_extent_ndims(spaceid)) < 0) BAIL(NC_EHDFERR); if (dataset_ndims != var->ndims) BAIL(NC_EHDFERR); if (!(h5dimlen = malloc(dataset_ndims * sizeof(hsize_t)))) BAIL(NC_ENOMEM); if (!(h5dimlenmax = malloc(dataset_ndims * sizeof(hsize_t)))) BAIL(NC_ENOMEM); if ((dataset_ndims = H5Sget_simple_extent_dims(spaceid, h5dimlen, h5dimlenmax)) < 0) BAIL(NC_EHDFERR); LOG((5, "find_var_dim_max_length: varid %d len %d max: %d", varid, (int)h5dimlen[0], (int)h5dimlenmax[0])); for (d=0; ddimids[d] == dimid) { *maxlen = *maxlen > h5dimlen[d] ? *maxlen : h5dimlen[d]; } } } } exit: if (spaceid > 0 && H5Sclose(spaceid) < 0) BAIL2(NC_EHDFERR); if (h5dimlen) free(h5dimlen); if (h5dimlenmax) free(h5dimlenmax); return retval; } /** * @internal Search for type with a given HDF type id. * * @param h5 File * @param target_hdf_typeid HDF5 type ID to find. * * @return Pointer to type info struct, or NULL if not found. * @author Ed Hartnett */ NC_TYPE_INFO_T * nc4_rec_find_hdf_type(NC_FILE_INFO_T *h5, hid_t target_hdf_typeid) { NC_TYPE_INFO_T *type; htri_t equal; int i; assert(h5); for(i=0;ialltypes);i++) { type = (NC_TYPE_INFO_T*)nclistget(h5->alltypes,i); if(type == NULL) continue; /* Is this the type we are searching for? */ if ((equal = H5Tequal(type->native_hdf_typeid ? type->native_hdf_typeid : type->hdf_typeid, target_hdf_typeid)) < 0) return NULL; if (equal) return type; } /* Can't find it. Fate, why do you mock me? */ return NULL; } /** * @internal Find the actual length of a dim by checking the length of * that dim in all variables that use it, in grp or children. **len * must be initialized to zero before this function is called. * * @param grp Pointer to group info struct. * @param dimid Dimension ID. * @param len Pointer to pointer that gets length. * * @return ::NC_NOERR No error. * @author Ed Hartnett */ int nc4_find_dim_len(NC_GRP_INFO_T *grp, int dimid, size_t **len) { NC_GRP_INFO_T *g; NC_VAR_INFO_T *var; int retval; int i; assert(grp && len); LOG((3, "nc4_find_dim_len: grp->name %s dimid %d", grp->hdr.name, dimid)); /* If there are any groups, call this function recursively on * them. */ for(i=0;ichildren);i++) { g = (NC_GRP_INFO_T*)ncindexith(grp->children,i); if(g == NULL) continue; if ((retval = nc4_find_dim_len(g, dimid, len))) return retval; } /* For all variables in this group, find the ones that use this * dimension, and remember the max length. */ for (i=0; i < ncindexsize(grp->vars); i++) { size_t mylen; var = (NC_VAR_INFO_T*)ncindexith(grp->vars,i); if (var == NULL) continue; /* Find max length of dim in this variable... */ if ((retval = find_var_dim_max_length(grp, var->hdr.id, dimid, &mylen))) return retval; **len = **len > mylen ? **len : mylen; } return NC_NOERR; } /** * @internal Break a coordinate variable to separate the dimension and * the variable. * * This is called from nc_rename_dim() and nc_rename_var(). In some * renames, the coord variable must stay, but it is no longer a coord * variable. This function changes a coord var into an ordinary * variable. * * @param grp Pointer to group info struct. * @param coord_var Pointer to variable info struct. * @param dim Pointer to dimension info struct. * * @return ::NC_NOERR No error. * @return ::NC_ENOMEM Out of memory. * @author Quincey Koziol, Ed Hartnett */ int nc4_break_coord_var(NC_GRP_INFO_T *grp, NC_VAR_INFO_T *coord_var, NC_DIM_INFO_T *dim) { int retval = NC_NOERR; /* Sanity checks */ assert(grp && coord_var && dim && dim->coord_var == coord_var && coord_var->dim[0] == dim && coord_var->dimids[0] == dim->hdr.id && !((NC_HDF5_DIM_INFO_T *)(dim->format_dim_info))->hdf_dimscaleid); LOG((3, "%s dim %s was associated with var %s, but now has different name", __func__, dim->hdr.name, coord_var->hdr.name)); /* If we're replacing an existing dimscale dataset, go to * every var in the file and detach this dimension scale. */ if ((retval = rec_detach_scales(grp->nc4_info->root_grp, dim->hdr.id, coord_var->hdf_datasetid))) return retval; /* Allow attached dimscales to be tracked on the [former] * coordinate variable */ if (coord_var->ndims) { /* Coordinate variables shouldn't have dimscales attached. */ assert(!coord_var->dimscale_attached); /* Allocate space for tracking them */ if (!(coord_var->dimscale_attached = calloc(coord_var->ndims, sizeof(nc_bool_t)))) return NC_ENOMEM; } /* Remove the atts that go with being a coordinate var. */ /* if ((retval = remove_coord_atts(coord_var->hdf_datasetid))) */ /* return retval; */ /* Detach dimension from variable */ coord_var->dimscale = NC_FALSE; dim->coord_var = NULL; /* Set state transition indicators */ coord_var->was_coord_var = NC_TRUE; coord_var->became_coord_var = NC_FALSE; return NC_NOERR; } /** * @internal Delete an existing dimscale-only dataset. * * A dimscale-only HDF5 dataset is created when a dim is defined * without an accompanying coordinate variable. * * Sometimes, during renames, or late creation of variables, an * existing, dimscale-only dataset must be removed. This means * detaching all variables that use the dataset, then closing and * unlinking it. * * @param grp The grp of the dimscale-only dataset to be deleted, or a * higher group in the hierarchy (ex. root group). * @param dimid id of the dimension * @param dim Pointer to the dim with the dimscale-only dataset to be * deleted. * * @return ::NC_NOERR No error. * @return ::NC_EHDFERR HDF5 error. * @author Ed Hartnett */ int delete_existing_dimscale_dataset(NC_GRP_INFO_T *grp, int dimid, NC_DIM_INFO_T *dim) { NC_HDF5_DIM_INFO_T *hdf5_dim; int retval; assert(grp && dim && dim->format_dim_info); LOG((2, "%s: deleting dimscale dataset %s dimid %d", __func__, dim->hdr.name, dimid)); hdf5_dim = (NC_HDF5_DIM_INFO_T *)dim->format_dim_info; /* Detach dimscale from any variables using it */ if ((retval = rec_detach_scales(grp, dimid, hdf5_dim->hdf_dimscaleid)) < 0) return retval; /* Close the HDF5 dataset */ if (H5Dclose(hdf5_dim->hdf_dimscaleid) < 0) return NC_EHDFERR; hdf5_dim->hdf_dimscaleid = 0; /* Now delete the dataset. */ if (H5Gunlink(grp->hdf_grpid, dim->hdr.name) < 0) return NC_EHDFERR; return NC_NOERR; } /** * @internal Reform a coordinate variable from a dimension and a * variable. * * @param grp Pointer to group info struct. * @param var Pointer to variable info struct. * @param dim Pointer to dimension info struct. * * @return ::NC_NOERR No error. * @author Quincey Koziol */ int nc4_reform_coord_var(NC_GRP_INFO_T *grp, NC_VAR_INFO_T *var, NC_DIM_INFO_T *dim) { NC_HDF5_DIM_INFO_T *hdf5_dim; int need_to_reattach_scales = 0; int retval = NC_NOERR; assert(grp && var && dim && dim->format_dim_info); LOG((3, "%s: dim->hdr.name %s var->hdr.name %s", __func__, dim->hdr.name, var->hdr.name)); hdf5_dim = (NC_HDF5_DIM_INFO_T *)dim->format_dim_info; /* Detach dimscales from the [new] coordinate variable */ if (var->dimscale_attached) { int dims_detached = 0; int finished = 0; int d; /* Loop over all dimensions for variable */ for (d = 0; d < var->ndims && !finished; d++) { /* Is there a dimscale attached to this axis? */ if (var->dimscale_attached[d]) { NC_GRP_INFO_T *g; int k; for (g = grp; g && !finished; g = g->parent) { NC_DIM_INFO_T *dim1; NC_HDF5_DIM_INFO_T *hdf5_dim1; for (k = 0; k < ncindexsize(g->dim); k++) { dim1 = (NC_DIM_INFO_T *)ncindexith(g->dim, k); assert(dim1 && dim1->format_dim_info); hdf5_dim1 = (NC_HDF5_DIM_INFO_T *)dim1->format_dim_info; if (var->dimids[d] == dim1->hdr.id) { hid_t dim_datasetid; /* Dataset ID for dimension */ /* Find dataset ID for dimension */ if (dim1->coord_var) dim_datasetid = dim1->coord_var->hdf_datasetid; else dim_datasetid = hdf5_dim1->hdf_dimscaleid; /* dim_datasetid may be 0 in some cases when * renames of dims and vars are happening. In * this case, the scale has already been * detached. */ if (dim_datasetid > 0) { LOG((3, "detaching scale from %s", var->hdr.name)); if (H5DSdetach_scale(var->hdf_datasetid, dim_datasetid, d) < 0) BAIL(NC_EHDFERR); } var->dimscale_attached[d] = NC_FALSE; if (dims_detached++ == var->ndims) finished++; } } } } } /* next variable dimension */ /* Release & reset the array tracking attached dimscales */ free(var->dimscale_attached); var->dimscale_attached = NULL; need_to_reattach_scales++; } /* Use variable's dataset ID for the dimscale ID. */ if (hdf5_dim->hdf_dimscaleid && grp != NULL) { LOG((3, "closing and unlinking dimscale dataset %s", dim->hdr.name)); if (H5Dclose(hdf5_dim->hdf_dimscaleid) < 0) BAIL(NC_EHDFERR); hdf5_dim->hdf_dimscaleid = 0; /* Now delete the dimscale's dataset (it will be recreated later, if necessary) */ if (H5Gunlink(grp->hdf_grpid, dim->hdr.name) < 0) return NC_EDIMMETA; } /* Attach variable to dimension */ var->dimscale = NC_TRUE; dim->coord_var = var; /* Check if this variable used to be a coord. var */ if (need_to_reattach_scales || (var->was_coord_var && grp != NULL)) { /* Reattach the scale everywhere it is used. */ /* (Recall that netCDF dimscales are always 1-D) */ if ((retval = rec_reattach_scales(grp->nc4_info->root_grp, var->dimids[0], var->hdf_datasetid))) return retval; /* Set state transition indicator (cancels earlier transition) */ var->was_coord_var = NC_FALSE; } else /* Set state transition indicator */ var->became_coord_var = NC_TRUE; exit: return retval; } /** * @internal Recursively free HDF5 objects for a group (and everything * it contains). * * @param grp Pointer to group info struct. * * @return ::NC_NOERR No error. * @author Ed Hartnett */ int nc4_rec_grp_HDF5_del(NC_GRP_INFO_T *grp) { NC_VAR_INFO_T *var; NC_DIM_INFO_T *dim; NC_ATT_INFO_T *att; int a; int i; int retval; assert(grp); LOG((3, "%s: grp->name %s", __func__, grp->hdr.name)); /* Recursively call this function for each child, if any, stopping * if there is an error. */ for (i = 0; i < ncindexsize(grp->children); i++) if ((retval = nc4_rec_grp_HDF5_del((NC_GRP_INFO_T *)ncindexith(grp->children, i)))) return retval; /* Close HDF5 resources associated with global attributes. */ for (a = 0; a < ncindexsize(grp->att); a++) { NC_HDF5_ATT_INFO_T *hdf5_att; att = (NC_ATT_INFO_T *)ncindexith(grp->att, a); assert(att && att->format_att_info); hdf5_att = (NC_HDF5_ATT_INFO_T *)att->format_att_info; /* Close the HDF5 typeid. */ if (hdf5_att->native_hdf_typeid && H5Tclose(hdf5_att->native_hdf_typeid) < 0) return NC_EHDFERR; } /* Close HDF5 resources associated with vars. */ for (i = 0; i < ncindexsize(grp->vars); i++) { var = (NC_VAR_INFO_T *)ncindexith(grp->vars, i); assert(var); /* Close the HDF5 dataset associated with this var. */ if (var->hdf_datasetid) { LOG((3, "closing HDF5 dataset %lld", var->hdf_datasetid)); if (H5Dclose(var->hdf_datasetid) < 0) return NC_EHDFERR; } for (a = 0; a < ncindexsize(var->att); a++) { NC_HDF5_ATT_INFO_T *hdf5_att; att = (NC_ATT_INFO_T *)ncindexith(var->att, a); assert(att && att->format_att_info); hdf5_att = (NC_HDF5_ATT_INFO_T *)att->format_att_info; /* Close the HDF5 typeid if one is open. */ if (hdf5_att->native_hdf_typeid && H5Tclose(hdf5_att->native_hdf_typeid) < 0) return NC_EHDFERR; } } /* Close HDF5 resources associated with dims. */ for (i = 0; i < ncindexsize(grp->dim); i++) { NC_HDF5_DIM_INFO_T *hdf5_dim; dim = (NC_DIM_INFO_T *)ncindexith(grp->dim, i); assert(dim && dim->format_dim_info); hdf5_dim = (NC_HDF5_DIM_INFO_T *)dim->format_dim_info; /* If this is a dim without a coordinate variable, then close * the HDF5 DIM_WITHOUT_VARIABLE dataset associated with this * dim. */ if (hdf5_dim->hdf_dimscaleid && H5Dclose(hdf5_dim->hdf_dimscaleid) < 0) return NC_EHDFERR; } /* Close HDF5 resources associated with types. Set values to 0 * after closing types. Because of type reference counters, these * closes can be called multiple times. */ for (i = 0; i < ncindexsize(grp->type); i++) { NC_TYPE_INFO_T *type = (NC_TYPE_INFO_T *)ncindexith(grp->type, i); assert(type); /* Close any open user-defined HDF5 typeids. */ if (type->hdf_typeid && H5Tclose(type->hdf_typeid) < 0) return NC_EHDFERR; type->hdf_typeid = 0; if (type->native_hdf_typeid && H5Tclose(type->native_hdf_typeid) < 0) return NC_EHDFERR; type->native_hdf_typeid = 0; /* Class-specific cleanup. Only enums and vlens have HDF5 * resources to close. */ switch (type->nc_type_class) { case NC_ENUM: if (type->u.e.base_hdf_typeid && H5Tclose(type->u.e.base_hdf_typeid) < 0) return NC_EHDFERR; type->u.e.base_hdf_typeid = 0; break; case NC_VLEN: if (type->u.v.base_hdf_typeid && H5Tclose(type->u.v.base_hdf_typeid) < 0) return NC_EHDFERR; type->u.v.base_hdf_typeid = 0; break; default: /* Do nothing. */ break; } } /* Close the HDF5 group. */ LOG((4, "%s: closing group %s", __func__, grp->hdr.name)); if (grp->hdf_grpid && H5Gclose(grp->hdf_grpid) < 0) return NC_EHDFERR; return NC_NOERR; } #ifdef LOGGING /* We will need to check against nc log level from nc4internal.c. */ extern int nc_log_level; /** * @internal This is like nc_set_log_level(), but will also turn on * HDF5 internal logging, in addition to netCDF logging. This should * never be called by the user. It is called in open/create when the * nc logging level has changed. * * @return ::NC_NOERR No error. * @author Ed Hartnett */ int hdf5_set_log_level() { /* If the user wants to completely turn off logging, turn off HDF5 logging too. Now I truely can't think of what to do if this fails, so just ignore the return code. */ if (nc_log_level == NC_TURN_OFF_LOGGING) { set_auto(NULL, NULL); LOG((1, "HDF5 error messages turned off!")); } else { if (set_auto((H5E_auto_t)&H5Eprint, stderr) < 0) LOG((0, "H5Eset_auto failed!")); LOG((1, "HDF5 error messages turned on.")); } return NC_NOERR; } #endif /* LOGGING */