2018-02-08 21:20:58 +08:00
|
|
|
/* Copyright 2018, UCAR/Unidata See netcdf/COPYRIGHT file for copying
|
|
|
|
* and redistribution conditions.*/
|
|
|
|
/**
|
2019-08-04 22:03:53 +08:00
|
|
|
* @file
|
|
|
|
* @internal The HDF4 file functions. These provide a read-only
|
|
|
|
* interface to HDF4 SD files.
|
2018-02-08 21:20:58 +08:00
|
|
|
*
|
|
|
|
* @author Ed Hartnett
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include "config.h"
|
|
|
|
#include "nc4internal.h"
|
|
|
|
#include "hdf4dispatch.h"
|
|
|
|
#include <mfhdf.h>
|
|
|
|
|
2018-04-05 04:11:44 +08:00
|
|
|
#define NUM_TYPES 12 /**< Number of netCDF atomic types. */
|
|
|
|
|
2018-02-08 21:20:58 +08:00
|
|
|
extern int nc4_vararray_add(NC_GRP_INFO_T *grp, NC_VAR_INFO_T *var);
|
|
|
|
|
|
|
|
/** @internal These flags may not be set for open mode. */
|
2018-04-05 04:11:44 +08:00
|
|
|
static const int
|
2018-09-23 09:22:34 +08:00
|
|
|
ILLEGAL_OPEN_FLAGS = (NC_MMAP|NC_64BIT_OFFSET|NC_DISKLESS|NC_WRITE);
|
2018-04-05 04:11:44 +08:00
|
|
|
|
|
|
|
/** @internal NetCDF atomic type names. */
|
|
|
|
static const char*
|
|
|
|
nc_type_name_g[NUM_TYPES] = {"char", "byte", "short", "int", "float", "double",
|
|
|
|
"ubyte", "ushort", "uint", "int64", "uint64",
|
|
|
|
"string"};
|
|
|
|
|
|
|
|
/** @internal NetCDF atomic type sizes. */
|
|
|
|
static const size_t
|
|
|
|
nc_type_size_g[NUM_TYPES] = {sizeof(char), sizeof(char), sizeof(short),
|
|
|
|
sizeof(int), sizeof(float), sizeof(double),
|
|
|
|
sizeof(unsigned char), sizeof(unsigned short),
|
|
|
|
sizeof(unsigned int), sizeof(long long),
|
|
|
|
sizeof(unsigned long long), sizeof(char *)};
|
2018-02-08 21:20:58 +08:00
|
|
|
|
|
|
|
/**
|
2018-04-05 04:11:44 +08:00
|
|
|
* @internal Recursively delete the data for a group (and everything
|
|
|
|
* it contains) in our internal metadata store.
|
2018-02-08 21:20:58 +08:00
|
|
|
*
|
2018-04-05 04:11:44 +08:00
|
|
|
* @param grp Pointer to group info struct.
|
2018-02-08 21:20:58 +08:00
|
|
|
*
|
|
|
|
* @return ::NC_NOERR No error.
|
|
|
|
* @author Ed Hartnett
|
2018-04-05 04:11:44 +08:00
|
|
|
*/
|
2018-02-08 21:20:58 +08:00
|
|
|
static int
|
2018-04-05 04:11:44 +08:00
|
|
|
hdf4_rec_grp_del(NC_GRP_INFO_T *grp)
|
2018-02-08 21:20:58 +08:00
|
|
|
{
|
2019-02-19 20:17:00 +08:00
|
|
|
NC_VAR_INFO_T *var;
|
|
|
|
int i;
|
|
|
|
|
|
|
|
assert(grp);
|
|
|
|
LOG((3, "%s: grp->name %s", __func__, grp->hdr.name));
|
|
|
|
|
|
|
|
/* Delete all vars. */
|
|
|
|
for (i = 0; i < ncindexsize(grp->vars); i++)
|
|
|
|
{
|
|
|
|
NC_VAR_HDF4_INFO_T *hdf4_var;
|
|
|
|
|
|
|
|
var = (NC_VAR_INFO_T *)ncindexith(grp->vars, i);
|
|
|
|
assert(var);
|
|
|
|
LOG((4, "%s: deleting var %s", __func__, var->hdr.name));
|
|
|
|
|
|
|
|
/* Get the HDF4 specific var metadata. */
|
|
|
|
hdf4_var = (NC_VAR_HDF4_INFO_T *)var->format_var_info;
|
|
|
|
|
|
|
|
/* Close HDF4 dataset associated with this var, unless it's a
|
|
|
|
* scale. */
|
|
|
|
if (hdf4_var->sdsid && SDendaccess(hdf4_var->sdsid) < 0)
|
|
|
|
return NC_EHDFERR;
|
2020-03-30 02:48:59 +08:00
|
|
|
|
|
|
|
nullfree(hdf4_var);
|
2019-02-19 20:17:00 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
return NC_NOERR;
|
2018-02-08 21:20:58 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* @internal Given an HDF4 type, set a pointer to netcdf type.
|
|
|
|
*
|
|
|
|
* See http://www.hdfgroup.org/training/HDFtraining/UsersGuide/Fundmtls.fm3.html
|
|
|
|
* for more information re: HDF4 types.
|
|
|
|
*
|
|
|
|
* @param h5 Pointer to HDF5 file info struct.
|
|
|
|
* @param hdf4_typeid Type ID for hdf4 datatype.
|
2018-04-05 04:11:44 +08:00
|
|
|
* @param xtype Pointer that gets netcdf type. Ignored if NULL.
|
|
|
|
* @param endniannessp Pointer that gets endianness. Ignored if NULL.
|
|
|
|
* @param type_sizep Pointer that gets type size. Ignored if NULL.
|
|
|
|
* @param type_name Pointer that gets the type name. Ignored if NULL.
|
2018-02-08 21:20:58 +08:00
|
|
|
*
|
|
|
|
* @return ::NC_NOERR No error.
|
|
|
|
* @author Ed Hartnett
|
|
|
|
*/
|
|
|
|
static int
|
2018-06-22 21:08:09 +08:00
|
|
|
hdf4_type_info(NC_FILE_INFO_T *h5, int32 hdf4_typeid, nc_type* xtypep,
|
2018-04-05 04:11:44 +08:00
|
|
|
int *endiannessp, size_t *type_sizep, char *type_name)
|
2018-02-08 21:20:58 +08:00
|
|
|
{
|
2019-02-19 20:17:00 +08:00
|
|
|
int t = 0;
|
|
|
|
int endianness = NC_ENDIAN_BIG;
|
|
|
|
nc_type xtype;
|
|
|
|
|
|
|
|
assert(h5);
|
|
|
|
|
|
|
|
switch(hdf4_typeid)
|
|
|
|
{
|
|
|
|
case DFNT_CHAR:
|
|
|
|
xtype = NC_CHAR;
|
|
|
|
t = 0;
|
|
|
|
break;
|
|
|
|
case DFNT_UCHAR:
|
|
|
|
case DFNT_UINT8:
|
|
|
|
xtype = NC_UBYTE;
|
|
|
|
t = 6;
|
|
|
|
break;
|
|
|
|
case DFNT_LUINT8:
|
|
|
|
xtype = NC_UBYTE;
|
|
|
|
t = 6;
|
|
|
|
endianness = NC_ENDIAN_LITTLE;
|
|
|
|
break;
|
|
|
|
case DFNT_INT8:
|
|
|
|
xtype = NC_BYTE;
|
|
|
|
t = 1;
|
|
|
|
break;
|
|
|
|
case DFNT_LINT8:
|
|
|
|
xtype = NC_BYTE;
|
|
|
|
t = 1;
|
|
|
|
endianness = NC_ENDIAN_LITTLE;
|
|
|
|
break;
|
|
|
|
case DFNT_INT16:
|
|
|
|
xtype = NC_SHORT;
|
|
|
|
t = 2;
|
|
|
|
break;
|
|
|
|
case DFNT_LINT16:
|
|
|
|
xtype = NC_SHORT;
|
|
|
|
t = 2;
|
|
|
|
endianness = NC_ENDIAN_LITTLE;
|
|
|
|
break;
|
|
|
|
case DFNT_UINT16:
|
|
|
|
xtype = NC_USHORT;
|
|
|
|
t = 7;
|
|
|
|
break;
|
|
|
|
case DFNT_LUINT16:
|
|
|
|
xtype = NC_USHORT;
|
|
|
|
t = 7;
|
|
|
|
endianness = NC_ENDIAN_LITTLE;
|
|
|
|
break;
|
|
|
|
case DFNT_INT32:
|
|
|
|
xtype = NC_INT;
|
|
|
|
t = 3;
|
|
|
|
break;
|
|
|
|
case DFNT_LINT32:
|
|
|
|
xtype = NC_INT;
|
|
|
|
t = 3;
|
|
|
|
endianness = NC_ENDIAN_LITTLE;
|
|
|
|
break;
|
|
|
|
case DFNT_UINT32:
|
|
|
|
xtype = NC_UINT;
|
|
|
|
t = 8;
|
|
|
|
break;
|
|
|
|
case DFNT_LUINT32:
|
|
|
|
xtype = NC_UINT;
|
|
|
|
t = 8;
|
|
|
|
endianness = NC_ENDIAN_LITTLE;
|
|
|
|
break;
|
|
|
|
case DFNT_FLOAT32:
|
|
|
|
xtype = NC_FLOAT;
|
|
|
|
t = 4;
|
|
|
|
break;
|
|
|
|
case DFNT_LFLOAT32:
|
|
|
|
xtype = NC_FLOAT;
|
|
|
|
t = 4;
|
|
|
|
endianness = NC_ENDIAN_LITTLE;
|
|
|
|
break;
|
|
|
|
case DFNT_FLOAT64:
|
|
|
|
xtype = NC_DOUBLE;
|
|
|
|
t = 5;
|
|
|
|
break;
|
|
|
|
case DFNT_LFLOAT64:
|
|
|
|
xtype = NC_DOUBLE;
|
|
|
|
t = 5;
|
|
|
|
endianness = NC_ENDIAN_LITTLE;
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
return NC_EBADTYPID;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Return results to caller. */
|
|
|
|
if (xtypep)
|
|
|
|
*xtypep = xtype;
|
|
|
|
if (endiannessp)
|
|
|
|
*endiannessp = endianness;
|
|
|
|
if (type_sizep)
|
|
|
|
*type_sizep = nc_type_size_g[t];
|
|
|
|
if (type_name)
|
|
|
|
strncpy(type_name, nc_type_name_g[t], NC_MAX_NAME);
|
|
|
|
|
|
|
|
return NC_NOERR;
|
2018-04-05 04:11:44 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* @internal Set the type of a netCDF-4 variable.
|
|
|
|
*
|
|
|
|
* @param xtype A netcdf type.
|
|
|
|
* @param endianness The endianness of the data.
|
|
|
|
* @param type_size The size in bytes of one element of this type.
|
|
|
|
* @param type_name A name for the type.
|
|
|
|
* @param typep Pointer to a pointer that gets the TYPE_INFO_T struct.
|
|
|
|
*
|
|
|
|
* @return ::NC_NOERR No error.
|
|
|
|
* @author Ed Hartnett
|
|
|
|
*/
|
|
|
|
static int
|
|
|
|
nc4_set_var_type(nc_type xtype, int endianness, size_t type_size, char *type_name,
|
|
|
|
NC_TYPE_INFO_T **typep)
|
|
|
|
{
|
2019-02-19 20:17:00 +08:00
|
|
|
NC_TYPE_INFO_T *type;
|
|
|
|
|
|
|
|
/* Check inputs. */
|
|
|
|
assert(typep);
|
|
|
|
|
|
|
|
/* Allocate space for the type info struct. */
|
|
|
|
if (!(type = calloc(1, sizeof(NC_TYPE_INFO_T))))
|
|
|
|
return NC_ENOMEM;
|
|
|
|
if (!(type->hdr.name = strdup(type_name)))
|
|
|
|
{
|
|
|
|
free(type);
|
|
|
|
return NC_ENOMEM;
|
|
|
|
}
|
|
|
|
type->hdr.sort = NCTYP;
|
|
|
|
|
|
|
|
/* Determine the type class. */
|
|
|
|
if (xtype == NC_FLOAT)
|
|
|
|
type->nc_type_class = NC_FLOAT;
|
|
|
|
else if (xtype == NC_DOUBLE)
|
|
|
|
type->nc_type_class = NC_DOUBLE;
|
|
|
|
else if (xtype == NC_CHAR)
|
|
|
|
type->nc_type_class = NC_STRING;
|
|
|
|
else
|
|
|
|
type->nc_type_class = NC_INT;
|
|
|
|
|
|
|
|
/* Set other type info values. */
|
|
|
|
type->endianness = endianness;
|
|
|
|
type->size = type_size;
|
|
|
|
type->hdr.id = (size_t)xtype;
|
|
|
|
|
|
|
|
/* Return to caller. */
|
|
|
|
*typep = type;
|
|
|
|
|
|
|
|
return NC_NOERR;
|
2018-02-08 21:20:58 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
2018-04-05 04:11:44 +08:00
|
|
|
* @internal Read an attribute from a HDF4 file.
|
2018-02-08 21:20:58 +08:00
|
|
|
*
|
2018-04-05 04:11:44 +08:00
|
|
|
* @param h5 Pointer to the file metadata struct.
|
|
|
|
* @param var Pointer to variable metadata struct or NULL for global
|
|
|
|
* attributes.
|
|
|
|
* @param a Index of attribute to read.
|
2018-02-08 21:20:58 +08:00
|
|
|
*
|
|
|
|
* @return ::NC_NOERR No error.
|
2018-04-05 04:11:44 +08:00
|
|
|
* @return ::NC_EHDFERR HDF4 error.
|
|
|
|
* @return ::NC_EATTMETA Error reading HDF4 attribute.
|
|
|
|
* @return ::NC_ENOMEM Out of memory.
|
2018-02-08 21:20:58 +08:00
|
|
|
* @author Ed Hartnett
|
2018-04-05 04:11:44 +08:00
|
|
|
*/
|
2018-02-08 21:20:58 +08:00
|
|
|
static int
|
2018-06-22 21:08:09 +08:00
|
|
|
hdf4_read_att(NC_FILE_INFO_T *h5, NC_VAR_INFO_T *var, int a)
|
2018-02-08 21:20:58 +08:00
|
|
|
{
|
2019-02-19 20:17:00 +08:00
|
|
|
NC_HDF4_FILE_INFO_T *hdf4_file;
|
|
|
|
NC_ATT_INFO_T *att;
|
|
|
|
NCindex *att_list;
|
|
|
|
int32 att_data_type, att_count;
|
|
|
|
size_t att_type_size;
|
|
|
|
char name[NC_MAX_HDF4_NAME+1];
|
|
|
|
int sd_id;
|
|
|
|
int retval;
|
|
|
|
|
|
|
|
LOG((3, "%s: a %d var %s", __func__, a, var ? var->hdr.name : "global"));
|
|
|
|
|
|
|
|
/* Check inputs. */
|
|
|
|
assert(h5 && h5->format_file_info);
|
|
|
|
|
|
|
|
/* Get the HDF4 file info. */
|
|
|
|
hdf4_file = h5->format_file_info;
|
|
|
|
|
|
|
|
/* Decide what att list to use, global or from a var. */
|
|
|
|
if (var)
|
|
|
|
{
|
|
|
|
NC_VAR_HDF4_INFO_T *hdf4_var;
|
|
|
|
assert(var->format_var_info);
|
|
|
|
att_list = var->att;
|
|
|
|
hdf4_var = var->format_var_info;
|
|
|
|
sd_id = hdf4_var->sdsid;
|
|
|
|
} else {
|
|
|
|
att_list = h5->root_grp->att;
|
|
|
|
sd_id = hdf4_file->sdid;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Learn about this attribute. */
|
|
|
|
if (SDattrinfo(sd_id, a, name, &att_data_type, &att_count))
|
|
|
|
return NC_EATTMETA;
|
|
|
|
|
|
|
|
/* Get information about the attribute type. */
|
|
|
|
nc_type xtype;
|
|
|
|
if ((retval = hdf4_type_info(h5, att_data_type, &xtype, NULL,
|
|
|
|
&att_type_size, NULL)))
|
|
|
|
return retval;
|
|
|
|
|
|
|
|
/* Add to the end of the list of atts for this var. */
|
|
|
|
if ((retval = nc4_att_list_add(att_list, name, &att)))
|
|
|
|
return retval;
|
|
|
|
att->nc_typeid = xtype;
|
|
|
|
att->created = NC_TRUE;
|
|
|
|
att->len = att_count;
|
|
|
|
|
|
|
|
/* Allocate memory to hold the data. */
|
|
|
|
if (att->len)
|
|
|
|
if (!(att->data = malloc(att_type_size * att->len)))
|
|
|
|
return NC_ENOMEM;
|
|
|
|
|
|
|
|
/* Read the data. */
|
|
|
|
if (SDreadattr(sd_id, a, att->data))
|
|
|
|
return NC_EHDFERR;
|
|
|
|
|
|
|
|
return NC_NOERR;
|
2018-04-05 04:11:44 +08:00
|
|
|
}
|
2018-02-08 21:20:58 +08:00
|
|
|
|
2018-04-05 04:11:44 +08:00
|
|
|
/**
|
|
|
|
* @internal Read a HDF4 dimension. As new dimensions are found, add
|
|
|
|
* them to the metadata list of dimensions.
|
|
|
|
*
|
|
|
|
* @param h5 Pointer to the file metadata struct.
|
|
|
|
* @param var Pointer to variable metadata struct or NULL for global
|
|
|
|
* attributes.
|
|
|
|
* @param rec_dim_len Actual length of first dim for this SD.
|
|
|
|
* @param d Dimension index for this SD.
|
2019-02-19 20:17:00 +08:00
|
|
|
*
|
2018-04-05 04:11:44 +08:00
|
|
|
* @return ::NC_NOERR No error.
|
|
|
|
* @return ::NC_EHDFERR HDF4 error.
|
|
|
|
* @return ::NC_EDIMMETA Error reading HDF4 dimension info.
|
|
|
|
* @return ::NC_ENOMEM Out of memory.
|
|
|
|
* @return ::NC_EMAXNAME Name too long.
|
|
|
|
* @author Ed Hartnett
|
|
|
|
*/
|
|
|
|
static int
|
2018-06-22 21:08:09 +08:00
|
|
|
hdf4_read_dim(NC_FILE_INFO_T *h5, NC_VAR_INFO_T *var, int rec_dim_len, int d)
|
2018-04-05 04:11:44 +08:00
|
|
|
{
|
2019-02-19 20:17:00 +08:00
|
|
|
NC_VAR_HDF4_INFO_T *hdf4_var;
|
|
|
|
NC_DIM_INFO_T *dim = NULL;
|
|
|
|
int32 dimid, dim_len, dim_data_type, dim_num_attrs;
|
|
|
|
char dim_name[NC_MAX_NAME + 1];
|
|
|
|
int i;
|
|
|
|
int retval;
|
|
|
|
|
|
|
|
assert(h5 && h5->format_file_info && var && var->format_var_info);
|
|
|
|
hdf4_var = var->format_var_info;
|
|
|
|
|
|
|
|
/* Get information about the dimension. */
|
|
|
|
if ((dimid = SDgetdimid(hdf4_var->sdsid, d)) == FAIL)
|
|
|
|
return NC_EDIMMETA;
|
|
|
|
if (SDdiminfo(dimid, dim_name, &dim_len, &dim_data_type, &dim_num_attrs))
|
|
|
|
return NC_EDIMMETA;
|
|
|
|
if (strlen(dim_name) > NC_MAX_HDF4_NAME)
|
|
|
|
return NC_EMAXNAME;
|
|
|
|
|
|
|
|
/* Do we already have this dimension? HDF4 explicitly uses
|
|
|
|
* the name to tell. */
|
|
|
|
for (i = 0; i < ncindexsize(h5->root_grp->dim); i++)
|
|
|
|
{
|
|
|
|
dim = (NC_DIM_INFO_T*)ncindexith(h5->root_grp->dim, i);
|
|
|
|
if (!strcmp(dim->hdr.name, dim_name))
|
|
|
|
break;
|
|
|
|
dim = NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* If we didn't find this dimension, add one. */
|
|
|
|
if (!dim)
|
|
|
|
{
|
|
|
|
LOG((4, "adding dim %s for dataset %s", dim_name, var->hdr.name));
|
|
|
|
if ((retval = nc4_dim_list_add(h5->root_grp, dim_name,
|
|
|
|
(dim_len ? dim_len : rec_dim_len), -1, &dim)))
|
|
|
|
return retval;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Tell the variable the id of this dimension. */
|
|
|
|
var->dimids[d] = dim->hdr.id;
|
|
|
|
var->dim[d] = dim;
|
|
|
|
|
|
|
|
return NC_NOERR;
|
2018-04-05 04:11:44 +08:00
|
|
|
}
|
2018-02-08 21:20:58 +08:00
|
|
|
|
2018-04-05 04:11:44 +08:00
|
|
|
/**
|
|
|
|
* @internal Create a new variable and insert int relevant lists
|
|
|
|
*
|
|
|
|
* @param grp the containing group
|
|
|
|
* @param name the name for the new variable
|
|
|
|
* @param ndims the rank of the new variable
|
|
|
|
* @param format_var_info Pointer to format-specific var info struct.
|
|
|
|
* @param var Pointer in which to return a pointer to the new var.
|
|
|
|
*
|
|
|
|
* @return ::NC_NOERR No error.
|
|
|
|
* @return ::NC_ENOMEM Out of memory.
|
|
|
|
* @author Ed Hartnett
|
|
|
|
*/
|
|
|
|
static int
|
|
|
|
nc4_var_list_add_full(NC_GRP_INFO_T* grp, const char* name, int ndims, nc_type xtype,
|
|
|
|
int endianness, size_t type_size, char *type_name, void *fill_value,
|
|
|
|
int contiguous, size_t *chunksizes, void *format_var_info,
|
|
|
|
NC_VAR_INFO_T **var)
|
|
|
|
{
|
2019-02-19 20:17:00 +08:00
|
|
|
int d;
|
|
|
|
int retval;
|
|
|
|
|
|
|
|
/* Add the VAR_INFO_T struct to our list of vars. */
|
|
|
|
if ((retval = nc4_var_list_add(grp, name, ndims, var)))
|
|
|
|
return retval;
|
|
|
|
(*var)->created = NC_TRUE;
|
|
|
|
(*var)->written_to = NC_TRUE;
|
|
|
|
(*var)->format_var_info = format_var_info;
|
|
|
|
(*var)->atts_read = 1;
|
|
|
|
|
|
|
|
/* Fill special type_info struct for variable type information. */
|
|
|
|
if ((retval = nc4_set_var_type(xtype, endianness, type_size, type_name,
|
|
|
|
&(*var)->type_info)))
|
|
|
|
return retval;
|
This PR adds EXPERIMENTAL support for accessing data in the
cloud using a variant of the Zarr protocol and storage
format. This enhancement is generically referred to as "NCZarr".
The data model supported by NCZarr is netcdf-4 minus the user-defined
types and the String type. In this sense it is similar to the CDF-5
data model.
More detailed information about enabling and using NCZarr is
described in the document NUG/nczarr.md and in a
[Unidata Developer's blog entry](https://www.unidata.ucar.edu/blogs/developer/en/entry/overview-of-zarr-support-in).
WARNING: this code has had limited testing, so do use this version
for production work. Also, performance improvements are ongoing.
Note especially the following platform matrix of successful tests:
Platform | Build System | S3 support
------------------------------------
Linux+gcc | Automake | yes
Linux+gcc | CMake | yes
Visual Studio | CMake | no
Additionally, and as a consequence of the addition of NCZarr,
major changes have been made to the Filter API. NOTE: NCZarr
does not yet support filters, but these changes are enablers for
that support in the future. Note that it is possible
(probable?) that there will be some accidental reversions if the
changes here did not correctly mimic the existing filter testing.
In any case, previously filter ids and parameters were of type
unsigned int. In order to support the more general zarr filter
model, this was all converted to char*. The old HDF5-specific,
unsigned int operations are still supported but they are
wrappers around the new, char* based nc_filterx_XXX functions.
This entailed at least the following changes:
1. Added the files libdispatch/dfilterx.c and include/ncfilter.h
2. Some filterx utilities have been moved to libdispatch/daux.c
3. A new entry, "filter_actions" was added to the NCDispatch table
and the version bumped.
4. An overly complex set of structs was created to support funnelling
all of the filterx operations thru a single dispatch
"filter_actions" entry.
5. Move common code to from libhdf5 to libsrc4 so that it is accessible
to nczarr.
Changes directly related to Zarr:
1. Modified CMakeList.txt and configure.ac to support both C and C++
-- this is in support of S3 support via the awd-sdk libraries.
2. Define a size64_t type to support nczarr.
3. More reworking of libdispatch/dinfermodel.c to
support zarr and to regularize the structure of the fragments
section of a URL.
Changes not directly related to Zarr:
1. Make client-side filter registration be conditional, with default off.
2. Hack include/nc4internal.h to make some flags added by Ed be unique:
e.g. NC_CREAT, NC_INDEF, etc.
3. cleanup include/nchttp.h and libdispatch/dhttp.c.
4. Misc. changes to support compiling under Visual Studio including:
* Better testing under windows for dirent.h and opendir and closedir.
5. Misc. changes to the oc2 code to support various libcurl CURLOPT flags
and to centralize error reporting.
6. By default, suppress the vlen tests that have unfixed memory leaks; add option to enable them.
7. Make part of the nc_test/test_byterange.sh test be contingent on remotetest.unidata.ucar.edu being accessible.
Changes Left TO-DO:
1. fix provenance code, it is too HDF5 specific.
2020-06-29 08:02:47 +08:00
|
|
|
/* Propate the endianness to the variable */
|
|
|
|
(*var)->endianness = (*var)->type_info->endianness;
|
2019-02-19 20:17:00 +08:00
|
|
|
|
|
|
|
(*var)->type_info->rc++;
|
|
|
|
|
|
|
|
/* Handle fill value, if provided. */
|
|
|
|
if (fill_value)
|
|
|
|
{
|
|
|
|
if (!((*var)->fill_value = malloc(type_size)))
|
|
|
|
return NC_ENOMEM;
|
|
|
|
memcpy((*var)->fill_value, fill_value, type_size);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Var contiguous or chunked? */
|
2020-03-08 21:28:30 +08:00
|
|
|
if (contiguous)
|
|
|
|
(*var)->storage = NC_CONTIGUOUS;
|
|
|
|
else
|
|
|
|
(*var)->storage = NC_CHUNKED;
|
2019-02-19 20:17:00 +08:00
|
|
|
|
|
|
|
/* Were chunksizes provided? */
|
|
|
|
if (chunksizes)
|
|
|
|
{
|
|
|
|
if (!((*var)->chunksizes = malloc(ndims * sizeof(size_t))))
|
|
|
|
return NC_ENOMEM;
|
|
|
|
for (d = 0; d < ndims; d++)
|
|
|
|
(*var)->chunksizes[d] = chunksizes[d];
|
|
|
|
}
|
|
|
|
|
|
|
|
return NC_NOERR;
|
2018-04-05 04:11:44 +08:00
|
|
|
}
|
2018-02-08 21:20:58 +08:00
|
|
|
|
2018-04-05 04:11:44 +08:00
|
|
|
/**
|
|
|
|
* @internal Read a HDF4 variable, including its associated dimensions
|
|
|
|
* and attributes.
|
|
|
|
*
|
|
|
|
* @param h5 Pointer to the file metadata struct.
|
|
|
|
* @param v Index of variable to read.
|
2019-02-19 20:17:00 +08:00
|
|
|
*
|
2018-04-05 04:11:44 +08:00
|
|
|
* @return ::NC_NOERR No error.
|
|
|
|
* @return ::NC_EHDFERR HDF4 error.
|
|
|
|
* @return ::NC_EDIMMETA Error reading HDF4 dimension info.
|
|
|
|
* @return ::NC_EVARMETA Error reading HDF4 dataset or att.
|
|
|
|
* @return ::NC_EATTMETA Error reading HDF4 attribute.
|
|
|
|
* @return ::NC_ENOMEM Out of memory.
|
|
|
|
* @return ::NC_EMAXNAME Name too long.
|
|
|
|
* @author Ed Hartnett
|
|
|
|
*/
|
|
|
|
static int
|
2018-06-22 21:08:09 +08:00
|
|
|
hdf4_read_var(NC_FILE_INFO_T *h5, int v)
|
2018-04-05 04:11:44 +08:00
|
|
|
{
|
2019-02-19 20:17:00 +08:00
|
|
|
NC_HDF4_FILE_INFO_T *hdf4_file;
|
|
|
|
NC_VAR_INFO_T *var;
|
|
|
|
NC_VAR_HDF4_INFO_T *hdf4_var;
|
|
|
|
HDF_CHUNK_DEF chunkdefs;
|
|
|
|
int32 data_type, num_atts;
|
|
|
|
int32 dimsize[NC_MAX_HDF4_DIMS];
|
|
|
|
int32 rec_dim_len;
|
|
|
|
int32 rank;
|
|
|
|
int32 sdsid;
|
|
|
|
int contiguous;
|
|
|
|
int d, a;
|
|
|
|
int flag;
|
|
|
|
char name[NC_MAX_HDF4_NAME+1];
|
|
|
|
int xtype;
|
|
|
|
char type_name[NC_MAX_NAME + 1];
|
|
|
|
int endianness;
|
|
|
|
size_t type_size;
|
|
|
|
void *fill_value;
|
|
|
|
size_t *chunksizes = NULL;
|
|
|
|
int retval;
|
|
|
|
|
|
|
|
/* Check inputs. */
|
|
|
|
assert(h5 && h5->format_file_info);
|
|
|
|
|
|
|
|
/* Get HDF4 file metadata. */
|
|
|
|
hdf4_file = h5->format_file_info;
|
|
|
|
|
|
|
|
/* Open this dataset in HDF4 file. */
|
|
|
|
if ((sdsid = SDselect(hdf4_file->sdid, v)) == FAIL)
|
|
|
|
return NC_EVARMETA;
|
|
|
|
|
|
|
|
/* Learn about this dataset. */
|
|
|
|
if (SDgetinfo(sdsid, name, &rank, dimsize, &data_type, &num_atts))
|
|
|
|
return NC_EVARMETA;
|
|
|
|
rec_dim_len = dimsize[0];
|
|
|
|
|
|
|
|
/* Get chunking info from HDF4 file. */
|
|
|
|
if (SDgetchunkinfo(sdsid, &chunkdefs, &flag))
|
|
|
|
return NC_EVARMETA;
|
|
|
|
|
|
|
|
/* Learn about the HDF4 type. */
|
|
|
|
if ((retval = hdf4_type_info(h5, data_type, &xtype, &endianness, &type_size,
|
|
|
|
type_name)))
|
|
|
|
return retval;
|
|
|
|
|
|
|
|
/* Get the fill value. */
|
|
|
|
if (!(fill_value = malloc(type_size)))
|
|
|
|
return NC_ENOMEM;
|
|
|
|
if (SDgetfillvalue(sdsid, fill_value))
|
|
|
|
{
|
|
|
|
/* Whoops! No fill value! */
|
|
|
|
free(fill_value);
|
|
|
|
fill_value = NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Is variable chunked or contiguous? */
|
|
|
|
if (flag == HDF_NONE)
|
|
|
|
contiguous = NC_TRUE;
|
|
|
|
else if (flag & HDF_CHUNK)
|
|
|
|
{
|
|
|
|
contiguous = NC_FALSE;
|
|
|
|
if (!(chunksizes = malloc(rank * sizeof(size_t))))
|
|
|
|
return NC_ENOMEM;
|
|
|
|
for (d = 0; d < rank; d++)
|
|
|
|
chunksizes[d] = chunkdefs.chunk_lengths[d];
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Malloc a struct to hold HDF4-specific variable
|
|
|
|
* information. */
|
|
|
|
if (!(hdf4_var = malloc(sizeof(NC_VAR_HDF4_INFO_T))))
|
|
|
|
return NC_ENOMEM;
|
|
|
|
|
|
|
|
/* Remember these values. */
|
|
|
|
hdf4_var->hdf4_data_type = data_type;
|
|
|
|
hdf4_var->sdsid = sdsid;
|
|
|
|
|
|
|
|
/* Add a variable to metadata structures. */
|
|
|
|
LOG((3, "adding var for HDF4 dataset %s, rank %d netCDF type %d", name,
|
|
|
|
rank, xtype));
|
|
|
|
retval = nc4_var_list_add_full(h5->root_grp, name, (int)rank,
|
|
|
|
xtype, endianness, type_size, type_name,
|
|
|
|
fill_value, contiguous, chunksizes, hdf4_var,
|
|
|
|
&var);
|
|
|
|
|
|
|
|
/* Free resources. */
|
|
|
|
if (chunksizes)
|
|
|
|
free(chunksizes);
|
|
|
|
if (fill_value)
|
|
|
|
free(fill_value);
|
|
|
|
|
|
|
|
/* Did the add fail? */
|
|
|
|
if (retval)
|
|
|
|
{
|
|
|
|
free(hdf4_var);
|
|
|
|
return retval;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Find the variable's dimensions. */
|
|
|
|
for (d = 0; d < var->ndims; d++)
|
|
|
|
if ((retval = hdf4_read_dim(h5, var, rec_dim_len, d)))
|
|
|
|
return retval;
|
|
|
|
|
|
|
|
/* Read the variable's attributes. */
|
|
|
|
for (a = 0; a < num_atts; a++)
|
|
|
|
if ((retval = hdf4_read_att(h5, var, a)))
|
|
|
|
return retval;
|
|
|
|
|
|
|
|
return NC_NOERR;
|
2018-02-08 21:20:58 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
2019-07-05 00:13:54 +08:00
|
|
|
* @internal Open a HDF4 SD file for read-only access.
|
2018-02-08 21:20:58 +08:00
|
|
|
*
|
|
|
|
* @param path The file name of the file.
|
|
|
|
* @param mode The open mode flag.
|
|
|
|
* @param basepe Ignored by this function.
|
|
|
|
* @param chunksizehintp Ignored by this function.
|
|
|
|
* @param parameters pointer to struct holding extra data (e.g. for
|
2019-07-05 00:14:28 +08:00
|
|
|
* parallel I/O) layer. Ignored if NULL. Ignored by this function.
|
2018-02-08 21:20:58 +08:00
|
|
|
* @param dispatch Pointer to the dispatch table for this file.
|
2019-07-05 00:13:15 +08:00
|
|
|
* @param nc_file Pointer to an instance of NC. The ncid has already
|
|
|
|
* been assigned, and is in nc_file->ext_ncid.
|
2018-02-08 21:20:58 +08:00
|
|
|
*
|
|
|
|
* @return ::NC_NOERR No error.
|
|
|
|
* @return ::NC_EINVAL Invalid input.
|
2019-07-05 00:13:15 +08:00
|
|
|
* @return ::NC_EHDFERR Error from HDF4 layer.
|
2019-07-05 00:15:32 +08:00
|
|
|
* @return ::NC_ENOMEM Out of memory.
|
2018-02-08 21:20:58 +08:00
|
|
|
* @author Ed Hartnett
|
|
|
|
*/
|
|
|
|
int
|
2018-04-05 04:11:44 +08:00
|
|
|
NC_HDF4_open(const char *path, int mode, int basepe, size_t *chunksizehintp,
|
2019-08-02 04:30:20 +08:00
|
|
|
void *parameters, const NC_Dispatch *dispatch, int ncid)
|
2018-02-08 21:20:58 +08:00
|
|
|
{
|
2019-02-19 20:17:00 +08:00
|
|
|
NC_FILE_INFO_T *h5;
|
|
|
|
NC_HDF4_FILE_INFO_T *hdf4_file;
|
2019-08-02 04:39:45 +08:00
|
|
|
NC *nc;
|
2019-02-19 20:17:00 +08:00
|
|
|
int32 num_datasets, num_gatts;
|
|
|
|
int32 sdid;
|
|
|
|
int v, a;
|
2019-07-17 04:54:42 +08:00
|
|
|
int retval;
|
2019-02-19 20:17:00 +08:00
|
|
|
|
|
|
|
/* Check inputs. */
|
2019-08-02 04:30:20 +08:00
|
|
|
assert(path);
|
2019-02-19 20:17:00 +08:00
|
|
|
|
|
|
|
LOG((1, "%s: path %s mode %d params %x", __func__, path, mode, parameters));
|
|
|
|
|
2019-08-02 01:40:36 +08:00
|
|
|
/* Find pointer to NC. */
|
2019-08-02 04:39:45 +08:00
|
|
|
if ((retval = NC_check_id(ncid, &nc)))
|
2019-08-02 01:40:36 +08:00
|
|
|
return retval;
|
|
|
|
|
2019-02-19 20:17:00 +08:00
|
|
|
/* Check the mode for validity */
|
|
|
|
if (mode & ILLEGAL_OPEN_FLAGS)
|
|
|
|
return NC_EINVAL;
|
|
|
|
|
|
|
|
/* Open the file and initialize SD interface. */
|
|
|
|
if ((sdid = SDstart(path, DFACC_READ)) == FAIL)
|
|
|
|
return NC_EHDFERR;
|
|
|
|
|
|
|
|
/* Learn how many datasets and global atts we have. */
|
|
|
|
if (SDfileinfo(sdid, &num_datasets, &num_gatts))
|
|
|
|
return NC_EHDFERR;
|
|
|
|
|
|
|
|
/* Add necessary structs to hold netcdf-4 file data. */
|
2019-08-02 23:29:18 +08:00
|
|
|
if ((retval = nc4_file_list_add(ncid, path, mode, (void **)&h5)))
|
2019-02-19 20:17:00 +08:00
|
|
|
return retval;
|
2019-07-17 04:48:26 +08:00
|
|
|
assert(h5 && h5->root_grp);
|
2019-02-19 20:17:00 +08:00
|
|
|
h5->no_write = NC_TRUE;
|
|
|
|
h5->root_grp->atts_read = 1;
|
|
|
|
|
|
|
|
/* Allocate data to hold HDF4 specific file data. */
|
|
|
|
if (!(hdf4_file = malloc(sizeof(NC_HDF4_FILE_INFO_T))))
|
|
|
|
return NC_ENOMEM;
|
|
|
|
h5->format_file_info = hdf4_file;
|
|
|
|
hdf4_file->sdid = sdid;
|
|
|
|
|
|
|
|
/* Read the global atts. */
|
|
|
|
for (a = 0; a < num_gatts; a++)
|
|
|
|
if ((retval = hdf4_read_att(h5, NULL, a)))
|
2018-04-05 04:11:44 +08:00
|
|
|
break;
|
|
|
|
|
2019-02-19 20:17:00 +08:00
|
|
|
/* Read each dataset. */
|
|
|
|
if (!retval)
|
|
|
|
for (v = 0; v < num_datasets; v++)
|
|
|
|
if ((retval = hdf4_read_var(h5, v)))
|
|
|
|
break;
|
|
|
|
|
|
|
|
/* If there is an error, free resources. */
|
|
|
|
if (retval)
|
|
|
|
free(hdf4_file);
|
|
|
|
|
2018-04-05 04:11:44 +08:00
|
|
|
#ifdef LOGGING
|
2019-02-19 20:17:00 +08:00
|
|
|
/* This will print out the names, types, lens, etc of the vars and
|
|
|
|
atts in the file, if the logging level is 2 or greater. */
|
|
|
|
log_metadata_nc(h5);
|
2018-04-05 04:11:44 +08:00
|
|
|
#endif
|
2018-02-08 21:20:58 +08:00
|
|
|
|
2019-02-19 20:17:00 +08:00
|
|
|
return retval;
|
2018-02-08 21:20:58 +08:00
|
|
|
}
|
|
|
|
|
2019-01-02 20:58:54 +08:00
|
|
|
/**
|
|
|
|
* @internal Abort (close) the HDF4 file.
|
|
|
|
*
|
|
|
|
* @param ncid File ID.
|
|
|
|
*
|
|
|
|
* @return ::NC_NOERR No error.
|
|
|
|
* @return ::NC_EBADID Bad ncid.
|
2019-07-05 00:16:21 +08:00
|
|
|
* @return ::NC_EHDFERR Error from HDF4 layer.
|
2019-01-02 20:58:54 +08:00
|
|
|
* @author Ed Hartnett
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
NC_HDF4_abort(int ncid)
|
|
|
|
{
|
2019-02-19 20:17:00 +08:00
|
|
|
return NC_HDF4_close(ncid, NULL);
|
2019-01-02 20:58:54 +08:00
|
|
|
}
|
|
|
|
|
2018-02-08 21:20:58 +08:00
|
|
|
/**
|
2018-04-05 04:11:44 +08:00
|
|
|
* @internal Close the HDF4 file.
|
2018-02-08 21:20:58 +08:00
|
|
|
*
|
|
|
|
* @param ncid File ID.
|
2019-01-02 20:58:54 +08:00
|
|
|
* @param ignore Ignore this pointer.
|
2018-02-08 21:20:58 +08:00
|
|
|
*
|
|
|
|
* @return ::NC_NOERR No error.
|
|
|
|
* @return ::NC_EBADID Bad ncid.
|
2019-07-05 00:16:21 +08:00
|
|
|
* @return ::NC_EHDFERR Error from HDF4 layer.
|
2018-02-08 21:20:58 +08:00
|
|
|
* @author Ed Hartnett
|
2018-04-05 04:11:44 +08:00
|
|
|
*/
|
2018-02-08 21:20:58 +08:00
|
|
|
int
|
2019-01-02 20:58:54 +08:00
|
|
|
NC_HDF4_close(int ncid, void *ignore)
|
2018-02-08 21:20:58 +08:00
|
|
|
{
|
2019-02-19 20:17:00 +08:00
|
|
|
NC_GRP_INFO_T *grp;
|
|
|
|
NC *nc;
|
|
|
|
NC_FILE_INFO_T *h5;
|
|
|
|
NC_HDF4_FILE_INFO_T *hdf4_file;
|
|
|
|
int retval;
|
|
|
|
|
|
|
|
LOG((1, "%s: ncid 0x%x", __func__, ncid));
|
|
|
|
|
|
|
|
/* Find our metadata for this file. */
|
|
|
|
if ((retval = nc4_find_nc_grp_h5(ncid, &nc, &grp, &h5)))
|
|
|
|
return retval;
|
|
|
|
assert(nc && h5 && grp && !grp->parent);
|
|
|
|
|
|
|
|
/* Clean up HDF4 specific allocations. */
|
|
|
|
if ((retval = hdf4_rec_grp_del(h5->root_grp)))
|
|
|
|
return retval;
|
|
|
|
|
|
|
|
/* Close hdf4 file and free HDF4 file info. */
|
|
|
|
hdf4_file = (NC_HDF4_FILE_INFO_T *)h5->format_file_info;
|
|
|
|
if (SDend(hdf4_file->sdid))
|
|
|
|
return NC_EHDFERR;
|
|
|
|
free(hdf4_file);
|
|
|
|
|
2019-07-17 06:02:08 +08:00
|
|
|
/* Free the NC_FILE_INFO_T struct. */
|
|
|
|
if ((retval = nc4_nc4f_list_del(h5)))
|
|
|
|
return retval;
|
|
|
|
|
2019-02-19 20:17:00 +08:00
|
|
|
return NC_NOERR;
|
2018-02-08 21:20:58 +08:00
|
|
|
}
|