2017-01-27 03:34:12 +08:00
|
|
|
/* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * *
|
|
|
|
* Copyright by The HDF Group. *
|
|
|
|
* All rights reserved. *
|
|
|
|
* *
|
|
|
|
* This file is part of HDF5. The full HDF5 copyright notice, including *
|
|
|
|
* terms governing use, modification, and redistribution, is contained in *
|
2017-04-18 03:32:16 +08:00
|
|
|
* the COPYING file, which can be found at the root of the source code *
|
2021-02-17 22:52:04 +08:00
|
|
|
* distribution tree, or in https://www.hdfgroup.org/licenses. *
|
2017-04-18 03:32:16 +08:00
|
|
|
* If you do not have access to either file, you may request a copy from *
|
|
|
|
* help@hdfgroup.org. *
|
2017-01-27 03:34:12 +08:00
|
|
|
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
|
|
|
|
|
|
|
|
/*-------------------------------------------------------------------------
|
|
|
|
*
|
|
|
|
* Created: swmr_remove_writer.c
|
|
|
|
*
|
|
|
|
* Purpose: Removes data from a randomly selected subset of the datasets
|
|
|
|
* in the SWMR test file.
|
|
|
|
*
|
|
|
|
* This program is intended to run concurrently with the
|
|
|
|
* swmr_remove_reader program. It is also run AFTER a sequential
|
|
|
|
* (not concurrent!) invocation of swmr_writer so the writer
|
|
|
|
* can dump a bunch of data into the datasets. Otherwise,
|
|
|
|
* there wouldn't be much to shrink :)
|
|
|
|
*
|
|
|
|
*-------------------------------------------------------------------------
|
|
|
|
*/
|
|
|
|
|
|
|
|
/***********/
|
|
|
|
/* Headers */
|
|
|
|
/***********/
|
|
|
|
|
|
|
|
#include "h5test.h"
|
|
|
|
#include "swmr_common.h"
|
|
|
|
|
|
|
|
/****************/
|
|
|
|
/* Local Macros */
|
|
|
|
/****************/
|
|
|
|
|
|
|
|
/* The maximum number of records to remove in one step */
|
2020-09-30 22:27:10 +08:00
|
|
|
#define MAX_REMOVE_SIZE 10 /* each shrink attempts to remove between 1 and MAX_REMOVE_SIZE records */
|
2017-01-27 03:34:12 +08:00
|
|
|
|
|
|
|
/********************/
|
|
|
|
/* Local Prototypes */
|
|
|
|
/********************/
|
|
|
|
|
|
|
|
/* Opens the SWMR test file and its datasets; returns the file ID, or -1 on failure */
static hid_t open_skeleton(const char *filename, unsigned verbose, unsigned old);
|
2020-09-30 22:27:10 +08:00
|
|
|
/* Shrinks randomly chosen datasets nshrinks times, then closes the datasets; returns 0, or -1 on failure */
static int remove_records(hid_t fid, unsigned verbose, unsigned long nshrinks, unsigned long flush_count);
|
|
|
|
/* Prints the command-line help to stdout and exits with EXIT_FAILURE */
static void usage(void);
|
2017-01-27 03:34:12 +08:00
|
|
|
|
|
|
|
/*-------------------------------------------------------------------------
|
|
|
|
* Function: open_skeleton
|
|
|
|
*
|
|
|
|
* Purpose: Opens the SWMR HDF5 file and datasets.
|
|
|
|
*
|
|
|
|
* Parameters: const char *filename
|
|
|
|
* The filename of the SWMR HDF5 file to open
|
|
|
|
*
|
|
|
|
* unsigned verbose
|
|
|
|
* Whether or not to emit verbose console messages
|
|
|
|
*
|
|
|
|
* Return: Success: The file ID of the opened SWMR file
|
|
|
|
* The dataset IDs are stored in a global array
|
|
|
|
*
|
|
|
|
* Failure: -1
|
|
|
|
*
|
|
|
|
*-------------------------------------------------------------------------
|
|
|
|
*/
|
|
|
|
static hid_t
|
|
|
|
open_skeleton(const char *filename, unsigned verbose, unsigned old)
|
|
|
|
{
|
2020-09-30 22:27:10 +08:00
|
|
|
hid_t fid; /* File ID for new HDF5 file */
|
|
|
|
hid_t fapl; /* File access property list */
|
|
|
|
hid_t sid; /* Dataspace ID */
|
|
|
|
hsize_t dim[2]; /* Dataspace dimensions */
|
|
|
|
unsigned u, v; /* Local index variable */
|
2017-01-27 03:34:12 +08:00
|
|
|
|
2023-06-28 22:31:56 +08:00
|
|
|
assert(filename);
|
2017-01-27 03:34:12 +08:00
|
|
|
|
|
|
|
/* Create file access property list */
|
2020-09-30 22:27:10 +08:00
|
|
|
if ((fapl = h5_fileaccess()) < 0)
|
2017-01-27 03:34:12 +08:00
|
|
|
return -1;
|
|
|
|
|
2020-09-30 22:27:10 +08:00
|
|
|
if (!old) {
|
2017-01-27 03:34:12 +08:00
|
|
|
/* Set to use the latest library format */
|
2020-09-30 22:27:10 +08:00
|
|
|
if (H5Pset_libver_bounds(fapl, H5F_LIBVER_LATEST, H5F_LIBVER_LATEST) < 0)
|
2017-01-27 03:34:12 +08:00
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Open the file */
|
2020-09-30 22:27:10 +08:00
|
|
|
if ((fid = H5Fopen(filename, H5F_ACC_RDWR | H5F_ACC_SWMR_WRITE, fapl)) < 0)
|
2017-01-27 03:34:12 +08:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
/* Close file access property list */
|
2020-09-30 22:27:10 +08:00
|
|
|
if (H5Pclose(fapl) < 0)
|
2017-01-27 03:34:12 +08:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
/* Emit informational message */
|
2020-09-30 22:27:10 +08:00
|
|
|
if (verbose)
|
2023-06-28 23:31:32 +08:00
|
|
|
fprintf(stderr, "Opening datasets\n");
|
2017-01-27 03:34:12 +08:00
|
|
|
|
|
|
|
/* Open the datasets */
|
2020-09-30 22:27:10 +08:00
|
|
|
for (u = 0; u < NLEVELS; u++)
|
|
|
|
for (v = 0; v < symbol_count[u]; v++) {
|
|
|
|
if ((symbol_info[u][v].dsid = H5Dopen2(fid, symbol_info[u][v].name, H5P_DEFAULT)) < 0)
|
2017-01-27 03:34:12 +08:00
|
|
|
return -1;
|
2020-09-30 22:27:10 +08:00
|
|
|
if ((sid = H5Dget_space(symbol_info[u][v].dsid)) < 0)
|
2017-01-27 03:34:12 +08:00
|
|
|
return -1;
|
2020-09-30 22:27:10 +08:00
|
|
|
if (2 != H5Sget_simple_extent_ndims(sid))
|
2017-01-27 03:34:12 +08:00
|
|
|
return -1;
|
2020-09-30 22:27:10 +08:00
|
|
|
if (H5Sget_simple_extent_dims(sid, dim, NULL) < 0)
|
2017-01-27 03:34:12 +08:00
|
|
|
return -1;
|
|
|
|
symbol_info[u][v].nrecords = dim[1];
|
|
|
|
} /* end for */
|
|
|
|
|
|
|
|
return fid;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*-------------------------------------------------------------------------
|
|
|
|
* Function: remove_records
|
|
|
|
*
|
|
|
|
* Purpose: Removes a specified number of records from random datasets in
|
|
|
|
* the SWMR test file.
|
|
|
|
*
|
|
|
|
* Parameters: hid_t fid
|
|
|
|
* The file ID of the SWMR HDF5 file
|
|
|
|
*
|
|
|
|
* unsigned verbose
|
|
|
|
* Whether or not to emit verbose console messages
|
|
|
|
*
|
|
|
|
* unsigned long nshrinks
|
|
|
|
* # of records to remove from the datasets
|
|
|
|
*
|
|
|
|
* unsigned long flush_count
|
|
|
|
* # of records to write before flushing the file to disk
|
|
|
|
*
|
|
|
|
* Return: Success: 0
|
|
|
|
* Failure: -1
|
|
|
|
*
|
|
|
|
*-------------------------------------------------------------------------
|
|
|
|
*/
|
|
|
|
static int
|
|
|
|
remove_records(hid_t fid, unsigned verbose, unsigned long nshrinks, unsigned long flush_count)
|
|
|
|
{
|
2020-09-30 22:27:10 +08:00
|
|
|
unsigned long shrink_to_flush; /* # of removals before flush */
|
|
|
|
hsize_t dim[2] = {1, 0}; /* Dataspace dimensions */
|
|
|
|
unsigned long u, v; /* Local index variables */
|
2017-01-27 03:34:12 +08:00
|
|
|
|
2023-06-28 22:31:56 +08:00
|
|
|
assert(fid >= 0);
|
2017-01-27 03:34:12 +08:00
|
|
|
|
|
|
|
/* Remove records from random datasets, according to frequency distribution */
|
|
|
|
shrink_to_flush = flush_count;
|
2020-09-30 22:27:10 +08:00
|
|
|
for (u = 0; u < nshrinks; u++) {
|
|
|
|
symbol_info_t *symbol; /* Symbol to remove record from */
|
|
|
|
hsize_t remove_size; /* Size to reduce dataset dimension by */
|
2017-01-27 03:34:12 +08:00
|
|
|
|
|
|
|
/* Get a random dataset, according to the symbol distribution */
|
|
|
|
symbol = choose_dataset();
|
|
|
|
|
|
|
|
/* Shrink the dataset's dataspace */
|
|
|
|
remove_size = (hsize_t)HDrandom() % MAX_REMOVE_SIZE + 1;
|
2020-09-30 22:27:10 +08:00
|
|
|
if (remove_size > symbol->nrecords)
|
2017-01-27 03:34:12 +08:00
|
|
|
symbol->nrecords = 0;
|
|
|
|
else
|
|
|
|
symbol->nrecords -= remove_size;
|
2017-05-25 18:45:53 +08:00
|
|
|
dim[1] = symbol->nrecords;
|
2020-09-30 22:27:10 +08:00
|
|
|
if (H5Dset_extent(symbol->dsid, dim) < 0)
|
2017-01-27 03:34:12 +08:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
/* Check for flushing file */
|
2020-09-30 22:27:10 +08:00
|
|
|
if (flush_count > 0) {
|
2017-01-27 03:34:12 +08:00
|
|
|
/* Decrement count of records to write before flushing */
|
|
|
|
shrink_to_flush--;
|
|
|
|
|
|
|
|
/* Check for counter being reached */
|
2020-09-30 22:27:10 +08:00
|
|
|
if (0 == shrink_to_flush) {
|
2017-01-27 03:34:12 +08:00
|
|
|
/* Flush contents of file */
|
2020-09-30 22:27:10 +08:00
|
|
|
if (H5Fflush(fid, H5F_SCOPE_GLOBAL) < 0)
|
2017-01-27 03:34:12 +08:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
/* Reset flush counter */
|
|
|
|
shrink_to_flush = flush_count;
|
|
|
|
} /* end if */
|
2020-09-30 22:27:10 +08:00
|
|
|
} /* end if */
|
|
|
|
} /* end for */
|
2017-01-27 03:34:12 +08:00
|
|
|
|
|
|
|
/* Emit informational message */
|
2020-09-30 22:27:10 +08:00
|
|
|
if (verbose)
|
2023-06-28 23:31:32 +08:00
|
|
|
fprintf(stderr, "Closing datasets\n");
|
2017-01-27 03:34:12 +08:00
|
|
|
|
|
|
|
/* Close the datasets */
|
2020-09-30 22:27:10 +08:00
|
|
|
for (u = 0; u < NLEVELS; u++)
|
|
|
|
for (v = 0; v < symbol_count[u]; v++)
|
|
|
|
if (H5Dclose(symbol_info[u][v].dsid) < 0)
|
2017-01-27 03:34:12 +08:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*-------------------------------------------------------------------------
 * Function:    usage
 *
 * Purpose:     Prints the command-line help text to stdout and terminates
 *              the program with EXIT_FAILURE.  Does not return.
 *
 *-------------------------------------------------------------------------
 */
static void
usage(void)
{
    /* Help text, one entry per output line, in the order it is printed */
    static const char *const help_lines[] = {
        "\n",
        "Usage error!\n",
        "\n",
        "Usage: swmr_remove_writer [-q] [-o] [-f <# of shrinks between flushing\n",
        "    file contents>] [-r <random seed>] <# of shrinks>\n",
        "\n",
        "<# of shrinks between flushing file contents> should be 0 (for no\n",
        "flushing) or between 1 and (<# of shrinks> - 1)\n",
        "\n",
        "Defaults to verbose (no '-q' given), latest format when opening file (no '-o' given),\n",
        "flushing every 1000 shrinks ('-f 1000'), and will generate a random seed (no -r given).\n",
        "\n",
    };
    size_t line;

    for (line = 0; line < sizeof(help_lines) / sizeof(help_lines[0]); line++)
        fputs(help_lines[line], stdout);

    exit(EXIT_FAILURE);
}
|
|
|
|
|
2020-09-30 22:27:10 +08:00
|
|
|
int
|
2022-01-29 06:30:33 +08:00
|
|
|
main(int argc, char *argv[])
|
2017-01-27 03:34:12 +08:00
|
|
|
{
|
2020-09-30 22:27:10 +08:00
|
|
|
hid_t fid; /* File ID for file opened */
|
|
|
|
long nshrinks = 0; /* # of times to shrink the dataset */
|
|
|
|
long flush_count = 1000; /* # of records to write between flushing file */
|
|
|
|
unsigned verbose = 1; /* Whether to emit some informational messages */
|
|
|
|
unsigned old = 0; /* Whether to use non-latest-format when opening file */
|
|
|
|
unsigned use_seed = 0; /* Set to 1 if a seed was set on the command line */
|
|
|
|
unsigned random_seed = 0; /* Random # seed */
|
|
|
|
unsigned u; /* Local index variable */
|
|
|
|
int temp;
|
2017-01-27 03:34:12 +08:00
|
|
|
|
|
|
|
/* Parse command line options */
|
2020-09-30 22:27:10 +08:00
|
|
|
if (argc < 2)
|
2017-01-27 03:34:12 +08:00
|
|
|
usage();
|
2020-09-30 22:27:10 +08:00
|
|
|
if (argc > 1) {
|
2017-01-27 03:34:12 +08:00
|
|
|
u = 1;
|
2020-09-30 22:27:10 +08:00
|
|
|
while (u < (unsigned)argc) {
|
|
|
|
if (argv[u][0] == '-') {
|
|
|
|
switch (argv[u][1]) {
|
2017-01-27 03:34:12 +08:00
|
|
|
/* # of records to write between flushing file */
|
|
|
|
case 'f':
|
2023-06-29 21:33:09 +08:00
|
|
|
flush_count = atol(argv[u + 1]);
|
2020-09-30 22:27:10 +08:00
|
|
|
if (flush_count < 0)
|
2017-01-27 03:34:12 +08:00
|
|
|
usage();
|
|
|
|
u += 2;
|
|
|
|
break;
|
|
|
|
|
|
|
|
/* Be quiet */
|
|
|
|
case 'q':
|
|
|
|
verbose = 0;
|
|
|
|
u++;
|
|
|
|
break;
|
2020-04-21 07:12:00 +08:00
|
|
|
|
2017-01-27 03:34:12 +08:00
|
|
|
/* Random # seed */
|
|
|
|
case 'r':
|
2020-09-30 22:27:10 +08:00
|
|
|
use_seed = 1;
|
2023-06-29 21:33:09 +08:00
|
|
|
temp = atoi(argv[u + 1]);
|
2017-01-27 03:34:12 +08:00
|
|
|
random_seed = (unsigned)temp;
|
|
|
|
u += 2;
|
|
|
|
break;
|
|
|
|
|
|
|
|
/* Use non-latest-format when opening file */
|
|
|
|
case 'o':
|
|
|
|
old = 1;
|
|
|
|
u++;
|
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
|
|
|
usage();
|
|
|
|
break;
|
|
|
|
} /* end switch */
|
2020-09-30 22:27:10 +08:00
|
|
|
} /* end if */
|
2017-01-27 03:34:12 +08:00
|
|
|
else {
|
|
|
|
/* Get the number of records to append */
|
2023-06-29 21:33:09 +08:00
|
|
|
nshrinks = atol(argv[u]);
|
2020-09-30 22:27:10 +08:00
|
|
|
if (nshrinks <= 0)
|
2017-01-27 03:34:12 +08:00
|
|
|
usage();
|
|
|
|
|
|
|
|
u++;
|
|
|
|
} /* end else */
|
2020-09-30 22:27:10 +08:00
|
|
|
} /* end while */
|
|
|
|
} /* end if */
|
|
|
|
if (nshrinks <= 0)
|
2017-01-27 03:34:12 +08:00
|
|
|
usage();
|
2020-09-30 22:27:10 +08:00
|
|
|
if (flush_count >= nshrinks)
|
2017-01-27 03:34:12 +08:00
|
|
|
usage();
|
|
|
|
|
|
|
|
/* Emit informational message */
|
2020-09-30 22:27:10 +08:00
|
|
|
if (verbose) {
|
2023-06-28 23:31:32 +08:00
|
|
|
fprintf(stderr, "Parameters:\n");
|
|
|
|
fprintf(stderr, "\t# of shrinks between flushes = %ld\n", flush_count);
|
|
|
|
fprintf(stderr, "\t# of shrinks = %ld\n", nshrinks);
|
2017-01-27 03:34:12 +08:00
|
|
|
} /* end if */
|
|
|
|
|
|
|
|
/* Set the random seed */
|
2020-09-30 22:27:10 +08:00
|
|
|
if (0 == use_seed) {
|
2017-01-27 03:34:12 +08:00
|
|
|
struct timeval t;
|
|
|
|
HDgettimeofday(&t, NULL);
|
|
|
|
random_seed = (unsigned)(t.tv_usec);
|
|
|
|
} /* end if */
|
|
|
|
HDsrandom(random_seed);
|
|
|
|
/* ALWAYS emit the random seed for possible debugging */
|
2023-06-28 23:31:32 +08:00
|
|
|
fprintf(stderr, "Using writer random seed: %u\n", random_seed);
|
2017-01-27 03:34:12 +08:00
|
|
|
|
|
|
|
/* Emit informational message */
|
2020-09-30 22:27:10 +08:00
|
|
|
if (verbose)
|
2023-06-28 23:31:32 +08:00
|
|
|
fprintf(stderr, "Generating symbol names\n");
|
2017-01-27 03:34:12 +08:00
|
|
|
|
|
|
|
/* Generate dataset names */
|
2020-09-30 22:27:10 +08:00
|
|
|
if (generate_symbols() < 0)
|
2017-01-27 03:34:12 +08:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
/* Emit informational message */
|
2020-09-30 22:27:10 +08:00
|
|
|
if (verbose)
|
2023-06-28 23:31:32 +08:00
|
|
|
fprintf(stderr, "Opening skeleton file: %s\n", FILENAME);
|
2017-01-27 03:34:12 +08:00
|
|
|
|
|
|
|
/* Open file skeleton */
|
2020-09-30 22:27:10 +08:00
|
|
|
if ((fid = open_skeleton(FILENAME, verbose, old)) < 0) {
|
2023-06-28 23:31:32 +08:00
|
|
|
fprintf(stderr, "Error opening skeleton file!\n");
|
2023-06-29 23:18:01 +08:00
|
|
|
exit(EXIT_FAILURE);
|
2017-01-27 03:34:12 +08:00
|
|
|
} /* end if */
|
|
|
|
|
|
|
|
/* Send a message to indicate "H5Fopen" is complete--releasing the file lock */
|
|
|
|
h5_send_message(WRITER_MESSAGE, NULL, NULL);
|
|
|
|
|
|
|
|
/* Emit informational message */
|
2020-09-30 22:27:10 +08:00
|
|
|
if (verbose)
|
2023-06-28 23:31:32 +08:00
|
|
|
fprintf(stderr, "Removing records\n");
|
2017-01-27 03:34:12 +08:00
|
|
|
|
|
|
|
/* Remove records from datasets */
|
2020-09-30 22:27:10 +08:00
|
|
|
if (remove_records(fid, verbose, (unsigned long)nshrinks, (unsigned long)flush_count) < 0) {
|
2023-06-28 23:31:32 +08:00
|
|
|
fprintf(stderr, "Error removing records from datasets!\n");
|
2023-06-29 23:18:01 +08:00
|
|
|
exit(EXIT_FAILURE);
|
2017-01-27 03:34:12 +08:00
|
|
|
} /* end if */
|
|
|
|
|
|
|
|
/* Emit informational message */
|
2020-09-30 22:27:10 +08:00
|
|
|
if (verbose)
|
2023-06-28 23:31:32 +08:00
|
|
|
fprintf(stderr, "Releasing symbols\n");
|
2017-01-27 03:34:12 +08:00
|
|
|
|
|
|
|
/* Clean up the symbols */
|
2020-09-30 22:27:10 +08:00
|
|
|
if (shutdown_symbols() < 0) {
|
2023-06-28 23:31:32 +08:00
|
|
|
fprintf(stderr, "Error releasing symbols!\n");
|
2023-06-29 23:18:01 +08:00
|
|
|
exit(EXIT_FAILURE);
|
2017-01-27 03:34:12 +08:00
|
|
|
} /* end if */
|
|
|
|
|
|
|
|
/* Emit informational message */
|
2020-09-30 22:27:10 +08:00
|
|
|
if (verbose)
|
2023-06-28 23:31:32 +08:00
|
|
|
fprintf(stderr, "Closing objects\n");
|
2017-01-27 03:34:12 +08:00
|
|
|
|
|
|
|
/* Close objects opened */
|
2020-09-30 22:27:10 +08:00
|
|
|
if (H5Fclose(fid) < 0) {
|
2023-06-28 23:31:32 +08:00
|
|
|
fprintf(stderr, "Error closing file!\n");
|
2023-06-29 23:18:01 +08:00
|
|
|
exit(EXIT_FAILURE);
|
2017-01-27 03:34:12 +08:00
|
|
|
} /* end if */
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|