hdf5/tools/lib/h5diff.c
Quincey Koziol 0cd7123fb6 [svn-r19292] Description:
Merge r19290 & r19291 from 1.8 branch to trunk:

r19290:
Correct another error in metadata accumulator dirty region calculations
(this time with a corner case when freeing data in the file).

r19291:
Avoid getting object information for soft/external links if we aren't
going to traverse across the link itself.

Tested on:
        FreeBSD/32 6.3 (duty) in debug mode
        FreeBSD/64 6.3 (liberty) w/C++ & FORTRAN, in debug mode
        Linux/32 2.6 (jam) w/PGI compilers, w/default API=1.8.x,
                w/C++ & FORTRAN, w/threadsafe, in debug mode
        Linux/64-amd64 2.6 (amani) w/Intel compilers, w/default API=1.6.x,
                w/C++ & FORTRAN, in production mode
        Solaris/32 2.10 (linew) w/deprecated symbols disabled, w/C++ & FORTRAN,
                w/szip filter, w/threadsafe, in production mode
        Linux/PPC 2.6 (heiwa) w/C++ & FORTRAN, w/threadsafe, in debug mode
        Linux/64-ia64 2.6 (cobalt) w/Intel compilers, w/C++ & FORTRAN,
                in production mode
        Linux/64-amd64 2.6 (abe) w/parallel, w/FORTRAN, in debug mode
        Mac OS X/32 10.6.4 (amazon) in debug mode
        Mac OS X/32 10.6.4 (amazon) w/C++ & FORTRAN, w/threadsafe,
                in production mode
        Mac OS X/32 10.6.4 (amazon) w/parallel, in debug mode
2010-08-24 16:03:32 -05:00

1567 lines
53 KiB
C

/* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * *
* Copyright by The HDF Group. *
* Copyright by the Board of Trustees of the University of Illinois. *
* All rights reserved. *
* *
* This file is part of HDF5. The full HDF5 copyright notice, including *
* terms governing use, modification, and redistribution, is contained in *
* the files COPYING and Copyright.html. COPYING can be found at the root *
* of the source code distribution tree; Copyright.html can be found at the *
* root level of an installed copy of the electronic HDF5 document set and *
* is linked from the top-level documents page. It can also be found at *
* http://hdfgroup.org/HDF5/doc/Copyright.html. If you do not have *
* access to either file, you may request a copy from help@hdfgroup.org. *
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
#include <stdlib.h>
#include "h5diff.h"
#include "H5private.h"
#include "ph5diff.h"
#include "h5tools.h"
#include "h5tools_utils.h"
/*
* Debug printf macros. The prefix allows output filtering by test scripts.
*/
#ifdef H5DIFF_DEBUG
#define h5diffdebug(x) fprintf(stderr, "h5diff debug: " x)
#define h5diffdebug2(x1, x2) fprintf(stderr, "h5diff debug: " x1, x2)
#define h5diffdebug3(x1, x2, x3) fprintf(stderr, "h5diff debug: " x1, x2, x3)
#define h5diffdebug4(x1, x2, x3, x4) fprintf(stderr, "h5diff debug: " x1, x2, x3, x4)
#define h5diffdebug5(x1, x2, x3, x4, x5) fprintf(stderr, "h5diff debug: " x1, x2, x3, x4, x5)
#else
#define h5diffdebug(x)
#define h5diffdebug2(x1, x2)
#define h5diffdebug3(x1, x2, x3)
#define h5diffdebug4(x1, x2, x3, x4)
#define h5diffdebug5(x1, x2, x3, x4, x5)
#endif
/*-------------------------------------------------------------------------
* Function: print_objname
*
* Purpose: check if object name is to be printed, only when:
* 1) verbose mode
* 2) when diff was found (normal mode)
*-------------------------------------------------------------------------
*/
int
print_objname (diff_opt_t * options, hsize_t nfound)
{
return ((options->m_verbose || nfound) && !options->m_quiet) ? 1 : 0;
}
/*-------------------------------------------------------------------------
* Function: do_print_objname
*
* Purpose: print object name
*
*-------------------------------------------------------------------------
*/
void
do_print_objname (const char *OBJ, const char *path1, const char *path2)
{
parallel_print("%-7s: <%s> and <%s>\n", OBJ, path1, path2);
}
/*-------------------------------------------------------------------------
* Function: print_warn
*
* Purpose: check print warning condition.
* Return:
* 1 if verbose mode
* 0 if not verbos mode
* Programmer: Jonathan Kim
* Date: Feb 4, 2010
*-------------------------------------------------------------------------
*/
static int print_warn(diff_opt_t *options)
{
return ((options->m_verbose))?1:0;
}
#ifdef H5_HAVE_PARALLEL
/*-------------------------------------------------------------------------
* Function: phdiff_dismiss_workers
*
* Purpose: tell all workers to end.
*
* Return: none
*
* Programmer: Albert Cheng
*
* Date: Feb 6, 2005
*
*-------------------------------------------------------------------------
*/
void phdiff_dismiss_workers(void)
{
int i;
for(i=1; i<g_nTasks; i++)
MPI_Send(NULL, 0, MPI_BYTE, i, MPI_TAG_END, MPI_COMM_WORLD);
}
/*-------------------------------------------------------------------------
* Function: print_manager_output
*
* Purpose: special function that prints any output accumulated by the
* manager task.
*
* Return: none
*
* Programmer: Leon Arber
*
* Date: Feb 7, 2005
*
*-------------------------------------------------------------------------
*/
void print_manager_output(void)
{
/* If there was something we buffered, let's print it now */
if( (outBuffOffset>0) && g_Parallel)
{
printf("%s", outBuff);
if(overflow_file)
{
int tmp;
rewind(overflow_file);
while((tmp = getc(overflow_file)) >= 0)
putchar(tmp);
fclose(overflow_file);
overflow_file = NULL;
}
fflush(stdout);
memset(outBuff, 0, OUTBUFF_SIZE);
outBuffOffset = 0;
}
else if( (outBuffOffset>0) && !g_Parallel)
{
fprintf(stderr, "h5diff error: outBuffOffset>0, but we're not in parallel!\n");
}
}
/*-------------------------------------------------------------------------
* Function: print_incoming_data
*
* Purpose: special function that prints any output that has been sent to the manager
* and is currently sitting in the incoming message queue
*
* Return: none
*
* Programmer: Leon Arber
*
* Date: March 7, 2005
*
*-------------------------------------------------------------------------
*/
static void print_incoming_data(void)
{
char data[PRINT_DATA_MAX_SIZE+1];
int incomingMessage;
MPI_Status Status;
do
{
MPI_Iprobe(MPI_ANY_SOURCE, MPI_TAG_PRINT_DATA, MPI_COMM_WORLD, &incomingMessage, &Status);
if(incomingMessage)
{
memset(data, 0, PRINT_DATA_MAX_SIZE+1);
MPI_Recv(data, PRINT_DATA_MAX_SIZE, MPI_CHAR, Status.MPI_SOURCE, MPI_TAG_PRINT_DATA, MPI_COMM_WORLD, &Status);
printf("%s", data);
}
} while(incomingMessage);
}
#endif
/*-------------------------------------------------------------------------
* Function: is_valid_options
*
* Purpose: check if options are valid
*
* Return:
* 1 : Valid
* 0 : Not valid
*
* Programmer: Jonathan Kim
*
* Date: Feb 17, 2010
*
*------------------------------------------------------------------------*/
static int is_valid_options(diff_opt_t *options)
{
int ret=1; /* init to valid */
/*-----------------------------------------------
* no -q(quiet) with -v (verbose) or -r (report) */
if(options->m_quiet && (options->m_verbose || options->m_report))
{
parallel_print("Error: -q (quiet mode) cannot be added to verbose or report modes\n");
options->err_stat=1;
ret = 0;
goto out;
}
/* -------------------------------------------------------
* only allow --no-dangling-links along with --follow-symlinks */
if(options->no_dangle_links && !options->follow_links)
{
parallel_print("Error: --no-dangling-links must be used along with --follow-symlinks option.\n");
options->err_stat=1;
ret = 0;
goto out;
}
out:
if (!ret)
{
#ifdef H5_HAVE_PARALLEL
if(g_Parallel)
/* Let tasks know that they won't be needed */
phdiff_dismiss_workers();
#endif
}
return ret;
}
/*-------------------------------------------------------------------------
* Function: h5diff
*
* Purpose: public function, can be called in an application program.
* return differences between 2 HDF5 files
*
* Return: Number of differences found.
*
* Programmer: Pedro Vicente, pvn@ncsa.uiuc.edu
*
* Date: October 22, 2003
*
*-------------------------------------------------------------------------
*/
hsize_t h5diff(const char *fname1,
const char *fname2,
const char *objname1,
const char *objname2,
diff_opt_t *options)
{
trav_info_t *info1=NULL;
trav_info_t *info2=NULL;
hid_t file1_id = (-1);
hid_t file2_id = (-1);
char filenames[2][1024];
hsize_t nfound = 0;
HDmemset(filenames, 0, 1024 * 2);
/*-------------------------------------------------------------------------
* check invalid combination of options
*-----------------------------------------------------------------------*/
if(!is_valid_options(options))
goto out;
/*-------------------------------------------------------------------------
* open the files first; if they are not valid, no point in continuing
*-------------------------------------------------------------------------
*/
/* disable error reporting */
H5E_BEGIN_TRY
{
/* open file 1 */
if((file1_id = h5tools_fopen(fname1, H5F_ACC_RDONLY, H5P_DEFAULT, NULL, NULL, (size_t)0)) < 0)
{
parallel_print("h5diff: <%s>: unable to open file\n", fname1);
options->err_stat = 1;
#ifdef H5_HAVE_PARALLEL
if(g_Parallel)
/* Let tasks know that they won't be needed */
phdiff_dismiss_workers();
#endif
goto out;
} /* end if */
/* open file 2 */
if((file2_id = h5tools_fopen(fname2, H5F_ACC_RDONLY, H5P_DEFAULT, NULL, NULL, (size_t)0)) < 0)
{
parallel_print("h5diff: <%s>: unable to open file\n", fname2);
options->err_stat = 1;
#ifdef H5_HAVE_PARALLEL
if(g_Parallel)
/* Let tasks know that they won't be needed */
phdiff_dismiss_workers();
#endif
goto out;
} /* end if */
/* enable error reporting */
} H5E_END_TRY;
/*-------------------------------------------------------------------------
* Initialize the info structs
*-------------------------------------------------------------------------
*/
trav_info_init(&info1);
trav_info_init(&info2);
/*-------------------------------------------------------------------------
* get the list of objects in the files
*-------------------------------------------------------------------------
*/
if(h5trav_getinfo(file1_id, info1) < 0 || h5trav_getinfo(file2_id, info2) < 0) {
parallel_print("Error: Could not get file contents\n");
options->err_stat = 1;
#ifdef H5_HAVE_PARALLEL
if(g_Parallel)
/* Let tasks know that they won't be needed */
phdiff_dismiss_workers();
#endif
goto out;
} /* end if */
/*-------------------------------------------------------------------------
* object name was supplied
*-------------------------------------------------------------------------
*/
if( objname1 )
{
#ifdef H5_HAVE_PARALLEL
if(g_Parallel)
/* Let tasks know that they won't be needed */
phdiff_dismiss_workers();
#endif
assert(objname2);
options->cmn_objs = 1; /* eliminate warning */
nfound = diff_compare(file1_id,
fname1,
objname1,
info1,
file2_id,
fname2,
objname2,
info2,
options);
} /* end if */
/*-------------------------------------------------------------------------
* compare all
*-------------------------------------------------------------------------
*/
else
{
#ifdef H5_HAVE_PARALLEL
if(g_Parallel)
{
int i;
if((HDstrlen(fname1) > 1024) || (HDstrlen(fname2) > 1024))
{
fprintf(stderr, "The parallel diff only supports path names up to 1024 characters\n");
MPI_Abort(MPI_COMM_WORLD, 0);
} /* end if */
HDstrcpy(filenames[0], fname1);
HDstrcpy(filenames[1], fname2);
/* Alert the worker tasks that there's going to be work. */
for(i = 1; i < g_nTasks; i++)
MPI_Send(filenames, (1024 * 2), MPI_CHAR, i, MPI_TAG_PARALLEL, MPI_COMM_WORLD);
} /* end if */
#endif
nfound = diff_match(file1_id,
info1,
file2_id,
info2,
options);
} /* end else */
trav_info_free(info1);
trav_info_free(info2);
out:
/* close */
H5E_BEGIN_TRY
{
H5Fclose(file1_id);
H5Fclose(file2_id);
} H5E_END_TRY;
return nfound;
}
/*-------------------------------------------------------------------------
* Function: diff_match
*
* Purpose: Find common objects; the algorithm used for this search is the
* cosequential match algorithm and is described in
* Folk, Michael; Zoellick, Bill. (1992). File Structures. Addison-Wesley.
*
* Return: Number of differences found
*
* Programmer: Pedro Vicente, pvn@ncsa.uiuc.edu
*
* Date: May 9, 2003
*
* Modifications: Jan 2005 Leon Arber, larber@uiuc.edu
* Added support for parallel diffing
*
* Pedro Vicente, pvn@hdfgroup.org, Nov 4, 2008
* Compare the graph and make h5diff return 1 for difference if
* 1) the number of objects in file1 is not the same as in file2
* 2) the graph does not match, i.e same names (absolute path)
* 3) objects with the same name are not of the same type
*-------------------------------------------------------------------------
*/
hsize_t diff_match(hid_t file1_id,
trav_info_t *info1,
hid_t file2_id,
trav_info_t *info2,
diff_opt_t *options)
{
trav_table_t *table = NULL;
size_t curr1;
size_t curr2;
unsigned infile[2];
hsize_t nfound = 0;
unsigned i;
/*-------------------------------------------------------------------------
* build the list
*-------------------------------------------------------------------------
*/
trav_table_init( &table );
curr1 = 0;
curr2 = 0;
while(curr1 < info1->nused && curr2 < info2->nused)
{
/* criteria is string compare */
int cmp = HDstrcmp(info1->paths[curr1].path, info2->paths[curr2].path);
if(cmp == 0) {
infile[0] = 1;
infile[1] = 1;
trav_table_addflags(infile, info1->paths[curr1].path, info1->paths[curr1].type, table);
curr1++;
curr2++;
} /* end if */
else if(cmp < 0)
{
infile[0] = 1;
infile[1] = 0;
trav_table_addflags(infile, info1->paths[curr1].path, info1->paths[curr1].type, table);
curr1++;
} /* end else-if */
else
{
infile[0] = 0;
infile[1] = 1;
trav_table_addflags(infile, info2->paths[curr2].path, info2->paths[curr2].type, table);
curr2++;
} /* end else */
} /* end while */
/* list1 did not end */
infile[0] = 1;
infile[1] = 0;
while(curr1 < info1->nused)
{
trav_table_addflags(infile, info1->paths[curr1].path, info1->paths[curr1].type, table);
curr1++;
} /* end while */
/* list2 did not end */
infile[0] = 0;
infile[1] = 1;
while(curr2 < info2->nused)
{
trav_table_addflags(infile, info2->paths[curr2].path, info2->paths[curr2].type, table);
curr2++;
} /* end while */
/*-------------------------------------------------------------------------
* print the list
*-------------------------------------------------------------------------
*/
if(options->m_verbose)
{
parallel_print("\n");
parallel_print("file1 file2\n");
parallel_print("---------------------------------------\n");
for(i = 0; i < table->nobjs; i++) {
char c1, c2;
c1 = (table->objs[i].flags[0]) ? 'x' : ' ';
c2 = (table->objs[i].flags[1]) ? 'x' : ' ';
parallel_print("%5c %6c %-15s\n", c1, c2, table->objs[i].name);
} /* end for */
parallel_print ("\n");
} /* end if */
/*-------------------------------------------------------------------------
* regarding the return value of h5diff (0, no difference in files, 1 difference )
* 1) the number of objects in file1 must be the same as in file2
* 2) the graph must match, i.e same names (absolute path)
* 3) objects with the same name must be of the same type
*-------------------------------------------------------------------------
*/
/* number of different objects */
if ( info1->nused != info2->nused )
{
options->contents = 0;
}
/* objects in one file and not the other */
for( i = 0; i < table->nobjs; i++)
{
if( table->objs[i].flags[0] != table->objs[i].flags[1] )
{
options->contents = 0;
}
}
/* objects with the same name but different HDF5 types */
for( i = 0; i < table->nobjs; i++)
{
if ( table->objs[i].flags[0] && table->objs[i].flags[1] )
{
if ( table->objs[i].type != table->objs[i].type )
{
options->contents = 0;
}
}
}
/*-------------------------------------------------------------------------
* do the diff for common objects
*-------------------------------------------------------------------------
*/
#ifdef H5_HAVE_PARALLEL
{
char *workerTasks = (char*)HDmalloc((g_nTasks - 1) * sizeof(char));
int n;
int busyTasks = 0;
struct diffs_found nFoundbyWorker;
struct diff_args args;
int havePrintToken = 1;
MPI_Status Status;
/*set all tasks as free */
HDmemset(workerTasks, 1, (g_nTasks - 1));
#endif
for(i = 0; i < table->nobjs; i++)
{
if( table->objs[i].flags[0] && table->objs[i].flags[1])
{
options->cmn_objs = 1;
if(!g_Parallel)
{
nfound += diff(file1_id,
table->objs[i].name,
file2_id,
table->objs[i].name, options, table->objs[i].type);
} /* end if */
#ifdef H5_HAVE_PARALLEL
else
{
int workerFound = 0;
h5diffdebug("beginning of big else block\n");
/* We're in parallel mode */
/* Since the data type of diff value is hsize_t which can
* be arbitary large such that there is no MPI type that
* matches it, the value is passed between processes as
* an array of bytes in order to be portable. But this
* may not work in non-homogeneous MPI environments.
*/
/*Set up args to pass to worker task. */
if(HDstrlen(table->objs[i].name) > 255)
{
printf("The parallel diff only supports object names up to 255 characters\n");
MPI_Abort(MPI_COMM_WORLD, 0);
} /* end if */
HDstrcpy(args.name, table->objs[i].name);
args.options = *options;
args.type = table->objs[i].type;
h5diffdebug2("busyTasks=%d\n", busyTasks);
/* if there are any outstanding print requests, let's handle one. */
if(busyTasks > 0)
{
int incomingMessage;
/* check if any tasks freed up, and didn't need to print. */
MPI_Iprobe(MPI_ANY_SOURCE, MPI_TAG_DONE, MPI_COMM_WORLD, &incomingMessage, &Status);
/* first block*/
if(incomingMessage)
{
workerTasks[Status.MPI_SOURCE - 1] = 1;
MPI_Recv(&nFoundbyWorker, sizeof(nFoundbyWorker), MPI_BYTE, Status.MPI_SOURCE, MPI_TAG_DONE, MPI_COMM_WORLD, &Status);
nfound += nFoundbyWorker.nfound;
options->not_cmp = options->not_cmp | nFoundbyWorker.not_cmp;
busyTasks--;
} /* end if */
/* check to see if the print token was returned. */
if(!havePrintToken)
{
/* If we don't have the token, someone is probably sending us output */
print_incoming_data();
/* check incoming queue for token */
MPI_Iprobe(MPI_ANY_SOURCE, MPI_TAG_TOK_RETURN, MPI_COMM_WORLD, &incomingMessage, &Status);
/* incoming token implies free task. */
if(incomingMessage) {
workerTasks[Status.MPI_SOURCE - 1] = 1;
MPI_Recv(&nFoundbyWorker, sizeof(nFoundbyWorker), MPI_BYTE, Status.MPI_SOURCE, MPI_TAG_TOK_RETURN, MPI_COMM_WORLD, &Status);
nfound += nFoundbyWorker.nfound;
options->not_cmp = options->not_cmp | nFoundbyWorker.not_cmp;
busyTasks--;
havePrintToken = 1;
} /* end if */
} /* end if */
/* check to see if anyone needs the print token. */
if(havePrintToken)
{
/* check incoming queue for print token requests */
MPI_Iprobe(MPI_ANY_SOURCE, MPI_TAG_TOK_REQUEST, MPI_COMM_WORLD, &incomingMessage, &Status);
if(incomingMessage)
{
MPI_Recv(NULL, 0, MPI_BYTE, Status.MPI_SOURCE, MPI_TAG_TOK_REQUEST, MPI_COMM_WORLD, &Status);
MPI_Send(NULL, 0, MPI_BYTE, Status.MPI_SOURCE, MPI_TAG_PRINT_TOK, MPI_COMM_WORLD);
havePrintToken = 0;
} /* end if */
} /* end if */
} /* end if */
/* check array of tasks to see which ones are free.
* Manager task never does work, so freeTasks[0] is really
* worker task 0. */
for(n = 1; (n < g_nTasks) && !workerFound; n++)
{
if(workerTasks[n-1])
{
/* send file id's and names to first free worker */
MPI_Send(&args, sizeof(args), MPI_BYTE, n, MPI_TAG_ARGS, MPI_COMM_WORLD);
/* increment counter for total number of prints. */
busyTasks++;
/* mark worker as busy */
workerTasks[n - 1] = 0;
workerFound = 1;
} /* end if */
} /* end for */
h5diffdebug2("workerfound is %d \n", workerFound);
if(!workerFound)
{
/* if they were all busy, we've got to wait for one free up
* before we can move on. If we don't have the token, some
* task is currently printing so we'll wait for that task to
* return it.
*/
if(!havePrintToken)
{
while(!havePrintToken)
{
int incomingMessage;
print_incoming_data();
MPI_Iprobe(MPI_ANY_SOURCE, MPI_TAG_TOK_RETURN, MPI_COMM_WORLD, &incomingMessage, &Status);
if(incomingMessage)
{
MPI_Recv(&nFoundbyWorker, sizeof(nFoundbyWorker), MPI_BYTE, MPI_ANY_SOURCE, MPI_TAG_TOK_RETURN, MPI_COMM_WORLD, &Status);
havePrintToken = 1;
nfound += nFoundbyWorker.nfound;
options->not_cmp = options->not_cmp | nFoundbyWorker.not_cmp;
/* send this task the work unit. */
MPI_Send(&args, sizeof(args), MPI_BYTE, Status.MPI_SOURCE, MPI_TAG_ARGS, MPI_COMM_WORLD);
} /* end if */
} /* end while */
} /* end if */
/* if we do have the token, check for task to free up, or wait for a task to request it */
else
{
/* But first print all the data in our incoming queue */
print_incoming_data();
MPI_Probe(MPI_ANY_SOURCE, MPI_ANY_TAG, MPI_COMM_WORLD, &Status);
if(Status.MPI_TAG == MPI_TAG_DONE)
{
MPI_Recv(&nFoundbyWorker, sizeof(nFoundbyWorker), MPI_BYTE, Status.MPI_SOURCE, MPI_TAG_DONE, MPI_COMM_WORLD, &Status);
nfound += nFoundbyWorker.nfound;
options->not_cmp = options->not_cmp | nFoundbyWorker.not_cmp;
MPI_Send(&args, sizeof(args), MPI_BYTE, Status.MPI_SOURCE, MPI_TAG_ARGS, MPI_COMM_WORLD);
} /* end if */
else if(Status.MPI_TAG == MPI_TAG_TOK_REQUEST)
{
int incomingMessage;
MPI_Recv(NULL, 0, MPI_BYTE, Status.MPI_SOURCE, MPI_TAG_TOK_REQUEST, MPI_COMM_WORLD, &Status);
MPI_Send(NULL, 0, MPI_BYTE, Status.MPI_SOURCE, MPI_TAG_PRINT_TOK, MPI_COMM_WORLD);
do
{
MPI_Iprobe(MPI_ANY_SOURCE, MPI_TAG_TOK_RETURN, MPI_COMM_WORLD, &incomingMessage, &Status);
print_incoming_data();
} while(!incomingMessage);
MPI_Recv(&nFoundbyWorker, sizeof(nFoundbyWorker), MPI_BYTE, Status.MPI_SOURCE, MPI_TAG_TOK_RETURN, MPI_COMM_WORLD, &Status);
nfound += nFoundbyWorker.nfound;
options->not_cmp = options->not_cmp | nFoundbyWorker.not_cmp;
MPI_Send(&args, sizeof(args), MPI_BYTE, Status.MPI_SOURCE, MPI_TAG_ARGS, MPI_COMM_WORLD);
} /* end else-if */
else
{
printf("ERROR: Invalid tag (%d) received \n", Status.MPI_TAG);
MPI_Abort(MPI_COMM_WORLD, 0);
MPI_Finalize();
} /* end else */
} /* end else */
} /* end if */
} /* end else */
#endif /* H5_HAVE_PARALLEL */
} /* end if */
} /* end for */
h5diffdebug("done with for loop\n");
#ifdef H5_HAVE_PARALLEL
if(g_Parallel)
{
/* make sure all tasks are done */
while(busyTasks > 0)
{
MPI_Probe(MPI_ANY_SOURCE, MPI_ANY_TAG, MPI_COMM_WORLD, &Status);
if(Status.MPI_TAG == MPI_TAG_DONE)
{
MPI_Recv(&nFoundbyWorker, sizeof(nFoundbyWorker), MPI_BYTE, Status.MPI_SOURCE, MPI_TAG_DONE, MPI_COMM_WORLD, &Status);
nfound += nFoundbyWorker.nfound;
options->not_cmp = options->not_cmp | nFoundbyWorker.not_cmp;
busyTasks--;
} /* end if */
else if(Status.MPI_TAG == MPI_TAG_TOK_RETURN)
{
MPI_Recv(&nFoundbyWorker, sizeof(nFoundbyWorker), MPI_BYTE, Status.MPI_SOURCE, MPI_TAG_DONE, MPI_COMM_WORLD, &Status);
nfound += nFoundbyWorker.nfound;
options->not_cmp = options->not_cmp | nFoundbyWorker.not_cmp;
busyTasks--;
havePrintToken = 1;
} /* end else-if */
else if(Status.MPI_TAG == MPI_TAG_TOK_REQUEST)
{
MPI_Recv(NULL, 0, MPI_BYTE, Status.MPI_SOURCE, MPI_TAG_TOK_REQUEST, MPI_COMM_WORLD, &Status);
if(havePrintToken)
{
int incomingMessage;
MPI_Send(NULL, 0, MPI_BYTE, Status.MPI_SOURCE, MPI_TAG_PRINT_TOK, MPI_COMM_WORLD);
do {
MPI_Iprobe(MPI_ANY_SOURCE, MPI_TAG_TOK_RETURN, MPI_COMM_WORLD, &incomingMessage, &Status);
print_incoming_data();
} while(!incomingMessage);
MPI_Recv(&nFoundbyWorker, sizeof(nFoundbyWorker), MPI_BYTE, Status.MPI_SOURCE, MPI_TAG_TOK_RETURN, MPI_COMM_WORLD, &Status);
nfound += nFoundbyWorker.nfound;
options->not_cmp = options->not_cmp | nFoundbyWorker.not_cmp;
busyTasks--;
} /* end if */
/* someone else must have it...wait for them to return it, then give it to the task that just asked for it. */
else
{
int source = Status.MPI_SOURCE;
int incomingMessage;
do
{
MPI_Iprobe(MPI_ANY_SOURCE, MPI_TAG_TOK_RETURN, MPI_COMM_WORLD, &incomingMessage, &Status);
print_incoming_data();
} while(!incomingMessage);
MPI_Recv(&nFoundbyWorker, sizeof(nFoundbyWorker), MPI_BYTE, MPI_ANY_SOURCE, MPI_TAG_TOK_RETURN, MPI_COMM_WORLD, &Status);
nfound += nFoundbyWorker.nfound;
options->not_cmp = options->not_cmp | nFoundbyWorker.not_cmp;
busyTasks--;
MPI_Send(NULL, 0, MPI_BYTE, source, MPI_TAG_PRINT_TOK, MPI_COMM_WORLD);
} /* end else */
} /* end else-if */
else if(Status.MPI_TAG == MPI_TAG_TOK_RETURN)
{
MPI_Recv(&nFoundbyWorker, sizeof(nFoundbyWorker), MPI_BYTE, Status.MPI_SOURCE, MPI_TAG_TOK_RETURN, MPI_COMM_WORLD, &Status);
nfound += nFoundbyWorker.nfound;
options->not_cmp = options->not_cmp | nFoundbyWorker.not_cmp;
busyTasks--;
havePrintToken = 1;
} /* end else-if */
else if(Status.MPI_TAG == MPI_TAG_PRINT_DATA)
{
char data[PRINT_DATA_MAX_SIZE + 1];
HDmemset(data, 0, PRINT_DATA_MAX_SIZE + 1);
MPI_Recv(data, PRINT_DATA_MAX_SIZE, MPI_CHAR, Status.MPI_SOURCE, MPI_TAG_PRINT_DATA, MPI_COMM_WORLD, &Status);
printf("%s", data);
} /* end else-if */
else
{
printf("ph5diff-manager: ERROR!! Invalid tag (%d) received \n", Status.MPI_TAG);
MPI_Abort(MPI_COMM_WORLD, 0);
} /* end else */
} /* end while */
for(i = 1; i < g_nTasks; i++)
MPI_Send(NULL, 0, MPI_BYTE, i, MPI_TAG_END, MPI_COMM_WORLD);
/* Print any final data waiting in our queue */
print_incoming_data();
} /* end if */
h5diffdebug("done with if block\n");
free(workerTasks);
}
#endif /* H5_HAVE_PARALLEL */
/* free table */
trav_table_free(table);
return nfound;
}
/*-------------------------------------------------------------------------
* Function: diff_compare
*
* Purpose: get objects from list, and check for the same type
*
* Return: Number of differences found
*
* Programmer: Pedro Vicente, pvn@ncsa.uiuc.edu
* Date: May 9, 2003
*
* Programmer: Jonathan Kim
* - add following links feature (Feb 11,2010)
*-------------------------------------------------------------------------
*/
hsize_t diff_compare(hid_t file1_id,
const char *file1_name,
const char *obj1_name,
trav_info_t *info1,
hid_t file2_id,
const char *file2_name,
const char *obj2_name,
trav_info_t *info2,
diff_opt_t *options)
{
int f1 = 0;
int f2 = 0;
hsize_t nfound = 0;
ssize_t i,j;
int l_ret;
int is_dangle_link1 = 0;
int is_dangle_link2 = 0;
/* local variables for diff() */
h5trav_type_t obj1type, obj2type;
/* to get link info */
h5tool_link_info_t linkinfo1;
h5tool_link_info_t linkinfo2;
/* init link info struct */
HDmemset(&linkinfo1, 0, sizeof(h5tool_link_info_t));
HDmemset(&linkinfo2, 0, sizeof(h5tool_link_info_t));
i = h5trav_getindex (info1, obj1_name);
j = h5trav_getindex (info2, obj2_name);
if (i == -1)
{
parallel_print ("Object <%s> could not be found in <%s>\n", obj1_name,
file1_name);
f1 = 1;
}
if (j == -1)
{
parallel_print ("Object <%s> could not be found in <%s>\n", obj2_name,
file2_name);
f2 = 1;
}
if (f1 || f2)
{
options->err_stat = 1;
return 0;
}
/* use the name with "/" first, as obtained by iterator function */
obj1_name = info1->paths[i].path;
obj2_name = info2->paths[j].path;
obj1type = info1->paths[i].type;
obj2type = info2->paths[j].type;
/*-----------------------------------------------------------------
* follow link option, compare with target object
*/
if (options->follow_links)
{
/* pass how to handle printing warning to linkinfo option */
if(print_warn(options))
linkinfo1.opt.msg_mode = linkinfo2.opt.msg_mode = 1;
/*------------------------------------------------------------
* Soft links
*------------------------------------------------------------*/
/*--------------------------
* if object1 soft link */
if (obj1type == H5TRAV_TYPE_LINK)
{
/* get type of target object */
l_ret = H5tools_get_link_info(file1_id, obj1_name, &linkinfo1, TRUE);
/* dangling link */
if (l_ret == 0)
{
if (options->no_dangle_links)
{
/* gangling link is error */
if(options->m_verbose)
parallel_print("Warning: <%s> is a dangling link.\n", obj1_name);
options->err_stat = 1;
goto out;
}
else
is_dangle_link1 = 1;
}
/* fail */
else if(l_ret < 0)
{
options->err_stat = 1;
goto out;
}
else /* OK */
{
/* target type for diff() */
obj1type = linkinfo1.trg_type;
}
}
/*-----------------------------
* if object2 is soft link */
if (obj2type == H5TRAV_TYPE_LINK)
{
/* get type target object */
l_ret = H5tools_get_link_info(file2_id, obj2_name, &linkinfo2, TRUE);
/* dangling link */
if (l_ret == 0)
{
if (options->no_dangle_links)
{
/* gangling link is error */
if(options->m_verbose)
parallel_print("Warning: <%s> is a dangling link.\n", obj2_name);
options->err_stat = 1;
goto out;
}
else
is_dangle_link2=1;
}
/* fail */
else if(l_ret < 0)
{
options->err_stat = 1;
goto out;
}
else /* OK */
{
/* target type for diff() */
obj2type = linkinfo2.trg_type;
}
}
/*------------------------------------------------------------
* External links
*------------------------------------------------------------*/
/*--------------------------------
* if object1 is external link */
if (obj1type == H5TRAV_TYPE_UDLINK)
{
/* get type and name of target object */
l_ret = H5tools_get_link_info(file1_id, obj1_name, &linkinfo1, TRUE);
/* dangling link */
if (l_ret == 0)
{
if (options->no_dangle_links)
{
/* gangling link is error */
if(options->m_verbose)
parallel_print("Warning: <%s> is a dangling link.\n", obj1_name);
options->err_stat = 1;
goto out;
}
else
is_dangle_link1 = 1;
}
/* fail */
else if(l_ret < 0)
{
options->err_stat = 1;
goto out;
}
else /* OK */
{
/* for external link */
if(linkinfo1.linfo.type == H5L_TYPE_EXTERNAL)
obj1type = linkinfo1.trg_type;
}
}
/*--------------------------------
* if object2 is external link */
if (obj2type == H5TRAV_TYPE_UDLINK)
{
/* get type and name of target object */
l_ret = H5tools_get_link_info(file2_id, obj2_name, &linkinfo2, TRUE);
/* dangling link */
if (l_ret == 0)
{
if (options->no_dangle_links)
{
/* gangling link is error */
if(options->m_verbose)
parallel_print("Warning: <%s> is a dangling link.\n", obj2_name);
options->err_stat = 1;
goto out;
}
else
is_dangle_link2 = 1;
}
/* fail */
else if(l_ret < 0)
{
options->err_stat = 1;
goto out;
}
else /* OK */
{
/* for external link */
if(linkinfo2.linfo.type == H5L_TYPE_EXTERNAL)
obj2type = linkinfo2.trg_type;
}
}
/* found dangling link */
if (is_dangle_link1 || is_dangle_link2)
goto out;
} /* end of follow_links */
/* objects are not the same type */
if (obj1type != obj2type)
{
if (options->m_verbose||options->m_list_not_cmp)
{
parallel_print("<%s> is of type %s and <%s> is of type %s\n",
obj1_name, get_type(obj1type),
obj2_name, get_type(obj2type));
}
options->not_cmp=1;
goto out;
}
nfound = diff(file1_id, obj1_name,
file2_id, obj2_name,
options, obj1type);
out:
/*-------------------------------
* handle dangling link(s) */
/* both obj1 and obj2 are dangling links */
if(is_dangle_link1 && is_dangle_link2)
{
if(print_objname(options, nfound))
{
do_print_objname("dangling link", obj1_name, obj2_name);
print_found(nfound);
}
}
/* obj1 is dangling link */
else if (is_dangle_link1)
{
if(options->m_verbose)
parallel_print("obj1 <%s> is a dangling link.\n", obj1_name);
nfound++;
if(print_objname(options, nfound))
print_found(nfound);
}
/* obj2 is dangling link */
else if (is_dangle_link2)
{
if(options->m_verbose)
parallel_print("obj2 <%s> is a dangling link.\n", obj2_name);
nfound++;
if(print_objname(options, nfound))
print_found(nfound);
}
/* free link info buffer */
if (linkinfo1.trg_path)
HDfree(linkinfo1.trg_path);
if (linkinfo2.trg_path)
HDfree(linkinfo2.trg_path);
return nfound;
}
/*-------------------------------------------------------------------------
* Function: diff
*
* Purpose: switch between types and choose the diff function
* TYPE is either
* H5G_GROUP Object is a group
* H5G_DATASET Object is a dataset
* H5G_TYPE Object is a named data type
* H5G_LINK Object is a symbolic link
*
* Return: Number of differences found
*
* Programmer: Pedro Vicente, pvn@ncsa.uiuc.edu
* Date: May 9, 2003
*
* Programmer: Jonathan Kim
* - add following links feature (Feb 11,2010)
*-------------------------------------------------------------------------
*/
hsize_t diff(hid_t file1_id,
const char *path1,
hid_t file2_id,
const char *path2,
diff_opt_t * options,
h5trav_type_t type)
{
hid_t type1_id = (-1);
hid_t type2_id = (-1);
hid_t grp1_id = (-1);
hid_t grp2_id = (-1);
int ret;
int is_dangle_link1 = 0;
int is_dangle_link2 = 0;
hsize_t nfound = 0;
/* to get link info */
h5tool_link_info_t linkinfo1;
h5tool_link_info_t linkinfo2;
/*init link info struct */
HDmemset(&linkinfo1,0,sizeof(h5tool_link_info_t));
HDmemset(&linkinfo2,0,sizeof(h5tool_link_info_t));
/* pass how to handle printing warnings to linkinfo option */
if(print_warn(options))
linkinfo1.opt.msg_mode = linkinfo2.opt.msg_mode = 1;
switch(type)
{
/*----------------------------------------------------------------------
* H5TRAV_TYPE_DATASET
*----------------------------------------------------------------------
*/
case H5TRAV_TYPE_DATASET:
/* verbose (-v) and report (-r) mode */
if(options->m_verbose || options->m_report)
{
do_print_objname("dataset", path1, path2);
nfound = diff_dataset(file1_id, file2_id, path1, path2, options);
print_found(nfound);
}
/* quiet mode (-q), just count differences */
else if(options->m_quiet)
{
nfound = diff_dataset(file1_id, file2_id, path1, path2, options);
}
/* the rest (-c, none, ...) */
else
{
nfound = diff_dataset(file1_id, file2_id, path1, path2, options);
/* print info if compatible and difference found */
if (!options->not_cmp && nfound)
{
do_print_objname("dataset", path1, path2);
print_found(nfound);
}
}
break;
/*----------------------------------------------------------------------
* H5TRAV_TYPE_NAMED_DATATYPE
*----------------------------------------------------------------------
*/
case H5TRAV_TYPE_NAMED_DATATYPE:
if((type1_id = H5Topen2(file1_id, path1, H5P_DEFAULT)) < 0)
goto out;
if((type2_id = H5Topen2(file2_id, path2, H5P_DEFAULT)) < 0)
goto out;
if((ret = H5Tequal(type1_id, type2_id)) < 0)
goto out;
/* if H5Tequal is > 0 then the datatypes refer to the same datatype */
nfound = (ret > 0) ? 0 : 1;
if(print_objname(options,nfound))
do_print_objname("datatype", path1, path2);
/* always print the number of differences found in verbose mode */
if(options->m_verbose)
print_found(nfound);
/*-----------------------------------------------------------------
* compare attributes
* the if condition refers to cases when the dataset is a
* referenced object
*-----------------------------------------------------------------
*/
if(path1)
nfound += diff_attr(type1_id, type2_id, path1, path2, options);
if(H5Tclose(type1_id) < 0)
goto out;
if(H5Tclose(type2_id) < 0)
goto out;
break;
/*----------------------------------------------------------------------
* H5TRAV_TYPE_GROUP
*----------------------------------------------------------------------
*/
case H5TRAV_TYPE_GROUP:
ret = HDstrcmp(path1, path2);
/* if "path1" != "path2" then the groups are "different" */
nfound = (ret != 0) ? 1 : 0;
if(print_objname(options, nfound))
do_print_objname("group", path1, path2);
/* always print the number of differences found in verbose mode */
if(options->m_verbose)
print_found(nfound);
if((grp1_id = H5Gopen2(file1_id, path1, H5P_DEFAULT)) < 0)
goto out;
if((grp2_id = H5Gopen2(file2_id, path2, H5P_DEFAULT)) < 0)
goto out;
/*-----------------------------------------------------------------
* compare attributes
* the if condition refers to cases when the dataset is a
* referenced object
*-----------------------------------------------------------------
*/
if(path1)
nfound += diff_attr(grp1_id, grp2_id, path1, path2, options);
if(H5Gclose(grp1_id) < 0)
goto out;
if(H5Gclose(grp2_id) < 0)
goto out;
break;
/*----------------------------------------------------------------------
* H5TRAV_TYPE_LINK
*----------------------------------------------------------------------
*/
case H5TRAV_TYPE_LINK:
{
/* get type and name of target object */
ret = H5tools_get_link_info(file1_id, path1, &linkinfo1, TRUE);
/* dangling link */
if (ret == 0)
{
if (options->no_dangle_links)
{
/* gangling link is error */
if(options->m_verbose)
parallel_print("Warning: <%s> is a dangling link.\n", path1);
goto out;
}
else
is_dangle_link1 = 1;
}
else if (ret < 0)
goto out;
/* get type and name of target object */
ret = H5tools_get_link_info(file2_id, path2, &linkinfo2, TRUE);
/* dangling link */
if (ret == 0)
{
if (options->no_dangle_links)
{
/* gangling link is error */
if(options->m_verbose)
parallel_print("Warning: <%s> is a dangling link.\n", path2);
goto out;
}
else
is_dangle_link2 = 1;
}
else if (ret < 0)
goto out;
/* found dangling link */
if (is_dangle_link1 || is_dangle_link2)
goto out2;
ret = HDstrcmp(linkinfo1.trg_path, linkinfo2.trg_path);
/* if the target link name is not same then the links are "different" */
nfound = (ret != 0) ? 1 : 0;
if(print_objname(options, nfound))
do_print_objname("link", path1, path2);
if (options->follow_links)
{
/* objects are not the same type */
if (linkinfo1.trg_type != linkinfo2.trg_type)
{
if (options->m_verbose||options->m_list_not_cmp)
{
parallel_print("<%s> is of type %s and <%s> is of type %s\n", path1, get_type(linkinfo1.trg_type), path2, get_type(linkinfo2.trg_type));
}
options->not_cmp=1;
goto out;
}
/* call self to compare target object */
nfound += diff(file1_id, path1,
file2_id, path2,
options, linkinfo1.trg_type);
}
/* always print the number of differences found in verbose mode */
if(options->m_verbose)
print_found(nfound);
/* free link info buffer */
HDfree(linkinfo1.trg_path);
HDfree(linkinfo2.trg_path);
}
break;
/*----------------------------------------------------------------------
* H5TRAV_TYPE_UDLINK
*----------------------------------------------------------------------
*/
case H5TRAV_TYPE_UDLINK:
{
/* get type and name of target object */
ret = H5tools_get_link_info(file1_id, path1, &linkinfo1, TRUE);
/* dangling link */
if (ret == 0)
{
if (options->no_dangle_links)
{
/* gangling link is error */
if(options->m_verbose)
parallel_print("Warning: <%s> is a dangling link.\n", path1);
goto out;
}
else
is_dangle_link1=1;
}
else if (ret < 0)
goto out;
/* get type and name of target object */
ret = H5tools_get_link_info(file2_id, path2, &linkinfo2, TRUE);
/* dangling link */
if (ret == 0)
{
if (options->no_dangle_links)
{
/* gangling link is error */
if(options->m_verbose)
parallel_print("Warning: <%s> is a dangling link.\n", path2);
goto out;
}
else
is_dangle_link2=1;
}
else if (ret < 0)
goto out;
/* found dangling link */
if (is_dangle_link1 || is_dangle_link2)
goto out2;
/* Only external links will have a query function registered */
if(linkinfo1.linfo.type == H5L_TYPE_EXTERNAL && linkinfo2.linfo.type == H5L_TYPE_EXTERNAL)
{
/* If the buffers are the same size, compare them */
if(linkinfo1.linfo.u.val_size == linkinfo2.linfo.u.val_size)
{
ret = HDmemcmp(linkinfo1.trg_path, linkinfo2.trg_path, linkinfo1.linfo.u.val_size);
}
else
ret = 1;
/* if "linkinfo1.trg_path" != "linkinfo2.trg_path" then the links
* are "different" extlinkinfo#.path is combination string of
* file_name and obj_name
*/
nfound = (ret != 0) ? 1 : 0;
if(print_objname(options, nfound))
do_print_objname("external link", path1, path2);
if (options->follow_links)
{
/* objects are not the same type */
if (linkinfo1.trg_type != linkinfo2.trg_type)
{
if (options->m_verbose||options->m_list_not_cmp)
{
parallel_print("<%s> is of type %s and <%s> is of type %s\n", path1, get_type(linkinfo1.trg_type), path2, get_type(linkinfo2.trg_type));
}
options->not_cmp=1;
goto out;
}
nfound = diff(file1_id, path1,
file2_id, path2,
options, linkinfo1.trg_type);
}
/* free link info buffer */
HDfree(linkinfo1.trg_path);
HDfree(linkinfo2.trg_path);
} /* end if */
else
{
/* If one or both of these links isn't an external link, we can only
* compare information from H5Lget_info since we don't have a query
* function registered for them.
*
* If the link classes or the buffer length are not the
* same, the links are "different"
*/
if((linkinfo1.linfo.type != linkinfo2.linfo.type) ||
(linkinfo1.linfo.u.val_size != linkinfo2.linfo.u.val_size))
nfound = 1;
else
nfound = 0;
if (print_objname (options, nfound))
do_print_objname ("user defined link", path1, path2);
} /* end else */
/* always print the number of differences found in verbose mode */
if(options->m_verbose)
print_found(nfound);
}
break;
default:
if(options->m_verbose)
parallel_print("Comparison not supported: <%s> and <%s> are of type %s\n",
path1, path2, get_type(type) );
options->not_cmp = 1;
break;
}
return nfound;
out:
options->err_stat = 1;
out2:
/*-----------------------------------
* handle dangling link(s)
*/
/* both path1 and path2 are dangling links */
if(is_dangle_link1 && is_dangle_link2)
{
if(print_objname(options, nfound))
{
do_print_objname("dangling link", path1, path2);
print_found(nfound);
}
}
/* path1 is dangling link */
else if (is_dangle_link1)
{
if(options->m_verbose)
parallel_print("obj1 <%s> is a dangling link.\n", path1);
nfound++;
if(print_objname(options, nfound))
print_found(nfound);
}
/* path2 is dangling link */
else if (is_dangle_link2)
{
if(options->m_verbose)
parallel_print("obj2 <%s> is a dangling link.\n", path2);
nfound++;
if(print_objname(options, nfound))
print_found(nfound);
}
/* free link info buffer */
if (linkinfo1.trg_path)
HDfree(linkinfo1.trg_path);
if (linkinfo2.trg_path)
HDfree(linkinfo2.trg_path);
/* close */
/* disable error reporting */
H5E_BEGIN_TRY {
H5Tclose(type1_id);
H5Tclose(type2_id);
H5Gclose(grp1_id);
H5Tclose(grp2_id);
/* enable error reporting */
} H5E_END_TRY;
return nfound;
}