summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorQuincey Koziol <koziol@hdfgroup.org>2007-11-10 14:47:51 (GMT)
committerQuincey Koziol <koziol@hdfgroup.org>2007-11-10 14:47:51 (GMT)
commit8625a8bd6be9a3c89b5195f36df14bb66b26b2c7 (patch)
tree72cc45a80d99a5be7eea01b2796f7a85cc473a14
parent0e367c3715e30362d94862e768bbbd5a557e55ad (diff)
downloadhdf5-8625a8bd6be9a3c89b5195f36df14bb66b26b2c7.zip
hdf5-8625a8bd6be9a3c89b5195f36df14bb66b26b2c7.tar.gz
hdf5-8625a8bd6be9a3c89b5195f36df14bb66b26b2c7.tar.bz2
[svn-r14247] Description:
- Refactored H5D_flush to use H5I_search for iterating through datasets, instead of building array of dataset IDs. - Cache dataset's dataspace modifications (from calls to H5Dset_extent) until flush/close. These changes give an ~15% improvement in speed for my "append records to lots of 1-D datasets" benchmark. Tested on: Mac OS X/32 10.4.10 (amazon) in debug mode FreeBSD/32 6.2 (duty) in debug mode FreeBSD/64 6.2 (liberty) w/C++ & FORTRAN, in debug mode Linux/32 2.6 (kagiso) w/PGI compilers, w/C++ & FORTRAN, w/threadsafe, in debug mode Linux/64-amd64 2.6 (smirom) w/default API=1.6.x, w/C++ & FORTRAN, in production mode Solaris/32 2.10 (linew) w/deprecated symbols disabled, w/C++ & FORTRAN, w/szip filter, in production mode Linux/64-ia64 2.6 (cobalt) w/Intel compilers, w/C++ & FORTRAN, in production mode Linux/64-ia64 2.4 (tg-login3) w/parallel, w/FORTRAN, in production mode
-rw-r--r--src/H5Dint.c165
-rw-r--r--src/H5Dpkg.h1
2 files changed, 102 insertions, 64 deletions
diff --git a/src/H5Dint.c b/src/H5Dint.c
index 5584187..aebc6f2 100644
--- a/src/H5Dint.c
+++ b/src/H5Dint.c
@@ -45,6 +45,13 @@
/* Local Typedefs */
/******************/
+/* Struct for holding callback info during H5D_flush operation */
+typedef struct {
+ const H5F_t *f; /* Pointer to file being flushed */
+ hid_t dxpl_id; /* DXPL for I/O operations */
+ unsigned flags; /* Flags for flush operation */
+} H5D_flush_ud_t;
+
/********************/
/* Local Prototypes */
@@ -1484,6 +1491,13 @@ H5D_close(H5D_t *dataset)
dataset->shared->fo_count--;
if(dataset->shared->fo_count == 0) {
+ /* Update the dataspace on disk, if it's been changed */
+ if(dataset->shared->space_dirty) {
+ if(H5S_write(&(dataset->oloc), dataset->shared->space, TRUE, H5AC_dxpl_id) < 0)
+ HGOTO_ERROR(H5E_DATASET, H5E_WRITEERROR, FAIL, "unable to update file with new dataspace")
+ dataset->shared->space_dirty = FALSE;
+ } /* end if */
+
/* Free the data sieve buffer, if it's been allocated */
if(dataset->shared->cache.contig.sieve_buf) {
HDassert(dataset->shared->layout.type != H5D_COMPACT); /* We should never have a sieve buffer for compact storage */
@@ -2284,9 +2298,8 @@ H5D_set_extent(H5D_t *dset, const hsize_t *size, hid_t dxpl_id)
* Modify the dataset storage
*-------------------------------------------------------------------------
*/
- /* Save the new dataspace in the file if necessary */
- if(H5S_write(&(dset->oloc), space, TRUE, dxpl_id) < 0)
- HGOTO_ERROR(H5E_DATASET, H5E_WRITEERROR, FAIL, "unable to update file with new dataspace")
+ /* Mark the dataspace as dirty, for later writing to the file */
+ dset->shared->space_dirty = TRUE;
/* Update the index values for the cached chunks for this dataset */
if(H5D_CHUNKED == dset->shared->layout.type)
@@ -2332,93 +2345,117 @@ done:
/*-------------------------------------------------------------------------
- * Function: H5D_flush
+ * Function: H5D_flush_cb
*
* Purpose: Flush any dataset information cached in memory
*
* Return: Success: Non-negative
* Failure: Negative
*
- * Programmer: Ray Lu
- * August 14, 2002
+ * Programmer: Quincey Koziol
+ * November 8, 2007
*
*-------------------------------------------------------------------------
*/
-herr_t
-H5D_flush(const H5F_t *f, hid_t dxpl_id, unsigned flags)
+static int
+H5D_flush_cb(void *_dataset, hid_t UNUSED id, void *_udata)
{
- hid_t *id_list = NULL; /* Array of dataset IDs */
- unsigned num_dsets; /* Number of datasets in file */
- herr_t ret_value = SUCCEED; /* Return value */
+ H5D_t *dataset = (H5D_t *)_dataset; /* Dataset pointer */
+ H5D_flush_ud_t *udata = (H5D_flush_ud_t *)_udata; /* User data for callback */
+ int ret_value = H5_ITER_CONT; /* Return value */
- FUNC_ENTER_NOAPI(H5D_flush, FAIL)
+ FUNC_ENTER_NOAPI_NOINIT(H5D_flush_cb)
/* Check args */
- HDassert(f);
-
- /* Retrieve the # of outstanding dataset IDs */
- num_dsets = H5F_get_obj_count(f, H5F_OBJ_DATASET);
-
- /* Check for something to do */
- if(num_dsets > 0) {
- H5D_t *dataset; /* Dataset pointer */
- unsigned u; /* Index variable */
-
- H5_CHECK_OVERFLOW(num_dsets, unsigned, size_t);
- if(NULL == (id_list = (hid_t *)H5MM_malloc((size_t)num_dsets * sizeof(hid_t))))
- HGOTO_ERROR(H5E_FILE, H5E_CANTINIT, FAIL, "unable to allocate memory for ID list")
- if(H5F_get_obj_ids(f, H5F_OBJ_DATASET, -1, id_list) != num_dsets)
- HGOTO_ERROR(H5E_FILE, H5E_CANTINIT, FAIL, "unable to get dataset ID list")
+ HDassert(dataset);
- /* Iterate through the open datasets */
- for(u = 0; u < num_dsets; u++) {
- if(NULL == (dataset = (H5D_t *)H5I_object_verify(id_list[u], H5I_DATASET)))
- HGOTO_ERROR(H5E_FILE, H5E_CANTINIT, FAIL, "unable to get dataset object")
+ /* Check for dataset in same file */
+ if(udata->f == dataset->oloc.file) {
+ /* Update the dataspace on disk, if it's been changed */
+ if(dataset->shared->space_dirty) {
+ if(H5S_write(&(dataset->oloc), dataset->shared->space, TRUE, udata->dxpl_id) < 0)
+ HGOTO_ERROR(H5E_DATASET, H5E_WRITEERROR, FAIL, "unable to update file with new dataspace")
+ dataset->shared->space_dirty = FALSE;
+ } /* end if */
- /* Flush the raw data buffer, if we have a dirty one */
- if(dataset->shared->cache.contig.sieve_buf && dataset->shared->cache.contig.sieve_dirty) {
- HDassert(dataset->shared->layout.type != H5D_COMPACT); /* We should never have a sieve buffer for compact storage */
+ /* Flush the raw data buffer, if we have a dirty one */
+ if(dataset->shared->cache.contig.sieve_buf && dataset->shared->cache.contig.sieve_dirty) {
+ HDassert(dataset->shared->layout.type != H5D_COMPACT); /* We should never have a sieve buffer for compact storage */
- /* Write dirty data sieve buffer to file */
- if(H5F_block_write(f, H5FD_MEM_DRAW, dataset->shared->cache.contig.sieve_loc,
- dataset->shared->cache.contig.sieve_size, dxpl_id, dataset->shared->cache.contig.sieve_buf) < 0)
- HGOTO_ERROR(H5E_IO, H5E_WRITEERROR, FAIL, "block write failed")
+ /* Write dirty data sieve buffer to file */
+ if(H5F_block_write(udata->f, H5FD_MEM_DRAW, dataset->shared->cache.contig.sieve_loc,
+ dataset->shared->cache.contig.sieve_size, udata->dxpl_id, dataset->shared->cache.contig.sieve_buf) < 0)
+ HGOTO_ERROR(H5E_IO, H5E_WRITEERROR, FAIL, "block write failed")
- /* Reset sieve buffer dirty flag */
- dataset->shared->cache.contig.sieve_dirty = FALSE;
- } /* end if */
+ /* Reset sieve buffer dirty flag */
+ dataset->shared->cache.contig.sieve_dirty = FALSE;
+ } /* end if */
- /* Flush cached information for each kind of dataset */
- switch(dataset->shared->layout.type) {
- case H5D_CONTIGUOUS:
- break;
+ /* Flush cached information for each kind of dataset */
+ switch(dataset->shared->layout.type) {
+ case H5D_CONTIGUOUS:
+ break;
- case H5D_CHUNKED:
- /* Flush the raw data cache */
- if(H5D_istore_flush(dataset, dxpl_id, flags & H5F_FLUSH_INVALIDATE) < 0)
- HGOTO_ERROR(H5E_CACHE, H5E_CANTFLUSH, FAIL, "unable to flush raw data cache")
- break;
+ case H5D_CHUNKED:
+ /* Flush the raw data cache */
+ if(H5D_istore_flush(dataset, udata->dxpl_id, udata->flags & H5F_FLUSH_INVALIDATE) < 0)
+ HGOTO_ERROR(H5E_CACHE, H5E_CANTFLUSH, FAIL, "unable to flush raw data cache")
+ break;
- case H5D_COMPACT:
- if(dataset->shared->layout.u.compact.dirty) {
- if(H5O_msg_write(&(dataset->oloc), H5O_LAYOUT_ID, 0, H5O_UPDATE_TIME, &(dataset->shared->layout), dxpl_id) < 0)
- HGOTO_ERROR(H5E_FILE, H5E_CANTINIT, FAIL, "unable to update layout message")
- dataset->shared->layout.u.compact.dirty = FALSE;
- } /* end if */
- break;
+ case H5D_COMPACT:
+ if(dataset->shared->layout.u.compact.dirty) {
+ if(H5O_msg_write(&(dataset->oloc), H5O_LAYOUT_ID, 0, H5O_UPDATE_TIME, &(dataset->shared->layout), udata->dxpl_id) < 0)
+ HGOTO_ERROR(H5E_FILE, H5E_CANTINIT, FAIL, "unable to update layout message")
+ dataset->shared->layout.u.compact.dirty = FALSE;
+ } /* end if */
+ break;
- default:
- HDassert("not implemented yet" && 0);
+ default:
+ HDassert("not implemented yet" && 0);
#ifdef NDEBUG
- HGOTO_ERROR(H5E_IO, H5E_UNSUPPORTED, FAIL, "unsupported storage layout")
+ HGOTO_ERROR(H5E_IO, H5E_UNSUPPORTED, FAIL, "unsupported storage layout")
#endif /* NDEBUG */
- } /* end switch */ /*lint !e788 All appropriate cases are covered */
- } /* end for */
+ } /* end switch */ /*lint !e788 All appropriate cases are covered */
} /* end if */
done:
- if(id_list)
- H5MM_xfree(id_list);
+ FUNC_LEAVE_NOAPI(ret_value)
+} /* end H5D_flush_cb() */
+
+
+/*-------------------------------------------------------------------------
+ * Function: H5D_flush
+ *
+ * Purpose: Flush any dataset information cached in memory
+ *
+ * Return: Success: Non-negative
+ * Failure: Negative
+ *
+ * Programmer: Ray Lu
+ * August 14, 2002
+ *
+ *-------------------------------------------------------------------------
+ */
+herr_t
+H5D_flush(const H5F_t *f, hid_t dxpl_id, unsigned flags)
+{
+ H5D_flush_ud_t udata; /* User data for callback */
+ herr_t ret_value = SUCCEED; /* Return value */
+
+ FUNC_ENTER_NOAPI(H5D_flush, FAIL)
+
+ /* Check args */
+ HDassert(f);
+
+ /* Set user data for callback */
+ udata.f = f;
+ udata.dxpl_id = dxpl_id;
+ udata.flags = flags;
+
+ /* Iterate over all the open datasets */
+ H5I_search(H5I_DATASET, H5D_flush_cb, &udata);
+
+done:
FUNC_LEAVE_NOAPI(ret_value)
} /* end H5D_flush() */
diff --git a/src/H5Dpkg.h b/src/H5Dpkg.h
index cdcc362..34a32ee 100644
--- a/src/H5Dpkg.h
+++ b/src/H5Dpkg.h
@@ -154,6 +154,7 @@ typedef struct H5D_shared_t {
hid_t type_id; /* ID for dataset's datatype */
H5T_t *type; /* datatype of this dataset */
H5S_t *space; /* dataspace of this dataset */
+ hbool_t space_dirty; /* Whether the dataspace info needs to be flushed to the file */
hid_t dcpl_id; /* dataset creation property id */
H5D_dcpl_cache_t dcpl_cache; /* Cached DCPL values */
H5D_io_ops_t io_ops; /* I/O operations */