path: root/test/swmr_sparse_writer.c
author    Neil Fortner <nfortne2@hdfgroup.org>    2012-02-27 16:34:55 (GMT)
committer Neil Fortner <nfortne2@hdfgroup.org>    2012-02-27 16:34:55 (GMT)
commit    73c139e29b45941dfc4e558d9096a0869a184260 (patch)
tree      422cc12e6675238cd92edadc078fa427a4f6bcd0    /test/swmr_sparse_writer.c
parent    e2cd00055204f6b264002e70b21a6e2ca4c98c77 (diff)
[svn-r21989] Purpose: Add SWMR capability to v1 b-tree
Description: Adds SWMR capability to v1 b-trees and to the chunk index that uses v1 b-trees. With this implementation, flush dependencies are always on while the nodes are in the cache. This will allow attributes to be used for "checkpointing" data once object header dependencies are fixed: if a writer writes data before writing an attribute in that dataset's object header, then a reader that sees the updated attribute is guaranteed to see the written data, as long as that dataset's b-tree nodes have been evicted from the reader's cache. Also adds support for compression with SWMR. Also fixes the earray implementation to not free (reuse) the file space for deleted chunks and for outdated versions of compressed chunks when doing SWMR writes; this space should eventually be added to a timeout list. Adds testing for these cases.
Tested: durandal
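For illustration, a minimal reader-side sketch of the attribute-based checkpointing described above. The function, dataset name, and target record index are hypothetical, and the H5F_ACC_SWMR_READ open flag is assumed to be the read-side counterpart of the H5F_ACC_SWMR_WRITE flag used in the writer below; none of this is part of the commit itself.

    #include "hdf5.h"

    /* Hypothetical reader-side check: returns 1 if the record at index
     * 'target_rec' is guaranteed visible, 0 if not yet, -1 on error */
    static int
    record_visible(const char *filename, const char *dsetname, unsigned long target_rec)
    {
        hid_t fid;          /* File ID */
        hid_t did;          /* Dataset ID */
        hid_t aid;          /* Attribute ID */
        unsigned long seq;  /* Sequence number written by the writer */

        /* Open the file for SWMR reading (assumed read-side flag) */
        if((fid = H5Fopen(filename, H5F_ACC_RDONLY | H5F_ACC_SWMR_READ, H5P_DEFAULT)) < 0)
            return(-1);

        /* Open the dataset and the "seq" attribute the writer updates
         * after each record */
        if((did = H5Dopen2(fid, dsetname, H5P_DEFAULT)) < 0)
            return(-1);
        if((aid = H5Aopen(did, "seq", H5P_DEFAULT)) < 0)
            return(-1);
        if(H5Aread(aid, H5T_NATIVE_ULONG, &seq) < 0)
            return(-1);

        /* Close objects */
        if(H5Aclose(aid) < 0 || H5Dclose(did) < 0 || H5Fclose(fid) < 0)
            return(-1);

        /* Because the writer writes each record before updating "seq", and
         * the flush dependencies added by this commit preserve that ordering
         * in the file, seeing seq >= target_rec implies the record's data is
         * visible to this reader */
        return(seq >= target_rec ? 1 : 0);
    }

The writer below stores its random seed in a file-level "seed" attribute, so a reader that uses the same seed can regenerate the same sequence of dataset and offset choices and knows which record index to compare against.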
Diffstat (limited to 'test/swmr_sparse_writer.c')
-rw-r--r--  test/swmr_sparse_writer.c  345
1 files changed, 345 insertions, 0 deletions
diff --git a/test/swmr_sparse_writer.c b/test/swmr_sparse_writer.c
new file mode 100644
index 0000000..97e2674
--- /dev/null
+++ b/test/swmr_sparse_writer.c
@@ -0,0 +1,345 @@
+#include "swmr_common.h"
+
+#define BUSY_WAIT 100000
+
+static hid_t
+open_skeleton(const char *filename, unsigned verbose)
+{
+ hid_t fid; /* File ID for new HDF5 file */
+ hid_t fapl; /* File access property list */
+ hid_t aid; /* Attribute ID */
+ unsigned seed; /* Seed for random number generator */
+ unsigned u, v; /* Local index variables */
+
+ /* Create file access property list */
+ if((fapl = H5Pcreate(H5P_FILE_ACCESS)) < 0)
+ return(-1);
+
+#ifdef QAK
+/* Increase the initial size of the metadata cache */
+{
+ H5AC_cache_config_t mdc_config;
+
+ mdc_config.version = H5AC__CURR_CACHE_CONFIG_VERSION;
+ H5Pget_mdc_config(fapl, &mdc_config);
+printf("mdc_config.initial_size = %lu\n", (unsigned long)mdc_config.initial_size);
+printf("mdc_config.epoch_length = %lu\n", (unsigned long)mdc_config.epoch_length);
+ mdc_config.set_initial_size = 1;
+ mdc_config.initial_size = 16 * 1024 * 1024;
+/* mdc_config.epoch_length = 5000; */
+ H5Pset_mdc_config(fapl, &mdc_config);
+}
+#endif /* QAK */
+
+#ifdef QAK
+ H5Pset_fapl_log(fapl, "append.log", H5FD_LOG_ALL, (size_t)(512 * 1024 * 1024));
+#endif /* QAK */
+
+ /* Open the file */
+ if((fid = H5Fopen(filename, H5F_ACC_RDWR | H5F_ACC_SWMR_WRITE, fapl)) < 0)
+ return(-1);
+
+ /* Close file access property list */
+ if(H5Pclose(fapl) < 0)
+ return(-1);
+
+ /* Emit informational message */
+ if(verbose)
+ printf("Opening datasets\n");
+
+ /* Seed the random number generator with the attribute in the file */
+ if((aid = H5Aopen(fid, "seed", H5P_DEFAULT)) < 0)
+ return(-1);
+ if(H5Aread(aid, H5T_NATIVE_UINT, &seed) < 0)
+ return(-1);
+ if(H5Aclose(aid) < 0)
+ return(-1);
+ srandom(seed);
+
+ /* Open the datasets */
+ for(u = 0; u < NLEVELS; u++)
+ for(v = 0; v < symbol_count[u]; v++) {
+ if((symbol_info[u][v].dsid = H5Dopen2(fid, symbol_info[u][v].name, H5P_DEFAULT)) < 0)
+ return(-1);
+ symbol_info[u][v].nrecords = 0;
+ } /* end for */
+
+ return(fid);
+}
+
+static int
+add_records(hid_t fid, unsigned verbose, unsigned long nrecords, unsigned long flush_count)
+{
+ hid_t tid; /* Datatype ID for records */
+ hid_t mem_sid; /* Memory dataspace ID */
+ hsize_t start, count = 1; /* Hyperslab selection values */
+ symbol_t record; /* The record to add to the dataset */
+ H5AC_cache_config_t mdc_config_orig; /* Original metadata cache configuration */
+ H5AC_cache_config_t mdc_config_cork; /* Corked metadata cache configuration */
+ unsigned long rec_to_flush; /* # of records left to write before flush */
+ volatile int dummy; /* Dummy variable for busy wait */
+ unsigned long u, v; /* Local index variables */
+
+ /* Reset the record */
+ /* (record's 'info' field might need to change for each record written, also) */
+ memset(&record, 0, sizeof(record));
+
+ /* Create a dataspace for the record to add */
+ if((mem_sid = H5Screate(H5S_SCALAR)) < 0)
+ return(-1);
+
+ /* Create datatype for appending records */
+ if((tid = create_symbol_datatype()) < 0)
+ return(-1);
+
+ /* Get the current metadata cache configuration, and set up the corked
+ * configuration */
+ mdc_config_orig.version = H5AC__CURR_CACHE_CONFIG_VERSION;
+ if(H5Fget_mdc_config(fid, &mdc_config_orig) < 0)
+ return(-1);
+ memcpy(&mdc_config_cork, &mdc_config_orig, sizeof(mdc_config_cork));
+ mdc_config_cork.evictions_enabled = FALSE;
+ mdc_config_cork.incr_mode = H5C_incr__off;
+ mdc_config_cork.flash_incr_mode = H5C_flash_incr__off;
+ mdc_config_cork.decr_mode = H5C_decr__off;
+
+ /* Add records to random datasets, according to frequency distribution */
+ rec_to_flush = flush_count;
+ for(u = 0; u < nrecords; u++) {
+ symbol_info_t *symbol; /* Symbol to write record to */
+ hid_t file_sid; /* Dataset's space ID */
+ hid_t aid; /* Attribute ID */
+
+ /* Get a random dataset, according to the symbol distribution */
+ symbol = choose_dataset();
+
+ /* Cork the metadata cache, to prevent the object header from being
+ * flushed before the data has been written */
+ /*if(H5Fset_mdc_config(fid, &mdc_config_cork) < 0)
+ return(-1);*/
+
+ /* If this is the first time the dataset has been opened, extend it and
+ * add the sequence attribute */
+ if(symbol->nrecords == 0) {
+ symbol->nrecords = nrecords / 5;
+
+ if(H5Dset_extent(symbol->dsid, &symbol->nrecords) < 0)
+ return(-1);
+
+ if((file_sid = H5Screate(H5S_SCALAR)) < 0)
+ return(-1);
+ if((aid = H5Acreate2(symbol->dsid, "seq", H5T_NATIVE_ULONG, file_sid, H5P_DEFAULT, H5P_DEFAULT)) < 0)
+ return(-1);
+ if(H5Sclose(file_sid) < 0)
+ return(-1);
+ } /* end if */
+ else if((aid = H5Aopen(symbol->dsid, "seq", H5P_DEFAULT)) < 0)
+ return(-1);
+
+ /* Get the coordinate to write */
+ start = (hsize_t)random() % symbol->nrecords;
+
+ /* Set the record's ID (equal to its position) */
+ record.rec_id = start;
+
+ /* Extend the dataset's dataspace to hold the new record */
+ symbol->nrecords++;
+ if(H5Dset_extent(symbol->dsid, &symbol->nrecords) < 0)
+ return(-1);
+
+ /* Get the dataset's dataspace */
+ if((file_sid = H5Dget_space(symbol->dsid)) < 0)
+ return(-1);
+
+ /* Choose the last record in the dataset */
+ if(H5Sselect_hyperslab(file_sid, H5S_SELECT_SET, &start, NULL, &count, NULL) < 0)
+ return(-1);
+
+ /* Write record to the dataset */
+ if(H5Dwrite(symbol->dsid, tid, mem_sid, file_sid, H5P_DEFAULT, &record) < 0)
+ return(-1);
+
+ /* Write the sequence number attribute. Since we synchronize the random
+ * number seed, the readers will always generate the same sequence of
+ * randomly chosen datasets and offsets. Therefore, and because of the
+ * flush dependencies on the object header, the reader will be
+ * guaranteed to see the written data if the sequence attribute is >=u.
+ */
+ if(H5Awrite(aid, H5T_NATIVE_ULONG, &u) < 0)
+ return(-1);
+
+ /* Close the attribute */
+ if(H5Aclose(aid) < 0)
+ return(-1);
+
+ /* Uncork the metadata cache */
+ /*if(H5Fset_mdc_config(fid, &mdc_config_orig) < 0)
+ return(-1);*/
+
+ /* Close the dataset's dataspace */
+ if(H5Sclose(file_sid) < 0)
+ return(-1);
+
+ /* Check for flushing file */
+ if(flush_count > 0) {
+ /* Decrement count of records to write before flushing */
+ rec_to_flush--;
+
+ /* Check for counter being reached */
+ if(0 == rec_to_flush) {
+ /* Flush contents of file */
+ if(H5Fflush(fid, H5F_SCOPE_GLOBAL) < 0)
+ return(-1);
+
+ /* Reset flush counter */
+ rec_to_flush = flush_count;
+ } /* end if */
+ } /* end if */
+
+ /* Busy wait, to let readers catch up */
+ dummy = 0;
+ for(v = 0; v < BUSY_WAIT; v++)
+ dummy++;
+ if((unsigned long)dummy != v)
+ return(-1);
+ } /* end for */
+
+ /* Close the memory dataspace */
+ if(H5Sclose(mem_sid) < 0)
+ return(-1);
+
+ /* Close the datatype */
+ if(H5Tclose(tid) < 0)
+ return(-1);
+
+ /* Emit informational message */
+ if(verbose)
+ printf("Closing datasets\n");
+
+ /* Close the datasets */
+ for(u = 0; u < NLEVELS; u++)
+ for(v = 0; v < symbol_count[u]; v++)
+ if(H5Dclose(symbol_info[u][v].dsid) < 0)
+ return(-1);
+
+ return(0);
+}
+
+static void
+usage(void)
+{
+ printf("Usage error!\n");
+ printf("Usage: swmr_sparse_writer [-q] [-f <# of records to write between flushing file contents>] <# of records>\n");
+ printf("<# of records to write between flushing file contents> should be 0 (for no flushing) or between 1 and (<# of records> - 1)\n");
+ printf("Defaults to verbose (no '-q' given) and flushing every 1000 records('-f 1000')\n");
+ exit(1);
+}
+
+int main(int argc, const char *argv[])
+{
+ hid_t fid; /* File ID for file opened */
+ long nrecords = 0; /* # of records to append */
+ long flush_count = 1000; /* # of records to write between flushing file */
+ unsigned verbose = 1; /* Whether to emit some informational messages */
+ unsigned u; /* Local index variable */
+
+ /* Parse command line options */
+ if(argc < 2)
+ usage();
+ if(argc > 1) {
+ u = 1;
+ while(u < (unsigned)argc) {
+ if(argv[u][0] == '-') {
+ switch(argv[u][1]) {
+ /* # of records to write between flushing file */
+ case 'f':
+ flush_count = atol(argv[u + 1]);
+ if(flush_count < 0)
+ usage();
+ u += 2;
+ break;
+
+ /* Be quiet */
+ case 'q':
+ verbose = 0;
+ u++;
+ break;
+
+ default:
+ usage();
+ break;
+ } /* end switch */
+ } /* end if */
+ else {
+ /* Get the number of records to append */
+ nrecords = atol(argv[u]);
+ if(nrecords <= 0)
+ usage();
+
+ u++;
+ } /* end else */
+ } /* end while */
+ } /* end if */
+ if(nrecords <= 0)
+ usage();
+ if(flush_count >= nrecords)
+ usage();
+
+ /* Emit informational message */
+ if(verbose) {
+ printf("Parameters:\n");
+ printf("\t# of records between flushes = %ld\n", flush_count);
+ printf("\t# of records to write = %ld\n", nrecords);
+ } /* end if */
+
+ /* Emit informational message */
+ if(verbose)
+ printf("Generating symbol names\n");
+
+ /* Generate dataset names */
+ if(generate_symbols() < 0)
+ return(-1);
+
+ /* Emit informational message */
+ if(verbose)
+ printf("Opening skeleton file: %s\n", FILENAME);
+
+ /* Open file skeleton */
+ if((fid = open_skeleton(FILENAME, verbose)) < 0) {
+ printf("Error opening skeleton file!\n");
+ exit(1);
+ } /* end if */
+
+ /* Emit informational message */
+ if(verbose)
+ printf("Adding records\n");
+
+ /* Append records to datasets */
+ if(add_records(fid, verbose, (unsigned long)nrecords, (unsigned long)flush_count) < 0) {
+ printf("Error appending records to datasets!\n");
+ exit(1);
+ } /* end if */
+
+ /* Emit informational message */
+ if(verbose)
+ printf("Releasing symbols\n");
+
+ /* Clean up the symbols */
+ if(shutdown_symbols() < 0) {
+ printf("Error releasing symbols!\n");
+ exit(1);
+ } /* end if */
+
+ /* Emit informational message */
+ if(verbose)
+ printf("Closing objects\n");
+
+ /* Close objects opened */
+ if(H5Fclose(fid) < 0) {
+ printf("Error closing file!\n");
+ exit(1);
+ } /* end if */
+
+ return(0);
+}
+
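For reference, an invocation following the usage() text above might look like this; the record counts are arbitrary example values:

    ./swmr_sparse_writer -f 1000 20000    (write 20000 records, flushing every 1000 records)
    ./swmr_sparse_writer -q 5000          (quiet mode, 5000 records, default flush interval of 1000)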