summaryrefslogtreecommitdiffstats
path: root/test
diff options
context:
space:
mode:
authorjhendersonHDF <jhenderson@hdfgroup.org>2024-01-23 16:21:59 (GMT)
committerGitHub <noreply@github.com>2024-01-23 16:21:59 (GMT)
commitf86fe61c7f6fa43cc16d555f9c925e43baa3de8f (patch)
treecd51adf099e654b280297a184e7a3480dc8d8ed8 /test
parent7e48d4f767f1cea64b7642db39a9d38c2c2eda13 (diff)
downloadhdf5-f86fe61c7f6fa43cc16d555f9c925e43baa3de8f.zip
hdf5-f86fe61c7f6fa43cc16d555f9c925e43baa3de8f.tar.gz
hdf5-f86fe61c7f6fa43cc16d555f9c925e43baa3de8f.tar.bz2
Remove cached datatype conversion path table entries on file close (#3942)
Remove cached datatype conversion path table entries on file close When performing datatype conversions during I/O, the library checks to see whether it can re-use a cached datatype conversion pathway by performing comparisons between the source and destination datatypes of the current operation and the source and destination datatypes associated with each cached datatype conversion pathway. For variable-length and reference datatypes, a comparison is made between the VOL object for the file associated with these datatypes, which may change as a file is closed and reopened. In workflows involving a loop that opens a file, performs I/O on an object with a variable-length or reference datatype and then closes the file, this can lead to constant memory usage growth as the library compares the file VOL objects between the datatypes as different and adds a new cached conversion pathway entry on each iteration during I/O. This is now fixed by clearing out any cached conversion pathway entries for variable-length or reference datatypes associated with a particular file when that file is closed.
Diffstat (limited to 'test')
-rw-r--r--test/tmisc.c190
1 files changed, 190 insertions, 0 deletions
diff --git a/test/tmisc.c b/test/tmisc.c
index a8103af..ddebc3d 100644
--- a/test/tmisc.c
+++ b/test/tmisc.c
@@ -21,6 +21,7 @@
*************************************************************/
#define H5D_FRIEND /*suppress error about including H5Dpkg */
+#define H5T_FRIEND /*suppress error about including H5Tpkg */
/* Define this macro to indicate that the testing APIs should be available */
#define H5D_TESTING
@@ -28,6 +29,7 @@
#include "testhdf5.h"
#include "H5srcdir.h"
#include "H5Dpkg.h" /* Datasets */
+#include "H5Tpkg.h" /* Datatypes */
#include "H5MMprivate.h" /* Memory */
/* Definitions for misc. test #1 */
@@ -335,6 +337,8 @@ typedef struct {
See https://nvd.nist.gov/vuln/detail/CVE-2020-10812 */
#define CVE_2020_10812_FILENAME "cve_2020_10812.h5"
+#define MISC38_FILE "type_conversion_path_table_issue.h5"
+
/****************************************************************
**
** test_misc1(): test unlinking a dataset from a group and immediately
@@ -6259,6 +6263,190 @@ test_misc37(void)
/****************************************************************
**
+** test_misc38():
+** Test for issue where the type conversion path table cache
+** would grow continuously when variable-length datatypes
+** are involved due to file VOL object comparisons causing
+** the library not to reuse type conversion paths
+**
+****************************************************************/
+static void
+test_misc38(void)
+{
+ H5VL_object_t *file_vol_obj = NULL;
+ const char *buf[] = {"attr_value"};
+ herr_t ret = SUCCEED;
+ hid_t file_id = H5I_INVALID_HID;
+ hid_t attr_id = H5I_INVALID_HID;
+ hid_t str_type = H5I_INVALID_HID;
+ hid_t space_id = H5I_INVALID_HID;
+ int init_npaths = 0;
+ int *irbuf = NULL;
+ char **rbuf = NULL;
+ bool vol_is_native;
+
+ /* Output message about test being performed */
+ MESSAGE(5, ("Fix for type conversion path table issue"));
+
+ /*
+ * Get the initial number of type conversion path table
+ * entries that are currently defined
+ */
+ init_npaths = H5T__get_path_table_npaths();
+
+ file_id = H5Fcreate(MISC38_FILE, H5F_ACC_TRUNC, H5P_DEFAULT, H5P_DEFAULT);
+ CHECK(file_id, H5I_INVALID_HID, "H5Fcreate");
+
+ /* Check if native VOL is being used */
+ CHECK(h5_using_native_vol(H5P_DEFAULT, file_id, &vol_is_native), FAIL, "h5_using_native_vol");
+ if (!vol_is_native) {
+ CHECK(H5Fclose(file_id), FAIL, "H5Fclose");
+ MESSAGE(5, (" -- SKIPPED --\n"));
+ return;
+ }
+
+ /* Retrieve file's VOL object field for further use */
+ file_vol_obj = H5F_VOL_OBJ((H5F_t *)H5VL_object(file_id));
+
+ /*
+ * Check reference count of file's VOL object field. At this point,
+ * the object should have a reference count of 1 since the file
+ * was just created.
+ */
+ VERIFY(file_vol_obj->rc, 1, "checking reference count");
+
+ str_type = H5Tcopy(H5T_C_S1);
+ CHECK(str_type, H5I_INVALID_HID, "H5Tcopy");
+
+ ret = H5Tset_size(str_type, H5T_VARIABLE);
+ CHECK(ret, FAIL, "H5Tset_size");
+
+ space_id = H5Screate(H5S_SCALAR);
+ CHECK(space_id, H5I_INVALID_HID, "H5Screate");
+
+ /*
+ * Check the number of type conversion path table entries currently
+ * stored in the cache. It shouldn't have changed yet.
+ */
+ VERIFY(H5T__get_path_table_npaths(), init_npaths,
+ "checking number of type conversion path table entries");
+
+ attr_id = H5Acreate2(file_id, "attribute", str_type, space_id, H5P_DEFAULT, H5P_DEFAULT);
+ CHECK(attr_id, H5I_INVALID_HID, "H5Acreate2");
+
+ /*
+ * Check the number of type conversion path table entries currently
+ * stored in the cache. It shouldn't have changed yet.
+ */
+ VERIFY(H5T__get_path_table_npaths(), init_npaths,
+ "checking number of type conversion path table entries");
+
+ /*
+ * Check reference count of file's VOL object field. At this point,
+ * the object should have a reference count of 2. Creating the
+ * attribute on the dataset will have caused a H5T_set_loc call that
+ * associates the attribute's datatype with the file's VOL object
+ * and will have incremented the reference count by 1.
+ */
+ VERIFY(file_vol_obj->rc, 2, "checking reference count");
+
+ ret = H5Awrite(attr_id, str_type, buf);
+ CHECK(ret, FAIL, "H5Awrite");
+
+ /*
+ * Check the number of type conversion path table entries currently
+ * stored in the cache. The H5Awrite call should have added a new
+ * type conversion path. Note that if another test in this file uses
+ * the same conversion path, this check may fail and need to be
+ * refactored.
+ */
+ VERIFY(H5T__get_path_table_npaths(), init_npaths + 1,
+ "checking number of type conversion path table entries");
+
+ /*
+ * Check reference count of file's VOL object field. At this point,
+ * the object should have a reference count of 3. Writing to the
+ * variable-length typed attribute will have caused an H5T_convert
+ * call that ends up incrementing the reference count of the
+ * associated file's VOL object.
+ */
+ VERIFY(file_vol_obj->rc, 3, "checking reference count");
+
+ ret = H5Aclose(attr_id);
+ CHECK(ret, FAIL, "H5Aclose");
+ ret = H5Fclose(file_id);
+ CHECK(ret, FAIL, "H5Fclose");
+
+ irbuf = malloc(100 * 100 * sizeof(int));
+ CHECK_PTR(irbuf, "int read buf allocation");
+ rbuf = malloc(sizeof(char *));
+ CHECK_PTR(rbuf, "varstr read buf allocation");
+
+ for (size_t i = 0; i < 10; i++) {
+ file_id = H5Fopen(MISC38_FILE, H5F_ACC_RDONLY, H5P_DEFAULT);
+ CHECK(file_id, H5I_INVALID_HID, "H5Fopen");
+
+ /* Retrieve file's VOL object field for further use */
+ file_vol_obj = H5F_VOL_OBJ((H5F_t *)H5VL_object(file_id));
+
+ /*
+ * Check reference count of file's VOL object field. At this point,
+ * the object should have a reference count of 1 since the file
+ * was just opened.
+ */
+ VERIFY(file_vol_obj->rc, 1, "checking reference count");
+
+ attr_id = H5Aopen(file_id, "attribute", H5P_DEFAULT);
+ CHECK(attr_id, H5I_INVALID_HID, "H5Aopen");
+
+ /*
+ * Check reference count of file's VOL object field. At this point,
+ * the object should have a reference count of 2 since opening
+ * the attribute will also have associated its type with the file's
+ * VOL object.
+ */
+ VERIFY(file_vol_obj->rc, 2, "checking reference count");
+
+ ret = H5Aread(attr_id, str_type, rbuf);
+ CHECK(ret, FAIL, "H5Aread");
+
+ /*
+ * Check the number of type conversion path table entries currently
+ * stored in the cache. Each H5Aread call shouldn't cause this number
+ * to go up, as the library should have removed the cached conversion
+ * paths on file close.
+ */
+ VERIFY(H5T__get_path_table_npaths(), init_npaths + 1,
+ "checking number of type conversion path table entries");
+
+ /*
+ * Check reference count of file's VOL object field. At this point,
+ * the object should have a reference count of 3. Writing to the
+ * variable-length typed attribute will have caused an H5T_convert
+ * call that ends up incrementing the reference count of the
+ * associated file's VOL object.
+ */
+ VERIFY(file_vol_obj->rc, 3, "checking reference count");
+
+ ret = H5Treclaim(str_type, space_id, H5P_DEFAULT, rbuf);
+
+ ret = H5Aclose(attr_id);
+ CHECK(ret, FAIL, "H5Aclose");
+ ret = H5Fclose(file_id);
+ CHECK(ret, FAIL, "H5Fclose");
+ }
+
+ free(irbuf);
+ free(rbuf);
+
+ ret = H5Tclose(str_type);
+ CHECK(ret, FAIL, "H5Tclose");
+ ret = H5Sclose(space_id);
+ CHECK(ret, FAIL, "H5Sclose");
+}
+
+/****************************************************************
+**
** test_misc(): Main misc. test routine.
**
****************************************************************/
@@ -6325,6 +6513,7 @@ test_misc(void)
test_misc35(); /* Test behavior of free-list & allocation statistics API calls */
test_misc36(); /* Exercise H5atclose and H5is_library_terminating */
test_misc37(); /* Test for seg fault failure at file close */
+ test_misc38(); /* Test for type conversion path table issue */
} /* test_misc() */
@@ -6380,6 +6569,7 @@ cleanup_misc(void)
#ifndef H5_NO_DEPRECATED_SYMBOLS
H5Fdelete(MISC31_FILE, H5P_DEFAULT);
#endif /* H5_NO_DEPRECATED_SYMBOLS */
+ H5Fdelete(MISC38_FILE, H5P_DEFAULT);
}
H5E_END_TRY
} /* end cleanup_misc() */