You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
465 lines
15 KiB
465 lines
15 KiB
/* This is part of the netCDF package.
|
|
Copyright 2018 University Corporation for Atmospheric Research/Unidata
|
|
See COPYRIGHT file for conditions of use.
|
|
|
|
Test netcdf-4 chunking.
|
|
Ed Hartnett, Dennis Heimbigner
|
|
modified version of nc_test4/tst_chunks2.c
|
|
*/
|
|
|
|
#include "ut_includes.h"
|
|
#include "test_nczarr_utils.h"
|
|
|
|
#define FILE_NAME "tst_chunks2"
|
|
#define MAX_WASTE 25.0
|
|
#define NUM_RANDOM_TESTS 3
|
|
#define NDIMS3 3
|
|
|
|
/* Calculate the waste of the chunking. A waste of 10% means the
|
|
* chunked data is 10% larger then the unchunked data. */
|
|
static int
|
|
calculate_waste(int ndims, size_t *dimlen, size_t *chunksize, float *waste)
|
|
{
|
|
int d;
|
|
float chunked = 1, unchunked = 1;
|
|
size_t *num_chunks;
|
|
size_t chunk_size = 1;
|
|
|
|
assert(waste && dimlen && chunksize && ndims);
|
|
if (!(num_chunks = calloc(ndims, sizeof(size_t)))) ERR;
|
|
|
|
#ifdef PRINT_CHUNK_WASTE_REPORT
|
|
printf("\n");
|
|
#endif
|
|
/* Caclulate the total space taken up by the chunked data. */
|
|
for (d = 0; d < ndims; d++)
|
|
{
|
|
/* How many chunks along this dimension are required to hold all the data? */
|
|
for (num_chunks[d] = 0; (num_chunks[d] * chunksize[d]) < (dimlen[d] ? dimlen[d] : 1);
|
|
num_chunks[d]++)
|
|
;
|
|
chunked *= (num_chunks[d] * chunksize[d]);
|
|
}
|
|
|
|
/* Calculate the minimum space required for this data
|
|
* (i.e. unchunked) or one record of it. */
|
|
for (d = 0; d < ndims; d++)
|
|
unchunked *= (dimlen[d] ? dimlen[d] : 1);
|
|
|
|
#ifdef PRINT_CHUNK_WASTE_REPORT
|
|
printf("size for unchunked %g elements; size for chunked %g elements\n",
|
|
unchunked, chunked);
|
|
#endif
|
|
|
|
/* Percent of the chunked file that is wasted space. */
|
|
*waste = ((float)(chunked - unchunked) / (float)chunked) * 100.0;
|
|
|
|
#ifdef PRINT_CHUNK_WASTE_REPORT
|
|
printf("\ndimlen\tchunksize\tnum_chunks\n");
|
|
#endif
|
|
for (d = 0; d < ndims; d++)
|
|
{
|
|
#ifdef PRINT_CHUNK_WASTE_REPORT
|
|
printf("%ld\t%ld\t\t%ld\n", (long int)dimlen[d], (long int)chunksize[d],
|
|
(long int)num_chunks[d]);
|
|
#endif
|
|
chunk_size *= chunksize[d];
|
|
}
|
|
#ifdef PRINT_CHUNK_WASTE_REPORT
|
|
printf("size of chunk: %ld elements; wasted space: %2.2f percent\n",
|
|
(long int)chunk_size, *waste);
|
|
#endif
|
|
|
|
free(num_chunks);
|
|
return 0;
|
|
}
|
|
|
|
int
|
|
main(int argc, char **argv)
|
|
{
|
|
processoptions(argc,argv,FILE_NAME);
|
|
|
|
printf("\n*** Testing netcdf-4 variable chunking.\n");
|
|
printf("**** testing default chunksizes...");
|
|
{
|
|
#define NDIMS3 3
|
|
#define NUM_VARS 1
|
|
#define Y_NAME "y"
|
|
#define X_NAME "x"
|
|
#define Z_NAME "z"
|
|
#define VAR_NAME_JOE "joe"
|
|
#define XDIM_LEN 2
|
|
#define YDIM_LEN 5
|
|
#define ZDIM_LEN 3000
|
|
|
|
int varid, ncid, dims[NDIMS3], dims_in[NDIMS3];
|
|
int ndims, nvars, ngatts, unlimdimid, natts;
|
|
char name_in[NC_MAX_NAME + 1];
|
|
nc_type type_in;
|
|
size_t len_in[NDIMS3];
|
|
int storage = 0;
|
|
size_t chunksizes[NDIMS3];
|
|
float waste = 0;
|
|
|
|
/* Create a file with 3D var, turn on chunking, but don't provide chunksizes. */
|
|
if (nc_create(itoptions.path, NC_NETCDF4 | NC_CLOBBER, &ncid)) ERR;
|
|
if (nc_def_dim(ncid, X_NAME, XDIM_LEN, &dims[0])) ERR;
|
|
if (nc_def_dim(ncid, Y_NAME, YDIM_LEN, &dims[1])) ERR;
|
|
if (nc_def_dim(ncid, Z_NAME, ZDIM_LEN, &dims[2])) ERR;
|
|
if (nc_def_var(ncid, VAR_NAME_JOE, NC_FLOAT, NDIMS3, dims, &varid)) ERR;
|
|
if (nc_def_var_chunking(ncid, 0, NC_CHUNKED, NULL)) ERR;
|
|
|
|
/* Check it out. */
|
|
if (nc_inq(ncid, &ndims, &nvars, &ngatts, &unlimdimid)) ERR;
|
|
if (nvars != NUM_VARS || ndims != NDIMS3 || ngatts != 0 || unlimdimid != -1) ERR;
|
|
if (nc_inq_var(ncid, 0, name_in, &type_in, &ndims, dims_in, &natts)) ERR;
|
|
if (strcmp(name_in, VAR_NAME_JOE) || type_in != NC_FLOAT || ndims != NDIMS3 ||
|
|
dims_in[0] != dims[0] || dims_in[1] != dims[1] || dims_in[2] != dims[2] || natts != 0) ERR;
|
|
if (nc_inq_dim(ncid, 0, name_in, &len_in[0])) ERR;
|
|
if (strcmp(name_in, X_NAME) || len_in[0] != XDIM_LEN) ERR;
|
|
if (nc_inq_dim(ncid, 1, name_in, &len_in[1])) ERR;
|
|
if (strcmp(name_in, Y_NAME) || len_in[1] != YDIM_LEN) ERR;
|
|
if (nc_inq_dim(ncid, 2, name_in, &len_in[2])) ERR;
|
|
if (strcmp(name_in, Z_NAME) || len_in[2] != ZDIM_LEN) ERR;
|
|
if (nc_inq_var_chunking(ncid, 0, &storage, chunksizes)) ERR;
|
|
if (storage != NC_CHUNKED) ERR;
|
|
if (nc_close(ncid)) ERR;
|
|
|
|
/* Open the file and check again. */
|
|
if (nc_open(itoptions.path, NC_WRITE, &ncid)) ERR;
|
|
if (nc_inq(ncid, &ndims, &nvars, &ngatts, &unlimdimid)) ERR;
|
|
if (nvars != NUM_VARS || ndims != NDIMS3 || ngatts != 0 || unlimdimid != -1) ERR;
|
|
if (nc_inq_var(ncid, 0, name_in, &type_in, &ndims, dims_in, &natts)) ERR;
|
|
if (strcmp(name_in, VAR_NAME_JOE) || type_in != NC_FLOAT || ndims != NDIMS3 ||
|
|
dims_in[0] != dims[0] || dims_in[1] != dims[1] || dims_in[2] != dims[2] || natts != 0) ERR;
|
|
if (nc_inq_dim(ncid, 0, name_in, &len_in[0])) ERR;
|
|
if (strcmp(name_in, X_NAME) || len_in[0] != XDIM_LEN) ERR;
|
|
if (nc_inq_dim(ncid, 1, name_in, &len_in[1])) ERR;
|
|
if (strcmp(name_in, Y_NAME) || len_in[1] != YDIM_LEN) ERR;
|
|
if (nc_inq_dim(ncid, 2, name_in, &len_in[2])) ERR;
|
|
if (strcmp(name_in, Z_NAME) || len_in[2] != ZDIM_LEN) ERR;
|
|
if (nc_inq_var_chunking(ncid, 0, &storage, chunksizes)) ERR;
|
|
if (storage != NC_CHUNKED) ERR;
|
|
if (calculate_waste(NDIMS3, len_in, chunksizes, &waste)) ERR;
|
|
/*if (waste > MAX_WASTE) ERR;*/
|
|
if (nc_close(ncid)) ERR;
|
|
}
|
|
SUMMARIZE_ERR;
|
|
printf("**** testing default chunksizes some more for a 3D var...");
|
|
{
|
|
#define NDIMS3 3
|
|
#define VAR_NAME "op-amp"
|
|
|
|
int varid, ncid;
|
|
int dimids[NDIMS3];
|
|
size_t dim_len[NDIMS3] = {1, 11, 152750};
|
|
|
|
int storage = 0;
|
|
size_t chunksizes[NDIMS3];
|
|
int d;
|
|
char dim_name[NC_MAX_NAME + 1];
|
|
float waste;
|
|
|
|
if (nc_create(itoptions.path, NC_NETCDF4 | NC_CLOBBER, &ncid)) ERR;
|
|
|
|
/* Create a few dimensions. */
|
|
for (d = 0; d < NDIMS3; d++)
|
|
{
|
|
sprintf(dim_name, "dim_%d", d);
|
|
if (nc_def_dim(ncid, dim_name, dim_len[d], &dimids[d])) ERR;
|
|
}
|
|
|
|
/* Define a var with these dimensions, and turn on chunking. */
|
|
if (nc_def_var(ncid, VAR_NAME, NC_FLOAT, NDIMS3, dimids, &varid)) ERR;
|
|
if (nc_def_var_chunking(ncid, varid, NC_CHUNKED, NULL)) ERR;
|
|
|
|
/* Check how default chunking worked. */
|
|
if (nc_inq_var_chunking(ncid, varid, &storage, chunksizes)) ERR;
|
|
if (storage != NC_CHUNKED) ERR;
|
|
if (calculate_waste(NDIMS3, dim_len, chunksizes, &waste)) ERR;
|
|
/* if (waste > MAX_WASTE) ERR;*/
|
|
|
|
if (nc_close(ncid)) ERR;
|
|
|
|
/* Open the file and check. */
|
|
if (nc_open(itoptions.path, NC_WRITE, &ncid)) ERR;
|
|
if (nc_close(ncid)) ERR;
|
|
}
|
|
SUMMARIZE_ERR;
|
|
printf("**** testing default chunksizes even more for a 3D var...");
|
|
{
|
|
int varid, ncid;
|
|
int dimids[NDIMS3];
|
|
size_t dim_len[NDIMS3] = {1804289383, 846930886, 1681692777};
|
|
|
|
int storage = 0;
|
|
size_t chunksizes[NDIMS3];
|
|
int d;
|
|
char dim_name[NC_MAX_NAME + 1];
|
|
float waste;
|
|
|
|
if (nc_create(itoptions.path, NC_NETCDF4 | NC_CLOBBER, &ncid)) ERR;
|
|
|
|
/* Create a few dimensions. */
|
|
for (d = 0; d < NDIMS3; d++)
|
|
{
|
|
sprintf(dim_name, "dim_%d", d);
|
|
if (nc_def_dim(ncid, dim_name, dim_len[d], &dimids[d])) ERR;
|
|
}
|
|
|
|
/* Define a var with these dimensions, and turn on chunking. */
|
|
if (nc_def_var(ncid, VAR_NAME, NC_FLOAT, NDIMS3, dimids, &varid)) ERR;
|
|
if (nc_def_var_chunking(ncid, varid, NC_CHUNKED, NULL)) ERR;
|
|
|
|
/* Check how default chunking worked. */
|
|
if (nc_inq_var_chunking(ncid, varid, &storage, chunksizes)) ERR;
|
|
if (storage != NC_CHUNKED) ERR;
|
|
if (calculate_waste(NDIMS3, dim_len, chunksizes, &waste)) ERR;
|
|
/* if (waste > MAX_WASTE) ERR;*/
|
|
|
|
if (nc_close(ncid)) ERR;
|
|
|
|
/* Open the file and check. */
|
|
if (nc_open(itoptions.path, NC_WRITE, &ncid)) ERR;
|
|
if (nc_close(ncid)) ERR;
|
|
}
|
|
SUMMARIZE_ERR;
|
|
printf("**** testing default chunksizes even even more for a 3D var...");
|
|
{
|
|
int varid, ncid;
|
|
int dimids[NDIMS3];
|
|
size_t dim_len[NDIMS3] = {1714636915, 1957747793, 424238335};
|
|
|
|
int storage = 0;
|
|
size_t chunksizes[NDIMS3];
|
|
int d;
|
|
char dim_name[NC_MAX_NAME + 1];
|
|
float waste;
|
|
|
|
if (nc_create(itoptions.path, NC_NETCDF4 | NC_CLOBBER, &ncid)) ERR;
|
|
|
|
/* Create a few dimensions. */
|
|
for (d = 0; d < NDIMS3; d++)
|
|
{
|
|
sprintf(dim_name, "dim_%d", d);
|
|
if (nc_def_dim(ncid, dim_name, dim_len[d], &dimids[d])) ERR;
|
|
}
|
|
|
|
/* Define a var with these dimensions, and turn on chunking. */
|
|
if (nc_def_var(ncid, VAR_NAME, NC_FLOAT, NDIMS3, dimids, &varid)) ERR;
|
|
if (nc_def_var_chunking(ncid, varid, NC_CHUNKED, NULL)) ERR;
|
|
|
|
/* Check how default chunking worked. */
|
|
if (nc_inq_var_chunking(ncid, varid, &storage, chunksizes)) ERR;
|
|
if (storage != NC_CHUNKED) ERR;
|
|
if (calculate_waste(NDIMS3, dim_len, chunksizes, &waste)) ERR;
|
|
/* if (waste > MAX_WASTE) ERR;*/
|
|
|
|
if (nc_close(ncid)) ERR;
|
|
|
|
/* Open the file and check. */
|
|
if (nc_open(itoptions.path, NC_WRITE, &ncid)) ERR;
|
|
if (nc_close(ncid)) ERR;
|
|
}
|
|
SUMMARIZE_ERR;
|
|
printf("**** testing default chunksizes some more for a 3D var...");
|
|
{
|
|
#define NDIMS3 3
|
|
#define VAR_NAME "op-amp"
|
|
|
|
int varid, ncid;
|
|
int dimids[NDIMS3];
|
|
size_t dim_len[NDIMS3] = {1967513926, 1365180540, 426};
|
|
|
|
int storage = 0;
|
|
size_t chunksizes[NDIMS3];
|
|
int d;
|
|
char dim_name[NC_MAX_NAME + 1];
|
|
float waste;
|
|
|
|
if (nc_create(itoptions.path, NC_NETCDF4 | NC_CLOBBER, &ncid)) ERR;
|
|
|
|
/* Create a few dimensions. */
|
|
for (d = 0; d < NDIMS3; d++)
|
|
{
|
|
sprintf(dim_name, "dim_%d", d);
|
|
if (nc_def_dim(ncid, dim_name, dim_len[d], &dimids[d])) ERR;
|
|
}
|
|
|
|
/* Define a var with these dimensions, and turn on chunking. */
|
|
if (nc_def_var(ncid, VAR_NAME, NC_FLOAT, NDIMS3, dimids, &varid)) ERR;
|
|
if (nc_def_var_chunking(ncid, varid, NC_CHUNKED, NULL)) ERR;
|
|
|
|
/* Check how default chunking worked. */
|
|
if (nc_inq_var_chunking(ncid, varid, &storage, chunksizes)) ERR;
|
|
if (storage != NC_CHUNKED) ERR;
|
|
if (calculate_waste(NDIMS3, dim_len, chunksizes, &waste)) ERR;
|
|
/* if (waste > MAX_WASTE) ERR;*/
|
|
|
|
if (nc_close(ncid)) ERR;
|
|
|
|
/* Open the file and check. */
|
|
if (nc_open(itoptions.path, NC_WRITE, &ncid)) ERR;
|
|
if (nc_close(ncid)) ERR;
|
|
}
|
|
SUMMARIZE_ERR;
|
|
printf("**** testing default chunksizes for very large 3D var...");
|
|
{
|
|
#define NDIMS3 3
|
|
|
|
int varid, ncid;
|
|
int dimids[NDIMS3];
|
|
size_t dim_len[NDIMS3] = {1804289383, 846930886, 1681692777};
|
|
|
|
int storage = 0;
|
|
size_t chunksizes[NDIMS3];
|
|
int d;
|
|
char dim_name[NC_MAX_NAME + 1];
|
|
float waste;
|
|
|
|
if (nc_create(itoptions.path, NC_NETCDF4 | NC_CLOBBER, &ncid)) ERR;
|
|
|
|
/* Create a few dimensions. */
|
|
for (d = 0; d < NDIMS3; d++)
|
|
{
|
|
sprintf(dim_name, "dim_%d", d);
|
|
if (nc_def_dim(ncid, dim_name, dim_len[d], &dimids[d])) ERR;
|
|
}
|
|
|
|
/* Define a var with these dimensions, and turn on chunking. */
|
|
if (nc_def_var(ncid, VAR_NAME, NC_FLOAT, NDIMS3, dimids, &varid)) ERR;
|
|
if (nc_def_var_chunking(ncid, varid, NC_CHUNKED, NULL)) ERR;
|
|
|
|
/* Check how default chunking worked. */
|
|
if (nc_inq_var_chunking(ncid, varid, &storage, chunksizes)) ERR;
|
|
if (storage != NC_CHUNKED) ERR;
|
|
if (calculate_waste(NDIMS3, dim_len, chunksizes, &waste)) ERR;
|
|
/* if (waste > MAX_WASTE) ERR;*/
|
|
|
|
if (nc_close(ncid)) ERR;
|
|
|
|
/* Open the file and check. */
|
|
if (nc_open(itoptions.path, NC_WRITE, &ncid)) ERR;
|
|
if (nc_close(ncid)) ERR;
|
|
}
|
|
SUMMARIZE_ERR;
|
|
printf("**** testing default chunksizes some randomly sized 3D vars...");
|
|
{
|
|
#define NDIMS3 3
|
|
|
|
int varid, ncid;
|
|
int dimids[NDIMS3];
|
|
size_t dim_len[NDIMS3];
|
|
int storage = 0;
|
|
size_t chunksizes[NDIMS3];
|
|
int d, t;
|
|
char dim_name[NC_MAX_NAME + 1];
|
|
float waste;
|
|
|
|
for (t = 0; t < NUM_RANDOM_TESTS; t++)
|
|
{
|
|
if (nc_create(itoptions.path, NC_NETCDF4 | NC_CLOBBER, &ncid)) ERR;
|
|
|
|
/* Create a few dimensions. */
|
|
for (d = 0; d < NDIMS3; d++)
|
|
{
|
|
dim_len[d] = rand();
|
|
sprintf(dim_name, "dim_%d", d);
|
|
if (nc_def_dim(ncid, dim_name, dim_len[d], &dimids[d])) ERR;
|
|
}
|
|
|
|
/* Define a var with these dimensions, and turn on chunking. */
|
|
if (nc_def_var(ncid, VAR_NAME, NC_FLOAT, NDIMS3, dimids, &varid)) ERR;
|
|
if (nc_def_var_chunking(ncid, varid, NC_CHUNKED, NULL)) ERR;
|
|
|
|
/* Check how well default chunking worked. */
|
|
if (nc_inq_var_chunking(ncid, varid, &storage, chunksizes)) ERR;
|
|
if (storage != NC_CHUNKED) ERR;
|
|
if (calculate_waste(NDIMS3, dim_len, chunksizes, &waste)) ERR;
|
|
if (waste > MAX_WASTE) ERR;
|
|
|
|
if (nc_close(ncid)) ERR;
|
|
}
|
|
}
|
|
SUMMARIZE_ERR;
|
|
printf("**** testing default chunksizes some randomly sized 3D vars, with one small dimension...");
|
|
{
|
|
int varid, ncid;
|
|
int dimids[NDIMS3];
|
|
size_t dim_len[NDIMS3];
|
|
int storage = 0;
|
|
size_t chunksizes[NDIMS3];
|
|
int d, t;
|
|
char dim_name[NC_MAX_NAME + 1];
|
|
float waste;
|
|
|
|
for (t = 0; t < NUM_RANDOM_TESTS; t++)
|
|
{
|
|
if (nc_create(itoptions.path, NC_NETCDF4 | NC_CLOBBER, &ncid)) ERR;
|
|
|
|
dim_len[0] = rand();
|
|
dim_len[1] = rand();
|
|
dim_len[2] = rand() % 1000;
|
|
/* Create a few dimensions. */
|
|
for (d = 0; d < NDIMS3; d++)
|
|
{
|
|
sprintf(dim_name, "dim_%d", d);
|
|
if (nc_def_dim(ncid, dim_name, dim_len[d], &dimids[d])) ERR;
|
|
}
|
|
|
|
/* Define a var with these dimensions, and turn on chunking. */
|
|
if (nc_def_var(ncid, VAR_NAME, NC_FLOAT, NDIMS3, dimids, &varid)) ERR;
|
|
if (nc_def_var_chunking(ncid, varid, NC_CHUNKED, NULL)) ERR;
|
|
|
|
/* Check how well default chunking worked. */
|
|
if (nc_inq_var_chunking(ncid, varid, &storage, chunksizes)) ERR;
|
|
if (storage != NC_CHUNKED) ERR;
|
|
if (calculate_waste(NDIMS3, dim_len, chunksizes, &waste)) ERR;
|
|
if (waste > MAX_WASTE) ERR;
|
|
|
|
if (nc_close(ncid)) ERR;
|
|
}
|
|
}
|
|
SUMMARIZE_ERR;
|
|
printf("**** testing default chunksizes some randomly sized 3D vars, with two small dimensions...");
|
|
{
|
|
int varid, ncid;
|
|
int dimids[NDIMS3];
|
|
size_t dim_len[NDIMS3];
|
|
int storage = 0;
|
|
size_t chunksizes[NDIMS3];
|
|
int d, t;
|
|
char dim_name[NC_MAX_NAME + 1];
|
|
float waste;
|
|
|
|
for (t = 0; t < NUM_RANDOM_TESTS; t++)
|
|
{
|
|
if (nc_create(itoptions.path, NC_NETCDF4 | NC_CLOBBER, &ncid)) ERR;
|
|
|
|
dim_len[0] = rand();
|
|
dim_len[1] = rand() % 1000;
|
|
dim_len[2] = rand() % 1000;
|
|
/* Create a few dimensions. */
|
|
for (d = 0; d < NDIMS3; d++)
|
|
{
|
|
sprintf(dim_name, "dim_%d", d);
|
|
if (nc_def_dim(ncid, dim_name, dim_len[d], &dimids[d])) ERR;
|
|
}
|
|
|
|
/* Define a var with these dimensions, and turn on chunking. */
|
|
if (nc_def_var(ncid, VAR_NAME, NC_FLOAT, NDIMS3, dimids, &varid)) ERR;
|
|
if (nc_def_var_chunking(ncid, varid, NC_CHUNKED, NULL)) ERR;
|
|
|
|
/* Check how well default chunking worked. */
|
|
if (nc_inq_var_chunking(ncid, varid, &storage, chunksizes)) ERR;
|
|
if (storage != NC_CHUNKED) ERR;
|
|
if (calculate_waste(NDIMS3, dim_len, chunksizes, &waste)) ERR;
|
|
if (waste > MAX_WASTE) ERR;
|
|
|
|
if (nc_close(ncid)) ERR;
|
|
}
|
|
}
|
|
clearoptions();
|
|
SUMMARIZE_ERR;
|
|
FINAL_RESULTS;
|
|
}
|
|
|