-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathhdf5_common.c
305 lines (254 loc) · 13.8 KB
/
hdf5_common.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
#include "hdf5_common.h"
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
void generate_test_hdf5_files(int num_files, char filenames[][path_buffer_size], hsize_t dataset_size[], int n_dimensions, hsize_t chunk_size[]){
for (int i=0; i<num_files; i++){
generate_test_data_file(filenames[i], dataset_size, n_dimensions, i, chunk_size);
}
}
void generate_test_data_file(const char* filename, hsize_t dataset_size[], int n_dimensions, int fill_value, hsize_t chunk_size[]){
#ifdef DEBUG
printf("HDF5 File generator: %s, %d\n------------------\n", filename, fill_value);
#endif
long buffer_length = 1;
for (int i=0; i<n_dimensions; i++){
buffer_length = buffer_length * dataset_size[i];
}
int* array_data = malloc(sizeof(int) * buffer_length);
for (long i=0; i<buffer_length; i++){
array_data[i] = fill_value;
}
// Write the data to a HDF5 file.
write_to_file(filename, dataset_size, array_data, n_dimensions, chunk_size);
free(array_data);
}
void write_to_file(const char* filename, hsize_t dataset_size[], int* array_data, int n_dimensions, hsize_t chunk_size[]){
// Create a new empty file.
hid_t file_identifier = H5Fcreate(filename,
H5F_ACC_TRUNC, // Truncate existing file.
H5P_DEFAULT, // File creation property list.
H5P_DEFAULT); // File access property list.
// Create a new data space.
hid_t dataspace_indentifier = H5Screate_simple(n_dimensions,
dataset_size,
NULL); // Maximum size of dimensions.
// Set dataset chunking policy.
hid_t dataset_creation_identifier = H5Pcreate(H5P_DATASET_CREATE);
H5Pset_chunk(dataset_creation_identifier, n_dimensions, chunk_size);
// Create a new dataset.
hid_t dataset_identifier = H5Dcreate2(file_identifier,
"image_data", // Name of the dataset.
H5T_NATIVE_INT,
dataspace_indentifier,
H5P_DEFAULT, // Link creation properties.
dataset_creation_identifier,
H5P_DEFAULT); // Dataset access properties.
// Write data to the new dataset.
H5Dwrite(dataset_identifier,
H5T_NATIVE_INT,
H5S_ALL,
H5S_ALL,
H5P_DEFAULT,
array_data);
H5Pclose(dataset_creation_identifier);
H5Dclose(dataset_identifier);
H5Sclose(dataspace_indentifier);
H5Fclose(file_identifier);
}
void generate_3d_virtual_dataset_file(const char* filename,
char sources[][path_buffer_size],
hsize_t source_dataset_size[],
hsize_t virtual_dataset_tiles_count[],
hsize_t virtual_dataset_size[],
int fill_value){
#ifdef DEBUG
printf("HDF5 Virtual dataset generator: %s\n------------------\n", filename);
#endif
hid_t virtual_file_identifier = H5Fcreate(filename,
H5F_ACC_TRUNC, // Truncate existing file.
H5P_DEFAULT, // File creation property list.
H5P_DEFAULT); // File access property list.
hid_t virtual_dataspace_indentifier = H5Screate_simple(3,
virtual_dataset_size,
NULL);
// Create and fill empty parameters.
hid_t virtaul_dataset_create_property_identifier = H5Pcreate(H5P_DATASET_CREATE);
H5Pset_fill_value(virtaul_dataset_create_property_identifier, H5T_NATIVE_INT, &fill_value);
// Common hyperslab parameters.
hsize_t virtual_dataset_stride[] = {1, 1, 1};
hsize_t virtual_dataset_blocks[] = {1, 1, 1};
// Source files dataspace sizes.
hid_t source_dataspace_indentifier = H5Screate_simple(3, source_dataset_size, NULL);
// Create all hyperslabs.
int current_file_index = 0;
for (int z=0; z<virtual_dataset_tiles_count[0]; z++){
for (int y=0; y<virtual_dataset_tiles_count[1]; y++){
for (int x=0; x<virtual_dataset_tiles_count[2]; x++){
hsize_t start_offset[] = {z*source_dataset_size[0], y*source_dataset_size[1], x*source_dataset_size[2]};
H5Sselect_hyperslab(virtual_dataspace_indentifier,
H5S_SELECT_SET,
start_offset,
virtual_dataset_stride,
virtual_dataset_blocks,
source_dataset_size);
H5Pset_virtual(virtaul_dataset_create_property_identifier,
virtual_dataspace_indentifier,
sources[current_file_index],
"image_data", // Source dataset name.
source_dataspace_indentifier);
current_file_index++;
}
}
}
hid_t virtual_data_set_identifier = H5Dcreate2(virtual_file_identifier,
"image_data",
H5T_NATIVE_INT,
virtual_dataspace_indentifier,
H5P_DEFAULT, // Link properties.
virtaul_dataset_create_property_identifier,
H5P_DEFAULT); // Access properties.
H5Dclose(virtual_data_set_identifier);
H5Sclose(source_dataspace_indentifier);
H5Pclose(virtaul_dataset_create_property_identifier);
H5Sclose(virtual_dataspace_indentifier);
H5Fclose(virtual_file_identifier);
}
void read_3d_dataset_file(const char* filename, hsize_t dataset_size[], hsize_t buffer_size[]){
int buffer_length = buffer_size[0]*buffer_size[1]*buffer_size[2];
int* read_buffer = malloc(sizeof(int)*buffer_length);
hid_t file_identifier = H5Fopen(filename, H5F_ACC_RDONLY, H5P_DEFAULT);
hid_t dataset_identifier = H5Dopen2 (file_identifier, "image_data", H5P_DEFAULT);
hid_t dataspace_identifier = H5Dget_space(dataset_identifier);
hid_t memspace_identifier = H5Screate_simple (3, buffer_size, NULL);
// Read the file buffer by buffer.
int n_of_chunks = dataset_size[0] / buffer_size[0];
for (int z=0; z<n_of_chunks; z++){
read_3d_dataset_chunk(dataset_identifier, dataspace_identifier, memspace_identifier, z*buffer_size[0], buffer_size, &read_buffer[0]);
#ifdef DEBUG
// Print frames to console.
int n_frames_in_chunk = dataset_size[0] / n_of_chunks;
for (int f=0; f<n_frames_in_chunk; f++){
int current_frame = (z*n_frames_in_chunk) + f;
printf("Frame %d, File %s\n", current_frame, filename);
for (int y=0; y<dataset_size[1]; y++){
for (int x=0; x<dataset_size[2]; x++){
int offset = (f*dataset_size[1]*dataset_size[2]) + (y*dataset_size[2]) + x;
printf("%d ", read_buffer[offset]);
}
printf("\n");
}
printf("\n");
}
#endif
}
H5Sclose(memspace_identifier);
H5Sclose(dataspace_identifier);
H5Dclose(dataset_identifier);
H5Fclose(file_identifier);
free(read_buffer);
}
void read_3d_dataset_chunk(hid_t dataset_identifier, hid_t dataspace_identifier, hid_t memspace_identifier, int z_offset, hsize_t buffer_size[], int* read_buffer){
// Block read parameters.
hsize_t stride[] = {1, 1, 1};
hsize_t block[] = {1, 1, 1};
hsize_t offset[] = {z_offset, 0, 0};
H5Sselect_hyperslab (dataspace_identifier, H5S_SELECT_SET, offset, stride, buffer_size, block);
H5Dread(dataset_identifier, H5T_NATIVE_INT, memspace_identifier, dataspace_identifier, H5P_DEFAULT, read_buffer);
}
void read_3d_dataset_file_from_multiple_sources(char filenames[][path_buffer_size], hsize_t virtual_dataset_size[],
hsize_t virtual_dataset_tiles_count[], hsize_t source_dataset_size[], hsize_t buffer_size[]){
// Allocate all read buffers. Since we are reading frame by frame, the number of read buffers is equal to the number of tiles in a frame.
int n_of_read_buffers = virtual_dataset_tiles_count[1]*virtual_dataset_tiles_count[2];
int* read_buffers[n_of_read_buffers];
for(int i=0;i<n_of_read_buffers;i++){
read_buffers[i] = malloc(sizeof(int)*buffer_size[0]*buffer_size[1]*buffer_size[2]);
}
// Allocate the frame buffer.
int* frame_buffer = malloc(sizeof(int)*virtual_dataset_size[1] * virtual_dataset_size[2]);
// Common dataset reading properties.
int n_of_reads = virtual_dataset_size[0] / buffer_size[0];
int source_row_length = source_dataset_size[2];
int read_buffer_offsets[n_of_read_buffers];
int source_fragment_length = source_dataset_size[1] * source_dataset_size[2];
hid_t file_identifier;
hid_t dataset_identifier;
hid_t dataspace_identifier;
hid_t memspace_identifier = H5Screate_simple (3, buffer_size, NULL);;
// Initialize source files offset.
int n_source_files = virtual_dataset_tiles_count[0]*virtual_dataset_tiles_count[1]*virtual_dataset_tiles_count[2];
int source_z_offsets[n_source_files];
for(int i=0;i<n_source_files;i++){
source_z_offsets[i] = 0;
}
// The number of reads depend on the size of the virtual dataset and the size of the Z buffer.
for (int n_read=0; n_read<n_of_reads; n_read++){
// Offset to decide which files to read for the current block.
int n_file_offset = ((n_read * buffer_size[0]) / source_dataset_size[0]) * n_of_read_buffers;
// Read all files into separate buffers.
for(int i=0;i<n_of_read_buffers;i++){
int file_index = i + n_file_offset;
file_identifier = H5Fopen(filenames[file_index], H5F_ACC_RDONLY, H5P_DEFAULT);
dataset_identifier = H5Dopen2 (file_identifier, "image_data", H5P_DEFAULT);
dataspace_identifier = H5Dget_space(dataset_identifier);
read_3d_dataset_chunk(dataset_identifier, dataspace_identifier, memspace_identifier, source_z_offsets[file_index], buffer_size, &read_buffers[i][0]);
source_z_offsets[file_index] += buffer_size[0];
H5Sclose(dataspace_identifier);
H5Dclose(dataset_identifier);
H5Fclose(file_identifier);
}
// Merge buffers only if frames are tiled (ignore in time series case).
if(n_of_read_buffers>1){
// Merge the buffers into a contigues memory location.
for(int n_frame_in_chunk=0; n_frame_in_chunk < buffer_size[0]; n_frame_in_chunk++){
// If we are writing the 2. frame, we should read from the 2. frame fragment in the source.
int source_offset = n_frame_in_chunk * source_fragment_length;
for(int i=0;i<n_of_read_buffers;i++){
read_buffer_offsets[i] = source_offset;
}
int frame_buffer_offset = 0;
for(int frame_row=0; frame_row<virtual_dataset_size[1]; frame_row++){
for(int n_tile_column=0; n_tile_column<virtual_dataset_tiles_count[2]; n_tile_column++){
// Index of the read buffer to access for a single row fragment.
int file_index = n_tile_column + ((frame_row / source_dataset_size[1]) * virtual_dataset_tiles_count[2]);
memcpy(&frame_buffer[frame_buffer_offset], &read_buffers[file_index][read_buffer_offsets[file_index]], sizeof(int)*source_row_length);
// Increase the buffer offsets by the source row length.
frame_buffer_offset += source_row_length;
read_buffer_offsets[file_index] += source_row_length;
}
}
#ifdef DEBUG
int frame_number = n_frame_in_chunk + n_read * buffer_size[0];
printf("Frame %d, merged memory\n", frame_number);
for(int y=0; y<virtual_dataset_size[1]; y++){
for(int x=0; x<virtual_dataset_size[2]; x++){
printf("%d ", frame_buffer[y*virtual_dataset_size[2]+x]);
}
printf("\n");
}
printf("\n");
#endif
}
}else{
#ifdef DEBUG
for(int n_frame_in_chunk=0; n_frame_in_chunk < buffer_size[0]; n_frame_in_chunk++){
int frame_number = n_frame_in_chunk + n_read * buffer_size[0];
printf("Frame %d, merged memory\n", frame_number);
for(int y=0; y<virtual_dataset_size[1]; y++){
for(int x=0; x<virtual_dataset_size[2]; x++){
printf("%d ", read_buffers[0][y*virtual_dataset_size[2]+x]);
}
printf("\n");
}
printf("\n");
}
#endif
}
}
// Cleanup after yourself.
H5Sclose(memspace_identifier);
for(int i=0;i<n_of_read_buffers;i++){
free(read_buffers[i]);
}
free(frame_buffer);
}