TRIQS/nda 1.3.0
Multi-dimensional array library for C++
Loading...
Searching...
No Matches
h5.hpp
Go to the documentation of this file.
1// Copyright (c) 2019--present, The Simons Foundation
2// This file is part of TRIQS/nda and is licensed under the Apache License, Version 2.0.
3// SPDX-License-Identifier: Apache-2.0
4// See LICENSE in the root of this distribution for details.
5
10
11#pragma once
12
13#include "./concepts.hpp"
14#include "./declarations.hpp"
15#include "./exceptions.hpp"
16#include "./layout/for_each.hpp"
17#include "./layout/range.hpp"
18#include "./traits.hpp"
19
20#include <h5/h5.hpp>
21
22#include <algorithm>
23#include <array>
24#include <concepts>
25#include <cstddef>
26#include <string>
27#include <tuple>
28#include <type_traits>
29#include <utility>
30#include <vector>
31
32namespace nda {
33
38
39 namespace detail {
40
41 // Resize a given array to fit a given shape or check if a given view fits the shape.
42 template <MemoryArray A>
43 void resize_or_check(A &a, std::array<long, A::rank> const &shape) {
44 if constexpr (is_regular_v<A>) {
45 a.resize(shape);
46 } else {
47 if (a.shape() != shape) NDA_RUNTIME_ERROR << "Error in nda::detail::resize_or_check: Dimension mismatch: " << shape << " != " << a.shape();
48 }
49 }
50
51 // Given an array/view, prepare and return the corresponding h5::array_view to be written/read into.
52 template <MemoryArray A>
53 auto prepare_h5_array_view(const A &a) {
54 auto [parent_shape, h5_strides] = h5::array_interface::get_parent_shape_and_h5_strides(a.indexmap().strides().data(), A::rank, a.shape().data());
55 auto v = h5::array_interface::array_view{h5::hdf5_type<get_value_t<A>>(), (void *)a.data(), A::rank, is_complex_v<typename A::value_type>};
56 for (int u = 0; u < A::rank; ++u) {
57 v.slab.count[u] = a.shape()[u];
58 v.slab.stride[u] = h5_strides[u];
59 v.parent_shape[u] = parent_shape[u];
60 }
61 return v;
62 }
63
64 // Create an h5::char_buf from an 1-dimensional nda::MemoryArray.
65 template <MemoryArrayOfRank<1> A>
66 h5::char_buf to_char_buf(A const &a) {
67 // get size of longest string
68 size_t s = 0;
69 for (auto &x : a) s = std::max(s, x.size() + 1);
70
71 // copy each string to a buffer and pad with zeros
72 std::vector<char> buf;
73 buf.resize(a.size() * s, 0x00);
74 size_t i = 0;
75 for (auto &x : a) {
76 strcpy(&buf[i * s], x.c_str());
77 ++i;
78 }
79
80 // return h5::char_buf
81 auto len = h5::v_t{size_t(a.size()), s};
82 return {buf, len};
83 }
84
85 // Write an h5::char_buf into a 1-dimensional nda::MemoryArray.
86 template <MemoryArrayOfRank<1> A>
87 void from_char_buf(h5::char_buf const &cb, A &a) {
88 // prepare the array
89 resize_or_check(a, std::array<long, 1>{static_cast<long>(cb.lengths[0])});
90
91 // loop over all strings
92 auto len_string = cb.lengths[1];
93 size_t i = 0;
94 for (auto &x : a) {
95 x = "";
96 x.append(&cb.buffer[i * len_string]);
97 ++i;
98 }
99 }
100
101 } // namespace detail
102
118 template <MemoryArray A>
119 void h5_write(h5::group g, std::string const &name, A const &a, bool compress = true) {
120 if constexpr (std::is_same_v<nda::get_value_t<A>, std::string>) {
121 // 1-dimensional array/view of strings
122 h5_write(g, name, detail::to_char_buf(a));
123 } else if constexpr (is_scalar_v<typename A::value_type>) {
124 // n-dimensional array/view of scalars
125 // make a copy if the array/view is not in C-order and write the copy
126 if (not a.indexmap().is_stride_order_C()) {
127 using h5_arr_t = nda::array<get_value_t<A>, A::rank>;
128 auto a_c_layout = h5_arr_t{a.shape()};
129 a_c_layout() = a;
130 h5_write(g, name, a_c_layout, compress);
131 return;
132 }
133
134 // prepare the h5::array_view and write it
135 auto v = detail::prepare_h5_array_view(a);
136 h5::array_interface::write(g, name, v, compress);
137 } else {
138 // n-dimensional array/view of some generic unknown type
139 auto g2 = g.create_group(name);
140 h5_write(g2, "shape", a.shape());
141 auto make_name = [](auto i0, auto... is) { return (std::to_string(i0) + ... + ("_" + std::to_string(is))); };
142 nda::for_each(a.shape(), [&](auto... is) { h5_write(g2, make_name(is...), a(is...)); });
143 }
144 }
145
161 template <size_t NDim, typename... IRs>
162 auto hyperslab_and_shape_from_slice(std::tuple<IRs...> const &slice, std::vector<h5::hsize_t> const &ds_shape, bool is_complex) {
163 // number of parameters specifying the slice
164 static constexpr auto size_of_slice = sizeof...(IRs);
165
166 // number of nda::ellipsis objects in the slice (only 1 is allowed)
167 static constexpr auto ellipsis_count = (std::is_same_v<IRs, ellipsis> + ... + 0);
168 static_assert(ellipsis_count < 2, "Error in nda::hyperslab_and_shape_from_slice: Only a single ellipsis is allowed in slicing");
169 static constexpr auto has_ellipsis = (ellipsis_count == 1);
170
171 // position of the ellipsis in the slice parameters
172 static constexpr auto ellipsis_position = [&]<size_t... Is>(std::index_sequence<Is...>) {
173 if constexpr (has_ellipsis) return ((std::is_same_v<IRs, ellipsis> * Is) + ... + 0);
174 return size_of_slice;
175 }(std::index_sequence_for<IRs...>{});
176
177 // number of integers in the slice parameters
178 static constexpr auto integer_count = (std::integral<IRs> + ... + 0);
179
180 // number of nda::range and nda::range::all_t objects in the slice parameters
181 static constexpr auto range_count = size_of_slice - integer_count - ellipsis_count;
182 static_assert((has_ellipsis && range_count <= NDim) || range_count == NDim,
183 "Error in nda::hyperslab_and_shape_from_slice: Rank does not match the number of non-trivial slice dimensions");
184
185 // number of dimensions spanned by the ellipsis
186 static constexpr auto ellipsis_width = NDim - range_count;
187
188 // number of dimensions in the hyperslab
189 static constexpr auto slab_rank = NDim + integer_count;
190
191 // check rank of the dataset (must match the rank of the hyperslabs)
192 auto ds_rank = ds_shape.size() - is_complex;
193 if (slab_rank != ds_rank)
194 NDA_RUNTIME_ERROR << "Error in nda::hyperslab_and_shape_from_slice: Incompatible dataset and slice ranks: " << ds_rank
195 << " != " << size_of_slice;
196
197 // create and return the hyperslab and the shape array
198 auto slab = h5::array_interface::hyperslab(slab_rank, is_complex);
199 auto shape = std::array<long, NDim>{};
200 [&, m = 0]<size_t... Is>(std::index_sequence<Is...>) mutable {
201 (
202 [&]<typename IR>(size_t n, IR const &ir) mutable {
203 if (n > ellipsis_position) n += (ellipsis_width - 1);
204 if constexpr (std::integral<IR>) {
205 slab.offset[n] = ir;
206 slab.count[n] = 1;
207 } else if constexpr (std::is_same_v<IR, nda::ellipsis>) {
208 for (auto k : range(n, n + ellipsis_width)) {
209 slab.count[k] = ds_shape[k];
210 shape[m++] = ds_shape[k];
211 }
212 } else if constexpr (std::is_same_v<IR, nda::range>) {
213 slab.offset[n] = ir.first();
214 slab.stride[n] = ir.step();
215 slab.count[n] = ir.size();
216 shape[m++] = ir.size();
217 } else {
218 static_assert(std::is_same_v<IR, nda::range::all_t>);
219 slab.count[n] = ds_shape[n];
220 shape[m++] = ds_shape[n];
221 }
222 }(Is, std::get<Is>(slice)),
223 ...);
224 }(std::make_index_sequence<size_of_slice>{});
225 return std::make_pair(slab, shape);
226 }
227
244 template <MemoryArray A, typename... IRs>
245 void h5_write(h5::group g, std::string const &name, A const &a, std::tuple<IRs...> const &slice) {
246 // compile-time checks
247 constexpr int size_of_slice = sizeof...(IRs);
248 static_assert(size_of_slice > 0, "Error in nda::h5_write: Invalid empty slice");
249 static_assert(is_scalar_v<typename A::value_type>, "Error in nda::h5_write: Slicing is only supported for scalar types");
250 static constexpr bool is_complex = is_complex_v<typename A::value_type>;
251
252 // make a copy if the array/view is not in C-order and write the copy
253 if (not a.indexmap().is_stride_order_C()) {
254 using h5_arr_t = nda::array<get_value_t<A>, A::rank>;
255 auto a_c_layout = h5_arr_t{a.shape()};
256 a_c_layout() = a;
257 h5_write(g, name, a_c_layout, slice);
258 return;
259 }
260
261 // get dataset info and check that the datatypes of the dataset and the array match
262 auto ds_info = h5::array_interface::get_dataset_info(g, name);
263 if (is_complex != ds_info.has_complex_attribute)
264 NDA_RUNTIME_ERROR << "Error in nda::h5_write: Dataset and array/view must both be complex or non-complex";
265
266 // get hyperslab and shape from the slice and check that the shapes match
267 auto const [sl, sh] = hyperslab_and_shape_from_slice<A::rank>(slice, ds_info.lengths, is_complex);
268 if (sh != a.shape()) NDA_RUNTIME_ERROR << "Error in nda::h5_write: Incompatible slice and array shape: " << sh << " != " << a.shape();
269
270 // prepare the h5::array_view and write it
271 auto v = detail::prepare_h5_array_view(a);
272 h5::array_interface::write_slice(g, name, v, sl);
273 }
274
296 template <MemoryArray A, typename... IRs>
297 void h5_read(h5::group g, std::string const &name, A &a, std::tuple<IRs...> const &slice = {}) {
298 constexpr bool slicing = (sizeof...(IRs) > 0);
299
300 if constexpr (std::is_same_v<typename A::value_type, std::string>) {
301 // 1-dimensional array/view of strings
302 static_assert(!slicing, "Error in nda::h5_read: Slicing not supported for arrays/views of strings");
303 h5::char_buf cb;
304 h5_read(g, name, cb);
305 detail::from_char_buf(cb, a);
306 } else if constexpr (is_scalar_v<typename A::value_type>) {
307 // n-dimensional array/view of scalars
308 // read into a temporary array if the array/view is not in C-order and copy the elements
309 if (not a.indexmap().is_stride_order_C()) {
311 auto a_c_layout = h5_arr_t{};
312 h5_read(g, name, a_c_layout, slice);
313 detail::resize_or_check(a, a_c_layout.shape());
314 a() = a_c_layout;
315 return;
316 }
317
318 // get dataset info
319 auto ds_info = h5::array_interface::get_dataset_info(g, name);
320
321 // allow to read non-complex data into a complex array
322 static constexpr bool is_complex = is_complex_v<typename A::value_type>;
323 if constexpr (is_complex) {
324 if (!ds_info.has_complex_attribute) {
326 h5_read(g, name, tmp, slice);
327 a = tmp;
328 return;
329 }
330 }
331
332 // get the hyperslab and the shape of the slice
333 std::array<long, A::rank> shape{};
334 auto slab = h5::array_interface::hyperslab{};
335 if constexpr (slicing) {
336 auto const [sl, sh] = hyperslab_and_shape_from_slice<A::rank>(slice, ds_info.lengths, is_complex);
337 slab = sl;
338 shape = sh;
339 } else {
340 for (int u = 0; u < A::rank; ++u) shape[u] = ds_info.lengths[u]; // NB : correct for complex
341 }
342
343 // resize the array or check that the shape matches
344 detail::resize_or_check(a, shape);
345
346 // check the rank of the dataset and the array
347 auto ds_rank = ds_info.rank() - is_complex;
348 if (!slicing && ds_rank != A::rank)
349 NDA_RUNTIME_ERROR << "Error in nda::h5_read: Incompatible dataset and array ranks: " << ds_rank << " != " << A::rank;
350
351 // prepare the h5::array_view and read into it
352 auto v = detail::prepare_h5_array_view(a);
353 h5::array_interface::read(g, name, v, slab);
354 } else {
355 // n-dimensional array/view of some generic unknown type
356 static_assert(!slicing, "Error in nda::h5_read: Slicing not supported for arrays/views of generic types");
357 auto g2 = g.open_group(name);
358
359 // get and check the shape or resize the array
360 std::array<long, A::rank> h5_shape;
361 h5_read(g2, "shape", h5_shape);
362 detail::resize_or_check(a, h5_shape);
363
364 // read element-by-element using the appropriate h5_read implementation
365 auto make_name = [](auto i0, auto... is) { return (std::to_string(i0) + ... + ("_" + std::to_string(is))); };
366 nda::for_each(a.shape(), [&](auto... is) { h5_read(g2, make_name(is...), a(is...)); });
367 }
368 }
369
371
372} // namespace nda
Provides concepts for the nda library.
Provides various convenient aliases and helper functions for nda::basic_array and nda::basic_array_vi...
Provides a custom runtime error class and macros to assert conditions and throw exceptions.
Provides for_each functions for multi-dimensional arrays/views.
void h5_read(h5::group g, std::string const &name, A &a, std::tuple< IRs... > const &slice={})
Read into an nda::MemoryArray from an HDF5 file.
Definition h5.hpp:297
void h5_write(h5::group g, std::string const &name, A const &a, bool compress=true)
Write an nda::MemoryArray to a new dataset/subgroup into an HDF5 file.
Definition h5.hpp:119
auto hyperslab_and_shape_from_slice(std::tuple< IRs... > const &slice, std::vector< h5::hsize_t > const &ds_shape, bool is_complex)
Construct an h5::array_interface::hyperslab and the corresponding shape from a given slice,...
Definition h5.hpp:162
basic_array< ValueType, Rank, Layout, 'A', ContainerPolicy > array
Alias template of an nda::basic_array with an 'A' algebra.
__inline__ void for_each(std::array< Int, R > const &shape, F &&f)
Loop over all possible index values of a given shape and apply a function to them.
Definition for_each.hpp:116
std::string to_string(std::array< T, R > const &a)
Get a string representation of a std::array.
Definition array.hpp:52
constexpr bool is_complex_v
Constexpr variable that is true if type T is a std::complex type.
Definition traits.hpp:64
constexpr bool is_scalar_v
Constexpr variable that is true if type S is a scalar type, i.e. arithmetic or complex.
Definition traits.hpp:68
Includes the itertools header and provides some additional utilities.
Provides type traits for the nda library.