Data IO (input/output)¶

Introduction¶

ESRF data (used to) come in (too many) different formats:

  • Specfile, EDF, HDF5
  • And specific detector formats: MarCCD, Pilatus CBF, Dectris Eiger, …

HDF5 is now the standard ESRF data format, so we will focus only on it today.

Methods for accessing other file formats are described in the io_spec_edf.ipynb notebook.

HDF5¶

What is HDF5?¶

HDF5 (Hierarchical Data Format) is a file format designed to structure and store large and complex volumes of data.

Why HDF5?¶

  • Hierarchical collection of data (directories and files, UNIX-like paths)
  • High performance (binary format)
  • Portable file format (standard exchange format for heterogeneous data)
  • Self-describing extensible types, rich metadata
  • Supports data compression
  • Free (and open source)
  • Adopted by a large number of institutes (NASA, LIGO, ...)
  • Adopted by most synchrotrons (ESRF, SOLEIL, DESY, ...)

Data can be almost anything: images, tables, graphs, documents.

HDF5 description¶

The container is mainly structured around:

  • File: the root of the container
  • Group: a grouping structure containing groups or datasets
  • Dataset: a multidimensional array of data elements
  • And other features (links, attributes, datatypes, virtual datasets)

[Figure: HDF5 class diagram]

HDF5 example¶

Here is an example of a file generated by pyFAI:

[Figure: example of an HDF5 file generated by pyFAI]

Useful tools for HDF5¶

HDFGroup tools¶

Command line and desktop applications: h5ls, h5dump, hdfview

>>> h5ls -r my_first_one.h5
    /                        Group
    /data1                   Dataset {100, 100}
    /group1                  Group
    /group1/data2            Dataset {100, 100}

h5glance¶

Jupyter notebook and command line tool for browsing HDF5 files

In [ ]:
# From jupyter notebook
from h5glance import H5Glance
H5Glance("data/water.h5")
In [ ]:
%%bash
# From the command line
h5glance data/water.h5

jupyterlab-h5web¶

JupyterLab HDF5 file browser and viewer

Go to JupyterLab

In [ ]:
from jupyterlab_h5web import H5Web

H5Web("data/water.h5")

silx view¶

Desktop application file browser/viewer

>>> pip install silx
>>> silx view my_file.h5
In [ ]:
%%bash
# With silx view GUI
silx view data/water.h5

h5py¶

[Image: h5py book cover]

h5py is the Python binding for accessing HDF5 files. It was originally written by Andrew Collette.

In [ ]:
import h5py

print("h5py:", h5py.version.version)
print("hdf5:", h5py.version.hdf5_version)

How to read an HDF5 file from Python¶

h5py.File¶

  • First open the file with h5py.File:

    h5py.File('myfile.hdf5', mode)
    

    opening modes:

Mode     Meaning
r        Read-only, file must exist (default with h5py v3)
r+       Read/write, file must exist
w        Create file, truncate if it exists
w- or x  Create file, fail if it exists
a        Read/write if file exists, create otherwise (default with h5py v2)
In [ ]:
import h5py

h5file = h5py.File("data/water.h5", mode="r")

h5py.Group¶

  • Then access the file content with a dictionary-like API, h5py.Group:

    • Group.keys()
    • Group.items()
    • Group.values()
In [ ]:
# Available names at the first level
list(h5file.keys())
In [ ]:
# List 'entry_0000' group children
group = h5file["entry_0000"]
dict(group.items())
In [ ]:
# List 'entry_0000/4_azimuthal_integration' group children
list(group["4_azimuthal_integration"].values())
In [ ]:
# List 'entry_0000/4_azimuthal_integration/results' group children
list(h5file["/entry_0000/4_azimuthal_integration/results"].values())
In [ ]:
# Get a dataset from a sub group
h5dataset = h5file["/entry_0000/4_azimuthal_integration/results/I"]
h5dataset

Not very convenient for interactive browsing... this is why silx view, h5web, h5glance, etc. exist.

h5py.Dataset¶

It mimics numpy.ndarray. The data is read from the file only when it is needed.

In [ ]:
h5dataset = h5file["/entry_0000/4_azimuthal_integration/results/I"]
h5dataset
In [ ]:
# Here we only read metadata from the dataset
print("Dataset:", h5dataset.shape, h5dataset.dtype, h5dataset.size)
In [ ]:
# Read data from the file to a numpy.ndarray
subset = h5dataset[:5]  # Copy the selection to a numpy.ndarray
print("subset:", subset, "=> sum:", subset.sum())

data = h5dataset[()]  # Copy the whole dataset to a numpy.ndarray
print("data type:", type(data), "; shape", data.shape, "; min.:", data.min())
In [ ]:
data[:5] = 0
print(data[:5])
print(h5dataset[:5])
In [ ]:
# Remember to close the file
h5file.close()
In [ ]:
print(data[:5])
print(subset)
In [ ]:
# Once the file is closed, the Dataset no longer gives access to data
print(h5dataset)
print(h5dataset[:5])

Context manager¶

  • Context managers guarantee that resources are released; in our case, this ensures that the HDF5 file is closed.
  • They are usually used via the with statement.

To safely access an HDF5 file, do:

In [ ]:
with h5py.File("data/water.h5", "r") as h5file:
    dataset = h5file["/entry_0000/4_azimuthal_integration/results/I"]
    data = dataset[()]
print(dataset)
print(data[:5])

How to write to an HDF5 file¶

There are several ways to write groups and datasets. Here we will mostly focus on the 'dictionary-like' API.

Documentation: Group and Dataset

In [ ]:
import numpy
import h5py

data = numpy.random.random(10000)
data.shape = 100, 100

# create file, notice the mode='w', as 'write'
h5file = h5py.File("my_first_one.h5", mode="w")

# write data into a dataset from the root
h5file["/data1"] = data

# write data into a dataset from group1
h5file["/group1/data2"] = data

h5file.close()

The same operation with a context manager:

In [ ]:
import numpy
import h5py

# Create 2D data
data = numpy.arange(100 * 100)
data.shape = 100, 100

with h5py.File("my_first_one.h5", mode="w") as h5file:

    # write data into a dataset from the root
    h5file["/data1"] = data

    # write data into a dataset from group1
    h5file["/group1/data2"] = data

With Group.create_dataset and Group.create_group (alternative APIs):

In [ ]:
import numpy
import h5py

# Create 2D data
data = numpy.arange(100 * 100)
data.shape = 100, 100

# Notice the mode='w', as 'write'
with h5py.File("my_first_one.h5", mode="w") as h5file:

    # write data into a dataset from the root
    h5file.create_dataset("data1", data=data)

    # Or with a functional API
    grp1 = h5file.create_group("group1")
    grp1.create_dataset("data2", data=data)

Exercise: Flat field correction¶

Flat-field correction is a technique used to improve quality in digital imaging.

The goal is to normalize images and remove artifacts caused by variations in the pixel-to-pixel sensitivity of the detector and/or by distortions in the optical path. (see https://en.wikipedia.org/wiki/Flat-field_correction)

$$ normalized = \frac{raw - dark}{flat - dark} $$

  • normalized: Image after flat field correction
  • raw: Raw image. It is acquired with the sample.
  • flat: Flat field image. It is the response given out by the detector for a uniform input signal. This image is acquired without the sample.
  • dark: Also named background or dark current. It is the response given out by the detector when there is no signal. This image is acquired without the beam.

Here is a function implementing the flat field correction:

Note: make sure you execute the cell defining this function

In [ ]:
import numpy

def flatfield_correction(raw, flat, dark):
    """
    Apply a flat-field correction to raw data using flat and dark images.
    """
    # Make sure that the computation is done using float
    # to avoid type overflow or loss of precision
    raw = raw.astype(numpy.float32)
    flat = flat.astype(numpy.float32)
    dark = dark.astype(numpy.float32)
    # Do the computation
    return (raw - dark) / (flat - dark)

Note: If you would like to plot an image, you can use matplotlib's imshow function.

The %matplotlib "magic" command should be called once first.

In [ ]:
%matplotlib inline

from matplotlib import pyplot as plt
In [ ]:
import numpy
plt.imshow(numpy.random.random((20, 60)))

Exercise 1¶

  1. Browse the file data/ID16B_diatomee.h5
  2. Get a single raw dataset, a flat field dataset and a dark image dataset from this file
  3. Apply the flat field correction
  4. Save the result into a new HDF5 file

If you are stuck, the solution is provided in the file solutions/exercise1.py

In [ ]:
from jupyterlab_h5web import H5Web
H5Web("data/ID16B_diatomee.h5")
In [ ]:
# or
from h5glance import H5Glance
H5Glance("data/ID16B_diatomee.h5")
In [ ]:
import h5py

with h5py.File("data/ID16B_diatomee.h5", mode="r") as h5s:
    pass
    # this is a comment

    # step1: Read the data

    # raw_data_path = ...
    # raw_data = ...

    # flat_path = ...
    # flat = ...

    # dark_path = ...
    # dark = ...

# step2: Compute the result

# normalized = flatfield_correction(raw_data, flat, dark)

# step3: Save the result

# ...

Exercise 2¶

  1. Apply the flat field correction to all raw data available (use the same flat and dark for all the images)
  2. Save each result into different datasets of the same HDF5 file

If you are stuck, the solution is provided in the file solutions/exercise2.py

In [ ]:
 

Exercise 3¶

From the previous exercise, we can see that the flat field correction was not very good for the last images.

Another flat field was acquired at the end of the acquisition.

We could use this information to compute a flat field closer to the image we want to normalize. This can be done by linearly interpolating between the flat images, using the image name as the interpolation factor (it varies between 0 and 500 in this case).

  1. For each raw image, compute the corresponding flat field using linear interpolation (between flatfield/0000 and flatfield/0500); see the hint after this list
  2. Save each result into different datasets in a single HDF5 file
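
As a hint, one way to write the interpolated flat field for image number $i$ (which ranges from 0 to 500) is:

$$ flat_i = (1 - i/500) \cdot flat_{0000} + (i/500) \cdot flat_{0500} $$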

If you are stuck, the solution is provided in the file solutions/exercise3.py

In [ ]:
 

Advanced usage¶

Dataset compression¶

Install the hdf5plugin package, then import it.

HDF5 provides dataset compression support. With h5py, GZIP and LZF compression are available (see compression-filters). Many more third-party compression filters are available for HDF5.

hdf5plugin makes some of those compression filters usable with h5py (Blosc, Blosc2, BitShuffle, BZip2, FciDecomp, LZ4, SZ, SZ3, Zfp, ZStd).

In [ ]:
import h5py
import hdf5plugin  # Enables reading datasets stored with the supported compression filters

To write compressed datasets, see:

  • Group.create_dataset chunks, compression and compression_opts parameters.
  • "Chunked Storage" documentation
  • hdf5plugin documentation
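
As a minimal sketch (file and dataset names are illustrative), writing a GZIP-compressed dataset with h5py and a Bitshuffle/LZ4-compressed one with hdf5plugin could look like this:

In [ ]:
import numpy
import h5py
import hdf5plugin

data = numpy.arange(100 * 100).reshape(100, 100)

with h5py.File("compressed.h5", mode="w") as h5file:
    # GZIP compression is built into h5py
    h5file.create_dataset("gzipped", data=data, compression="gzip")

    # Bitshuffle (with LZ4) comes from hdf5plugin; its keyword arguments
    # expand into the compression and compression_opts parameters
    h5file.create_dataset("bitshuffled", data=data, **hdf5plugin.Bitshuffle())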

Soft and external links¶

An HDF5 file can contain links to Groups/Datasets:

  • within the same file: see h5py.SoftLink
  • in another file: see h5py.ExternalLink

Links can be dangling if the destination does not exist.
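
A minimal sketch creating both kinds of links (file and dataset names are illustrative):

In [ ]:
import h5py

with h5py.File("links.h5", mode="w") as h5file:
    h5file["data1"] = [1, 2, 3]

    # Soft link to a path in the same file, resolved at access time
    h5file["alias"] = h5py.SoftLink("/data1")

    # External link to a dataset in another file; it is dangling
    # as long as other_file.h5 does not exist
    h5file["external"] = h5py.ExternalLink("other_file.h5", "/data1")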

External dataset¶

An HDF5 file can contain datasets that are stored in external binary files: see Group.create_dataset's external parameter.
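
A minimal sketch, assuming a plain binary file written beforehand (names are illustrative):

In [ ]:
import numpy
import h5py

raw = numpy.arange(100, dtype=numpy.float32)
raw.tofile("raw.bin")  # Plain binary file holding the actual data

with h5py.File("external_data.h5", mode="w") as h5file:
    # The dataset content stays in raw.bin;
    # the HDF5 file only stores the mapping
    h5file.create_dataset(
        "raw",
        shape=(100,),
        dtype=numpy.float32,
        external=[("raw.bin", 0, raw.nbytes)],
    )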

Virtual Dataset (aka. VDS)¶

A virtual dataset maps multiple datasets into a single one. Once created, it behaves like any other dataset.

See https://docs.h5py.org/en/stable/vds.html
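
A minimal sketch mapping the same source dataset into each row of a 2D virtual dataset (file and dataset names are illustrative):

In [ ]:
import numpy
import h5py

# Create a source file with a 1D dataset
with h5py.File("source.h5", mode="w") as h5file:
    h5file["data"] = numpy.arange(100, dtype=numpy.float32)

# Describe the virtual dataset and where its data comes from
layout = h5py.VirtualLayout(shape=(2, 100), dtype=numpy.float32)
source = h5py.VirtualSource("source.h5", "data", shape=(100,))
layout[0] = source
layout[1] = source

with h5py.File("vds.h5", mode="w") as h5file:
    h5file.create_virtual_dataset("virtual", layout, fillvalue=0)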

HDF5 file locking: A word of caution¶

Do NOT open an HDF5 file that is being written by another process (without taking precautions).

By default, HDF5 locks the file even for reading, and other processes cannot open it for writing. This can be an issue, e.g., during acquisition.

WARNING: Without file locking, do not open the same file twice for writing, or the file will be corrupted.

Workarounds:

  • Helper to handle HDF5 file locking: silx.io.h5py_utils.File
  • HDF5 file locking can be disabled by setting the HDF5_USE_FILE_LOCKING environment variable to FALSE.
  • With recent versions of h5py (>= 3.5.0): h5py.File's locking argument (see the sketch below)
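
For instance, with h5py >= 3.5.0, a file can be opened for reading without acquiring the lock (use with care while the file is being written):

In [ ]:
import h5py

# Open for reading without taking the HDF5 file lock (h5py >= 3.5.0)
with h5py.File("data/water.h5", mode="r", locking=False) as h5file:
    print(list(h5file.keys()))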

Practical tools¶

  • conversion:

    • silx convert: to convert EDF or SPEC files to HDF5
  • reading/writing HDF5 helpers:

    • silx.io.dictdump: h5todict, dicttoh5 (see the sketch below)
    • silx.io.utils.h5py_read_dataset
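
A quick sketch of the silx.io.dictdump helpers (the file name is illustrative):

In [ ]:
from silx.io.dictdump import dicttoh5, h5todict

# Write a nested dict as HDF5 groups and datasets
dicttoh5({"group1": {"data2": [1, 2, 3]}}, "from_dict.h5")

# Read the file back as a nested dict of numpy arrays
tree = h5todict("from_dict.h5")
print(tree)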

A word about Nexus¶

NeXus is a data format for neutron, X-ray, and muon science.

It aims to be a common data format for scientists, enabling greater collaboration.

If you intend to store data to be shared, it gives you a 'standard way' of storing it.

The main advantage is compatibility: between your data files and existing software (provided both follow the NeXus format), and between your software and other datasets.

  • an example of how to store raw tomography data
  • an example of how to store a tomography application (3D reconstruction)
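
As an illustration (a sketch, not a complete NeXus definition), a minimal NeXus-style entry written with h5py tags each group with an NX_class attribute so that NeXus-aware software can interpret it:

In [ ]:
import h5py

with h5py.File("nexus_like.h5", mode="w") as h5file:
    # Groups are identified by their NX_class attribute
    entry = h5file.create_group("entry")
    entry.attrs["NX_class"] = "NXentry"

    data = entry.create_group("data")
    data.attrs["NX_class"] = "NXdata"
    data["intensity"] = [1, 2, 3]

    # Tell NeXus-aware viewers which dataset is the default signal
    data.attrs["signal"] = "intensity"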

Conclusion¶

h5py provides access to HDF5 file content from Python through:

  • h5py.File opens an HDF5 file:
    • Do not forget the mode: 'r', 'a', 'w'.
    • Use a with statement or do not forget to close the file.
  • h5py.Group provides dict-like (key-value) access to the HDF5 structure.
  • h5py.Dataset gives access to data as numpy.ndarray.