Dump sample scripts - maybe add to docs #303

Merged: 5 commits, Jan 20, 2025
198 changes: 198 additions & 0 deletions docs/source/python.rst
@@ -195,3 +195,201 @@ the data is available as `dask` arrays::
viewer = napari.view_image(dask_data, channel_axis=0)
if __name__ == '__main__':
napari.run()


More writing examples
---------------------

Writing a big image tile-by-tile, then downsampling on disk to build the pyramid::

# Created for https://forum.image.sc/t/writing-tile-wise-ome-zarr-with-pyramid-size/85063

import os
import zarr
from ome_zarr.io import parse_url
from ome_zarr.reader import Reader
from ome_zarr.writer import write_multiscales_metadata
from ome_zarr.dask_utils import resize as da_resize
import numpy as np
import dask.array as da
from math import ceil

url = "https://uk1s3.embassy.ebi.ac.uk/idr/zarr/v0.3/9836842.zarr"
reader = Reader(parse_url(url))
nodes = list(reader())
# first level of the pyramid
dask_data = nodes[0].data[0]
tile_size = 512

def downsample_pyramid_on_disk(parent, paths):
"""
Takes a high-resolution Zarr array at paths[0] in the zarr group
and down-samples it by a factor of 2 for each of the other paths
"""
group_path = parent.store.path
image_path = os.path.join(group_path, parent.path)
print("downsample_pyramid_on_disk", image_path)
for count, path in enumerate(paths[1:]):
target_path = os.path.join(image_path, path)
if os.path.exists(target_path):
print("path exists: %s" % target_path)
continue
# open previous resolution from disk via dask...
path_to_array = os.path.join(image_path, paths[count])
dask_image = da.from_zarr(path_to_array)

# resize in X and Y
dims = list(dask_image.shape)
dims[-1] = dims[-1] // 2
dims[-2] = dims[-2] // 2
output = da_resize(
dask_image, tuple(dims), preserve_range=True, anti_aliasing=False
)

# write to disk
da.to_zarr(
arr=output, url=image_path, component=path,
dimension_separator=parent._store._dimension_separator,
)
return paths

def get_tile(ch, row, col):
# read the tile data from somewhere - we use the dask array
y1 = row * tile_size
y2 = y1 + tile_size
x1 = col * tile_size
x2 = x1 + tile_size
return dask_data[ch, y1:y2, x1:x2]

# shape of the source image: (4, 1920, 1920)
shape = dask_data.shape
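# chunk size matches the tile size, so each tile written below fills whole chunks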
chunks = (1, tile_size, tile_size)
d_type = np.dtype('<u2')

channel_count = shape[0]
row_count = ceil(shape[-2]/tile_size)
col_count = ceil(shape[-1]/tile_size)

store = parse_url("9836842.zarr", mode="w").store
root = zarr.group(store=store)

# create empty array at root of pyramid
zarray = root.require_dataset(
"0",
shape=shape,
exact=True,
chunks=chunks,
dtype=d_type,
)

print("row_count", row_count, "col_count", col_count)
# Go through all tiles and write data to "0" array
for ch_index in range(channel_count):
for row in range(row_count):
for col in range(col_count):
tile = get_tile(ch_index, row, col).compute()
y1 = row * tile_size
y2 = y1 + tile_size
x1 = col * tile_size
x2 = x1 + tile_size
print("ch_index", ch_index, "row", row, "col", col)
zarray[ch_index, y1:y2, x1:x2] = tile

paths = ["0", "1", "2"]
axes = [{"name": "c", "type": "channel"}, {"name": "y", "type": "space"}, {"name": "x", "type": "space"}]

# The full-resolution "0" array is now on disk. Downsample it (in X and Y only) to create "1" and "2"
downsample_pyramid_on_disk(root, paths)

transformations = [
[{"type": "scale", "scale": [1.0, 1.0, 1.0]}],
[{"type": "scale", "scale": [1.0, 2.0, 2.0]}],
[{"type": "scale", "scale": [1.0, 4.0, 4.0]}]
]
datasets = []
for p, t in zip(paths, transformations):
datasets.append({"path": p, "coordinateTransformations": t})

write_multiscales_metadata(root, datasets, axes=axes)
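
Once the loop above has finished, the result can be read back with the same
``Reader`` to confirm the pyramid levels (a quick sanity check, assuming the
``9836842.zarr`` group written by the script above is in the current
directory)::

    from ome_zarr.io import parse_url
    from ome_zarr.reader import Reader

    # open the group we just wrote and list its resolution levels
    reader = Reader(parse_url("9836842.zarr"))
    image_node = list(reader())[0]
    for level, data in enumerate(image_node.data):
        # for this example the shapes should be
        # (4, 1920, 1920), (4, 960, 960) and (4, 480, 480)
        print("level", level, "shape", data.shape, "chunks", data.chunksize)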


Using dask to fetch tiles lazily, then writing the whole image in a single call::

# Created for https://forum.image.sc/t/writing-tile-wise-ome-zarr-with-pyramid-size/85063

import dask.array as da
import numpy as np
import zarr
from dask import delayed

from ome_zarr.io import parse_url
from ome_zarr.writer import write_image, write_multiscales_metadata

zarr_name = "test_dask.zarr"
store = parse_url(zarr_name, mode="w").store
root = zarr.group(store=store)

size_xy = 100
channel_count = 2
size_z = 10
row_count = 3
col_count = 5
dtype = np.uint8
tile_shape = (size_xy, size_xy)


def get_tile(ch, z, row, column):
print("get_tile", ch, z, row, column)
mean_val = ((row + 1) * (column + 1) * 4) + (10 * z)
rng = np.random.default_rng(1000 * ch)
return rng.poisson(mean_val, size=tile_shape).astype(dtype)


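# wrap get_tile so each call returns a lazy task rather than reading data immediately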
delayed_reader = delayed(get_tile)

dask_channels = []

for ch in range(channel_count):
dask_planes = []
for z_index in range(size_z):
dask_rows = []
for row in range(row_count):
dask_tiles = []
for col in range(col_count):
dask_tile = da.from_delayed(
delayed_reader(ch, z_index, row, col), shape=tile_shape, dtype=dtype
)
dask_tiles.append(dask_tile)
dask_row = da.concatenate(dask_tiles, axis=1)
dask_rows.append(dask_row)
dask_plane = da.concatenate(dask_rows, axis=0)
dask_planes.append(dask_plane)
# stack 2D planes to 3D for each channel
dask_channels.append(da.stack(dask_planes, axis=0))
# stack 3D (zyx) data to 4D (czyx)
dask_data = da.stack(dask_channels, axis=0)

print("dask_data", dask_data)

# This will create a downsampled 'multiscales' pyramid
write_image(dask_data, root, axes="czyx")

root.attrs["omero"] = {
"channels": [
{
"color": "FF0000",
"window": {"min": 0, "start": 0, "end": 200, "max": 256},
"label": "random_red",
"active": True,
},
{
"color": "00FF00",
"window": {"min": 0, "start": 0, "end": 200, "max": 256},
"label": "random_green",
"active": True,
},
]
}

print("Created image. Open with...")
print(f"ome_zarr view {zarr_name}")
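
As in the ``dask`` example earlier on this page, the written image can be
inspected in ``napari`` (a short sketch, assuming ``napari`` is installed and
``test_dask.zarr`` was created by the script above)::

    import napari

    from ome_zarr.io import parse_url
    from ome_zarr.reader import Reader

    # read the highest-resolution level back as a dask array
    reader = Reader(parse_url("test_dask.zarr"))
    dask_data = list(reader())[0].data[0]

    # czyx data: treat the first axis as the channel axis
    viewer = napari.view_image(dask_data, channel_axis=0)
    if __name__ == '__main__':
        napari.run()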