Skip to content

Commit

Permalink
(WIP) Ingest high and low resolution images from Visium
Browse files Browse the repository at this point in the history
  • Loading branch information
jp-dark committed Apr 4, 2024
1 parent de9d64f commit e593fa6
Show file tree
Hide file tree
Showing 2 changed files with 137 additions and 13 deletions.
1 change: 1 addition & 0 deletions apis/python/setup.py
Original file line number Diff line number Diff line change
Expand Up @@ -333,6 +333,7 @@ def run(self):
],
extras_require={
"dev": open("requirements_dev.txt").read(),
"spatial": ["tifffile", "pillow"],
},
python_requires=">=3.8",
cmdclass={"build_ext": build_ext, "bdist_wheel": bdist_wheel},
Expand Down
149 changes: 136 additions & 13 deletions apis/python/src/tiledbsoma/experimental/ingest.py
Original file line number Diff line number Diff line change
Expand Up @@ -12,10 +12,22 @@

import json
import pathlib
from typing import TYPE_CHECKING, Any, Dict, Optional, Sequence, Type, Union
from typing import (

Check warning on line 15 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L13-L15

Added lines #L13 - L15 were not covered by tests
TYPE_CHECKING,
Any,
Dict,
List,
Optional,
Sequence,
Tuple,
Type,
Union,
)

import numpy as np
import pandas as pd
import pyarrow as pa
from PIL import Image
import scanpy

Check warning on line 31 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L27-L31

Added lines #L27 - L31 were not covered by tests

from .. import Collection, DataFrame, DenseNDArray, Experiment, SparseNDArray
Expand Down Expand Up @@ -87,14 +99,14 @@ def from_visium(
else input_path / "filtered_feature_bc_matrix.h5"
)

# Note: Hard-coded for Space Range version >= 2
# TODO: Generalize - this is hard-coded for Space Ranger version 2
input_tissue_positions = input_path / "spatial/tissue_positions.csv"
input_scale_factors = input_path / "spatial/scalefactors_json.json"

Check warning on line 104 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L103-L104

Added lines #L103 - L104 were not covered by tests

# input_images = {
# "hires": input_path / "spatial/tissue_hires_image.png",
# "lowres": input_path / "spatial/tissue_lowres_image.png",
# }
# TODO: Generalize - hard-coded for Space Ranger version 2
input_hires = input_path / "spatial/tissue_hires_image.png"
input_lowres = input_path / "spatial/tissue_lowres_image.png"
input_fullres = None

Check warning on line 109 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L107-L109

Added lines #L107 - L109 were not covered by tests

# Create the
anndata = scanpy.read_10x_h5(input_gene_expression)
Expand Down Expand Up @@ -126,8 +138,12 @@ def from_visium(
with open(input_scale_factors, mode="r", encoding="utf-8") as scale_factors_json:
scale_factors = json.load(scale_factors_json)

Check warning on line 139 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L138-L139

Added lines #L138 - L139 were not covered by tests

# TODO: The `obs_df` should be in dataframe with only soma_joinid and obs_id. Not
# currently bothering to check/enforce this.
with Experiment.open(uri, mode="r", context=context) as experiment:
obs_df = experiment.obs.read().concat().to_pandas()

Check warning on line 144 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L143-L144

Added lines #L143 - L144 were not covered by tests

# Add spatial information to the experiment.
with Experiment.open(uri, mode="w", context=context) as experiment:
spatial_uri = f"{uri}/spatial"
with _create_or_open_collection(

Check warning on line 149 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L147-L149

Added lines #L147 - L149 were not covered by tests
Expand All @@ -143,9 +159,10 @@ def from_visium(
_maybe_set(

Check warning on line 159 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L159

Added line #L159 was not covered by tests
spatial, scene_name, scene, use_relative_uri=use_relative_uri
)

obs_locations_uri = f"{scene_uri}/obs_locations"

Check warning on line 163 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L163

Added line #L163 was not covered by tests
# TODO: The `obs_df` on the next line should be a dataframe with only
# soma_joinid and obs_id. Not currently bothering to check/enforce this.

# Write spot data and add to the scene.
with _write_visium_spot_dataframe(

Check warning on line 166 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L166

Added line #L166 was not covered by tests
obs_locations_uri,
input_tissue_positions,
Expand All @@ -160,7 +177,21 @@ def from_visium(
obs_locations,
use_relative_uri=use_relative_uri,
)
# images_uri = f"{scene_uri}/images"

# Write image data and add to the scene.
images_uri = f"{scene_uri}/images"
with _write_visium_images(

Check warning on line 183 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L182-L183

Added lines #L182 - L183 were not covered by tests
images_uri,
scale_factors,
input_hires=input_hires,
input_lowres=input_lowres,
input_fullres=input_fullres,
use_relative_uri=use_relative_uri,
**ingest_ctx,
) as images:
_maybe_set(

Check warning on line 192 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L192

Added line #L192 was not covered by tests
scene, "images", images, use_relative_uri=use_relative_uri
)
return uri

Check warning on line 195 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L195

Added line #L195 was not covered by tests


Expand Down Expand Up @@ -205,13 +236,105 @@ def _write_visium_spot_dataframe(


def _write_visium_images(

Check warning on line 238 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L238

Added line #L238 was not covered by tests
image_uri: str,
input_images: Dict[str, pathlib.Path],
input_scale_factors: Dict[str, Any],
uri: str,
scale_factors: Dict[str, Any],
*,
input_hires: Optional[pathlib.Path],
input_lowres: Optional[pathlib.Path],
input_fullres: Optional[pathlib.Path],
ingestion_params: IngestionParams,
additional_metadata: "AdditionalMetadata" = None,
platform_config: Optional["PlatformConfig"] = None,
context: Optional["SOMATileDBContext"] = None,
use_relative_uri: Optional[bool] = None,
) -> Collection[DenseNDArray]:
input_images: Dict[str, Tuple[pathlib.Path, List[float]]] = {}
if input_fullres is not None:
input_images["fullres"] = (input_fullres, [1.0, 1.0, 1.0])
if input_hires is not None:
scale = 1.0 / scale_factors["tissue_hires_scalef"]
input_images["hires"] = (input_hires, [1.0, scale, scale])
if input_lowres is not None:
scale = 1.0 / scale_factors["tissue_lowres_scalef"]
input_images["lowres"] = (input_lowres, [1.0, scale, scale])
axes_metadata = [

Check warning on line 260 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L251-L260

Added lines #L251 - L260 were not covered by tests
{"name": "c", "type": "channel"},
{"name": "y", "type": "space", "unit": "micrometer"},
{"name": "x", "type": "space", "unit": "micrometer"},
]
return _write_multiscale_images(

Check warning on line 265 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L265

Added line #L265 was not covered by tests
uri,
input_images,
axes_metadata=axes_metadata,
ingestion_params=ingestion_params,
additional_metadata=additional_metadata,
platform_config=platform_config,
context=context,
use_relative_uri=use_relative_uri,
)


def _write_multiscale_images(

Check warning on line 277 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L277

Added line #L277 was not covered by tests
uri: str,
input_images: Dict[str, Tuple[pathlib.Path, List[float]]],
*,
axes_metadata: List[Dict[str, str]],
ingestion_params: IngestionParams,
additional_metadata: "AdditionalMetadata" = None,
platform_config: Optional["PlatformConfig"] = None,
context: Optional["SOMATileDBContext"] = None,
use_relative_uri: Optional[bool] = None,
) -> Collection[DenseNDArray]:
raise NotImplementedError()
"""TODO: Write full docs for this function
TODO: Need to add in collection level metadata. In this case it will be
"""
collection = _create_or_open_collection(

Check warning on line 293 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L293

Added line #L293 was not covered by tests
Collection[DenseNDArray],
uri,
ingestion_params=ingestion_params,
additional_metadata=additional_metadata,
context=context,
)
datasets_metadata = []
for image_name, (image_path, image_scales) in input_images.items():
datasets_metadata.append(

Check warning on line 302 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L300-L302

Added lines #L300 - L302 were not covered by tests
{
"path": image_name,
"coordinateTransforms": [{"type": "scale", "scale": image_scales}],
}
)
image_uri = f"{uri}/{image_name}"

Check warning on line 308 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L308

Added line #L308 was not covered by tests

# TODO: Need to create new imaging type with dimensions 'c', 'y', 'x'
im = np.transpose(np.array(Image.open(image_path)), (2, 0, 1))
image_array = DenseNDArray.create(

Check warning on line 312 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L311-L312

Added lines #L311 - L312 were not covered by tests
image_uri,
type=pa.from_numpy_dtype(im.dtype),
shape=im.shape,
platform_config=platform_config,
context=context,
)
tensor = pa.Tensor.from_numpy(im)
image_array.write(

Check warning on line 320 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L319-L320

Added lines #L319 - L320 were not covered by tests
(slice(None), slice(None), slice(None)),
tensor,
platform_config=platform_config,
)
_maybe_set(

Check warning on line 325 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L325

Added line #L325 was not covered by tests
collection, image_name, image_array, use_relative_uri=use_relative_uri
)
metadata_blob = json.dumps(

Check warning on line 328 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L328

Added line #L328 was not covered by tests
{
"multiscales": [
{
"version": "0.1.0-dev",
"name": "visium-example",
"datasets": datasets_metadata,
}
]
}
)
collection.metadata.update({"multiscales": metadata_blob})
return collection

Check warning on line 340 in apis/python/src/tiledbsoma/experimental/ingest.py

View check run for this annotation

Codecov / codecov/patch

apis/python/src/tiledbsoma/experimental/ingest.py#L339-L340

Added lines #L339 - L340 were not covered by tests

0 comments on commit e593fa6

Please sign in to comment.