teamtomo · LorenzLamm · Apr 28, 2024 · Apr 11, 2024 · Apr 15, 2024 · Apr 15, 2024
diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
@@ -19,7 +19,7 @@ repos:
         args: [--fix]
 
   - repo: https://github.com/psf/black
-    rev: 23.1.0
+    rev: 24.4.0
     hooks:
       - id: black
 

diff --git a/src/membrain_seg/__init__.py b/src/membrain_seg/__init__.py
@@ -1,4 +1,5 @@
 """membrane segmentation in 3D for cryo-ET."""
+
 from importlib.metadata import PackageNotFoundError, version
 
 try:

diff --git a/src/membrain_seg/annotations/__init__.py b/src/membrain_seg/annotations/__init__.py
@@ -1,4 +1,5 @@
 """empty init."""
+
 from .cli import cli  # noqa: F401
 from .extract_patch_cli import extract_patches  # noqa: F401
 from .merge_corrections_cli import merge_corrections  # noqa: F401
diff --git a/src/membrain_seg/segmentation/cli/__init__.py b/src/membrain_seg/segmentation/cli/__init__.py
@@ -1,5 +1,7 @@
 """CLI init function."""
+
 # These imports are necessary to register CLI commands. Do not remove!
 from .cli import cli  # noqa: F401
 from .segment_cli import segment  # noqa: F401
+from .ske_cli import skeletonize  # noqa: F401
 from .train_cli import data_dir_help, train  # noqa: F401
diff --git a/src/membrain_seg/segmentation/cli/ske_cli.py b/src/membrain_seg/segmentation/cli/ske_cli.py
@@ -0,0 +1,64 @@
+import os
+
+from typer import Option
+
+from membrain_seg.segmentation.dataloading.data_utils import store_tomogram
+
+from ..skeletonize import skeletonization as _skeletonization
+from .cli import cli
+
+
+@cli.command(name="skeletonize", no_args_is_help=True)
+def skeletonize(
+    label_path: str = Option(..., help="Specifies the path for skeletonization."),
+    out_folder: str = Option(
+        "./predictions", help="Directory to save the resulting skeletons."
+    ),
+    batch_size: int = Option(
+        None,
+        help="Optional batch size for processing the tomogram. If not specified, "
+        "the entire volume is processed at once. If operating with limited GPU "
+        "resources, a batch size of 1,000,000 is recommended.",
+    ),
+):
+    """
+    Perform skeletonization on labeled tomograms using nonmax-suppression technique.
+
+    The label file is handed to the skeletonization routine together with the
+    requested batch size, and the result is stored in the output directory as
+    ``<label file name without extension>_skel.mrc``. The output directory is
+    created if it does not exist yet.
+    If batch_size is left at None, the entire tomogram is processed at once, which
+    might require significant memory. It is recommended to specify a batch size if
+    memory constraints are a concern. The maximum possible batch size is the
+    product of the tomogram's dimensions (Nx * Ny * Nz).
+
+    Parameters
+    ----------
+    label_path : str
+        File path to the tomogram to be skeletonized.
+    out_folder : str
+        Output folder path for the skeletonized tomogram.
+    batch_size : int, optional
+        The size of the batch to process the tomogram. Defaults to None, which
+        processes the entire volume at once. For large volumes, consider setting
+        it to a specific value like 1,000,000 to stay within memory limits.
+
+    Examples
+    --------
+    membrain skeletonize --label-path <path> --out-folder <output-directory>
+    --batch-size <batch-size>
+    """
+    ske = _skeletonization(label_path=label_path, batch_size=batch_size)
+
+    # exist_ok=True creates the folder only when it is missing and avoids the
+    # check-then-create race of a separate os.path.exists() test.
+    os.makedirs(out_folder, exist_ok=True)
+
+    # Output name: input file name with its extension swapped for "_skel.mrc"
+    label_stem = os.path.splitext(os.path.basename(label_path))[0]
+    out_file = os.path.join(out_folder, label_stem + "_skel.mrc")
+
+    store_tomogram(filename=out_file, tomogram=ske)
+    print("Skeleton saved to ", out_file)
diff --git a/src/membrain_seg/segmentation/dataloading/memseg_augmentation.py b/src/membrain_seg/segmentation/dataloading/memseg_augmentation.py
@@ -254,9 +254,11 @@ def get_training_transforms(
                     np.random.uniform(np.log(x[y] // 6), np.log(x[y]))
                 ),
                 loc=(-0.5, 1.5),
-                max_strength=lambda x, y: np.random.uniform(-5, -1)
-                if np.random.uniform() < 0.5
-                else np.random.uniform(1, 5),
+                max_strength=lambda x, y: (
+                    np.random.uniform(-5, -1)
+                    if np.random.uniform() < 0.5
+                    else np.random.uniform(1, 5)
+                ),
                 mean_centered=False,
             ),
             prob=(1.0 if prob_to_one else 0.3),
@@ -268,9 +270,11 @@ def get_training_transforms(
                     np.random.uniform(np.log(x[y] // 6), np.log(x[y]))
                 ),
                 loc=(-0.5, 1.5),
-                gamma=lambda: np.random.uniform(0.01, 0.8)
-                if np.random.uniform() < 0.5
-                else np.random.uniform(1.5, 4),
+                gamma=lambda: (
+                    np.random.uniform(0.01, 0.8)
+                    if np.random.uniform() < 0.5
+                    else np.random.uniform(1.5, 4)
+                ),
             ),
             prob=(1.0 if prob_to_one else 0.3),
         ),

diff --git a/src/membrain_seg/segmentation/dataloading/transforms.py b/src/membrain_seg/segmentation/dataloading/transforms.py
@@ -288,9 +288,9 @@ def __call__(self, data):
                 y = self.R.randint(0, y_max - height)
                 x = self.R.randint(0, x_max - width)
                 if self.replace_with == "mean":
-                    image[
-                        ..., z : z + depth, y : y + height, x : x + width
-                    ] = torch.mean(torch.Tensor(image))
+                    image[..., z : z + depth, y : y + height, x : x + width] = (
+                        torch.mean(torch.Tensor(image))
+                    )
                 elif self.replace_with == 0.0:
                     image[..., z : z + depth, y : y + height, x : x + width] = 0.0
             d[key] = image

diff --git a/src/membrain_seg/segmentation/networks/__init__.py b/src/membrain_seg/segmentation/networks/__init__.py
@@ -1,3 +1,4 @@
 """Neural networks implemented as pytorch lightning modules."""
+
 __all__ = ["SemanticSegmentationUnet"]
 from membrain_seg.segmentation.networks.unet import SemanticSegmentationUnet
diff --git a/src/membrain_seg/segmentation/networks/unet.py b/src/membrain_seg/segmentation/networks/unet.py
@@ -140,9 +140,11 @@ def __init__(
 
         self.loss_function = DeepSuperVisionLoss(
             loss_function,
-            weights=[1.0, 0.5, 0.25, 0.125, 0.0675]
-            if use_deep_supervision
-            else [1.0, 0.0, 0.0, 0.0, 0.0],
+            weights=(
+                [1.0, 0.5, 0.25, 0.125, 0.0675]
+                if use_deep_supervision
+                else [1.0, 0.0, 0.0, 0.0, 0.0]
+            ),
         )
 
         # validation metric
@@ -278,9 +280,9 @@ def validation_step(self, batch, batch_idx):
         # compute more stats?
         outputs4dice = outputs[0].clone()
         labels4dice = labels[0].clone()
-        outputs4dice[
-            labels4dice == 2
-        ] = -1.0  # Setting to -1 here leads to 0-labels after thresholding
+        outputs4dice[labels4dice == 2] = (
+            -1.0
+        )  # Setting to -1 here leads to 0-labels after thresholding
         labels4dice[labels4dice == 2] = 0  # Need to set to zero before post_label
         # Otherwise we have 3 classes
         outputs4dice = [self.post_pred(i) for i in decollate_batch(outputs4dice)]

diff --git a/src/membrain_seg/segmentation/skeletonization/__init__.py b/src/membrain_seg/segmentation/skeletonization/__init__.py
diff --git a/src/membrain_seg/segmentation/skeletonization/diff3d.py b/src/membrain_seg/segmentation/skeletonization/diff3d.py
@@ -0,0 +1,147 @@
+# ---------------------------------------------------------------------------------
+# DISCLAIMER: This code is adapted from the MATLAB and C++ implementations provided
+# in the paper titled "Robust membrane detection based on tensor voting for electron
+# tomography" by Antonio Martinez-Sanchez, Inmaculada Garcia, Shoh Asano, Vladan Lucic,
+# and Jose-Jesus Fernandez, published in the Journal of Structural Biology,
+# Volume 186, Issue 1, 2014, Pages 49-61. The original work can be accessed via
+# https://doi.org/10.1016/j.jsb.2014.02.015 and is used under conditions that adhere
+# to the original licensing agreements. For details on the original license, refer to
+# the publication: https://www.sciencedirect.com/science/article/pii/S1047847714000495.
+# ---------------------------------------------------------------------------------
+import numpy as np
+
+
+def calculate_derivative_3d(tomogram: np.ndarray, axis: int) -> np.ndarray:
+    """
+    Calculate the partial derivative of a 3D tomogram along a specified dimension.
+
+    Parameters
+    ----------
+    tomogram : np.ndarray
+        The input 3D tomogram as a numpy array. Its shape is unpacked into exactly
+        three sizes, so an array with another number of dimensions raises a
+        ValueError.
+    axis : int
+        The axis along which to compute the derivative.
+        Set axis=0 for the x-dimension, axis=1 for the y-dimension,
+        and any other value for the z-dimension.
+
+    Returns
+    -------
+    np.ndarray
+        A float32 array with the same shape as the input, holding the partial
+        derivative along the specified axis.
+
+    Notes
+    -----
+    Interior voxels receive the centered difference ``(t[i + 1] - t[i - 1]) / 2``.
+    At the two borders the missing neighbour is replaced by the border voxel
+    itself, so the value there is half the one-sided difference:
+    ``(t[1] - t[0]) / 2`` at the start and ``(t[-1] - t[-2]) / 2`` at the end.
+    If the tomogram has fewer than two voxels along ``axis`` there is nothing to
+    difference and the result is all zeros.
+
+    Examples
+    --------
+    Derivative of a single line of voxels along the z-axis (axis=2):
+
+    >>> line = np.array([[[0, 1, 4, 9]]])
+    >>> calculate_derivative_3d(line, 2)
+    array([[[0.5, 2. , 4. , 2.5]]], dtype=float32)
+
+    With only two voxels along the axis, both positions are border voxels:
+
+    >>> tomogram = np.array([[[1, 2], [3, 4]], [[5, 6], [7, 8]]])
+    >>> calculate_derivative_3d(tomogram, 0).tolist()
+    [[[2.0, 2.0], [2.0, 2.0]], [[2.0, 2.0], [2.0, 2.0]]]
+    """
+    # Get the size of the input tomogram (also enforces three dimensions)
+    num_x, num_y, num_z = tomogram.shape
+
+    # Shifted copies of the input: forward[i] = t[i + 1], backward[i] = t[i - 1]
+    forward_difference = np.zeros((num_x, num_y, num_z), dtype="float32")
+    backward_difference = np.zeros((num_x, num_y, num_z), dtype="float32")
+
+    # Any value other than 0 or 1 selects the z-dimension, as documented above
+    if axis == 0:
+        axis_index = 0
+    elif axis == 1:
+        axis_index = 1
+    else:
+        axis_index = 2
+
+    # Views with the differentiation axis moved to the front, so a single code
+    # path serves all three directions; writes go through to the buffers above.
+    source = np.moveaxis(tomogram, axis_index, 0)
+    forward = np.moveaxis(forward_difference, axis_index, 0)
+    backward = np.moveaxis(backward_difference, axis_index, 0)
+
+    # With fewer than two voxels along the axis there is no neighbour to copy
+    # (the border padding below would index out of bounds), so keep the zeros.
+    if source.shape[0] >= 2:
+        forward[:-1] = source[1:]
+        backward[1:] = source[:-1]
+        # Pad extremes
+        forward[-1] = forward[-2]
+        backward[0] = backward[1]
+
+    # Calculate the output tomogram
+    return (forward_difference - backward_difference) * 0.5
+
+
+def compute_gradients(tomogram: np.ndarray) -> tuple:
+    """
+    Compute the first-order partial derivatives of a 3D tomogram.
+
+    Parameters
+    ----------
+    tomogram : np.ndarray
+        The input 3D tomogram as a numpy array.
+
+    Returns
+    -------
+    tuple
+        The three gradient components in the order (gradX, gradY, gradZ).
+
+    Notes
+    -----
+    Each component is the result of calling calculate_derivative_3d on the
+    tomogram with axis 0 (x), axis 1 (y) and axis 2 (z), respectively.
+    """
+    # One derivative per spatial axis, evaluated in x, y, z order
+    return tuple(
+        calculate_derivative_3d(tomogram, spatial_axis) for spatial_axis in (0, 1, 2)
+    )
+
+
+def compute_hessian(gradX: np.ndarray, gradY: np.ndarray, gradZ: np.ndarray) -> tuple:
+    """
+    Compute the six Hessian tensor components from the gradients of a tomogram.
+
+    Parameters
+    ----------
+    gradX : np.ndarray
+        Gradient of the tomogram along the x-axis.
+    gradY : np.ndarray
+        Gradient of the tomogram along the y-axis.
+    gradZ : np.ndarray
+        Gradient of the tomogram along the z-axis.
+
+    Returns
+    -------
+    tuple
+        The components in the order (hessianXX, hessianYY, hessianZZ,
+        hessianXY, hessianXZ, hessianYZ).
+
+    Notes
+    -----
+    Every component is obtained by differentiating one of the supplied gradients
+    once more with calculate_derivative_3d. Only six components are returned;
+    the mixed terms are each derived from a single gradient (XY and XZ from
+    gradX, YZ from gradY).
+    """
+    # (gradient to differentiate, axis to differentiate along) per component
+    component_inputs = (
+        (gradX, 0),  # XX
+        (gradY, 1),  # YY
+        (gradZ, 2),  # ZZ
+        (gradX, 1),  # XY
+        (gradX, 2),  # XZ
+        (gradY, 2),  # YZ
+    )
+
+    return tuple(
+        calculate_derivative_3d(gradient, spatial_axis)
+        for gradient, spatial_axis in component_inputs
+    )