Source code for neuron_morphology.features.layer.layer_histogram

from typing import NamedTuple, Optional, Dict, Sequence, Tuple, Type, Any, Union
from enum import Enum
from functools import lru_cache
from collections.abc import Collection

import numpy as np
import pandas as pd
from scipy.stats import wasserstein_distance

from neuron_morphology.features.layer.reference_layer_depths import \
    ReferenceLayerDepths
from neuron_morphology.feature_extractor.data import Data
from neuron_morphology.feature_extractor.mark import (
    RequiresReferenceLayerDepths, 
    RequiresLayeredPointDepths, 
    RequiresRegularPointSpacing
)
from neuron_morphology.feature_extractor.marked_feature import marked
from neuron_morphology.constants import (
    AXON, SOMA, APICAL_DENDRITE, BASAL_DENDRITE)

[docs]def ensure_tuple(
    inputs: Any, 
    item_type: Type, 
    if_none: Union[str, Tuple] = "raise"
) -> Tuple:
    """ Try to smartly coerce inputs to a tuple.

    Parameters
    ----------
    inputs : the data to be coerced
    item_type : which type do/should the elements of the tuple have?
    if_none : if the inputs are none, return this value. If the value is 
        "raise", instead raise an exception

    Returns
    -------
    the coerced inputs

    """

    if isinstance(if_none, str) and if_none != "raise":
        raise ValueError("if_none must be a tuple or \"raise\"")

    if inputs is None:
        if if_none is "raise":
            raise ValueError("inputs were None")
        else:
            return if_none # type: ignore[]
    elif isinstance(inputs, item_type):
        return (inputs,)
    elif isinstance(inputs, Collection) and not isinstance(inputs, str):
        return tuple(inputs)
    else:
        raise ValueError(f"unable to ensure {type(inputs)} {inputs}")

[docs]def ensure_node_types(node_types):
    """ Make sure the argued node types are a tuple
    """

    return ensure_tuple(
        node_types, int, if_none=(AXON, SOMA, APICAL_DENDRITE, BASAL_DENDRITE)
    )

[docs]def ensure_layers(layers):
    """ Make sure the argued layer array is a tuple
    """

    return ensure_tuple(layers, str, None)


[docs]class LayerHistogram(NamedTuple):
    """ The results of calculating a within-layer depth histogram of points 
    within some cortical layer.
    """

    # within each bin, how many points wre observed
    counts: np.ndarray

    # the edges (depths) of each bin
    bin_edges: np.ndarray


[docs]class EarthMoversDistanceInterpretation(Enum):
    """ Describes how to understand an earth mover's distance result. This is 
    useful in the case that one or both histograms are all 0.
    """

    # Both histograms were present and nonempty - the earth movers distance was 
    # calculated between the normalized version of each.
    BothPresent = 0

    # One histogram was empty (all 0). The resulting value is the sum of the 
    # non-empty histogram.
    OneEmpty = 1

    # Both histograms were empty (all 0). The resulting value may be 0 or nan.
    BothEmpty = 2

[docs]class EarthMoversDistanceResult(NamedTuple):
    """ The result of comparing two histograms using earth mover's distance
    """

    # the earth movers distance between these histograms. 
    result: float

    # how to interpret the result.
    interpretation: EarthMoversDistanceInterpretation

[docs]    def to_dict_human_readable(self):
        return {
            "result": self.result,
            "interpretation": str(self.interpretation).split(".")[1]
        }


@marked(RequiresRegularPointSpacing)
@marked(RequiresLayeredPointDepths)
@marked(RequiresReferenceLayerDepths)
def earth_movers_distance(
    data: Data,
    node_types: Sequence[int],
    node_types_to_compare: Sequence[int],
    bin_size: float = 5
) -> Dict[str, EarthMoversDistanceResult]: 
    """ Calculate the earth mover's distance between normalized histograms of 
    node depths within cortical layers. Calculates one distance for each layer.

    Parameters
    ----------
    data : Must be endowed with layered_point_depths and reference_layer_depths.
        The morphology is not actually used directly.
    node_types : Defines one set of points whose histograms to compare.
    node_types_to_compare : Defines the other set of points
    bin_size : the size of each depth bin. Default is appropriate if the units
        are microns.

    Returns
    -------
    A mapping from layers to distances between histograms within those layers.

    """

    first_hists = normalized_depth_histograms_across_layers(data, 
        ensure_node_types(node_types), bin_size=bin_size)
    second_hists = normalized_depth_histograms_across_layers(data, 
        ensure_node_types(node_types_to_compare), bin_size=bin_size)

    return {
        layer: histogram_earth_movers_distance(
            first_hists[layer].counts,
            second_hists[layer].counts
        )
        for layer in set(first_hists.keys()) & set(second_hists.keys())
    }

[docs]def histogram_earth_movers_distance(
    from_hist: np.ndarray, 
    to_hist: np.ndarray
) -> EarthMoversDistanceResult:
    """ Calculate the earth mover's distance between to histograms, normalizing 
    each. If one histogram is empty, return the sum of the other and a flag. If
    both are empty, return 0 a and a flag.

    Parameters
    ----------
    from_hist : distance is calculated between (the normalized form of) this
        histogram and to_hist. The result is symmetric.  
    to_hist : distance is calculated between (the normalized form of) this
        histogram and from_hist

    Returns
    -------
    The distance between input histograms, along with an enum indicating 
    whether one or both of the histograms was all 0.

    """

    from_total = from_hist.sum()
    to_total = to_hist.sum()

    if from_total == 0 or to_total == 0:
        if from_total == 0  and to_total == 0:
            return EarthMoversDistanceResult(
                0, 
                EarthMoversDistanceInterpretation.BothEmpty
            )
    
        else:
            return EarthMoversDistanceResult(
                from_total if from_total else to_total,
                EarthMoversDistanceInterpretation.OneEmpty
            )

    base = np.arange(len(from_hist))
    return EarthMoversDistanceResult(
        wasserstein_distance(base, base, from_hist, to_hist),
        EarthMoversDistanceInterpretation.BothPresent
    )


@marked(RequiresRegularPointSpacing)
@marked(RequiresLayeredPointDepths)
@marked(RequiresReferenceLayerDepths)
def normalized_depth_histogram(
    data: Data, 
    node_types: Optional[Sequence[int]] = None,
    bin_size=5.0
) -> Dict[str, LayerHistogram]:
    """ Calculates for each cortical layer a histogram of node depths within 
    that layer.

    Parameters
    ----------
    data : Must have the following attributes:
        reference_layer_depths : A dictionary mapping layer names (str) to 
            ReferenceLayerDepths objects describing the average pia and white-
            matter side depths of this each layer.
        layered_point_depths : A LayeredPointDepths defining for each point a 
            depth from pia. See LayeredPointDepths for more information.
    node_types : for which to calculate the histograms
    bin_size : the size of each depth bin. Default is appropriate if the units
        are microns.
    """

    return normalized_depth_histograms_across_layers(
        data=data, point_types=ensure_node_types(node_types), bin_size=bin_size)

# small cache since calling this fn many times probably means the user is 
# running across multiple specimens, in which case we expect all misses.
[docs]@lru_cache(maxsize=16) 
def normalized_depth_histograms_across_layers(
    data: Data, 
    point_types: Optional[Tuple[int]] = None,
    only_layers: Optional[Tuple[str]] = None,
    bin_size=5.0
) -> Dict[str, LayerHistogram]:
    """ A helper function for running cortical depth histograms across multiple 
    layers.

    Parameters
    ----------
    data : must have reference_layer_depths and layered_point_depths
    point_types : calculate histograms for points labeled with these types
    only_layers : exclude other layers from this calculation
    bin_size : the size of each depth bin. Default is appropriate if the units
        are microns.

    """

    depths = data.layered_point_depths.df # type: ignore[attr-defined]
    if point_types is not None:
        depths = depths[depths["point_type"].isin(set(point_types))]
    if only_layers is not None:
        depths = depths[depths["layer_name"].isin(set(only_layers))]

    output = {}

    for layer_name, group in depths.groupby("layer_name"):
        reference_layer_depths = data.reference_layer_depths.get( # type: ignore[attr-defined]
            layer_name, None)
        if reference_layer_depths is None:
            raise ValueError(
                "unable to calculate layer depth histogram for layer "
                f"{layer_name} - no reference depths provided"
            )

        group_df = pd.DataFrame(group)
        output[layer_name] = normalized_depth_histogram_within_layer(
            point_depths=group_df["depth"],
            local_layer_pia_side_depths=group_df["local_layer_pia_side_depth"],
            local_layer_wm_side_depths=group_df["local_layer_wm_side_depth"],
            reference_layer_depths=reference_layer_depths,
            bin_size=bin_size
        )

    return output


[docs]def normalized_depth_histogram_within_layer(
    point_depths: np.ndarray,
    local_layer_pia_side_depths: np.ndarray,
    local_layer_wm_side_depths: np.ndarray,
    reference_layer_depths: ReferenceLayerDepths,
    bin_size: float
) -> np.ndarray:
    """ Calculates a histogram of node depths within a single (cortical) layer. 
    Uses reference information about layer boundaries to normalize these 
    depths for cross-reconstruction comparison.

    Parameters
    ----------
    depths : Each item corresponds to a point of interest (such as a node 
        in a morphological reconstruction). Values are the depths of these 
        points of interest from the pia surface.
    local_layer_pia_side_depths : Each item corresponds to a point of interest.
        Values are the depth of the intersection point between a path of 
        steepest descent from the pia surface to the point of interest and the 
        upper surface of the layer.
    local_layer_wm_side_depths : Each item corresponds to a point of interest. 
        Values are the depth of the intersection point between the layer's 
        lower boundary and the path described above.
    reference_layer_depths : Used to provide normalized depths suitable 
        for comparison across reconstructions. Should provide a generic 
        equivalent of local layer depths for a population or reference space.
    bin_size : The width of each bin, in terms of depths from pia in the 
        reference space. Provide only one of bin_edges or bin_size.
    
    Returns
    -------
    A numpy array listing for each depth bin the number of nodes falling within 
        that bin.

    Notes
    -----
    This function relies on the notion of a steepest descent path through 
    cortex, but is agnostic to the method used to obtain such a path and to 
    features of the path (e.g. whether it is allowed to curve). Rather the 
    caller must ensure that all depths have been calculated according to a 
    consistent scheme. 

    """

    bin_edges = np.arange(
        reference_layer_depths.pia_side,
        reference_layer_depths.wm_side,
        bin_size
    )
    if reference_layer_depths.wm_side - bin_edges[-1] > 0.5 * bin_size:
        bin_edges = np.append(bin_edges, [reference_layer_depths.wm_side])
    else:
        bin_edges[-1] = reference_layer_depths.wm_side

    if reference_layer_depths.scale:
        local_layer_thicknesses = \
            local_layer_wm_side_depths - local_layer_pia_side_depths
        scale = reference_layer_depths.thickness / local_layer_thicknesses
    else:
        scale = 1.0

    normalized_depths = (point_depths - local_layer_pia_side_depths) * scale
    normalized_depths = normalized_depths + reference_layer_depths.pia_side
    normalized_depths = normalized_depths[np.isfinite(normalized_depths)]

    counts, bin_edges = np.histogram(normalized_depths, bins=bin_edges)
    return LayerHistogram(counts=counts, bin_edges=bin_edges)
Source code for neuron_morphology.features.layer.layer_histogram

neuron morphology

Navigation

Related Topics