Source code for magmap.atlas.ontology

# Anatomical ontology management
# Author: David Young, 2019
"""Handle ontology lookup.
"""

import os
from collections import OrderedDict
from enum import Enum
import json
from typing import Any, Callable, Dict, List, Optional, Sequence, Tuple, Union

import numpy as np
import pandas as pd
from pandas.errors import ParserError

from magmap.settings import config
from magmap.io import df_io, libmag

NODE = "node"
PARENT_IDS = "parent_ids"
MIRRORED = "mirrored"
RIGHT_SUFFIX = " (R)"
LEFT_SUFFIX = " (L)"

_logger = config.logger.getChild(__name__)



[docs]
class LabelColumns(Enum):
    """Enumeration of column names for label data frames.

    Each member's value is the column header string.
    """

    FROM_LABEL = "FromLabel"
    TO_LABEL = "ToLabel"




[docs]
class LabelsRef:
    """Labels reference container and worker class.
    
    Attributes:
        path_ref: Path to labels reference file.
        loaded_ref: Loaded reference object.
        ref_lookup: Reference in a dict format.
    
    """
    
    # mapping of alternate column names to ABA-style names
    _COLS_TO_ABA: Dict[str, str] = {
        config.AtlasMetrics.REGION.value: config.ABAKeys.ABA_ID.value,
        config.AtlasMetrics.REGION_NAME.value: config.ABAKeys.NAME.value,
    }
    
    def __init__(self, path_ref: Optional[str] = None):
        """Initialize the container without loading anything.

        Args:
            path_ref: Path to the labels reference file; defaults to None.

        """
        # the loaded reference and its lookup start out unset
        self.ref_lookup: Optional[Dict[int, Any]] = None
        self.loaded_ref: Optional[Union[Dict, pd.DataFrame]] = None
        self.path_ref: Optional[str] = path_ref


[docs]
    def load_labels_ref(self, path: str = None) -> Union[Dict, pd.DataFrame]:
        """Load labels from a reference JSON or CSV file.
        
        The loaded object is also stored in :attr:`loaded_ref`.
        
        Args:
            path: Path to labels reference; defaults to None to use
                :attr:`path_ref`.
        
        Returns:
            A JSON decoded object (eg dictionary) if the path has a JSON
            extension (case-insensitive), or a data frame with columns
            renamed to ABA-style names.
        
        Raises:
            FileNotFoundError: if ``path`` is empty or could not be loaded
                or parsed, including malformed JSON and empty CSV files.
                The underlying error is chained as the cause.
        
        """
        if not path:
            path = self.path_ref
        try:
            if not path:
                raise FileNotFoundError
            ext = os.path.splitext(path)[1]
            if ext.lower() == ".json":
                # load JSON file
                with open(path, "r") as f:
                    self.loaded_ref = json.load(f)
            else:
                # load CSV file and rename columns to ABA-style names
                df = pd.read_csv(path)
                self.loaded_ref = df.rename(self._COLS_TO_ABA, axis=1)
        except (ParserError, pd.errors.EmptyDataError, json.JSONDecodeError,
                FileNotFoundError) as e:
            # normalize parsing failures to the documented exception type so
            # that callers such as ``load`` can handle them uniformly
            raise FileNotFoundError(
                f"Could not load labels reference file from '{path}', skipping"
            ) from e
        return self.loaded_ref



[docs]
    def get_node(self, nested_dict, key, value, key_children):
        """Search a nested dictionary depth-first for a key-value pair.
    
        Args:
            nested_dict: Dictionary whose ``key_children`` entry holds a
                list of dictionaries of the same structure.
            key: Key whose value is compared against ``value``.
            value: Value to find, assumed to be unique for the given key.
            key_children: Name of the children key, whose list of further
                dictionaries may be empty.
    
        Returns:
            The first dictionary whose ``key`` entry equals ``value``, or
            None if not found. A dictionary missing ``key`` or
            ``key_children`` has the missing key printed and is treated as
            not containing a match.
        """
        try:
            if nested_dict[key] == value:
                # this dictionary is itself the match
                return nested_dict
            for sub_dict in nested_dict[key_children]:
                match = self.get_node(sub_dict, key, value, key_children)
                if match is not None:
                    return match
        except KeyError as err:
            print(err)
        return None

    

[docs]
    def create_aba_reverse_lookup(self, labels_ref) -> Dict[int, Any]:
        """Build a reverse lookup for an Allen Brain Atlas style ontology.
    
        Args:
            labels_ref: The ontology file as a parsed JSON dictionary. The
                first element of its ``"msg"`` entry is used as the root.
    
        Returns:
            Reverse lookup dictionary as output by
            :meth:`create_reverse_lookup`.
        """
        root = labels_ref["msg"][0]
        id_key = config.ABAKeys.ABA_ID.value
        children_key = config.ABAKeys.CHILDREN.value
        return self.create_reverse_lookup(root, id_key, children_key)

    

[docs]
    def create_reverse_lookup(
            self, nested_dict, key, key_children,
            id_dict: Optional[Dict[int, Any]] = None,
            parent_list=None) -> Dict[int, Any]:
        """Create a reverse lookup dictionary keyed by the values of ``key``.
    
        Each entry of the output maps to a dictionary holding "node", the
        original dictionary with the given key-value pair, and, for
        non-root nodes, "parent_ids", the list of ``key`` values of all its
        ancestors. The ancestor list can be used to track all superseding
        dictionaries, and the node can be used to find all its children.
    
        Args:
            nested_dict (dict): A dictionary that contains a list of
                dictionaries in the ``key_children`` entry.
            key (Any): Key whose values become the keys of the output. These
                values should be unique throughout ``nested_dict`` and thus
                serve as IDs.
            key_children (Any): Name of the children key, whose list of
                further dictionaries may be empty.
            id_dict (OrderedDict): Output dictionary, filled in-place during
                recursion. Insertion order places children after their
                parents. Defaults to None to create an empty `OrderedDict`.
            parent_list (list[Any]): Values of ``key`` in all ancestor
                dictionaries; defaults to None for the root call, in which
                case no "parent_ids" entry is stored for the node.
    
        Returns:
            OrderedDict: The lookup dictionary described above.
    
        """
        lookup = OrderedDict() if id_dict is None else id_dict
        node_id = nested_dict[key]
        entry = {NODE: nested_dict}
        if parent_list is not None:
            entry[PARENT_IDS] = parent_list
        lookup[node_id] = entry
        try:
            sub_dicts = nested_dict[key_children]
            # one ancestry list, including this node, is shared by all of
            # this node's immediate children
            lineage = [] if parent_list is None else list(parent_list)
            lineage.append(node_id)
            for sub_dict in sub_dicts:
                self.create_reverse_lookup(
                    sub_dict, key, key_children, lookup, lineage)
        except KeyError as err:
            print(err)
        return lookup

    

[docs]
    def create_lookup_pd(
            self, df: Optional[pd.DataFrame] = None) -> Dict[int, Any]:
        """Create a lookup dictionary from a Pandas data frame.
    
        Args:
            df: Pandas data frame with an ID column named by
                :const:``config.ABAKeys.ABA_ID``. Other ABA-style columns
                (:const:``config.ABAKeys.NAME``,
                :const:``config.ABAKeys.LEVEL``,
                :const:``config.ABAKeys.ACRONYM``) are filled with fallbacks
                when absent. Defaults to None, in which case
                :attr:`loaded_ref` is used.
    
        Returns:
            Dictionary similar to that generated from 
            :meth:``create_reverse_lookup``, with IDs as keys and values 
            consisting of another dictionary with :const:``NODE`` and 
            :const:``PARENT_IDS`` as keys. :const:``NODE`` in turn 
            contains the row as a dictionary, plus a list of child nodes
            under :const:``config.ABAKeys.CHILDREN``.
    
        Raises:
            KeyError: if the reference is not a data frame or a required
                column cannot be found.
    
        """
        if df is None:
            df = self.loaded_ref
        if not isinstance(df, pd.DataFrame):
            raise KeyError("Loaded reference is not a data frame")
        
        id_dict = OrderedDict()
        try:
            ids = df[config.ABAKeys.ABA_ID.value]
            has_parent = config.AtlasMetrics.PARENT.value in df.columns
            for region_id in ids:
                # select the row(s) matching this ID and convert the first
                # match to a dict
                region = df[ids == region_id]
                region_dict = region.to_dict("records")[0]

                # ensure that ABA-style columns are present, falling back to
                # the equivalent atlas metrics columns or defaults
                if config.ABAKeys.NAME.value not in region_dict:
                    region_dict[config.ABAKeys.NAME.value] = str(region_id)
                if config.ABAKeys.LEVEL.value not in region_dict:
                    level = region.get(config.AtlasMetrics.LEVEL.value)
                    region_dict[config.ABAKeys.LEVEL.value] = (
                        1 if level is None else level.squeeze())
                if config.ABAKeys.ACRONYM.value not in region_dict:
                    abbr = region.get(
                        config.AtlasMetrics.REGION_ABBR.value)
                    region_dict[config.ABAKeys.ACRONYM.value] = (
                        "" if abbr is None else abbr.squeeze())
                
                # add list for references to children
                region_dict[config.ABAKeys.CHILDREN.value] = []
                
                # add to lookup dict; parent IDs come from the parent column
                # of the matching row(s), or are empty without that column
                parent_ids = (region[config.AtlasMetrics.PARENT.value].tolist()
                              if has_parent else [])
                sub_dict = {NODE: region_dict, PARENT_IDS: parent_ids}
                id_dict[region_id] = sub_dict
            
            if has_parent:
                # fill children with references to each child, which should
                # each include references until end nodes
                for region_id in ids:
                    # IDs of rows whose parent column equals this region
                    children = df.loc[
                        df[config.AtlasMetrics.PARENT.value] == region_id,
                        config.ABAKeys.ABA_ID.value]
                    for child in children:
                        id_dict[region_id][NODE][
                            config.ABAKeys.CHILDREN.value].append(
                                id_dict[child][NODE])
                    
        except KeyError as e:
            raise KeyError(f"Could not find this column in the labels reference "
                           f"file: {e}")
        return id_dict



[docs]
    def get_ref_lookup_as_df(self) -> Optional[pd.DataFrame]:
        """Convert the reference lookup dict to a data frame.
        
        Returns:
            :attr:`ref_lookup` converted to a data frame with columns for
            the ID, name, level, acronym, and parent IDs. Returns the
            object as-is if it is already a data frame, or None if no
            lookup has been set.

        """
        lookup = self.ref_lookup
        if lookup is None or isinstance(lookup, pd.DataFrame):
            # nothing to convert
            return lookup
        
        id_col = config.ABAKeys.ABA_ID.value
        node_cols = (
            config.ABAKeys.NAME.value,
            config.ABAKeys.LEVEL.value,
            config.ABAKeys.ACRONYM.value,
        )
        
        # accumulate column name -> list of values, one value per label
        columns = {}
        for region_id, entry in lookup.items():
            node = entry[NODE]
            cells = [(id_col, region_id)]
            cells.extend(
                (col, node.get(col) if node else None) for col in node_cols)
            cells.append((PARENT_IDS, entry.get(PARENT_IDS)))
            for col, cell in cells:
                columns.setdefault(col, []).append(cell)
        return df_io.dict_to_data_frame(columns)

    

[docs]
    def create_ref_lookup(
            self, labels_ref: Optional[Union[pd.DataFrame, Dict]] = None
    ) -> Dict[int, Any]:
        """Create a reference lookup from a data frame or dictionary.
    
        The result is stored in :attr:`ref_lookup`.
    
        Args:
            labels_ref: Reference dictionary or data frame, typically loaded
                from :meth:`load_labels_ref`. Defaults to None, in which
                case :attr:`loaded_ref` is used.
    
        Returns:
            Ordered dictionary for looking up by ID.
    
        """
        source = self.loaded_ref if labels_ref is None else labels_ref
        # data frames come from CSV files; anything else is treated as a
        # dict parsed from an ABA JSON file
        build = (self.create_lookup_pd if isinstance(source, pd.DataFrame)
                 else self.create_aba_reverse_lookup)
        self.ref_lookup = build(source)
        return self.ref_lookup

    

[docs]
    def load(self):
        """Load the labels reference file and build its lookup dictionary.
        
        Loads the file from :attr:`path_ref` to :attr:`loaded_ref` and
        creates a lookup dictionary stored in :attr:`ref_lookup`. Loading
        and lookup errors are logged at debug level rather than raised.
        
        Returns:
            This instance for chained calls.
        
        """
        try:
            self.load_labels_ref()
            if self.loaded_ref is None:
                # nothing was loaded, so there is nothing to index
                return self
            self.create_ref_lookup()
        except (FileNotFoundError, KeyError) as err:
            _logger.debug(err)
        return self





[docs]
def convert_itksnap_to_df(path: str):
    """Read an ITK-SNAP labels description file into a data frame.
    
    The data frame can be saved as a CSV file readable by MagellanMapper.

    Args:
        path: Path to description file.

    Returns:
        Pandas data frame of the description file, with column names
        taken from :class:`config.ItkSnapLabels`.
    
    """
    # headers are not in the file itself
    col_names = [col.value for col in config.ItkSnapLabels]
    # treat runs of whitespace as separators and skip "#" comments
    return pd.read_csv(path, sep=r"\s+", comment="#", names=col_names)



def _get_children(labels_ref_lookup, label_id, children_all=None):
    """Recursively get the children of a given non-negative atlas ID.
    
    Used as a helper function to :func:``get_children_from_id``.
    
    Args:
        labels_ref_lookup: The labels reference lookup, assumed to be 
            generated by :func:`create_reverse_lookup` to look up by ID.
        label_id: ID of the label to find, assumed to be >= 0 since 
            IDs in ``labels_ref_lookup`` are generally non-negative.
        children_all: List of all children of this ID, extended in-place
            during recursion; defaults to None to start a new empty list
            on each call. To include the ID itself, pass in a list with
            this ID alone.
    
    Returns:
        A list of all children of the given ID, in order from highest 
        (numerically lowest) level to lowest.
    """
    if children_all is None:
        # create a fresh list per call rather than sharing a mutable
        # default, which would accumulate IDs across unrelated calls
        children_all = []
    label = labels_ref_lookup.get(label_id)
    if label:
        # recursively gather the children of the label, depth-first
        children = label[NODE][config.ABAKeys.CHILDREN.value]
        for child in children:
            child_id = child[config.ABAKeys.ABA_ID.value]
            children_all.append(child_id)
            _get_children(labels_ref_lookup, child_id, children_all)
    return children_all


def _mirror_label_ids(
        label_ids: Union[int, Sequence[int]], combine: bool = False
) -> Union[int, Sequence[int]]:
    """Get the mirrored counterpart(s) of label IDs.
    
    A "mirrored" ID is taken to be the negative of the given ID.
    
    Args:
        label_ids: Single ID or sequence of IDs.
        combine: True to return a list of ``label_ids`` followed by their
            mirrored IDs. Defaults to False, where only the mirrored IDs
            are returned.

    Returns:
        A single mirrored ID if ``label_ids`` is one ID and ``combine`` is
        False, or a list of IDs.

    """
    is_multi = libmag.is_seq(label_ids)
    if is_multi:
        flipped = [-1 * val for val in label_ids]
    else:
        flipped = -1 * label_ids
    
    if not combine:
        return flipped
    if is_multi:
        # original IDs first, then their mirrored IDs
        return [*label_ids, *flipped]
    return [label_ids, flipped]



[docs]
def get_children_from_id(labels_ref_lookup, label_id, incl_parent=True, 
                         both_sides=False):
    """Get all descendants of a given atlas ID.
    
    Args:
        labels_ref_lookup: The labels reference lookup, assumed to be 
            generated by :func:`create_reverse_lookup` to look up by ID.
        label_id: ID of the label to find, which can be negative.
        incl_parent: True to put ``label_id`` itself at the start of the
            output; defaults to True.
        both_sides: True to include both sides, ie the positive followed
            by the negative values of each ID. Defaults to False.
    
    Returns:
        A list of all children of the given ID, in order from highest 
        (numerically lowest) level to lowest. If ``label_id`` is negative
        and ``both_sides`` is False, all returned IDs are negated.
    """
    # the lookup is keyed by non-negative IDs
    base_id = abs(label_id)
    seed = [base_id] if incl_parent else []
    found = _get_children(labels_ref_lookup, base_id, seed)
    if both_sides:
        found.extend(_mirror_label_ids(found))
        return found
    if label_id < 0:
        return _mirror_label_ids(found)
    return found




[docs]
def get_children_from_id_df(
        df: pd.DataFrame,
        label_id: Union[int, Sequence[int]],
        label_col: str,
        parent_col: str,
        incl_parent: bool = True,
        ids: Optional[List[int]] = None
) -> List[int]:
    """Get the children of a given atlas ID from a data frame.
    
    Args:
        df: Data frame, which must include a column of label IDs and another
            column of the immediate parent ID for each label.
        label_id: ID or sequence of IDs whose children will be returned.
            The sequence is not modified.
        label_col: Name of label ID column.
        parent_col: Name of immediate parent ID column.
        incl_parent: True to include ``label_id`` in the output.
        ids: List of children, only for recursion.

    Returns:
        List of children, including parent(s) unless ``incl_parent`` is False.

    """
    if not libmag.is_seq(label_id):
        # convert to sequence of IDs
        label_id = [label_id]
    
    # get all immediate children, assuming parent col contains immediate parents
    children = df.loc[df[parent_col].isin(label_id), label_col]
    children = children.unique().tolist()
    
    if ids is None:
        # initialize output with a copy so that extending it neither mutates
        # the caller's sequence nor fails for tuples and arrays
        ids = list(label_id) if incl_parent else []
    
    if len(children) > 0:
        # recursively get children of children
        ids.extend(children)
        return get_children_from_id_df(
            df, children, label_col, parent_col, incl_parent, ids)
    
    return ids




[docs]
def labels_to_parent(labels_ref_lookup, level=None,
                     allow_parent_same_level=False):
    """Generate a dictionary mapping label IDs to parent IDs at a given level.
    
    Parents are considered to be "below" (numerically lower level) their
    children, or at least at the same level if ``allow_parent_same_level``
    is True.
    
    Args:
        labels_ref_lookup (dict): The labels reference lookup, assumed to be an
            OrderedDict generated by :func:`ontology.create_reverse_lookup` 
            to look up by ID while preserving key order to ensure that 
            parents of any child will be reached prior to the child.
        level (int): Level at which to find parent for each label; defaults to
            None to get the parent immediately below the given label.
        allow_parent_same_level (bool): True to allow selecting a parent at
            the same level as the label; False to require the parent to be
            at least one level below. Defaults to False.
    
    Returns:
        dict: Dictionary of label IDs to parent IDs at the given level. Labels
        at the given level will be assigned to their own ID, and labels below
        or without a parent at the level will be given a default parent ID
        of 0.
    
    """
    # similar to volumes_dict_level_grouping but without checking for neg 
    # keys or grouping values
    label_parents = {}
    for label_id, label in labels_ref_lookup.items():
        parent_at_level = 0
        
        # find ancestor above (numerically below) label's level
        label_level = label[NODE][config.ABAKeys.LEVEL.value]
        target_level = label_level - 1 if level is None else level
        if label_level == target_level:
            # use label's own ID if at target level
            parent_at_level = label_id
        elif label_level > target_level:
            parents = label.get(PARENT_IDS)
            if parents:
                # walk from the nearest ancestor outward, assuming that
                # parents are ordered by decreasing (numerically higher) level
                for parent in parents[::-1]:
                    if parent not in labels_ref_lookup:
                        # stop at the first ancestor missing from the lookup
                        break
                    parent_level = labels_ref_lookup[
                        parent][NODE][config.ABAKeys.LEVEL.value]
                    if (parent_level <= target_level
                            or allow_parent_same_level
                            and parent_level == label_level):
                        # use first parent below (or at least at) target level
                        parent_at_level = parent
                        break
            else:
                print("No parents at level", label_level, "for label", label_id)
        
        parent_ref = label[NODE].get(config.ABAKeys.PARENT_ID.value)
        if parent_ref is None:
            parent_ref = label[NODE].get(config.AtlasMetrics.PARENT.value)
        if parent_ref != parent_at_level:
            # report discrepancies between parent listed in ontology file
            # and derived from parsed parent IDs; compared explicitly rather
            # than by ``assert`` so the check also runs with ``python -O``
            _logger.debug(
                "Parent '%s' at level %s or lower for label %s does not match "
                "parent listed in reference file, '%s'",
                parent_at_level, target_level, label_id, parent_ref)
        label_parents[label_id] = parent_at_level
    return label_parents




[docs]
def make_labels_level(
        labels_np: np.ndarray, ref: "LabelsRef", level: int,
        fn_prog: Optional[Callable[[int, str], None]] = None) -> np.ndarray:
    """Remap a labels image to the given ontology level.
    
    Each label at ``level``, together with all of its descendants, is
    replaced by that label's ID. Both the positive and negative forms of
    each ID are processed.
    
    Args:
        labels_np: Labels image.
        ref: Atlas labels reference, whose ``ref_lookup`` is used.
        level: Level at which ``labels_np`` will be remapped.
        fn_prog: Function to update progress. Takes an integer as a progress
            percentage and a string as a message. Defaults to None.

    Returns:
        The remapped ``labels_np``, which will be altered in-place.

    """
    lookup = ref.ref_lookup
    lookup_ids = list(lookup.keys())
    total = len(lookup_ids)
    level_key = config.ABAKeys.LEVEL.value
    for idx, base_id in enumerate(lookup_ids):
        if base_id == 0:
            # 0 has no mirrored counterpart and is skipped
            continue
        if lookup[abs(base_id)][NODE][level_key] != level:
            # only labels at the target level absorb their descendants
            continue
        
        # handle the label on both sides of the atlas
        for region in (base_id, -1 * base_id):
            # descendants, with the label itself first
            member_ids = get_children_from_id(lookup, region)
            mask = np.isin(labels_np, member_ids)
            if fn_prog is not None:
                # update progress
                fn_prog(
                    int(idx / total * 100),
                    f"Replacing labels within {region}")
            labels_np[mask] = region
    
    return labels_np




[docs]
def get_label_item(label, item_key, key=NODE):
    """Retrieve an item from a sub-dictionary of a label.

    Args:
        label (dict): The label dictionary, assumed to be a nested
            dictionary; can be None.
        item_key (str): Key for item to retrieve from within ``label[key]``.
        key (str): First level key; defaults to :const:`NODE`.

    Returns:
        The label item, or None if the label or sub-dictionary is None or
        a key is not found, in which case the missing key is printed.
    """
    if label is None:
        return None
    try:
        inner = label[key]
        if inner is not None:
            return inner[item_key]
    except KeyError as err:
        print(err, item_key)
    return None




[docs]
def get_label_name(
        label: Dict[str, Any], side: bool = False,
        aba_key: Optional["config.ABAKeys"] = None):
    """Get the atlas region name, or other metadata, from the label.
    
    Args:
        label: The label dictionary; can be None.
        side: True to append a side suffix based on the label's
            :const:`MIRRORED` entry; defaults to False.
        aba_key: ABA enum to get from ``label``; defaults to None, in which
            case the name will be retrieved.
    
    Returns:
        The atlas region name, or None if not found. If only the mirrored
        entry is missing, the name is returned without a suffix.
    """
    # default to the full label name
    field = aba_key if aba_key else config.ABAKeys.NAME
    
    name = None
    try:
        node = None if label is None else label[NODE]
        if node is not None:
            # get selected metadata
            name = node[field.value]
            if side:
                # mirrored labels are marked as left, others as right
                name += LEFT_SUFFIX if label[MIRRORED] else RIGHT_SUFFIX
    except KeyError as err:
        _logger.debug("Error getting label name: %s, %s", err, name)
    return name




[docs]
def get_label_side(label_id):
    """Convert label IDs into a side string.

    The convention used here is that positive values = right, negative
    values = left.

    TODO: consider making pos/neg side correspondence configurable.
    
    Args:
        label_id (int, List[int]): Label ID or sequence of IDs to convert,
            where all positive labels are considered right, all negative
            are left, and any mix of pos, neg, or zero are both.

    Returns:
        :str: Value of corresponding :class:`config.HemSides` enum.

    """
    if np.greater(label_id, 0).all():
        return config.HemSides.RIGHT.value
    if np.less(label_id, 0).all():
        return config.HemSides.LEFT.value
    # mixed signs or zeros
    return config.HemSides.BOTH.value




[docs]
def scale_coords(
        coord: Sequence[int],
        scaling: Optional[Sequence[int]] = None,
        clip_shape: Optional[Sequence[int]] = None) -> np.ndarray:
    """Scale coordinates and convert their spatial columns to integers.
    
    The input is never modified; a new array is always returned.
    
    Args:
        coord: Coordinates of experiment image in
            ``z,y,x,...`` order. Can be an ``[n, >=3]`` array of coordinates
            or any sequence convertible to an array.
        scaling: Scaling factor for the labels image size compared with
            the experiment image as ``z,y,x,...``; defaults to None.
        clip_shape: Max image shape as ``z,y,x``, used to
            round coordinates for extra precision. For simplicity, scaled
            values are simply truncated to int. Repeated scaling such as
            upsampling after downsampling can lead to errors. If this
            parameter is given, values will instead be rounded to minimize
            errors while giving ints. Rounded values will be clipped to a
            max of this shape minus 1 to stay within bounds.
    
    Returns:
        A scaled array of the same shape as ``coord``. If the array
        contains a max of 3 coordinates columns, the array is cast
        to int. If not, the first 3 columns are converted to integer
        values, but the array keeps its own type, eg float after scaling.
    
    """
    _logger.debug(
        "Getting label IDs from coordinates using scaling: %s", scaling)
    if scaling is None:
        # copy into an array so that plain sequences can be indexed and the
        # caller's coordinates are not overwritten below
        coord_scaled = np.array(coord)
    else:
        # scale coordinates to atlas image size
        coord_scaled = np.multiply(coord, scaling)
    
    # cast coordinates to int
    coords_only = coord_scaled[..., :3]
    if clip_shape is not None:
        # round when extra precision is necessary, such as during reverse 
        # scaling, which requires clipping so coordinates don't exceed labels 
        # image shape
        coords_only = np.around(coords_only).astype(int)
        coords_only = np.clip(
            coords_only, None, np.subtract(clip_shape, 1))
    else:
        # typically don't round to stay within bounds
        coords_only = coords_only.astype(int)
    if coord_scaled.shape[-1] <= 3:
        # assume coords are spatial dimensions
        coord_scaled = coords_only
    else:
        # allow float for additional dimensions, such as radius
        coord_scaled[..., :coords_only.shape[-1]] = coords_only
    
    return coord_scaled




[docs]
def get_label_ids_from_position(coord_scaled, labels_img):
    """Look up the atlas label IDs at the given coordinates.

    Args:
        coord_scaled (:class:`numpy.ndarray`): 2D array of coordinates in
            ``[[z,y,x], ...]`` format, or a single row as a 1D array.
        labels_img (:class:`numpy.ndarray`): Labeled image from which to
            extract labels at coordinates in ``coord_scaled``.

    Returns:
        :class:`numpy.ndarray`: An array of label IDs corresponding to
        ``coord_scaled``, or a scalar of one ID if only one coordinate is
        given.
    
    """
    # convert coordinates to a form usable for int array indexing, then
    # index into the labels image and take the first element of the result
    index = tuple(libmag.coords_for_indexing(coord_scaled))
    return labels_img[index][0]




[docs]
def get_label(
        coord: Sequence[int], labels_img: np.ndarray,
        labels_lookup: Dict[int, Dict], scaling: Optional[Sequence[int]] = None,
        level: Optional[int] = None, rounding: bool = False
) -> Optional[Dict[str, Any]]:
    """Get the atlas label at the given coordinates.
    
    Args:
        coord: Coordinates of experiment image in (z, y, x) order.
        labels_img: The registered image whose intensity values correspond to 
            label IDs.
        labels_lookup: The labels reference lookup, passed to
            :meth:`get_label_at_level`.
        scaling: Scaling factor for the labels image size compared with the 
            experiment image; defaults to None.
        level: The ontology level as an integer to target; defaults to None.
        rounding: True to round coordinates after scaling by passing the
            shape of ``labels_img`` to :func:`scale_coords`; defaults to
            False.
    
    Returns:
        The label dictionary at those coordinates, or None if no label is 
        found.
    
    """
    # the image shape is only needed as clipping bounds when rounding
    clip_shape = labels_img.shape if rounding else None
    scaled = scale_coords(coord, scaling, clip_shape)
    found_id = get_label_ids_from_position(scaled, labels_img)
    return get_label_at_level(found_id, labels_lookup, level)




[docs]
def get_label_at_level(
        label_id: Union[int, Sequence[int]], labels_lookup: Dict[int, Dict],
        level: Optional[int] = None) -> Optional[Dict[str, Any]]:
    """Get atlas label at the given level.
    
    A negative ``label_id`` is treated as mirrored: it is looked up by its
    absolute value, and the mirrored state is recorded in the returned label.
    
    Args:
        label_id: Label ID. Although the annotation also admits a sequence,
            the sign test and dictionary lookup here operate on a single ID.
        labels_lookup: The labels reference lookup, assumed to be generated by 
            :func:`ontology.create_reverse_lookup` to look up by ID.
        level: The ontology level as an integer to target; defaults to None. 
            If None, level will be ignored, and the label exactly matching
            the given ID will be returned. If a level is given and the
            matching label is at a finer (numerically higher) level, the
            first of its parents whose level equals ``level`` is returned
            instead. A matching label already at or above ``level`` is
            returned as is.

    Returns:
        The label dictionary for the ID, or None if the ID or one of its
        parents is missing from ``labels_lookup`` or no parent is at
        ``level``. The dictionary is the entry stored in ``labels_lookup``
        itself; its :const:`MIRRORED` key is set in-place to whether
        ``label_id`` was negative.

    """
    # TODO: check if can merge with make_labels_level
    mirrored = label_id < 0
    if mirrored:
        # look up by the absolute ID; the sign is only kept in ``mirrored``
        label_id = -1 * label_id
    level_key = config.ABAKeys.LEVEL.value
    label = None
    try:
        label = labels_lookup[label_id]
        if level is not None and label[NODE][level_key] > level:
            # search for parent at "higher" (numerically lower) level 
            # that matches the target level; the ID is already non-negative 
            # here, so parent IDs are used as stored
            parents = label[PARENT_IDS]
            label = None
            for parent in parents:
                parent_label = labels_lookup[parent]
                if parent_label[NODE][level_key] == level:
                    label = parent_label
                    break
        if label is None:
            _logger.debug(
                "Label %s present but at finer level than %s", label_id, level)
        else:
            label[MIRRORED] = mirrored
    except KeyError:
        _logger.debug("Could not find label id %s or its parent", label_id)
    return label




[docs]
def get_region_middle(
        labels_ref_lookup: Dict[int, Dict], label_id: Union[int, Sequence[int]],
        labels_img: np.ndarray, scaling: Optional[Sequence[int]] = None,
        both_sides: Union[bool, Sequence[bool]] = False,
        incl_children: bool = True
) -> Tuple[Optional[Sequence[int]], Optional[np.ndarray],
           Optional[Sequence[int]]]:
    """Approximate the middle position of a region by taking the middle 
    value of its sorted list of coordinates.
    
    The region's coordinate sorting prioritizes z, followed by y, etc, meaning
    that the middle value will be closest to the middle of z but may fall
    slightly away from midline in the other axes if this z does not
    contain y/x's around midline. Getting the coordinate at the middle
    of this list rather than another coordinate midway between other values
    in the region ensures that the returned coordinate will reside within
    the region itself, including non-contiguous regions that may be
    intermixed with coordinates not part of the region.
    
    Args:
        labels_ref_lookup: The labels reference lookup,
            assumed to be generated by :func:`ontology.create_reverse_lookup`
            to look up by ID.
        label_id: ID of the label to find, or sequence of IDs.
        labels_img: The registered image whose intensity
            values correspond to label IDs.
        scaling: Scaling factors as a Numpy array in z,y,x
            for the labels image size compared with the experiment image.
            If given, the middle coordinate is divided by these factors
            and rounded to integers.
        both_sides: True to include both sides, or
            sequence of booleans corresponding to ``label_id``; defaults
            to False. A single boolean applies to every ID in ``label_id``.
        incl_children: True to include children of ``label_id``,
            False to include only ``label_id``; defaults to True.
    
    Returns:
        Tuple of ``coord``, the middle value of a list of all coordinates in
        the region at the given ID, or None if no coordinate in
        ``labels_img`` belongs to the region; ``img_region``, a boolean mask
        of the region within ``labels_img``; and ``region_ids``, a list of
        the IDs included in the region. If ``labels_ref_lookup`` is None or
        empty, all values are None.
    
    """
    if not labels_ref_lookup:
        return None, None, None
    
    # gather IDs for label, including children and opposite sides
    if not libmag.is_seq(label_id):
        label_id = [label_id]
    if not libmag.is_seq(both_sides):
        # apply a single flag to every ID; pairing a one-element list with
        # several IDs would make ``zip`` drop all IDs after the first
        both_sides = [both_sides] * len(label_id)
    region_ids = []
    for region_id, both in zip(label_id, both_sides):
        if incl_children:
            # add children of the label +/- both sides
            region_ids.extend(get_children_from_id(
                labels_ref_lookup, region_id, incl_parent=True,
                both_sides=both))
        else:
            # add the label +/- its mirrored version
            region_ids.append(region_id)
            if both:
                region_ids.append(_mirror_label_ids(region_id))
    
    # get a list of all the region's coordinates to sort
    img_region = np.isin(labels_img, region_ids)
    region_coords = np.where(img_region)
    
    def get_middle(coords):
        # recursively get value at middle of list for each axis
        sort_ind = np.lexsort(coords[::-1])  # last axis is primary key
        num_coords = len(sort_ind)
        if num_coords == 0:
            # region has no coordinates in the image
            return None
        mid = coords[0][sort_ind[num_coords // 2]]
        if len(coords) == 1:
            return (mid, )
        # keep only coordinates in the chosen plane and shift to the next
        # axis so the final coordinate is itself part of the region
        mask = coords[0] == mid
        return (mid, *get_middle(tuple(c[mask] for c in coords[1:])))
    
    coord = get_middle(region_coords)
    if scaling is not None and coord is not None:
        coord = tuple(np.around(np.divide(coord, scaling)).astype(int))
    return coord, img_region, region_ids




[docs]
def rel_to_abs_ages(rel_ages, gestation=19):
    """Map stage-relative age names to absolute ages in days.
    
    Args:
        rel_ages (List[str]): Sequence of strings in the format, 
            ``[stage][relative_age_in_days]``, where stage
            is either "E" = "embryonic" or "P" = "postnatal", such as 
            "E3.5" for 3.5 days after conception, or "P10" for 10 days 
            after birth. The stage letter is matched case-insensitively.
        gestation (int): Number of days from conception until birth,
            added to postnatal ages; defaults to 19.

    Returns:
        Dictionary of ``{name: age_in_days}``, keyed by the original
        strings in ``rel_ages``.

    """
    def to_days(name):
        # everything after the stage letter is the relative age
        days = float(name[1:])
        # only postnatal ages are offset by the gestation period
        return days + gestation if name[0].lower() == "p" else days
    
    return {name: to_days(name) for name in rel_ages}




[docs]
def replace_labels(labels_img, df, clear=False, ref=None, combine_sides=False):
    """Convert label values in an image according to a mapping data frame.
    
    Each unique target label in ``df`` is processed in turn, converting all
    of its source labels to the target.
    
    Args:
        labels_img (:class:`numpy.ndarray`): Labels image array whose values
            will be converted in-place.
        df (:class:`pandas.DataFrame`): Pandas data frame with from and to
            columns specified by :class:`LabelColumns` values.
        clear (bool): True to set all values to 0 before converting, in
            which case source labels are matched against a copy of the
            original image. If False, labels are matched against the image
            as it is being modified.
        ref (dict): Dictionary to get all children from each label through
            :func:`get_children_from_id`; defaults to None to convert only
            the labels listed in ``df``.
        combine_sides (bool): True to combine sides by converting both
            positive labels and their corresponding negative label;
            only used when ``ref`` is given. Defaults to False.

    Returns:
        :class:`numpy.ndarray`: ``labels_img`` with values replaced in-place.

    """
    if clear:
        # match against an untouched copy since the output is zeroed first
        lookup_img = np.copy(labels_img)
        labels_img[:] = 0
    else:
        # read from and write to the same array
        lookup_img = labels_img
    
    sources = df[LabelColumns.FROM_LABEL.value]
    targets = df[LabelColumns.TO_LABEL.value]
    for target in targets.unique():
        # collect every source label mapped to this target
        matched = sources.loc[targets == target]
        if ref:
            # expand each source label through the reference
            ids = [
                child for src in matched
                for child in get_children_from_id(
                    ref, src, both_sides=combine_sides)]
        else:
            ids = matched.values
        print("Converting labels from {} to {}".format(ids, target))
        labels_img[np.isin(lookup_img, ids)] = target
    print("Converted image labels:", np.unique(labels_img))
    return labels_img