add things inside things functionality

Code transferred from PR#29 (#29) - updated notebooks - changed 'mean' to 'average' as input for make_summary_table function - updated tests
haesleinhuepf · Feb 1, 2023 · c1e0aaa · c1e0aaa
1 parent e3ec0fd
commit c1e0aaa
Show file tree

Hide file tree

Showing 14 changed files with 3,628 additions and 3 deletions.
diff --git a/data/BBBC007_reference.txt b/data/BBBC007_reference.txt
@@ -0,0 +1,2 @@
+"We used image set BBBC007v1 image set version 1 (Jones et al., Proc. ICCV Workshop on Computer Vision for Biomedical Image Applications, 2005), available from the Broad Bioimage Benchmark Collection [Ljosa et al., Nature Methods, 2012]."
+The images "17P1_POS0006_D_1UL.tif" and "17P1_POS0006_F_2UL.tif" were cropped (square 220px large with upper-left corner positioned at [80px, 150px] [x, y]) and converted from RGB to 16bit depth.
diff --git a/data/actin.tif b/data/actin.tif
diff --git a/data/cell_labels.tif b/data/cell_labels.tif
diff --git a/data/dna.tif b/data/dna.tif
diff --git a/data/dna_labels.tif b/data/dna_labels.tif
diff --git a/demo/intersection_over_target_area_explained.ipynb b/demo/intersection_over_target_area_explained.ipynb
diff --git a/demo/napari_regionprops_map_channels_functions.ipynb b/demo/napari_regionprops_map_channels_functions.ipynb
diff --git a/demo/napari_regionprops_map_channels_plugin.ipynb b/demo/napari_regionprops_map_channels_plugin.ipynb
diff --git a/napari_skimage_regionprops/__init__.py b/napari_skimage_regionprops/__init__.py
@@ -1,5 +1,9 @@
 from ._table import add_table, get_table, TableWidget
 from ._regionprops import regionprops, regionprops_table, regionprops_table_all_frames
+from ._multichannel import link_two_label_images, measure_labels, measure_labels_with_intensity
+from ._multichannel import measure_labels_in_labels_with_intensity, measure_labels_in_labels
+from ._multichannel import regionprops_measure_things_inside_things
+from ._process_tables import merge_measurements_to_reference, make_summary_table
 from ._parametric_images import visualize_measurement_on_labels, relabel
 from ._measure_points import measure_points
 from napari_plugin_engine import napari_hook_implementation

diff --git a/napari_skimage_regionprops/_multichannel.py b/napari_skimage_regionprops/_multichannel.py
diff --git a/napari_skimage_regionprops/_process_tables.py b/napari_skimage_regionprops/_process_tables.py
@@ -0,0 +1,223 @@
+import pandas
+from typing import List
+
+
+def merge_measurements_to_reference(
+        table_reference_labels_properties: "pandas.DataFrame",
+        table_linking_labels: List["pandas.DataFrame"],
+        table_labels_to_measure_properties: List["pandas.DataFrame"],
+        suffixes=None) -> List["pandas.DataFrame"]:
+    """
+    Merge measurements from target to reference table through a linking table.
+
+    The input tables are left untouched: suffixed copies of them are merged,
+    so the function can be called repeatedly with the same tables.
+
+    Parameters
+    ----------
+    table_reference_labels_properties : pandas.DataFrame
+        a table to be used as a reference with a column 'label' and other
+        columns with features.
+    table_linking_labels : List["pandas.DataFrame"]
+        a table or a list of tables. Each table should contain 2 columns, a
+        'label_reference' and a 'label_target'. Each table row associates a
+        target label to a reference label.
+    table_labels_to_measure_properties : List["pandas.DataFrame"]
+        a table or a list of tables to be used as targets with a column
+        'label' and other columns with features. There must be one table per
+        linking table, in the same order.
+    suffixes : List[str], optional
+        list of strings containing suffixes to be added to the output table
+        columns. The first suffix is used for the reference table, the
+        following ones for the target tables, hence its length must be the
+        number of target tables plus one. If None (default), '_reference'
+        and increasing (zero-padded) numbers are used as suffixes.
+
+    Returns
+    -------
+    List[pandas.DataFrame]
+        a list of relationship tables, which associate each target label (with
+        its properties) to a reference label (with its properties).
+
+    Raises
+    ------
+    ValueError
+        if the number of linking tables differs from the number of target
+        tables, or if `suffixes` does not contain exactly one entry more than
+        the number of target tables.
+    """
+    import pandas as pd
+
+    def _as_table_list(tables):
+        # A single table is accepted wherever a list of tables is expected
+        if isinstance(tables, pd.DataFrame):
+            return [tables]
+        return list(tables)
+
+    linking_tables = _as_table_list(table_linking_labels)
+    measurement_tables = _as_table_list(table_labels_to_measure_properties)
+    n_measurement_tables = len(measurement_tables)
+    if len(linking_tables) != n_measurement_tables:
+        raise ValueError(
+            'The number of linking tables must match the number of tables '
+            'containing measurements')
+
+    # Build default suffixes or check if provided suffixes match data size
+    if suffixes is None:
+        # Pad numbers with zeros so that all numeric suffixes share the width
+        # of the largest one (e.g. '_01' ... '_12')
+        width = len(str(n_measurement_tables))
+        suffixes = ['_reference'] + ['_' + str(i + 1).zfill(width)
+                                     for i in range(n_measurement_tables)]
+    elif len(suffixes) != n_measurement_tables + 1:
+        raise ValueError(
+            'List of suffixes must contain one suffix for the reference '
+            'table plus one suffix per table containing measurements')
+
+    reference_suffix = suffixes[0]
+    reference_label = 'label' + reference_suffix
+    # add_suffix returns a new table, the caller's table keeps its columns
+    reference_table = table_reference_labels_properties.add_suffix(
+        reference_suffix)
+
+    output_table_list = []
+    # Consecutively merge each linking table and the matching table with
+    # properties from another channel to the reference table
+    for target_suffix, linking_table, measurement_table in zip(
+            suffixes[1:], linking_tables, measurement_tables):
+        target_label = 'label' + target_suffix
+        # Renamed copies; the tables handed in by the caller stay unchanged
+        linking_table = linking_table.rename(
+            columns={'label_reference': reference_label,
+                     'label_target': target_label})
+        measurement_table = measurement_table.add_suffix(target_suffix)
+
+        # Merge other labels to label_reference
+        output_table = pd.merge(reference_table, linking_table,
+                                how='outer', on=reference_label)
+        # Fill NaN labels with zeros (if labels were not linked, they belong
+        # to background)
+        output_table[target_label] = output_table[target_label].fillna(0)
+        # Merge other properties to output table based on new labels column
+        output_table = pd.merge(output_table, measurement_table,
+                                how='outer', on=target_label)
+        # Ensure label columns type to be integer
+        for column in output_table.columns:
+            if column.startswith('label'):
+                output_table[column] = output_table[column].astype(int)
+        # Append output table to list (each table may have different shapes)
+        output_table_list.append(output_table)
+    return output_table_list
+
+
+def count_non_zeros(df):
+    """
+    Count the non-zero entries of each column of a table.
+
+    Parameters
+    ----------
+    df : pandas.DataFrame
+        table whose columns are counted.
+
+    Returns
+    -------
+    pandas.DataFrame
+        a table with a single row and the same columns as `df`, holding the
+        result of `numpy.count_nonzero` along the rows for each column.
+    """
+    import numpy as np
+    import pandas as pd
+    nonzero_per_column = np.count_nonzero(df, axis=0)
+    # Add a leading axis so that the counts form one table row
+    single_row = nonzero_per_column[np.newaxis, :]
+    return pd.DataFrame(data=single_row, columns=df.columns)
+
+
+def make_summary_table(table: List["pandas.DataFrame"],
+                       suffixes=None,
+                       statistics_list=['count',]) -> "pandas.DataFrame":
+    """
+    Calculate summary statistics of a list of relationship tables.
+
+    For each relationship table, which relates target labels and its properties
+    to reference labels (and its properties), calculate summary statistics
+    defined by `statistics_list` and concatenates outputs to the right as new
+    columns.
+
+    Parameters
+    ----------
+    table : List[pandas.DataFrame]
+        a relationship table or a list of them.
+    suffixes : List[str], optional
+        list of strings containing suffixes of the table columns. The first
+        one identifies the reference columns, the following ones the target
+        columns of each table. If None (default), it looks for strings after
+        'label' in columns named 'label_<suffix>' and uses them as suffixes.
+    statistics_list : List[str], optional
+        list of strings determining summary statistics to be calculated.
+        Possible entries are 'count', 'average' (or 'mean'), 'std', 'min',
+        '25%', '50%', '75%', 'max'. The percentages correspond to
+        percentiles. 'count' yields a column 'counts' + suffix with the
+        number of non-zero target labels per reference label. Other entries
+        select the matching `pandas` describe statistic (the mean is always
+        reported as 'average'); unknown entries are ignored. The list is not
+        modified.
+
+    Returns
+    -------
+    pandas.DataFrame
+        a table containing summary statistics.
+
+    Raises
+    ------
+    ValueError
+        if no table is given, if suffixes cannot be inferred from the column
+        names, or if fewer than two suffixes are available.
+    """
+    import re
+    import pandas as pd
+
+    # Accept a single relationship table. This has to happen before the
+    # suffixes are inferred, because the inference iterates over the tables.
+    if isinstance(table, pd.DataFrame):
+        table = [table]
+    if len(table) == 0:
+        raise ValueError('At least one relationship table is required')
+
+    # If not provided, guess suffixes from the label column names
+    if suffixes is None:
+        suffixes = []
+        # capture '_<suffix>' from columns named 'label_<suffix>'
+        pattern = re.compile(r'label(_\w+)$')
+        for tab in table:
+            for name in tab.columns:
+                matches = pattern.match(name)
+                if matches is not None and matches.group(1) not in suffixes:
+                    suffixes.append(matches.group(1))
+        if len(suffixes) == 0:
+            raise ValueError('Could not infer suffixes from column names. '
+                             'Please provide a list of suffixes identifying '
+                             'different channels')
+    if len(suffixes) < 2:
+        raise ValueError('At least two suffixes are required: one for the '
+                         'reference labels and one per relationship table')
+
+    # Normalise the requested statistics on a private list, so that neither
+    # the caller's list nor the shared default argument is ever modified.
+    # 'average' is renamed to 'mean' to match pandas describe function.
+    requested = []
+    for stat in statistics_list:
+        stat = 'mean' if stat == 'average' else stat
+        if stat not in requested:
+            requested.append(stat)
+    # 'count' is handled separately (non-zero target labels), not by describe
+    counts = 'count' in requested
+    if counts:
+        requested.remove('count')
+
+    reference_label = 'label' + suffixes[0]
+
+    # To do (improve performance): calculate only desired statistics
+    # currently using .describe() and removing the ones which were not asked
+    summary_table_list = []
+    for tab, suf in zip(table, suffixes[1:]):
+        grouped = tab.groupby(reference_label)
+        # Measurements of the target: neither reference nor label columns
+        probe_measurement_columns = [
+            name for name in tab.columns
+            if not name.endswith(suffixes[0])
+            and not name.startswith('label')]
+        summary_tab = grouped[probe_measurement_columns]\
+            .describe().reset_index()
+
+        # Filter by selected statistics (columns are (feature, statistic))
+        selected_columns = [(reference_label, '')]
+        for stat in requested:
+            selected_columns.extend(column for column in summary_tab.columns
+                                    if column[-1] == stat)
+        summary_tab = summary_tab.loc[:, selected_columns]
+        # rename back mean to average
+        summary_tab = summary_tab.rename(columns={'mean': 'average'}, level=1)
+
+        if counts:
+            # number of non-zero [label + suf] elements per reference label,
+            # in the same (sorted) group order as the describe output
+            counts_column = (tab['label' + suf] != 0).groupby(
+                tab[reference_label]).sum().to_numpy()
+            # insert 'counts' just before the first feature of this suffix,
+            # or append it if no feature column was selected
+            position = next(
+                (i for i, column in enumerate(summary_tab.columns)
+                 if column[0].endswith(suf)),
+                len(summary_tab.columns))
+            summary_tab.insert(position, 'counts' + suf, counts_column)
+        summary_table_list.append(summary_tab)
+
+    # Join summary tables; the reference label column is kept only once
+    summary_table = summary_table_list[0]
+    for summary_tab in summary_table_list[1:]:
+        summary_table = pd.concat([
+            summary_table,
+            summary_tab.iloc[:, 1:]
+            ], axis=1)
+    # Flatten summary statistics table
+    summary_table.columns = [' '.join(col).strip()
+                             for col in summary_table.columns.values]
+    return summary_table
diff --git a/napari_skimage_regionprops/_regionprops.py b/napari_skimage_regionprops/_regionprops.py
@@ -111,7 +111,6 @@ def standard_deviation_intensity(region, intensities):
     # weighted_moments_central
     # weighted_moments_hu
     # weighted_moments_normalized
-    print('PROPERTIES = ', properties)
     # quantitative analysis using scikit-image's regionprops
     from skimage.measure import regionprops_table as sk_regionprops_table
     table = sk_regionprops_table(np.asarray(labels).astype(int), intensity_image=np.asarray(image),

diff --git a/napari_skimage_regionprops/_table.py b/napari_skimage_regionprops/_table.py
@@ -239,15 +239,15 @@ def append_content(self, table: Union[dict, DataFrame], how: str = 'outer'):
 
 
 @register_function(menu="Measurement > Show table (nsr)")
-def add_table(labels_layer: "napari.layers.Layer", viewer: "napari.Viewer") -> TableWidget:
+def add_table(labels_layer: "napari.layers.Layer", viewer: "napari.Viewer", tabify: bool = False) -> TableWidget:
     """
     Add a table to a viewer and return the table widget. The table will show the `properties` of the given layer.
     """
     dock_widget = get_table(labels_layer, viewer)
     if dock_widget is None:
         dock_widget = TableWidget(labels_layer, viewer)
         # add widget to napari
-        viewer.window.add_dock_widget(dock_widget, area='right', name="Properties of " + labels_layer.name)
+        viewer.window.add_dock_widget(dock_widget, area='right', name="Properties of " + labels_layer.name, tabify = tabify)
     else:
         dock_widget.set_content(labels_layer.properties)
         if not dock_widget.parent().isVisible():
Original file line number	Diff line number	Diff line change
		@@ -0,0 +1,2 @@
		"We used image set BBBC007v1 image set version 1 (Jones et al., Proc. ICCV Workshop on Computer Vision for Biomedical Image Applications, 2005), available from the Broad Bioimage Benchmark Collection [Ljosa et al., Nature Methods, 2012]."
		The images "17P1_POS0006_D_1UL.tif" and "17P1_POS0006_F_2UL.tif" were cropped (square 220px large with upper-left corner positioned at [80px, 150px] [x, y]) and converted from RGB to 16bit depth.