Source code for tiatoolbox.utils.metrics
# ***** BEGIN GPL LICENSE BLOCK *****
#
# This program is free software; you can redistribute it and/or
# modify it under the terms of the GNU General Public License
# as published by the Free Software Foundation; either version 2
# of the License, or (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software Foundation,
# Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
#
# The Original Code is Copyright (C) 2021, TIA Centre, University of Warwick
# All rights reserved.
# ***** END GPL LICENSE BLOCK *****
"""This module defines several metrics used in computational pathology."""
import numpy as np
from scipy.optimize import linear_sum_assignment
from scipy.spatial import distance
[docs]def pair_coordinates(setA, setB, radius):
"""Find optimal unique pairing between two sets of coordinates.
This function uses the Munkres or Kuhn-Munkres algorithm behind the
scene to find the most optimal unique pairing when pairing points
in set B against points in set A, using euclidean distance as
the cost function.
Args:
setA (ndarray): an array of shape Nx2 contains the of XY coordinate
of N different points.
setB (ndarray): an array of shape Mx2 contains the of XY coordinate
of M different points.
radius: valid area around a point in setA to consider a given
coordinate in setB a candidate for matching.
Returns:
pairing (ndarray): an array of shape Kx2, each item in K contains
indices where point at index [0] in set A paired with
point in set B at index [1].
unpairedA (ndarray): indices of unpaired points in set A.
unpairedB (ndarray): indices of unpaired points in set A.
"""
# * Euclidean distance as the cost matrix
pair_distance = distance.cdist(setA, setB, metric="euclidean")
# * Munkres pairing with scipy library
# the algorithm return (row indices, matched column indices)
# if there is multiple same cost in a row, index of first occurence
# is return, thus the unique pairing is ensured
indicesA, paired_indicesB = linear_sum_assignment(pair_distance)
# extract the paired cost and remove instances
# outside of designated radius
pair_cost = pair_distance[indicesA, paired_indicesB]
pairedA = indicesA[pair_cost <= radius]
pairedB = paired_indicesB[pair_cost <= radius]
pairing = np.concatenate([pairedA[:, None], pairedB[:, None]], axis=-1)
unpairedA = np.delete(np.arange(setA.shape[0]), pairedA)
unpairedB = np.delete(np.arange(setB.shape[0]), pairedB)
return pairing, unpairedA, unpairedB
[docs]def f1_detection(true, pred, radius):
"""Calculate the F1-score for predicted set of coordinates."""
(paired_true, unpaired_true, unpaired_pred) = pair_coordinates(true, pred, radius)
tp = len(paired_true)
fp = len(unpaired_pred)
fn = len(unpaired_true)
return tp / (tp + 0.5 * fp + 0.5 * fn)