Source code for segmentationmetrics.tests.test_metrics

import numpy as np
import pandas as pd
import pytest

from segmentationmetrics import SegmentationMetrics
from skimage.morphology import ball



[docs]
def assert_dict_approx(actual, expected, rel=1e-20, abs=1e-4):
    assert set(actual.keys()) == set(expected.keys())
    for k, v in expected.items():
        assert k in actual
        a = actual[k]
        if np.isnan(v):
            assert np.isnan(a)
        else:
            assert a == pytest.approx(v, rel=rel, abs=abs)




[docs]
class TestSegmentationMetrics:
    # Generate three spherical masks, two that are similar and one that
    # doesn't overlap at all
    img_shape = (256, 256, 256)
    canvas = np.zeros(img_shape, dtype=np.int8)

    # Base sphere
    centre_a = (128, 128, 128)
    radius_a = 80
    ball_a = ball(radius_a)
    img_a = canvas.copy()
    img_a[centre_a[0] - ball_a.shape[0] // 2:
          centre_a[0] + ball_a.shape[0] // 2 + 1,
          centre_a[1] - ball_a.shape[1] // 2:
          centre_a[1] + ball_a.shape[1] // 2 + 1,
          centre_a[2] - ball_a.shape[2] // 2:
          centre_a[2] + ball_a.shape[2] // 2 + 1] = ball_a

    # Slightly smaller and offset
    centre_b = (132, 132, 132)
    radius_b = 77
    ball_b = ball(radius_b)
    img_b = canvas.copy()
    img_b[centre_b[0] - ball_b.shape[0] // 2:
          centre_b[0] + ball_b.shape[0] // 2 + 1,
          centre_b[1] - ball_b.shape[1] // 2:
          centre_b[1] + ball_b.shape[1] // 2 + 1,
          centre_b[2] - ball_b.shape[2] // 2:
          centre_b[2] + ball_b.shape[2] // 2 + 1] = ball_b

    # Fits in the corner, not overlapping with either sphere_a or sphere_b
    centre_c = (50, 50, 50)
    radius_c = 40
    ball_c = ball(radius_c)
    img_c = canvas.copy()
    img_c[centre_c[0] - ball_c.shape[0] // 2:
          centre_c[0] + ball_c.shape[0] // 2 + 1,
          centre_c[1] - ball_c.shape[1] // 2:
          centre_c[1] + ball_c.shape[1] // 2 + 1,
          centre_c[2] - ball_c.shape[2] // 2:
          centre_c[2] + ball_c.shape[2] // 2 + 1] = ball_c
    
    # Add a second label to img_a
    centre_d = (140, 140, 140)
    radius_d = 30
    ball_d = ball(radius_d)
    img_d = img_a.copy()
    img_d[centre_d[0] - ball_d.shape[0] // 2:
          centre_d[0] + ball_d.shape[0] // 2 + 1,
          centre_d[1] - ball_d.shape[1] // 2:
          centre_d[1] + ball_d.shape[1] // 2 + 1,
          centre_d[2] - ball_d.shape[2] // 2:
          centre_d[2] + ball_d.shape[2] // 2 + 1] += ball_d
    
    # Add a second label to img_b
    centre_e = (160, 160, 160)
    radius_e = 25
    ball_e = ball(radius_e)
    img_e = img_b.copy()
    img_e[centre_e[0] - ball_e.shape[0] // 2:
          centre_e[0] + ball_e.shape[0] // 2 + 1,
          centre_e[1] - ball_e.shape[1] // 2:
          centre_e[1] + ball_e.shape[1] // 2 + 1,
          centre_e[2] - ball_e.shape[2] // 2:
          centre_e[2] + ball_e.shape[2] // 2 + 1] += ball_e
    
    # Add a second label to img_a that doesn't overlap with the first label in img_a
    centre_f = (10, 10, 10)
    radius_f = 4
    ball_f = ball(radius_f)
    img_f = img_a.copy()
    img_f[centre_f[0] - ball_f.shape[0] // 2:
          centre_f[0] + ball_f.shape[0] // 2 + 1,
          centre_f[1] - ball_f.shape[1] // 2:
          centre_f[1] + ball_f.shape[1] // 2 + 1,
          centre_f[2] - ball_f.shape[2] // 2:
          centre_f[2] + ball_f.shape[2] // 2 + 1] += (ball_f * 2)


[docs]
    def test_basic_case(self):
        # Overlapping spheres, isotropic voxels
        sm = SegmentationMetrics(self.img_a, self.img_b, (1, 1, 1))
        expected = {'accuracy': 0.9810,
                'dice': 0.9216,
                'hausdorff_distance': 8.6023,
                'jaccard': 0.8546,
                'mean_surface_distance': 3.6676,
                'precision': 0.8719,
                'predicted_volume': 2143.641,
                'sensitivity': 0.9773,
                'specificity': 0.9815,
                'true_volume': 1912.319,
                'volume_difference': 231.3220}
        assert_dict_approx(sm.get_dict(), expected, rel=1e-20, abs=1e-4)
        # Verify dataframe is returned
        assert type(sm.get_df()) == pd.DataFrame



[docs]
    def test_float_case(self):
        # One image is a float array, checks these get thresholded.
        img_b_float = self.img_b.astype(float)
        img_b_float[img_b_float > 0.5] = 0.9
        sm = SegmentationMetrics(self.img_a, img_b_float, (1, 1, 1))
        expected = {'accuracy': 0.9810,
                'dice': 0.9216,
                'hausdorff_distance': 8.6023,
                'jaccard': 0.8546,
                'mean_surface_distance': 3.6676,
                'precision': 0.8719,
                'predicted_volume': 2143.641,
                'sensitivity': 0.9773,
                'specificity': 0.9815,
                'true_volume': 1912.319,
                'volume_difference': 231.3220}
        assert_dict_approx(sm.get_dict(), expected, rel=1e-20, abs=1e-4)



[docs]
    def test_options(self):
        # Confirm changing Hausdorff percentile and surface distance
        # symmetry flags work as expected
        sm = SegmentationMetrics(self.img_a, self.img_b, (1, 1, 1),
                                 percentile=99, symmetric=False)
        assert np.isclose(sm.hausdorff_distance, 9.2736, rtol=1e-20, atol=1e-4)
        assert np.isclose(sm.mean_surface_distance, (3.7923, 3.5430),
                          rtol=1e-20, atol=1e-4).all()



[docs]
    def test_nonisotropic_voxels(self):
        # Overlapping spheres, non-isotropic voxels
        sm = SegmentationMetrics(self.img_a[..., ::2], self.img_b[..., ::2],
                                 (1, 1, 2))
        expected = {'accuracy': 0.9811,
                'dice': 0.9218,
                'hausdorff_distance': 8.4853,
                'jaccard': 0.8549,
                'mean_surface_distance': 3.5352,
                'precision': 0.8724,
                'predicted_volume': 2142.914,
                'sensitivity': 0.9770,
                'specificity': 0.9816,
                'true_volume': 1913.474,
                'volume_difference': 229.4400}
        assert_dict_approx(sm.get_dict(), expected, rel=1e-20, abs=1e-4)



[docs]
    def test_2d(self):
        sm = SegmentationMetrics(self.img_a[..., 128], self.img_b[..., 128],
                                 (1, 1))
        expected = {'accuracy': 0.9688,
                'dice': 0.9470,
                'hausdorff_distance': 8.4853,
                'jaccard': 0.8993,
                'mean_surface_distance': 3.8745,
                'precision': 0.9110,
                'predicted_volume': 20.081,
                'sensitivity': 0.9860,
                'specificity': 0.9619,
                'true_volume': 18.553,
                'volume_difference': 1.5280}
        assert_dict_approx(sm.get_dict(), expected, rel=1e-20, abs=1e-4)



[docs]
    def test_no_overlap(self):
        # Non-overlapping spheres
        sm = SegmentationMetrics(self.img_a, self.img_c, (1, 1, 1))
        expected = {'accuracy': 0.8563,
                'dice': 0.0,
                'hausdorff_distance': 169.2661,
                'jaccard': 0.0,
                'mean_surface_distance': 84.2791,
                'precision': 0.0,
                'predicted_volume': 2143.641,
                'sensitivity': 0.0,
                'specificity': 0.8702,
                'true_volume': 267.761,
                'volume_difference': 1875.88}
        assert_dict_approx(sm.get_dict(), expected, rel=1e-20, abs=1e-4)



[docs]
    def test_all_wrong(self):
        # Test with all voxels misclassified
        sm = SegmentationMetrics(self.img_a, np.logical_not(self.img_a),
                                 (1, 1, 1))
        expected = {'accuracy': 0.0,
                    'dice': 0.0,
                    'hausdorff_distance': 116.6919,
                    'jaccard': 0.0,
                    'mean_surface_distance': 34.0172,
                    'precision': 0.0,
                    'predicted_volume': 2143.641,
                    'sensitivity': 0.0,
                    'specificity': 0.0,
                    'true_volume': 14633.575,
                    'volume_difference': -12489.9340}
        assert_dict_approx(sm.get_dict(), expected, rel=1e-20, abs=1e-4)



[docs]
    def test_no_labels(self):
        # Test with no labels in either prediction or truth
        sm = SegmentationMetrics(np.zeros(self.img_shape, dtype=bool),
                                 np.zeros(self.img_shape, dtype=bool),
                                 (1, 1, 1))
        expected = {'accuracy': np.nan,
                    'dice': np.nan,
                    'hausdorff_distance': np.nan,
                    'jaccard': np.nan,
                    'mean_surface_distance': np.nan,
                    'precision': np.nan,
                    'predicted_volume': np.nan,
                    'sensitivity': np.nan,
                    'specificity': np.nan,
                    'true_volume': np.nan,
                    'volume_difference': np.nan}
        assert_dict_approx(sm.get_dict(), expected, rel=1e-20, abs=1e-4)



[docs]
    def test_multilabel_basic(self):
        # Test with multiple labels
        sm = SegmentationMetrics(self.img_d, self.img_e, (1, 1, 1))
        expected = {'accuracy': 0.9817,
                'dice': 0.5264,
                'hausdorff_distance': 30.8881,
                'jaccard': 0.4401,
                'mean_surface_distance': 10.9338,
                'precision': 0.4883,
                'predicted_volume': 2143.641,
                'sensitivity': 0.5799,
                'specificity': 0.9862,
                'true_volume': 1912.319,
                'volume_difference': 231.3220}
        assert_dict_approx(sm.get_dict(), expected, rel=1e-20, abs=1e-4)



[docs]
    def test_multilabel_with_options(self):
        # Test with multiple labels and non-default options
        sm = SegmentationMetrics(self.img_d, self.img_e, (1, 1, 1), 
                                 symmetric=False, percentile=99)
        assert np.isclose(sm.hausdorff_distance, 37.4730, rtol=1e-20, atol=1e-4)
        assert np.isclose(sm.mean_surface_distance, (12.9019,  8.9657),
                          rtol=1e-20, atol=1e-4).all()



[docs]
    def test_multilabel_labels_dont_overlap(self):
        # Test where label 1 doesn't overlap with label 2 in the ground truth
        sm = SegmentationMetrics(self.img_f, self.img_e, (1, 1, 1))
        expected = {'accuracy': 0.9866,
                'dice': 0.4520,
                'hausdorff_distance': 147.6504,
                'jaccard': 0.4124,
                'mean_surface_distance': 124.8019,
                'precision': 0.4207,
                'predicted_volume': 2143.898,
                'sensitivity': 0.4883,
                'specificity': 0.9886,
                'true_volume': 1912.319,
                'volume_difference': 361.5990}
        assert_dict_approx(sm.get_dict(), expected, rel=1e-20, abs=1e-4)    

        

[docs]
    def test_multilabel_missing_label(self):
        # Test with multiple labels, but one label missing from the prediction
        sm = SegmentationMetrics(self.img_a, self.img_e, (1, 1, 1))
        expected = {'accuracy': 0.9866,
                    'dice': 0.4520,
                    'hausdorff_distance': np.nan,
                    'jaccard': 0.4124,
                    'mean_surface_distance': np.nan,
                    'precision': 0.4207,
                    'predicted_volume': 2143.641,
                    'sensitivity': 0.4883,
                    'specificity': 0.9886,
                    'true_volume': 1912.319,
                    'volume_difference': 361.8560}
        assert_dict_approx(sm.get_dict(), expected, rel=1e-20, abs=1e-4)



[docs]
    def test_multilabel_with_options_missing_label(self):
        # Test with multiple labels, non-default options and one label missing 
        # from the prediction
        sm = SegmentationMetrics(self.img_a, self.img_e, (1, 1, 1), 
                                 symmetric=False, percentile=99)
        assert np.isnan(sm.hausdorff_distance)
        msd_arr = np.array(sm.mean_surface_distance)
        assert msd_arr.shape == (2,)  
        assert np.all(np.isnan(msd_arr)) 



[docs]
    def test_non_consecutive_labels(self):
        # Test with non-consecutive labels
        img_d = self.img_d.copy()
        img_d[img_d == 2] = 3
        img_e = self.img_e.copy()
        img_e[img_e == 2] = 3
        sm = SegmentationMetrics(img_d, img_e, (1, 1, 1))
        expected = {'accuracy': 0.9817,
                'dice': 0.5264,
                'hausdorff_distance': 30.8881,
                'jaccard': 0.4401,
                'mean_surface_distance': 10.9338,
                'precision': 0.4883,
                'predicted_volume': 2143.641,
                'sensitivity': 0.5799,
                'specificity': 0.9862,
                'true_volume': 1912.319,
                'volume_difference': 231.3220}
        assert_dict_approx(sm.get_dict(), expected, rel=1e-20, abs=1e-4)



[docs]
    def test_many_labels_error(self):
        # Test that error is raised if more than 10 labels are present and
        # many_labels=False
        img = np.arange(12).reshape((2, 2, 3))
        with pytest.raises(ValueError, match='More than 10 labels found'):
            SegmentationMetrics(img, img, (1, 1, 1), many_labels=False)