Source code for niftynet.contrib.evaluation.classification_evaluations

# -*- coding: utf-8 -*-
"""
This module defines built-in evaluation functions for classification 
applications

Many classification metrics only make sense computed over all subjects,
so aggregation is used.
"""

from __future__ import absolute_import, division, print_function

import numpy as np
import pandas as pd

from niftynet.evaluation.base_evaluations import BaseEvaluation
from niftynet.evaluation.base_evaluator import ScalarAggregator,\
                                               DataFrameAggregator

# These implement ROC based on preselected threshold levels, rather than actual 
# data. They are left here as an illustration for now 
[docs]class roc(BaseEvaluation):
[docs]    def layer_op(self, subject_id, data):
        if not self.app_param.output_prob or\
           self.app_param.num_classes>2:
           return []
        pdf = pd.DataFrame.from_records([{'subject_id':subject_id,
                            'roc_i':data['inferred'][0,0,0,0,1],
                            'roc_l':data['label'][0,0,0,0,0]}],('subject_id',))
        return [pdf]

[docs]    @classmethod
    def aggregate(cls, df):
        thresholds = np.linspace(0,1,10)
        df_out = pd.DataFrame(index=range(len(thresholds)),columns=('thresholds','tp','fp','tn','fn','acc','sens','spec'))
        df_out.thresholds = thresholds
        for it in range(len(thresholds)):
            df_out.loc[it,'tp'] = (df[df.roc_l==1].roc_i>thresholds[it]).sum()
            df_out.loc[it,'fp'] = (df[df.roc_l==0].roc_i>thresholds[it]).sum()
            df_out.loc[it,'tn'] = (df[df.roc_l==0].roc_i<=thresholds[it]).sum()
            df_out.loc[it,'fn'] = (df[df.roc_l==1].roc_i<=thresholds[it]).sum()
        df_out.acc = (df_out.tp+df_out.tn)/(
            df_out.tp+df_out.tn+df_out.fp+df_out.fn)
        denom = df_out.tp+df_out.fn
        df_out.loc[denom>0,'sens'] = df_out.loc[denom>0,'tp']/denom[denom>0]
        denom = df_out.tn+df_out.fp
        df_out.loc[denom>0,'spec'] = df_out.loc[denom>0,'tn']/denom[denom>0]
        df_out=df_out.set_index('thresholds')
        return [df_out]

[docs]    def get_aggregations(self):
        if not self.app_param.output_prob or\
           self.app_param.num_classes>2:
           return []
        return [DataFrameAggregator(('subject_id',), self.aggregate)]

[docs]class roc_auc(BaseEvaluation):
[docs]    def layer_op(self, subject_id, data):
        if not self.app_param.output_prob or\
           self.app_param.num_classes>2:
           return []
        pdf = pd.DataFrame.from_records([{'subject_id':subject_id,
                            'roc_auc_i':data['inferred'][0,0,0,0,1],
                            'roc_auc_l':data['label'][0,0,0,0,0]}],('subject_id',))
        return [pdf]

[docs]    @classmethod
    def aggregate(cls, df):
        thresholds = np.linspace(1,0,10)
        df_out = pd.DataFrame(index=range(len(thresholds)),columns=('thresholds','tp','fp','tn','fn','acc','sens','spec'))
        df_out.thresholds = thresholds
        for it in range(len(thresholds)):
            df_out.loc[it,'tp'] = (df[df.roc_auc_l==1].roc_auc_i>thresholds[it]).sum()
            df_out.loc[it,'fp'] = (df[df.roc_auc_l==0].roc_auc_i>thresholds[it]).sum()
            df_out.loc[it,'tn'] = (df[df.roc_auc_l==0].roc_auc_i<=thresholds[it]).sum()
            df_out.loc[it,'fn'] = (df[df.roc_auc_l==1].roc_auc_i<=thresholds[it]).sum()
        df_out.acc = (df_out.tp+df_out.tn)/(
            df_out.tp+df_out.tn+df_out.fp+df_out.fn)
        denom = df_out.tp+df_out.fn
        df_out.loc[denom>0,'sens'] = df_out.loc[denom>0,'tp']/denom[denom>0]
        denom = df_out.tn+df_out.fp
        df_out.loc[denom>0,'spec'] = df_out.loc[denom>0,'tn']/denom[denom>0]
        by_threshold=df_out.set_index('thresholds')

        tpr = np.array(list(by_threshold.sens))
        fpr = np.array(1-by_threshold.spec)
        roc_auc = np.sum((tpr[:-1] + tpr[1:]) * (fpr[1:] - fpr[:-1]) / 2)
        return [pd.DataFrame.from_records([{'roc_auc':roc_auc}])]


[docs]    def get_aggregations(self):
        if not self.app_param.output_prob or\
           self.app_param.num_classes>2:
           return []
        return [DataFrameAggregator(('subject_id',), self.aggregate)]