# eval_utils.py

import numpy as np
import itertools
import shutil
import nrrd
import copy
import pdb
import os

from sklearn.metrics import f1_score

import NN_extended
from post_processing import connected_component_analysis_3d, fill_holes
from datasets.utils import gen_batch_inds
from patch_utils import extract_Hakims_data_path

def eval_metrics(model, sess, 
                 dat_gen, 
                 iters=50,
                 update=True,
                 alt_attr=None):
    """Evaluate a model on `iters` batches drawn from `dat_gen`.

    The metrics to compute are the keys of a dictionary stored on the
    model: the attribute named `alt_attr` if it is given, otherwise
    `model.valid_metrics`. Recognised keys are:

    * 'acc' or 'av_acc' : fraction of elements whose arg-max prediction
      equals the arg-max of the mask,
    * 'F1'              : binary F1 if `model.class_num == 2`, otherwise
      the weighted multi-class F1,
    * 'av_loss'         : batch-size-weighted running mean of `model.loss`.

    Parameters
    ----------
    model : object
        Must expose `x`, `y_`, `keep_prob`, `is_training` (used as
        feed-dict keys) plus `posteriors`, `loss` and `class_num`.
        If it has a `teacher` attribute, the teacher's `keep_prob` and
        `is_training` are fed as well.
    sess : object
        Its `run(fetches, feed_dict=...)` is called with a dictionary of
        fetches and must return a dictionary with the same keys.
    dat_gen : callable
        Called without arguments; returns `(batch_X, batch_mask)`. Both
        posteriors and masks are arg-maxed along their last axis.
    iters : int
        Number of batches to evaluate.
    update : bool
        If True, append the computed values to the metrics dictionary
        and return None. If False, return the internal `eval_dict`.
    alt_attr : str or None
        Name of an alternative metrics attribute on `model`.

    Returns
    -------
    None or dict
        With `update=False`, a dict that holds the running 'av_loss'
        (if requested). NOTE: the 'accs' / 'F1s' entries of that dict
        are placeholders and stay empty lists, as they always have.
    """

    # metrics
    if alt_attr is not None:
        assert hasattr(model,alt_attr), 'The alternative attribute'+\
            ' does not exist.'
        valid_metrics = getattr(model, alt_attr)
    else:
        valid_metrics = model.valid_metrics
    metric_names = list(valid_metrics.keys())

    # Both spellings are accepted for accuracy: the original code set up
    # the fetch for 'av_acc' but only ever recorded a value for 'acc'.
    acc_keys = ('acc', 'av_acc')
    needs_acc = any(name in acc_keys for name in metric_names)
    needs_F1 = 'F1' in metric_names
    needs_loss = 'av_loss' in metric_names

    op_dict = {}
    eval_dict = {}
    if needs_acc:
        eval_dict['accs'] = []
    if needs_F1:
        eval_dict['F1s'] = []
        # binary or multiple F1 score
        if model.class_num == 2:
            F1_score = lambda x, y: binary_F1_score(x, y)
        else:
            F1_score = lambda x, y: multi_F1_score(x, y, model.class_num)[1]
    if needs_acc or needs_F1:
        # Accuracy and F1 share the same predictions, so the posteriors
        # are fetched (and the predictions stored) only once per batch.
        op_dict['posteriors'] = model.posteriors
    if needs_loss:
        op_dict['av_loss'] = model.loss
        eval_dict['av_loss'] = 0.
    model_inclusion = bool(op_dict)

    all_preds = []
    all_masks = []
    vol = 0  # number of samples seen so far
    for _ in range(iters):
        batch_X, batch_mask = dat_gen()
        b = batch_X.shape[0]

        feed_dict = {}
        if model_inclusion:
            feed_dict.update({model.x:batch_X,
                              model.y_:batch_mask,
                              model.keep_prob:1.,
                              model.is_training:False})
        if hasattr(model, 'teacher'):
            feed_dict.update({model.teacher.keep_prob:1.,
                              model.teacher.is_training:False})

        results = sess.run(op_dict, feed_dict=feed_dict)

        if 'av_loss' in results:
            # eval_dict['av_loss'] : average loss over the `vol` samples so far
            # results['av_loss']   : average loss of the newest batch
            eval_dict['av_loss'] = (vol*eval_dict['av_loss']
                                    + results['av_loss']*b) / (vol+b)

        if 'posteriors' in results:
            all_preds.append(np.argmax(results['posteriors'], axis=-1))
            all_masks.append(np.argmax(batch_mask, axis=-1))

        vol += b

    if not update:
        return eval_dict

    if needs_acc or needs_F1:
        preds = np.concatenate(all_preds, axis=0)
        masks = np.concatenate(all_masks, axis=0)

    for metric in metric_names:
        if metric in acc_keys:
            valid_metrics[metric] += [np.sum(preds==masks) / float(preds.size)]
        elif metric=='F1':
            valid_metrics[metric] += [F1_score(preds, masks)]
        elif 'loss' in metric:
            valid_metrics[metric] += [eval_dict[metric]]

def full_slice_segment(model,sess,img_paths_or_mats, data_reader, op='prediction'):
    """Run a model slice-by-slice over a whole volume.

    The input channels are stacked along the last axis of the model
    input, the third axis of every volume is treated as the slice axis,
    and slices are pushed through the model in batches of four.

    Parameters
    ----------
    model : object
        Must expose `x`, `keep_prob`, `is_training` and whichever of
        `posteriors`, `output`, `AU_vals`, `loss`, `y_`, `dropout_rate`,
        `AU_4U`, `AU_4L` the requested `op` touches.
    sess : object
        Session-like object; `sess.run(tensor, feed_dict=...)` is used.
    img_paths_or_mats : list, numpy.ndarray or path
        One entry per input channel. Each entry is either an already
        loaded (h, w, z) array or something `data_reader` can load into
        one. A single channel may be given bare or wrapped in a list.
    data_reader : callable
        Loads one volume from one path; only called for non-array entries.
    op : str
        'prediction'   -> (h, w, z) arg-max of `model.posteriors`
        'posterior'    -> (c, h, w, z) `model.posteriors`
        'MC-posterior' -> as 'posterior', averaged over 10 runs with
                          `keep_prob = 1 - model.dropout_rate`
        'output'       -> (c, h, w, z) `model.output`
        'AU_vals'      -> (h, w, z) `model.AU_vals` (when `model.AU_4U`)
        'sigma'        -> channels `c:` of `model.output`
        'MC-sigma'     -> as 'sigma', averaged over 10 stochastic runs
        'loss'         -> scalar, slice-count-weighted mean of `model.loss`

    Returns
    -------
    numpy.ndarray or float

    Raises
    ------
    ValueError
        If `op` is not one of the operations listed above (previously an
        unknown `op` silently returned an all-zero array).

    NOTE(review): for op='loss' only `model.x` is fed, not `model.y_`;
    presumably the loss must not depend on a label placeholder — confirm.
    NOTE(review): 'sigma' ops assume `model.output` has `c` extra
    channels after the first `c` — confirm against the model definition.
    """

    supported_ops = ('prediction', 'AU_vals', 'output', 'posterior',
                     'MC-posterior', 'loss', 'sigma', 'MC-sigma')
    if op not in supported_ops:
        raise ValueError('Unknown op {!r}; expected one of {}.'.format(
            op, supported_ops))

    # size of batch
    b = 4

    # Normalise the input to a list with one entry per channel. Doing
    # this up front fixes two cases the original handled wrongly: a
    # one-element list of paths (the whole list was passed to
    # `data_reader`) and a bare array (it was indexed as if it were a
    # list of volumes).
    if isinstance(img_paths_or_mats, list):
        inputs = img_paths_or_mats
    else:
        inputs = [img_paths_or_mats]

    # m: number of input channels
    m = len(inputs)
    img_list = [item if isinstance(item, np.ndarray) else data_reader(item)
                for item in inputs]
    h,w,z = img_list[0].shape

    hx,wx = [model.x.shape[1].value, model.x.shape[2].value]
    assert h==hx and w==wx, 'Shape of data and model.x should match.'

    # allocating the output according to the requested op
    if op=='prediction':
        out_tensor = np.zeros((h,w,z))
    elif op=='loss':
        out_tensor = 0.
        cnt = 0
    elif op=='output' and (model.AU_4U or model.AU_4L):
        c = model.output.shape[-1].value
        out_tensor = np.zeros((c,h,w,z))
    elif op=='AU_vals' and model.AU_4U:
        out_tensor = np.zeros((h,w,z))
    else:
        c = model.y_.shape[-1].value  # = model.class_num in new version
        out_tensor = np.zeros((c,h,w,z))

    # performing the op for all slices in batches
    batches = gen_batch_inds(z, b)
    for batch in batches:
        batch_inds = np.sort(batch)
        batch_X = np.zeros((len(batch_inds),h,w,m))
        for j in range(m):
            # (h, w, batch) -> (batch, h, w)
            batch_X[:,:,:,j] = np.rollaxis(img_list[j][:,:,batch_inds], 
                                           axis=-1)
        feed_dict = {model.x:batch_X, model.keep_prob:1., model.is_training:False}
        if op=='prediction':
            P = sess.run(model.posteriors, feed_dict=feed_dict)
            batch_preds = np.argmax(P, axis=-1)
            # (batch, h, w) -> (h, w, batch)
            out_tensor[:,:,batch_inds] = np.rollaxis(batch_preds,axis=0,start=3)
        elif op=='AU_vals':
            P = sess.run(model.AU_vals, feed_dict=feed_dict)
            # (batch, h, w) -> (h, w, batch)
            out_tensor[:,:,batch_inds] = np.swapaxes(np.swapaxes(P,1,2),0,2)
        elif op=='output':
            P = sess.run(model.output, feed_dict=feed_dict)
            # (batch, h, w, c) -> (c, h, w, batch)
            out_tensor[:,:,:,batch_inds] = np.swapaxes(P,0,3)
        elif op=='posterior':
            P = sess.run(model.posteriors, feed_dict=feed_dict)
            out_tensor[:,:,:,batch_inds] = np.swapaxes(P,0,3)
        elif op=='MC-posterior':
            # keep dropout active and average T stochastic forward passes
            feed_dict[model.keep_prob] = 1-model.dropout_rate
            T = 10
            av_P = sess.run(model.posteriors, feed_dict=feed_dict)
            for i in range(1,T):
                av_P = (i*av_P + sess.run(model.posteriors, feed_dict=feed_dict))/(i+1)
            out_tensor[:,:,:,batch_inds] = np.swapaxes(av_P,0,3)
        elif op=='loss':
            loss = sess.run(model.loss, feed_dict=feed_dict)
            # running mean weighted by the number of slices per batch
            out_tensor = (len(batch)*loss + cnt*out_tensor) / (cnt+len(batch))
            cnt += len(batch)
        elif op=='sigma':
            out = sess.run(model.output, feed_dict=feed_dict)
            out_tensor[:,:,:,batch_inds] = np.swapaxes(out[:,:,:,c:],0,3)
        elif op=='MC-sigma':
            feed_dict[model.keep_prob] = 1-model.dropout_rate
            T = 10
            out = sess.run(model.output, feed_dict=feed_dict)
            av_sigma = out[:,:,:,c:]
            for i in range(1,T):
                out = sess.run(model.output, feed_dict=feed_dict)
                av_sigma = (i*av_sigma + out[:,:,:,c:])/(i+1)
            out_tensor[:,:,:,batch_inds] = np.swapaxes(av_sigma,0,3)

    return out_tensor

def get_full_segs(models_dict, 
                  sess,
                  dat,
                  post_process=False,
                  save_path=None,
                  dat_writer=None):
    """Segment every volume of a data set and optionally save the results.

    For each index, the mask is read only to obtain its in-plane shape,
    which (formatted as a string) selects the model from `models_dict`.
    The image paths of all modalities in `dat.mods` are then passed to
    `full_slice_segment` together with `dat.reader`.

    Parameters
    ----------
    models_dict : dict
        Maps the string form of an in-plane shape tuple to a model.
    sess : session-like object forwarded to `full_slice_segment`.
    dat : object
        Must expose `mods`, `img_addrs`, `mask_addrs`, `mask_reader`
        and `reader`.
    post_process : bool
        If True, apply `connected_component_analysis_3d` followed by
        `fill_holes` to each segmentation.
    save_path : str or None
        Existing directory in which `seg_<i>.nrrd` files are written.
        If the directory does not exist a message is printed and
        nothing is saved.
    dat_writer : callable or None
        Called as `dat_writer(path, seg)`; defaults to `nrrd.write`.

    Returns
    -------
    list
        One segmentation per volume, in data-set order.
    """

    num_volumes = len(dat.img_addrs[dat.mods[0]])

    segs = []
    for idx in range(num_volumes):
        ref_mask = dat.mask_reader(dat.mask_addrs[idx])
        in_plane = ref_mask.shape[:2]
        channel_paths = [dat.img_addrs[mod][idx] for mod in dat.mods]

        chosen_model = models_dict['{}'.format(in_plane)]
        result = full_slice_segment(chosen_model, sess,
                                    channel_paths, dat.reader)
        if post_process:
            result = connected_component_analysis_3d(result)
            result = fill_holes(result)

        segs.append(result)

    # nothing to write: hand the segmentations straight back
    if save_path is None:
        return segs

    if not os.path.exists(save_path):
        print('The specified path for saving data does not exist.')
        return segs

    if dat_writer is None:
        def dat_writer(path, dat):
            return nrrd.write(path, dat)

    for idx, result in enumerate(segs):
        target = os.path.join(save_path, 'seg_{}.nrrd'.format(idx))
        dat_writer(target, result)

    return segs
        

def eval_full_segs_explicit_partitions(seg_paths_or_mats, 
                                       mask_paths_or_mats,
                                       slice_partitions,
                                       **kwargs):
    """Binary F1 scores per volume, overall and per slice partition.

    Each volume is cut along its third axis at the given slice indices,
    and `binary_F1_score` is computed for the whole volume and for each
    of the resulting pieces.

    Parameters
    ----------
    seg_paths_or_mats, mask_paths_or_mats : sequence
        Either loaded volumes or paths (decided by whether the first
        element is a `str`). Paths are loaded with the readers below.
    slice_partitions : list or numpy.ndarray
        Cut positions. Either one set of K cut indices shared by all
        volumes (a flat list/1-D array or a single row), or one row of
        K cut indices per volume.
    **kwargs
        `dat_reader` and `mask_reader`: callables loading one volume
        from a path; both default to the data part of `nrrd.read`.

    Returns
    -------
    overall_Fscores : numpy.ndarray, shape (n,)
    part_Fscores : numpy.ndarray, shape (n, K+1)

    Raises
    ------
    ValueError
        If fewer partition rows than volumes are supplied and the rows
        cannot be broadcast.
    """

    kwargs.setdefault('dat_reader', lambda x:nrrd.read(x)[0])
    kwargs.setdefault('mask_reader', lambda x:nrrd.read(x)[0])
    dat_reader = kwargs['dat_reader']
    mask_reader = kwargs['mask_reader']
    
    # loading the data if only some paths are given
    if isinstance(seg_paths_or_mats[0], str):
        segs = [dat_reader(path) for path in seg_paths_or_mats]
    else:
        segs = seg_paths_or_mats

    if isinstance(mask_paths_or_mats[0], str):
        masks = [mask_reader(path) for path in mask_paths_or_mats]
    else:
        masks = mask_paths_or_mats

    # get the partitions as an (n, K) array.
    # The original `np.repeat(np.array(list), n, axis=0)` produced a 1-D
    # array for a flat list and duplicated rows (mis-aligning volumes)
    # for a per-volume list; broadcasting is now done only for one row.
    n = len(segs)
    partitions = np.atleast_2d(np.asarray(slice_partitions))
    if partitions.shape[0] == 1 and n > 1:
        partitions = np.repeat(partitions, n, axis=0)
    if partitions.shape[0] < n:
        raise ValueError('Got {} partition rows for {} volumes.'.format(
            partitions.shape[0], n))

    # computing the scores
    M = partitions.shape[1]+1
    part_Fscores = np.zeros((n, M))
    overall_Fscores = np.zeros(n)

    for i in range(n):
        seg = segs[i]
        mask = masks[i]
        overall_Fscores[i] = binary_F1_score(seg, mask)

        # `None` leaves the first / last piece open-ended, so piece j
        # spans bounds[j]:bounds[j+1] along the slice axis
        bounds = [None] + list(partitions[i]) + [None]
        for j in range(M):
            seg_part = seg[:,:,bounds[j]:bounds[j+1]]
            mask_part = mask[:,:,bounds[j]:bounds[j+1]]
            part_Fscores[i,j] = binary_F1_score(seg_part, mask_part)

    return overall_Fscores, part_Fscores

def eval_full_segs_label_percentage(seg_paths_or_mats, 
                                    mask_paths_or_mats,
                                    label, percentage,
                                    **kwargs):
    """Binary F1 scores for a 3-fold (top / middle / bottom) partitioning.

    For every volume, the slices along the third axis in which the
    fraction of mask voxels equal to `label` is below `percentage` are
    located. They are expected to form exactly two runs (top and
    bottom) separated by one gap of label-rich slices (middle).
    `binary_F1_score` is computed for the whole volume and for each of
    the three pieces.

    Parameters
    ----------
    seg_paths_or_mats, mask_paths_or_mats : sequence
        Either loaded volumes or paths (decided by whether the first
        element is a `str`).
    label : scalar
        Mask value whose per-slice frequency defines the partition.
    percentage : float
        Threshold on the per-slice fraction of `label` voxels.
    **kwargs
        `dat_reader` and `mask_reader`: callables loading one volume
        from a path; both default to the data part of `nrrd.read`.

    Returns
    -------
    overall_Fscores : numpy.ndarray, shape (n,)
    part_Fscores : numpy.ndarray, shape (n, 3)
        Rows of volumes that do not have exactly one gap (including the
        case where the label-rich run touches the first or last slice)
        are left at zero and a message is printed.
    """

    kwargs.setdefault('dat_reader', lambda x:nrrd.read(x)[0])
    kwargs.setdefault('mask_reader', lambda x:nrrd.read(x)[0])
    dat_reader = kwargs['dat_reader']
    mask_reader = kwargs['mask_reader']
    
    # loading the data if only some paths are given
    if isinstance(seg_paths_or_mats[0], str):
        segs = [dat_reader(path) for path in seg_paths_or_mats]
    else:
        segs = seg_paths_or_mats

    if isinstance(mask_paths_or_mats[0], str):
        masks = [mask_reader(path) for path in mask_paths_or_mats]
    else:
        masks = mask_paths_or_mats

    # computing the scores
    M = 3
    part_Fscores = np.zeros((len(segs), M))
    overall_Fscores = np.zeros(len(segs))

    for i in range(len(segs)):
        seg = segs[i]
        mask = masks[i]
        overall_Fscores[i] = binary_F1_score(seg, mask)

        # get the partition for this volume
        label_num = np.sum(mask==label, axis=(0,1))
        slice_area = float(np.prod(mask.shape[:2]))
        thr_slices = np.where(label_num/slice_area < percentage)[0]
        gap_loc = np.where(np.diff(thr_slices) > 1)[0]
        if len(gap_loc)>1:
            print('There are more than one gap for slice-wise label volume' + \
                  ' of image {}'.format(i))
            continue
        if len(gap_loc)==0:
            # previously this case crashed with an IndexError below
            print('There is no gap for slice-wise label volume' + \
                  ' of image {}'.format(i))
            continue

        # thr_slices[gap] is the last below-threshold slice of the top
        # run, so the top piece must include it (hence the +1; the
        # original left this slice in the middle piece).
        top_end = thr_slices[gap_loc[0]] + 1
        # first below-threshold slice of the bottom run
        bottom_start = thr_slices[gap_loc[0]+1]

        # top partition
        part_Fscores[i,0] = binary_F1_score(seg[:,:,:top_end],
                                            mask[:,:,:top_end])
        # middle partition
        part_Fscores[i,1] = binary_F1_score(seg[:,:,top_end:bottom_start],
                                            mask[:,:,top_end:bottom_start])
        # last partition
        part_Fscores[i,2] = binary_F1_score(seg[:,:,bottom_start:],
                                            mask[:,:,bottom_start:])

    return overall_Fscores, part_Fscores


def binary_F1_score(preds, labels):
    """F1 (Dice) score of two binary arrays.

    Computed as 2*sum(preds*labels) / (sum(labels) + sum(preds));
    returns 0. when both arrays sum to zero.
    """

    overlap = np.sum(preds*labels)
    denominator = np.sum(labels) + np.sum(preds)

    if denominator == 0.:
        return 0.
    return 2*overlap/denominator

def multi_F1_score(preds,labels,C=None):
    """Multi-class F1 scores via scikit-learn's `f1_score`.

    Classes 1 .. C-1 are scored; class 0 (background) is left out of
    both the individual scores and the weighted average. When `C` is
    not given it is taken as the number of distinct values in `labels`.

    Returns
    -------
    indiv_scores : per-class F1 scores for classes 1 .. C-1
    av_score : their 'weighted' average as computed by `f1_score`
    """

    num_classes = len(np.unique(labels)) if C is None else C

    truth_flat = np.ravel(labels)
    preds_flat = np.ravel(preds)
    # background (class 0) is not treated as a separate class
    foreground = np.arange(1,num_classes)

    indiv_scores = f1_score(truth_flat, preds_flat,
                            labels=foreground, average=None)
    av_score = f1_score(truth_flat, preds_flat,
                        labels=foreground, average='weighted')

    return indiv_scores, av_score

def simple_eval_model(model,sess,dat_gen):
    """Accuracy of `model.prediction` over all batches of `dat_gen`.

    `dat_gen` is iterated and must yield triples whose first two items
    are the input batch and its labels; labels are arg-maxed along
    axis 0. `model.keep_prob` is fed as 1. unless `model.dropout_rate`
    is None.

    Returns
    -------
    acc : fraction of predictions equal to the arg-maxed labels
    preds : concatenated predictions of all batches
    """

    feed_dict = {} if model.dropout_rate is None else {model.keep_prob: 1.}

    batch_preds = []
    batch_truths = []
    for Xb, Yb, _ in dat_gen:
        feed_dict[model.x] = Xb
        batch_preds.append(sess.run(model.prediction,
                                    feed_dict=feed_dict))
        batch_truths.append(np.argmax(Yb, axis=0))

    preds = np.concatenate(batch_preds)
    grounds = np.concatenate(batch_truths)
    num_correct = np.sum(preds==grounds)
    acc = num_correct / len(preds)

    return acc, preds

    
def models_dict_for_different_sizes(model_builder,
                                    dat):
    """Form a dictionary of FCN models, one per in-plane image size
    that exists in the given data set.

    Three fields of the data class `dat` are used: `mods` (only its
    first modality is inspected), `img_addrs` (image paths per
    modality) and `reader` (loads one image from a path).

    Model builder should be a function that only takes an input size
    (a two-element list) and a model name, and returns a model object
    that accepts inputs of the given size. `add_assign_ops()` is called
    on every model that is built.

    Returns
    -------
    dict
        Maps `str(shape)` of each distinct in-plane shape tuple, e.g.
        '(256, 256)', to its model. Models are built in sorted shape
        order so that construction is deterministic.
    """

    first_mod_paths = dat.img_addrs[dat.mods[0]]

    # A plain set gives the distinct shapes; the original obtained the
    # same set through `np.unique(set(shapes))[0]`, which only worked
    # because numpy wrapped the set in a one-element object array.
    shapes = {tuple(dat.reader(path).shape[:2]) for path in first_mod_paths}

    models_dict = {}
    for shape in sorted(shapes):
        key = str(shape)
        model_name = '{}x{}'.format(shape[0],shape[1])
        models_dict[key] = model_builder(list(shape), model_name)
        models_dict[key].add_assign_ops()

    return models_dict