scripts/assess_detections.py

#!/bin/python
# -*- coding: utf-8 -*-

import os
import sys
import argparse
import json
import time
import yaml
import geopandas as gpd
import pandas as pd
import numpy as np
import plotly.graph_objects as go

from sklearn.metrics import confusion_matrix
from tqdm import tqdm

# the following lines allow us to import modules from within this file's parent folder
from inspect import getsourcefile
current_path = os.path.abspath(getsourcefile(lambda:0))
current_dir = os.path.dirname(current_path)
parent_dir = current_dir[:current_dir.rfind(os.path.sep)]
sys.path.insert(0, parent_dir)

from helpers import misc
from helpers import metrics
from helpers.constants import DONE_MSG, SCATTER_PLOT_MODE

from loguru import logger
logger = misc.format_logger(logger)


def main(cfg_file_path):

    tic = time.time()
    logger.info('Starting...')

    logger.info(f"Using {cfg_file_path} as config file.")

    with open(cfg_file_path) as fp:
        cfg = yaml.load(fp, Loader=yaml.FullLoader)[os.path.basename(__file__)]

    WORKING_DIR = cfg['working_directory']
    OUTPUT_DIR = cfg['output_folder']
    DETECTION_FILES = cfg['datasets']['detections']
    SPLIT_AOI_TILES = cfg['datasets']['split_aoi_tiles']
    CATEGORY_FILE = cfg['datasets']['categories']
    
    CRS_OUT = cfg['crs_out'] if 'crs_out' in cfg.keys() else 2056

    if 'ground_truth_labels' in cfg['datasets'].keys():
        GT_LABELS = cfg['datasets']['ground_truth_labels']
    else:
        GT_LABELS = None
    if 'other_labels' in cfg['datasets'].keys():
        OTH_LABELS = cfg['datasets']['other_labels']
    else:
        OTH_LABELS = None

    CONFIDENCE_THRESHOLD = cfg['confidence_threshold'] if 'confidence_threshold' in cfg.keys() else None
    IOU_THRESHOLD = cfg['iou_threshold'] if 'iou_threshold' in cfg.keys() else 0.25
    AREA_THRESHOLD = cfg['area_threshold'] if 'area_threshold' in cfg.keys() else None
    METHOD = cfg['metrics_method']

    os.chdir(WORKING_DIR)
    logger.info(f'Working directory set to {WORKING_DIR}.')
    # let's make the output directory in case it doesn't exist
    if not os.path.exists(OUTPUT_DIR):
        os.makedirs(OUTPUT_DIR)
    
    written_files = []
    
    # ------ Loading datasets

    logger.info("Loading split AoI tiles as a GeoPandas DataFrame...")
    split_aoi_tiles_gdf = gpd.read_file(SPLIT_AOI_TILES)
    if 'year' in split_aoi_tiles_gdf.keys(): 
        split_aoi_tiles_gdf = split_aoi_tiles_gdf.rename(columns={"year": "year_tile"})    
    
    logger.success(f"{DONE_MSG} {len(split_aoi_tiles_gdf)} records were found.")

    if GT_LABELS:
        logger.info("Loading Ground Truth Labels as a GeoPandas DataFrame...")
        gt_labels_gdf = gpd.read_file(GT_LABELS)
        logger.success(f"{DONE_MSG} {len(gt_labels_gdf)} records were found.")

    if OTH_LABELS:
        logger.info("Loading Other Labels as a GeoPandas DataFrame...")
        oth_labels_gdf = gpd.read_file(OTH_LABELS)
        logger.success(f"{DONE_MSG} {len(oth_labels_gdf)} records were found.")

    if GT_LABELS and OTH_LABELS:
        labels_gdf = pd.concat([
            gt_labels_gdf,
            oth_labels_gdf
        ])
    elif GT_LABELS and not OTH_LABELS:
        labels_gdf = gt_labels_gdf.copy()
    elif not GT_LABELS and OTH_LABELS:
        labels_gdf = oth_labels_gdf.copy()
    else:
        labels_gdf = pd.DataFrame() 
    if 'year' in labels_gdf.keys(): 
        labels_gdf = labels_gdf.rename(columns={"year": "year_label"})  

    if len(labels_gdf) > 0:
        logger.info("Clipping labels...")
        tic = time.time()

        assert(labels_gdf.crs == split_aoi_tiles_gdf.crs)
        clipped_labels_gdf = misc.clip_labels(labels_gdf, split_aoi_tiles_gdf, fact=0.9999)
        clipped_labels_gdf = clipped_labels_gdf.explode(ignore_index=True).to_crs(CRS_OUT)
        clipped_labels_gdf.loc[:, 'area'] = clipped_labels_gdf.area
        clipped_labels_gdf = misc.find_category(clipped_labels_gdf)
    
        file_to_write = os.path.join(OUTPUT_DIR, 'clipped_labels.gpkg')
        clipped_labels_gdf.to_file(file_to_write)
        written_files.append(file_to_write)

        logger.success(f"{DONE_MSG} Elapsed time = {(time.time()-tic):.2f} seconds.")


    # ------ Loading detections

    dets_gdf_dict = {}

    for dataset, dets_file in DETECTION_FILES.items():
        dets_gdf = gpd.read_file(dets_file)        
        dets_gdf = misc.check_validity(dets_gdf, correct=True)
        dets_gdf_dict[dataset] = dets_gdf.copy()

    
    if len(clipped_labels_gdf) > 0:
    
        # ------ Comparing detections with ground-truth data and computing metrics

        # initiate variables
        metrics_dict = {}
        metrics_dict_by_cl = {}
        for dataset in dets_gdf_dict.keys():
            metrics_dict[dataset] = []
            metrics_dict_by_cl[dataset] = []

        metrics_df_dict = {}
        metrics_cl_df_dict = {}
        thresholds = np.arange(0.05, 1., 0.05)

        # get labels ids
        filepath = open(CATEGORY_FILE)
        categories_json = json.load(filepath)
        filepath.close()

        # get classe ids
        id_classes = range(len(categories_json))

        # append class ids to labels
        categories_info_df = pd.DataFrame()
  
        for key in categories_json.keys():

            categories_tmp = {sub_key: [value] for sub_key, value in categories_json[key].items()}
            
            categories_info_df = pd.concat([categories_info_df, pd.DataFrame(categories_tmp)], ignore_index=True)

        categories_info_df.sort_values(by=['id'], inplace=True, ignore_index=True)
        categories_info_df.drop(['supercategory'], axis=1, inplace=True)

        categories_info_df.rename(columns={'name':'CATEGORY', 'id': 'label_class'},inplace=True)
        clipped_labels_gdf = clipped_labels_gdf.astype({'CATEGORY':'str'})
        clipped_labels_w_id_gdf = clipped_labels_gdf.merge(categories_info_df, on='CATEGORY', how='left')

        # get metrics
        outer_tqdm_log = tqdm(total=len(metrics_dict.keys()), position=0)

        for dataset in metrics_dict.keys():

            outer_tqdm_log.set_description_str(f'Current dataset: {dataset}')
            inner_tqdm_log = tqdm(total=len(thresholds), position=1, leave=False)

            for threshold in thresholds:

                inner_tqdm_log.set_description_str(f'Threshold = {threshold:.2f}')

                tmp_gdf = dets_gdf_dict[dataset].copy()
                tmp_gdf.to_crs(epsg=clipped_labels_w_id_gdf.crs.to_epsg(), inplace=True)
                tmp_gdf = tmp_gdf[tmp_gdf.score >= threshold].copy()

                tp_gdf, fp_gdf, fn_gdf, mismatched_class_gdf, small_poly_gdf = metrics.get_fractional_sets(
                    tmp_gdf, 
                    clipped_labels_w_id_gdf[clipped_labels_w_id_gdf.dataset == dataset],
                    IOU_THRESHOLD, AREA_THRESHOLD
                )
              
                tp_k, fp_k, fn_k, p_k, r_k, precision, recall, f1 = metrics.get_metrics(tp_gdf, fp_gdf, fn_gdf, mismatched_class_gdf, id_classes, method=METHOD)

                metrics_dict[dataset].append({
                    'threshold': threshold, 
                    'precision': precision, 
                    'recall': recall, 
                    'f1': f1
                })

                # label classes starting at 1 and detection classes starting at 0.
                for id_cl in id_classes:
                    metrics_dict_by_cl[dataset].append({
                        'threshold': threshold,
                        'class': id_cl,
                        'precision_k': p_k[id_cl],
                        'recall_k': r_k[id_cl],
                        'TP_k' : tp_k[id_cl],
                        'FP_k' : fp_k[id_cl],
                        'FN_k' : fn_k[id_cl],
                    })

                metrics_cl_df_dict[dataset] = pd.DataFrame.from_records(metrics_dict_by_cl[dataset])

                inner_tqdm_log.update(1)

            metrics_df_dict[dataset] = pd.DataFrame.from_records(metrics_dict[dataset])
            outer_tqdm_log.update(1)

        inner_tqdm_log.close()
        outer_tqdm_log.close()

        # let's generate some plots!

        fig = go.Figure()
        fig_k = go.Figure()


        for dataset in metrics_dict.keys():
            # Plot of the precision vs recall

            fig.add_trace(
                go.Scatter(
                    x=metrics_df_dict[dataset]['recall'],
                    y=metrics_df_dict[dataset]['precision'],
                    mode=SCATTER_PLOT_MODE,
                    text=metrics_df_dict[dataset]['threshold'], 
                    name=dataset
                )
            )

        fig.update_layout(
            xaxis_title="Recall",
            yaxis_title="Precision",
            xaxis=dict(range=[0., 1]),
            yaxis=dict(range=[0., 1])
        )

        file_to_write = os.path.join(OUTPUT_DIR, 'precision_vs_recall.html')
        fig.write_html(file_to_write)
        written_files.append(file_to_write)

        if len(id_classes) > 1:
            for dataset in metrics_dict_by_cl.keys():

                for id_cl in id_classes:

                    fig_k.add_trace(
                        go.Scatter(
                            x=metrics_cl_df_dict[dataset]['recall_k'][metrics_cl_df_dict[dataset]['class']==id_cl],
                            y=metrics_cl_df_dict[dataset]['precision_k'][metrics_cl_df_dict[dataset]['class']==id_cl],
                            mode='markers+lines',
                            text=metrics_cl_df_dict[dataset]['threshold'][metrics_cl_df_dict[dataset]['class']==id_cl],
                            name=dataset+'_'+str(id_cl)
                        )
                    )

            fig_k.update_layout(
                xaxis_title="Recall",
                yaxis_title="Precision",
                xaxis=dict(range=[0., 1]),
                yaxis=dict(range=[0., 1])
            )

            file_to_write = os.path.join(OUTPUT_DIR, 'precision_vs_recall_dep_on_class.html')
            fig_k.write_html(file_to_write)
            written_files.append(file_to_write)


        for dataset in metrics_dict_by_cl.keys():
            # Generate a plot of TP, FN and FP for each class

            fig = go.Figure()

            for id_cl in id_classes:
                
                for y in ['TP_k', 'FN_k', 'FP_k']:

                    fig.add_trace(
                        go.Scatter(
                                x=metrics_cl_df_dict[dataset]['threshold'][metrics_cl_df_dict[dataset]['class']==id_cl],
                                y=metrics_cl_df_dict[dataset][y][metrics_cl_df_dict[dataset]['class']==id_cl],
                                mode=SCATTER_PLOT_MODE,
                                name=y[0:2]+'_'+str(id_cl)
                            )
                        )

                fig.update_layout(xaxis_title="threshold", yaxis_title="#")
                
            if len(id_classes) > 1:
                file_to_write = os.path.join(OUTPUT_DIR, f'{dataset}_TP-FN-FP_vs_threshold_dep_on_class.html')

            else:
                file_to_write = os.path.join(OUTPUT_DIR, f'{dataset}_TP-FN-FP_vs_threshold.html')

            fig.write_html(file_to_write)
            written_files.append(file_to_write)


        for dataset in metrics_dict.keys():

            fig = go.Figure()

            for y in ['precision', 'recall', 'f1']:

                fig.add_trace(
                    go.Scatter(
                        x=metrics_df_dict[dataset]['threshold'],
                        y=metrics_df_dict[dataset][y],
                        mode=SCATTER_PLOT_MODE,
                        name=y
                    )
                )

            fig.update_layout(xaxis_title="threshold")

            file_to_write = os.path.join(OUTPUT_DIR, f'{dataset}_metrics_vs_threshold.html')
            fig.write_html(file_to_write)
            written_files.append(file_to_write)


        # ------ tagging detections

        # we select the threshold which maximizes the f1-score on the val dataset or the one passed by the user
        if 'val' in metrics_cl_df_dict.keys() and CONFIDENCE_THRESHOLD:
            logger.error('The confidence threshold was determined over the val dataset, but a confidence threshold is given in the config file.')
            logger.error(f'confidence threshold: val dataset = {metrics_df_dict["val"].loc[metrics_df_dict["val"]["f1"].argmax(), "threshold"]}, config = {CONFIDENCE_THRESHOLD}')
            logger.warning('The confidence threshold from the config file is used.')
        if CONFIDENCE_THRESHOLD:
            selected_threshold = CONFIDENCE_THRESHOLD
            logger.info(f"Tagging detections with threshold = {selected_threshold:.2f}, which is the threshold given in the config file.")
        elif 'val' in metrics_cl_df_dict.keys():
            selected_threshold = metrics_df_dict['val'].loc[metrics_df_dict['val']['f1'].argmax(), 'threshold']
            logger.info(f"Tagging detections with threshold = {selected_threshold:.2f}, which maximizes the f1-score on the val dataset.")
        else:
            raise AttributeError('No confidence threshold can be determined without the validation dataset or the passed value.')

        tagged_dets_gdf_dict = {}

        # TRUE/FALSE POSITIVES, FALSE NEGATIVES

        logger.info(f'Method to compute the metrics = {METHOD}')

        global_metrics_dict = {'dataset': [], 'precision': [], 'recall': [], 'f1': []}
        for dataset in metrics_dict.keys():

            tmp_gdf = dets_gdf_dict[dataset].copy()
            tmp_gdf.to_crs(epsg=clipped_labels_w_id_gdf.crs.to_epsg(), inplace=True)
            tmp_gdf = tmp_gdf[tmp_gdf.score >= selected_threshold].copy()

            tp_gdf, fp_gdf, fn_gdf, mismatched_class_gdf, small_poly_gdf = metrics.get_fractional_sets(
                tmp_gdf, 
                clipped_labels_w_id_gdf[clipped_labels_w_id_gdf.dataset == dataset],
                IOU_THRESHOLD, AREA_THRESHOLD
            )
            tp_gdf['tag'] = 'TP'
            tp_gdf['dataset'] = dataset
            fp_gdf['tag'] = 'FP'
            fp_gdf['dataset'] = dataset
            fn_gdf['tag'] = 'FN'
            fn_gdf['dataset'] = dataset
            mismatched_class_gdf['tag'] = 'wrong class'
            mismatched_class_gdf['dataset'] = dataset
            small_poly_gdf['tag'] = 'small polygon'
            small_poly_gdf['dataset'] = dataset

            tagged_dets_gdf_dict[dataset] = pd.concat([tp_gdf, fp_gdf, fn_gdf, mismatched_class_gdf, small_poly_gdf])

            _, _, _, _, _, precision, recall, f1 = metrics.get_metrics(tp_gdf, fp_gdf, fn_gdf, mismatched_class_gdf, id_classes, method=METHOD)
            global_metrics_dict['dataset'].append(dataset)
            global_metrics_dict['precision'].append(precision)
            global_metrics_dict['recall'].append(recall)
            global_metrics_dict['f1'].append(f1)
            logger.info(f'Dataset = {dataset} => precision = {precision:.3f}, recall = {recall:.3f}, f1 = {f1:.3f}')

        tagged_dets_gdf = pd.concat([
            tagged_dets_gdf_dict[x] for x in metrics_dict.keys()
        ])
        tagged_dets_gdf['det_category'] = [
            categories_info_df.loc[categories_info_df.label_class==det_class+1, 'CATEGORY'].iloc[0] 
            if not np.isnan(det_class) else None
            for det_class in tagged_dets_gdf.det_class.to_numpy()
        ] 

        file_to_write = os.path.join(OUTPUT_DIR, 'tagged_detections.gpkg')
        cols = ['geometry', 'score', 'tag', 'dataset', 'label_class', 'CATEGORY', 'det_class', 'det_category']
        if 'year_label' in labels_gdf.keys():
            cols.extend(['year_det', 'year_label'])
        tagged_dets_gdf[cols].to_file(file_to_write, driver='GPKG', index=False)
        written_files.append(file_to_write)

        # Save the metrics by class for each dataset
        metrics_by_cl_df = pd.DataFrame()
        for dataset in metrics_cl_df_dict.keys():
            dataset_df = metrics_cl_df_dict[dataset].copy()
            dataset_thrsld_df = dataset_df[dataset_df.threshold==selected_threshold].copy()
            dataset_thrsld_df['dataset'] = dataset
            dataset_thrsld_df.drop(columns=['threshold'], inplace=True)

            metrics_by_cl_df = pd.concat([metrics_by_cl_df, dataset_thrsld_df], ignore_index=True)
        
        metrics_by_cl_df['category'] = [
            categories_info_df.loc[categories_info_df.label_class==det_class+1, 'CATEGORY'].iloc[0] 
            for det_class in metrics_by_cl_df['class'].to_numpy()
        ] 

        file_to_write = os.path.join(OUTPUT_DIR, 'metrics_by_class.csv')
        metrics_by_cl_df[
            ['class', 'category', 'TP_k', 'FP_k', 'FN_k', 'precision_k', 'recall_k', 'dataset']
        ].sort_values(by=['dataset', 'class']).to_csv(file_to_write, index=False)
        written_files.append(file_to_write)

        tmp_df = metrics_by_cl_df[['dataset', 'TP_k', 'FP_k', 'FN_k']].groupby(by='dataset', as_index=False).sum()
        tmp_df2 = pd.DataFrame(global_metrics_dict, index = range(len(dets_gdf_dict.keys())))
        global_metrics_df = tmp_df.merge(tmp_df2, on='dataset')
        global_metrics_df.rename({'TP_k': 'TP', 'FP_k': 'FP', 'FN_k': 'FN', 'precision_k': 'precision', 'recall_k': 'recall'}, inplace=True)

        file_to_write = os.path.join(OUTPUT_DIR, 'global_metrics.csv')
        global_metrics_df.to_csv(file_to_write, index=False)
        written_files.append(file_to_write)

        # Save the confusion matrix
        na_value_category = tagged_dets_gdf.CATEGORY.isna()
        sorted_classes = tagged_dets_gdf.loc[~na_value_category, 'CATEGORY'].sort_values().unique().tolist() + ['background']
        tagged_dets_gdf.loc[na_value_category, 'CATEGORY'] = 'background'
        tagged_dets_gdf.loc[tagged_dets_gdf.det_category.isna(), 'det_category'] = 'background'
        
        for dataset in tagged_dets_gdf.dataset.unique():
            tagged_dataset_gdf = tagged_dets_gdf[tagged_dets_gdf.dataset == dataset].copy()

            true_class = tagged_dataset_gdf.CATEGORY.to_numpy()
            detected_class = tagged_dataset_gdf.det_category.to_numpy()

            confusion_array = confusion_matrix(true_class, detected_class, labels=sorted_classes)
            confusion_df = pd.DataFrame(confusion_array, index=sorted_classes, columns=sorted_classes, dtype='int64')
            confusion_df.rename(columns={'background': 'missed labels'}, inplace=True)

            file_to_write = os.path.join(OUTPUT_DIR, f'{dataset}_confusion_matrix.csv')
            confusion_df.to_csv(file_to_write)
            written_files.append(file_to_write)


    # ------ wrap-up

    print()
    logger.info("The following files were written. Let's check them out!")
    for written_file in written_files:
        logger.info(written_file)

    print()

    toc = time.time()
    logger.success(f"Nothing left to be done: exiting. Elapsed time: {(toc-tic):.2f} seconds")

    sys.stderr.flush()


if __name__ == "__main__":

    parser = argparse.ArgumentParser(description="This script assesses the quality of detections with respect to ground-truth/other labels.")
    parser.add_argument('config_file', type=str, help='a YAML config file')
    args = parser.parse_args()

    main(args.config_file)