# Copyright (c) OpenMMLab. All rights reserved.
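# Gather benchmarked model evaluation results: for each model listed in the
# test config, load the latest eval json found under ``root``, compare it
# with the previously recorded metrics, and dump the differences to ``--out``.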
import argparse
import glob
import os.path as osp

import mmcv
from mmcv import Config


def parse_args():
    parser = argparse.ArgumentParser(
        description='Gather benchmarked model evaluation results')
    parser.add_argument('config', help='test config file path')
    parser.add_argument(
        'root',
        type=str,
        help='root path of benchmarked models to be gathered')
    parser.add_argument(
        '--out',
        type=str,
        default='benchmark_evaluation_info.json',
        help='output path of gathered metrics and compared '
        'results to be stored')

    args = parser.parse_args()
    return args


if __name__ == '__main__':
    args = parse_args()

    root_path = args.root
    metrics_out = args.out
    result_dict = {}

    cfg = Config.fromfile(args.config)
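    # Each entry in the test config maps a model name to one benchmark
    # record (or a list of records) holding the model's config path and the
    # previously recorded metrics, e.g. (illustrative values only):
    #   retinanet_r50_fpn_1x_coco = dict(
    #       config='configs/retinanet/retinanet_r50_fpn_1x_coco.py',
    #       metric=dict(bbox_mAP=36.5))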
    for model_key in cfg:
        model_infos = cfg[model_key]
        if not isinstance(model_infos, list):
            model_infos = [model_infos]
        for model_info in model_infos:
            previous_metrics = model_info['metric']
            config = model_info['config'].strip()
            fname, _ = osp.splitext(osp.basename(config))
            # Load the benchmark evaluation jsons gathered for this model
            metric_json_dir = osp.join(root_path, fname)
            if not osp.exists(metric_json_dir):
                print(f'{metric_json_dir} does not exist.')
                continue

            json_list = glob.glob(osp.join(metric_json_dir, '*.json'))
            if len(json_list) == 0:
                print(f'There is no eval json in {metric_json_dir}.')
                continue
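            # Use the lexicographically last eval json, which is the newest
            # one assuming timestamp-named log files.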
            log_json_path = list(sorted(json_list))[-1]
            metric = mmcv.load(log_json_path)
            if config not in metric.get('config', {}):
                print(f'{config} not included in {log_json_path}')
                continue
            # Compare the new benchmark results with the previous metrics
            differential_results = dict()
            new_metrics = dict()
            for record_metric_key in previous_metrics:
                if record_metric_key not in metric['metric']:
                    raise KeyError(f'{record_metric_key} does not exist, '
                                   'please check your config')
                old_metric = previous_metrics[record_metric_key]
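                # The loaded value is scaled by 100 so it is on the same
                # (percentage) scale as the metric recorded in the config.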
                new_metric = round(metric['metric'][record_metric_key] * 100,
                                   2)
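                # Record the change versus the previous value as a signed
                # string, e.g. '+0.30' or '-0.10'.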
                differential = new_metric - old_metric
                flag = '+' if differential > 0 else '-'
                differential_results[
                    record_metric_key] = f'{flag}{abs(differential):.2f}'
                new_metrics[record_metric_key] = new_metric
            result_dict[config] = dict(
                differential=differential_results,
                previous=previous_metrics,
                new=new_metrics)
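    # Dump the gathered comparison to json and print a short summary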
    if metrics_out:
        mmcv.dump(result_dict, metrics_out, indent=4)
    print('===================================')
    for config_name, metrics in result_dict.items():
        print(config_name, metrics)
    print('===================================')