mirror of https://github.com/RE-OWOD/RE-OWOD
320 lines
11 KiB
Python
320 lines
11 KiB
Python
#!/usr/bin/env python3
|
|
# Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved
|
|
|
|
import argparse
|
|
import glob
|
|
import logging
|
|
import os
|
|
import pickle
|
|
import sys
|
|
from typing import Any, ClassVar, Dict, List
|
|
import torch
|
|
|
|
from detectron2.config import get_cfg
|
|
from detectron2.data.detection_utils import read_image
|
|
from detectron2.engine.defaults import DefaultPredictor
|
|
from detectron2.structures.boxes import BoxMode
|
|
from detectron2.structures.instances import Instances
|
|
from detectron2.utils.logger import setup_logger
|
|
|
|
from densepose import add_densepose_config, add_hrnet_config
|
|
from densepose.utils.logger import verbosity_to_level
|
|
from densepose.vis.base import CompoundVisualizer
|
|
from densepose.vis.bounding_box import ScoredBoundingBoxVisualizer
|
|
from densepose.vis.densepose import (
|
|
DensePoseResultsContourVisualizer,
|
|
DensePoseResultsFineSegmentationVisualizer,
|
|
DensePoseResultsUVisualizer,
|
|
DensePoseResultsVVisualizer,
|
|
)
|
|
from densepose.vis.extractor import CompoundExtractor, create_extractor
|
|
|
|
DOC = """Apply Net - a tool to print / visualize DensePose results
|
|
"""
|
|
|
|
LOGGER_NAME = "apply_net"
|
|
logger = logging.getLogger(LOGGER_NAME)
|
|
|
|
_ACTION_REGISTRY: Dict[str, "Action"] = {}
|
|
|
|
|
|
class Action(object):
|
|
@classmethod
|
|
def add_arguments(cls: type, parser: argparse.ArgumentParser):
|
|
parser.add_argument(
|
|
"-v",
|
|
"--verbosity",
|
|
action="count",
|
|
help="Verbose mode. Multiple -v options increase the verbosity.",
|
|
)
|
|
|
|
|
|
def register_action(cls: type):
|
|
"""
|
|
Decorator for action classes to automate action registration
|
|
"""
|
|
global _ACTION_REGISTRY
|
|
_ACTION_REGISTRY[cls.COMMAND] = cls
|
|
return cls
|
|
|
|
|
|
class InferenceAction(Action):
|
|
@classmethod
|
|
def add_arguments(cls: type, parser: argparse.ArgumentParser):
|
|
super(InferenceAction, cls).add_arguments(parser)
|
|
parser.add_argument("cfg", metavar="<config>", help="Config file")
|
|
parser.add_argument("model", metavar="<model>", help="Model file")
|
|
parser.add_argument("input", metavar="<input>", help="Input data")
|
|
parser.add_argument(
|
|
"--opts",
|
|
help="Modify config options using the command-line 'KEY VALUE' pairs",
|
|
default=[],
|
|
nargs=argparse.REMAINDER,
|
|
)
|
|
|
|
@classmethod
|
|
def execute(cls: type, args: argparse.Namespace):
|
|
logger.info(f"Loading config from {args.cfg}")
|
|
opts = []
|
|
cfg = cls.setup_config(args.cfg, args.model, args, opts)
|
|
logger.info(f"Loading model from {args.model}")
|
|
predictor = DefaultPredictor(cfg)
|
|
logger.info(f"Loading data from {args.input}")
|
|
file_list = cls._get_input_file_list(args.input)
|
|
if len(file_list) == 0:
|
|
logger.warning(f"No input images for {args.input}")
|
|
return
|
|
context = cls.create_context(args)
|
|
for file_name in file_list:
|
|
img = read_image(file_name, format="BGR") # predictor expects BGR image.
|
|
with torch.no_grad():
|
|
outputs = predictor(img)["instances"]
|
|
cls.execute_on_outputs(context, {"file_name": file_name, "image": img}, outputs)
|
|
cls.postexecute(context)
|
|
|
|
@classmethod
|
|
def setup_config(
|
|
cls: type, config_fpath: str, model_fpath: str, args: argparse.Namespace, opts: List[str]
|
|
):
|
|
cfg = get_cfg()
|
|
add_densepose_config(cfg)
|
|
add_hrnet_config(cfg)
|
|
cfg.merge_from_file(config_fpath)
|
|
cfg.merge_from_list(args.opts)
|
|
if opts:
|
|
cfg.merge_from_list(opts)
|
|
cfg.MODEL.WEIGHTS = model_fpath
|
|
cfg.freeze()
|
|
return cfg
|
|
|
|
@classmethod
|
|
def _get_input_file_list(cls: type, input_spec: str):
|
|
if os.path.isdir(input_spec):
|
|
file_list = [
|
|
os.path.join(input_spec, fname)
|
|
for fname in os.listdir(input_spec)
|
|
if os.path.isfile(os.path.join(input_spec, fname))
|
|
]
|
|
elif os.path.isfile(input_spec):
|
|
file_list = [input_spec]
|
|
else:
|
|
file_list = glob.glob(input_spec)
|
|
return file_list
|
|
|
|
|
|
@register_action
|
|
class DumpAction(InferenceAction):
|
|
"""
|
|
Dump action that outputs results to a pickle file
|
|
"""
|
|
|
|
COMMAND: ClassVar[str] = "dump"
|
|
|
|
@classmethod
|
|
def add_parser(cls: type, subparsers: argparse._SubParsersAction):
|
|
parser = subparsers.add_parser(cls.COMMAND, help="Dump model outputs to a file.")
|
|
cls.add_arguments(parser)
|
|
parser.set_defaults(func=cls.execute)
|
|
|
|
@classmethod
|
|
def add_arguments(cls: type, parser: argparse.ArgumentParser):
|
|
super(DumpAction, cls).add_arguments(parser)
|
|
parser.add_argument(
|
|
"--output",
|
|
metavar="<dump_file>",
|
|
default="results.pkl",
|
|
help="File name to save dump to",
|
|
)
|
|
|
|
@classmethod
|
|
def execute_on_outputs(
|
|
cls: type, context: Dict[str, Any], entry: Dict[str, Any], outputs: Instances
|
|
):
|
|
image_fpath = entry["file_name"]
|
|
logger.info(f"Processing {image_fpath}")
|
|
result = {"file_name": image_fpath}
|
|
if outputs.has("scores"):
|
|
result["scores"] = outputs.get("scores").cpu()
|
|
if outputs.has("pred_boxes"):
|
|
result["pred_boxes_XYXY"] = outputs.get("pred_boxes").tensor.cpu()
|
|
if outputs.has("pred_densepose"):
|
|
boxes_XYWH = BoxMode.convert(
|
|
result["pred_boxes_XYXY"], BoxMode.XYXY_ABS, BoxMode.XYWH_ABS
|
|
)
|
|
result["pred_densepose"] = outputs.get("pred_densepose").to_result(boxes_XYWH)
|
|
context["results"].append(result)
|
|
|
|
@classmethod
|
|
def create_context(cls: type, args: argparse.Namespace):
|
|
context = {"results": [], "out_fname": args.output}
|
|
return context
|
|
|
|
@classmethod
|
|
def postexecute(cls: type, context: Dict[str, Any]):
|
|
out_fname = context["out_fname"]
|
|
out_dir = os.path.dirname(out_fname)
|
|
if len(out_dir) > 0 and not os.path.exists(out_dir):
|
|
os.makedirs(out_dir)
|
|
with open(out_fname, "wb") as hFile:
|
|
pickle.dump(context["results"], hFile)
|
|
logger.info(f"Output saved to {out_fname}")
|
|
|
|
|
|
@register_action
|
|
class ShowAction(InferenceAction):
|
|
"""
|
|
Show action that visualizes selected entries on an image
|
|
"""
|
|
|
|
COMMAND: ClassVar[str] = "show"
|
|
VISUALIZERS: ClassVar[Dict[str, object]] = {
|
|
"dp_contour": DensePoseResultsContourVisualizer,
|
|
"dp_segm": DensePoseResultsFineSegmentationVisualizer,
|
|
"dp_u": DensePoseResultsUVisualizer,
|
|
"dp_v": DensePoseResultsVVisualizer,
|
|
"bbox": ScoredBoundingBoxVisualizer,
|
|
}
|
|
|
|
@classmethod
|
|
def add_parser(cls: type, subparsers: argparse._SubParsersAction):
|
|
parser = subparsers.add_parser(cls.COMMAND, help="Visualize selected entries")
|
|
cls.add_arguments(parser)
|
|
parser.set_defaults(func=cls.execute)
|
|
|
|
@classmethod
|
|
def add_arguments(cls: type, parser: argparse.ArgumentParser):
|
|
super(ShowAction, cls).add_arguments(parser)
|
|
parser.add_argument(
|
|
"visualizations",
|
|
metavar="<visualizations>",
|
|
help="Comma separated list of visualizations, possible values: "
|
|
"[{}]".format(",".join(sorted(cls.VISUALIZERS.keys()))),
|
|
)
|
|
parser.add_argument(
|
|
"--min_score",
|
|
metavar="<score>",
|
|
default=0.8,
|
|
type=float,
|
|
help="Minimum detection score to visualize",
|
|
)
|
|
parser.add_argument(
|
|
"--nms_thresh", metavar="<threshold>", default=None, type=float, help="NMS threshold"
|
|
)
|
|
parser.add_argument(
|
|
"--output",
|
|
metavar="<image_file>",
|
|
default="outputres.png",
|
|
help="File name to save output to",
|
|
)
|
|
|
|
@classmethod
|
|
def setup_config(
|
|
cls: type, config_fpath: str, model_fpath: str, args: argparse.Namespace, opts: List[str]
|
|
):
|
|
opts.append("MODEL.ROI_HEADS.SCORE_THRESH_TEST")
|
|
opts.append(str(args.min_score))
|
|
if args.nms_thresh is not None:
|
|
opts.append("MODEL.ROI_HEADS.NMS_THRESH_TEST")
|
|
opts.append(str(args.nms_thresh))
|
|
cfg = super(ShowAction, cls).setup_config(config_fpath, model_fpath, args, opts)
|
|
return cfg
|
|
|
|
@classmethod
|
|
def execute_on_outputs(
|
|
cls: type, context: Dict[str, Any], entry: Dict[str, Any], outputs: Instances
|
|
):
|
|
import cv2
|
|
import numpy as np
|
|
|
|
visualizer = context["visualizer"]
|
|
extractor = context["extractor"]
|
|
image_fpath = entry["file_name"]
|
|
logger.info(f"Processing {image_fpath}")
|
|
image = cv2.cvtColor(entry["image"], cv2.COLOR_BGR2GRAY)
|
|
image = np.tile(image[:, :, np.newaxis], [1, 1, 3])
|
|
data = extractor(outputs)
|
|
image_vis = visualizer.visualize(image, data)
|
|
entry_idx = context["entry_idx"] + 1
|
|
out_fname = cls._get_out_fname(entry_idx, context["out_fname"])
|
|
out_dir = os.path.dirname(out_fname)
|
|
if len(out_dir) > 0 and not os.path.exists(out_dir):
|
|
os.makedirs(out_dir)
|
|
cv2.imwrite(out_fname, image_vis)
|
|
logger.info(f"Output saved to {out_fname}")
|
|
context["entry_idx"] += 1
|
|
|
|
@classmethod
|
|
def postexecute(cls: type, context: Dict[str, Any]):
|
|
pass
|
|
|
|
@classmethod
|
|
def _get_out_fname(cls: type, entry_idx: int, fname_base: str):
|
|
base, ext = os.path.splitext(fname_base)
|
|
return base + ".{0:04d}".format(entry_idx) + ext
|
|
|
|
@classmethod
|
|
def create_context(cls: type, args: argparse.Namespace) -> Dict[str, Any]:
|
|
vis_specs = args.visualizations.split(",")
|
|
visualizers = []
|
|
extractors = []
|
|
for vis_spec in vis_specs:
|
|
vis = cls.VISUALIZERS[vis_spec]()
|
|
visualizers.append(vis)
|
|
extractor = create_extractor(vis)
|
|
extractors.append(extractor)
|
|
visualizer = CompoundVisualizer(visualizers)
|
|
extractor = CompoundExtractor(extractors)
|
|
context = {
|
|
"extractor": extractor,
|
|
"visualizer": visualizer,
|
|
"out_fname": args.output,
|
|
"entry_idx": 0,
|
|
}
|
|
return context
|
|
|
|
|
|
def create_argument_parser() -> argparse.ArgumentParser:
|
|
parser = argparse.ArgumentParser(
|
|
description=DOC,
|
|
formatter_class=lambda prog: argparse.HelpFormatter(prog, max_help_position=120),
|
|
)
|
|
parser.set_defaults(func=lambda _: parser.print_help(sys.stdout))
|
|
subparsers = parser.add_subparsers(title="Actions")
|
|
for _, action in _ACTION_REGISTRY.items():
|
|
action.add_parser(subparsers)
|
|
return parser
|
|
|
|
|
|
def main():
|
|
parser = create_argument_parser()
|
|
args = parser.parse_args()
|
|
verbosity = args.verbosity if hasattr(args, "verbosity") else None
|
|
global logger
|
|
logger = setup_logger(name=LOGGER_NAME)
|
|
logger.setLevel(verbosity_to_level(verbosity))
|
|
args.func(args)
|
|
|
|
|
|
if __name__ == "__main__":
|
|
main()
|