# EasyCV/easycv/predictors/classifier.py
# Copyright (c) Alibaba, Inc. and its affiliates.
import glob
import math
import os
import numpy as np
import torch
from PIL import Image
from easycv.file import io
from easycv.framework.errors import ValueError
from easycv.utils.checkpoint import load_checkpoint
from easycv.utils.misc import deprecated
from .base import InputProcessor, OutputProcessor, Predictor, PredictorV2
from .builder import PREDICTORS
# onnx specific
def onnx_to_numpy(tensor):
return tensor.detach().cpu().numpy(
) if tensor.requires_grad else tensor.cpu().numpy()
class ClsInputProcessor(InputProcessor):
"""Process inputs for classification models.
Args:
cfg (Config): Config instance.
pipelines (list[dict]): Data pipeline configs.
        batch_size (int): Batch size for forward.
        pil_input (bool): Whether to use PIL images as input. Set to True if the
            pipeline requires PIL input. Defaults to True.
        threads (int): Number of workers used to process inputs in parallel.
        mode (str): The image mode fed into the model.
"""
def __init__(self,
cfg,
pipelines=None,
batch_size=1,
pil_input=True,
threads=8,
mode='BGR'):
super(ClsInputProcessor, self).__init__(
cfg, pipelines=pipelines, batch_size=batch_size, threads=threads)
self.mode = mode
self.pil_input = pil_input
def _load_input(self, input):
"""Load image from file or numpy or PIL object.
Args:
input: File path or numpy or PIL object.
Returns:
{
'filename': filename,
'img': img,
'img_shape': img_shape,
'img_fields': ['img']
}
"""
if self.pil_input:
results = {}
if isinstance(input, str):
img = Image.open(input)
if img.mode.upper() != self.mode.upper():
img = img.convert(self.mode.upper())
results['filename'] = input
else:
if isinstance(input, np.ndarray):
input = Image.fromarray(input)
# assert isinstance(input, ImageFile.ImageFile)
img = input
results['filename'] = None
results['img'] = img
results['img_shape'] = img.size
results['ori_shape'] = img.size
results['img_fields'] = ['img']
return results
return super()._load_input(input)
class ClsOutputProcessor(OutputProcessor):
"""Output processor for processing classification model outputs.
Args:
topk (int): Return top-k results. Default: 1.
        label_map (dict | list): Mapping from class id to class name; a list indexed by class id also works.
"""
def __init__(self, topk=1, label_map={}):
self.topk = topk
self.label_map = label_map
super(ClsOutputProcessor, self).__init__()
def __call__(self, inputs):
"""Return top-k results."""
output_prob = inputs['prob'].data.cpu()
topk_class = torch.topk(output_prob, self.topk).indices.numpy()
output_prob = output_prob.numpy()
batch_results = []
batch_size = output_prob.shape[0]
for i in range(batch_size):
result = {'class': np.squeeze(topk_class[i]).tolist()}
if isinstance(result['class'], int):
result['class'] = [result['class']]
if len(self.label_map) > 0:
result['class_name'] = [
self.label_map[i] for i in result['class']
]
result['class_probs'] = {}
for l_idx, l_name in enumerate(self.label_map):
result['class_probs'][l_name] = output_prob[i][l_idx]
batch_results.append(result)
return batch_results
@PREDICTORS.register_module()
class ClassificationPredictor(PredictorV2):
"""Predictor for classification.
Args:
        model_path (str): Path of the model file.
        config_file (Optional[str]): Config file path for initializing the model and processor. Defaults to None.
        batch_size (int): Batch size for forward.
        device (str): Support 'cuda' or 'cpu'. If None, the device is detected automatically.
        save_results (bool): Whether to save predict results.
        save_path (str): File path for saving results, only valid when `save_results` is True.
        pipelines (list[dict]): Data pipeline configs.
        topk (int): Return top-k results. Default: 1.
        pil_input (bool): Whether to use PIL images as input. Set to True if the
            pipeline requires PIL input. Defaults to True.
        label_map_path (str): File path of the label list, one class name per line.
        input_processor_threads (int): Number of workers used to process inputs in parallel.
        mode (str): The image mode fed into the model.
"""
def __init__(self,
model_path,
config_file=None,
batch_size=1,
device=None,
save_results=False,
save_path=None,
pipelines=None,
topk=1,
pil_input=True,
label_map_path=None,
input_processor_threads=8,
mode='BGR',
*args,
**kwargs):
self.topk = topk
self.pil_input = pil_input
self.label_map_path = label_map_path
        if model_path.endswith('onnx'):
            self.model_type = 'onnx'
            pwd_model = os.path.dirname(model_path)
            raw_model = glob.glob(
                os.path.join(pwd_model, '*.onnx.config.json'))
            if len(raw_model) != 0:
                config_file = raw_model[0]
            else:
                raise ValueError(
                    'Please provide a file with the .onnx.config.json extension '
                    'in the directory of the onnx model.')
else:
self.model_type = 'raw'
        # Adapt to torchvision transforms which process PIL inputs.
        if self.pil_input:
            mode = 'RGB'
super(ClassificationPredictor, self).__init__(
model_path,
config_file=config_file,
batch_size=batch_size,
device=device,
save_results=save_results,
save_path=save_path,
pipelines=pipelines,
input_processor_threads=input_processor_threads,
mode=mode,
*args,
**kwargs)
def get_input_processor(self):
return ClsInputProcessor(
self.cfg,
pipelines=self.pipelines,
batch_size=self.batch_size,
threads=self.input_processor_threads,
pil_input=self.pil_input,
mode=self.mode)
def get_output_processor(self):
if self.label_map_path is None:
if 'CLASSES' in self.cfg:
class_list = self.cfg.get('CLASSES', [])
elif 'class_list' in self.cfg:
class_list = self.cfg.get('class_list', [])
else:
class_list = []
else:
with io.open(self.label_map_path, 'r') as f:
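                # The label file is expected to hold one class name per line,
                # e.g. "cat", "dog" (illustrative names).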
class_list = f.readlines()
self.label_map = [i.strip() for i in class_list]
return ClsOutputProcessor(topk=self.topk, label_map=self.label_map)
def prepare_model(self):
"""Build model from config file by default.
        If the model is not built from a configuration file (e.g. a torch jit model), you need to reimplement this method.
"""
if self.model_type == 'raw':
model = self._build_model()
model.to(self.device)
model.eval()
load_checkpoint(model, self.model_path, map_location='cpu')
return model
else:
import onnxruntime
if onnxruntime.get_device() == 'GPU':
onnx_model = onnxruntime.InferenceSession(
self.model_path, providers=['CUDAExecutionProvider'])
else:
onnx_model = onnxruntime.InferenceSession(self.model_path)
return onnx_model
def model_forward(self, inputs):
"""Model forward.
        If you need to refactor the model forward, reimplement this method.
"""
with torch.no_grad():
if self.model_type == 'raw':
outputs = self.model(**inputs, mode='test')
else:
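                # ONNX path: feed the first graph input with the preprocessed image
                # batch converted to numpy; run() returns a list of outputs and the
                # first one holds the classification probabilities.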
outputs = self.model.run(None, {
self.model.get_inputs()[0].name:
onnx_to_numpy(inputs['img'])
})[0]
outputs = dict(prob=torch.from_numpy(outputs))
return outputs
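

# A minimal usage sketch for ClassificationPredictor; the paths below are
# placeholders, not files shipped with this repo.
#
#   predictor = ClassificationPredictor(
#       model_path='work_dirs/cls/epoch_100.pth',
#       config_file='configs/classification/imagenet/resnet/resnet50.py',
#       topk=5)
#   results = predictor(['demo/cat.jpg'])
#   # -> [{'class': [...], 'class_name': [...], 'class_probs': {...}}]

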
try:
    from easy_vision.python.inference.predictor import PredictorInterface
except ImportError:
    from .interface import PredictorInterface
@deprecated(reason='Please use ClassificationPredictor.')
@PREDICTORS.register_module()
class TorchClassifier(PredictorInterface):
def __init__(self,
model_path,
model_config=None,
topk=1,
label_map_path=None):
"""
init model
Args:
model_path: model file path
model_config: config string for model to init, in json format
"""
self.predictor = Predictor(model_path)
if 'class_list' not in self.predictor.cfg and \
'CLASSES' not in self.predictor.cfg and \
label_map_path is None:
raise ValueError(
"'label_map_path' need to be set, when ckpt doesn't contain key 'class_list' and 'CLASSES'!"
)
if label_map_path is None:
class_list = self.predictor.cfg.get('class_list', [])
if len(class_list) < 1:
class_list = self.predictor.cfg.get('CLASSES', [])
self.label_map = [i.strip() for i in class_list]
        else:
            with open(label_map_path, 'r') as f:
                class_list = f.readlines()
            self.label_map = [i.strip() for i in class_list]
self.output_name = ['prob', 'class']
self.topk = topk if topk < len(class_list) else len(class_list)
def get_output_type(self):
"""
        In this function the user should return a type dict, which indicates
        which type each output of the predictor should be converted to:
        * type json, data will be serialized to a json str
        * type image, data will be encoded as image binary and written to an oss file
          named output_dir/${key}/${input_filename}_${idx}.jpg, where input_filename
          is the base filename extracted from the url, key corresponds to the key in the output_type dict,
          and if the data indexed by key is a list, idx is the index of the element in the list, otherwise ${idx} is empty
        * type video, data will be encoded as video binary and written to an oss file
        :: return {
            'image': 'image',
            'feature': 'json'
        }
        indicating that the image data in the output dict will be saved to an image
        file and the feature in the output dict will be converted to json
"""
return {}
def batch(self, image_tensor_list):
return torch.stack(image_tensor_list)
def predict(self, input_data_list, batch_size=-1):
"""
        Run prediction on a number of samples using batch_size.

        Args:
            input_data_list: a list of numpy arrays, each array is a sample to be predicted
            batch_size: batch_size passed by the caller; you can also ignore this param and
                use a fixed number if you do not want to adjust batch_size at runtime
        Return:
            result: a list of dicts, each dict is the prediction result of one sample,
                e.g. {"output1": value1, "output2": value2}; the value type can be
                python int, str, float, or numpy array
"""
num_image = len(input_data_list)
assert len(
input_data_list) > 0, 'input images should not be an empty list'
if batch_size > 0:
num_batches = int(math.ceil(float(num_image) / batch_size))
image_list = input_data_list
else:
num_batches = 1
batch_size = len(input_data_list)
image_list = input_data_list
outputs_list = []
for batch_idx in range(num_batches):
batch_image_list = image_list[batch_idx * batch_size:min(
(batch_idx + 1) * batch_size, len(image_list))]
image_tensor_list = self.predictor.preprocess(batch_image_list)
input_data = self.batch(image_tensor_list)
output_prob = self.predictor.predict_batch(
input_data, mode='test')['prob'].data.cpu()
            topk_result = torch.topk(output_prob, self.topk)
            topk_prob = topk_result.values.numpy()
            topk_class = topk_result.indices.numpy()
            output_prob = output_prob.numpy()
for idx in range(len(image_tensor_list)):
single_result = {}
single_result['class'] = np.squeeze(topk_class[idx]).tolist()
if isinstance(single_result['class'], int):
single_result['class'] = [single_result['class']]
single_result['class_name'] = [
self.label_map[i] for i in single_result['class']
]
single_result['class_probs'] = {}
for ldx, i in enumerate(self.label_map):
single_result['class_probs'][i] = output_prob[idx][ldx]
outputs_list.append(single_result)
return outputs_list
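

# A minimal sketch of the deprecated interface; the image path below is a placeholder.
#
#   classifier = TorchClassifier('work_dirs/cls/epoch_100.pth', topk=3)
#   imgs = [np.asarray(Image.open('demo/cat.jpg').convert('RGB'))]
#   results = classifier.predict(imgs, batch_size=1)
#   # -> [{'class': [...], 'class_name': [...], 'class_probs': {...}}]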