yolov5/models/experimental.py

# YOLOv5 🚀 by Ultralytics, GPL-3.0 license
"""
Experimental modules
"""
import math

import numpy as np
import torch
import torch.nn as nn

from models.common import Conv
from utils.downloads import attempt_download


class Sum(nn.Module):
    """Weighted sum of 2 or more layers https://arxiv.org/abs/1911.09070

    Adds up the first ``n`` entries of the input sequence. The first entry is always taken as-is;
    when ``weight`` is true, each later entry is scaled by ``2 * sigmoid(w[i])`` where ``w`` is a
    learnable parameter initialised to ``-arange(1, n) / 2``.

    Args:
        n: number of inputs that are summed.
        weight: whether the learnable per-input weights are applied.
    """

    def __init__(self, n, weight=False):
        super().__init__()
        self.weight = weight  # flag: scale inputs 1..n-1 by learned weights
        self.iter = range(n - 1)  # indices of the inputs that follow x[0]
        if weight:
            initial = -torch.arange(1.0, n) / 2
            self.w = nn.Parameter(initial, requires_grad=True)  # one weight per input after the first

    def forward(self, x):
        """Return x[0] plus the (optionally weighted) inputs x[1] .. x[n - 1]."""
        total = x[0]  # the first input is never weighted
        if not self.weight:
            for idx in self.iter:
                total = total + x[idx + 1]
            return total

        scale = torch.sigmoid(self.w) * 2  # each factor lies in (0, 2)
        for idx in self.iter:
            total = total + x[idx + 1] * scale[idx]
        return total


class MixConv2d(nn.Module):
    """Mixed Depth-wise Conv https://arxiv.org/abs/1907.09595

    Applies one grouped ``nn.Conv2d`` per kernel size in ``k`` to the same input, concatenates the
    branch outputs along dim 1, then applies ``BatchNorm2d(c2)`` and ``SiLU``.

    Args:
        c1: input channels.
        c2: total output channels over all branches.
        k: sequence of kernel sizes; one convolution branch is built per entry.
        s: stride used by every branch.
        equal_ch: if True, the ``c2`` output channels are split (near) evenly between branches;
            if False, branch widths are solved so that ``channels * kernel**2`` is equal across
            branches while the widths sum to ``c2``.
    """

    def __init__(self, c1, c2, k=(1, 3), s=1, equal_ch=True):  # ch_in, ch_out, kernel, stride, ch_strategy
        super().__init__()
        n = len(k)  # number of convolutions
        if equal_ch:  # equal c_ per group
            i = torch.linspace(0, n - 1E-6, c2).floor()  # branch index assigned to each of the c2 channels
            c_ = [int((i == g).sum()) for g in range(n)]  # intermediate channels
        else:  # equal weight.numel() per group
            # Linear system a @ x = b: row 0 forces sum(x) == c2, the remaining rows force
            # x[j] * k[j]**2 == x[j + 1] * k[j + 1]**2 (cyclically).
            b = [c2] + [0] * n
            a = np.eye(n + 1, n, k=-1)
            a -= np.roll(a, 1, axis=1)
            a *= np.array(k) ** 2
            a[0] = 1
            c_ = np.linalg.lstsq(a, b, rcond=None)[0].round()  # solve for equal weight indices, ax = b
            # Independent rounding can make the widths sum to c2 +/- a few channels (e.g. c2=16,
            # k=(1, 3, 5) rounds to 14 + 2 + 1 = 17), which would not match BatchNorm2d(c2) below.
            # Fold the residual into the widest branch so the total is exactly c2.
            c_[c_.argmax()] += c2 - c_.sum()
            c_ = [int(ch) for ch in c_]

        # groups=gcd(c1, ch) is the largest group count that divides both channel counts
        self.m = nn.ModuleList([
            nn.Conv2d(c1, ch, ks, s, ks // 2, groups=math.gcd(c1, ch), bias=False) for ks, ch in zip(k, c_)])
        self.bn = nn.BatchNorm2d(c2)
        self.act = nn.SiLU()

    def forward(self, x):
        """Run every branch on ``x``, concatenate on dim 1, then normalise and activate."""
        return self.act(self.bn(torch.cat([m(x) for m in self.m], 1)))


class Ensemble(nn.ModuleList):
    """Ensemble of models.

    A ModuleList whose forward pass feeds the same input to every member and joins the members'
    first outputs along dim 1 (the "nms ensemble" combination).
    """

    def __init__(self):
        super().__init__()

    def forward(self, x, augment=False, profile=False, visualize=False):
        """Call every member with the same arguments and concatenate their first outputs.

        Returns:
            Tuple ``(y, None)``: the concatenated inference output and a ``None`` placeholder for
            the train output.
        """
        outputs = []
        for member in self:
            result = member(x, augment, profile, visualize)
            outputs.append(result[0])  # keep only the first element of each member's output
        # Alternative combinations: torch.stack(outputs).max(0)[0] (max ensemble) or
        # torch.stack(outputs).mean(0) (mean ensemble).
        merged = torch.cat(outputs, 1)  # nms ensemble
        return merged, None  # inference, train output


def attempt_load(weights, device=None, inplace=True, fuse=True):
    """Load an ensemble of models weights=[a,b,c] or a single model weights=[a] or weights=a.

    Args:
        weights: one checkpoint reference, or a list/tuple of them. Each entry is passed through
            ``attempt_download`` and the result is given to ``torch.load``.
        device: forwarded to ``.to(device)`` on every loaded model.
        inplace: value written to the ``inplace`` attribute of activation, Detect and Model modules.
        fuse: if true, ``fuse()`` is called on each model before it is put in eval mode.

    Returns:
        The loaded model itself when exactly one checkpoint was given; otherwise an ``Ensemble``
        carrying ``names``, ``nc`` and ``yaml`` copied from its first member and the ``stride`` of
        the member whose maximum stride is largest.

    Raises:
        AssertionError: if the ensemble members do not all have the same ``nc``.
    """
    from models.yolo import Detect, Model  # imported inside the function rather than at module level

    model = Ensemble()
    # Tuples are accepted as well as lists; any other value is treated as a single checkpoint.
    for w in weights if isinstance(weights, (list, tuple)) else [weights]:
        # NOTE(security): torch.load unpickles the file, which can execute arbitrary code.
        # Only load checkpoints from sources you trust.
        ckpt = torch.load(attempt_download(w), map_location='cpu')  # load
        # Use the 'ema' entry when it is present and truthy, otherwise fall back to 'model'
        ckpt = (ckpt.get('ema') or ckpt['model']).to(device).float()  # FP32 model
        model.append(ckpt.fuse().eval() if fuse else ckpt.eval())  # fused or un-fused model in eval mode

    # Compatibility updates
    for m in model.modules():
        t = type(m)  # exact type match on purpose: subclasses are not patched
        if t in (nn.Hardswish, nn.LeakyReLU, nn.ReLU, nn.ReLU6, nn.SiLU, Detect, Model):
            m.inplace = inplace  # torch 1.7.0 compatibility
            if t is Detect and not isinstance(m.anchor_grid, list):
                # Drop the existing non-list attribute, then install a list with one
                # placeholder tensor per detection layer (m.nl entries).
                delattr(m, 'anchor_grid')
                setattr(m, 'anchor_grid', [torch.zeros(1)] * m.nl)
        elif t is nn.Upsample and not hasattr(m, 'recompute_scale_factor'):
            m.recompute_scale_factor = None  # torch 1.11.0 compatibility

    if len(model) == 1:
        return model[-1]  # return model
    print(f'Ensemble created with {weights}\n')
    for k in 'names', 'nc', 'yaml':
        setattr(model, k, getattr(model[0], k))
    model.stride = model[torch.argmax(torch.tensor([m.stride.max() for m in model])).int()].stride  # max stride
    assert all(model[0].nc == m.nc for m in model), f'Models have different class counts: {[m.nc for m in model]}'
    return model  # return ensemble
Standardize headers and docstrings (#4417) * Implement new headers * Reformat 1 * Reformat 2 * Reformat 3 - math * Reformat 4 - yaml 2021-08-15 03:17:51 +08:00			`# YOLOv5 🚀 by Ultralytics, GPL-3.0 license`
			`"""`
			`Experimental modules`
			`"""`
Fix MixConv2d() remove shortcut + apply depthwise (#5410) 2021-10-30 19:38:51 +08:00			`import math`
precommit: isort (#5493) * precommit: isort * [pre-commit.ci] auto fixes from pre-commit.com hooks for more information, see https://pre-commit.ci * Update isort config * [pre-commit.ci] auto fixes from pre-commit.com hooks for more information, see https://pre-commit.ci * Update name Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com> Co-authored-by: Glenn Jocher <glenn.jocher@ultralytics.com> 2021-11-05 00:24:25 +08:00
Explicit Imports (#498) * expand imports * optimize * miss * fix 2020-08-03 06:47:36 +08:00			`import numpy as np`
			`import torch`
			`import torch.nn as nn`

Standardize headers and docstrings (#4417) * Implement new headers * Reformat 1 * Reformat 2 * Reformat 3 - math * Reformat 4 - yaml 2021-08-15 03:17:51 +08:00			`from models.common import Conv`
Train from `--data path/to/dataset.zip` feature (#4185) * Train from `--data path/to/dataset.zip` feature * Update dataset_stats() * cleanup * cleanup2 2021-07-28 08:04:10 +08:00			`from utils.downloads import attempt_download`
initial commit 2020-05-30 08:04:54 +08:00

			`class Sum(nn.Module):`
PyTorch Hub updates 2020-06-11 10:11:11 +08:00			`# Weighted sum of 2 or more layers https://arxiv.org/abs/1911.09070`
initial commit 2020-05-30 08:04:54 +08:00			`def __init__(self, n, weight=False): # n: number of inputs`
Module `super().__init__()` (#4065) * Module `super().__init__()` * remove NMS 2021-07-19 18:41:15 +08:00			`super().__init__()`
initial commit 2020-05-30 08:04:54 +08:00			`self.weight = weight # apply weights boolean`
			`self.iter = range(n - 1) # iter object`
			`if weight:`
Fix float zeros format (#5491) * Fix float zeros format * 255 to integer 2021-11-04 06:36:53 +08:00			`self.w = nn.Parameter(-torch.arange(1.0, n) / 2, requires_grad=True) # layer weights`
initial commit 2020-05-30 08:04:54 +08:00
			`def forward(self, x):`
			`y = x[0] # no weight`
			`if self.weight:`
			`w = torch.sigmoid(self.w) * 2`
			`for i in self.iter:`
			`y = y + x[i + 1] * w[i]`
			`else:`
			`for i in self.iter:`
			`y = y + x[i + 1]`
			`return y`


PyTorch Hub updates 2020-06-11 10:11:11 +08:00			`class MixConv2d(nn.Module):`
Add `DWConvClass()` (#4274) * Add `DWConvClass()` * Cleanup * Cleanup2 2021-08-02 21:36:30 +08:00			`# Mixed Depth-wise Conv https://arxiv.org/abs/1907.09595`
Fix MixConv2d() remove shortcut + apply depthwise (#5410) 2021-10-30 19:38:51 +08:00			`def __init__(self, c1, c2, k=(1, 3), s=1, equal_ch=True): # ch_in, ch_out, kernel, stride, ch_strategy`
Module `super().__init__()` (#4065) * Module `super().__init__()` * remove NMS 2021-07-19 18:41:15 +08:00			`super().__init__()`
Fix MixConv2d() remove shortcut + apply depthwise (#5410) 2021-10-30 19:38:51 +08:00			`n = len(k) # number of convolutions`
PyTorch Hub updates 2020-06-11 10:11:11 +08:00			`if equal_ch: # equal c_ per group`
Fix MixConv2d() remove shortcut + apply depthwise (#5410) 2021-10-30 19:38:51 +08:00			`i = torch.linspace(0, n - 1E-6, c2).floor() # c2 indices`
			`c_ = [(i == g).sum() for g in range(n)] # intermediate channels`
PyTorch Hub updates 2020-06-11 10:11:11 +08:00			`else: # equal weight.numel() per group`
Fix MixConv2d() remove shortcut + apply depthwise (#5410) 2021-10-30 19:38:51 +08:00			`b = [c2] + [0] * n`
			`a = np.eye(n + 1, n, k=-1)`
PyTorch Hub updates 2020-06-11 10:11:11 +08:00			`a -= np.roll(a, 1, axis=1)`
			`a *= np.array(k) ** 2`
			`a[0] = 1`
			`c_ = np.linalg.lstsq(a, b, rcond=None)[0].round() # solve for equal weight indices, ax = b`

precommit: yapf (#5494) * precommit: yapf * align isort * fix # Conflicts: # utils/plots.py * [pre-commit.ci] auto fixes from pre-commit.com hooks for more information, see https://pre-commit.ci * [pre-commit.ci] auto fixes from pre-commit.com hooks for more information, see https://pre-commit.ci * Update setup.cfg * [pre-commit.ci] auto fixes from pre-commit.com hooks for more information, see https://pre-commit.ci * Update setup.cfg * Update setup.cfg * [pre-commit.ci] auto fixes from pre-commit.com hooks for more information, see https://pre-commit.ci * Update wandb_utils.py * Update augmentations.py * Update setup.cfg * Update yolo.py * [pre-commit.ci] auto fixes from pre-commit.com hooks for more information, see https://pre-commit.ci * Update val.py * [pre-commit.ci] auto fixes from pre-commit.com hooks for more information, see https://pre-commit.ci * simplify colorstr * [pre-commit.ci] auto fixes from pre-commit.com hooks for more information, see https://pre-commit.ci * val run fix * export.py last comma * Update export.py * [pre-commit.ci] auto fixes from pre-commit.com hooks for more information, see https://pre-commit.ci * Update hubconf.py * [pre-commit.ci] auto fixes from pre-commit.com hooks for more information, see https://pre-commit.ci * PyTorch Hub tuple fix * PyTorch Hub tuple fix2 * PyTorch Hub tuple fix3 * Update setup Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com> Co-authored-by: Glenn Jocher <glenn.jocher@ultralytics.com> 2022-03-31 22:52:34 +08:00			`self.m = nn.ModuleList([`
			`nn.Conv2d(c1, int(c_), k, s, k // 2, groups=math.gcd(c1, int(c_)), bias=False) for k, c_ in zip(k, c_)])`
PyTorch Hub updates 2020-06-11 10:11:11 +08:00			`self.bn = nn.BatchNorm2d(c2)`
Fix MixConv2d() remove shortcut + apply depthwise (#5410) 2021-10-30 19:38:51 +08:00			`self.act = nn.SiLU()`
PyTorch Hub updates 2020-06-11 10:11:11 +08:00
			`def forward(self, x):`
Fix MixConv2d() remove shortcut + apply depthwise (#5410) 2021-10-30 19:38:51 +08:00			`return self.act(self.bn(torch.cat([m(x) for m in self.m], 1)))`
update experimental.py with Ensemble() module 2020-07-06 06:02:56 +08:00

			`class Ensemble(nn.ModuleList):`
			`# Ensemble of models`
			`def __init__(self):`
Module `super().__init__()` (#4065) * Module `super().__init__()` * remove NMS 2021-07-19 18:41:15 +08:00			`super().__init__()`
update experimental.py with Ensemble() module 2020-07-06 06:02:56 +08:00
`Ensemble()` visualize fix (#3973) * fix visualize error * Revert "fix visualize error" * add visualise profile 2021-07-12 01:47:08 +08:00			`def forward(self, x, augment=False, profile=False, visualize=False):`
Refactor modules (#7823) 2022-05-16 01:44:16 +08:00			`y = [module(x, augment, profile, visualize)[0] for module in self]`
update train.py and experimental.py 2020-07-09 05:23:34 +08:00			`# y = torch.stack(y).max(0)[0] # max ensemble`
YOLOv5 v4.0 Release (#1837) * Update C3 module * Update C3 module * Update C3 module * Update C3 module * update * update * update * update * update * update * update * update * update * updates * updates * updates * updates * updates * updates * updates * updates * updates * updates * update * update * update * update * updates * updates * updates * updates * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update * update datasets * update * update * update * update attempt_downlaod() * merge * merge * update * update * update * update * update * update * update * update * update * update * parameterize eps * comments * gs-multiple * update * max_nms implemented * Create one_cycle() function * update * update * update * update * update * update * update * update study.png * update study.png * Update datasets.py 2021-01-05 11:54:09 +08:00			`# y = torch.stack(y).mean(0) # mean ensemble`
			`y = torch.cat(y, 1) # nms ensemble`
update train.py and experimental.py 2020-07-09 05:23:34 +08:00			`return y, None # inference, train output`
Initial model ensemble capability #318 2020-07-08 06:40:50 +08:00

YOLOv5 Apple Metal Performance Shader (MPS) support (#7878) * Apple Metal Performance Shader (MPS) device support Following https://pytorch.org/blog/introducing-accelerated-pytorch-training-on-mac/ Should work with Apple M1 devices with PyTorch nightly installed with command `--device mps`. Usage examples: ```bash python train.py --device mps python detect.py --device mps python val.py --device mps ``` * Update device strategy to fix MPS issue 2022-05-24 19:34:32 +08:00			`def attempt_load(weights, device=None, inplace=True, fuse=True):`
experimental.py Apple MPS device fix (#8121) * experimental.py Apple MPS fix May resolve https://github.com/ultralytics/yolov5/issues/8102 * Update experimental.py * Update experimental.py 2022-06-07 05:58:50 +08:00			`# Loads an ensemble of models weights=[a,b,c] or a single model weights=[a] or weights=a`
YOLOv5 AWS Inferentia Inplace compatibility updates (#2953) * Added flag to enable/disable all inplace and assignment operations * Removed shape print statements * Scope Detect/Model import to avoid circular dependency * PEP8 * create _descale_pred() * replace lost space * replace list with tuple Co-authored-by: Glenn Jocher <glenn.jocher@ultralytics.com> 2021-04-30 18:54:48 +08:00			`from models.yolo import Detect, Model`

Initial model ensemble capability #318 2020-07-08 06:40:50 +08:00			`model = Ensemble()`
			`for w in weights if isinstance(weights, list) else [weights]:`
experimental.py Apple MPS device fix (#8121) * experimental.py Apple MPS fix May resolve https://github.com/ultralytics/yolov5/issues/8102 * Update experimental.py * Update experimental.py 2022-06-07 05:58:50 +08:00			`ckpt = torch.load(attempt_download(w), map_location='cpu') # load`
			`ckpt = (ckpt.get('ema') or ckpt['model']).to(device).float() # FP32 model`
PyTorch 1.11.0 compatibility updates (#6932) Resolves `AttributeError: 'Upsample' object has no attribute 'recompute_scale_factor'` first raised in https://github.com/ultralytics/yolov5/issues/5499 2022-03-10 19:41:06 +08:00			`model.append(ckpt.fuse().eval() if fuse else ckpt.eval()) # fused or un-fused model in eval mode`
Add TensorFlow and TFLite export (#1127) * Add models/tf.py for TensorFlow and TFLite export * Set auto=False for int8 calibration * Update requirements.txt for TensorFlow and TFLite export * Read anchors directly from PyTorch weights * Add --tf-nms to append NMS in TensorFlow SavedModel and GraphDef export * Remove check_anchor_order, check_file, set_logging from import * Reformat code and optimize imports * Autodownload model and check cfg * update --source path, img-size to 320, single output * Adjust representative_dataset * Put representative dataset in tfl_int8 block * detect.py TF inference * weights to string * weights to string * cleanup tf.py * Add --dynamic-batch-size * Add xywh normalization to reduce calibration error * Update requirements.txt TensorFlow 2.3.1 -> 2.4.0 to avoid int8 quantization error * Fix imports Move C3 from models.experimental to models.common * Add models/tf.py for TensorFlow and TFLite export * Set auto=False for int8 calibration * Update requirements.txt for TensorFlow and TFLite export * Read anchors directly from PyTorch weights * Add --tf-nms to append NMS in TensorFlow SavedModel and GraphDef export * Remove check_anchor_order, check_file, set_logging from import * Reformat code and optimize imports * Autodownload model and check cfg * update --source path, img-size to 320, single output * Adjust representative_dataset * detect.py TF inference * Put representative dataset in tfl_int8 block * weights to string * weights to string * cleanup tf.py * Add --dynamic-batch-size * Add xywh normalization to reduce calibration error * Update requirements.txt TensorFlow 2.3.1 -> 2.4.0 to avoid int8 quantization error * Fix imports Move C3 from models.experimental to models.common * implement C3() and SiLU() * Fix reshape dim to support dynamic batching * Add epsilon argument in tf_BN, which is different between TF and PT * Set stride to None if not using PyTorch, and do not warmup without PyTorch * Add list support in check_img_size() 
* Add list input support in detect.py * sys.path.append('./') to run from yolov5/ * Add int8 quantization support for TensorFlow 2.5 * Add get_coco128.sh * Remove --no-tfl-detect in models/tf.py (Use tf-android-tfl-detect branch for EdgeTPU) * Update requirements.txt * Replace torch.load() with attempt_load() * Update requirements.txt * Add --tf-raw-resize to set half_pixel_centers=False * Add --agnostic-nms for TF class-agnostic NMS * Cleanup after merge * Cleanup2 after merge * Cleanup3 after merge * Add tf.py docstring with credit and usage * pb saved_model and tflite use only one model in detect.py * Add use cases in docstring of tf.py * Remove redundant `stride` definition * Remove keras direct import * Fix `check_requirements(('tensorflow>=2.4.1',))` Co-authored-by: Glenn Jocher <glenn.jocher@ultralytics.com> 2021-08-17 19:18:16 +08:00
PyTorch 1.7.0 Compatibility Updates (#1233) * torch 1.7.0 compatibility updates * add inference verification 2020-10-28 22:03:50 +08:00			`# Compatibility updates`
			`for m in model.modules():`
PyTorch 1.11.0 compatibility updates (#6932) Resolves `AttributeError: 'Upsample' object has no attribute 'recompute_scale_factor'` first raised in https://github.com/ultralytics/yolov5/issues/5499 2022-03-10 19:41:06 +08:00			`t = type(m)`
			`if t in (nn.Hardswish, nn.LeakyReLU, nn.ReLU, nn.ReLU6, nn.SiLU, Detect, Model):`
			`m.inplace = inplace # torch 1.7.0 compatibility`
Refactor modules (#7823) 2022-05-16 01:44:16 +08:00			`if t is Detect and not isinstance(m.anchor_grid, list):`
			`delattr(m, 'anchor_grid')`
			`setattr(m, 'anchor_grid', [torch.zeros(1)] * m.nl)`
Optimize PyTorch 1.11.0 compatibility update (#6933) 2022-03-10 19:58:41 +08:00			`elif t is nn.Upsample and not hasattr(m, 'recompute_scale_factor'):`
			`m.recompute_scale_factor = None # torch 1.11.0 compatibility`
PyTorch 1.7.0 Compatibility Updates (#1233) * torch 1.7.0 compatibility updates * add inference verification 2020-10-28 22:03:50 +08:00
Initial model ensemble capability #318 2020-07-08 06:40:50 +08:00			`if len(model) == 1:`
			`return model[-1] # return model`
Refactor modules (#7823) 2022-05-16 01:44:16 +08:00			`print(f'Ensemble created with {weights}\n')`
			`for k in 'names', 'nc', 'yaml':`
			`setattr(model, k, getattr(model[0], k))`
			`model.stride = model[torch.argmax(torch.tensor([m.stride.max() for m in model])).int()].stride # max stride`
			`assert all(model[0].nc == m.nc for m in model), f'Models have different class counts: {[m.nc for m in model]}'`
			`return model # return ensemble`