mmocr/tests/test_models/test_ocr_encoder.py

# Copyright (c) OpenMMLab. All rights reserved.
import pytest
import torch

from mmocr.models.textrecog.encoders import (ABIVisionModel, BaseEncoder,
                                             NRTREncoder, SAREncoder,
                                             SatrnEncoder, TransformerEncoder)


def test_sar_encoder():
    """Check SAREncoder argument validation and its forward output shape."""
    # Every entry holds a single keyword argument whose value the
    # constructor is expected to reject with an AssertionError.
    rejected_kwargs = (
        dict(enc_bi_rnn='bi'),
        dict(enc_do_rnn=2),
        dict(enc_gru='gru'),
        dict(d_model=512.5),
        dict(d_enc=200.5),
        dict(mask='mask'),
    )
    for kwargs in rejected_kwargs:
        with pytest.raises(AssertionError):
            SAREncoder(**kwargs)

    sar_encoder = SAREncoder()
    sar_encoder.init_weights()
    sar_encoder.train()

    features = torch.randn(1, 512, 4, 40)
    metas = [{'valid_ratio': 1.0}]

    # Passing two meta dicts alongside a batch of one sample must fail.
    with pytest.raises(AssertionError):
        sar_encoder(features, metas * 2)

    encoded = sar_encoder(features, metas)
    assert encoded.shape == torch.Size([1, 512])


def test_nrtr_encoder():
    """Run NRTREncoder on a random feature map and check the output shape.

    The encoder is built with its default arguments, has its weights
    initialised and is put in training mode before the forward pass.
    """
    tf_encoder = NRTREncoder()
    tf_encoder.init_weights()
    tf_encoder.train()

    feat = torch.randn(1, 512, 1, 25)
    out_enc = tf_encoder(feat)
    # A (1, 512, 1, 25) input is expected to come back as (1, 25, 512).
    assert out_enc.shape == torch.Size([1, 25, 512])


def test_satrn_encoder():
    """Run a default SatrnEncoder forward pass and check the output shape."""
    model = SatrnEncoder()
    model.init_weights()
    model.train()

    # NOTE(review): 200 equals 8 * 25, the last two input dims; presumably
    # the encoder flattens them into one sequence axis -- confirm.
    expected_shape = torch.Size([1, 200, 512])
    encoded = model(torch.randn(1, 512, 8, 25))
    assert encoded.shape == expected_shape


def test_base_encoder():
    """Check that a default BaseEncoder keeps the input tensor's shape."""
    base = BaseEncoder()
    base.init_weights()
    base.train()

    inputs = torch.randn(1, 256, 4, 40)
    outputs = base(inputs)

    # The expected output shape is the same as the shape fed in.
    expected_shape = torch.Size([1, 256, 4, 40])
    assert outputs.shape == expected_shape


def test_transformer_encoder():
    """Check that a default TransformerEncoder keeps the input shape."""
    encoder = TransformerEncoder()
    inputs = torch.randn(10, 512, 8, 32)
    outputs = encoder(inputs)
    # The expected output shape is the same as the shape fed in.
    assert outputs.shape == torch.Size([10, 512, 8, 32])


def test_abi_vision_model():
    """Check the shapes of the tensors returned by ABIVisionModel.

    The model is built with an ``ABIVisionDecoder`` config using
    ``max_seq_len=10``; the result is indexed by the keys ``'feature'``,
    ``'logits'`` and ``'attn_scores'``.
    """
    decoder_cfg = dict(
        type='ABIVisionDecoder', max_seq_len=10, use_result=None)
    model = ABIVisionModel(decoder=decoder_cfg)

    outputs = model(torch.randn(1, 512, 8, 32))

    # Expected shape per result key, checked in this order.
    expected_shapes = {
        'feature': (1, 10, 512),
        'logits': (1, 10, 90),
        'attn_scores': (1, 10, 8, 32),
    }
    for key, shape in expected_shapes.items():
        assert outputs[key].shape == torch.Size(shape)
[Enhancement] Add copyright info (#439) * add copyright info 2021-08-17 17:39:30 +08:00			`# Copyright (c) OpenMMLab. All rights reserved.`
add sar, seg and other components 2021-04-02 23:54:57 +08:00			`import pytest`
			`import torch`

[Model] Full ABINet Framework (#651) Co-authored-by: liukuikun <24622904+Harold-lkk@users.noreply.github.com> 2021-12-15 11:21:54 +08:00			`from mmocr.models.textrecog.encoders import (ABIVisionModel, BaseEncoder,`
			`NRTREncoder, SAREncoder,`
			`SatrnEncoder, TransformerEncoder)`
add sar, seg and other components 2021-04-02 23:54:57 +08:00

			`def test_sar_encoder():`
			`with pytest.raises(AssertionError):`
			`SAREncoder(enc_bi_rnn='bi')`
			`with pytest.raises(AssertionError):`
			`SAREncoder(enc_do_rnn=2)`
			`with pytest.raises(AssertionError):`
			`SAREncoder(enc_gru='gru')`
			`with pytest.raises(AssertionError):`
			`SAREncoder(d_model=512.5)`
			`with pytest.raises(AssertionError):`
			`SAREncoder(d_enc=200.5)`
			`with pytest.raises(AssertionError):`
			`SAREncoder(mask='mask')`

			`encoder = SAREncoder()`
			`encoder.init_weights()`
			`encoder.train()`

			`feat = torch.randn(1, 512, 4, 40)`
			`img_metas = [{'valid_ratio': 1.0}]`
			`with pytest.raises(AssertionError):`
			`encoder(feat, img_metas * 2)`
			`out_enc = encoder(feat, img_metas)`

			`assert out_enc.shape == torch.Size([1, 512])`


[Model] Full ABINet Framework (#651) Co-authored-by: liukuikun <24622904+Harold-lkk@users.noreply.github.com> 2021-12-15 11:21:54 +08:00			`def test_nrtr_encoder():`
[Refactor] refactor transformer modules (#618) * base refactor * update config * modify implementation of nrtr * add config file * add mask * add operation order * fix contiguous bug * update config * fix pytest * fix pytest * update readme * update readme and metafile * update docstring * fix norm cfg and dict size * rm useless * use mmocr builder instead * update pytest * update * remove useless * fix ckpt name * fix path * include all config file into pytest * update inference * Update test_recog_config.py 2021-12-04 17:12:31 +08:00			`tf_encoder = NRTREncoder()`
add sar, seg and other components 2021-04-02 23:54:57 +08:00			`tf_encoder.init_weights()`
			`tf_encoder.train()`

Feature/iss 33 (#34) * fix #33: update dataset.md * fix #33: pytest for transformer related 2021-04-05 23:54:57 +08:00			`feat = torch.randn(1, 512, 1, 25)`
add sar, seg and other components 2021-04-02 23:54:57 +08:00			`out_enc = tf_encoder(feat)`
Feature/iss 33 (#34) * fix #33: update dataset.md * fix #33: pytest for transformer related 2021-04-05 23:54:57 +08:00			`print('hello', out_enc.size())`
[Refactor] refactor transformer modules (#618) * base refactor * update config * modify implementation of nrtr * add config file * add mask * add operation order * fix contiguous bug * update config * fix pytest * fix pytest * update readme * update readme and metafile * update docstring * fix norm cfg and dict size * rm useless * use mmocr builder instead * update pytest * update * remove useless * fix ckpt name * fix path * include all config file into pytest * update inference * Update test_recog_config.py 2021-12-04 17:12:31 +08:00			`assert out_enc.shape == torch.Size([1, 25, 512])`
add sar, seg and other components 2021-04-02 23:54:57 +08:00

[Feature] Add Satrn (#405) * Add SATRN * Create satrn_small_academic.py * Update README.md * change config name * Update mmocr/models/textrecog/backbones/shallow_cnn.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update configs/textrecog/satrn/satrn_academic.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update configs/textrecog/satrn/satrn_small.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update shallow_cnn.py * Update mmocr/models/textrecog/layers/transformer_layer.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update mmocr/models/textrecog/layers/transformer_layer.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update test_ocr_encoder.py * change keep_aspect_ratio=False * Update transformer_layer.py * Update configs/textrecog/satrn/satrn_small.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update configs/textrecog/satrn/satrn_academic.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update mmocr/models/textrecog/layers/transformer_layer.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update mmocr/models/textrecog/layers/transformer_layer.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update mmocr/models/textrecog/layers/transformer_layer.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update mmocr/models/textrecog/layers/transformer_layer.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update mmocr/models/textrecog/layers/transformer_layer.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update mmocr/models/textrecog/layers/transformer_layer.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update mmocr/models/textrecog/layers/transformer_layer.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update mmocr/models/textrecog/layers/transformer_layer.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update mmocr/models/textrecog/layers/transformer_layer.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update transformer_layer.py * Apply suggestions from code review 
Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update transformer_layer.py * update satrn readme * add satrn to ocr.py * add satrn_sm and fix configs * add a test for config * add copyright info * use mmocr registry Co-authored-by: Tong Gao <gaotongxiao@gmail.com> 2021-08-19 22:02:58 +08:00			`def test_satrn_encoder():`
			`satrn_encoder = SatrnEncoder()`
			`satrn_encoder.init_weights()`
			`satrn_encoder.train()`

			`feat = torch.randn(1, 512, 8, 25)`
			`out_enc = satrn_encoder(feat)`
[Refactor] refactor transformer modules (#618) * base refactor * update config * modify implementation of nrtr * add config file * add mask * add operation order * fix contiguous bug * update config * fix pytest * fix pytest * update readme * update readme and metafile * update docstring * fix norm cfg and dict size * rm useless * use mmocr builder instead * update pytest * update * remove useless * fix ckpt name * fix path * include all config file into pytest * update inference * Update test_recog_config.py 2021-12-04 17:12:31 +08:00			`assert out_enc.shape == torch.Size([1, 200, 512])`
[Feature] Add Satrn (#405) * Add SATRN * Create satrn_small_academic.py * Update README.md * change config name * Update mmocr/models/textrecog/backbones/shallow_cnn.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update configs/textrecog/satrn/satrn_academic.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update configs/textrecog/satrn/satrn_small.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update shallow_cnn.py * Update mmocr/models/textrecog/layers/transformer_layer.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update mmocr/models/textrecog/layers/transformer_layer.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update test_ocr_encoder.py * change keep_aspect_ratio=False * Update transformer_layer.py * Update configs/textrecog/satrn/satrn_small.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update configs/textrecog/satrn/satrn_academic.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update mmocr/models/textrecog/layers/transformer_layer.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update mmocr/models/textrecog/layers/transformer_layer.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update mmocr/models/textrecog/layers/transformer_layer.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update mmocr/models/textrecog/layers/transformer_layer.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update mmocr/models/textrecog/layers/transformer_layer.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update mmocr/models/textrecog/layers/transformer_layer.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update mmocr/models/textrecog/layers/transformer_layer.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update mmocr/models/textrecog/layers/transformer_layer.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update mmocr/models/textrecog/layers/transformer_layer.py Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update transformer_layer.py * Apply suggestions from code review 
Co-authored-by: Tong Gao <gaotongxiao@gmail.com> * Update transformer_layer.py * update satrn readme * add satrn to ocr.py * add satrn_sm and fix configs * add a test for config * add copyright info * use mmocr registry Co-authored-by: Tong Gao <gaotongxiao@gmail.com> 2021-08-19 22:02:58 +08:00

add sar, seg and other components 2021-04-02 23:54:57 +08:00			`def test_base_encoder():`
			`encoder = BaseEncoder()`
			`encoder.init_weights()`
			`encoder.train()`

			`feat = torch.randn(1, 256, 4, 40)`
			`out_enc = encoder(feat)`
			`assert out_enc.shape == torch.Size([1, 256, 4, 40])`
[Model] Full ABINet Framework (#651) Co-authored-by: liukuikun <24622904+Harold-lkk@users.noreply.github.com> 2021-12-15 11:21:54 +08:00

			`def test_transformer_encoder():`
			`model = TransformerEncoder()`
			`x = torch.randn(10, 512, 8, 32)`
			`assert model(x).shape == torch.Size([10, 512, 8, 32])`


			`def test_abi_vision_model():`
			`model = ABIVisionModel(`
			`decoder=dict(type='ABIVisionDecoder', max_seq_len=10, use_result=None))`
			`x = torch.randn(1, 512, 8, 32)`
			`result = model(x)`
			`assert result['feature'].shape == torch.Size([1, 10, 512])`
			`assert result['logits'].shape == torch.Size([1, 10, 90])`
			`assert result['attn_scores'].shape == torch.Size([1, 10, 8, 32])`